diff --git "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" --- "a/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" +++ "b/wandb/run-20220324_170224-3nn5zxhl/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 5.4388, "train/learning_rate": 2.718450704225352e-05, "train/epoch": 3.36, "train/global_step": 3000, "_runtime": 17848, "_timestamp": 1648159192, "_step": 3001, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 11.0, 7.0, 12.0, 13.0, 21.0, 23.0, 25.0, 23.0, 31.0, 46.0, 47.0, 38.0, 49.0, 54.0, 50.0, 66.0, 47.0, 52.0, 45.0, 64.0, 48.0, 46.0, 37.0, 23.0, 29.0, 17.0, 11.0, 14.0, 4.0, 10.0, 8.0, 7.0, 6.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.06173706054688, -75.80459594726562, -73.54745483398438, -71.29032135009766, -69.0331802368164, -66.77603912353516, -64.51890563964844, -62.26176452636719, -60.00462341308594, -57.74748229980469, -55.4903450012207, -53.23320770263672, -50.97606658935547, -48.71892547607422, -46.461788177490234, -44.20465087890625, -41.947509765625, -39.69036865234375, -37.433231353759766, -35.17609405517578, -32.91895294189453, -30.661813735961914, -28.404674530029297, -26.14753532409668, -23.890396118164062, -21.633256912231445, -19.376117706298828, -17.11897850036621, -14.861839294433594, -12.604700088500977, -10.34756088256836, -8.090421676635742, -5.833290100097656, -3.576150894165039, -1.3190116882324219, 0.9381275177001953, 3.1952667236328125, 5.45240592956543, 7.709545135498047, 9.966684341430664, 12.223823547363281, 14.480962753295898, 16.738101959228516, 18.995241165161133, 21.25238037109375, 23.509519577026367, 25.766658782958984, 28.0237979888916, 30.28093719482422, 32.53807830810547, 34.79521560668945, 37.05235290527344, 39.30949401855469, 41.56663513183594, 43.82377243041992, 46.080909729003906, 48.338050842285156, 50.595191955566406, 52.85232925415039, 55.109466552734375, 57.366607666015625, 59.623748779296875, 61.88088607788086, 64.13802337646484, 66.3951644897461]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 13.0, 13.0, 10.0, 14.0, 18.0, 18.0, 18.0, 18.0, 23.0, 30.0, 35.0, 28.0, 38.0, 35.0, 33.0, 47.0, 52.0, 48.0, 36.0, 40.0, 40.0, 30.0, 41.0, 38.0, 42.0, 26.0, 27.0, 31.0, 23.0, 20.0, 16.0, 17.0, 18.0, 12.0, 6.0, 11.0, 6.0, 7.0, 2.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-60.63709259033203, -58.81853485107422, -56.999977111816406, -55.18142318725586, -53.36286544799805, -51.544307708740234, -49.72575378417969, -47.907196044921875, -46.08863830566406, -44.27008056640625, -42.45152282714844, -40.63296890258789, -38.81441116333008, -36.995853424072266, -35.17729949951172, -33.358741760253906, -31.540184020996094, -29.72162628173828, -27.9030704498291, -26.084514617919922, -24.26595687866211, -22.447399139404297, -20.628843307495117, -18.810287475585938, -16.991729736328125, -15.173172950744629, -13.354616165161133, -11.536059379577637, -9.71750259399414, -7.8989458084106445, -6.080389022827148, -4.261832237243652, -2.4432754516601562, -0.6247186660766602, 1.193838119506836, 3.012394905090332, 4.830951690673828, 6.649508476257324, 8.46806526184082, 10.286622047424316, 12.105178833007812, 13.923735618591309, 15.742292404174805, 17.560848236083984, 19.379405975341797, 21.19796371459961, 23.01651954650879, 24.83507537841797, 26.65363311767578, 28.472190856933594, 30.290746688842773, 32.10930252075195, 33.927860260009766, 35.74641799926758, 37.564971923828125, 39.38352966308594, 41.20208740234375, 43.02064514160156, 44.839202880859375, 46.65775680541992, 48.476314544677734, 50.29487228393555, 52.113426208496094, 53.931983947753906, 55.75054168701172]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 9.0, 10.0, 14.0, 22.0, 46.0, 71.0, 123.0, 214.0, 366.0, 592.0, 1049.0, 1829.0, 2957.0, 5431.0, 9784.0, 17781.0, 31737.0, 59061.0, 108717.0, 194431.0, 329891.0, 504693.0, 657690.0, 697545.0, 589223.0, 411198.0, 252856.0, 142775.0, 78256.0, 42971.0, 23178.0, 12903.0, 7223.0, 4075.0, 2355.0, 1346.0, 754.0, 450.0, 276.0, 144.0, 86.0, 72.0, 31.0, 22.0, 12.0, 8.0, 5.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-43.25, -41.98681640625, -40.7236328125, -39.46044921875, -38.197265625, -36.93408203125, -35.6708984375, -34.40771484375, -33.14453125, -31.88134765625, -30.6181640625, -29.35498046875, -28.091796875, -26.82861328125, -25.5654296875, -24.30224609375, -23.0390625, -21.77587890625, -20.5126953125, -19.24951171875, -17.986328125, -16.72314453125, -15.4599609375, -14.19677734375, -12.93359375, -11.67041015625, -10.4072265625, -9.14404296875, -7.880859375, -6.61767578125, -5.3544921875, -4.09130859375, -2.828125, -1.56494140625, -0.3017578125, 0.96142578125, 2.224609375, 3.48779296875, 4.7509765625, 6.01416015625, 7.27734375, 8.54052734375, 9.8037109375, 11.06689453125, 12.330078125, 13.59326171875, 14.8564453125, 16.11962890625, 17.3828125, 18.64599609375, 19.9091796875, 21.17236328125, 22.435546875, 23.69873046875, 24.9619140625, 26.22509765625, 27.48828125, 28.75146484375, 30.0146484375, 31.27783203125, 32.541015625, 33.80419921875, 35.0673828125, 36.33056640625, 37.59375]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 9.0, 8.0, 13.0, 12.0, 12.0, 15.0, 17.0, 9.0, 23.0, 18.0, 38.0, 43.0, 24.0, 40.0, 38.0, 48.0, 39.0, 36.0, 40.0, 47.0, 42.0, 40.0, 40.0, 34.0, 41.0, 37.0, 29.0, 19.0, 26.0, 32.0, 21.0, 22.0, 15.0, 17.0, 16.0, 9.0, 11.0, 8.0, 4.0, 8.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.59375, -48.0654296875, -46.537109375, -45.0087890625, -43.48046875, -41.9521484375, -40.423828125, -38.8955078125, -37.3671875, -35.8388671875, -34.310546875, -32.7822265625, -31.25390625, -29.7255859375, -28.197265625, -26.6689453125, -25.140625, -23.6123046875, -22.083984375, -20.5556640625, -19.02734375, -17.4990234375, -15.970703125, -14.4423828125, -12.9140625, -11.3857421875, -9.857421875, -8.3291015625, -6.80078125, -5.2724609375, -3.744140625, -2.2158203125, -0.6875, 0.8408203125, 2.369140625, 3.8974609375, 5.42578125, 6.9541015625, 8.482421875, 10.0107421875, 11.5390625, 13.0673828125, 14.595703125, 16.1240234375, 17.65234375, 19.1806640625, 20.708984375, 22.2373046875, 23.765625, 25.2939453125, 26.822265625, 28.3505859375, 29.87890625, 31.4072265625, 32.935546875, 34.4638671875, 35.9921875, 37.5205078125, 39.048828125, 40.5771484375, 42.10546875, 43.6337890625, 45.162109375, 46.6904296875, 48.21875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 8.0, 10.0, 22.0, 29.0, 56.0, 83.0, 101.0, 194.0, 297.0, 466.0, 683.0, 1026.0, 1571.0, 2516.0, 3766.0, 5693.0, 8547.0, 13014.0, 19812.0, 30244.0, 45341.0, 67588.0, 98853.0, 143344.0, 204170.0, 281418.0, 374439.0, 471201.0, 526729.0, 487888.0, 398331.0, 301924.0, 219679.0, 156694.0, 108257.0, 73661.0, 49482.0, 33402.0, 21755.0, 14565.0, 9392.0, 6206.0, 4082.0, 2697.0, 1708.0, 1181.0, 746.0, 500.0, 339.0, 216.0, 119.0, 95.0, 65.0, 35.0, 21.0, 12.0, 8.0, 6.0, 4.0, 3.0, 3.0], "bins": [-33.375, -32.3193359375, -31.263671875, -30.2080078125, -29.15234375, -28.0966796875, -27.041015625, -25.9853515625, -24.9296875, -23.8740234375, -22.818359375, -21.7626953125, -20.70703125, -19.6513671875, -18.595703125, -17.5400390625, -16.484375, -15.4287109375, -14.373046875, -13.3173828125, -12.26171875, -11.2060546875, -10.150390625, -9.0947265625, -8.0390625, -6.9833984375, -5.927734375, -4.8720703125, -3.81640625, -2.7607421875, -1.705078125, -0.6494140625, 0.40625, 1.4619140625, 2.517578125, 3.5732421875, 4.62890625, 5.6845703125, 6.740234375, 7.7958984375, 8.8515625, 9.9072265625, 10.962890625, 12.0185546875, 13.07421875, 14.1298828125, 15.185546875, 16.2412109375, 17.296875, 18.3525390625, 19.408203125, 20.4638671875, 21.51953125, 22.5751953125, 23.630859375, 24.6865234375, 25.7421875, 26.7978515625, 27.853515625, 28.9091796875, 29.96484375, 31.0205078125, 32.076171875, 33.1318359375, 34.1875]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 12.0, 9.0, 12.0, 14.0, 39.0, 34.0, 42.0, 51.0, 55.0, 102.0, 109.0, 113.0, 116.0, 171.0, 208.0, 202.0, 229.0, 256.0, 261.0, 250.0, 251.0, 250.0, 198.0, 173.0, 137.0, 143.0, 110.0, 90.0, 77.0, 64.0, 52.0, 37.0, 35.0, 33.0, 22.0, 27.0, 14.0, 12.0, 8.0, 8.0, 8.0, 6.0, 6.0, 6.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0], "bins": [-17.859375, -17.2802734375, -16.701171875, -16.1220703125, -15.54296875, -14.9638671875, -14.384765625, -13.8056640625, -13.2265625, -12.6474609375, -12.068359375, -11.4892578125, -10.91015625, -10.3310546875, -9.751953125, -9.1728515625, -8.59375, -8.0146484375, -7.435546875, -6.8564453125, -6.27734375, -5.6982421875, -5.119140625, -4.5400390625, -3.9609375, -3.3818359375, -2.802734375, -2.2236328125, -1.64453125, -1.0654296875, -0.486328125, 0.0927734375, 0.671875, 1.2509765625, 1.830078125, 2.4091796875, 2.98828125, 3.5673828125, 4.146484375, 4.7255859375, 5.3046875, 5.8837890625, 6.462890625, 7.0419921875, 7.62109375, 8.2001953125, 8.779296875, 9.3583984375, 9.9375, 10.5166015625, 11.095703125, 11.6748046875, 12.25390625, 12.8330078125, 13.412109375, 13.9912109375, 14.5703125, 15.1494140625, 15.728515625, 16.3076171875, 16.88671875, 17.4658203125, 18.044921875, 18.6240234375, 19.203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 8.0, 7.0, 3.0, 5.0, 7.0, 11.0, 9.0, 15.0, 24.0, 22.0, 16.0, 25.0, 32.0, 30.0, 31.0, 39.0, 50.0, 60.0, 46.0, 46.0, 35.0, 51.0, 51.0, 36.0, 52.0, 42.0, 37.0, 38.0, 37.0, 19.0, 24.0, 15.0, 18.0, 11.0, 11.0, 11.0, 12.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.551883697509766, -41.90956497192383, -40.267250061035156, -38.62493133544922, -36.98261642456055, -35.34029769897461, -33.69798278808594, -32.0556640625, -30.413349151611328, -28.771032333374023, -27.12871551513672, -25.486398696899414, -23.84408187866211, -22.201763153076172, -20.5594482421875, -18.917129516601562, -17.274812698364258, -15.632495880126953, -13.990179061889648, -12.347862243652344, -10.705545425415039, -9.063227653503418, -7.420910835266113, -5.778594017028809, -4.136277198791504, -2.493960380554199, -0.8516433238983154, 0.7906737327575684, 2.432990550994873, 4.075307846069336, 5.717624664306641, 7.359941482543945, 9.00225830078125, 10.644575119018555, 12.28689193725586, 13.929208755493164, 15.571525573730469, 17.213844299316406, 18.856159210205078, 20.498477935791016, 22.140792846679688, 23.783109664916992, 25.425426483154297, 27.0677433013916, 28.710060119628906, 30.352378845214844, 31.994693756103516, 33.63701248168945, 35.279327392578125, 36.92164611816406, 38.563961029052734, 40.20627975463867, 41.848594665527344, 43.49091339111328, 45.13322830200195, 46.77554702758789, 48.41786575317383, 50.060184478759766, 51.70249938964844, 53.344818115234375, 54.98713302612305, 56.629451751708984, 58.271766662597656, 59.914085388183594, 61.556400299072266]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 10.0, 8.0, 12.0, 9.0, 15.0, 11.0, 17.0, 15.0, 28.0, 17.0, 25.0, 33.0, 39.0, 37.0, 43.0, 44.0, 43.0, 35.0, 46.0, 52.0, 45.0, 40.0, 42.0, 37.0, 35.0, 39.0, 28.0, 27.0, 28.0, 18.0, 13.0, 21.0, 19.0, 17.0, 20.0, 11.0, 9.0, 2.0, 5.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-60.92025375366211, -59.243980407714844, -57.567710876464844, -55.89143753051758, -54.21516799926758, -52.53889465332031, -50.86262512207031, -49.18635177612305, -47.51007843017578, -45.833805084228516, -44.157535552978516, -42.48126220703125, -40.80499267578125, -39.128719329833984, -37.45244598388672, -35.77617645263672, -34.09990692138672, -32.42363357543945, -30.747364044189453, -29.071090698242188, -27.394821166992188, -25.718547821044922, -24.04227638244629, -22.366004943847656, -20.689733505249023, -19.01346206665039, -17.337190628051758, -15.660918235778809, -13.984646797180176, -12.308375358581543, -10.632102966308594, -8.955831527709961, -7.2795562744140625, -5.60328483581543, -3.9270129203796387, -2.2507410049438477, -0.5744695663452148, 1.101801872253418, 2.778074264526367, 4.454345703125, 6.130617141723633, 7.806888580322266, 9.483160018920898, 11.159432411193848, 12.83570384979248, 14.511975288391113, 16.188247680664062, 17.864519119262695, 19.540790557861328, 21.21706199645996, 22.893333435058594, 24.56960678100586, 26.24587631225586, 27.922149658203125, 29.598421096801758, 31.27469253540039, 32.950965881347656, 34.62723922729492, 36.30350875854492, 37.97978210449219, 39.65605163574219, 41.33232498168945, 43.00859832763672, 44.68486785888672, 46.36113739013672]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 12.0, 16.0, 20.0, 45.0, 47.0, 88.0, 130.0, 196.0, 258.0, 407.0, 589.0, 879.0, 1317.0, 2077.0, 3182.0, 5109.0, 8155.0, 13420.0, 22239.0, 37998.0, 65861.0, 115379.0, 184381.0, 214125.0, 153324.0, 90489.0, 51861.0, 29810.0, 17825.0, 10779.0, 6600.0, 4217.0, 2682.0, 1741.0, 1081.0, 757.0, 490.0, 323.0, 227.0, 141.0, 103.0, 60.0, 31.0, 15.0, 26.0, 14.0, 7.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0], "bins": [-28.1875, -27.256591796875, -26.32568359375, -25.394775390625, -24.4638671875, -23.532958984375, -22.60205078125, -21.671142578125, -20.740234375, -19.809326171875, -18.87841796875, -17.947509765625, -17.0166015625, -16.085693359375, -15.15478515625, -14.223876953125, -13.29296875, -12.362060546875, -11.43115234375, -10.500244140625, -9.5693359375, -8.638427734375, -7.70751953125, -6.776611328125, -5.845703125, -4.914794921875, -3.98388671875, -3.052978515625, -2.1220703125, -1.191162109375, -0.26025390625, 0.670654296875, 1.6015625, 2.532470703125, 3.46337890625, 4.394287109375, 5.3251953125, 6.256103515625, 7.18701171875, 8.117919921875, 9.048828125, 9.979736328125, 10.91064453125, 11.841552734375, 12.7724609375, 13.703369140625, 14.63427734375, 15.565185546875, 16.49609375, 17.427001953125, 18.35791015625, 19.288818359375, 20.2197265625, 21.150634765625, 22.08154296875, 23.012451171875, 23.943359375, 24.874267578125, 25.80517578125, 26.736083984375, 27.6669921875, 28.597900390625, 29.52880859375, 30.459716796875, 31.390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 6.0, 4.0, 5.0, 5.0, 11.0, 12.0, 10.0, 13.0, 15.0, 25.0, 12.0, 24.0, 23.0, 29.0, 42.0, 24.0, 42.0, 43.0, 43.0, 35.0, 41.0, 40.0, 41.0, 45.0, 41.0, 36.0, 27.0, 44.0, 26.0, 28.0, 26.0, 24.0, 26.0, 26.0, 14.0, 20.0, 13.0, 8.0, 16.0, 8.0, 11.0, 8.0, 6.0, 2.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.09375, -48.5712890625, -47.048828125, -45.5263671875, -44.00390625, -42.4814453125, -40.958984375, -39.4365234375, -37.9140625, -36.3916015625, -34.869140625, -33.3466796875, -31.82421875, -30.3017578125, -28.779296875, -27.2568359375, -25.734375, -24.2119140625, -22.689453125, -21.1669921875, -19.64453125, -18.1220703125, -16.599609375, -15.0771484375, -13.5546875, -12.0322265625, -10.509765625, -8.9873046875, -7.46484375, -5.9423828125, -4.419921875, -2.8974609375, -1.375, 0.1474609375, 1.669921875, 3.1923828125, 4.71484375, 6.2373046875, 7.759765625, 9.2822265625, 10.8046875, 12.3271484375, 13.849609375, 15.3720703125, 16.89453125, 18.4169921875, 19.939453125, 21.4619140625, 22.984375, 24.5068359375, 26.029296875, 27.5517578125, 29.07421875, 30.5966796875, 32.119140625, 33.6416015625, 35.1640625, 36.6865234375, 38.208984375, 39.7314453125, 41.25390625, 42.7763671875, 44.298828125, 45.8212890625, 47.34375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 6.0, 5.0, 9.0, 9.0, 9.0, 12.0, 16.0, 25.0, 33.0, 33.0, 56.0, 63.0, 87.0, 133.0, 192.0, 288.0, 411.0, 629.0, 954.0, 1609.0, 2687.0, 4600.0, 8076.0, 14688.0, 29051.0, 59421.0, 124690.0, 231141.0, 257896.0, 157322.0, 75845.0, 36315.0, 18455.0, 9737.0, 5519.0, 3129.0, 1906.0, 1211.0, 742.0, 497.0, 315.0, 214.0, 159.0, 111.0, 64.0, 52.0, 44.0, 35.0, 17.0, 17.0, 9.0, 9.0, 4.0, 7.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.21875, -20.537841796875, -19.85693359375, -19.176025390625, -18.4951171875, -17.814208984375, -17.13330078125, -16.452392578125, -15.771484375, -15.090576171875, -14.40966796875, -13.728759765625, -13.0478515625, -12.366943359375, -11.68603515625, -11.005126953125, -10.32421875, -9.643310546875, -8.96240234375, -8.281494140625, -7.6005859375, -6.919677734375, -6.23876953125, -5.557861328125, -4.876953125, -4.196044921875, -3.51513671875, -2.834228515625, -2.1533203125, -1.472412109375, -0.79150390625, -0.110595703125, 0.5703125, 1.251220703125, 1.93212890625, 2.613037109375, 3.2939453125, 3.974853515625, 4.65576171875, 5.336669921875, 6.017578125, 6.698486328125, 7.37939453125, 8.060302734375, 8.7412109375, 9.422119140625, 10.10302734375, 10.783935546875, 11.46484375, 12.145751953125, 12.82666015625, 13.507568359375, 14.1884765625, 14.869384765625, 15.55029296875, 16.231201171875, 16.912109375, 17.593017578125, 18.27392578125, 18.954833984375, 19.6357421875, 20.316650390625, 20.99755859375, 21.678466796875, 22.359375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 2.0, 4.0, 8.0, 13.0, 15.0, 9.0, 14.0, 18.0, 35.0, 23.0, 25.0, 23.0, 24.0, 27.0, 28.0, 38.0, 36.0, 50.0, 37.0, 41.0, 53.0, 37.0, 37.0, 42.0, 33.0, 32.0, 40.0, 38.0, 36.0, 19.0, 19.0, 26.0, 16.0, 18.0, 9.0, 12.0, 11.0, 12.0, 12.0, 7.0, 7.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-31.859375, -30.811767578125, -29.76416015625, -28.716552734375, -27.6689453125, -26.621337890625, -25.57373046875, -24.526123046875, -23.478515625, -22.430908203125, -21.38330078125, -20.335693359375, -19.2880859375, -18.240478515625, -17.19287109375, -16.145263671875, -15.09765625, -14.050048828125, -13.00244140625, -11.954833984375, -10.9072265625, -9.859619140625, -8.81201171875, -7.764404296875, -6.716796875, -5.669189453125, -4.62158203125, -3.573974609375, -2.5263671875, -1.478759765625, -0.43115234375, 0.616455078125, 1.6640625, 2.711669921875, 3.75927734375, 4.806884765625, 5.8544921875, 6.902099609375, 7.94970703125, 8.997314453125, 10.044921875, 11.092529296875, 12.14013671875, 13.187744140625, 14.2353515625, 15.282958984375, 16.33056640625, 17.378173828125, 18.42578125, 19.473388671875, 20.52099609375, 21.568603515625, 22.6162109375, 23.663818359375, 24.71142578125, 25.759033203125, 26.806640625, 27.854248046875, 28.90185546875, 29.949462890625, 30.9970703125, 32.044677734375, 33.09228515625, 34.139892578125, 35.1875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 3.0, 10.0, 6.0, 5.0, 10.0, 8.0, 15.0, 26.0, 39.0, 39.0, 64.0, 89.0, 115.0, 184.0, 231.0, 339.0, 459.0, 654.0, 955.0, 1319.0, 2036.0, 3166.0, 5110.0, 8550.0, 15198.0, 30030.0, 72718.0, 279225.0, 433477.0, 108777.0, 39282.0, 18874.0, 10018.0, 6089.0, 3782.0, 2339.0, 1558.0, 1146.0, 775.0, 543.0, 382.0, 256.0, 180.0, 135.0, 93.0, 69.0, 65.0, 27.0, 21.0, 21.0, 13.0, 13.0, 12.0, 10.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.640625, -15.138916015625, -14.63720703125, -14.135498046875, -13.6337890625, -13.132080078125, -12.63037109375, -12.128662109375, -11.626953125, -11.125244140625, -10.62353515625, -10.121826171875, -9.6201171875, -9.118408203125, -8.61669921875, -8.114990234375, -7.61328125, -7.111572265625, -6.60986328125, -6.108154296875, -5.6064453125, -5.104736328125, -4.60302734375, -4.101318359375, -3.599609375, -3.097900390625, -2.59619140625, -2.094482421875, -1.5927734375, -1.091064453125, -0.58935546875, -0.087646484375, 0.4140625, 0.915771484375, 1.41748046875, 1.919189453125, 2.4208984375, 2.922607421875, 3.42431640625, 3.926025390625, 4.427734375, 4.929443359375, 5.43115234375, 5.932861328125, 6.4345703125, 6.936279296875, 7.43798828125, 7.939697265625, 8.44140625, 8.943115234375, 9.44482421875, 9.946533203125, 10.4482421875, 10.949951171875, 11.45166015625, 11.953369140625, 12.455078125, 12.956787109375, 13.45849609375, 13.960205078125, 14.4619140625, 14.963623046875, 15.46533203125, 15.967041015625, 16.46875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 6.0, 4.0, 3.0, 12.0, 16.0, 15.0, 9.0, 26.0, 25.0, 51.0, 104.0, 180.0, 201.0, 113.0, 57.0, 45.0, 33.0, 27.0, 17.0, 14.0, 9.0, 6.0, 9.0, 1.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0042877197265625, -0.004154324531555176, -0.0040209293365478516, -0.0038875341415405273, -0.003754138946533203, -0.003620743751525879, -0.0034873485565185547, -0.0033539533615112305, -0.0032205581665039062, -0.003087162971496582, -0.002953767776489258, -0.0028203725814819336, -0.0026869773864746094, -0.002553582191467285, -0.002420186996459961, -0.0022867918014526367, -0.0021533966064453125, -0.0020200014114379883, -0.001886606216430664, -0.0017532110214233398, -0.0016198158264160156, -0.0014864206314086914, -0.0013530254364013672, -0.001219630241394043, -0.0010862350463867188, -0.0009528398513793945, -0.0008194446563720703, -0.0006860494613647461, -0.0005526542663574219, -0.00041925907135009766, -0.00028586387634277344, -0.00015246868133544922, -1.9073486328125e-05, 0.00011432170867919922, 0.00024771690368652344, 0.00038111209869384766, 0.0005145072937011719, 0.0006479024887084961, 0.0007812976837158203, 0.0009146928787231445, 0.0010480880737304688, 0.001181483268737793, 0.0013148784637451172, 0.0014482736587524414, 0.0015816688537597656, 0.0017150640487670898, 0.001848459243774414, 0.0019818544387817383, 0.0021152496337890625, 0.0022486448287963867, 0.002382040023803711, 0.002515435218811035, 0.0026488304138183594, 0.0027822256088256836, 0.002915620803833008, 0.003049015998840332, 0.0031824111938476562, 0.0033158063888549805, 0.0034492015838623047, 0.003582596778869629, 0.003715991973876953, 0.0038493871688842773, 0.0039827823638916016, 0.004116177558898926, 0.00424957275390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 14.0, 18.0, 30.0, 37.0, 52.0, 75.0, 105.0, 169.0, 243.0, 353.0, 479.0, 707.0, 1053.0, 1531.0, 2225.0, 3399.0, 5310.0, 8285.0, 13562.0, 22394.0, 40037.0, 74961.0, 151805.0, 296265.0, 204997.0, 97008.0, 50373.0, 28144.0, 16286.0, 10054.0, 6278.0, 4103.0, 2634.0, 1741.0, 1198.0, 826.0, 558.0, 376.0, 258.0, 208.0, 135.0, 77.0, 66.0, 49.0, 27.0, 16.0, 14.0, 8.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.6484375, -13.2177734375, -12.787109375, -12.3564453125, -11.92578125, -11.4951171875, -11.064453125, -10.6337890625, -10.203125, -9.7724609375, -9.341796875, -8.9111328125, -8.48046875, -8.0498046875, -7.619140625, -7.1884765625, -6.7578125, -6.3271484375, -5.896484375, -5.4658203125, -5.03515625, -4.6044921875, -4.173828125, -3.7431640625, -3.3125, -2.8818359375, -2.451171875, -2.0205078125, -1.58984375, -1.1591796875, -0.728515625, -0.2978515625, 0.1328125, 0.5634765625, 0.994140625, 1.4248046875, 1.85546875, 2.2861328125, 2.716796875, 3.1474609375, 3.578125, 4.0087890625, 4.439453125, 4.8701171875, 5.30078125, 5.7314453125, 6.162109375, 6.5927734375, 7.0234375, 7.4541015625, 7.884765625, 8.3154296875, 8.74609375, 9.1767578125, 9.607421875, 10.0380859375, 10.46875, 10.8994140625, 11.330078125, 11.7607421875, 12.19140625, 12.6220703125, 13.052734375, 13.4833984375, 13.9140625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 6.0, 6.0, 10.0, 4.0, 14.0, 13.0, 19.0, 15.0, 16.0, 38.0, 38.0, 49.0, 63.0, 66.0, 67.0, 101.0, 92.0, 65.0, 61.0, 60.0, 45.0, 25.0, 19.0, 17.0, 12.0, 19.0, 8.0, 6.0, 3.0, 5.0, 6.0, 4.0, 2.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.9375, -4.79742431640625, -4.6573486328125, -4.51727294921875, -4.377197265625, -4.23712158203125, -4.0970458984375, -3.95697021484375, -3.81689453125, -3.67681884765625, -3.5367431640625, -3.39666748046875, -3.256591796875, -3.11651611328125, -2.9764404296875, -2.83636474609375, -2.6962890625, -2.55621337890625, -2.4161376953125, -2.27606201171875, -2.135986328125, -1.99591064453125, -1.8558349609375, -1.71575927734375, -1.57568359375, -1.43560791015625, -1.2955322265625, -1.15545654296875, -1.015380859375, -0.87530517578125, -0.7352294921875, -0.59515380859375, -0.455078125, -0.31500244140625, -0.1749267578125, -0.03485107421875, 0.105224609375, 0.24530029296875, 0.3853759765625, 0.52545166015625, 0.66552734375, 0.80560302734375, 0.9456787109375, 1.08575439453125, 1.225830078125, 1.36590576171875, 1.5059814453125, 1.64605712890625, 1.7861328125, 1.92620849609375, 2.0662841796875, 2.20635986328125, 2.346435546875, 2.48651123046875, 2.6265869140625, 2.76666259765625, 2.90673828125, 3.04681396484375, 3.1868896484375, 3.32696533203125, 3.467041015625, 3.60711669921875, 3.7471923828125, 3.88726806640625, 4.02734375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 11.0, 9.0, 8.0, 10.0, 7.0, 18.0, 18.0, 27.0, 19.0, 22.0, 42.0, 42.0, 43.0, 47.0, 34.0, 50.0, 44.0, 52.0, 46.0, 51.0, 46.0, 44.0, 35.0, 51.0, 38.0, 31.0, 32.0, 29.0, 14.0, 12.0, 12.0, 12.0, 6.0, 11.0, 10.0, 9.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.960784912109375, -45.37490463256836, -43.789024353027344, -42.20314025878906, -40.61725997924805, -39.03137969970703, -37.44549560546875, -35.859615325927734, -34.27373504638672, -32.6878547668457, -31.101972579956055, -29.516090393066406, -27.93021011352539, -26.344329833984375, -24.758447647094727, -23.172565460205078, -21.586685180664062, -20.000804901123047, -18.4149227142334, -16.82904052734375, -15.243160247802734, -13.657279014587402, -12.07139778137207, -10.485516548156738, -8.899635314941406, -7.313754081726074, -5.727872848510742, -4.14199161529541, -2.556110382080078, -0.9702291488647461, 0.6156520843505859, 2.201533317565918, 3.7874183654785156, 5.373299598693848, 6.95918083190918, 8.545062065124512, 10.130943298339844, 11.716824531555176, 13.302705764770508, 14.88858699798584, 16.474468231201172, 18.060348510742188, 19.646230697631836, 21.232112884521484, 22.8179931640625, 24.403873443603516, 25.989755630493164, 27.575637817382812, 29.161518096923828, 30.747398376464844, 32.333282470703125, 33.91916275024414, 35.505043029785156, 37.09092330932617, 38.67680358886719, 40.26268768310547, 41.848567962646484, 43.4344482421875, 45.02033233642578, 46.6062126159668, 48.19209289550781, 49.77797317504883, 51.363853454589844, 52.949737548828125, 54.53561782836914]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 7.0, 10.0, 13.0, 13.0, 14.0, 16.0, 14.0, 17.0, 25.0, 29.0, 32.0, 35.0, 28.0, 44.0, 44.0, 44.0, 51.0, 45.0, 41.0, 42.0, 45.0, 42.0, 37.0, 40.0, 34.0, 25.0, 30.0, 31.0, 17.0, 21.0, 21.0, 17.0, 16.0, 25.0, 10.0, 6.0, 5.0, 3.0, 5.0, 0.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-56.730491638183594, -55.174625396728516, -53.6187629699707, -52.062896728515625, -50.50703430175781, -48.951168060302734, -47.395301818847656, -45.839439392089844, -44.28357696533203, -42.72771072387695, -41.17184829711914, -39.61598205566406, -38.06011962890625, -36.50425338745117, -34.948387145996094, -33.39252471923828, -31.836658477783203, -30.280794143676758, -28.724929809570312, -27.169063568115234, -25.613201141357422, -24.057334899902344, -22.5014705657959, -20.945606231689453, -19.389741897583008, -17.833877563476562, -16.278013229370117, -14.722147941589355, -13.16628360748291, -11.610419273376465, -10.054553985595703, -8.498689651489258, -6.942829132080078, -5.386964797973633, -3.8310999870300293, -2.275235176086426, -0.7193708419799805, 0.8364934921264648, 2.3923587799072266, 3.948223114013672, 5.504087448120117, 7.0599517822265625, 8.615816116333008, 10.17168140411377, 11.727545738220215, 13.28341007232666, 14.839275360107422, 16.395139694213867, 17.951004028320312, 19.506868362426758, 21.062732696533203, 22.61859893798828, 24.174461364746094, 25.730327606201172, 27.286191940307617, 28.842056274414062, 30.397920608520508, 31.953784942626953, 33.50965118408203, 35.065513610839844, 36.62137985229492, 38.177242279052734, 39.73310852050781, 41.288970947265625, 42.8448371887207]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 9.0, 11.0, 11.0, 23.0, 40.0, 51.0, 93.0, 128.0, 210.0, 354.0, 563.0, 859.0, 1282.0, 2009.0, 3122.0, 4727.0, 7262.0, 11127.0, 16647.0, 24240.0, 34748.0, 48068.0, 63970.0, 80513.0, 94429.0, 104199.0, 105437.0, 100115.0, 87733.0, 71920.0, 55916.0, 40866.0, 28949.0, 20057.0, 13515.0, 8838.0, 5765.0, 3785.0, 2503.0, 1618.0, 1007.0, 669.0, 449.0, 266.0, 187.0, 91.0, 72.0, 48.0, 23.0, 19.0, 10.0, 4.0, 5.0, 3.0, 2.0, 1.0], "bins": [-32.65625, -31.702392578125, -30.74853515625, -29.794677734375, -28.8408203125, -27.886962890625, -26.93310546875, -25.979248046875, -25.025390625, -24.071533203125, -23.11767578125, -22.163818359375, -21.2099609375, -20.256103515625, -19.30224609375, -18.348388671875, -17.39453125, -16.440673828125, -15.48681640625, -14.532958984375, -13.5791015625, -12.625244140625, -11.67138671875, -10.717529296875, -9.763671875, -8.809814453125, -7.85595703125, -6.902099609375, -5.9482421875, -4.994384765625, -4.04052734375, -3.086669921875, -2.1328125, -1.178955078125, -0.22509765625, 0.728759765625, 1.6826171875, 2.636474609375, 3.59033203125, 4.544189453125, 5.498046875, 6.451904296875, 7.40576171875, 8.359619140625, 9.3134765625, 10.267333984375, 11.22119140625, 12.175048828125, 13.12890625, 14.082763671875, 15.03662109375, 15.990478515625, 16.9443359375, 17.898193359375, 18.85205078125, 19.805908203125, 20.759765625, 21.713623046875, 22.66748046875, 23.621337890625, 24.5751953125, 25.529052734375, 26.48291015625, 27.436767578125, 28.390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 6.0, 4.0, 2.0, 9.0, 6.0, 10.0, 15.0, 12.0, 21.0, 11.0, 27.0, 31.0, 23.0, 40.0, 35.0, 29.0, 36.0, 35.0, 45.0, 39.0, 36.0, 43.0, 41.0, 35.0, 51.0, 32.0, 32.0, 38.0, 34.0, 31.0, 19.0, 28.0, 24.0, 21.0, 20.0, 13.0, 8.0, 18.0, 13.0, 8.0, 10.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-50.8125, -49.4169921875, -48.021484375, -46.6259765625, -45.23046875, -43.8349609375, -42.439453125, -41.0439453125, -39.6484375, -38.2529296875, -36.857421875, -35.4619140625, -34.06640625, -32.6708984375, -31.275390625, -29.8798828125, -28.484375, -27.0888671875, -25.693359375, -24.2978515625, -22.90234375, -21.5068359375, -20.111328125, -18.7158203125, -17.3203125, -15.9248046875, -14.529296875, -13.1337890625, -11.73828125, -10.3427734375, -8.947265625, -7.5517578125, -6.15625, -4.7607421875, -3.365234375, -1.9697265625, -0.57421875, 0.8212890625, 2.216796875, 3.6123046875, 5.0078125, 6.4033203125, 7.798828125, 9.1943359375, 10.58984375, 11.9853515625, 13.380859375, 14.7763671875, 16.171875, 17.5673828125, 18.962890625, 20.3583984375, 21.75390625, 23.1494140625, 24.544921875, 25.9404296875, 27.3359375, 28.7314453125, 30.126953125, 31.5224609375, 32.91796875, 34.3134765625, 35.708984375, 37.1044921875, 38.5]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 6.0, 7.0, 8.0, 33.0, 55.0, 77.0, 115.0, 226.0, 358.0, 509.0, 844.0, 1332.0, 2060.0, 3229.0, 5107.0, 7945.0, 12442.0, 18378.0, 26769.0, 39058.0, 54026.0, 71789.0, 88862.0, 104032.0, 110916.0, 108697.0, 98298.0, 81919.0, 63473.0, 47355.0, 33657.0, 23046.0, 15568.0, 10185.0, 6558.0, 4283.0, 2646.0, 1752.0, 1113.0, 702.0, 417.0, 277.0, 184.0, 108.0, 57.0, 36.0, 17.0, 12.0, 8.0, 4.0, 3.0, 5.0, 1.0, 1.0], "bins": [-42.3125, -41.09619140625, -39.8798828125, -38.66357421875, -37.447265625, -36.23095703125, -35.0146484375, -33.79833984375, -32.58203125, -31.36572265625, -30.1494140625, -28.93310546875, -27.716796875, -26.50048828125, -25.2841796875, -24.06787109375, -22.8515625, -21.63525390625, -20.4189453125, -19.20263671875, -17.986328125, -16.77001953125, -15.5537109375, -14.33740234375, -13.12109375, -11.90478515625, -10.6884765625, -9.47216796875, -8.255859375, -7.03955078125, -5.8232421875, -4.60693359375, -3.390625, -2.17431640625, -0.9580078125, 0.25830078125, 1.474609375, 2.69091796875, 3.9072265625, 5.12353515625, 6.33984375, 7.55615234375, 8.7724609375, 9.98876953125, 11.205078125, 12.42138671875, 13.6376953125, 14.85400390625, 16.0703125, 17.28662109375, 18.5029296875, 19.71923828125, 20.935546875, 22.15185546875, 23.3681640625, 24.58447265625, 25.80078125, 27.01708984375, 28.2333984375, 29.44970703125, 30.666015625, 31.88232421875, 33.0986328125, 34.31494140625, 35.53125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 3.0, 3.0, 5.0, 12.0, 14.0, 21.0, 11.0, 23.0, 26.0, 25.0, 27.0, 32.0, 27.0, 37.0, 34.0, 44.0, 37.0, 47.0, 26.0, 46.0, 43.0, 36.0, 53.0, 28.0, 37.0, 30.0, 37.0, 34.0, 28.0, 37.0, 20.0, 17.0, 15.0, 15.0, 11.0, 7.0, 15.0, 9.0, 4.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.9375, -31.984375, -31.03125, -30.078125, -29.125, -28.171875, -27.21875, -26.265625, -25.3125, -24.359375, -23.40625, -22.453125, -21.5, -20.546875, -19.59375, -18.640625, -17.6875, -16.734375, -15.78125, -14.828125, -13.875, -12.921875, -11.96875, -11.015625, -10.0625, -9.109375, -8.15625, -7.203125, -6.25, -5.296875, -4.34375, -3.390625, -2.4375, -1.484375, -0.53125, 0.421875, 1.375, 2.328125, 3.28125, 4.234375, 5.1875, 6.140625, 7.09375, 8.046875, 9.0, 9.953125, 10.90625, 11.859375, 12.8125, 13.765625, 14.71875, 15.671875, 16.625, 17.578125, 18.53125, 19.484375, 20.4375, 21.390625, 22.34375, 23.296875, 24.25, 25.203125, 26.15625, 27.109375, 28.0625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 11.0, 11.0, 20.0, 29.0, 45.0, 64.0, 95.0, 134.0, 201.0, 316.0, 439.0, 730.0, 1188.0, 1932.0, 3170.0, 5159.0, 8377.0, 13529.0, 21633.0, 34756.0, 52675.0, 75986.0, 103619.0, 127321.0, 137029.0, 127711.0, 105843.0, 78568.0, 53851.0, 35391.0, 22439.0, 13764.0, 8598.0, 5242.0, 3242.0, 1937.0, 1238.0, 755.0, 534.0, 342.0, 196.0, 146.0, 100.0, 72.0, 37.0, 29.0, 18.0, 12.0, 7.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.9652099609375, -9.649169921875, -9.3331298828125, -9.01708984375, -8.7010498046875, -8.385009765625, -8.0689697265625, -7.7529296875, -7.4368896484375, -7.120849609375, -6.8048095703125, -6.48876953125, -6.1727294921875, -5.856689453125, -5.5406494140625, -5.224609375, -4.9085693359375, -4.592529296875, -4.2764892578125, -3.96044921875, -3.6444091796875, -3.328369140625, -3.0123291015625, -2.6962890625, -2.3802490234375, -2.064208984375, -1.7481689453125, -1.43212890625, -1.1160888671875, -0.800048828125, -0.4840087890625, -0.16796875, 0.1480712890625, 0.464111328125, 0.7801513671875, 1.09619140625, 1.4122314453125, 1.728271484375, 2.0443115234375, 2.3603515625, 2.6763916015625, 2.992431640625, 3.3084716796875, 3.62451171875, 3.9405517578125, 4.256591796875, 4.5726318359375, 4.888671875, 5.2047119140625, 5.520751953125, 5.8367919921875, 6.15283203125, 6.4688720703125, 6.784912109375, 7.1009521484375, 7.4169921875, 7.7330322265625, 8.049072265625, 8.3651123046875, 8.68115234375, 8.9971923828125, 9.313232421875, 9.6292724609375, 9.9453125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 3.0, 3.0, 7.0, 7.0, 7.0, 4.0, 5.0, 13.0, 16.0, 17.0, 17.0, 28.0, 19.0, 26.0, 33.0, 28.0, 41.0, 30.0, 49.0, 45.0, 42.0, 47.0, 36.0, 46.0, 50.0, 43.0, 37.0, 41.0, 37.0, 25.0, 18.0, 27.0, 29.0, 21.0, 20.0, 17.0, 10.0, 10.0, 10.0, 9.0, 0.0, 5.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010251998901367188, -0.0009941458702087402, -0.0009630918502807617, -0.0009320378303527832, -0.0009009838104248047, -0.0008699297904968262, -0.0008388757705688477, -0.0008078217506408691, -0.0007767677307128906, -0.0007457137107849121, -0.0007146596908569336, -0.0006836056709289551, -0.0006525516510009766, -0.000621497631072998, -0.0005904436111450195, -0.000559389591217041, -0.0005283355712890625, -0.000497281551361084, -0.00046622753143310547, -0.00043517351150512695, -0.00040411949157714844, -0.0003730654716491699, -0.0003420114517211914, -0.0003109574317932129, -0.0002799034118652344, -0.00024884939193725586, -0.00021779537200927734, -0.00018674135208129883, -0.0001556873321533203, -0.0001246333122253418, -9.357929229736328e-05, -6.252527236938477e-05, -3.147125244140625e-05, -4.172325134277344e-07, 3.063678741455078e-05, 6.16908073425293e-05, 9.274482727050781e-05, 0.00012379884719848633, 0.00015485286712646484, 0.00018590688705444336, 0.00021696090698242188, 0.0002480149269104004, 0.0002790689468383789, 0.0003101229667663574, 0.00034117698669433594, 0.00037223100662231445, 0.00040328502655029297, 0.0004343390464782715, 0.00046539306640625, 0.0004964470863342285, 0.000527501106262207, 0.0005585551261901855, 0.0005896091461181641, 0.0006206631660461426, 0.0006517171859741211, 0.0006827712059020996, 0.0007138252258300781, 0.0007448792457580566, 0.0007759332656860352, 0.0008069872856140137, 0.0008380413055419922, 0.0008690953254699707, 0.0009001493453979492, 0.0009312033653259277, 0.0009622573852539062]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 3.0, 8.0, 11.0, 20.0, 33.0, 42.0, 41.0, 80.0, 133.0, 191.0, 325.0, 557.0, 861.0, 1410.0, 2214.0, 3621.0, 5442.0, 8759.0, 13867.0, 21410.0, 32883.0, 48388.0, 68165.0, 89608.0, 108746.0, 120212.0, 119691.0, 107951.0, 88696.0, 66784.0, 47606.0, 32467.0, 21296.0, 13675.0, 8743.0, 5424.0, 3461.0, 2097.0, 1321.0, 845.0, 532.0, 332.0, 234.0, 118.0, 90.0, 55.0, 43.0, 27.0, 23.0, 10.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.2109375, -8.931640625, -8.65234375, -8.373046875, -8.09375, -7.814453125, -7.53515625, -7.255859375, -6.9765625, -6.697265625, -6.41796875, -6.138671875, -5.859375, -5.580078125, -5.30078125, -5.021484375, -4.7421875, -4.462890625, -4.18359375, -3.904296875, -3.625, -3.345703125, -3.06640625, -2.787109375, -2.5078125, -2.228515625, -1.94921875, -1.669921875, -1.390625, -1.111328125, -0.83203125, -0.552734375, -0.2734375, 0.005859375, 0.28515625, 0.564453125, 0.84375, 1.123046875, 1.40234375, 1.681640625, 1.9609375, 2.240234375, 2.51953125, 2.798828125, 3.078125, 3.357421875, 3.63671875, 3.916015625, 4.1953125, 4.474609375, 4.75390625, 5.033203125, 5.3125, 5.591796875, 5.87109375, 6.150390625, 6.4296875, 6.708984375, 6.98828125, 7.267578125, 7.546875, 7.826171875, 8.10546875, 8.384765625, 8.6640625]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 2.0, 6.0, 17.0, 11.0, 11.0, 17.0, 22.0, 20.0, 20.0, 28.0, 43.0, 44.0, 45.0, 50.0, 46.0, 41.0, 55.0, 50.0, 58.0, 47.0, 47.0, 47.0, 37.0, 43.0, 31.0, 27.0, 17.0, 15.0, 19.0, 12.0, 16.0, 6.0, 12.0, 5.0, 5.0, 3.0, 6.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.76953125, -4.64056396484375, -4.5115966796875, -4.38262939453125, -4.253662109375, -4.12469482421875, -3.9957275390625, -3.86676025390625, -3.73779296875, -3.60882568359375, -3.4798583984375, -3.35089111328125, -3.221923828125, -3.09295654296875, -2.9639892578125, -2.83502197265625, -2.7060546875, -2.57708740234375, -2.4481201171875, -2.31915283203125, -2.190185546875, -2.06121826171875, -1.9322509765625, -1.80328369140625, -1.67431640625, -1.54534912109375, -1.4163818359375, -1.28741455078125, -1.158447265625, -1.02947998046875, -0.9005126953125, -0.77154541015625, -0.642578125, -0.51361083984375, -0.3846435546875, -0.25567626953125, -0.126708984375, 0.00225830078125, 0.1312255859375, 0.26019287109375, 0.38916015625, 0.51812744140625, 0.6470947265625, 0.77606201171875, 0.905029296875, 1.03399658203125, 1.1629638671875, 1.29193115234375, 1.4208984375, 1.54986572265625, 1.6788330078125, 1.80780029296875, 1.936767578125, 2.06573486328125, 2.1947021484375, 2.32366943359375, 2.45263671875, 2.58160400390625, 2.7105712890625, 2.83953857421875, 2.968505859375, 3.09747314453125, 3.2264404296875, 3.35540771484375, 3.484375]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 3.0, 10.0, 7.0, 5.0, 10.0, 8.0, 12.0, 15.0, 17.0, 20.0, 28.0, 22.0, 31.0, 37.0, 37.0, 27.0, 40.0, 49.0, 36.0, 38.0, 43.0, 44.0, 35.0, 35.0, 34.0, 35.0, 44.0, 38.0, 32.0, 35.0, 29.0, 27.0, 14.0, 13.0, 11.0, 20.0, 12.0, 11.0, 9.0, 12.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-47.87879943847656, -46.54505157470703, -45.211299896240234, -43.8775520324707, -42.543800354003906, -41.210052490234375, -39.876304626464844, -38.54255294799805, -37.20880126953125, -35.87505340576172, -34.54130172729492, -33.20755386352539, -31.873802185058594, -30.540054321289062, -29.2063045501709, -27.872554779052734, -26.538806915283203, -25.20505714416504, -23.871307373046875, -22.537559509277344, -21.203807830810547, -19.870059967041016, -18.53631019592285, -17.202560424804688, -15.868810653686523, -14.53506088256836, -13.201311111450195, -11.867562294006348, -10.533812522888184, -9.20006275177002, -7.866313934326172, -6.532564163208008, -5.198810577392578, -3.865061044692993, -2.531311511993408, -1.1975622177124023, 0.13618755340576172, 1.4699373245239258, 2.8036861419677734, 4.1374359130859375, 5.471185684204102, 6.804935455322266, 8.13868522644043, 9.472434043884277, 10.806183815002441, 12.139933586120605, 13.473682403564453, 14.807432174682617, 16.14118194580078, 17.474931716918945, 18.80868148803711, 20.14242935180664, 21.476181030273438, 22.80992889404297, 24.143678665161133, 25.477428436279297, 26.81117820739746, 28.144927978515625, 29.47867774963379, 30.812427520751953, 32.146175384521484, 33.47992706298828, 34.81367492675781, 36.147422790527344, 37.48117446899414]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 8.0, 8.0, 10.0, 9.0, 11.0, 16.0, 14.0, 22.0, 33.0, 22.0, 34.0, 39.0, 46.0, 40.0, 30.0, 58.0, 34.0, 47.0, 37.0, 42.0, 45.0, 50.0, 50.0, 25.0, 27.0, 28.0, 41.0, 21.0, 25.0, 26.0, 19.0, 16.0, 16.0, 9.0, 15.0, 11.0, 4.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.19195556640625, -52.56753921508789, -50.94312286376953, -49.318702697753906, -47.69428634643555, -46.06986999511719, -44.44545364379883, -42.82103729248047, -41.196617126464844, -39.572200775146484, -37.947784423828125, -36.3233642578125, -34.69894790649414, -33.07453155517578, -31.450115203857422, -29.825698852539062, -28.201282501220703, -26.576866149902344, -24.95244789123535, -23.328031539916992, -21.70361328125, -20.07919692993164, -18.45478057861328, -16.830364227294922, -15.20594596862793, -13.581528663635254, -11.957111358642578, -10.332695007324219, -8.708277702331543, -7.083860397338867, -5.459444046020508, -3.835026741027832, -2.2106056213378906, -0.586188554763794, 1.0382285118103027, 2.6626453399658203, 4.287062644958496, 5.911479949951172, 7.535896301269531, 9.160313606262207, 10.784730911254883, 12.409148216247559, 14.033565521240234, 15.657981872558594, 17.282398223876953, 18.906816482543945, 20.531232833862305, 22.155651092529297, 23.780067443847656, 25.404483795166016, 27.028902053833008, 28.653318405151367, 30.27773666381836, 31.90215301513672, 33.52656936645508, 35.15098571777344, 36.77540588378906, 38.39982223510742, 40.02423858642578, 41.648658752441406, 43.273075103759766, 44.897491455078125, 46.521907806396484, 48.146324157714844, 49.7707405090332]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 5.0, 7.0, 8.0, 14.0, 17.0, 39.0, 57.0, 101.0, 169.0, 229.0, 402.0, 598.0, 1103.0, 1682.0, 2748.0, 4497.0, 7686.0, 12982.0, 21269.0, 35578.0, 59487.0, 96597.0, 155917.0, 240455.0, 347017.0, 458528.0, 539414.0, 554723.0, 496018.0, 390989.0, 278977.0, 185856.0, 117529.0, 72423.0, 44286.0, 26204.0, 16047.0, 9720.0, 5873.0, 3558.0, 2126.0, 1288.0, 790.0, 478.0, 305.0, 205.0, 109.0, 70.0, 52.0, 28.0, 10.0, 13.0, 7.0, 4.0, 1.0, 1.0], "bins": [-33.75, -32.791015625, -31.83203125, -30.873046875, -29.9140625, -28.955078125, -27.99609375, -27.037109375, -26.078125, -25.119140625, -24.16015625, -23.201171875, -22.2421875, -21.283203125, -20.32421875, -19.365234375, -18.40625, -17.447265625, -16.48828125, -15.529296875, -14.5703125, -13.611328125, -12.65234375, -11.693359375, -10.734375, -9.775390625, -8.81640625, -7.857421875, -6.8984375, -5.939453125, -4.98046875, -4.021484375, -3.0625, -2.103515625, -1.14453125, -0.185546875, 0.7734375, 1.732421875, 2.69140625, 3.650390625, 4.609375, 5.568359375, 6.52734375, 7.486328125, 8.4453125, 9.404296875, 10.36328125, 11.322265625, 12.28125, 13.240234375, 14.19921875, 15.158203125, 16.1171875, 17.076171875, 18.03515625, 18.994140625, 19.953125, 20.912109375, 21.87109375, 22.830078125, 23.7890625, 24.748046875, 25.70703125, 26.666015625, 27.625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 1.0, 4.0, 7.0, 6.0, 6.0, 13.0, 19.0, 9.0, 16.0, 18.0, 23.0, 30.0, 30.0, 39.0, 43.0, 36.0, 40.0, 38.0, 44.0, 48.0, 46.0, 44.0, 44.0, 36.0, 41.0, 38.0, 37.0, 34.0, 23.0, 26.0, 26.0, 23.0, 21.0, 16.0, 17.0, 16.0, 10.0, 7.0, 10.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.0, -42.7587890625, -41.517578125, -40.2763671875, -39.03515625, -37.7939453125, -36.552734375, -35.3115234375, -34.0703125, -32.8291015625, -31.587890625, -30.3466796875, -29.10546875, -27.8642578125, -26.623046875, -25.3818359375, -24.140625, -22.8994140625, -21.658203125, -20.4169921875, -19.17578125, -17.9345703125, -16.693359375, -15.4521484375, -14.2109375, -12.9697265625, -11.728515625, -10.4873046875, -9.24609375, -8.0048828125, -6.763671875, -5.5224609375, -4.28125, -3.0400390625, -1.798828125, -0.5576171875, 0.68359375, 1.9248046875, 3.166015625, 4.4072265625, 5.6484375, 6.8896484375, 8.130859375, 9.3720703125, 10.61328125, 11.8544921875, 13.095703125, 14.3369140625, 15.578125, 16.8193359375, 18.060546875, 19.3017578125, 20.54296875, 21.7841796875, 23.025390625, 24.2666015625, 25.5078125, 26.7490234375, 27.990234375, 29.2314453125, 30.47265625, 31.7138671875, 32.955078125, 34.1962890625, 35.4375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 13.0, 26.0, 52.0, 96.0, 139.0, 235.0, 399.0, 762.0, 1288.0, 2262.0, 3904.0, 6722.0, 11611.0, 19397.0, 32404.0, 53155.0, 85197.0, 131649.0, 195110.0, 275613.0, 367865.0, 448747.0, 496965.0, 494290.0, 438781.0, 353971.0, 262259.0, 184655.0, 123432.0, 79431.0, 49748.0, 30307.0, 18219.0, 10709.0, 6289.0, 3656.0, 2153.0, 1204.0, 670.0, 375.0, 232.0, 129.0, 68.0, 44.0, 27.0, 9.0, 7.0, 6.0, 1.0, 0.0, 1.0, 3.0], "bins": [-33.84375, -32.874755859375, -31.90576171875, -30.936767578125, -29.9677734375, -28.998779296875, -28.02978515625, -27.060791015625, -26.091796875, -25.122802734375, -24.15380859375, -23.184814453125, -22.2158203125, -21.246826171875, -20.27783203125, -19.308837890625, -18.33984375, -17.370849609375, -16.40185546875, -15.432861328125, -14.4638671875, -13.494873046875, -12.52587890625, -11.556884765625, -10.587890625, -9.618896484375, -8.64990234375, -7.680908203125, -6.7119140625, -5.742919921875, -4.77392578125, -3.804931640625, -2.8359375, -1.866943359375, -0.89794921875, 0.071044921875, 1.0400390625, 2.009033203125, 2.97802734375, 3.947021484375, 4.916015625, 5.885009765625, 6.85400390625, 7.822998046875, 8.7919921875, 9.760986328125, 10.72998046875, 11.698974609375, 12.66796875, 13.636962890625, 14.60595703125, 15.574951171875, 16.5439453125, 17.512939453125, 18.48193359375, 19.450927734375, 20.419921875, 21.388916015625, 22.35791015625, 23.326904296875, 24.2958984375, 25.264892578125, 26.23388671875, 27.202880859375, 28.171875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 9.0, 10.0, 9.0, 13.0, 28.0, 30.0, 40.0, 35.0, 64.0, 68.0, 97.0, 104.0, 128.0, 161.0, 170.0, 205.0, 208.0, 238.0, 225.0, 219.0, 237.0, 225.0, 223.0, 217.0, 165.0, 156.0, 152.0, 127.0, 96.0, 90.0, 62.0, 61.0, 51.0, 39.0, 25.0, 31.0, 9.0, 13.0, 11.0, 8.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5234375, -14.9927978515625, -14.462158203125, -13.9315185546875, -13.40087890625, -12.8702392578125, -12.339599609375, -11.8089599609375, -11.2783203125, -10.7476806640625, -10.217041015625, -9.6864013671875, -9.15576171875, -8.6251220703125, -8.094482421875, -7.5638427734375, -7.033203125, -6.5025634765625, -5.971923828125, -5.4412841796875, -4.91064453125, -4.3800048828125, -3.849365234375, -3.3187255859375, -2.7880859375, -2.2574462890625, -1.726806640625, -1.1961669921875, -0.66552734375, -0.1348876953125, 0.395751953125, 0.9263916015625, 1.45703125, 1.9876708984375, 2.518310546875, 3.0489501953125, 3.57958984375, 4.1102294921875, 4.640869140625, 5.1715087890625, 5.7021484375, 6.2327880859375, 6.763427734375, 7.2940673828125, 7.82470703125, 8.3553466796875, 8.885986328125, 9.4166259765625, 9.947265625, 10.4779052734375, 11.008544921875, 11.5391845703125, 12.06982421875, 12.6004638671875, 13.131103515625, 13.6617431640625, 14.1923828125, 14.7230224609375, 15.253662109375, 15.7843017578125, 16.31494140625, 16.8455810546875, 17.376220703125, 17.9068603515625, 18.4375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 3.0, 5.0, 10.0, 8.0, 14.0, 10.0, 19.0, 13.0, 16.0, 18.0, 19.0, 42.0, 25.0, 33.0, 42.0, 29.0, 43.0, 29.0, 36.0, 47.0, 39.0, 48.0, 43.0, 36.0, 41.0, 35.0, 40.0, 32.0, 32.0, 28.0, 31.0, 32.0, 19.0, 20.0, 13.0, 12.0, 9.0, 8.0, 4.0, 3.0, 5.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.386783599853516, -36.2636833190918, -35.14058303833008, -34.01748275756836, -32.894386291503906, -31.771284103393555, -30.64818572998047, -29.52508544921875, -28.40198516845703, -27.278884887695312, -26.155784606933594, -25.032686233520508, -23.90958595275879, -22.78648567199707, -21.663387298583984, -20.540287017822266, -19.417186737060547, -18.294086456298828, -17.17098617553711, -16.047887802124023, -14.924787521362305, -13.801687240600586, -12.678587913513184, -11.555488586425781, -10.432388305664062, -9.309288024902344, -8.186188697814941, -7.063088893890381, -5.93998908996582, -4.81688928604126, -3.693789482116699, -2.5706896781921387, -1.4475860595703125, -0.32448625564575195, 0.7986135482788086, 1.9217133522033691, 3.0448131561279297, 4.16791296005249, 5.291012763977051, 6.414112567901611, 7.537212371826172, 8.66031265258789, 9.783411979675293, 10.906511306762695, 12.029611587524414, 13.152711868286133, 14.275811195373535, 15.398910522460938, 16.522010803222656, 17.645111083984375, 18.768211364746094, 19.89130973815918, 21.0144100189209, 22.137510299682617, 23.260608673095703, 24.383708953857422, 25.50680923461914, 26.62990951538086, 27.753009796142578, 28.876108169555664, 29.999208450317383, 31.1223087310791, 32.24540710449219, 33.368507385253906, 34.491607666015625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 7.0, 8.0, 10.0, 7.0, 6.0, 7.0, 16.0, 15.0, 17.0, 16.0, 29.0, 34.0, 37.0, 19.0, 38.0, 37.0, 51.0, 50.0, 47.0, 39.0, 36.0, 38.0, 49.0, 43.0, 32.0, 38.0, 42.0, 31.0, 22.0, 28.0, 23.0, 16.0, 19.0, 18.0, 19.0, 15.0, 8.0, 14.0, 5.0, 5.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.15751647949219, -39.85011672973633, -38.542720794677734, -37.235321044921875, -35.927921295166016, -34.62052536010742, -33.31312561035156, -32.00572967529297, -30.69832992553711, -29.390932083129883, -28.083532333374023, -26.776134490966797, -25.46873664855957, -24.161338806152344, -22.853939056396484, -21.546541213989258, -20.2391414642334, -18.931743621826172, -17.624343872070312, -16.316946029663086, -15.00954818725586, -13.702149391174316, -12.394750595092773, -11.087352752685547, -9.779953956604004, -8.472555160522461, -7.165157318115234, -5.857758522033691, -4.550360202789307, -3.242961883544922, -1.935563087463379, -0.6281652450561523, 0.6792335510253906, 1.986631989479065, 3.2940304279327393, 4.601428985595703, 5.908827304840088, 7.216225624084473, 8.523624420166016, 9.831022262573242, 11.138421058654785, 12.445819854736328, 13.753217697143555, 15.060616493225098, 16.36801528930664, 17.675413131713867, 18.982810974121094, 20.290210723876953, 21.59760856628418, 22.905006408691406, 24.212406158447266, 25.519804000854492, 26.82720184326172, 28.134601593017578, 29.441999435424805, 30.74939727783203, 32.05679702758789, 33.36419677734375, 34.671592712402344, 35.9789924621582, 37.28639221191406, 38.593788146972656, 39.901187896728516, 41.208587646484375, 42.51598358154297]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 0.0, 6.0, 8.0, 3.0, 8.0, 10.0, 9.0, 11.0, 23.0, 29.0, 62.0, 59.0, 87.0, 132.0, 212.0, 305.0, 562.0, 946.0, 1668.0, 2838.0, 5218.0, 9304.0, 17001.0, 31814.0, 56990.0, 96841.0, 153104.0, 197340.0, 179735.0, 124176.0, 75210.0, 42722.0, 23275.0, 12706.0, 7042.0, 3773.0, 2156.0, 1264.0, 712.0, 428.0, 242.0, 176.0, 105.0, 85.0, 45.0, 31.0, 28.0, 17.0, 9.0, 6.0, 4.0, 9.0, 6.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.015625, -18.416748046875, -17.81787109375, -17.218994140625, -16.6201171875, -16.021240234375, -15.42236328125, -14.823486328125, -14.224609375, -13.625732421875, -13.02685546875, -12.427978515625, -11.8291015625, -11.230224609375, -10.63134765625, -10.032470703125, -9.43359375, -8.834716796875, -8.23583984375, -7.636962890625, -7.0380859375, -6.439208984375, -5.84033203125, -5.241455078125, -4.642578125, -4.043701171875, -3.44482421875, -2.845947265625, -2.2470703125, -1.648193359375, -1.04931640625, -0.450439453125, 0.1484375, 0.747314453125, 1.34619140625, 1.945068359375, 2.5439453125, 3.142822265625, 3.74169921875, 4.340576171875, 4.939453125, 5.538330078125, 6.13720703125, 6.736083984375, 7.3349609375, 7.933837890625, 8.53271484375, 9.131591796875, 9.73046875, 10.329345703125, 10.92822265625, 11.527099609375, 12.1259765625, 12.724853515625, 13.32373046875, 13.922607421875, 14.521484375, 15.120361328125, 15.71923828125, 16.318115234375, 16.9169921875, 17.515869140625, 18.11474609375, 18.713623046875, 19.3125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 5.0, 4.0, 6.0, 11.0, 14.0, 13.0, 20.0, 13.0, 16.0, 18.0, 15.0, 33.0, 36.0, 30.0, 38.0, 43.0, 37.0, 40.0, 40.0, 38.0, 41.0, 35.0, 34.0, 43.0, 45.0, 27.0, 35.0, 40.0, 33.0, 37.0, 15.0, 18.0, 16.0, 13.0, 18.0, 9.0, 14.0, 10.0, 6.0, 10.0, 5.0, 3.0, 4.0, 8.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-39.4375, -38.22412109375, -37.0107421875, -35.79736328125, -34.583984375, -33.37060546875, -32.1572265625, -30.94384765625, -29.73046875, -28.51708984375, -27.3037109375, -26.09033203125, -24.876953125, -23.66357421875, -22.4501953125, -21.23681640625, -20.0234375, -18.81005859375, -17.5966796875, -16.38330078125, -15.169921875, -13.95654296875, -12.7431640625, -11.52978515625, -10.31640625, -9.10302734375, -7.8896484375, -6.67626953125, -5.462890625, -4.24951171875, -3.0361328125, -1.82275390625, -0.609375, 0.60400390625, 1.8173828125, 3.03076171875, 4.244140625, 5.45751953125, 6.6708984375, 7.88427734375, 9.09765625, 10.31103515625, 11.5244140625, 12.73779296875, 13.951171875, 15.16455078125, 16.3779296875, 17.59130859375, 18.8046875, 20.01806640625, 21.2314453125, 22.44482421875, 23.658203125, 24.87158203125, 26.0849609375, 27.29833984375, 28.51171875, 29.72509765625, 30.9384765625, 32.15185546875, 33.365234375, 34.57861328125, 35.7919921875, 37.00537109375, 38.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 13.0, 10.0, 21.0, 33.0, 64.0, 93.0, 166.0, 307.0, 545.0, 1077.0, 2163.0, 4582.0, 9939.0, 23224.0, 57138.0, 137570.0, 264522.0, 278877.0, 155263.0, 65015.0, 26526.0, 11325.0, 5144.0, 2325.0, 1174.0, 657.0, 328.0, 196.0, 93.0, 70.0, 29.0, 23.0, 12.0, 8.0, 7.0, 3.0, 1.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.4453125, -14.8951416015625, -14.344970703125, -13.7947998046875, -13.24462890625, -12.6944580078125, -12.144287109375, -11.5941162109375, -11.0439453125, -10.4937744140625, -9.943603515625, -9.3934326171875, -8.84326171875, -8.2930908203125, -7.742919921875, -7.1927490234375, -6.642578125, -6.0924072265625, -5.542236328125, -4.9920654296875, -4.44189453125, -3.8917236328125, -3.341552734375, -2.7913818359375, -2.2412109375, -1.6910400390625, -1.140869140625, -0.5906982421875, -0.04052734375, 0.5096435546875, 1.059814453125, 1.6099853515625, 2.16015625, 2.7103271484375, 3.260498046875, 3.8106689453125, 4.36083984375, 4.9110107421875, 5.461181640625, 6.0113525390625, 6.5615234375, 7.1116943359375, 7.661865234375, 8.2120361328125, 8.76220703125, 9.3123779296875, 9.862548828125, 10.4127197265625, 10.962890625, 11.5130615234375, 12.063232421875, 12.6134033203125, 13.16357421875, 13.7137451171875, 14.263916015625, 14.8140869140625, 15.3642578125, 15.9144287109375, 16.464599609375, 17.0147705078125, 17.56494140625, 18.1151123046875, 18.665283203125, 19.2154541015625, 19.765625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 4.0, 7.0, 10.0, 9.0, 10.0, 9.0, 8.0, 19.0, 18.0, 26.0, 29.0, 31.0, 36.0, 36.0, 41.0, 32.0, 44.0, 37.0, 44.0, 43.0, 38.0, 44.0, 43.0, 42.0, 36.0, 42.0, 35.0, 29.0, 29.0, 21.0, 28.0, 24.0, 26.0, 17.0, 7.0, 11.0, 10.0, 10.0, 7.0, 2.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.875, -24.021484375, -23.16796875, -22.314453125, -21.4609375, -20.607421875, -19.75390625, -18.900390625, -18.046875, -17.193359375, -16.33984375, -15.486328125, -14.6328125, -13.779296875, -12.92578125, -12.072265625, -11.21875, -10.365234375, -9.51171875, -8.658203125, -7.8046875, -6.951171875, -6.09765625, -5.244140625, -4.390625, -3.537109375, -2.68359375, -1.830078125, -0.9765625, -0.123046875, 0.73046875, 1.583984375, 2.4375, 3.291015625, 4.14453125, 4.998046875, 5.8515625, 6.705078125, 7.55859375, 8.412109375, 9.265625, 10.119140625, 10.97265625, 11.826171875, 12.6796875, 13.533203125, 14.38671875, 15.240234375, 16.09375, 16.947265625, 17.80078125, 18.654296875, 19.5078125, 20.361328125, 21.21484375, 22.068359375, 22.921875, 23.775390625, 24.62890625, 25.482421875, 26.3359375, 27.189453125, 28.04296875, 28.896484375, 29.75]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 8.0, 7.0, 14.0, 28.0, 26.0, 28.0, 46.0, 69.0, 94.0, 133.0, 247.0, 361.0, 587.0, 1100.0, 2035.0, 4420.0, 11043.0, 34100.0, 153909.0, 559333.0, 213513.0, 43556.0, 13273.0, 5196.0, 2350.0, 1209.0, 698.0, 397.0, 237.0, 172.0, 94.0, 79.0, 50.0, 40.0, 29.0, 21.0, 10.0, 8.0, 9.0, 5.0, 5.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.28125, -9.9658203125, -9.650390625, -9.3349609375, -9.01953125, -8.7041015625, -8.388671875, -8.0732421875, -7.7578125, -7.4423828125, -7.126953125, -6.8115234375, -6.49609375, -6.1806640625, -5.865234375, -5.5498046875, -5.234375, -4.9189453125, -4.603515625, -4.2880859375, -3.97265625, -3.6572265625, -3.341796875, -3.0263671875, -2.7109375, -2.3955078125, -2.080078125, -1.7646484375, -1.44921875, -1.1337890625, -0.818359375, -0.5029296875, -0.1875, 0.1279296875, 0.443359375, 0.7587890625, 1.07421875, 1.3896484375, 1.705078125, 2.0205078125, 2.3359375, 2.6513671875, 2.966796875, 3.2822265625, 3.59765625, 3.9130859375, 4.228515625, 4.5439453125, 4.859375, 5.1748046875, 5.490234375, 5.8056640625, 6.12109375, 6.4365234375, 6.751953125, 7.0673828125, 7.3828125, 7.6982421875, 8.013671875, 8.3291015625, 8.64453125, 8.9599609375, 9.275390625, 9.5908203125, 9.90625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 6.0, 3.0, 2.0, 8.0, 5.0, 12.0, 8.0, 9.0, 15.0, 18.0, 24.0, 29.0, 52.0, 66.0, 90.0, 114.0, 113.0, 122.0, 76.0, 60.0, 43.0, 29.0, 13.0, 18.0, 21.0, 14.0, 7.0, 10.0, 8.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0013628005981445312, -0.0013146549463272095, -0.0012665092945098877, -0.001218363642692566, -0.0011702179908752441, -0.0011220723390579224, -0.0010739266872406006, -0.0010257810354232788, -0.000977635383605957, -0.0009294897317886353, -0.0008813440799713135, -0.0008331984281539917, -0.0007850527763366699, -0.0007369071245193481, -0.0006887614727020264, -0.0006406158208847046, -0.0005924701690673828, -0.000544324517250061, -0.0004961788654327393, -0.0004480332136154175, -0.0003998875617980957, -0.0003517419099807739, -0.00030359625816345215, -0.00025545060634613037, -0.0002073049545288086, -0.00015915930271148682, -0.00011101365089416504, -6.286799907684326e-05, -1.4722347259521484e-05, 3.342330455780029e-05, 8.156895637512207e-05, 0.00012971460819244385, 0.00017786026000976562, 0.0002260059118270874, 0.0002741515636444092, 0.00032229721546173096, 0.00037044286727905273, 0.0004185885190963745, 0.0004667341709136963, 0.0005148798227310181, 0.0005630254745483398, 0.0006111711263656616, 0.0006593167781829834, 0.0007074624300003052, 0.000755608081817627, 0.0008037537336349487, 0.0008518993854522705, 0.0009000450372695923, 0.0009481906890869141, 0.0009963363409042358, 0.0010444819927215576, 0.0010926276445388794, 0.0011407732963562012, 0.001188918948173523, 0.0012370645999908447, 0.0012852102518081665, 0.0013333559036254883, 0.00138150155544281, 0.0014296472072601318, 0.0014777928590774536, 0.0015259385108947754, 0.0015740841627120972, 0.001622229814529419, 0.0016703754663467407, 0.0017185211181640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 9.0, 8.0, 13.0, 17.0, 19.0, 26.0, 39.0, 70.0, 102.0, 138.0, 188.0, 286.0, 413.0, 634.0, 975.0, 1682.0, 2716.0, 4651.0, 8953.0, 16492.0, 33447.0, 66438.0, 130745.0, 224042.0, 243332.0, 150942.0, 78599.0, 39813.0, 19797.0, 10255.0, 5581.0, 3065.0, 1820.0, 1155.0, 697.0, 459.0, 302.0, 184.0, 133.0, 104.0, 59.0, 46.0, 42.0, 25.0, 19.0, 10.0, 9.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.234375, -7.97802734375, -7.7216796875, -7.46533203125, -7.208984375, -6.95263671875, -6.6962890625, -6.43994140625, -6.18359375, -5.92724609375, -5.6708984375, -5.41455078125, -5.158203125, -4.90185546875, -4.6455078125, -4.38916015625, -4.1328125, -3.87646484375, -3.6201171875, -3.36376953125, -3.107421875, -2.85107421875, -2.5947265625, -2.33837890625, -2.08203125, -1.82568359375, -1.5693359375, -1.31298828125, -1.056640625, -0.80029296875, -0.5439453125, -0.28759765625, -0.03125, 0.22509765625, 0.4814453125, 0.73779296875, 0.994140625, 1.25048828125, 1.5068359375, 1.76318359375, 2.01953125, 2.27587890625, 2.5322265625, 2.78857421875, 3.044921875, 3.30126953125, 3.5576171875, 3.81396484375, 4.0703125, 4.32666015625, 4.5830078125, 4.83935546875, 5.095703125, 5.35205078125, 5.6083984375, 5.86474609375, 6.12109375, 6.37744140625, 6.6337890625, 6.89013671875, 7.146484375, 7.40283203125, 7.6591796875, 7.91552734375, 8.171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 0.0, 6.0, 10.0, 10.0, 10.0, 17.0, 44.0, 49.0, 86.0, 80.0, 95.0, 89.0, 113.0, 97.0, 75.0, 62.0, 60.0, 33.0, 16.0, 15.0, 8.0, 4.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.4375, -4.306884765625, -4.17626953125, -4.045654296875, -3.9150390625, -3.784423828125, -3.65380859375, -3.523193359375, -3.392578125, -3.261962890625, -3.13134765625, -3.000732421875, -2.8701171875, -2.739501953125, -2.60888671875, -2.478271484375, -2.34765625, -2.217041015625, -2.08642578125, -1.955810546875, -1.8251953125, -1.694580078125, -1.56396484375, -1.433349609375, -1.302734375, -1.172119140625, -1.04150390625, -0.910888671875, -0.7802734375, -0.649658203125, -0.51904296875, -0.388427734375, -0.2578125, -0.127197265625, 0.00341796875, 0.134033203125, 0.2646484375, 0.395263671875, 0.52587890625, 0.656494140625, 0.787109375, 0.917724609375, 1.04833984375, 1.178955078125, 1.3095703125, 1.440185546875, 1.57080078125, 1.701416015625, 1.83203125, 1.962646484375, 2.09326171875, 2.223876953125, 2.3544921875, 2.485107421875, 2.61572265625, 2.746337890625, 2.876953125, 3.007568359375, 3.13818359375, 3.268798828125, 3.3994140625, 3.530029296875, 3.66064453125, 3.791259765625, 3.921875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 8.0, 5.0, 5.0, 4.0, 14.0, 13.0, 13.0, 20.0, 20.0, 20.0, 23.0, 26.0, 20.0, 39.0, 40.0, 35.0, 29.0, 36.0, 50.0, 40.0, 40.0, 40.0, 50.0, 39.0, 37.0, 47.0, 34.0, 45.0, 26.0, 31.0, 20.0, 27.0, 27.0, 21.0, 17.0, 11.0, 3.0, 8.0, 2.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-38.30130386352539, -37.19415283203125, -36.087005615234375, -34.979854583740234, -33.872703552246094, -32.76555633544922, -31.658405303955078, -30.551254272460938, -29.44410514831543, -28.336956024169922, -27.22980499267578, -26.122655868530273, -25.015506744384766, -23.908355712890625, -22.801206588745117, -21.69405746459961, -20.58690643310547, -19.47975730895996, -18.37260627746582, -17.265457153320312, -16.158306121826172, -15.051156997680664, -13.944007873535156, -12.836857795715332, -11.729707717895508, -10.622557640075684, -9.51540756225586, -8.408258438110352, -7.301108360290527, -6.193958282470703, -5.086808681488037, -3.979659080505371, -2.8725128173828125, -1.7653629779815674, -0.6582131385803223, 0.44893670082092285, 1.556086540222168, 2.663236618041992, 3.770386219024658, 4.877535820007324, 5.984685897827148, 7.091835975646973, 8.198986053466797, 9.306135177612305, 10.413285255432129, 11.520435333251953, 12.627584457397461, 13.734734535217285, 14.84188461303711, 15.949034690856934, 17.056184768676758, 18.163333892822266, 19.270484924316406, 20.377634048461914, 21.484783172607422, 22.591934204101562, 23.69908332824707, 24.806232452392578, 25.91338348388672, 27.020532608032227, 28.127681732177734, 29.234832763671875, 30.341981887817383, 31.44913101196289, 32.55628204345703]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 11.0, 9.0, 6.0, 8.0, 11.0, 9.0, 20.0, 20.0, 17.0, 35.0, 36.0, 31.0, 27.0, 39.0, 46.0, 43.0, 49.0, 40.0, 40.0, 41.0, 35.0, 56.0, 34.0, 36.0, 39.0, 42.0, 28.0, 24.0, 25.0, 18.0, 17.0, 18.0, 18.0, 10.0, 16.0, 11.0, 9.0, 3.0, 4.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.1461181640625, -37.879295349121094, -36.61247253417969, -35.34564971923828, -34.078826904296875, -32.81200408935547, -31.54517936706543, -30.278356552124023, -29.011533737182617, -27.74471092224121, -26.477888107299805, -25.2110652923584, -23.94424057006836, -22.677417755126953, -21.410594940185547, -20.14377212524414, -18.876949310302734, -17.610126495361328, -16.343303680419922, -15.0764799118042, -13.809657096862793, -12.542834281921387, -11.276010513305664, -10.009187698364258, -8.742364883422852, -7.475542068481445, -6.208718776702881, -4.941895484924316, -3.67507266998291, -2.408249855041504, -1.1414265632629395, 0.125396728515625, 1.3922233581542969, 2.6590464115142822, 3.9258694648742676, 5.192692756652832, 6.459515571594238, 7.7263383865356445, 8.993162155151367, 10.259984970092773, 11.52680778503418, 12.793630599975586, 14.060453414916992, 15.327277183532715, 16.594100952148438, 17.860923767089844, 19.12774658203125, 20.394569396972656, 21.661392211914062, 22.92821502685547, 24.195037841796875, 25.46186065673828, 26.728683471679688, 27.995506286621094, 29.262331008911133, 30.52915382385254, 31.795976638793945, 33.062801361083984, 34.32962417602539, 35.5964469909668, 36.8632698059082, 38.13009262084961, 39.396915435791016, 40.66373825073242, 41.93056106567383]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 9.0, 6.0, 13.0, 18.0, 22.0, 47.0, 54.0, 95.0, 144.0, 226.0, 364.0, 579.0, 879.0, 1405.0, 2059.0, 3379.0, 5286.0, 8133.0, 12288.0, 18434.0, 26647.0, 37764.0, 51348.0, 66999.0, 81942.0, 94460.0, 102553.0, 103182.0, 96896.0, 84710.0, 69371.0, 54100.0, 39421.0, 28393.0, 19904.0, 13329.0, 8571.0, 5548.0, 3560.0, 2366.0, 1445.0, 925.0, 627.0, 392.0, 262.0, 147.0, 94.0, 60.0, 41.0, 27.0, 8.0, 9.0, 10.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.71875, -24.891357421875, -24.06396484375, -23.236572265625, -22.4091796875, -21.581787109375, -20.75439453125, -19.927001953125, -19.099609375, -18.272216796875, -17.44482421875, -16.617431640625, -15.7900390625, -14.962646484375, -14.13525390625, -13.307861328125, -12.48046875, -11.653076171875, -10.82568359375, -9.998291015625, -9.1708984375, -8.343505859375, -7.51611328125, -6.688720703125, -5.861328125, -5.033935546875, -4.20654296875, -3.379150390625, -2.5517578125, -1.724365234375, -0.89697265625, -0.069580078125, 0.7578125, 1.585205078125, 2.41259765625, 3.239990234375, 4.0673828125, 4.894775390625, 5.72216796875, 6.549560546875, 7.376953125, 8.204345703125, 9.03173828125, 9.859130859375, 10.6865234375, 11.513916015625, 12.34130859375, 13.168701171875, 13.99609375, 14.823486328125, 15.65087890625, 16.478271484375, 17.3056640625, 18.133056640625, 18.96044921875, 19.787841796875, 20.615234375, 21.442626953125, 22.27001953125, 23.097412109375, 23.9248046875, 24.752197265625, 25.57958984375, 26.406982421875, 27.234375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 8.0, 8.0, 8.0, 8.0, 8.0, 17.0, 20.0, 22.0, 29.0, 28.0, 37.0, 34.0, 31.0, 44.0, 32.0, 47.0, 45.0, 43.0, 46.0, 43.0, 44.0, 40.0, 41.0, 35.0, 36.0, 35.0, 19.0, 27.0, 29.0, 15.0, 18.0, 14.0, 9.0, 15.0, 13.0, 14.0, 7.0, 6.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-43.8125, -42.57568359375, -41.3388671875, -40.10205078125, -38.865234375, -37.62841796875, -36.3916015625, -35.15478515625, -33.91796875, -32.68115234375, -31.4443359375, -30.20751953125, -28.970703125, -27.73388671875, -26.4970703125, -25.26025390625, -24.0234375, -22.78662109375, -21.5498046875, -20.31298828125, -19.076171875, -17.83935546875, -16.6025390625, -15.36572265625, -14.12890625, -12.89208984375, -11.6552734375, -10.41845703125, -9.181640625, -7.94482421875, -6.7080078125, -5.47119140625, -4.234375, -2.99755859375, -1.7607421875, -0.52392578125, 0.712890625, 1.94970703125, 3.1865234375, 4.42333984375, 5.66015625, 6.89697265625, 8.1337890625, 9.37060546875, 10.607421875, 11.84423828125, 13.0810546875, 14.31787109375, 15.5546875, 16.79150390625, 18.0283203125, 19.26513671875, 20.501953125, 21.73876953125, 22.9755859375, 24.21240234375, 25.44921875, 26.68603515625, 27.9228515625, 29.15966796875, 30.396484375, 31.63330078125, 32.8701171875, 34.10693359375, 35.34375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 10.0, 11.0, 20.0, 43.0, 63.0, 114.0, 155.0, 237.0, 423.0, 618.0, 1004.0, 1545.0, 2493.0, 3523.0, 5378.0, 8032.0, 11724.0, 17222.0, 24157.0, 33071.0, 44742.0, 58048.0, 71131.0, 83445.0, 92778.0, 96393.0, 94841.0, 87866.0, 75858.0, 62235.0, 48423.0, 36772.0, 26661.0, 18985.0, 13436.0, 9042.0, 6269.0, 4186.0, 2704.0, 1747.0, 1203.0, 732.0, 465.0, 256.0, 166.0, 121.0, 90.0, 47.0, 31.0, 16.0, 12.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-27.09375, -26.238037109375, -25.38232421875, -24.526611328125, -23.6708984375, -22.815185546875, -21.95947265625, -21.103759765625, -20.248046875, -19.392333984375, -18.53662109375, -17.680908203125, -16.8251953125, -15.969482421875, -15.11376953125, -14.258056640625, -13.40234375, -12.546630859375, -11.69091796875, -10.835205078125, -9.9794921875, -9.123779296875, -8.26806640625, -7.412353515625, -6.556640625, -5.700927734375, -4.84521484375, -3.989501953125, -3.1337890625, -2.278076171875, -1.42236328125, -0.566650390625, 0.2890625, 1.144775390625, 2.00048828125, 2.856201171875, 3.7119140625, 4.567626953125, 5.42333984375, 6.279052734375, 7.134765625, 7.990478515625, 8.84619140625, 9.701904296875, 10.5576171875, 11.413330078125, 12.26904296875, 13.124755859375, 13.98046875, 14.836181640625, 15.69189453125, 16.547607421875, 17.4033203125, 18.259033203125, 19.11474609375, 19.970458984375, 20.826171875, 21.681884765625, 22.53759765625, 23.393310546875, 24.2490234375, 25.104736328125, 25.96044921875, 26.816162109375, 27.671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 2.0, 1.0, 4.0, 7.0, 8.0, 11.0, 17.0, 13.0, 23.0, 15.0, 23.0, 15.0, 25.0, 19.0, 24.0, 30.0, 29.0, 37.0, 30.0, 44.0, 33.0, 42.0, 37.0, 46.0, 33.0, 40.0, 37.0, 35.0, 30.0, 29.0, 22.0, 34.0, 31.0, 30.0, 25.0, 15.0, 22.0, 12.0, 10.0, 17.0, 6.0, 7.0, 6.0, 9.0, 8.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.03125, -21.310546875, -20.58984375, -19.869140625, -19.1484375, -18.427734375, -17.70703125, -16.986328125, -16.265625, -15.544921875, -14.82421875, -14.103515625, -13.3828125, -12.662109375, -11.94140625, -11.220703125, -10.5, -9.779296875, -9.05859375, -8.337890625, -7.6171875, -6.896484375, -6.17578125, -5.455078125, -4.734375, -4.013671875, -3.29296875, -2.572265625, -1.8515625, -1.130859375, -0.41015625, 0.310546875, 1.03125, 1.751953125, 2.47265625, 3.193359375, 3.9140625, 4.634765625, 5.35546875, 6.076171875, 6.796875, 7.517578125, 8.23828125, 8.958984375, 9.6796875, 10.400390625, 11.12109375, 11.841796875, 12.5625, 13.283203125, 14.00390625, 14.724609375, 15.4453125, 16.166015625, 16.88671875, 17.607421875, 18.328125, 19.048828125, 19.76953125, 20.490234375, 21.2109375, 21.931640625, 22.65234375, 23.373046875, 24.09375]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 9.0, 13.0, 11.0, 22.0, 26.0, 47.0, 45.0, 78.0, 94.0, 133.0, 185.0, 246.0, 370.0, 543.0, 857.0, 1333.0, 2308.0, 4093.0, 7684.0, 14622.0, 28705.0, 55453.0, 99709.0, 155026.0, 193389.0, 182282.0, 132568.0, 78631.0, 42670.0, 21706.0, 11450.0, 5930.0, 3206.0, 1743.0, 1134.0, 658.0, 479.0, 298.0, 222.0, 144.0, 107.0, 87.0, 75.0, 48.0, 35.0, 22.0, 18.0, 11.0, 7.0, 10.0, 4.0, 8.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-15.671875, -15.178955078125, -14.68603515625, -14.193115234375, -13.7001953125, -13.207275390625, -12.71435546875, -12.221435546875, -11.728515625, -11.235595703125, -10.74267578125, -10.249755859375, -9.7568359375, -9.263916015625, -8.77099609375, -8.278076171875, -7.78515625, -7.292236328125, -6.79931640625, -6.306396484375, -5.8134765625, -5.320556640625, -4.82763671875, -4.334716796875, -3.841796875, -3.348876953125, -2.85595703125, -2.363037109375, -1.8701171875, -1.377197265625, -0.88427734375, -0.391357421875, 0.1015625, 0.594482421875, 1.08740234375, 1.580322265625, 2.0732421875, 2.566162109375, 3.05908203125, 3.552001953125, 4.044921875, 4.537841796875, 5.03076171875, 5.523681640625, 6.0166015625, 6.509521484375, 7.00244140625, 7.495361328125, 7.98828125, 8.481201171875, 8.97412109375, 9.467041015625, 9.9599609375, 10.452880859375, 10.94580078125, 11.438720703125, 11.931640625, 12.424560546875, 12.91748046875, 13.410400390625, 13.9033203125, 14.396240234375, 14.88916015625, 15.382080078125, 15.875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 5.0, 6.0, 6.0, 12.0, 7.0, 7.0, 17.0, 28.0, 28.0, 28.0, 43.0, 38.0, 49.0, 65.0, 49.0, 63.0, 62.0, 64.0, 52.0, 59.0, 47.0, 56.0, 46.0, 35.0, 19.0, 26.0, 17.0, 9.0, 11.0, 8.0, 10.0, 6.0, 7.0, 1.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0014410018920898438, -0.0013992488384246826, -0.0013574957847595215, -0.0013157427310943604, -0.0012739896774291992, -0.001232236623764038, -0.001190483570098877, -0.0011487305164337158, -0.0011069774627685547, -0.0010652244091033936, -0.0010234713554382324, -0.0009817183017730713, -0.0009399652481079102, -0.000898212194442749, -0.0008564591407775879, -0.0008147060871124268, -0.0007729530334472656, -0.0007311999797821045, -0.0006894469261169434, -0.0006476938724517822, -0.0006059408187866211, -0.00056418776512146, -0.0005224347114562988, -0.0004806816577911377, -0.00043892860412597656, -0.00039717555046081543, -0.0003554224967956543, -0.00031366944313049316, -0.00027191638946533203, -0.0002301633358001709, -0.00018841028213500977, -0.00014665722846984863, -0.0001049041748046875, -6.315112113952637e-05, -2.1398067474365234e-05, 2.03549861907959e-05, 6.210803985595703e-05, 0.00010386109352111816, 0.0001456141471862793, 0.00018736720085144043, 0.00022912025451660156, 0.0002708733081817627, 0.00031262636184692383, 0.00035437941551208496, 0.0003961324691772461, 0.0004378855228424072, 0.00047963857650756836, 0.0005213916301727295, 0.0005631446838378906, 0.0006048977375030518, 0.0006466507911682129, 0.000688403844833374, 0.0007301568984985352, 0.0007719099521636963, 0.0008136630058288574, 0.0008554160594940186, 0.0008971691131591797, 0.0009389221668243408, 0.000980675220489502, 0.001022428274154663, 0.0010641813278198242, 0.0011059343814849854, 0.0011476874351501465, 0.0011894404888153076, 0.0012311935424804688]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 10.0, 18.0, 28.0, 39.0, 48.0, 80.0, 136.0, 252.0, 325.0, 661.0, 1016.0, 1845.0, 3198.0, 5665.0, 10208.0, 17458.0, 29899.0, 50524.0, 78807.0, 113129.0, 141379.0, 152656.0, 140353.0, 109577.0, 76051.0, 48012.0, 28772.0, 16379.0, 9439.0, 5245.0, 3073.0, 1651.0, 1046.0, 618.0, 371.0, 214.0, 144.0, 86.0, 57.0, 29.0, 26.0, 14.0, 6.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.1484375, -12.75537109375, -12.3623046875, -11.96923828125, -11.576171875, -11.18310546875, -10.7900390625, -10.39697265625, -10.00390625, -9.61083984375, -9.2177734375, -8.82470703125, -8.431640625, -8.03857421875, -7.6455078125, -7.25244140625, -6.859375, -6.46630859375, -6.0732421875, -5.68017578125, -5.287109375, -4.89404296875, -4.5009765625, -4.10791015625, -3.71484375, -3.32177734375, -2.9287109375, -2.53564453125, -2.142578125, -1.74951171875, -1.3564453125, -0.96337890625, -0.5703125, -0.17724609375, 0.2158203125, 0.60888671875, 1.001953125, 1.39501953125, 1.7880859375, 2.18115234375, 2.57421875, 2.96728515625, 3.3603515625, 3.75341796875, 4.146484375, 4.53955078125, 4.9326171875, 5.32568359375, 5.71875, 6.11181640625, 6.5048828125, 6.89794921875, 7.291015625, 7.68408203125, 8.0771484375, 8.47021484375, 8.86328125, 9.25634765625, 9.6494140625, 10.04248046875, 10.435546875, 10.82861328125, 11.2216796875, 11.61474609375, 12.0078125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 11.0, 6.0, 4.0, 9.0, 16.0, 20.0, 17.0, 23.0, 24.0, 38.0, 45.0, 59.0, 52.0, 56.0, 62.0, 57.0, 77.0, 71.0, 72.0, 43.0, 50.0, 49.0, 25.0, 25.0, 20.0, 15.0, 11.0, 12.0, 5.0, 10.0, 3.0, 5.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.65625, -5.47161865234375, -5.2869873046875, -5.10235595703125, -4.917724609375, -4.73309326171875, -4.5484619140625, -4.36383056640625, -4.17919921875, -3.99456787109375, -3.8099365234375, -3.62530517578125, -3.440673828125, -3.25604248046875, -3.0714111328125, -2.88677978515625, -2.7021484375, -2.51751708984375, -2.3328857421875, -2.14825439453125, -1.963623046875, -1.77899169921875, -1.5943603515625, -1.40972900390625, -1.22509765625, -1.04046630859375, -0.8558349609375, -0.67120361328125, -0.486572265625, -0.30194091796875, -0.1173095703125, 0.06732177734375, 0.251953125, 0.43658447265625, 0.6212158203125, 0.80584716796875, 0.990478515625, 1.17510986328125, 1.3597412109375, 1.54437255859375, 1.72900390625, 1.91363525390625, 2.0982666015625, 2.28289794921875, 2.467529296875, 2.65216064453125, 2.8367919921875, 3.02142333984375, 3.2060546875, 3.39068603515625, 3.5753173828125, 3.75994873046875, 3.944580078125, 4.12921142578125, 4.3138427734375, 4.49847412109375, 4.68310546875, 4.86773681640625, 5.0523681640625, 5.23699951171875, 5.421630859375, 5.60626220703125, 5.7908935546875, 5.97552490234375, 6.16015625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 4.0, 1.0, 5.0, 11.0, 10.0, 7.0, 9.0, 7.0, 14.0, 11.0, 20.0, 21.0, 28.0, 23.0, 25.0, 27.0, 26.0, 26.0, 36.0, 32.0, 42.0, 36.0, 36.0, 32.0, 44.0, 38.0, 36.0, 38.0, 42.0, 35.0, 37.0, 25.0, 27.0, 31.0, 27.0, 23.0, 11.0, 23.0, 10.0, 16.0, 12.0, 11.0, 11.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-32.09178161621094, -31.142948150634766, -30.194114685058594, -29.245281219482422, -28.29644775390625, -27.347614288330078, -26.398780822753906, -25.449947357177734, -24.501113891601562, -23.55228042602539, -22.60344696044922, -21.654613494873047, -20.705780029296875, -19.756946563720703, -18.80811309814453, -17.85927963256836, -16.910446166992188, -15.961612701416016, -15.012779235839844, -14.063945770263672, -13.1151123046875, -12.166278839111328, -11.217445373535156, -10.268611907958984, -9.319778442382812, -8.37094497680664, -7.422111511230469, -6.473278045654297, -5.524444580078125, -4.575611114501953, -3.6267776489257812, -2.6779441833496094, -1.7291126251220703, -0.7802791595458984, 0.16855430603027344, 1.1173877716064453, 2.066221237182617, 3.015054702758789, 3.963888168334961, 4.912721633911133, 5.861555099487305, 6.810388565063477, 7.759222030639648, 8.70805549621582, 9.656888961791992, 10.605722427368164, 11.554555892944336, 12.503389358520508, 13.45222282409668, 14.401056289672852, 15.349889755249023, 16.298723220825195, 17.247556686401367, 18.19639015197754, 19.14522361755371, 20.094057083129883, 21.042890548706055, 21.991724014282227, 22.9405574798584, 23.88939094543457, 24.838224411010742, 25.787057876586914, 26.735891342163086, 27.684724807739258, 28.63355827331543]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 11.0, 4.0, 9.0, 6.0, 12.0, 17.0, 14.0, 12.0, 15.0, 19.0, 27.0, 24.0, 36.0, 38.0, 35.0, 36.0, 45.0, 32.0, 45.0, 48.0, 35.0, 52.0, 45.0, 35.0, 43.0, 38.0, 33.0, 41.0, 34.0, 28.0, 18.0, 22.0, 22.0, 16.0, 14.0, 11.0, 6.0, 8.0, 5.0, 4.0, 5.0, 5.0, 0.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-42.34571075439453, -41.03445053100586, -39.72319030761719, -38.41193389892578, -37.10067367553711, -35.78941345214844, -34.478153228759766, -33.166893005371094, -31.855634689331055, -30.544374465942383, -29.233116149902344, -27.921855926513672, -26.610595703125, -25.29933738708496, -23.98807716369629, -22.67681884765625, -21.365558624267578, -20.054298400878906, -18.743040084838867, -17.431779861450195, -16.120521545410156, -14.809261322021484, -13.498001098632812, -12.186741828918457, -10.875482559204102, -9.564223289489746, -8.25296401977539, -6.941703796386719, -5.630444526672363, -4.319185256958008, -3.007925510406494, -1.6966657638549805, -0.3854026794433594, 0.9258568286895752, 2.2371163368225098, 3.5483758449554443, 4.859635353088379, 6.170894622802734, 7.482154369354248, 8.793414115905762, 10.104673385620117, 11.415932655334473, 12.727191925048828, 14.0384521484375, 15.349711418151855, 16.66097068786621, 17.972230911254883, 19.283489227294922, 20.594749450683594, 21.906009674072266, 23.217267990112305, 24.528528213500977, 25.839786529541016, 27.151046752929688, 28.46230697631836, 29.77356719970703, 31.08482551574707, 32.39608383178711, 33.70734405517578, 35.01860427856445, 36.329864501953125, 37.64112091064453, 38.9523811340332, 40.263641357421875, 41.57490158081055]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 6.0, 13.0, 25.0, 33.0, 47.0, 81.0, 139.0, 265.0, 391.0, 665.0, 1193.0, 2035.0, 3361.0, 5908.0, 10023.0, 16822.0, 28450.0, 46892.0, 76656.0, 121951.0, 188291.0, 274831.0, 373979.0, 466791.0, 521445.0, 518542.0, 453939.0, 357404.0, 258461.0, 175922.0, 112480.0, 70667.0, 42850.0, 26035.0, 15440.0, 9068.0, 5449.0, 3204.0, 1869.0, 1077.0, 654.0, 384.0, 230.0, 116.0, 84.0, 56.0, 25.0, 22.0, 8.0, 7.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-26.640625, -25.80615234375, -24.9716796875, -24.13720703125, -23.302734375, -22.46826171875, -21.6337890625, -20.79931640625, -19.96484375, -19.13037109375, -18.2958984375, -17.46142578125, -16.626953125, -15.79248046875, -14.9580078125, -14.12353515625, -13.2890625, -12.45458984375, -11.6201171875, -10.78564453125, -9.951171875, -9.11669921875, -8.2822265625, -7.44775390625, -6.61328125, -5.77880859375, -4.9443359375, -4.10986328125, -3.275390625, -2.44091796875, -1.6064453125, -0.77197265625, 0.0625, 0.89697265625, 1.7314453125, 2.56591796875, 3.400390625, 4.23486328125, 5.0693359375, 5.90380859375, 6.73828125, 7.57275390625, 8.4072265625, 9.24169921875, 10.076171875, 10.91064453125, 11.7451171875, 12.57958984375, 13.4140625, 14.24853515625, 15.0830078125, 15.91748046875, 16.751953125, 17.58642578125, 18.4208984375, 19.25537109375, 20.08984375, 20.92431640625, 21.7587890625, 22.59326171875, 23.427734375, 24.26220703125, 25.0966796875, 25.93115234375, 26.765625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 8.0, 20.0, 11.0, 15.0, 14.0, 18.0, 18.0, 19.0, 27.0, 33.0, 34.0, 36.0, 32.0, 33.0, 43.0, 48.0, 50.0, 48.0, 43.0, 40.0, 45.0, 44.0, 31.0, 33.0, 36.0, 28.0, 32.0, 37.0, 21.0, 17.0, 15.0, 16.0, 9.0, 10.0, 6.0, 8.0, 2.0, 5.0, 6.0, 2.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.96875, -29.96142578125, -28.9541015625, -27.94677734375, -26.939453125, -25.93212890625, -24.9248046875, -23.91748046875, -22.91015625, -21.90283203125, -20.8955078125, -19.88818359375, -18.880859375, -17.87353515625, -16.8662109375, -15.85888671875, -14.8515625, -13.84423828125, -12.8369140625, -11.82958984375, -10.822265625, -9.81494140625, -8.8076171875, -7.80029296875, -6.79296875, -5.78564453125, -4.7783203125, -3.77099609375, -2.763671875, -1.75634765625, -0.7490234375, 0.25830078125, 1.265625, 2.27294921875, 3.2802734375, 4.28759765625, 5.294921875, 6.30224609375, 7.3095703125, 8.31689453125, 9.32421875, 10.33154296875, 11.3388671875, 12.34619140625, 13.353515625, 14.36083984375, 15.3681640625, 16.37548828125, 17.3828125, 18.39013671875, 19.3974609375, 20.40478515625, 21.412109375, 22.41943359375, 23.4267578125, 24.43408203125, 25.44140625, 26.44873046875, 27.4560546875, 28.46337890625, 29.470703125, 30.47802734375, 31.4853515625, 32.49267578125, 33.5]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 19.0, 30.0, 48.0, 85.0, 111.0, 173.0, 296.0, 480.0, 765.0, 1237.0, 2126.0, 3208.0, 5316.0, 8195.0, 12912.0, 20312.0, 31180.0, 46370.0, 67790.0, 99668.0, 137080.0, 186088.0, 241251.0, 298699.0, 350631.0, 387364.0, 400303.0, 386639.0, 350338.0, 297091.0, 240891.0, 184443.0, 137140.0, 97023.0, 67740.0, 46251.0, 30562.0, 19992.0, 12605.0, 8241.0, 5102.0, 3291.0, 1992.0, 1249.0, 744.0, 435.0, 299.0, 166.0, 131.0, 72.0, 41.0, 26.0, 17.0, 10.0, 6.0, 2.0, 3.0, 3.0], "bins": [-22.390625, -21.701416015625, -21.01220703125, -20.322998046875, -19.6337890625, -18.944580078125, -18.25537109375, -17.566162109375, -16.876953125, -16.187744140625, -15.49853515625, -14.809326171875, -14.1201171875, -13.430908203125, -12.74169921875, -12.052490234375, -11.36328125, -10.674072265625, -9.98486328125, -9.295654296875, -8.6064453125, -7.917236328125, -7.22802734375, -6.538818359375, -5.849609375, -5.160400390625, -4.47119140625, -3.781982421875, -3.0927734375, -2.403564453125, -1.71435546875, -1.025146484375, -0.3359375, 0.353271484375, 1.04248046875, 1.731689453125, 2.4208984375, 3.110107421875, 3.79931640625, 4.488525390625, 5.177734375, 5.866943359375, 6.55615234375, 7.245361328125, 7.9345703125, 8.623779296875, 9.31298828125, 10.002197265625, 10.69140625, 11.380615234375, 12.06982421875, 12.759033203125, 13.4482421875, 14.137451171875, 14.82666015625, 15.515869140625, 16.205078125, 16.894287109375, 17.58349609375, 18.272705078125, 18.9619140625, 19.651123046875, 20.34033203125, 21.029541015625, 21.71875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 15.0, 9.0, 19.0, 7.0, 32.0, 26.0, 38.0, 43.0, 61.0, 72.0, 98.0, 119.0, 124.0, 154.0, 217.0, 212.0, 227.0, 229.0, 229.0, 239.0, 251.0, 231.0, 216.0, 221.0, 184.0, 153.0, 119.0, 117.0, 85.0, 73.0, 67.0, 46.0, 45.0, 24.0, 18.0, 17.0, 10.0, 9.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0703125, -12.5892333984375, -12.108154296875, -11.6270751953125, -11.14599609375, -10.6649169921875, -10.183837890625, -9.7027587890625, -9.2216796875, -8.7406005859375, -8.259521484375, -7.7784423828125, -7.29736328125, -6.8162841796875, -6.335205078125, -5.8541259765625, -5.373046875, -4.8919677734375, -4.410888671875, -3.9298095703125, -3.44873046875, -2.9676513671875, -2.486572265625, -2.0054931640625, -1.5244140625, -1.0433349609375, -0.562255859375, -0.0811767578125, 0.39990234375, 0.8809814453125, 1.362060546875, 1.8431396484375, 2.32421875, 2.8052978515625, 3.286376953125, 3.7674560546875, 4.24853515625, 4.7296142578125, 5.210693359375, 5.6917724609375, 6.1728515625, 6.6539306640625, 7.135009765625, 7.6160888671875, 8.09716796875, 8.5782470703125, 9.059326171875, 9.5404052734375, 10.021484375, 10.5025634765625, 10.983642578125, 11.4647216796875, 11.94580078125, 12.4268798828125, 12.907958984375, 13.3890380859375, 13.8701171875, 14.3511962890625, 14.832275390625, 15.3133544921875, 15.79443359375, 16.2755126953125, 16.756591796875, 17.2376708984375, 17.71875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 8.0, 1.0, 4.0, 6.0, 8.0, 5.0, 11.0, 12.0, 17.0, 15.0, 20.0, 26.0, 21.0, 37.0, 32.0, 37.0, 32.0, 54.0, 27.0, 34.0, 44.0, 40.0, 36.0, 37.0, 36.0, 45.0, 29.0, 51.0, 31.0, 36.0, 36.0, 26.0, 22.0, 24.0, 12.0, 12.0, 10.0, 10.0, 8.0, 11.0, 11.0, 5.0, 4.0, 7.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0], "bins": [-31.60767364501953, -30.733016967773438, -29.858360290527344, -28.98370361328125, -28.109045028686523, -27.23438835144043, -26.359731674194336, -25.485074996948242, -24.610416412353516, -23.735759735107422, -22.861103057861328, -21.986446380615234, -21.111787796020508, -20.237131118774414, -19.36247444152832, -18.487817764282227, -17.613161087036133, -16.73850440979004, -15.863846778869629, -14.989190101623535, -14.114532470703125, -13.239875793457031, -12.365219116210938, -11.490562438964844, -10.615904808044434, -9.74124813079834, -8.86659049987793, -7.991933822631836, -7.117276668548584, -6.242619514465332, -5.367962837219238, -4.493305683135986, -3.6186485290527344, -2.7439913749694824, -1.8693344593048096, -0.9946775436401367, -0.12002038955688477, 0.7546367645263672, 1.629293441772461, 2.503950595855713, 3.378607749938965, 4.253264904022217, 5.127922058105469, 6.0025787353515625, 6.8772358894348145, 7.751893043518066, 8.62654972076416, 9.50120735168457, 10.375864028930664, 11.250520706176758, 12.125178337097168, 12.999835014343262, 13.874492645263672, 14.749149322509766, 15.62380599975586, 16.498462677001953, 17.373119354248047, 18.24777603149414, 19.122432708740234, 19.997089385986328, 20.871747970581055, 21.74640464782715, 22.621061325073242, 23.495718002319336, 24.370376586914062]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 3.0, 4.0, 9.0, 8.0, 5.0, 7.0, 15.0, 12.0, 19.0, 25.0, 30.0, 23.0, 20.0, 36.0, 43.0, 36.0, 48.0, 29.0, 33.0, 42.0, 35.0, 46.0, 40.0, 40.0, 50.0, 41.0, 40.0, 30.0, 31.0, 27.0, 19.0, 23.0, 30.0, 11.0, 20.0, 7.0, 13.0, 11.0, 8.0, 1.0, 10.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.73747634887695, -31.653339385986328, -30.569204330444336, -29.48506736755371, -28.40093231201172, -27.316795349121094, -26.23265838623047, -25.148521423339844, -24.06438636779785, -22.980249404907227, -21.896114349365234, -20.81197738647461, -19.727840423583984, -18.643705368041992, -17.559568405151367, -16.475433349609375, -15.39129638671875, -14.307160377502441, -13.223024368286133, -12.138887405395508, -11.0547513961792, -9.97061538696289, -8.886478424072266, -7.802342414855957, -6.718206405639648, -5.63407039642334, -4.549933910369873, -3.4657976627349854, -2.3816614151000977, -1.297525405883789, -0.21338891983032227, 0.8707475662231445, 1.9548873901367188, 3.0390236377716064, 4.123159885406494, 5.207296371459961, 6.2914323806762695, 7.375568389892578, 8.459705352783203, 9.543841361999512, 10.62797737121582, 11.712113380432129, 12.796249389648438, 13.880386352539062, 14.964522361755371, 16.04865837097168, 17.132795333862305, 18.216930389404297, 19.301067352294922, 20.385204315185547, 21.46933937072754, 22.553476333618164, 23.637611389160156, 24.72174835205078, 25.805885314941406, 26.89002227783203, 27.974157333374023, 29.05829429626465, 30.14242935180664, 31.226566314697266, 32.31070327758789, 33.39483642578125, 34.478973388671875, 35.5631103515625, 36.647247314453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 6.0, 6.0, 13.0, 22.0, 30.0, 44.0, 41.0, 93.0, 115.0, 206.0, 301.0, 493.0, 817.0, 1377.0, 2310.0, 4009.0, 6763.0, 12256.0, 22502.0, 40070.0, 70428.0, 114805.0, 166864.0, 190421.0, 159066.0, 106773.0, 64861.0, 36580.0, 20516.0, 11512.0, 6324.0, 3565.0, 2123.0, 1210.0, 775.0, 470.0, 283.0, 191.0, 108.0, 62.0, 50.0, 29.0, 25.0, 22.0, 3.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.3125, -11.920654296875, -11.52880859375, -11.136962890625, -10.7451171875, -10.353271484375, -9.96142578125, -9.569580078125, -9.177734375, -8.785888671875, -8.39404296875, -8.002197265625, -7.6103515625, -7.218505859375, -6.82666015625, -6.434814453125, -6.04296875, -5.651123046875, -5.25927734375, -4.867431640625, -4.4755859375, -4.083740234375, -3.69189453125, -3.300048828125, -2.908203125, -2.516357421875, -2.12451171875, -1.732666015625, -1.3408203125, -0.948974609375, -0.55712890625, -0.165283203125, 0.2265625, 0.618408203125, 1.01025390625, 1.402099609375, 1.7939453125, 2.185791015625, 2.57763671875, 2.969482421875, 3.361328125, 3.753173828125, 4.14501953125, 4.536865234375, 4.9287109375, 5.320556640625, 5.71240234375, 6.104248046875, 6.49609375, 6.887939453125, 7.27978515625, 7.671630859375, 8.0634765625, 8.455322265625, 8.84716796875, 9.239013671875, 9.630859375, 10.022705078125, 10.41455078125, 10.806396484375, 11.1982421875, 11.590087890625, 11.98193359375, 12.373779296875, 12.765625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 12.0, 4.0, 10.0, 4.0, 11.0, 14.0, 20.0, 18.0, 29.0, 21.0, 19.0, 35.0, 30.0, 35.0, 32.0, 47.0, 39.0, 47.0, 44.0, 40.0, 50.0, 51.0, 49.0, 44.0, 29.0, 33.0, 36.0, 28.0, 21.0, 25.0, 19.0, 22.0, 13.0, 14.0, 11.0, 9.0, 9.0, 4.0, 9.0, 4.0, 6.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.0625, -31.90185546875, -30.7412109375, -29.58056640625, -28.419921875, -27.25927734375, -26.0986328125, -24.93798828125, -23.77734375, -22.61669921875, -21.4560546875, -20.29541015625, -19.134765625, -17.97412109375, -16.8134765625, -15.65283203125, -14.4921875, -13.33154296875, -12.1708984375, -11.01025390625, -9.849609375, -8.68896484375, -7.5283203125, -6.36767578125, -5.20703125, -4.04638671875, -2.8857421875, -1.72509765625, -0.564453125, 0.59619140625, 1.7568359375, 2.91748046875, 4.078125, 5.23876953125, 6.3994140625, 7.56005859375, 8.720703125, 9.88134765625, 11.0419921875, 12.20263671875, 13.36328125, 14.52392578125, 15.6845703125, 16.84521484375, 18.005859375, 19.16650390625, 20.3271484375, 21.48779296875, 22.6484375, 23.80908203125, 24.9697265625, 26.13037109375, 27.291015625, 28.45166015625, 29.6123046875, 30.77294921875, 31.93359375, 33.09423828125, 34.2548828125, 35.41552734375, 36.576171875, 37.73681640625, 38.8974609375, 40.05810546875, 41.21875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 8.0, 8.0, 15.0, 18.0, 23.0, 42.0, 68.0, 118.0, 174.0, 290.0, 474.0, 710.0, 1274.0, 2254.0, 4166.0, 7545.0, 14091.0, 27569.0, 52371.0, 97072.0, 160767.0, 207476.0, 190280.0, 128108.0, 72031.0, 38642.0, 19676.0, 10379.0, 5675.0, 2969.0, 1774.0, 968.0, 570.0, 374.0, 199.0, 139.0, 84.0, 52.0, 46.0, 24.0, 22.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.0535888671875, -7.763427734375, -7.4732666015625, -7.18310546875, -6.8929443359375, -6.602783203125, -6.3126220703125, -6.0224609375, -5.7322998046875, -5.442138671875, -5.1519775390625, -4.86181640625, -4.5716552734375, -4.281494140625, -3.9913330078125, -3.701171875, -3.4110107421875, -3.120849609375, -2.8306884765625, -2.54052734375, -2.2503662109375, -1.960205078125, -1.6700439453125, -1.3798828125, -1.0897216796875, -0.799560546875, -0.5093994140625, -0.21923828125, 0.0709228515625, 0.361083984375, 0.6512451171875, 0.94140625, 1.2315673828125, 1.521728515625, 1.8118896484375, 2.10205078125, 2.3922119140625, 2.682373046875, 2.9725341796875, 3.2626953125, 3.5528564453125, 3.843017578125, 4.1331787109375, 4.42333984375, 4.7135009765625, 5.003662109375, 5.2938232421875, 5.583984375, 5.8741455078125, 6.164306640625, 6.4544677734375, 6.74462890625, 7.0347900390625, 7.324951171875, 7.6151123046875, 7.9052734375, 8.1954345703125, 8.485595703125, 8.7757568359375, 9.06591796875, 9.3560791015625, 9.646240234375, 9.9364013671875, 10.2265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 7.0, 15.0, 18.0, 16.0, 13.0, 18.0, 28.0, 27.0, 27.0, 32.0, 30.0, 42.0, 36.0, 32.0, 38.0, 41.0, 50.0, 43.0, 40.0, 41.0, 42.0, 44.0, 27.0, 36.0, 23.0, 29.0, 21.0, 28.0, 15.0, 18.0, 23.0, 20.0, 12.0, 15.0, 12.0, 3.0, 10.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.453125, -20.741943359375, -20.03076171875, -19.319580078125, -18.6083984375, -17.897216796875, -17.18603515625, -16.474853515625, -15.763671875, -15.052490234375, -14.34130859375, -13.630126953125, -12.9189453125, -12.207763671875, -11.49658203125, -10.785400390625, -10.07421875, -9.363037109375, -8.65185546875, -7.940673828125, -7.2294921875, -6.518310546875, -5.80712890625, -5.095947265625, -4.384765625, -3.673583984375, -2.96240234375, -2.251220703125, -1.5400390625, -0.828857421875, -0.11767578125, 0.593505859375, 1.3046875, 2.015869140625, 2.72705078125, 3.438232421875, 4.1494140625, 4.860595703125, 5.57177734375, 6.282958984375, 6.994140625, 7.705322265625, 8.41650390625, 9.127685546875, 9.8388671875, 10.550048828125, 11.26123046875, 11.972412109375, 12.68359375, 13.394775390625, 14.10595703125, 14.817138671875, 15.5283203125, 16.239501953125, 16.95068359375, 17.661865234375, 18.373046875, 19.084228515625, 19.79541015625, 20.506591796875, 21.2177734375, 21.928955078125, 22.64013671875, 23.351318359375, 24.0625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0, 6.0, 9.0, 15.0, 17.0, 44.0, 57.0, 66.0, 100.0, 140.0, 186.0, 284.0, 418.0, 551.0, 862.0, 1234.0, 1883.0, 2988.0, 5102.0, 8777.0, 16503.0, 34912.0, 82220.0, 202588.0, 332736.0, 201034.0, 82058.0, 34636.0, 16544.0, 8658.0, 5033.0, 3054.0, 1875.0, 1221.0, 845.0, 567.0, 428.0, 260.0, 203.0, 144.0, 89.0, 64.0, 47.0, 26.0, 22.0, 8.0, 17.0, 11.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.529296875, -3.41357421875, -3.2978515625, -3.18212890625, -3.06640625, -2.95068359375, -2.8349609375, -2.71923828125, -2.603515625, -2.48779296875, -2.3720703125, -2.25634765625, -2.140625, -2.02490234375, -1.9091796875, -1.79345703125, -1.677734375, -1.56201171875, -1.4462890625, -1.33056640625, -1.21484375, -1.09912109375, -0.9833984375, -0.86767578125, -0.751953125, -0.63623046875, -0.5205078125, -0.40478515625, -0.2890625, -0.17333984375, -0.0576171875, 0.05810546875, 0.173828125, 0.28955078125, 0.4052734375, 0.52099609375, 0.63671875, 0.75244140625, 0.8681640625, 0.98388671875, 1.099609375, 1.21533203125, 1.3310546875, 1.44677734375, 1.5625, 1.67822265625, 1.7939453125, 1.90966796875, 2.025390625, 2.14111328125, 2.2568359375, 2.37255859375, 2.48828125, 2.60400390625, 2.7197265625, 2.83544921875, 2.951171875, 3.06689453125, 3.1826171875, 3.29833984375, 3.4140625, 3.52978515625, 3.6455078125, 3.76123046875, 3.876953125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 19.0, 14.0, 22.0, 33.0, 72.0, 118.0, 160.0, 156.0, 153.0, 85.0, 58.0, 37.0, 25.0, 14.0, 10.0, 11.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0018568038940429688, -0.00181589275598526, -0.0017749816179275513, -0.0017340704798698425, -0.0016931593418121338, -0.001652248203754425, -0.0016113370656967163, -0.0015704259276390076, -0.0015295147895812988, -0.00148860365152359, -0.0014476925134658813, -0.0014067813754081726, -0.0013658702373504639, -0.0013249590992927551, -0.0012840479612350464, -0.0012431368231773376, -0.001202225685119629, -0.0011613145470619202, -0.0011204034090042114, -0.0010794922709465027, -0.001038581132888794, -0.0009976699948310852, -0.0009567588567733765, -0.0009158477187156677, -0.000874936580657959, -0.0008340254426002502, -0.0007931143045425415, -0.0007522031664848328, -0.000711292028427124, -0.0006703808903694153, -0.0006294697523117065, -0.0005885586142539978, -0.0005476474761962891, -0.0005067363381385803, -0.0004658252000808716, -0.00042491406202316284, -0.0003840029239654541, -0.00034309178590774536, -0.0003021806478500366, -0.0002612695097923279, -0.00022035837173461914, -0.0001794472336769104, -0.00013853609561920166, -9.762495756149292e-05, -5.671381950378418e-05, -1.580268144607544e-05, 2.51084566116333e-05, 6.601959466934204e-05, 0.00010693073272705078, 0.00014784187078475952, 0.00018875300884246826, 0.000229664146900177, 0.00027057528495788574, 0.0003114864230155945, 0.0003523975610733032, 0.00039330869913101196, 0.0004342198371887207, 0.00047513097524642944, 0.0005160421133041382, 0.0005569532513618469, 0.0005978643894195557, 0.0006387755274772644, 0.0006796866655349731, 0.0007205978035926819, 0.0007615089416503906]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 4.0, 3.0, 4.0, 9.0, 24.0, 17.0, 32.0, 50.0, 67.0, 117.0, 156.0, 220.0, 311.0, 423.0, 693.0, 979.0, 1468.0, 2204.0, 3245.0, 4904.0, 7494.0, 11883.0, 19335.0, 32328.0, 54773.0, 93136.0, 149717.0, 197481.0, 175314.0, 116296.0, 69198.0, 40825.0, 24053.0, 14679.0, 9374.0, 5884.0, 3879.0, 2572.0, 1711.0, 1165.0, 801.0, 525.0, 352.0, 249.0, 198.0, 134.0, 102.0, 49.0, 35.0, 36.0, 23.0, 13.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.40625, -4.2628173828125, -4.119384765625, -3.9759521484375, -3.83251953125, -3.6890869140625, -3.545654296875, -3.4022216796875, -3.2587890625, -3.1153564453125, -2.971923828125, -2.8284912109375, -2.68505859375, -2.5416259765625, -2.398193359375, -2.2547607421875, -2.111328125, -1.9678955078125, -1.824462890625, -1.6810302734375, -1.53759765625, -1.3941650390625, -1.250732421875, -1.1072998046875, -0.9638671875, -0.8204345703125, -0.677001953125, -0.5335693359375, -0.39013671875, -0.2467041015625, -0.103271484375, 0.0401611328125, 0.18359375, 0.3270263671875, 0.470458984375, 0.6138916015625, 0.75732421875, 0.9007568359375, 1.044189453125, 1.1876220703125, 1.3310546875, 1.4744873046875, 1.617919921875, 1.7613525390625, 1.90478515625, 2.0482177734375, 2.191650390625, 2.3350830078125, 2.478515625, 2.6219482421875, 2.765380859375, 2.9088134765625, 3.05224609375, 3.1956787109375, 3.339111328125, 3.4825439453125, 3.6259765625, 3.7694091796875, 3.912841796875, 4.0562744140625, 4.19970703125, 4.3431396484375, 4.486572265625, 4.6300048828125, 4.7734375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 7.0, 4.0, 3.0, 7.0, 7.0, 5.0, 10.0, 16.0, 18.0, 13.0, 24.0, 17.0, 27.0, 31.0, 46.0, 51.0, 43.0, 76.0, 54.0, 72.0, 68.0, 62.0, 55.0, 48.0, 48.0, 25.0, 23.0, 28.0, 14.0, 11.0, 14.0, 11.0, 8.0, 8.0, 5.0, 6.0, 6.0, 6.0, 1.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.369140625, -1.3266143798828125, -1.284088134765625, -1.2415618896484375, -1.19903564453125, -1.1565093994140625, -1.113983154296875, -1.0714569091796875, -1.0289306640625, -0.9864044189453125, -0.943878173828125, -0.9013519287109375, -0.85882568359375, -0.8162994384765625, -0.773773193359375, -0.7312469482421875, -0.688720703125, -0.6461944580078125, -0.603668212890625, -0.5611419677734375, -0.51861572265625, -0.4760894775390625, -0.433563232421875, -0.3910369873046875, -0.3485107421875, -0.3059844970703125, -0.263458251953125, -0.2209320068359375, -0.17840576171875, -0.1358795166015625, -0.093353271484375, -0.0508270263671875, -0.00830078125, 0.0342254638671875, 0.076751708984375, 0.1192779541015625, 0.16180419921875, 0.2043304443359375, 0.246856689453125, 0.2893829345703125, 0.3319091796875, 0.3744354248046875, 0.416961669921875, 0.4594879150390625, 0.50201416015625, 0.5445404052734375, 0.587066650390625, 0.6295928955078125, 0.672119140625, 0.7146453857421875, 0.757171630859375, 0.7996978759765625, 0.84222412109375, 0.8847503662109375, 0.927276611328125, 0.9698028564453125, 1.0123291015625, 1.0548553466796875, 1.097381591796875, 1.1399078369140625, 1.18243408203125, 1.2249603271484375, 1.267486572265625, 1.3100128173828125, 1.3525390625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 2.0, 2.0, 7.0, 7.0, 4.0, 4.0, 7.0, 8.0, 18.0, 9.0, 17.0, 21.0, 32.0, 30.0, 33.0, 29.0, 41.0, 30.0, 43.0, 42.0, 24.0, 46.0, 34.0, 40.0, 47.0, 40.0, 48.0, 30.0, 48.0, 31.0, 35.0, 27.0, 27.0, 22.0, 15.0, 17.0, 8.0, 12.0, 16.0, 13.0, 8.0, 4.0, 7.0, 6.0, 6.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-31.824756622314453, -30.9390869140625, -30.053415298461914, -29.16774559020996, -28.282075881958008, -27.396404266357422, -26.51073455810547, -25.625064849853516, -24.73939323425293, -23.853723526000977, -22.96805191040039, -22.082382202148438, -21.196712493896484, -20.3110408782959, -19.425371170043945, -18.53969955444336, -17.654029846191406, -16.768360137939453, -15.882689476013184, -14.997018814086914, -14.111348152160645, -13.225677490234375, -12.340007781982422, -11.454337120056152, -10.568668365478516, -9.682997703552246, -8.797327995300293, -7.911657333374023, -7.025986671447754, -6.140316486358643, -5.254646301269531, -4.368975639343262, -3.483304977416992, -2.5976345539093018, -1.7119642496109009, -0.8262939453125, 0.05937647819519043, 0.9450469017028809, 1.8307170867919922, 2.7163877487182617, 3.602057933807373, 4.487728118896484, 5.373398780822754, 6.259068965911865, 7.144739151000977, 8.030409812927246, 8.916080474853516, 9.801750183105469, 10.687420845031738, 11.573091506958008, 12.458761215209961, 13.34443187713623, 14.2301025390625, 15.115772247314453, 16.001441955566406, 16.887113571166992, 17.772783279418945, 18.6584529876709, 19.544124603271484, 20.429794311523438, 21.31546401977539, 22.201135635375977, 23.08680534362793, 23.972476959228516, 24.85814666748047]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 1.0, 5.0, 4.0, 9.0, 7.0, 6.0, 5.0, 11.0, 17.0, 22.0, 19.0, 34.0, 17.0, 25.0, 31.0, 37.0, 44.0, 47.0, 33.0, 34.0, 37.0, 44.0, 33.0, 49.0, 35.0, 55.0, 35.0, 46.0, 29.0, 26.0, 30.0, 21.0, 31.0, 25.0, 13.0, 16.0, 7.0, 12.0, 11.0, 10.0, 3.0, 8.0, 5.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.50355529785156, -31.424339294433594, -30.345121383666992, -29.265905380249023, -28.186687469482422, -27.107471466064453, -26.028255462646484, -24.949037551879883, -23.86981964111328, -22.790603637695312, -21.71138572692871, -20.632169723510742, -19.55295181274414, -18.473735809326172, -17.394519805908203, -16.3153018951416, -15.236085891723633, -14.156868934631348, -13.077651977539062, -11.998435974121094, -10.919218063354492, -9.840002059936523, -8.760785102844238, -7.681568145751953, -6.602351188659668, -5.523134231567383, -4.443917274475098, -3.3647007942199707, -2.2854838371276855, -1.2062668800354004, -0.12705039978027344, 0.9521665573120117, 2.031383514404297, 3.110600471496582, 4.189817428588867, 5.269033908843994, 6.348250865936279, 7.4274678230285645, 8.506684303283691, 9.585901260375977, 10.665118217468262, 11.744335174560547, 12.823552131652832, 13.902769088745117, 14.981985092163086, 16.061203002929688, 17.140419006347656, 18.219635009765625, 19.298852920532227, 20.378068923950195, 21.457286834716797, 22.536502838134766, 23.615720748901367, 24.694936752319336, 25.774154663085938, 26.853370666503906, 27.932586669921875, 29.011802673339844, 30.091020584106445, 31.170236587524414, 32.249454498291016, 33.328670501708984, 34.40788650512695, 35.48710632324219, 36.566322326660156]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 7.0, 10.0, 10.0, 17.0, 33.0, 46.0, 57.0, 139.0, 212.0, 251.0, 403.0, 600.0, 932.0, 1410.0, 2157.0, 3335.0, 4874.0, 7318.0, 10556.0, 15587.0, 21969.0, 30119.0, 40230.0, 52326.0, 65091.0, 77601.0, 87027.0, 93436.0, 93597.0, 88491.0, 79700.0, 67422.0, 54437.0, 43155.0, 31506.0, 23136.0, 16459.0, 11373.0, 7797.0, 5389.0, 3450.0, 2431.0, 1521.0, 993.0, 646.0, 450.0, 323.0, 174.0, 141.0, 81.0, 42.0, 37.0, 20.0, 16.0, 10.0, 4.0, 0.0, 8.0, 4.0], "bins": [-22.53125, -21.850341796875, -21.16943359375, -20.488525390625, -19.8076171875, -19.126708984375, -18.44580078125, -17.764892578125, -17.083984375, -16.403076171875, -15.72216796875, -15.041259765625, -14.3603515625, -13.679443359375, -12.99853515625, -12.317626953125, -11.63671875, -10.955810546875, -10.27490234375, -9.593994140625, -8.9130859375, -8.232177734375, -7.55126953125, -6.870361328125, -6.189453125, -5.508544921875, -4.82763671875, -4.146728515625, -3.4658203125, -2.784912109375, -2.10400390625, -1.423095703125, -0.7421875, -0.061279296875, 0.61962890625, 1.300537109375, 1.9814453125, 2.662353515625, 3.34326171875, 4.024169921875, 4.705078125, 5.385986328125, 6.06689453125, 6.747802734375, 7.4287109375, 8.109619140625, 8.79052734375, 9.471435546875, 10.15234375, 10.833251953125, 11.51416015625, 12.195068359375, 12.8759765625, 13.556884765625, 14.23779296875, 14.918701171875, 15.599609375, 16.280517578125, 16.96142578125, 17.642333984375, 18.3232421875, 19.004150390625, 19.68505859375, 20.365966796875, 21.046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 3.0, 3.0, 5.0, 7.0, 8.0, 11.0, 9.0, 17.0, 11.0, 18.0, 21.0, 17.0, 24.0, 31.0, 33.0, 31.0, 39.0, 36.0, 33.0, 38.0, 35.0, 41.0, 43.0, 40.0, 41.0, 33.0, 31.0, 38.0, 37.0, 29.0, 29.0, 30.0, 19.0, 30.0, 22.0, 12.0, 20.0, 10.0, 10.0, 6.0, 6.0, 2.0, 10.0, 8.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-29.78125, -28.80126953125, -27.8212890625, -26.84130859375, -25.861328125, -24.88134765625, -23.9013671875, -22.92138671875, -21.94140625, -20.96142578125, -19.9814453125, -19.00146484375, -18.021484375, -17.04150390625, -16.0615234375, -15.08154296875, -14.1015625, -13.12158203125, -12.1416015625, -11.16162109375, -10.181640625, -9.20166015625, -8.2216796875, -7.24169921875, -6.26171875, -5.28173828125, -4.3017578125, -3.32177734375, -2.341796875, -1.36181640625, -0.3818359375, 0.59814453125, 1.578125, 2.55810546875, 3.5380859375, 4.51806640625, 5.498046875, 6.47802734375, 7.4580078125, 8.43798828125, 9.41796875, 10.39794921875, 11.3779296875, 12.35791015625, 13.337890625, 14.31787109375, 15.2978515625, 16.27783203125, 17.2578125, 18.23779296875, 19.2177734375, 20.19775390625, 21.177734375, 22.15771484375, 23.1376953125, 24.11767578125, 25.09765625, 26.07763671875, 27.0576171875, 28.03759765625, 29.017578125, 29.99755859375, 30.9775390625, 31.95751953125, 32.9375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 5.0, 14.0, 21.0, 26.0, 25.0, 88.0, 130.0, 184.0, 289.0, 432.0, 708.0, 1128.0, 1835.0, 2725.0, 4332.0, 6603.0, 9826.0, 15006.0, 21760.0, 30546.0, 42490.0, 56592.0, 71149.0, 85340.0, 95525.0, 101181.0, 99270.0, 91537.0, 79408.0, 64011.0, 49646.0, 36597.0, 26208.0, 18160.0, 12443.0, 8090.0, 5524.0, 3462.0, 2297.0, 1398.0, 942.0, 580.0, 383.0, 233.0, 168.0, 90.0, 54.0, 49.0, 16.0, 19.0, 5.0, 9.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.109375, -22.3330078125, -21.556640625, -20.7802734375, -20.00390625, -19.2275390625, -18.451171875, -17.6748046875, -16.8984375, -16.1220703125, -15.345703125, -14.5693359375, -13.79296875, -13.0166015625, -12.240234375, -11.4638671875, -10.6875, -9.9111328125, -9.134765625, -8.3583984375, -7.58203125, -6.8056640625, -6.029296875, -5.2529296875, -4.4765625, -3.7001953125, -2.923828125, -2.1474609375, -1.37109375, -0.5947265625, 0.181640625, 0.9580078125, 1.734375, 2.5107421875, 3.287109375, 4.0634765625, 4.83984375, 5.6162109375, 6.392578125, 7.1689453125, 7.9453125, 8.7216796875, 9.498046875, 10.2744140625, 11.05078125, 11.8271484375, 12.603515625, 13.3798828125, 14.15625, 14.9326171875, 15.708984375, 16.4853515625, 17.26171875, 18.0380859375, 18.814453125, 19.5908203125, 20.3671875, 21.1435546875, 21.919921875, 22.6962890625, 23.47265625, 24.2490234375, 25.025390625, 25.8017578125, 26.578125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 5.0, 2.0, 2.0, 1.0, 4.0, 4.0, 11.0, 2.0, 10.0, 16.0, 9.0, 11.0, 15.0, 22.0, 28.0, 22.0, 31.0, 20.0, 29.0, 23.0, 35.0, 27.0, 42.0, 33.0, 38.0, 48.0, 25.0, 40.0, 46.0, 39.0, 33.0, 37.0, 35.0, 35.0, 31.0, 27.0, 25.0, 27.0, 19.0, 11.0, 26.0, 15.0, 11.0, 11.0, 6.0, 4.0, 4.0, 4.0, 7.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.28125, -18.6220703125, -17.962890625, -17.3037109375, -16.64453125, -15.9853515625, -15.326171875, -14.6669921875, -14.0078125, -13.3486328125, -12.689453125, -12.0302734375, -11.37109375, -10.7119140625, -10.052734375, -9.3935546875, -8.734375, -8.0751953125, -7.416015625, -6.7568359375, -6.09765625, -5.4384765625, -4.779296875, -4.1201171875, -3.4609375, -2.8017578125, -2.142578125, -1.4833984375, -0.82421875, -0.1650390625, 0.494140625, 1.1533203125, 1.8125, 2.4716796875, 3.130859375, 3.7900390625, 4.44921875, 5.1083984375, 5.767578125, 6.4267578125, 7.0859375, 7.7451171875, 8.404296875, 9.0634765625, 9.72265625, 10.3818359375, 11.041015625, 11.7001953125, 12.359375, 13.0185546875, 13.677734375, 14.3369140625, 14.99609375, 15.6552734375, 16.314453125, 16.9736328125, 17.6328125, 18.2919921875, 18.951171875, 19.6103515625, 20.26953125, 20.9287109375, 21.587890625, 22.2470703125, 22.90625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 2.0, 7.0, 15.0, 20.0, 38.0, 34.0, 63.0, 76.0, 121.0, 204.0, 341.0, 500.0, 827.0, 1379.0, 2357.0, 4477.0, 9272.0, 21494.0, 52216.0, 123762.0, 231871.0, 268864.0, 182349.0, 84570.0, 34505.0, 14589.0, 6460.0, 3396.0, 1859.0, 1063.0, 657.0, 407.0, 281.0, 150.0, 132.0, 73.0, 45.0, 26.0, 20.0, 13.0, 11.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.765625, -24.0634765625, -23.361328125, -22.6591796875, -21.95703125, -21.2548828125, -20.552734375, -19.8505859375, -19.1484375, -18.4462890625, -17.744140625, -17.0419921875, -16.33984375, -15.6376953125, -14.935546875, -14.2333984375, -13.53125, -12.8291015625, -12.126953125, -11.4248046875, -10.72265625, -10.0205078125, -9.318359375, -8.6162109375, -7.9140625, -7.2119140625, -6.509765625, -5.8076171875, -5.10546875, -4.4033203125, -3.701171875, -2.9990234375, -2.296875, -1.5947265625, -0.892578125, -0.1904296875, 0.51171875, 1.2138671875, 1.916015625, 2.6181640625, 3.3203125, 4.0224609375, 4.724609375, 5.4267578125, 6.12890625, 6.8310546875, 7.533203125, 8.2353515625, 8.9375, 9.6396484375, 10.341796875, 11.0439453125, 11.74609375, 12.4482421875, 13.150390625, 13.8525390625, 14.5546875, 15.2568359375, 15.958984375, 16.6611328125, 17.36328125, 18.0654296875, 18.767578125, 19.4697265625, 20.171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 8.0, 13.0, 13.0, 10.0, 27.0, 28.0, 39.0, 44.0, 47.0, 67.0, 64.0, 81.0, 59.0, 80.0, 64.0, 70.0, 58.0, 43.0, 34.0, 25.0, 28.0, 23.0, 14.0, 17.0, 11.0, 7.0, 3.0, 1.0, 1.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018367767333984375, -0.0017850697040557861, -0.0017333626747131348, -0.0016816556453704834, -0.001629948616027832, -0.0015782415866851807, -0.0015265345573425293, -0.001474827527999878, -0.0014231204986572266, -0.0013714134693145752, -0.0013197064399719238, -0.0012679994106292725, -0.001216292381286621, -0.0011645853519439697, -0.0011128783226013184, -0.001061171293258667, -0.0010094642639160156, -0.0009577572345733643, -0.0009060502052307129, -0.0008543431758880615, -0.0008026361465454102, -0.0007509291172027588, -0.0006992220878601074, -0.0006475150585174561, -0.0005958080291748047, -0.0005441009998321533, -0.000492393970489502, -0.0004406869411468506, -0.0003889799118041992, -0.00033727288246154785, -0.0002855658531188965, -0.00023385882377624512, -0.00018215179443359375, -0.00013044476509094238, -7.873773574829102e-05, -2.703070640563965e-05, 2.467632293701172e-05, 7.638335227966309e-05, 0.00012809038162231445, 0.00017979741096496582, 0.0002315044403076172, 0.00028321146965026855, 0.0003349184989929199, 0.0003866255283355713, 0.00043833255767822266, 0.000490039587020874, 0.0005417466163635254, 0.0005934536457061768, 0.0006451606750488281, 0.0006968677043914795, 0.0007485747337341309, 0.0008002817630767822, 0.0008519887924194336, 0.000903695821762085, 0.0009554028511047363, 0.0010071098804473877, 0.001058816909790039, 0.0011105239391326904, 0.0011622309684753418, 0.0012139379978179932, 0.0012656450271606445, 0.001317352056503296, 0.0013690590858459473, 0.0014207661151885986, 0.00147247314453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 7.0, 6.0, 14.0, 20.0, 26.0, 36.0, 62.0, 73.0, 139.0, 215.0, 322.0, 459.0, 680.0, 1050.0, 1549.0, 2364.0, 3803.0, 6120.0, 9759.0, 15717.0, 26101.0, 41600.0, 64423.0, 94072.0, 124207.0, 143367.0, 142286.0, 119838.0, 89428.0, 59488.0, 38281.0, 23715.0, 14480.0, 9069.0, 5557.0, 3573.0, 2274.0, 1494.0, 978.0, 631.0, 428.0, 278.0, 193.0, 132.0, 78.0, 59.0, 34.0, 21.0, 15.0, 19.0, 6.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.6328125, -11.268310546875, -10.90380859375, -10.539306640625, -10.1748046875, -9.810302734375, -9.44580078125, -9.081298828125, -8.716796875, -8.352294921875, -7.98779296875, -7.623291015625, -7.2587890625, -6.894287109375, -6.52978515625, -6.165283203125, -5.80078125, -5.436279296875, -5.07177734375, -4.707275390625, -4.3427734375, -3.978271484375, -3.61376953125, -3.249267578125, -2.884765625, -2.520263671875, -2.15576171875, -1.791259765625, -1.4267578125, -1.062255859375, -0.69775390625, -0.333251953125, 0.03125, 0.395751953125, 0.76025390625, 1.124755859375, 1.4892578125, 1.853759765625, 2.21826171875, 2.582763671875, 2.947265625, 3.311767578125, 3.67626953125, 4.040771484375, 4.4052734375, 4.769775390625, 5.13427734375, 5.498779296875, 5.86328125, 6.227783203125, 6.59228515625, 6.956787109375, 7.3212890625, 7.685791015625, 8.05029296875, 8.414794921875, 8.779296875, 9.143798828125, 9.50830078125, 9.872802734375, 10.2373046875, 10.601806640625, 10.96630859375, 11.330810546875, 11.6953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 5.0, 6.0, 6.0, 10.0, 12.0, 11.0, 12.0, 17.0, 18.0, 23.0, 25.0, 30.0, 31.0, 34.0, 43.0, 54.0, 47.0, 57.0, 52.0, 38.0, 46.0, 59.0, 50.0, 41.0, 44.0, 47.0, 35.0, 23.0, 23.0, 16.0, 16.0, 13.0, 9.0, 10.0, 7.0, 6.0, 2.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.5546875, -5.401123046875, -5.24755859375, -5.093994140625, -4.9404296875, -4.786865234375, -4.63330078125, -4.479736328125, -4.326171875, -4.172607421875, -4.01904296875, -3.865478515625, -3.7119140625, -3.558349609375, -3.40478515625, -3.251220703125, -3.09765625, -2.944091796875, -2.79052734375, -2.636962890625, -2.4833984375, -2.329833984375, -2.17626953125, -2.022705078125, -1.869140625, -1.715576171875, -1.56201171875, -1.408447265625, -1.2548828125, -1.101318359375, -0.94775390625, -0.794189453125, -0.640625, -0.487060546875, -0.33349609375, -0.179931640625, -0.0263671875, 0.127197265625, 0.28076171875, 0.434326171875, 0.587890625, 0.741455078125, 0.89501953125, 1.048583984375, 1.2021484375, 1.355712890625, 1.50927734375, 1.662841796875, 1.81640625, 1.969970703125, 2.12353515625, 2.277099609375, 2.4306640625, 2.584228515625, 2.73779296875, 2.891357421875, 3.044921875, 3.198486328125, 3.35205078125, 3.505615234375, 3.6591796875, 3.812744140625, 3.96630859375, 4.119873046875, 4.2734375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 10.0, 7.0, 10.0, 8.0, 14.0, 14.0, 24.0, 31.0, 35.0, 26.0, 41.0, 36.0, 35.0, 60.0, 46.0, 55.0, 49.0, 35.0, 58.0, 47.0, 60.0, 40.0, 36.0, 30.0, 40.0, 27.0, 17.0, 19.0, 13.0, 16.0, 10.0, 10.0, 7.0, 12.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-37.054561614990234, -36.048763275146484, -35.04296112060547, -34.03716278076172, -33.03136444091797, -32.02556610107422, -31.019763946533203, -30.013965606689453, -29.008167266845703, -28.00236701965332, -26.99656867980957, -25.990768432617188, -24.984970092773438, -23.979169845581055, -22.973369598388672, -21.967571258544922, -20.96177101135254, -19.955970764160156, -18.950172424316406, -17.944372177124023, -16.938573837280273, -15.93277359008789, -14.926974296569824, -13.921175003051758, -12.915375709533691, -11.909576416015625, -10.903777122497559, -9.897977828979492, -8.89217758178711, -7.886378765106201, -6.880578994750977, -5.87477970123291, -4.868980407714844, -3.8631811141967773, -2.857381582260132, -1.8515820503234863, -0.8457827568054199, 0.16001653671264648, 1.165816307067871, 2.1716156005859375, 3.177414894104004, 4.18321418762207, 5.189013481140137, 6.194813251495361, 7.200612545013428, 8.206411361694336, 9.212211608886719, 10.218010902404785, 11.223810195922852, 12.229609489440918, 13.235408782958984, 14.241209030151367, 15.247007369995117, 16.2528076171875, 17.25860595703125, 18.264406204223633, 19.270206451416016, 20.2760066986084, 21.28180503845215, 22.28760528564453, 23.29340362548828, 24.299203872680664, 25.305004119873047, 26.310802459716797, 27.316600799560547]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 2.0, 5.0, 5.0, 14.0, 11.0, 17.0, 8.0, 15.0, 24.0, 14.0, 19.0, 23.0, 30.0, 21.0, 28.0, 33.0, 41.0, 37.0, 50.0, 49.0, 44.0, 36.0, 43.0, 42.0, 40.0, 39.0, 36.0, 24.0, 35.0, 33.0, 26.0, 30.0, 16.0, 15.0, 15.0, 16.0, 14.0, 9.0, 6.0, 7.0, 8.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-35.0855827331543, -33.9887580871582, -32.89193344116211, -31.79511070251465, -30.698287963867188, -29.601463317871094, -28.504638671875, -27.40781593322754, -26.310993194580078, -25.214168548583984, -24.117345809936523, -23.02052116394043, -21.92369842529297, -20.826873779296875, -19.73004913330078, -18.63322639465332, -17.536401748657227, -16.439577102661133, -15.342754364013672, -14.245929718017578, -13.149106979370117, -12.052282333374023, -10.955458641052246, -9.858634948730469, -8.761811256408691, -7.664987564086914, -6.568163871765137, -5.471339702606201, -4.374516010284424, -3.2776923179626465, -2.180868148803711, -1.0840444564819336, 0.01277923583984375, 1.1096030473709106, 2.2064268589019775, 3.303250789642334, 4.400074481964111, 5.496898174285889, 6.593722343444824, 7.690546035766602, 8.787369728088379, 9.884193420410156, 10.981017112731934, 12.077840805053711, 13.174665451049805, 14.271488189697266, 15.36831283569336, 16.465137481689453, 17.561960220336914, 18.658784866333008, 19.75560760498047, 20.852432250976562, 21.949254989624023, 23.046079635620117, 24.142902374267578, 25.239727020263672, 26.336551666259766, 27.43337631225586, 28.53019905090332, 29.627023696899414, 30.723846435546875, 31.82067108154297, 32.91749572753906, 34.014320373535156, 35.111141204833984]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 11.0, 22.0, 26.0, 52.0, 92.0, 139.0, 275.0, 431.0, 762.0, 1225.0, 2251.0, 3741.0, 6377.0, 10697.0, 17823.0, 29778.0, 48909.0, 78669.0, 123691.0, 187390.0, 271230.0, 366086.0, 451836.0, 507107.0, 506536.0, 451042.0, 360783.0, 266089.0, 184077.0, 121390.0, 76712.0, 47350.0, 28844.0, 17522.0, 10337.0, 6128.0, 3652.0, 2098.0, 1260.0, 756.0, 458.0, 282.0, 148.0, 86.0, 47.0, 27.0, 23.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.546875, -22.786865234375, -22.02685546875, -21.266845703125, -20.5068359375, -19.746826171875, -18.98681640625, -18.226806640625, -17.466796875, -16.706787109375, -15.94677734375, -15.186767578125, -14.4267578125, -13.666748046875, -12.90673828125, -12.146728515625, -11.38671875, -10.626708984375, -9.86669921875, -9.106689453125, -8.3466796875, -7.586669921875, -6.82666015625, -6.066650390625, -5.306640625, -4.546630859375, -3.78662109375, -3.026611328125, -2.2666015625, -1.506591796875, -0.74658203125, 0.013427734375, 0.7734375, 1.533447265625, 2.29345703125, 3.053466796875, 3.8134765625, 4.573486328125, 5.33349609375, 6.093505859375, 6.853515625, 7.613525390625, 8.37353515625, 9.133544921875, 9.8935546875, 10.653564453125, 11.41357421875, 12.173583984375, 12.93359375, 13.693603515625, 14.45361328125, 15.213623046875, 15.9736328125, 16.733642578125, 17.49365234375, 18.253662109375, 19.013671875, 19.773681640625, 20.53369140625, 21.293701171875, 22.0537109375, 22.813720703125, 23.57373046875, 24.333740234375, 25.09375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 10.0, 14.0, 10.0, 8.0, 14.0, 20.0, 14.0, 18.0, 19.0, 21.0, 28.0, 33.0, 31.0, 26.0, 40.0, 36.0, 37.0, 56.0, 44.0, 50.0, 39.0, 45.0, 44.0, 36.0, 30.0, 32.0, 44.0, 21.0, 26.0, 24.0, 21.0, 26.0, 13.0, 13.0, 10.0, 10.0, 5.0, 6.0, 10.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-31.453125, -30.562744140625, -29.67236328125, -28.781982421875, -27.8916015625, -27.001220703125, -26.11083984375, -25.220458984375, -24.330078125, -23.439697265625, -22.54931640625, -21.658935546875, -20.7685546875, -19.878173828125, -18.98779296875, -18.097412109375, -17.20703125, -16.316650390625, -15.42626953125, -14.535888671875, -13.6455078125, -12.755126953125, -11.86474609375, -10.974365234375, -10.083984375, -9.193603515625, -8.30322265625, -7.412841796875, -6.5224609375, -5.632080078125, -4.74169921875, -3.851318359375, -2.9609375, -2.070556640625, -1.18017578125, -0.289794921875, 0.6005859375, 1.490966796875, 2.38134765625, 3.271728515625, 4.162109375, 5.052490234375, 5.94287109375, 6.833251953125, 7.7236328125, 8.614013671875, 9.50439453125, 10.394775390625, 11.28515625, 12.175537109375, 13.06591796875, 13.956298828125, 14.8466796875, 15.737060546875, 16.62744140625, 17.517822265625, 18.408203125, 19.298583984375, 20.18896484375, 21.079345703125, 21.9697265625, 22.860107421875, 23.75048828125, 24.640869140625, 25.53125]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 3.0, 15.0, 30.0, 40.0, 65.0, 114.0, 157.0, 290.0, 488.0, 759.0, 1288.0, 2045.0, 3232.0, 5286.0, 8156.0, 12683.0, 19413.0, 29535.0, 43795.0, 63950.0, 90407.0, 126574.0, 168791.0, 218043.0, 271050.0, 320028.0, 359007.0, 379377.0, 376799.0, 353851.0, 314721.0, 263808.0, 211216.0, 162102.0, 120669.0, 86585.0, 60118.0, 41101.0, 27670.0, 18379.0, 11908.0, 7569.0, 4943.0, 3112.0, 1918.0, 1203.0, 773.0, 459.0, 260.0, 195.0, 110.0, 72.0, 58.0, 25.0, 21.0, 9.0, 9.0, 8.0, 1.0, 0.0, 2.0], "bins": [-18.9375, -18.3251953125, -17.712890625, -17.1005859375, -16.48828125, -15.8759765625, -15.263671875, -14.6513671875, -14.0390625, -13.4267578125, -12.814453125, -12.2021484375, -11.58984375, -10.9775390625, -10.365234375, -9.7529296875, -9.140625, -8.5283203125, -7.916015625, -7.3037109375, -6.69140625, -6.0791015625, -5.466796875, -4.8544921875, -4.2421875, -3.6298828125, -3.017578125, -2.4052734375, -1.79296875, -1.1806640625, -0.568359375, 0.0439453125, 0.65625, 1.2685546875, 1.880859375, 2.4931640625, 3.10546875, 3.7177734375, 4.330078125, 4.9423828125, 5.5546875, 6.1669921875, 6.779296875, 7.3916015625, 8.00390625, 8.6162109375, 9.228515625, 9.8408203125, 10.453125, 11.0654296875, 11.677734375, 12.2900390625, 12.90234375, 13.5146484375, 14.126953125, 14.7392578125, 15.3515625, 15.9638671875, 16.576171875, 17.1884765625, 17.80078125, 18.4130859375, 19.025390625, 19.6376953125, 20.25]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 8.0, 5.0, 6.0, 8.0, 16.0, 14.0, 13.0, 20.0, 27.0, 19.0, 44.0, 54.0, 50.0, 63.0, 74.0, 100.0, 95.0, 107.0, 129.0, 137.0, 163.0, 143.0, 161.0, 184.0, 173.0, 188.0, 188.0, 166.0, 175.0, 174.0, 148.0, 145.0, 152.0, 133.0, 121.0, 102.0, 93.0, 79.0, 60.0, 74.0, 54.0, 40.0, 38.0, 31.0, 19.0, 14.0, 17.0, 12.0, 10.0, 9.0, 8.0, 7.0, 5.0, 5.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-10.375, -10.029296875, -9.68359375, -9.337890625, -8.9921875, -8.646484375, -8.30078125, -7.955078125, -7.609375, -7.263671875, -6.91796875, -6.572265625, -6.2265625, -5.880859375, -5.53515625, -5.189453125, -4.84375, -4.498046875, -4.15234375, -3.806640625, -3.4609375, -3.115234375, -2.76953125, -2.423828125, -2.078125, -1.732421875, -1.38671875, -1.041015625, -0.6953125, -0.349609375, -0.00390625, 0.341796875, 0.6875, 1.033203125, 1.37890625, 1.724609375, 2.0703125, 2.416015625, 2.76171875, 3.107421875, 3.453125, 3.798828125, 4.14453125, 4.490234375, 4.8359375, 5.181640625, 5.52734375, 5.873046875, 6.21875, 6.564453125, 6.91015625, 7.255859375, 7.6015625, 7.947265625, 8.29296875, 8.638671875, 8.984375, 9.330078125, 9.67578125, 10.021484375, 10.3671875, 10.712890625, 11.05859375, 11.404296875, 11.75]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 8.0, 7.0, 8.0, 11.0, 8.0, 15.0, 21.0, 25.0, 22.0, 30.0, 31.0, 34.0, 28.0, 48.0, 36.0, 42.0, 37.0, 37.0, 58.0, 46.0, 46.0, 37.0, 42.0, 34.0, 42.0, 36.0, 33.0, 26.0, 26.0, 12.0, 22.0, 14.0, 21.0, 11.0, 13.0, 8.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-28.06747817993164, -27.208215713500977, -26.34895133972168, -25.489688873291016, -24.63042449951172, -23.771162033081055, -22.91189956665039, -22.052635192871094, -21.193370819091797, -20.334108352661133, -19.474843978881836, -18.615581512451172, -17.756317138671875, -16.89705467224121, -16.037792205810547, -15.17852783203125, -14.319265365600586, -13.460001945495605, -12.600738525390625, -11.741476058959961, -10.882211685180664, -10.02294921875, -9.16368579864502, -8.304422378540039, -7.445158958435059, -6.585895538330078, -5.726632118225098, -4.867369174957275, -4.008105754852295, -3.1488423347473145, -2.289579391479492, -1.4303159713745117, -0.5710506439208984, 0.2882126569747925, 1.1474759578704834, 2.0067391395568848, 2.8660025596618652, 3.7252659797668457, 4.584528923034668, 5.443792343139648, 6.303055763244629, 7.162319183349609, 8.02158260345459, 8.88084602355957, 9.740108489990234, 10.599372863769531, 11.458635330200195, 12.317898750305176, 13.177162170410156, 14.036425590515137, 14.895689010620117, 15.754951477050781, 16.614215850830078, 17.473478317260742, 18.332740783691406, 19.192005157470703, 20.05126953125, 20.910531997680664, 21.76979637145996, 22.629058837890625, 23.488323211669922, 24.347585678100586, 25.20684814453125, 26.066112518310547, 26.92537498474121]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 8.0, 10.0, 12.0, 16.0, 13.0, 15.0, 20.0, 26.0, 22.0, 19.0, 23.0, 29.0, 34.0, 33.0, 41.0, 53.0, 41.0, 46.0, 46.0, 28.0, 40.0, 43.0, 36.0, 41.0, 38.0, 42.0, 22.0, 23.0, 27.0, 16.0, 20.0, 19.0, 19.0, 13.0, 17.0, 12.0, 10.0, 7.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-30.571224212646484, -29.551654815673828, -28.532087326049805, -27.51251792907715, -26.492950439453125, -25.47338104248047, -24.453811645507812, -23.434242248535156, -22.414674758911133, -21.395105361938477, -20.375537872314453, -19.355968475341797, -18.33639907836914, -17.316831588745117, -16.29726219177246, -15.277693748474121, -14.258125305175781, -13.238556861877441, -12.218988418579102, -11.199419021606445, -10.179850578308105, -9.160282135009766, -8.14071273803711, -7.1211442947387695, -6.10157585144043, -5.08200740814209, -4.062438488006592, -3.042869806289673, -2.023301124572754, -1.003732681274414, 0.015836238861083984, 1.035405158996582, 2.0549697875976562, 3.074538469314575, 4.094107151031494, 5.113676071166992, 6.133244514465332, 7.152812957763672, 8.172382354736328, 9.191950798034668, 10.211519241333008, 11.231087684631348, 12.250656127929688, 13.270225524902344, 14.289793968200684, 15.309362411499023, 16.32893180847168, 17.348499298095703, 18.36806869506836, 19.387638092041016, 20.40720558166504, 21.426774978637695, 22.44634246826172, 23.465911865234375, 24.48548126220703, 25.505050659179688, 26.52461814880371, 27.544187545776367, 28.56375503540039, 29.583324432373047, 30.602893829345703, 31.622461318969727, 32.64202880859375, 33.661598205566406, 34.68116760253906]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 10.0, 11.0, 21.0, 43.0, 67.0, 141.0, 211.0, 365.0, 552.0, 1050.0, 1674.0, 2961.0, 4611.0, 7658.0, 12484.0, 19685.0, 31316.0, 49527.0, 74296.0, 104274.0, 132962.0, 146877.0, 134860.0, 107550.0, 76971.0, 51402.0, 32873.0, 21136.0, 12891.0, 7849.0, 4751.0, 3021.0, 1829.0, 1067.0, 613.0, 379.0, 206.0, 141.0, 90.0, 57.0, 30.0, 17.0, 14.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.8203125, -8.5789794921875, -8.337646484375, -8.0963134765625, -7.85498046875, -7.6136474609375, -7.372314453125, -7.1309814453125, -6.8896484375, -6.6483154296875, -6.406982421875, -6.1656494140625, -5.92431640625, -5.6829833984375, -5.441650390625, -5.2003173828125, -4.958984375, -4.7176513671875, -4.476318359375, -4.2349853515625, -3.99365234375, -3.7523193359375, -3.510986328125, -3.2696533203125, -3.0283203125, -2.7869873046875, -2.545654296875, -2.3043212890625, -2.06298828125, -1.8216552734375, -1.580322265625, -1.3389892578125, -1.09765625, -0.8563232421875, -0.614990234375, -0.3736572265625, -0.13232421875, 0.1090087890625, 0.350341796875, 0.5916748046875, 0.8330078125, 1.0743408203125, 1.315673828125, 1.5570068359375, 1.79833984375, 2.0396728515625, 2.281005859375, 2.5223388671875, 2.763671875, 3.0050048828125, 3.246337890625, 3.4876708984375, 3.72900390625, 3.9703369140625, 4.211669921875, 4.4530029296875, 4.6943359375, 4.9356689453125, 5.177001953125, 5.4183349609375, 5.65966796875, 5.9010009765625, 6.142333984375, 6.3836669921875, 6.625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 9.0, 7.0, 7.0, 17.0, 20.0, 12.0, 18.0, 17.0, 25.0, 25.0, 27.0, 32.0, 37.0, 32.0, 33.0, 41.0, 37.0, 37.0, 54.0, 38.0, 42.0, 40.0, 38.0, 35.0, 37.0, 42.0, 33.0, 32.0, 22.0, 26.0, 18.0, 22.0, 19.0, 14.0, 16.0, 7.0, 10.0, 5.0, 6.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.46875, -31.39794921875, -30.3271484375, -29.25634765625, -28.185546875, -27.11474609375, -26.0439453125, -24.97314453125, -23.90234375, -22.83154296875, -21.7607421875, -20.68994140625, -19.619140625, -18.54833984375, -17.4775390625, -16.40673828125, -15.3359375, -14.26513671875, -13.1943359375, -12.12353515625, -11.052734375, -9.98193359375, -8.9111328125, -7.84033203125, -6.76953125, -5.69873046875, -4.6279296875, -3.55712890625, -2.486328125, -1.41552734375, -0.3447265625, 0.72607421875, 1.796875, 2.86767578125, 3.9384765625, 5.00927734375, 6.080078125, 7.15087890625, 8.2216796875, 9.29248046875, 10.36328125, 11.43408203125, 12.5048828125, 13.57568359375, 14.646484375, 15.71728515625, 16.7880859375, 17.85888671875, 18.9296875, 20.00048828125, 21.0712890625, 22.14208984375, 23.212890625, 24.28369140625, 25.3544921875, 26.42529296875, 27.49609375, 28.56689453125, 29.6376953125, 30.70849609375, 31.779296875, 32.85009765625, 33.9208984375, 34.99169921875, 36.0625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 10.0, 7.0, 7.0, 18.0, 37.0, 39.0, 65.0, 118.0, 185.0, 344.0, 544.0, 1020.0, 1756.0, 3340.0, 6209.0, 11754.0, 22525.0, 41792.0, 76088.0, 126670.0, 179112.0, 194965.0, 156227.0, 101156.0, 58162.0, 31001.0, 16516.0, 8583.0, 4554.0, 2480.0, 1354.0, 785.0, 430.0, 266.0, 167.0, 102.0, 57.0, 40.0, 25.0, 18.0, 11.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1171875, -6.88201904296875, -6.6468505859375, -6.41168212890625, -6.176513671875, -5.94134521484375, -5.7061767578125, -5.47100830078125, -5.23583984375, -5.00067138671875, -4.7655029296875, -4.53033447265625, -4.295166015625, -4.05999755859375, -3.8248291015625, -3.58966064453125, -3.3544921875, -3.11932373046875, -2.8841552734375, -2.64898681640625, -2.413818359375, -2.17864990234375, -1.9434814453125, -1.70831298828125, -1.47314453125, -1.23797607421875, -1.0028076171875, -0.76763916015625, -0.532470703125, -0.29730224609375, -0.0621337890625, 0.17303466796875, 0.408203125, 0.64337158203125, 0.8785400390625, 1.11370849609375, 1.348876953125, 1.58404541015625, 1.8192138671875, 2.05438232421875, 2.28955078125, 2.52471923828125, 2.7598876953125, 2.99505615234375, 3.230224609375, 3.46539306640625, 3.7005615234375, 3.93572998046875, 4.1708984375, 4.40606689453125, 4.6412353515625, 4.87640380859375, 5.111572265625, 5.34674072265625, 5.5819091796875, 5.81707763671875, 6.05224609375, 6.28741455078125, 6.5225830078125, 6.75775146484375, 6.992919921875, 7.22808837890625, 7.4632568359375, 7.69842529296875, 7.93359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 7.0, 8.0, 8.0, 12.0, 8.0, 16.0, 21.0, 18.0, 16.0, 30.0, 24.0, 31.0, 28.0, 31.0, 35.0, 36.0, 45.0, 51.0, 47.0, 36.0, 57.0, 42.0, 50.0, 39.0, 48.0, 38.0, 39.0, 25.0, 16.0, 29.0, 19.0, 15.0, 13.0, 10.0, 15.0, 8.0, 11.0, 2.0, 3.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -22.147216796875, -21.38818359375, -20.629150390625, -19.8701171875, -19.111083984375, -18.35205078125, -17.593017578125, -16.833984375, -16.074951171875, -15.31591796875, -14.556884765625, -13.7978515625, -13.038818359375, -12.27978515625, -11.520751953125, -10.76171875, -10.002685546875, -9.24365234375, -8.484619140625, -7.7255859375, -6.966552734375, -6.20751953125, -5.448486328125, -4.689453125, -3.930419921875, -3.17138671875, -2.412353515625, -1.6533203125, -0.894287109375, -0.13525390625, 0.623779296875, 1.3828125, 2.141845703125, 2.90087890625, 3.659912109375, 4.4189453125, 5.177978515625, 5.93701171875, 6.696044921875, 7.455078125, 8.214111328125, 8.97314453125, 9.732177734375, 10.4912109375, 11.250244140625, 12.00927734375, 12.768310546875, 13.52734375, 14.286376953125, 15.04541015625, 15.804443359375, 16.5634765625, 17.322509765625, 18.08154296875, 18.840576171875, 19.599609375, 20.358642578125, 21.11767578125, 21.876708984375, 22.6357421875, 23.394775390625, 24.15380859375, 24.912841796875, 25.671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 15.0, 13.0, 16.0, 25.0, 39.0, 34.0, 35.0, 83.0, 110.0, 144.0, 190.0, 271.0, 459.0, 618.0, 990.0, 1561.0, 2779.0, 4893.0, 9479.0, 19836.0, 46339.0, 116502.0, 268672.0, 312474.0, 151571.0, 60400.0, 25081.0, 11606.0, 5868.0, 3160.0, 1856.0, 1076.0, 714.0, 492.0, 335.0, 217.0, 147.0, 128.0, 78.0, 68.0, 48.0, 28.0, 17.0, 24.0, 15.0, 9.0, 11.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-2.87109375, -2.781768798828125, -2.69244384765625, -2.603118896484375, -2.5137939453125, -2.424468994140625, -2.33514404296875, -2.245819091796875, -2.156494140625, -2.067169189453125, -1.97784423828125, -1.888519287109375, -1.7991943359375, -1.709869384765625, -1.62054443359375, -1.531219482421875, -1.44189453125, -1.352569580078125, -1.26324462890625, -1.173919677734375, -1.0845947265625, -0.995269775390625, -0.90594482421875, -0.816619873046875, -0.727294921875, -0.637969970703125, -0.54864501953125, -0.459320068359375, -0.3699951171875, -0.280670166015625, -0.19134521484375, -0.102020263671875, -0.0126953125, 0.076629638671875, 0.16595458984375, 0.255279541015625, 0.3446044921875, 0.433929443359375, 0.52325439453125, 0.612579345703125, 0.701904296875, 0.791229248046875, 0.88055419921875, 0.969879150390625, 1.0592041015625, 1.148529052734375, 1.23785400390625, 1.327178955078125, 1.41650390625, 1.505828857421875, 1.59515380859375, 1.684478759765625, 1.7738037109375, 1.863128662109375, 1.95245361328125, 2.041778564453125, 2.131103515625, 2.220428466796875, 2.30975341796875, 2.399078369140625, 2.4884033203125, 2.577728271484375, 2.66705322265625, 2.756378173828125, 2.845703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 1.0, 6.0, 11.0, 9.0, 10.0, 15.0, 19.0, 22.0, 29.0, 29.0, 44.0, 51.0, 52.0, 73.0, 77.0, 82.0, 73.0, 76.0, 63.0, 57.0, 37.0, 50.0, 28.0, 25.0, 13.0, 10.0, 11.0, 4.0, 8.0, 4.0, 2.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00042939186096191406, -0.00041761621832847595, -0.00040584057569503784, -0.00039406493306159973, -0.0003822892904281616, -0.0003705136477947235, -0.0003587380051612854, -0.0003469623625278473, -0.0003351867198944092, -0.00032341107726097107, -0.00031163543462753296, -0.00029985979199409485, -0.00028808414936065674, -0.00027630850672721863, -0.0002645328640937805, -0.0002527572214603424, -0.0002409815788269043, -0.0002292059361934662, -0.00021743029356002808, -0.00020565465092658997, -0.00019387900829315186, -0.00018210336565971375, -0.00017032772302627563, -0.00015855208039283752, -0.00014677643775939941, -0.0001350007951259613, -0.0001232251524925232, -0.00011144950985908508, -9.967386722564697e-05, -8.789822459220886e-05, -7.612258195877075e-05, -6.434693932533264e-05, -5.257129669189453e-05, -4.079565405845642e-05, -2.902001142501831e-05, -1.72443687915802e-05, -5.46872615814209e-06, 6.3069164752960205e-06, 1.808255910873413e-05, 2.985820174217224e-05, 4.163384437561035e-05, 5.340948700904846e-05, 6.518512964248657e-05, 7.696077227592468e-05, 8.873641490936279e-05, 0.0001005120575428009, 0.00011228770017623901, 0.00012406334280967712, 0.00013583898544311523, 0.00014761462807655334, 0.00015939027070999146, 0.00017116591334342957, 0.00018294155597686768, 0.00019471719861030579, 0.0002064928412437439, 0.000218268483877182, 0.00023004412651062012, 0.00024181976914405823, 0.00025359541177749634, 0.00026537105441093445, 0.00027714669704437256, 0.00028892233967781067, 0.0003006979823112488, 0.0003124736249446869, 0.000324249267578125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 9.0, 10.0, 6.0, 11.0, 13.0, 21.0, 33.0, 46.0, 59.0, 86.0, 83.0, 159.0, 228.0, 342.0, 468.0, 661.0, 972.0, 1347.0, 2018.0, 3084.0, 4873.0, 7765.0, 12549.0, 21151.0, 37565.0, 68089.0, 121573.0, 195052.0, 217249.0, 150890.0, 86279.0, 47539.0, 26492.0, 15289.0, 9181.0, 5785.0, 3682.0, 2503.0, 1607.0, 1184.0, 756.0, 537.0, 393.0, 298.0, 198.0, 138.0, 96.0, 58.0, 48.0, 32.0, 19.0, 9.0, 10.0, 8.0, 7.0, 6.0, 2.0], "bins": [-4.2421875, -4.121673583984375, -4.00115966796875, -3.880645751953125, -3.7601318359375, -3.639617919921875, -3.51910400390625, -3.398590087890625, -3.278076171875, -3.157562255859375, -3.03704833984375, -2.916534423828125, -2.7960205078125, -2.675506591796875, -2.55499267578125, -2.434478759765625, -2.31396484375, -2.193450927734375, -2.07293701171875, -1.952423095703125, -1.8319091796875, -1.711395263671875, -1.59088134765625, -1.470367431640625, -1.349853515625, -1.229339599609375, -1.10882568359375, -0.988311767578125, -0.8677978515625, -0.747283935546875, -0.62677001953125, -0.506256103515625, -0.3857421875, -0.265228271484375, -0.14471435546875, -0.024200439453125, 0.0963134765625, 0.216827392578125, 0.33734130859375, 0.457855224609375, 0.578369140625, 0.698883056640625, 0.81939697265625, 0.939910888671875, 1.0604248046875, 1.180938720703125, 1.30145263671875, 1.421966552734375, 1.54248046875, 1.662994384765625, 1.78350830078125, 1.904022216796875, 2.0245361328125, 2.145050048828125, 2.26556396484375, 2.386077880859375, 2.506591796875, 2.627105712890625, 2.74761962890625, 2.868133544921875, 2.9886474609375, 3.109161376953125, 3.22967529296875, 3.350189208984375, 3.470703125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 7.0, 6.0, 10.0, 13.0, 20.0, 20.0, 27.0, 39.0, 40.0, 51.0, 62.0, 66.0, 81.0, 80.0, 82.0, 69.0, 61.0, 44.0, 54.0, 34.0, 25.0, 26.0, 13.0, 17.0, 14.0, 9.0, 3.0, 13.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.427734375, -1.379791259765625, -1.33184814453125, -1.283905029296875, -1.2359619140625, -1.188018798828125, -1.14007568359375, -1.092132568359375, -1.044189453125, -0.996246337890625, -0.94830322265625, -0.900360107421875, -0.8524169921875, -0.804473876953125, -0.75653076171875, -0.708587646484375, -0.66064453125, -0.612701416015625, -0.56475830078125, -0.516815185546875, -0.4688720703125, -0.420928955078125, -0.37298583984375, -0.325042724609375, -0.277099609375, -0.229156494140625, -0.18121337890625, -0.133270263671875, -0.0853271484375, -0.037384033203125, 0.01055908203125, 0.058502197265625, 0.1064453125, 0.154388427734375, 0.20233154296875, 0.250274658203125, 0.2982177734375, 0.346160888671875, 0.39410400390625, 0.442047119140625, 0.489990234375, 0.537933349609375, 0.58587646484375, 0.633819580078125, 0.6817626953125, 0.729705810546875, 0.77764892578125, 0.825592041015625, 0.87353515625, 0.921478271484375, 0.96942138671875, 1.017364501953125, 1.0653076171875, 1.113250732421875, 1.16119384765625, 1.209136962890625, 1.257080078125, 1.305023193359375, 1.35296630859375, 1.400909423828125, 1.4488525390625, 1.496795654296875, 1.54473876953125, 1.592681884765625, 1.640625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 5.0, 10.0, 7.0, 7.0, 7.0, 11.0, 9.0, 19.0, 20.0, 28.0, 22.0, 31.0, 38.0, 39.0, 38.0, 46.0, 36.0, 39.0, 45.0, 52.0, 34.0, 51.0, 47.0, 38.0, 40.0, 34.0, 46.0, 25.0, 29.0, 32.0, 20.0, 14.0, 14.0, 21.0, 13.0, 5.0, 11.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-29.735157012939453, -28.855043411254883, -27.974929809570312, -27.094816207885742, -26.214702606201172, -25.3345890045166, -24.45447540283203, -23.57436180114746, -22.69424819946289, -21.81413459777832, -20.93402099609375, -20.05390739440918, -19.17379379272461, -18.29368019104004, -17.41356658935547, -16.5334529876709, -15.653340339660645, -14.773226737976074, -13.893113136291504, -13.012999534606934, -12.132885932922363, -11.25277328491211, -10.372659683227539, -9.492546081542969, -8.612432479858398, -7.732318878173828, -6.852205276489258, -5.9720916748046875, -5.091978073120117, -4.211864948272705, -3.3317513465881348, -2.4516377449035645, -1.571523666381836, -0.6914101243019104, 0.18870341777801514, 1.068816900253296, 1.9489305019378662, 2.8290438652038574, 3.7091574668884277, 4.589271068572998, 5.469384670257568, 6.349498271942139, 7.229611873626709, 8.109724998474121, 8.989838600158691, 9.869952201843262, 10.750065803527832, 11.630179405212402, 12.510293006896973, 13.390406608581543, 14.270520210266113, 15.150633811950684, 16.030746459960938, 16.910860061645508, 17.790973663330078, 18.67108726501465, 19.55120086669922, 20.43131446838379, 21.31142807006836, 22.19154167175293, 23.0716552734375, 23.95176887512207, 24.83188247680664, 25.71199607849121, 26.59210968017578]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 8.0, 8.0, 13.0, 16.0, 12.0, 12.0, 20.0, 27.0, 22.0, 21.0, 19.0, 33.0, 33.0, 28.0, 38.0, 49.0, 47.0, 37.0, 53.0, 26.0, 41.0, 47.0, 36.0, 37.0, 43.0, 35.0, 33.0, 21.0, 22.0, 20.0, 21.0, 18.0, 17.0, 20.0, 14.0, 11.0, 9.0, 7.0, 12.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-30.27671241760254, -29.27250862121582, -28.268306732177734, -27.264102935791016, -26.259899139404297, -25.25569725036621, -24.251493453979492, -23.247291564941406, -22.243087768554688, -21.23888397216797, -20.234682083129883, -19.230478286743164, -18.226276397705078, -17.22207260131836, -16.21786880493164, -15.213665962219238, -14.209463119506836, -13.205260276794434, -12.201057434082031, -11.196853637695312, -10.19265079498291, -9.188447952270508, -8.184244155883789, -7.180041313171387, -6.175838470458984, -5.171635627746582, -4.1674323081970215, -3.16322922706604, -2.1590261459350586, -1.1548233032226562, -0.1506199836730957, 0.8535833358764648, 1.8577842712402344, 2.861987352371216, 3.8661904335021973, 4.870393753051758, 5.87459659576416, 6.8787994384765625, 7.883002758026123, 8.887206077575684, 9.891408920288086, 10.895611763000488, 11.89981460571289, 12.90401840209961, 13.908221244812012, 14.912424087524414, 15.916627883911133, 16.92082977294922, 17.925033569335938, 18.929237365722656, 19.933439254760742, 20.93764305114746, 21.941844940185547, 22.946048736572266, 23.950252532958984, 24.954456329345703, 25.95865821838379, 26.962862014770508, 27.967063903808594, 28.971267700195312, 29.97547149658203, 30.979673385620117, 31.983877182006836, 32.98807907104492, 33.99228286743164]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 5.0, 9.0, 7.0, 14.0, 21.0, 34.0, 62.0, 76.0, 133.0, 215.0, 335.0, 537.0, 763.0, 1244.0, 2032.0, 3066.0, 4731.0, 7131.0, 10785.0, 15793.0, 22746.0, 31818.0, 43320.0, 55669.0, 69277.0, 81762.0, 91040.0, 96755.0, 95439.0, 88750.0, 78096.0, 65223.0, 51544.0, 39279.0, 28948.0, 20526.0, 14074.0, 9506.0, 6247.0, 4141.0, 2628.0, 1757.0, 1114.0, 671.0, 448.0, 303.0, 177.0, 102.0, 90.0, 43.0, 23.0, 20.0, 17.0, 9.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-20.703125, -20.052978515625, -19.40283203125, -18.752685546875, -18.1025390625, -17.452392578125, -16.80224609375, -16.152099609375, -15.501953125, -14.851806640625, -14.20166015625, -13.551513671875, -12.9013671875, -12.251220703125, -11.60107421875, -10.950927734375, -10.30078125, -9.650634765625, -9.00048828125, -8.350341796875, -7.7001953125, -7.050048828125, -6.39990234375, -5.749755859375, -5.099609375, -4.449462890625, -3.79931640625, -3.149169921875, -2.4990234375, -1.848876953125, -1.19873046875, -0.548583984375, 0.1015625, 0.751708984375, 1.40185546875, 2.052001953125, 2.7021484375, 3.352294921875, 4.00244140625, 4.652587890625, 5.302734375, 5.952880859375, 6.60302734375, 7.253173828125, 7.9033203125, 8.553466796875, 9.20361328125, 9.853759765625, 10.50390625, 11.154052734375, 11.80419921875, 12.454345703125, 13.1044921875, 13.754638671875, 14.40478515625, 15.054931640625, 15.705078125, 16.355224609375, 17.00537109375, 17.655517578125, 18.3056640625, 18.955810546875, 19.60595703125, 20.256103515625, 20.90625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 12.0, 14.0, 15.0, 11.0, 16.0, 16.0, 21.0, 18.0, 26.0, 26.0, 29.0, 18.0, 33.0, 39.0, 42.0, 45.0, 50.0, 51.0, 40.0, 43.0, 37.0, 36.0, 37.0, 28.0, 38.0, 36.0, 27.0, 24.0, 22.0, 33.0, 26.0, 18.0, 12.0, 13.0, 16.0, 6.0, 8.0, 8.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.953125, -29.938232421875, -28.92333984375, -27.908447265625, -26.8935546875, -25.878662109375, -24.86376953125, -23.848876953125, -22.833984375, -21.819091796875, -20.80419921875, -19.789306640625, -18.7744140625, -17.759521484375, -16.74462890625, -15.729736328125, -14.71484375, -13.699951171875, -12.68505859375, -11.670166015625, -10.6552734375, -9.640380859375, -8.62548828125, -7.610595703125, -6.595703125, -5.580810546875, -4.56591796875, -3.551025390625, -2.5361328125, -1.521240234375, -0.50634765625, 0.508544921875, 1.5234375, 2.538330078125, 3.55322265625, 4.568115234375, 5.5830078125, 6.597900390625, 7.61279296875, 8.627685546875, 9.642578125, 10.657470703125, 11.67236328125, 12.687255859375, 13.7021484375, 14.717041015625, 15.73193359375, 16.746826171875, 17.76171875, 18.776611328125, 19.79150390625, 20.806396484375, 21.8212890625, 22.836181640625, 23.85107421875, 24.865966796875, 25.880859375, 26.895751953125, 27.91064453125, 28.925537109375, 29.9404296875, 30.955322265625, 31.97021484375, 32.985107421875, 34.0]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 11.0, 14.0, 31.0, 34.0, 72.0, 96.0, 189.0, 324.0, 508.0, 889.0, 1456.0, 2438.0, 4093.0, 6356.0, 10204.0, 16118.0, 24820.0, 37724.0, 53766.0, 71963.0, 91136.0, 106023.0, 114890.0, 113265.0, 101870.0, 85214.0, 65899.0, 47194.0, 33198.0, 21692.0, 14237.0, 8679.0, 5519.0, 3498.0, 2050.0, 1252.0, 711.0, 420.0, 280.0, 165.0, 97.0, 60.0, 35.0, 14.0, 19.0, 11.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-24.421875, -23.6298828125, -22.837890625, -22.0458984375, -21.25390625, -20.4619140625, -19.669921875, -18.8779296875, -18.0859375, -17.2939453125, -16.501953125, -15.7099609375, -14.91796875, -14.1259765625, -13.333984375, -12.5419921875, -11.75, -10.9580078125, -10.166015625, -9.3740234375, -8.58203125, -7.7900390625, -6.998046875, -6.2060546875, -5.4140625, -4.6220703125, -3.830078125, -3.0380859375, -2.24609375, -1.4541015625, -0.662109375, 0.1298828125, 0.921875, 1.7138671875, 2.505859375, 3.2978515625, 4.08984375, 4.8818359375, 5.673828125, 6.4658203125, 7.2578125, 8.0498046875, 8.841796875, 9.6337890625, 10.42578125, 11.2177734375, 12.009765625, 12.8017578125, 13.59375, 14.3857421875, 15.177734375, 15.9697265625, 16.76171875, 17.5537109375, 18.345703125, 19.1376953125, 19.9296875, 20.7216796875, 21.513671875, 22.3056640625, 23.09765625, 23.8896484375, 24.681640625, 25.4736328125, 26.265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 5.0, 7.0, 11.0, 7.0, 7.0, 7.0, 19.0, 19.0, 14.0, 26.0, 12.0, 34.0, 19.0, 33.0, 30.0, 38.0, 32.0, 44.0, 34.0, 26.0, 30.0, 43.0, 46.0, 49.0, 38.0, 33.0, 44.0, 39.0, 26.0, 26.0, 29.0, 21.0, 26.0, 19.0, 15.0, 15.0, 19.0, 9.0, 7.0, 6.0, 7.0, 6.0, 7.0, 6.0, 2.0, 6.0, 3.0, 3.0, 1.0], "bins": [-22.828125, -22.19921875, -21.5703125, -20.94140625, -20.3125, -19.68359375, -19.0546875, -18.42578125, -17.796875, -17.16796875, -16.5390625, -15.91015625, -15.28125, -14.65234375, -14.0234375, -13.39453125, -12.765625, -12.13671875, -11.5078125, -10.87890625, -10.25, -9.62109375, -8.9921875, -8.36328125, -7.734375, -7.10546875, -6.4765625, -5.84765625, -5.21875, -4.58984375, -3.9609375, -3.33203125, -2.703125, -2.07421875, -1.4453125, -0.81640625, -0.1875, 0.44140625, 1.0703125, 1.69921875, 2.328125, 2.95703125, 3.5859375, 4.21484375, 4.84375, 5.47265625, 6.1015625, 6.73046875, 7.359375, 7.98828125, 8.6171875, 9.24609375, 9.875, 10.50390625, 11.1328125, 11.76171875, 12.390625, 13.01953125, 13.6484375, 14.27734375, 14.90625, 15.53515625, 16.1640625, 16.79296875, 17.421875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 9.0, 11.0, 11.0, 25.0, 29.0, 43.0, 56.0, 77.0, 113.0, 146.0, 235.0, 353.0, 594.0, 1069.0, 1849.0, 3391.0, 6785.0, 14911.0, 35909.0, 94753.0, 221059.0, 308475.0, 209476.0, 87716.0, 33695.0, 13806.0, 6460.0, 3187.0, 1666.0, 1017.0, 588.0, 333.0, 232.0, 124.0, 85.0, 53.0, 48.0, 40.0, 27.0, 21.0, 20.0, 9.0, 9.0, 9.0, 6.0, 4.0, 3.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-25.953125, -25.10107421875, -24.2490234375, -23.39697265625, -22.544921875, -21.69287109375, -20.8408203125, -19.98876953125, -19.13671875, -18.28466796875, -17.4326171875, -16.58056640625, -15.728515625, -14.87646484375, -14.0244140625, -13.17236328125, -12.3203125, -11.46826171875, -10.6162109375, -9.76416015625, -8.912109375, -8.06005859375, -7.2080078125, -6.35595703125, -5.50390625, -4.65185546875, -3.7998046875, -2.94775390625, -2.095703125, -1.24365234375, -0.3916015625, 0.46044921875, 1.3125, 2.16455078125, 3.0166015625, 3.86865234375, 4.720703125, 5.57275390625, 6.4248046875, 7.27685546875, 8.12890625, 8.98095703125, 9.8330078125, 10.68505859375, 11.537109375, 12.38916015625, 13.2412109375, 14.09326171875, 14.9453125, 15.79736328125, 16.6494140625, 17.50146484375, 18.353515625, 19.20556640625, 20.0576171875, 20.90966796875, 21.76171875, 22.61376953125, 23.4658203125, 24.31787109375, 25.169921875, 26.02197265625, 26.8740234375, 27.72607421875, 28.578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 2.0, 2.0, 5.0, 4.0, 9.0, 17.0, 14.0, 23.0, 27.0, 42.0, 45.0, 76.0, 46.0, 85.0, 78.0, 94.0, 83.0, 74.0, 64.0, 58.0, 26.0, 25.0, 21.0, 23.0, 9.0, 12.0, 6.0, 7.0, 8.0, 7.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021915435791015625, -0.0021255016326904297, -0.002059459686279297, -0.001993417739868164, -0.0019273757934570312, -0.0018613338470458984, -0.0017952919006347656, -0.0017292499542236328, -0.0016632080078125, -0.0015971660614013672, -0.0015311241149902344, -0.0014650821685791016, -0.0013990402221679688, -0.001332998275756836, -0.0012669563293457031, -0.0012009143829345703, -0.0011348724365234375, -0.0010688304901123047, -0.0010027885437011719, -0.0009367465972900391, -0.0008707046508789062, -0.0008046627044677734, -0.0007386207580566406, -0.0006725788116455078, -0.000606536865234375, -0.0005404949188232422, -0.0004744529724121094, -0.00040841102600097656, -0.00034236907958984375, -0.00027632713317871094, -0.00021028518676757812, -0.0001442432403564453, -7.82012939453125e-05, -1.2159347534179688e-05, 5.3882598876953125e-05, 0.00011992454528808594, 0.00018596649169921875, 0.00025200843811035156, 0.0003180503845214844, 0.0003840923309326172, 0.00045013427734375, 0.0005161762237548828, 0.0005822181701660156, 0.0006482601165771484, 0.0007143020629882812, 0.0007803440093994141, 0.0008463859558105469, 0.0009124279022216797, 0.0009784698486328125, 0.0010445117950439453, 0.0011105537414550781, 0.001176595687866211, 0.0012426376342773438, 0.0013086795806884766, 0.0013747215270996094, 0.0014407634735107422, 0.001506805419921875, 0.0015728473663330078, 0.0016388893127441406, 0.0017049312591552734, 0.0017709732055664062, 0.001837015151977539, 0.0019030570983886719, 0.0019690990447998047, 0.0020351409912109375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 7.0, 18.0, 16.0, 23.0, 29.0, 38.0, 55.0, 69.0, 100.0, 144.0, 148.0, 233.0, 340.0, 447.0, 746.0, 1159.0, 2358.0, 4948.0, 11285.0, 27418.0, 66821.0, 151477.0, 253333.0, 254785.0, 153953.0, 68304.0, 27825.0, 11439.0, 4971.0, 2315.0, 1278.0, 763.0, 443.0, 321.0, 248.0, 169.0, 132.0, 106.0, 71.0, 64.0, 39.0, 34.0, 24.0, 13.0, 12.0, 3.0, 8.0, 6.0, 6.0, 3.0, 3.0], "bins": [-27.5, -26.736328125, -25.97265625, -25.208984375, -24.4453125, -23.681640625, -22.91796875, -22.154296875, -21.390625, -20.626953125, -19.86328125, -19.099609375, -18.3359375, -17.572265625, -16.80859375, -16.044921875, -15.28125, -14.517578125, -13.75390625, -12.990234375, -12.2265625, -11.462890625, -10.69921875, -9.935546875, -9.171875, -8.408203125, -7.64453125, -6.880859375, -6.1171875, -5.353515625, -4.58984375, -3.826171875, -3.0625, -2.298828125, -1.53515625, -0.771484375, -0.0078125, 0.755859375, 1.51953125, 2.283203125, 3.046875, 3.810546875, 4.57421875, 5.337890625, 6.1015625, 6.865234375, 7.62890625, 8.392578125, 9.15625, 9.919921875, 10.68359375, 11.447265625, 12.2109375, 12.974609375, 13.73828125, 14.501953125, 15.265625, 16.029296875, 16.79296875, 17.556640625, 18.3203125, 19.083984375, 19.84765625, 20.611328125, 21.375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 3.0, 15.0, 13.0, 20.0, 14.0, 27.0, 31.0, 41.0, 52.0, 54.0, 79.0, 71.0, 68.0, 68.0, 80.0, 72.0, 69.0, 38.0, 46.0, 27.0, 34.0, 17.0, 19.0, 13.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.5081787109375, -6.258544921875, -6.0089111328125, -5.75927734375, -5.5096435546875, -5.260009765625, -5.0103759765625, -4.7607421875, -4.5111083984375, -4.261474609375, -4.0118408203125, -3.76220703125, -3.5125732421875, -3.262939453125, -3.0133056640625, -2.763671875, -2.5140380859375, -2.264404296875, -2.0147705078125, -1.76513671875, -1.5155029296875, -1.265869140625, -1.0162353515625, -0.7666015625, -0.5169677734375, -0.267333984375, -0.0177001953125, 0.23193359375, 0.4815673828125, 0.731201171875, 0.9808349609375, 1.23046875, 1.4801025390625, 1.729736328125, 1.9793701171875, 2.22900390625, 2.4786376953125, 2.728271484375, 2.9779052734375, 3.2275390625, 3.4771728515625, 3.726806640625, 3.9764404296875, 4.22607421875, 4.4757080078125, 4.725341796875, 4.9749755859375, 5.224609375, 5.4742431640625, 5.723876953125, 5.9735107421875, 6.22314453125, 6.4727783203125, 6.722412109375, 6.9720458984375, 7.2216796875, 7.4713134765625, 7.720947265625, 7.9705810546875, 8.22021484375, 8.4698486328125, 8.719482421875, 8.9691162109375, 9.21875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 5.0, 9.0, 12.0, 7.0, 6.0, 21.0, 21.0, 30.0, 18.0, 35.0, 26.0, 32.0, 43.0, 41.0, 40.0, 55.0, 53.0, 37.0, 41.0, 47.0, 50.0, 53.0, 41.0, 30.0, 25.0, 31.0, 37.0, 26.0, 19.0, 20.0, 12.0, 16.0, 11.0, 8.0, 10.0, 3.0, 6.0, 8.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.68899917602539, -28.79994010925293, -27.9108829498291, -27.02182388305664, -26.13276481628418, -25.24370574951172, -24.35464859008789, -23.46558952331543, -22.57653045654297, -21.687471389770508, -20.79841423034668, -19.90935516357422, -19.020296096801758, -18.131237030029297, -17.24217987060547, -16.353120803833008, -15.46406364440918, -14.575005531311035, -13.685946464538574, -12.79688835144043, -11.907829284667969, -11.018771171569824, -10.12971305847168, -9.240653991699219, -8.351595878601074, -7.4625372886657715, -6.573478698730469, -5.684420585632324, -4.7953619956970215, -3.9063034057617188, -3.017245292663574, -2.1281867027282715, -1.239126205444336, -0.35006773471832275, 0.5389907360076904, 1.428049087524414, 2.317107677459717, 3.2061662673950195, 4.095224380493164, 4.984282970428467, 5.8733415603637695, 6.762400150299072, 7.651458740234375, 8.54051685333252, 9.429574966430664, 10.318634033203125, 11.20769214630127, 12.096750259399414, 12.985809326171875, 13.87486743927002, 14.76392650604248, 15.652984619140625, 16.542043685913086, 17.431102752685547, 18.320159912109375, 19.209218978881836, 20.098278045654297, 20.987337112426758, 21.876394271850586, 22.765453338623047, 23.654512405395508, 24.54357147216797, 25.432628631591797, 26.321687698364258, 27.210744857788086]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 7.0, 8.0, 7.0, 10.0, 16.0, 14.0, 11.0, 25.0, 15.0, 23.0, 30.0, 40.0, 30.0, 41.0, 37.0, 49.0, 36.0, 55.0, 42.0, 41.0, 48.0, 38.0, 45.0, 37.0, 45.0, 34.0, 29.0, 20.0, 30.0, 20.0, 16.0, 23.0, 25.0, 7.0, 14.0, 8.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.83268737792969, -31.704620361328125, -30.576553344726562, -29.448486328125, -28.320417404174805, -27.192350387573242, -26.06428337097168, -24.936216354370117, -23.808147430419922, -22.68008041381836, -21.552013397216797, -20.423946380615234, -19.29587745666504, -18.167810440063477, -17.039743423461914, -15.911676406860352, -14.783609390258789, -13.655542373657227, -12.527474403381348, -11.399407386779785, -10.271339416503906, -9.143272399902344, -8.015205383300781, -6.8871378898620605, -5.75907039642334, -4.631002902984619, -3.5029356479644775, -2.374868392944336, -1.2468008995056152, -0.11873340606689453, 1.009333610534668, 2.1374011039733887, 3.2654685974121094, 4.39353609085083, 5.521603584289551, 6.649670600891113, 7.777738094329834, 8.905805587768555, 10.033872604370117, 11.16193962097168, 12.290007591247559, 13.418074607849121, 14.546142578125, 15.674209594726562, 16.802276611328125, 17.930343627929688, 19.05841064453125, 20.186479568481445, 21.314546585083008, 22.44261360168457, 23.570680618286133, 24.698749542236328, 25.82681655883789, 26.954883575439453, 28.082950592041016, 29.211017608642578, 30.33908462524414, 31.467151641845703, 32.595218658447266, 33.72328567504883, 34.85135269165039, 35.97942352294922, 37.10749053955078, 38.235557556152344, 39.363624572753906]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 6.0, 12.0, 17.0, 31.0, 52.0, 104.0, 144.0, 227.0, 387.0, 599.0, 893.0, 1458.0, 2378.0, 3892.0, 5840.0, 9503.0, 15062.0, 23837.0, 37163.0, 57320.0, 86289.0, 129044.0, 184690.0, 254244.0, 329482.0, 398577.0, 447319.0, 456187.0, 426556.0, 364133.0, 289105.0, 216000.0, 153390.0, 105205.0, 70105.0, 45635.0, 29094.0, 18421.0, 11825.0, 7433.0, 4666.0, 2960.0, 1842.0, 1148.0, 706.0, 491.0, 314.0, 210.0, 125.0, 53.0, 42.0, 30.0, 21.0, 14.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0], "bins": [-19.40625, -18.7646484375, -18.123046875, -17.4814453125, -16.83984375, -16.1982421875, -15.556640625, -14.9150390625, -14.2734375, -13.6318359375, -12.990234375, -12.3486328125, -11.70703125, -11.0654296875, -10.423828125, -9.7822265625, -9.140625, -8.4990234375, -7.857421875, -7.2158203125, -6.57421875, -5.9326171875, -5.291015625, -4.6494140625, -4.0078125, -3.3662109375, -2.724609375, -2.0830078125, -1.44140625, -0.7998046875, -0.158203125, 0.4833984375, 1.125, 1.7666015625, 2.408203125, 3.0498046875, 3.69140625, 4.3330078125, 4.974609375, 5.6162109375, 6.2578125, 6.8994140625, 7.541015625, 8.1826171875, 8.82421875, 9.4658203125, 10.107421875, 10.7490234375, 11.390625, 12.0322265625, 12.673828125, 13.3154296875, 13.95703125, 14.5986328125, 15.240234375, 15.8818359375, 16.5234375, 17.1650390625, 17.806640625, 18.4482421875, 19.08984375, 19.7314453125, 20.373046875, 21.0146484375, 21.65625]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 5.0, 2.0, 4.0, 7.0, 7.0, 6.0, 20.0, 15.0, 18.0, 21.0, 22.0, 26.0, 32.0, 35.0, 40.0, 37.0, 41.0, 40.0, 37.0, 60.0, 44.0, 35.0, 51.0, 48.0, 43.0, 39.0, 40.0, 44.0, 27.0, 24.0, 26.0, 21.0, 18.0, 15.0, 10.0, 10.0, 7.0, 5.0, 10.0, 7.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.84375, -24.939453125, -24.03515625, -23.130859375, -22.2265625, -21.322265625, -20.41796875, -19.513671875, -18.609375, -17.705078125, -16.80078125, -15.896484375, -14.9921875, -14.087890625, -13.18359375, -12.279296875, -11.375, -10.470703125, -9.56640625, -8.662109375, -7.7578125, -6.853515625, -5.94921875, -5.044921875, -4.140625, -3.236328125, -2.33203125, -1.427734375, -0.5234375, 0.380859375, 1.28515625, 2.189453125, 3.09375, 3.998046875, 4.90234375, 5.806640625, 6.7109375, 7.615234375, 8.51953125, 9.423828125, 10.328125, 11.232421875, 12.13671875, 13.041015625, 13.9453125, 14.849609375, 15.75390625, 16.658203125, 17.5625, 18.466796875, 19.37109375, 20.275390625, 21.1796875, 22.083984375, 22.98828125, 23.892578125, 24.796875, 25.701171875, 26.60546875, 27.509765625, 28.4140625, 29.318359375, 30.22265625, 31.126953125, 32.03125]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 21.0, 48.0, 78.0, 122.0, 221.0, 400.0, 697.0, 1165.0, 2153.0, 3671.0, 6006.0, 10004.0, 16786.0, 26700.0, 42582.0, 65196.0, 97316.0, 141623.0, 195313.0, 259396.0, 324635.0, 381016.0, 418428.0, 425820.0, 403116.0, 353899.0, 290411.0, 225806.0, 166253.0, 117576.0, 79540.0, 52287.0, 33440.0, 21039.0, 12866.0, 7780.0, 4554.0, 2736.0, 1513.0, 895.0, 507.0, 286.0, 174.0, 85.0, 53.0, 36.0, 15.0, 15.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-21.5625, -20.913818359375, -20.26513671875, -19.616455078125, -18.9677734375, -18.319091796875, -17.67041015625, -17.021728515625, -16.373046875, -15.724365234375, -15.07568359375, -14.427001953125, -13.7783203125, -13.129638671875, -12.48095703125, -11.832275390625, -11.18359375, -10.534912109375, -9.88623046875, -9.237548828125, -8.5888671875, -7.940185546875, -7.29150390625, -6.642822265625, -5.994140625, -5.345458984375, -4.69677734375, -4.048095703125, -3.3994140625, -2.750732421875, -2.10205078125, -1.453369140625, -0.8046875, -0.156005859375, 0.49267578125, 1.141357421875, 1.7900390625, 2.438720703125, 3.08740234375, 3.736083984375, 4.384765625, 5.033447265625, 5.68212890625, 6.330810546875, 6.9794921875, 7.628173828125, 8.27685546875, 8.925537109375, 9.57421875, 10.222900390625, 10.87158203125, 11.520263671875, 12.1689453125, 12.817626953125, 13.46630859375, 14.114990234375, 14.763671875, 15.412353515625, 16.06103515625, 16.709716796875, 17.3583984375, 18.007080078125, 18.65576171875, 19.304443359375, 19.953125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 8.0, 7.0, 13.0, 12.0, 20.0, 36.0, 26.0, 40.0, 42.0, 68.0, 64.0, 93.0, 102.0, 130.0, 142.0, 173.0, 174.0, 175.0, 216.0, 205.0, 203.0, 203.0, 214.0, 207.0, 182.0, 185.0, 174.0, 150.0, 149.0, 131.0, 92.0, 74.0, 73.0, 65.0, 43.0, 41.0, 38.0, 23.0, 32.0, 11.0, 8.0, 6.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.796875, -10.42578125, -10.0546875, -9.68359375, -9.3125, -8.94140625, -8.5703125, -8.19921875, -7.828125, -7.45703125, -7.0859375, -6.71484375, -6.34375, -5.97265625, -5.6015625, -5.23046875, -4.859375, -4.48828125, -4.1171875, -3.74609375, -3.375, -3.00390625, -2.6328125, -2.26171875, -1.890625, -1.51953125, -1.1484375, -0.77734375, -0.40625, -0.03515625, 0.3359375, 0.70703125, 1.078125, 1.44921875, 1.8203125, 2.19140625, 2.5625, 2.93359375, 3.3046875, 3.67578125, 4.046875, 4.41796875, 4.7890625, 5.16015625, 5.53125, 5.90234375, 6.2734375, 6.64453125, 7.015625, 7.38671875, 7.7578125, 8.12890625, 8.5, 8.87109375, 9.2421875, 9.61328125, 9.984375, 10.35546875, 10.7265625, 11.09765625, 11.46875, 11.83984375, 12.2109375, 12.58203125, 12.953125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 7.0, 10.0, 12.0, 13.0, 8.0, 20.0, 23.0, 25.0, 35.0, 31.0, 34.0, 32.0, 35.0, 47.0, 54.0, 56.0, 49.0, 51.0, 45.0, 44.0, 38.0, 41.0, 39.0, 31.0, 33.0, 37.0, 25.0, 21.0, 22.0, 14.0, 14.0, 11.0, 9.0, 9.0, 4.0, 2.0, 2.0, 6.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.171144485473633, -27.296199798583984, -26.421255111694336, -25.546310424804688, -24.671363830566406, -23.796419143676758, -22.92147445678711, -22.04652976989746, -21.171585083007812, -20.296640396118164, -19.421695709228516, -18.546749114990234, -17.671804428100586, -16.796859741210938, -15.921915054321289, -15.04697036743164, -14.172024726867676, -13.297080039978027, -12.422134399414062, -11.547189712524414, -10.672245025634766, -9.797300338745117, -8.922354698181152, -8.047410011291504, -7.172464847564697, -6.297519683837891, -5.422574996948242, -4.5476298332214355, -3.672684907913208, -2.7977399826049805, -1.9227948188781738, -1.0478501319885254, -0.17290496826171875, 0.7020400166511536, 1.5769850015640259, 2.451930046081543, 3.3268749713897705, 4.201819896697998, 5.076765060424805, 5.951709747314453, 6.82665491104126, 7.701600074768066, 8.576544761657715, 9.45149040222168, 10.326435089111328, 11.201379776000977, 12.076324462890625, 12.951269149780273, 13.826214790344238, 14.701159477233887, 15.576105117797852, 16.4510498046875, 17.32599449157715, 18.200939178466797, 19.075885772705078, 19.950828552246094, 20.825775146484375, 21.700719833374023, 22.575664520263672, 23.450611114501953, 24.3255558013916, 25.20050048828125, 26.0754451751709, 26.950389862060547, 27.825334548950195]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 6.0, 3.0, 5.0, 6.0, 5.0, 4.0, 9.0, 4.0, 10.0, 12.0, 20.0, 29.0, 19.0, 24.0, 38.0, 31.0, 35.0, 37.0, 28.0, 41.0, 43.0, 39.0, 31.0, 47.0, 30.0, 48.0, 40.0, 42.0, 38.0, 37.0, 38.0, 28.0, 30.0, 24.0, 28.0, 15.0, 14.0, 14.0, 20.0, 3.0, 8.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.982175827026367, -26.99736976623535, -26.012563705444336, -25.02775764465332, -24.042951583862305, -23.05814552307129, -22.073341369628906, -21.08853530883789, -20.103729248046875, -19.11892318725586, -18.134117126464844, -17.149311065673828, -16.164505004882812, -15.179698944091797, -14.194893836975098, -13.210087776184082, -12.22528076171875, -11.240474700927734, -10.255668640136719, -9.270862579345703, -8.286056518554688, -7.30125093460083, -6.316445350646973, -5.331639289855957, -4.346833229064941, -3.362027168273926, -2.3772213459014893, -1.3924155235290527, -0.4076094627380371, 0.5771965980529785, 1.562002182006836, 2.5468082427978516, 3.5316162109375, 4.516422271728516, 5.501228332519531, 6.486033916473389, 7.470839977264404, 8.455646514892578, 9.440451622009277, 10.425257682800293, 11.410063743591309, 12.394869804382324, 13.37967586517334, 14.364480972290039, 15.349287033081055, 16.33409309387207, 17.318899154663086, 18.3037052154541, 19.288511276245117, 20.273317337036133, 21.25812339782715, 22.242929458618164, 23.22773551940918, 24.212541580200195, 25.197345733642578, 26.182151794433594, 27.16695785522461, 28.151763916015625, 29.13656997680664, 30.121376037597656, 31.106182098388672, 32.09098815917969, 33.0757942199707, 34.06060028076172, 35.045406341552734]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 10.0, 15.0, 23.0, 31.0, 50.0, 100.0, 141.0, 257.0, 419.0, 685.0, 1056.0, 1786.0, 3033.0, 4950.0, 8032.0, 13047.0, 20710.0, 32809.0, 50343.0, 73863.0, 103498.0, 131335.0, 144496.0, 133459.0, 106505.0, 76105.0, 51664.0, 33642.0, 21790.0, 13594.0, 8291.0, 5017.0, 2998.0, 1923.0, 1137.0, 663.0, 425.0, 208.0, 167.0, 115.0, 61.0, 48.0, 24.0, 14.0, 9.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.64453125, -6.4403076171875, -6.236083984375, -6.0318603515625, -5.82763671875, -5.6234130859375, -5.419189453125, -5.2149658203125, -5.0107421875, -4.8065185546875, -4.602294921875, -4.3980712890625, -4.19384765625, -3.9896240234375, -3.785400390625, -3.5811767578125, -3.376953125, -3.1727294921875, -2.968505859375, -2.7642822265625, -2.56005859375, -2.3558349609375, -2.151611328125, -1.9473876953125, -1.7431640625, -1.5389404296875, -1.334716796875, -1.1304931640625, -0.92626953125, -0.7220458984375, -0.517822265625, -0.3135986328125, -0.109375, 0.0948486328125, 0.299072265625, 0.5032958984375, 0.70751953125, 0.9117431640625, 1.115966796875, 1.3201904296875, 1.5244140625, 1.7286376953125, 1.932861328125, 2.1370849609375, 2.34130859375, 2.5455322265625, 2.749755859375, 2.9539794921875, 3.158203125, 3.3624267578125, 3.566650390625, 3.7708740234375, 3.97509765625, 4.1793212890625, 4.383544921875, 4.5877685546875, 4.7919921875, 4.9962158203125, 5.200439453125, 5.4046630859375, 5.60888671875, 5.8131103515625, 6.017333984375, 6.2215576171875, 6.42578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 7.0, 2.0, 7.0, 7.0, 9.0, 7.0, 11.0, 20.0, 21.0, 32.0, 32.0, 20.0, 25.0, 37.0, 39.0, 43.0, 35.0, 52.0, 44.0, 32.0, 33.0, 44.0, 38.0, 46.0, 45.0, 42.0, 30.0, 27.0, 22.0, 34.0, 34.0, 23.0, 19.0, 17.0, 9.0, 13.0, 12.0, 6.0, 5.0, 4.0, 7.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.234375, -29.210205078125, -28.18603515625, -27.161865234375, -26.1376953125, -25.113525390625, -24.08935546875, -23.065185546875, -22.041015625, -21.016845703125, -19.99267578125, -18.968505859375, -17.9443359375, -16.920166015625, -15.89599609375, -14.871826171875, -13.84765625, -12.823486328125, -11.79931640625, -10.775146484375, -9.7509765625, -8.726806640625, -7.70263671875, -6.678466796875, -5.654296875, -4.630126953125, -3.60595703125, -2.581787109375, -1.5576171875, -0.533447265625, 0.49072265625, 1.514892578125, 2.5390625, 3.563232421875, 4.58740234375, 5.611572265625, 6.6357421875, 7.659912109375, 8.68408203125, 9.708251953125, 10.732421875, 11.756591796875, 12.78076171875, 13.804931640625, 14.8291015625, 15.853271484375, 16.87744140625, 17.901611328125, 18.92578125, 19.949951171875, 20.97412109375, 21.998291015625, 23.0224609375, 24.046630859375, 25.07080078125, 26.094970703125, 27.119140625, 28.143310546875, 29.16748046875, 30.191650390625, 31.2158203125, 32.239990234375, 33.26416015625, 34.288330078125, 35.3125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 9.0, 11.0, 5.0, 16.0, 31.0, 43.0, 54.0, 79.0, 139.0, 189.0, 273.0, 471.0, 715.0, 1096.0, 1832.0, 3093.0, 5192.0, 8753.0, 14878.0, 25395.0, 42569.0, 68514.0, 103382.0, 141369.0, 161548.0, 150101.0, 116048.0, 79225.0, 49938.0, 29729.0, 17841.0, 10438.0, 6115.0, 3566.0, 2226.0, 1361.0, 854.0, 505.0, 361.0, 220.0, 133.0, 73.0, 51.0, 39.0, 27.0, 23.0, 14.0, 7.0, 4.0, 4.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.89453125, -5.71405029296875, -5.5335693359375, -5.35308837890625, -5.172607421875, -4.99212646484375, -4.8116455078125, -4.63116455078125, -4.45068359375, -4.27020263671875, -4.0897216796875, -3.90924072265625, -3.728759765625, -3.54827880859375, -3.3677978515625, -3.18731689453125, -3.0068359375, -2.82635498046875, -2.6458740234375, -2.46539306640625, -2.284912109375, -2.10443115234375, -1.9239501953125, -1.74346923828125, -1.56298828125, -1.38250732421875, -1.2020263671875, -1.02154541015625, -0.841064453125, -0.66058349609375, -0.4801025390625, -0.29962158203125, -0.119140625, 0.06134033203125, 0.2418212890625, 0.42230224609375, 0.602783203125, 0.78326416015625, 0.9637451171875, 1.14422607421875, 1.32470703125, 1.50518798828125, 1.6856689453125, 1.86614990234375, 2.046630859375, 2.22711181640625, 2.4075927734375, 2.58807373046875, 2.7685546875, 2.94903564453125, 3.1295166015625, 3.30999755859375, 3.490478515625, 3.67095947265625, 3.8514404296875, 4.03192138671875, 4.21240234375, 4.39288330078125, 4.5733642578125, 4.75384521484375, 4.934326171875, 5.11480712890625, 5.2952880859375, 5.47576904296875, 5.65625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 8.0, 2.0, 7.0, 4.0, 11.0, 9.0, 13.0, 15.0, 20.0, 14.0, 21.0, 26.0, 19.0, 18.0, 37.0, 27.0, 38.0, 33.0, 37.0, 32.0, 35.0, 38.0, 40.0, 37.0, 39.0, 44.0, 40.0, 41.0, 28.0, 24.0, 20.0, 19.0, 17.0, 20.0, 28.0, 24.0, 17.0, 5.0, 15.0, 10.0, 10.0, 11.0, 9.0, 8.0, 8.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0], "bins": [-17.953125, -17.397216796875, -16.84130859375, -16.285400390625, -15.7294921875, -15.173583984375, -14.61767578125, -14.061767578125, -13.505859375, -12.949951171875, -12.39404296875, -11.838134765625, -11.2822265625, -10.726318359375, -10.17041015625, -9.614501953125, -9.05859375, -8.502685546875, -7.94677734375, -7.390869140625, -6.8349609375, -6.279052734375, -5.72314453125, -5.167236328125, -4.611328125, -4.055419921875, -3.49951171875, -2.943603515625, -2.3876953125, -1.831787109375, -1.27587890625, -0.719970703125, -0.1640625, 0.391845703125, 0.94775390625, 1.503662109375, 2.0595703125, 2.615478515625, 3.17138671875, 3.727294921875, 4.283203125, 4.839111328125, 5.39501953125, 5.950927734375, 6.5068359375, 7.062744140625, 7.61865234375, 8.174560546875, 8.73046875, 9.286376953125, 9.84228515625, 10.398193359375, 10.9541015625, 11.510009765625, 12.06591796875, 12.621826171875, 13.177734375, 13.733642578125, 14.28955078125, 14.845458984375, 15.4013671875, 15.957275390625, 16.51318359375, 17.069091796875, 17.625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 9.0, 7.0, 16.0, 17.0, 33.0, 46.0, 48.0, 75.0, 122.0, 194.0, 248.0, 407.0, 557.0, 865.0, 1348.0, 2234.0, 3691.0, 6489.0, 11989.0, 22929.0, 47198.0, 98076.0, 197532.0, 272727.0, 191998.0, 94373.0, 45455.0, 22101.0, 11771.0, 6305.0, 3579.0, 2150.0, 1344.0, 878.0, 532.0, 379.0, 254.0, 172.0, 122.0, 87.0, 46.0, 41.0, 34.0, 24.0, 13.0, 14.0, 7.0, 6.0, 9.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.6533203125, -1.600799560546875, -1.54827880859375, -1.495758056640625, -1.4432373046875, -1.390716552734375, -1.33819580078125, -1.285675048828125, -1.233154296875, -1.180633544921875, -1.12811279296875, -1.075592041015625, -1.0230712890625, -0.970550537109375, -0.91802978515625, -0.865509033203125, -0.81298828125, -0.760467529296875, -0.70794677734375, -0.655426025390625, -0.6029052734375, -0.550384521484375, -0.49786376953125, -0.445343017578125, -0.392822265625, -0.340301513671875, -0.28778076171875, -0.235260009765625, -0.1827392578125, -0.130218505859375, -0.07769775390625, -0.025177001953125, 0.02734375, 0.079864501953125, 0.13238525390625, 0.184906005859375, 0.2374267578125, 0.289947509765625, 0.34246826171875, 0.394989013671875, 0.447509765625, 0.500030517578125, 0.55255126953125, 0.605072021484375, 0.6575927734375, 0.710113525390625, 0.76263427734375, 0.815155029296875, 0.86767578125, 0.920196533203125, 0.97271728515625, 1.025238037109375, 1.0777587890625, 1.130279541015625, 1.18280029296875, 1.235321044921875, 1.287841796875, 1.340362548828125, 1.39288330078125, 1.445404052734375, 1.4979248046875, 1.550445556640625, 1.60296630859375, 1.655487060546875, 1.7080078125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 7.0, 4.0, 11.0, 16.0, 23.0, 22.0, 32.0, 48.0, 60.0, 74.0, 63.0, 71.0, 81.0, 97.0, 76.0, 73.0, 67.0, 39.0, 31.0, 19.0, 24.0, 17.0, 10.0, 10.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0003542900085449219, -0.0003448314964771271, -0.0003353729844093323, -0.0003259144723415375, -0.0003164559602737427, -0.0003069974482059479, -0.0002975389361381531, -0.0002880804240703583, -0.0002786219120025635, -0.0002691633999347687, -0.0002597048878669739, -0.0002502463757991791, -0.00024078786373138428, -0.00023132935166358948, -0.00022187083959579468, -0.00021241232752799988, -0.00020295381546020508, -0.00019349530339241028, -0.00018403679132461548, -0.00017457827925682068, -0.00016511976718902588, -0.00015566125512123108, -0.00014620274305343628, -0.00013674423098564148, -0.00012728571891784668, -0.00011782720685005188, -0.00010836869478225708, -9.891018271446228e-05, -8.945167064666748e-05, -7.999315857887268e-05, -7.053464651107788e-05, -6.107613444328308e-05, -5.161762237548828e-05, -4.215911030769348e-05, -3.270059823989868e-05, -2.3242086172103882e-05, -1.3783574104309082e-05, -4.325062036514282e-06, 5.133450031280518e-06, 1.4591962099075317e-05, 2.4050474166870117e-05, 3.350898623466492e-05, 4.296749830245972e-05, 5.2426010370254517e-05, 6.188452243804932e-05, 7.134303450584412e-05, 8.080154657363892e-05, 9.026005864143372e-05, 9.971857070922852e-05, 0.00010917708277702332, 0.00011863559484481812, 0.00012809410691261292, 0.00013755261898040771, 0.00014701113104820251, 0.00015646964311599731, 0.00016592815518379211, 0.00017538666725158691, 0.00018484517931938171, 0.00019430369138717651, 0.0002037622034549713, 0.0002132207155227661, 0.0002226792275905609, 0.0002321377396583557, 0.0002415962517261505, 0.0002510547637939453]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 8.0, 12.0, 17.0, 22.0, 39.0, 59.0, 80.0, 141.0, 198.0, 300.0, 473.0, 691.0, 1090.0, 1702.0, 2720.0, 4225.0, 7127.0, 11796.0, 19962.0, 34124.0, 57665.0, 93364.0, 140401.0, 178348.0, 168999.0, 124219.0, 80708.0, 48532.0, 28751.0, 16768.0, 9991.0, 5867.0, 3699.0, 2315.0, 1433.0, 932.0, 600.0, 388.0, 258.0, 177.0, 115.0, 82.0, 48.0, 39.0, 26.0, 17.0, 5.0, 9.0, 6.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.259765625, -2.18878173828125, -2.1177978515625, -2.04681396484375, -1.975830078125, -1.90484619140625, -1.8338623046875, -1.76287841796875, -1.69189453125, -1.62091064453125, -1.5499267578125, -1.47894287109375, -1.407958984375, -1.33697509765625, -1.2659912109375, -1.19500732421875, -1.1240234375, -1.05303955078125, -0.9820556640625, -0.91107177734375, -0.840087890625, -0.76910400390625, -0.6981201171875, -0.62713623046875, -0.55615234375, -0.48516845703125, -0.4141845703125, -0.34320068359375, -0.272216796875, -0.20123291015625, -0.1302490234375, -0.05926513671875, 0.01171875, 0.08270263671875, 0.1536865234375, 0.22467041015625, 0.295654296875, 0.36663818359375, 0.4376220703125, 0.50860595703125, 0.57958984375, 0.65057373046875, 0.7215576171875, 0.79254150390625, 0.863525390625, 0.93450927734375, 1.0054931640625, 1.07647705078125, 1.1474609375, 1.21844482421875, 1.2894287109375, 1.36041259765625, 1.431396484375, 1.50238037109375, 1.5733642578125, 1.64434814453125, 1.71533203125, 1.78631591796875, 1.8572998046875, 1.92828369140625, 1.999267578125, 2.07025146484375, 2.1412353515625, 2.21221923828125, 2.283203125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 13.0, 16.0, 22.0, 17.0, 16.0, 17.0, 34.0, 35.0, 39.0, 47.0, 53.0, 68.0, 67.0, 76.0, 47.0, 60.0, 47.0, 43.0, 43.0, 44.0, 24.0, 30.0, 21.0, 22.0, 20.0, 20.0, 8.0, 8.0, 3.0, 5.0, 6.0, 2.0, 6.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80419921875, -0.7785415649414062, -0.7528839111328125, -0.7272262573242188, -0.701568603515625, -0.6759109497070312, -0.6502532958984375, -0.6245956420898438, -0.59893798828125, -0.5732803344726562, -0.5476226806640625, -0.5219650268554688, -0.496307373046875, -0.47064971923828125, -0.4449920654296875, -0.41933441162109375, -0.3936767578125, -0.36801910400390625, -0.3423614501953125, -0.31670379638671875, -0.291046142578125, -0.26538848876953125, -0.2397308349609375, -0.21407318115234375, -0.18841552734375, -0.16275787353515625, -0.1371002197265625, -0.11144256591796875, -0.085784912109375, -0.06012725830078125, -0.0344696044921875, -0.00881195068359375, 0.016845703125, 0.04250335693359375, 0.0681610107421875, 0.09381866455078125, 0.119476318359375, 0.14513397216796875, 0.1707916259765625, 0.19644927978515625, 0.22210693359375, 0.24776458740234375, 0.2734222412109375, 0.29907989501953125, 0.324737548828125, 0.35039520263671875, 0.3760528564453125, 0.40171051025390625, 0.4273681640625, 0.45302581787109375, 0.4786834716796875, 0.5043411254882812, 0.529998779296875, 0.5556564331054688, 0.5813140869140625, 0.6069717407226562, 0.63262939453125, 0.6582870483398438, 0.6839447021484375, 0.7096023559570312, 0.735260009765625, 0.7609176635742188, 0.7865753173828125, 0.8122329711914062, 0.837890625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 10.0, 6.0, 7.0, 14.0, 11.0, 16.0, 23.0, 21.0, 26.0, 33.0, 34.0, 22.0, 41.0, 46.0, 34.0, 59.0, 50.0, 52.0, 54.0, 38.0, 48.0, 44.0, 35.0, 45.0, 27.0, 35.0, 27.0, 24.0, 21.0, 23.0, 16.0, 12.0, 6.0, 11.0, 11.0, 5.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.702054977416992, -26.835445404052734, -25.96883773803711, -25.10222816467285, -24.235618591308594, -23.36901092529297, -22.50240135192871, -21.635791778564453, -20.769184112548828, -19.90257453918457, -19.035966873168945, -18.169357299804688, -17.30274772644043, -16.436138153076172, -15.569530487060547, -14.702920913696289, -13.836311340332031, -12.96970272064209, -12.103093147277832, -11.23648452758789, -10.369874954223633, -9.503266334533691, -8.63665771484375, -7.77004861831665, -6.903439521789551, -6.036830425262451, -5.170221328735352, -4.30361270904541, -3.4370036125183105, -2.570394515991211, -1.7037858963012695, -0.8371767997741699, 0.0294342041015625, 0.8960431814193726, 1.7626521587371826, 2.629261016845703, 3.4958701133728027, 4.362479209899902, 5.229087829589844, 6.095696926116943, 6.962306022644043, 7.828915119171143, 8.695524215698242, 9.562132835388184, 10.428741455078125, 11.295351028442383, 12.161959648132324, 13.028568267822266, 13.895177841186523, 14.761786460876465, 15.628396034240723, 16.495004653930664, 17.361614227294922, 18.228221893310547, 19.094831466674805, 19.961441040039062, 20.828048706054688, 21.694658279418945, 22.56126594543457, 23.427875518798828, 24.294485092163086, 25.161094665527344, 26.02770233154297, 26.894311904907227, 27.760921478271484]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 7.0, 2.0, 5.0, 6.0, 6.0, 4.0, 8.0, 5.0, 12.0, 13.0, 17.0, 29.0, 24.0, 22.0, 35.0, 30.0, 38.0, 35.0, 29.0, 42.0, 44.0, 41.0, 29.0, 44.0, 26.0, 53.0, 37.0, 41.0, 41.0, 34.0, 41.0, 25.0, 34.0, 21.0, 27.0, 14.0, 16.0, 14.0, 20.0, 5.0, 7.0, 5.0, 7.0, 8.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.886810302734375, -26.911548614501953, -25.93628692626953, -24.961027145385742, -23.98576545715332, -23.0105037689209, -22.035242080688477, -21.059982299804688, -20.084720611572266, -19.109458923339844, -18.134197235107422, -17.158937454223633, -16.18367576599121, -15.208414077758789, -14.233152389526367, -13.257891654968262, -12.28262996673584, -11.307368278503418, -10.332107543945312, -9.35684585571289, -8.381585121154785, -7.406323432922363, -6.4310622215271, -5.455801010131836, -4.480539798736572, -3.5052785873413086, -2.530017375946045, -1.5547559261322021, -0.5794947147369385, 0.3957667350769043, 1.371027946472168, 2.3462891578674316, 3.3215503692626953, 4.296811580657959, 5.272072792053223, 6.2473344802856445, 7.22259521484375, 8.197856903076172, 9.173118591308594, 10.1483793258667, 11.123640060424805, 12.098901748657227, 13.074162483215332, 14.049424171447754, 15.02468490600586, 15.999946594238281, 16.975208282470703, 17.950469970703125, 18.925731658935547, 19.90099334716797, 20.87625503540039, 21.85151481628418, 22.8267765045166, 23.802038192749023, 24.777299880981445, 25.752559661865234, 26.727821350097656, 27.703083038330078, 28.6783447265625, 29.65360450744629, 30.62886619567871, 31.604127883911133, 32.57938766479492, 33.554649353027344, 34.529911041259766]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 1.0, 5.0, 12.0, 18.0, 20.0, 39.0, 56.0, 116.0, 202.0, 365.0, 498.0, 835.0, 1360.0, 2183.0, 3644.0, 5735.0, 8549.0, 13061.0, 19754.0, 28568.0, 39736.0, 53563.0, 67967.0, 82391.0, 93808.0, 100386.0, 100984.0, 93909.0, 82688.0, 68557.0, 53299.0, 40306.0, 28945.0, 19851.0, 13465.0, 8687.0, 5581.0, 3654.0, 2219.0, 1366.0, 823.0, 515.0, 312.0, 213.0, 110.0, 84.0, 45.0, 30.0, 21.0, 7.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-19.59375, -18.981689453125, -18.36962890625, -17.757568359375, -17.1455078125, -16.533447265625, -15.92138671875, -15.309326171875, -14.697265625, -14.085205078125, -13.47314453125, -12.861083984375, -12.2490234375, -11.636962890625, -11.02490234375, -10.412841796875, -9.80078125, -9.188720703125, -8.57666015625, -7.964599609375, -7.3525390625, -6.740478515625, -6.12841796875, -5.516357421875, -4.904296875, -4.292236328125, -3.68017578125, -3.068115234375, -2.4560546875, -1.843994140625, -1.23193359375, -0.619873046875, -0.0078125, 0.604248046875, 1.21630859375, 1.828369140625, 2.4404296875, 3.052490234375, 3.66455078125, 4.276611328125, 4.888671875, 5.500732421875, 6.11279296875, 6.724853515625, 7.3369140625, 7.948974609375, 8.56103515625, 9.173095703125, 9.78515625, 10.397216796875, 11.00927734375, 11.621337890625, 12.2333984375, 12.845458984375, 13.45751953125, 14.069580078125, 14.681640625, 15.293701171875, 15.90576171875, 16.517822265625, 17.1298828125, 17.741943359375, 18.35400390625, 18.966064453125, 19.578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 3.0, 7.0, 1.0, 4.0, 9.0, 9.0, 8.0, 13.0, 13.0, 18.0, 16.0, 16.0, 27.0, 25.0, 28.0, 33.0, 38.0, 16.0, 29.0, 43.0, 33.0, 30.0, 32.0, 30.0, 30.0, 47.0, 42.0, 43.0, 26.0, 43.0, 32.0, 37.0, 35.0, 26.0, 18.0, 13.0, 20.0, 18.0, 19.0, 12.0, 10.0, 13.0, 8.0, 8.0, 4.0, 8.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-27.171875, -26.3017578125, -25.431640625, -24.5615234375, -23.69140625, -22.8212890625, -21.951171875, -21.0810546875, -20.2109375, -19.3408203125, -18.470703125, -17.6005859375, -16.73046875, -15.8603515625, -14.990234375, -14.1201171875, -13.25, -12.3798828125, -11.509765625, -10.6396484375, -9.76953125, -8.8994140625, -8.029296875, -7.1591796875, -6.2890625, -5.4189453125, -4.548828125, -3.6787109375, -2.80859375, -1.9384765625, -1.068359375, -0.1982421875, 0.671875, 1.5419921875, 2.412109375, 3.2822265625, 4.15234375, 5.0224609375, 5.892578125, 6.7626953125, 7.6328125, 8.5029296875, 9.373046875, 10.2431640625, 11.11328125, 11.9833984375, 12.853515625, 13.7236328125, 14.59375, 15.4638671875, 16.333984375, 17.2041015625, 18.07421875, 18.9443359375, 19.814453125, 20.6845703125, 21.5546875, 22.4248046875, 23.294921875, 24.1650390625, 25.03515625, 25.9052734375, 26.775390625, 27.6455078125, 28.515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 17.0, 20.0, 28.0, 57.0, 112.0, 133.0, 234.0, 385.0, 648.0, 1006.0, 1720.0, 2616.0, 4405.0, 6953.0, 10744.0, 16906.0, 24922.0, 36157.0, 50206.0, 66678.0, 84162.0, 97943.0, 106658.0, 107155.0, 100687.0, 86197.0, 71146.0, 54082.0, 39121.0, 27051.0, 18121.0, 11937.0, 7798.0, 4736.0, 3101.0, 1822.0, 1142.0, 684.0, 416.0, 250.0, 147.0, 111.0, 49.0, 37.0, 24.0, 13.0, 10.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.703125, -20.03759765625, -19.3720703125, -18.70654296875, -18.041015625, -17.37548828125, -16.7099609375, -16.04443359375, -15.37890625, -14.71337890625, -14.0478515625, -13.38232421875, -12.716796875, -12.05126953125, -11.3857421875, -10.72021484375, -10.0546875, -9.38916015625, -8.7236328125, -8.05810546875, -7.392578125, -6.72705078125, -6.0615234375, -5.39599609375, -4.73046875, -4.06494140625, -3.3994140625, -2.73388671875, -2.068359375, -1.40283203125, -0.7373046875, -0.07177734375, 0.59375, 1.25927734375, 1.9248046875, 2.59033203125, 3.255859375, 3.92138671875, 4.5869140625, 5.25244140625, 5.91796875, 6.58349609375, 7.2490234375, 7.91455078125, 8.580078125, 9.24560546875, 9.9111328125, 10.57666015625, 11.2421875, 11.90771484375, 12.5732421875, 13.23876953125, 13.904296875, 14.56982421875, 15.2353515625, 15.90087890625, 16.56640625, 17.23193359375, 17.8974609375, 18.56298828125, 19.228515625, 19.89404296875, 20.5595703125, 21.22509765625, 21.890625]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 10.0, 14.0, 7.0, 10.0, 17.0, 20.0, 15.0, 26.0, 29.0, 30.0, 27.0, 34.0, 40.0, 30.0, 46.0, 48.0, 32.0, 41.0, 55.0, 32.0, 40.0, 50.0, 47.0, 43.0, 37.0, 34.0, 31.0, 24.0, 23.0, 15.0, 12.0, 15.0, 13.0, 13.0, 3.0, 10.0, 6.0, 3.0, 1.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.328125, -21.683837890625, -21.03955078125, -20.395263671875, -19.7509765625, -19.106689453125, -18.46240234375, -17.818115234375, -17.173828125, -16.529541015625, -15.88525390625, -15.240966796875, -14.5966796875, -13.952392578125, -13.30810546875, -12.663818359375, -12.01953125, -11.375244140625, -10.73095703125, -10.086669921875, -9.4423828125, -8.798095703125, -8.15380859375, -7.509521484375, -6.865234375, -6.220947265625, -5.57666015625, -4.932373046875, -4.2880859375, -3.643798828125, -2.99951171875, -2.355224609375, -1.7109375, -1.066650390625, -0.42236328125, 0.221923828125, 0.8662109375, 1.510498046875, 2.15478515625, 2.799072265625, 3.443359375, 4.087646484375, 4.73193359375, 5.376220703125, 6.0205078125, 6.664794921875, 7.30908203125, 7.953369140625, 8.59765625, 9.241943359375, 9.88623046875, 10.530517578125, 11.1748046875, 11.819091796875, 12.46337890625, 13.107666015625, 13.751953125, 14.396240234375, 15.04052734375, 15.684814453125, 16.3291015625, 16.973388671875, 17.61767578125, 18.261962890625, 18.90625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 8.0, 7.0, 13.0, 23.0, 25.0, 31.0, 55.0, 81.0, 136.0, 164.0, 317.0, 474.0, 716.0, 1185.0, 1847.0, 2857.0, 4480.0, 7084.0, 10924.0, 16577.0, 25422.0, 37554.0, 53431.0, 72515.0, 92741.0, 108858.0, 116983.0, 113545.0, 100807.0, 82325.0, 62444.0, 45159.0, 31016.0, 20891.0, 13657.0, 8755.0, 5687.0, 3480.0, 2325.0, 1422.0, 868.0, 605.0, 373.0, 248.0, 157.0, 98.0, 55.0, 38.0, 31.0, 30.0, 12.0, 15.0, 8.0, 6.0, 4.0, 0.0, 2.0], "bins": [-8.75, -8.49072265625, -8.2314453125, -7.97216796875, -7.712890625, -7.45361328125, -7.1943359375, -6.93505859375, -6.67578125, -6.41650390625, -6.1572265625, -5.89794921875, -5.638671875, -5.37939453125, -5.1201171875, -4.86083984375, -4.6015625, -4.34228515625, -4.0830078125, -3.82373046875, -3.564453125, -3.30517578125, -3.0458984375, -2.78662109375, -2.52734375, -2.26806640625, -2.0087890625, -1.74951171875, -1.490234375, -1.23095703125, -0.9716796875, -0.71240234375, -0.453125, -0.19384765625, 0.0654296875, 0.32470703125, 0.583984375, 0.84326171875, 1.1025390625, 1.36181640625, 1.62109375, 1.88037109375, 2.1396484375, 2.39892578125, 2.658203125, 2.91748046875, 3.1767578125, 3.43603515625, 3.6953125, 3.95458984375, 4.2138671875, 4.47314453125, 4.732421875, 4.99169921875, 5.2509765625, 5.51025390625, 5.76953125, 6.02880859375, 6.2880859375, 6.54736328125, 6.806640625, 7.06591796875, 7.3251953125, 7.58447265625, 7.84375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 7.0, 13.0, 18.0, 9.0, 22.0, 31.0, 26.0, 26.0, 34.0, 35.0, 48.0, 39.0, 46.0, 43.0, 68.0, 68.0, 45.0, 56.0, 41.0, 35.0, 51.0, 34.0, 38.0, 38.0, 27.0, 23.0, 17.0, 15.0, 6.0, 10.0, 11.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011043548583984375, -0.0010685175657272339, -0.0010326802730560303, -0.0009968429803848267, -0.000961005687713623, -0.0009251683950424194, -0.0008893311023712158, -0.0008534938097000122, -0.0008176565170288086, -0.000781819224357605, -0.0007459819316864014, -0.0007101446390151978, -0.0006743073463439941, -0.0006384700536727905, -0.0006026327610015869, -0.0005667954683303833, -0.0005309581756591797, -0.0004951208829879761, -0.00045928359031677246, -0.00042344629764556885, -0.00038760900497436523, -0.0003517717123031616, -0.000315934419631958, -0.0002800971269607544, -0.0002442598342895508, -0.00020842254161834717, -0.00017258524894714355, -0.00013674795627593994, -0.00010091066360473633, -6.507337093353271e-05, -2.92360782623291e-05, 6.601214408874512e-06, 4.2438507080078125e-05, 7.827579975128174e-05, 0.00011411309242248535, 0.00014995038509368896, 0.00018578767776489258, 0.0002216249704360962, 0.0002574622631072998, 0.0002932995557785034, 0.00032913684844970703, 0.00036497414112091064, 0.00040081143379211426, 0.00043664872646331787, 0.0004724860191345215, 0.0005083233118057251, 0.0005441606044769287, 0.0005799978971481323, 0.0006158351898193359, 0.0006516724824905396, 0.0006875097751617432, 0.0007233470678329468, 0.0007591843605041504, 0.000795021653175354, 0.0008308589458465576, 0.0008666962385177612, 0.0009025335311889648, 0.0009383708238601685, 0.0009742081165313721, 0.0010100454092025757, 0.0010458827018737793, 0.001081719994544983, 0.0011175572872161865, 0.0011533945798873901, 0.0011892318725585938]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 8.0, 8.0, 11.0, 36.0, 42.0, 73.0, 116.0, 169.0, 256.0, 422.0, 688.0, 1123.0, 1719.0, 2927.0, 4481.0, 7265.0, 11526.0, 18202.0, 27438.0, 41024.0, 58157.0, 77677.0, 97068.0, 112483.0, 118529.0, 112901.0, 98422.0, 78738.0, 58384.0, 41475.0, 27866.0, 18245.0, 11597.0, 7382.0, 4650.0, 2816.0, 1734.0, 1115.0, 680.0, 410.0, 252.0, 154.0, 86.0, 82.0, 57.0, 24.0, 17.0, 10.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5703125, -8.29833984375, -8.0263671875, -7.75439453125, -7.482421875, -7.21044921875, -6.9384765625, -6.66650390625, -6.39453125, -6.12255859375, -5.8505859375, -5.57861328125, -5.306640625, -5.03466796875, -4.7626953125, -4.49072265625, -4.21875, -3.94677734375, -3.6748046875, -3.40283203125, -3.130859375, -2.85888671875, -2.5869140625, -2.31494140625, -2.04296875, -1.77099609375, -1.4990234375, -1.22705078125, -0.955078125, -0.68310546875, -0.4111328125, -0.13916015625, 0.1328125, 0.40478515625, 0.6767578125, 0.94873046875, 1.220703125, 1.49267578125, 1.7646484375, 2.03662109375, 2.30859375, 2.58056640625, 2.8525390625, 3.12451171875, 3.396484375, 3.66845703125, 3.9404296875, 4.21240234375, 4.484375, 4.75634765625, 5.0283203125, 5.30029296875, 5.572265625, 5.84423828125, 6.1162109375, 6.38818359375, 6.66015625, 6.93212890625, 7.2041015625, 7.47607421875, 7.748046875, 8.02001953125, 8.2919921875, 8.56396484375, 8.8359375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 10.0, 5.0, 13.0, 11.0, 13.0, 16.0, 21.0, 22.0, 22.0, 37.0, 23.0, 31.0, 44.0, 42.0, 43.0, 36.0, 53.0, 50.0, 48.0, 39.0, 32.0, 36.0, 43.0, 40.0, 38.0, 29.0, 26.0, 23.0, 24.0, 24.0, 20.0, 17.0, 9.0, 9.0, 9.0, 7.0, 2.0, 9.0, 2.0, 5.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.583984375, -3.470733642578125, -3.35748291015625, -3.244232177734375, -3.1309814453125, -3.017730712890625, -2.90447998046875, -2.791229248046875, -2.677978515625, -2.564727783203125, -2.45147705078125, -2.338226318359375, -2.2249755859375, -2.111724853515625, -1.99847412109375, -1.885223388671875, -1.77197265625, -1.658721923828125, -1.54547119140625, -1.432220458984375, -1.3189697265625, -1.205718994140625, -1.09246826171875, -0.979217529296875, -0.865966796875, -0.752716064453125, -0.63946533203125, -0.526214599609375, -0.4129638671875, -0.299713134765625, -0.18646240234375, -0.073211669921875, 0.0400390625, 0.153289794921875, 0.26654052734375, 0.379791259765625, 0.4930419921875, 0.606292724609375, 0.71954345703125, 0.832794189453125, 0.946044921875, 1.059295654296875, 1.17254638671875, 1.285797119140625, 1.3990478515625, 1.512298583984375, 1.62554931640625, 1.738800048828125, 1.85205078125, 1.965301513671875, 2.07855224609375, 2.191802978515625, 2.3050537109375, 2.418304443359375, 2.53155517578125, 2.644805908203125, 2.758056640625, 2.871307373046875, 2.98455810546875, 3.097808837890625, 3.2110595703125, 3.324310302734375, 3.43756103515625, 3.550811767578125, 3.6640625]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 7.0, 10.0, 7.0, 9.0, 10.0, 10.0, 20.0, 20.0, 25.0, 19.0, 25.0, 34.0, 38.0, 43.0, 48.0, 43.0, 51.0, 41.0, 45.0, 44.0, 44.0, 49.0, 35.0, 44.0, 35.0, 41.0, 32.0, 28.0, 23.0, 20.0, 23.0, 11.0, 19.0, 9.0, 10.0, 5.0, 4.0, 4.0, 9.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.810029983520508, -23.951793670654297, -23.093557357788086, -22.235321044921875, -21.377086639404297, -20.518848419189453, -19.660614013671875, -18.802377700805664, -17.944141387939453, -17.085905075073242, -16.22766876220703, -15.369433403015137, -14.511197090148926, -13.652960777282715, -12.79472541809082, -11.93648910522461, -11.078252792358398, -10.220016479492188, -9.361780166625977, -8.503544807434082, -7.645308494567871, -6.78707218170166, -5.928836345672607, -5.070600509643555, -4.212364196777344, -3.354128122329712, -2.49589204788208, -1.6376559734344482, -0.7794198989868164, 0.07881641387939453, 0.9370522499084473, 1.7952880859375, 2.6535263061523438, 3.5117623805999756, 4.369998455047607, 5.22823429107666, 6.086470603942871, 6.944706916809082, 7.802942752838135, 8.661178588867188, 9.519414901733398, 10.37765121459961, 11.23588752746582, 12.094122886657715, 12.952359199523926, 13.810595512390137, 14.668830871582031, 15.527067184448242, 16.385303497314453, 17.243539810180664, 18.101776123046875, 18.960012435913086, 19.818248748779297, 20.676483154296875, 21.534719467163086, 22.392955780029297, 23.251192092895508, 24.10942840576172, 24.96766471862793, 25.82590103149414, 26.68413543701172, 27.542373657226562, 28.40060806274414, 29.25884437561035, 30.117080688476562]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 4.0, 7.0, 16.0, 17.0, 5.0, 19.0, 16.0, 24.0, 21.0, 28.0, 33.0, 24.0, 29.0, 44.0, 35.0, 41.0, 36.0, 29.0, 39.0, 47.0, 43.0, 38.0, 37.0, 38.0, 37.0, 29.0, 19.0, 37.0, 25.0, 29.0, 20.0, 13.0, 10.0, 15.0, 16.0, 12.0, 12.0, 9.0, 4.0, 5.0, 10.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.888347625732422, -26.984975814819336, -26.081605911254883, -25.178234100341797, -24.27486228942871, -23.371492385864258, -22.468120574951172, -21.56475067138672, -20.661378860473633, -19.758007049560547, -18.854637145996094, -17.951265335083008, -17.047893524169922, -16.14452362060547, -15.241151809692383, -14.337780952453613, -13.434409141540527, -12.531038284301758, -11.627666473388672, -10.724295616149902, -9.820924758911133, -8.917552947998047, -8.014182090759277, -7.110811233520508, -6.20743989944458, -5.304068565368652, -4.400697708129883, -3.497326374053955, -2.5939552783966064, -1.6905841827392578, -0.7872128486633301, 0.11615800857543945, 1.0195293426513672, 1.9229004383087158, 2.8262715339660645, 3.729642868041992, 4.633013725280762, 5.5363850593566895, 6.439756393432617, 7.343127250671387, 8.246498107910156, 9.149868965148926, 10.053240776062012, 10.956611633300781, 11.85998249053955, 12.76335334777832, 13.666725158691406, 14.570096015930176, 15.473467826843262, 16.37683868408203, 17.280210494995117, 18.183582305908203, 19.086952209472656, 19.990324020385742, 20.893695831298828, 21.79706573486328, 22.700437545776367, 23.603809356689453, 24.507179260253906, 25.410551071166992, 26.313922882080078, 27.21729278564453, 28.120664596557617, 29.024036407470703, 29.927406311035156]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 7.0, 20.0, 32.0, 54.0, 72.0, 121.0, 201.0, 357.0, 547.0, 878.0, 1337.0, 2272.0, 3656.0, 5823.0, 9149.0, 14528.0, 22490.0, 34386.0, 52492.0, 77360.0, 112236.0, 158606.0, 214549.0, 279051.0, 341796.0, 393279.0, 421152.0, 416456.0, 383355.0, 328479.0, 264362.0, 201730.0, 146527.0, 103070.0, 70949.0, 46723.0, 30895.0, 20226.0, 12914.0, 8255.0, 5010.0, 3330.0, 2073.0, 1310.0, 779.0, 512.0, 358.0, 200.0, 142.0, 71.0, 45.0, 24.0, 19.0, 11.0, 5.0, 9.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.612548828125, -16.03759765625, -15.462646484375, -14.8876953125, -14.312744140625, -13.73779296875, -13.162841796875, -12.587890625, -12.012939453125, -11.43798828125, -10.863037109375, -10.2880859375, -9.713134765625, -9.13818359375, -8.563232421875, -7.98828125, -7.413330078125, -6.83837890625, -6.263427734375, -5.6884765625, -5.113525390625, -4.53857421875, -3.963623046875, -3.388671875, -2.813720703125, -2.23876953125, -1.663818359375, -1.0888671875, -0.513916015625, 0.06103515625, 0.635986328125, 1.2109375, 1.785888671875, 2.36083984375, 2.935791015625, 3.5107421875, 4.085693359375, 4.66064453125, 5.235595703125, 5.810546875, 6.385498046875, 6.96044921875, 7.535400390625, 8.1103515625, 8.685302734375, 9.26025390625, 9.835205078125, 10.41015625, 10.985107421875, 11.56005859375, 12.135009765625, 12.7099609375, 13.284912109375, 13.85986328125, 14.434814453125, 15.009765625, 15.584716796875, 16.15966796875, 16.734619140625, 17.3095703125, 17.884521484375, 18.45947265625, 19.034423828125, 19.609375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 7.0, 4.0, 5.0, 10.0, 9.0, 15.0, 15.0, 17.0, 17.0, 21.0, 19.0, 26.0, 23.0, 29.0, 31.0, 31.0, 29.0, 34.0, 30.0, 37.0, 40.0, 44.0, 44.0, 42.0, 31.0, 33.0, 36.0, 27.0, 36.0, 32.0, 31.0, 20.0, 20.0, 17.0, 18.0, 19.0, 15.0, 13.0, 15.0, 11.0, 11.0, 4.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0], "bins": [-21.890625, -21.205322265625, -20.52001953125, -19.834716796875, -19.1494140625, -18.464111328125, -17.77880859375, -17.093505859375, -16.408203125, -15.722900390625, -15.03759765625, -14.352294921875, -13.6669921875, -12.981689453125, -12.29638671875, -11.611083984375, -10.92578125, -10.240478515625, -9.55517578125, -8.869873046875, -8.1845703125, -7.499267578125, -6.81396484375, -6.128662109375, -5.443359375, -4.758056640625, -4.07275390625, -3.387451171875, -2.7021484375, -2.016845703125, -1.33154296875, -0.646240234375, 0.0390625, 0.724365234375, 1.40966796875, 2.094970703125, 2.7802734375, 3.465576171875, 4.15087890625, 4.836181640625, 5.521484375, 6.206787109375, 6.89208984375, 7.577392578125, 8.2626953125, 8.947998046875, 9.63330078125, 10.318603515625, 11.00390625, 11.689208984375, 12.37451171875, 13.059814453125, 13.7451171875, 14.430419921875, 15.11572265625, 15.801025390625, 16.486328125, 17.171630859375, 17.85693359375, 18.542236328125, 19.2275390625, 19.912841796875, 20.59814453125, 21.283447265625, 21.96875]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 9.0, 12.0, 15.0, 39.0, 55.0, 101.0, 165.0, 303.0, 489.0, 809.0, 1327.0, 2097.0, 3286.0, 5207.0, 8100.0, 12949.0, 19799.0, 29899.0, 44850.0, 64113.0, 90052.0, 124112.0, 163653.0, 210765.0, 258291.0, 303436.0, 339643.0, 360820.0, 363407.0, 346622.0, 315549.0, 271981.0, 223857.0, 176463.0, 135536.0, 99293.0, 70999.0, 49826.0, 33528.0, 22647.0, 14771.0, 9393.0, 6062.0, 3772.0, 2379.0, 1493.0, 921.0, 590.0, 319.0, 211.0, 124.0, 64.0, 31.0, 28.0, 17.0, 9.0, 0.0, 4.0, 0.0, 2.0, 1.0], "bins": [-16.8125, -16.272705078125, -15.73291015625, -15.193115234375, -14.6533203125, -14.113525390625, -13.57373046875, -13.033935546875, -12.494140625, -11.954345703125, -11.41455078125, -10.874755859375, -10.3349609375, -9.795166015625, -9.25537109375, -8.715576171875, -8.17578125, -7.635986328125, -7.09619140625, -6.556396484375, -6.0166015625, -5.476806640625, -4.93701171875, -4.397216796875, -3.857421875, -3.317626953125, -2.77783203125, -2.238037109375, -1.6982421875, -1.158447265625, -0.61865234375, -0.078857421875, 0.4609375, 1.000732421875, 1.54052734375, 2.080322265625, 2.6201171875, 3.159912109375, 3.69970703125, 4.239501953125, 4.779296875, 5.319091796875, 5.85888671875, 6.398681640625, 6.9384765625, 7.478271484375, 8.01806640625, 8.557861328125, 9.09765625, 9.637451171875, 10.17724609375, 10.717041015625, 11.2568359375, 11.796630859375, 12.33642578125, 12.876220703125, 13.416015625, 13.955810546875, 14.49560546875, 15.035400390625, 15.5751953125, 16.114990234375, 16.65478515625, 17.194580078125, 17.734375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 6.0, 6.0, 8.0, 18.0, 20.0, 21.0, 21.0, 30.0, 37.0, 44.0, 46.0, 65.0, 86.0, 96.0, 102.0, 111.0, 123.0, 131.0, 173.0, 161.0, 156.0, 162.0, 189.0, 183.0, 196.0, 190.0, 170.0, 157.0, 161.0, 140.0, 148.0, 133.0, 112.0, 107.0, 93.0, 83.0, 65.0, 64.0, 53.0, 43.0, 30.0, 38.0, 27.0, 8.0, 13.0, 13.0, 11.0, 9.0, 5.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.5, -9.1822509765625, -8.864501953125, -8.5467529296875, -8.22900390625, -7.9112548828125, -7.593505859375, -7.2757568359375, -6.9580078125, -6.6402587890625, -6.322509765625, -6.0047607421875, -5.68701171875, -5.3692626953125, -5.051513671875, -4.7337646484375, -4.416015625, -4.0982666015625, -3.780517578125, -3.4627685546875, -3.14501953125, -2.8272705078125, -2.509521484375, -2.1917724609375, -1.8740234375, -1.5562744140625, -1.238525390625, -0.9207763671875, -0.60302734375, -0.2852783203125, 0.032470703125, 0.3502197265625, 0.66796875, 0.9857177734375, 1.303466796875, 1.6212158203125, 1.93896484375, 2.2567138671875, 2.574462890625, 2.8922119140625, 3.2099609375, 3.5277099609375, 3.845458984375, 4.1632080078125, 4.48095703125, 4.7987060546875, 5.116455078125, 5.4342041015625, 5.751953125, 6.0697021484375, 6.387451171875, 6.7052001953125, 7.02294921875, 7.3406982421875, 7.658447265625, 7.9761962890625, 8.2939453125, 8.6116943359375, 8.929443359375, 9.2471923828125, 9.56494140625, 9.8826904296875, 10.200439453125, 10.5181884765625, 10.8359375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 7.0, 4.0, 8.0, 12.0, 8.0, 10.0, 11.0, 16.0, 15.0, 17.0, 23.0, 27.0, 22.0, 31.0, 19.0, 29.0, 40.0, 43.0, 36.0, 41.0, 39.0, 40.0, 36.0, 46.0, 39.0, 44.0, 29.0, 31.0, 35.0, 34.0, 31.0, 22.0, 33.0, 21.0, 21.0, 20.0, 13.0, 7.0, 5.0, 9.0, 5.0, 2.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-24.885677337646484, -24.141450881958008, -23.39722442626953, -22.652997970581055, -21.908771514892578, -21.164546966552734, -20.420320510864258, -19.67609405517578, -18.931867599487305, -18.187641143798828, -17.44341468811035, -16.699188232421875, -15.954962730407715, -15.210736274719238, -14.466510772705078, -13.722284317016602, -12.978057861328125, -12.233831405639648, -11.489604949951172, -10.745379447937012, -10.001152992248535, -9.256926536560059, -8.512701034545898, -7.768474578857422, -7.024248123168945, -6.280021667480469, -5.53579568862915, -4.791569709777832, -4.0473432540893555, -3.303117036819458, -2.5588908195495605, -1.8146648406982422, -1.0704402923583984, -0.326214075088501, 0.4180121421813965, 1.162238359451294, 1.9064645767211914, 2.650690793991089, 3.3949170112609863, 4.139142990112305, 4.883369445800781, 5.627595901489258, 6.371821880340576, 7.1160478591918945, 7.860274314880371, 8.604500770568848, 9.348726272583008, 10.092952728271484, 10.837179183959961, 11.581405639648438, 12.325632095336914, 13.069857597351074, 13.81408405303955, 14.558310508728027, 15.302536010742188, 16.046762466430664, 16.79098892211914, 17.535215377807617, 18.279441833496094, 19.02366828918457, 19.767894744873047, 20.51211929321289, 21.256345748901367, 22.000572204589844, 22.74479866027832]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 4.0, 8.0, 10.0, 6.0, 12.0, 12.0, 17.0, 22.0, 18.0, 27.0, 24.0, 31.0, 40.0, 37.0, 41.0, 40.0, 45.0, 44.0, 38.0, 56.0, 39.0, 42.0, 37.0, 52.0, 35.0, 27.0, 36.0, 24.0, 29.0, 25.0, 13.0, 17.0, 20.0, 19.0, 11.0, 7.0, 6.0, 7.0, 8.0, 6.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.845184326171875, -28.89992332458496, -27.954662322998047, -27.009403228759766, -26.06414222717285, -25.118881225585938, -24.173622131347656, -23.228361129760742, -22.283100128173828, -21.337839126586914, -20.392578125, -19.44731903076172, -18.502058029174805, -17.55679702758789, -16.61153793334961, -15.666276931762695, -14.721015930175781, -13.775754928588867, -12.83049488067627, -11.885234832763672, -10.939973831176758, -9.994712829589844, -9.049452781677246, -8.104192733764648, -7.158931732177734, -6.2136712074279785, -5.268410682678223, -4.323150157928467, -3.377889633178711, -2.432629108428955, -1.4873685836791992, -0.5421080589294434, 0.4031505584716797, 1.3484110832214355, 2.2936716079711914, 3.2389321327209473, 4.184192657470703, 5.129453182220459, 6.074713706970215, 7.019974231719971, 7.965234756469727, 8.91049575805664, 9.855755805969238, 10.801015853881836, 11.74627685546875, 12.691537857055664, 13.636797904968262, 14.58205795288086, 15.527318954467773, 16.472579956054688, 17.41783905029297, 18.363100051879883, 19.308361053466797, 20.25362205505371, 21.198883056640625, 22.144142150878906, 23.08940315246582, 24.034664154052734, 24.979923248291016, 25.92518424987793, 26.870445251464844, 27.815706253051758, 28.760967254638672, 29.706226348876953, 30.651487350463867]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 6.0, 3.0, 18.0, 25.0, 46.0, 61.0, 96.0, 184.0, 236.0, 445.0, 716.0, 1236.0, 2059.0, 3433.0, 5691.0, 10141.0, 16951.0, 28811.0, 48876.0, 79691.0, 120908.0, 161937.0, 171184.0, 142873.0, 99081.0, 62303.0, 37302.0, 22294.0, 13095.0, 7795.0, 4425.0, 2707.0, 1545.0, 933.0, 552.0, 362.0, 203.0, 108.0, 80.0, 63.0, 33.0, 13.0, 9.0, 10.0, 5.0, 8.0, 3.0, 1.0, 2.0], "bins": [-7.8203125, -7.6103515625, -7.400390625, -7.1904296875, -6.98046875, -6.7705078125, -6.560546875, -6.3505859375, -6.140625, -5.9306640625, -5.720703125, -5.5107421875, -5.30078125, -5.0908203125, -4.880859375, -4.6708984375, -4.4609375, -4.2509765625, -4.041015625, -3.8310546875, -3.62109375, -3.4111328125, -3.201171875, -2.9912109375, -2.78125, -2.5712890625, -2.361328125, -2.1513671875, -1.94140625, -1.7314453125, -1.521484375, -1.3115234375, -1.1015625, -0.8916015625, -0.681640625, -0.4716796875, -0.26171875, -0.0517578125, 0.158203125, 0.3681640625, 0.578125, 0.7880859375, 0.998046875, 1.2080078125, 1.41796875, 1.6279296875, 1.837890625, 2.0478515625, 2.2578125, 2.4677734375, 2.677734375, 2.8876953125, 3.09765625, 3.3076171875, 3.517578125, 3.7275390625, 3.9375, 4.1474609375, 4.357421875, 4.5673828125, 4.77734375, 4.9873046875, 5.197265625, 5.4072265625, 5.6171875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 6.0, 0.0, 3.0, 2.0, 2.0, 8.0, 3.0, 9.0, 2.0, 13.0, 9.0, 13.0, 20.0, 22.0, 32.0, 22.0, 20.0, 28.0, 23.0, 30.0, 31.0, 35.0, 46.0, 46.0, 33.0, 32.0, 45.0, 29.0, 34.0, 45.0, 29.0, 37.0, 40.0, 30.0, 40.0, 20.0, 17.0, 23.0, 13.0, 23.0, 19.0, 9.0, 16.0, 11.0, 9.0, 5.0, 7.0, 5.0, 3.0, 3.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.625, -24.7568359375, -23.888671875, -23.0205078125, -22.15234375, -21.2841796875, -20.416015625, -19.5478515625, -18.6796875, -17.8115234375, -16.943359375, -16.0751953125, -15.20703125, -14.3388671875, -13.470703125, -12.6025390625, -11.734375, -10.8662109375, -9.998046875, -9.1298828125, -8.26171875, -7.3935546875, -6.525390625, -5.6572265625, -4.7890625, -3.9208984375, -3.052734375, -2.1845703125, -1.31640625, -0.4482421875, 0.419921875, 1.2880859375, 2.15625, 3.0244140625, 3.892578125, 4.7607421875, 5.62890625, 6.4970703125, 7.365234375, 8.2333984375, 9.1015625, 9.9697265625, 10.837890625, 11.7060546875, 12.57421875, 13.4423828125, 14.310546875, 15.1787109375, 16.046875, 16.9150390625, 17.783203125, 18.6513671875, 19.51953125, 20.3876953125, 21.255859375, 22.1240234375, 22.9921875, 23.8603515625, 24.728515625, 25.5966796875, 26.46484375, 27.3330078125, 28.201171875, 29.0693359375, 29.9375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 6.0, 4.0, 5.0, 3.0, 5.0, 9.0, 7.0, 19.0, 22.0, 23.0, 41.0, 43.0, 65.0, 102.0, 169.0, 262.0, 365.0, 659.0, 1075.0, 1895.0, 3358.0, 6311.0, 12221.0, 23844.0, 47006.0, 89536.0, 153941.0, 208116.0, 200316.0, 137327.0, 78069.0, 40196.0, 20482.0, 10571.0, 5362.0, 2936.0, 1541.0, 974.0, 601.0, 333.0, 247.0, 162.0, 106.0, 59.0, 45.0, 42.0, 30.0, 15.0, 11.0, 10.0, 9.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-6.93359375, -6.71612548828125, -6.4986572265625, -6.28118896484375, -6.063720703125, -5.84625244140625, -5.6287841796875, -5.41131591796875, -5.19384765625, -4.97637939453125, -4.7589111328125, -4.54144287109375, -4.323974609375, -4.10650634765625, -3.8890380859375, -3.67156982421875, -3.4541015625, -3.23663330078125, -3.0191650390625, -2.80169677734375, -2.584228515625, -2.36676025390625, -2.1492919921875, -1.93182373046875, -1.71435546875, -1.49688720703125, -1.2794189453125, -1.06195068359375, -0.844482421875, -0.62701416015625, -0.4095458984375, -0.19207763671875, 0.025390625, 0.24285888671875, 0.4603271484375, 0.67779541015625, 0.895263671875, 1.11273193359375, 1.3302001953125, 1.54766845703125, 1.76513671875, 1.98260498046875, 2.2000732421875, 2.41754150390625, 2.635009765625, 2.85247802734375, 3.0699462890625, 3.28741455078125, 3.5048828125, 3.72235107421875, 3.9398193359375, 4.15728759765625, 4.374755859375, 4.59222412109375, 4.8096923828125, 5.02716064453125, 5.24462890625, 5.46209716796875, 5.6795654296875, 5.89703369140625, 6.114501953125, 6.33197021484375, 6.5494384765625, 6.76690673828125, 6.984375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 7.0, 6.0, 11.0, 9.0, 16.0, 22.0, 22.0, 29.0, 26.0, 28.0, 26.0, 47.0, 32.0, 33.0, 45.0, 50.0, 36.0, 42.0, 43.0, 62.0, 44.0, 38.0, 39.0, 41.0, 36.0, 28.0, 33.0, 28.0, 25.0, 15.0, 18.0, 13.0, 6.0, 6.0, 7.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.234375, -20.5869140625, -19.939453125, -19.2919921875, -18.64453125, -17.9970703125, -17.349609375, -16.7021484375, -16.0546875, -15.4072265625, -14.759765625, -14.1123046875, -13.46484375, -12.8173828125, -12.169921875, -11.5224609375, -10.875, -10.2275390625, -9.580078125, -8.9326171875, -8.28515625, -7.6376953125, -6.990234375, -6.3427734375, -5.6953125, -5.0478515625, -4.400390625, -3.7529296875, -3.10546875, -2.4580078125, -1.810546875, -1.1630859375, -0.515625, 0.1318359375, 0.779296875, 1.4267578125, 2.07421875, 2.7216796875, 3.369140625, 4.0166015625, 4.6640625, 5.3115234375, 5.958984375, 6.6064453125, 7.25390625, 7.9013671875, 8.548828125, 9.1962890625, 9.84375, 10.4912109375, 11.138671875, 11.7861328125, 12.43359375, 13.0810546875, 13.728515625, 14.3759765625, 15.0234375, 15.6708984375, 16.318359375, 16.9658203125, 17.61328125, 18.2607421875, 18.908203125, 19.5556640625, 20.203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 1.0, 2.0, 6.0, 10.0, 17.0, 12.0, 21.0, 21.0, 51.0, 63.0, 88.0, 136.0, 243.0, 412.0, 790.0, 1579.0, 3860.0, 10827.0, 39644.0, 193204.0, 531684.0, 205454.0, 41569.0, 11202.0, 4050.0, 1676.0, 825.0, 404.0, 250.0, 145.0, 93.0, 59.0, 51.0, 32.0, 16.0, 11.0, 11.0, 15.0, 4.0, 5.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.13671875, -3.037200927734375, -2.93768310546875, -2.838165283203125, -2.7386474609375, -2.639129638671875, -2.53961181640625, -2.440093994140625, -2.340576171875, -2.241058349609375, -2.14154052734375, -2.042022705078125, -1.9425048828125, -1.842987060546875, -1.74346923828125, -1.643951416015625, -1.54443359375, -1.444915771484375, -1.34539794921875, -1.245880126953125, -1.1463623046875, -1.046844482421875, -0.94732666015625, -0.847808837890625, -0.748291015625, -0.648773193359375, -0.54925537109375, -0.449737548828125, -0.3502197265625, -0.250701904296875, -0.15118408203125, -0.051666259765625, 0.0478515625, 0.147369384765625, 0.24688720703125, 0.346405029296875, 0.4459228515625, 0.545440673828125, 0.64495849609375, 0.744476318359375, 0.843994140625, 0.943511962890625, 1.04302978515625, 1.142547607421875, 1.2420654296875, 1.341583251953125, 1.44110107421875, 1.540618896484375, 1.64013671875, 1.739654541015625, 1.83917236328125, 1.938690185546875, 2.0382080078125, 2.137725830078125, 2.23724365234375, 2.336761474609375, 2.436279296875, 2.535797119140625, 2.63531494140625, 2.734832763671875, 2.8343505859375, 2.933868408203125, 3.03338623046875, 3.132904052734375, 3.232421875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 7.0, 15.0, 25.0, 24.0, 34.0, 67.0, 90.0, 94.0, 110.0, 113.0, 94.0, 88.0, 65.0, 42.0, 35.0, 30.0, 10.0, 14.0, 12.0, 2.0, 4.0, 3.0, 3.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0004107952117919922, -0.0004003159701824188, -0.00038983672857284546, -0.0003793574869632721, -0.00036887824535369873, -0.00035839900374412537, -0.000347919762134552, -0.00033744052052497864, -0.0003269612789154053, -0.0003164820373058319, -0.00030600279569625854, -0.0002955235540866852, -0.0002850443124771118, -0.00027456507086753845, -0.0002640858292579651, -0.0002536065876483917, -0.00024312734603881836, -0.000232648104429245, -0.00022216886281967163, -0.00021168962121009827, -0.0002012103796005249, -0.00019073113799095154, -0.00018025189638137817, -0.0001697726547718048, -0.00015929341316223145, -0.00014881417155265808, -0.00013833492994308472, -0.00012785568833351135, -0.00011737644672393799, -0.00010689720511436462, -9.641796350479126e-05, -8.59387218952179e-05, -7.545948028564453e-05, -6.498023867607117e-05, -5.45009970664978e-05, -4.402175545692444e-05, -3.3542513847351074e-05, -2.306327223777771e-05, -1.2584030628204346e-05, -2.1047890186309814e-06, 8.374452590942383e-06, 1.8853694200515747e-05, 2.933293581008911e-05, 3.9812177419662476e-05, 5.029141902923584e-05, 6.0770660638809204e-05, 7.124990224838257e-05, 8.172914385795593e-05, 9.22083854675293e-05, 0.00010268762707710266, 0.00011316686868667603, 0.0001236461102962494, 0.00013412535190582275, 0.00014460459351539612, 0.00015508383512496948, 0.00016556307673454285, 0.0001760423183441162, 0.00018652155995368958, 0.00019700080156326294, 0.0002074800431728363, 0.00021795928478240967, 0.00022843852639198303, 0.0002389177680015564, 0.00024939700961112976, 0.0002598762512207031]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 9.0, 13.0, 13.0, 29.0, 42.0, 66.0, 81.0, 130.0, 196.0, 266.0, 442.0, 623.0, 958.0, 1484.0, 2295.0, 3805.0, 6292.0, 11176.0, 20235.0, 38270.0, 73691.0, 140329.0, 227014.0, 225530.0, 138040.0, 72227.0, 37453.0, 19953.0, 11111.0, 6438.0, 3812.0, 2264.0, 1437.0, 940.0, 626.0, 383.0, 273.0, 188.0, 139.0, 88.0, 65.0, 48.0, 20.0, 16.0, 10.0, 10.0, 4.0, 7.0, 1.0, 3.0, 1.0, 3.0], "bins": [-2.939453125, -2.855438232421875, -2.77142333984375, -2.687408447265625, -2.6033935546875, -2.519378662109375, -2.43536376953125, -2.351348876953125, -2.267333984375, -2.183319091796875, -2.09930419921875, -2.015289306640625, -1.9312744140625, -1.847259521484375, -1.76324462890625, -1.679229736328125, -1.59521484375, -1.511199951171875, -1.42718505859375, -1.343170166015625, -1.2591552734375, -1.175140380859375, -1.09112548828125, -1.007110595703125, -0.923095703125, -0.839080810546875, -0.75506591796875, -0.671051025390625, -0.5870361328125, -0.503021240234375, -0.41900634765625, -0.334991455078125, -0.2509765625, -0.166961669921875, -0.08294677734375, 0.001068115234375, 0.0850830078125, 0.169097900390625, 0.25311279296875, 0.337127685546875, 0.421142578125, 0.505157470703125, 0.58917236328125, 0.673187255859375, 0.7572021484375, 0.841217041015625, 0.92523193359375, 1.009246826171875, 1.09326171875, 1.177276611328125, 1.26129150390625, 1.345306396484375, 1.4293212890625, 1.513336181640625, 1.59735107421875, 1.681365966796875, 1.765380859375, 1.849395751953125, 1.93341064453125, 2.017425537109375, 2.1014404296875, 2.185455322265625, 2.26947021484375, 2.353485107421875, 2.4375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 10.0, 10.0, 13.0, 10.0, 25.0, 23.0, 25.0, 39.0, 44.0, 59.0, 66.0, 61.0, 81.0, 91.0, 93.0, 79.0, 59.0, 44.0, 36.0, 37.0, 24.0, 14.0, 13.0, 11.0, 8.0, 5.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.98828125, -0.9605484008789062, -0.9328155517578125, -0.9050827026367188, -0.877349853515625, -0.8496170043945312, -0.8218841552734375, -0.7941513061523438, -0.76641845703125, -0.7386856079101562, -0.7109527587890625, -0.6832199096679688, -0.655487060546875, -0.6277542114257812, -0.6000213623046875, -0.5722885131835938, -0.5445556640625, -0.5168228149414062, -0.4890899658203125, -0.46135711669921875, -0.433624267578125, -0.40589141845703125, -0.3781585693359375, -0.35042572021484375, -0.32269287109375, -0.29496002197265625, -0.2672271728515625, -0.23949432373046875, -0.211761474609375, -0.18402862548828125, -0.1562957763671875, -0.12856292724609375, -0.100830078125, -0.07309722900390625, -0.0453643798828125, -0.01763153076171875, 0.010101318359375, 0.03783416748046875, 0.0655670166015625, 0.09329986572265625, 0.12103271484375, 0.14876556396484375, 0.1764984130859375, 0.20423126220703125, 0.231964111328125, 0.25969696044921875, 0.2874298095703125, 0.31516265869140625, 0.3428955078125, 0.37062835693359375, 0.3983612060546875, 0.42609405517578125, 0.453826904296875, 0.48155975341796875, 0.5092926025390625, 0.5370254516601562, 0.56475830078125, 0.5924911499023438, 0.6202239990234375, 0.6479568481445312, 0.675689697265625, 0.7034225463867188, 0.7311553955078125, 0.7588882446289062, 0.78662109375]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 4.0, 7.0, 5.0, 8.0, 6.0, 9.0, 8.0, 18.0, 13.0, 15.0, 24.0, 23.0, 19.0, 24.0, 26.0, 25.0, 22.0, 42.0, 37.0, 39.0, 38.0, 38.0, 41.0, 42.0, 31.0, 44.0, 38.0, 36.0, 33.0, 31.0, 35.0, 25.0, 22.0, 27.0, 34.0, 20.0, 20.0, 16.0, 15.0, 4.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-23.547218322753906, -22.82798194885254, -22.108747482299805, -21.389511108398438, -20.670276641845703, -19.951040267944336, -19.23180389404297, -18.512569427490234, -17.793333053588867, -17.0740966796875, -16.354862213134766, -15.635625839233398, -14.916390419006348, -14.197154998779297, -13.47791862487793, -12.758683204650879, -12.039447784423828, -11.320212364196777, -10.600976943969727, -9.88174057006836, -9.162505149841309, -8.443269729614258, -7.724033832550049, -7.00479793548584, -6.285562515258789, -5.566327095031738, -4.847091197967529, -4.12785530090332, -3.4086198806762695, -2.6893842220306396, -1.9701485633850098, -1.2509126663208008, -0.5316753387451172, 0.1875603199005127, 0.9067959785461426, 1.6260316371917725, 2.3452672958374023, 3.0645029544830322, 3.783738613128662, 4.502974510192871, 5.222209930419922, 5.941445350646973, 6.660681247711182, 7.379917144775391, 8.099152565002441, 8.818387985229492, 9.53762435913086, 10.25685977935791, 10.976095199584961, 11.695330619812012, 12.414566040039062, 13.13380241394043, 13.85303783416748, 14.572273254394531, 15.291509628295898, 16.010746002197266, 16.72998046875, 17.449216842651367, 18.1684513092041, 18.88768768310547, 19.606922149658203, 20.32615852355957, 21.045394897460938, 21.764629364013672, 22.48386573791504]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 2.0, 4.0, 8.0, 9.0, 7.0, 12.0, 14.0, 14.0, 21.0, 21.0, 28.0, 22.0, 32.0, 41.0, 36.0, 44.0, 43.0, 40.0, 44.0, 37.0, 58.0, 43.0, 36.0, 43.0, 53.0, 31.0, 26.0, 32.0, 30.0, 26.0, 24.0, 16.0, 15.0, 19.0, 20.0, 11.0, 6.0, 7.0, 8.0, 6.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.58525276184082, -28.641803741455078, -27.698352813720703, -26.75490379333496, -25.811452865600586, -24.868003845214844, -23.92455291748047, -22.981103897094727, -22.037654876708984, -21.094205856323242, -20.150754928588867, -19.207305908203125, -18.26385498046875, -17.320405960083008, -16.376956939697266, -15.43350601196289, -14.490055084228516, -13.546605110168457, -12.603155136108398, -11.659706115722656, -10.716255187988281, -9.772806167602539, -8.82935619354248, -7.885906219482422, -6.942456245422363, -5.999006271362305, -5.055556297302246, -4.112106800079346, -3.168656826019287, -2.2252068519592285, -1.2817573547363281, -0.33830738067626953, 0.6051425933837891, 1.548592448234558, 2.492042303085327, 3.4354920387268066, 4.378942012786865, 5.322391986846924, 6.265841484069824, 7.209291458129883, 8.152741432189941, 9.09619140625, 10.039641380310059, 10.983091354370117, 11.92654037475586, 12.869991302490234, 13.813440322875977, 14.756890296936035, 15.700340270996094, 16.643789291381836, 17.58724021911621, 18.530689239501953, 19.474140167236328, 20.41758918762207, 21.361038208007812, 22.304489135742188, 23.247940063476562, 24.191389083862305, 25.13484001159668, 26.078289031982422, 27.021739959716797, 27.96518898010254, 28.90863800048828, 29.852088928222656, 30.7955379486084]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 10.0, 18.0, 15.0, 41.0, 57.0, 102.0, 214.0, 274.0, 429.0, 751.0, 1201.0, 1991.0, 3276.0, 5420.0, 8815.0, 14084.0, 21658.0, 33132.0, 47647.0, 65085.0, 84587.0, 101405.0, 113039.0, 114678.0, 105812.0, 91043.0, 71973.0, 54366.0, 38100.0, 25539.0, 16442.0, 10565.0, 6345.0, 4000.0, 2556.0, 1524.0, 938.0, 601.0, 341.0, 179.0, 128.0, 73.0, 36.0, 26.0, 19.0, 12.0, 1.0, 4.0, 7.0, 1.0, 0.0, 2.0, 1.0], "bins": [-21.734375, -21.0986328125, -20.462890625, -19.8271484375, -19.19140625, -18.5556640625, -17.919921875, -17.2841796875, -16.6484375, -16.0126953125, -15.376953125, -14.7412109375, -14.10546875, -13.4697265625, -12.833984375, -12.1982421875, -11.5625, -10.9267578125, -10.291015625, -9.6552734375, -9.01953125, -8.3837890625, -7.748046875, -7.1123046875, -6.4765625, -5.8408203125, -5.205078125, -4.5693359375, -3.93359375, -3.2978515625, -2.662109375, -2.0263671875, -1.390625, -0.7548828125, -0.119140625, 0.5166015625, 1.15234375, 1.7880859375, 2.423828125, 3.0595703125, 3.6953125, 4.3310546875, 4.966796875, 5.6025390625, 6.23828125, 6.8740234375, 7.509765625, 8.1455078125, 8.78125, 9.4169921875, 10.052734375, 10.6884765625, 11.32421875, 11.9599609375, 12.595703125, 13.2314453125, 13.8671875, 14.5029296875, 15.138671875, 15.7744140625, 16.41015625, 17.0458984375, 17.681640625, 18.3173828125, 18.953125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 0.0, 0.0, 2.0, 4.0, 6.0, 7.0, 9.0, 18.0, 18.0, 12.0, 9.0, 23.0, 19.0, 19.0, 28.0, 36.0, 40.0, 37.0, 25.0, 36.0, 45.0, 51.0, 37.0, 50.0, 41.0, 25.0, 43.0, 41.0, 40.0, 28.0, 27.0, 30.0, 29.0, 15.0, 22.0, 16.0, 12.0, 16.0, 19.0, 17.0, 9.0, 10.0, 4.0, 6.0, 5.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.453125, -25.58984375, -24.7265625, -23.86328125, -23.0, -22.13671875, -21.2734375, -20.41015625, -19.546875, -18.68359375, -17.8203125, -16.95703125, -16.09375, -15.23046875, -14.3671875, -13.50390625, -12.640625, -11.77734375, -10.9140625, -10.05078125, -9.1875, -8.32421875, -7.4609375, -6.59765625, -5.734375, -4.87109375, -4.0078125, -3.14453125, -2.28125, -1.41796875, -0.5546875, 0.30859375, 1.171875, 2.03515625, 2.8984375, 3.76171875, 4.625, 5.48828125, 6.3515625, 7.21484375, 8.078125, 8.94140625, 9.8046875, 10.66796875, 11.53125, 12.39453125, 13.2578125, 14.12109375, 14.984375, 15.84765625, 16.7109375, 17.57421875, 18.4375, 19.30078125, 20.1640625, 21.02734375, 21.890625, 22.75390625, 23.6171875, 24.48046875, 25.34375, 26.20703125, 27.0703125, 27.93359375, 28.796875]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 8.0, 11.0, 27.0, 25.0, 54.0, 70.0, 109.0, 226.0, 324.0, 528.0, 806.0, 1226.0, 1911.0, 2860.0, 4433.0, 6593.0, 9868.0, 14124.0, 20458.0, 28078.0, 38341.0, 50001.0, 62749.0, 75518.0, 85992.0, 92505.0, 94516.0, 90239.0, 81868.0, 70094.0, 57619.0, 44811.0, 33587.0, 24726.0, 17639.0, 12136.0, 8397.0, 5626.0, 3655.0, 2395.0, 1559.0, 1040.0, 681.0, 414.0, 271.0, 161.0, 107.0, 67.0, 39.0, 23.0, 12.0, 14.0, 6.0, 9.0, 6.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.046875, -15.51708984375, -14.9873046875, -14.45751953125, -13.927734375, -13.39794921875, -12.8681640625, -12.33837890625, -11.80859375, -11.27880859375, -10.7490234375, -10.21923828125, -9.689453125, -9.15966796875, -8.6298828125, -8.10009765625, -7.5703125, -7.04052734375, -6.5107421875, -5.98095703125, -5.451171875, -4.92138671875, -4.3916015625, -3.86181640625, -3.33203125, -2.80224609375, -2.2724609375, -1.74267578125, -1.212890625, -0.68310546875, -0.1533203125, 0.37646484375, 0.90625, 1.43603515625, 1.9658203125, 2.49560546875, 3.025390625, 3.55517578125, 4.0849609375, 4.61474609375, 5.14453125, 5.67431640625, 6.2041015625, 6.73388671875, 7.263671875, 7.79345703125, 8.3232421875, 8.85302734375, 9.3828125, 9.91259765625, 10.4423828125, 10.97216796875, 11.501953125, 12.03173828125, 12.5615234375, 13.09130859375, 13.62109375, 14.15087890625, 14.6806640625, 15.21044921875, 15.740234375, 16.27001953125, 16.7998046875, 17.32958984375, 17.859375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 4.0, 6.0, 3.0, 6.0, 3.0, 8.0, 11.0, 7.0, 7.0, 17.0, 15.0, 12.0, 12.0, 18.0, 19.0, 31.0, 28.0, 17.0, 27.0, 30.0, 52.0, 36.0, 29.0, 41.0, 34.0, 34.0, 39.0, 33.0, 33.0, 30.0, 32.0, 29.0, 32.0, 23.0, 31.0, 31.0, 21.0, 27.0, 21.0, 20.0, 17.0, 20.0, 14.0, 9.0, 5.0, 7.0, 8.0, 4.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.2109375, -13.7237548828125, -13.236572265625, -12.7493896484375, -12.26220703125, -11.7750244140625, -11.287841796875, -10.8006591796875, -10.3134765625, -9.8262939453125, -9.339111328125, -8.8519287109375, -8.36474609375, -7.8775634765625, -7.390380859375, -6.9031982421875, -6.416015625, -5.9288330078125, -5.441650390625, -4.9544677734375, -4.46728515625, -3.9801025390625, -3.492919921875, -3.0057373046875, -2.5185546875, -2.0313720703125, -1.544189453125, -1.0570068359375, -0.56982421875, -0.0826416015625, 0.404541015625, 0.8917236328125, 1.37890625, 1.8660888671875, 2.353271484375, 2.8404541015625, 3.32763671875, 3.8148193359375, 4.302001953125, 4.7891845703125, 5.2763671875, 5.7635498046875, 6.250732421875, 6.7379150390625, 7.22509765625, 7.7122802734375, 8.199462890625, 8.6866455078125, 9.173828125, 9.6610107421875, 10.148193359375, 10.6353759765625, 11.12255859375, 11.6097412109375, 12.096923828125, 12.5841064453125, 13.0712890625, 13.5584716796875, 14.045654296875, 14.5328369140625, 15.02001953125, 15.5072021484375, 15.994384765625, 16.4815673828125, 16.96875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 2.0, 7.0, 5.0, 2.0, 11.0, 15.0, 15.0, 23.0, 21.0, 42.0, 43.0, 68.0, 115.0, 173.0, 270.0, 383.0, 622.0, 989.0, 1529.0, 2431.0, 3876.0, 6316.0, 10211.0, 16339.0, 25581.0, 39117.0, 57199.0, 78405.0, 99622.0, 117047.0, 123452.0, 117505.0, 100895.0, 79236.0, 57337.0, 39648.0, 25832.0, 16662.0, 10224.0, 6470.0, 4072.0, 2408.0, 1490.0, 1009.0, 601.0, 409.0, 257.0, 181.0, 115.0, 82.0, 69.0, 46.0, 29.0, 19.0, 11.0, 8.0, 7.0, 4.0, 9.0, 2.0, 1.0], "bins": [-8.125, -7.882568359375, -7.64013671875, -7.397705078125, -7.1552734375, -6.912841796875, -6.67041015625, -6.427978515625, -6.185546875, -5.943115234375, -5.70068359375, -5.458251953125, -5.2158203125, -4.973388671875, -4.73095703125, -4.488525390625, -4.24609375, -4.003662109375, -3.76123046875, -3.518798828125, -3.2763671875, -3.033935546875, -2.79150390625, -2.549072265625, -2.306640625, -2.064208984375, -1.82177734375, -1.579345703125, -1.3369140625, -1.094482421875, -0.85205078125, -0.609619140625, -0.3671875, -0.124755859375, 0.11767578125, 0.360107421875, 0.6025390625, 0.844970703125, 1.08740234375, 1.329833984375, 1.572265625, 1.814697265625, 2.05712890625, 2.299560546875, 2.5419921875, 2.784423828125, 3.02685546875, 3.269287109375, 3.51171875, 3.754150390625, 3.99658203125, 4.239013671875, 4.4814453125, 4.723876953125, 4.96630859375, 5.208740234375, 5.451171875, 5.693603515625, 5.93603515625, 6.178466796875, 6.4208984375, 6.663330078125, 6.90576171875, 7.148193359375, 7.390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 3.0, 9.0, 7.0, 8.0, 17.0, 23.0, 14.0, 33.0, 28.0, 43.0, 49.0, 72.0, 80.0, 71.0, 66.0, 59.0, 67.0, 56.0, 53.0, 45.0, 36.0, 36.0, 26.0, 25.0, 18.0, 12.0, 19.0, 8.0, 2.0, 8.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008840560913085938, -0.0008467435836791992, -0.0008094310760498047, -0.0007721185684204102, -0.0007348060607910156, -0.0006974935531616211, -0.0006601810455322266, -0.000622868537902832, -0.0005855560302734375, -0.000548243522644043, -0.0005109310150146484, -0.0004736185073852539, -0.0004363059997558594, -0.00039899349212646484, -0.0003616809844970703, -0.0003243684768676758, -0.00028705596923828125, -0.0002497434616088867, -0.0002124309539794922, -0.00017511844635009766, -0.00013780593872070312, -0.0001004934310913086, -6.318092346191406e-05, -2.586841583251953e-05, 1.1444091796875e-05, 4.875659942626953e-05, 8.606910705566406e-05, 0.0001233816146850586, 0.00016069412231445312, 0.00019800662994384766, 0.0002353191375732422, 0.0002726316452026367, 0.00030994415283203125, 0.0003472566604614258, 0.0003845691680908203, 0.00042188167572021484, 0.0004591941833496094, 0.0004965066909790039, 0.0005338191986083984, 0.000571131706237793, 0.0006084442138671875, 0.000645756721496582, 0.0006830692291259766, 0.0007203817367553711, 0.0007576942443847656, 0.0007950067520141602, 0.0008323192596435547, 0.0008696317672729492, 0.0009069442749023438, 0.0009442567825317383, 0.0009815692901611328, 0.0010188817977905273, 0.0010561943054199219, 0.0010935068130493164, 0.001130819320678711, 0.0011681318283081055, 0.0012054443359375, 0.0012427568435668945, 0.001280069351196289, 0.0013173818588256836, 0.0013546943664550781, 0.0013920068740844727, 0.0014293193817138672, 0.0014666318893432617, 0.0015039443969726562]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 8.0, 10.0, 15.0, 26.0, 27.0, 34.0, 66.0, 81.0, 150.0, 199.0, 273.0, 455.0, 721.0, 1215.0, 1933.0, 3200.0, 5299.0, 9161.0, 15339.0, 26066.0, 42594.0, 66816.0, 96629.0, 125678.0, 143694.0, 140582.0, 119615.0, 90039.0, 61956.0, 38789.0, 23498.0, 14228.0, 8096.0, 4638.0, 2783.0, 1660.0, 1064.0, 673.0, 416.0, 265.0, 199.0, 130.0, 86.0, 51.0, 37.0, 19.0, 21.0, 11.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.109375, -8.8046875, -8.5, -8.1953125, -7.890625, -7.5859375, -7.28125, -6.9765625, -6.671875, -6.3671875, -6.0625, -5.7578125, -5.453125, -5.1484375, -4.84375, -4.5390625, -4.234375, -3.9296875, -3.625, -3.3203125, -3.015625, -2.7109375, -2.40625, -2.1015625, -1.796875, -1.4921875, -1.1875, -0.8828125, -0.578125, -0.2734375, 0.03125, 0.3359375, 0.640625, 0.9453125, 1.25, 1.5546875, 1.859375, 2.1640625, 2.46875, 2.7734375, 3.078125, 3.3828125, 3.6875, 3.9921875, 4.296875, 4.6015625, 4.90625, 5.2109375, 5.515625, 5.8203125, 6.125, 6.4296875, 6.734375, 7.0390625, 7.34375, 7.6484375, 7.953125, 8.2578125, 8.5625, 8.8671875, 9.171875, 9.4765625, 9.78125, 10.0859375, 10.390625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 7.0, 5.0, 11.0, 9.0, 17.0, 11.0, 26.0, 14.0, 31.0, 32.0, 38.0, 48.0, 66.0, 49.0, 49.0, 43.0, 55.0, 62.0, 48.0, 45.0, 57.0, 44.0, 47.0, 36.0, 35.0, 22.0, 26.0, 20.0, 9.0, 11.0, 4.0, 5.0, 9.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.34375, -4.22564697265625, -4.1075439453125, -3.98944091796875, -3.871337890625, -3.75323486328125, -3.6351318359375, -3.51702880859375, -3.39892578125, -3.28082275390625, -3.1627197265625, -3.04461669921875, -2.926513671875, -2.80841064453125, -2.6903076171875, -2.57220458984375, -2.4541015625, -2.33599853515625, -2.2178955078125, -2.09979248046875, -1.981689453125, -1.86358642578125, -1.7454833984375, -1.62738037109375, -1.50927734375, -1.39117431640625, -1.2730712890625, -1.15496826171875, -1.036865234375, -0.91876220703125, -0.8006591796875, -0.68255615234375, -0.564453125, -0.44635009765625, -0.3282470703125, -0.21014404296875, -0.092041015625, 0.02606201171875, 0.1441650390625, 0.26226806640625, 0.38037109375, 0.49847412109375, 0.6165771484375, 0.73468017578125, 0.852783203125, 0.97088623046875, 1.0889892578125, 1.20709228515625, 1.3251953125, 1.44329833984375, 1.5614013671875, 1.67950439453125, 1.797607421875, 1.91571044921875, 2.0338134765625, 2.15191650390625, 2.27001953125, 2.38812255859375, 2.5062255859375, 2.62432861328125, 2.742431640625, 2.86053466796875, 2.9786376953125, 3.09674072265625, 3.21484375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 5.0, 5.0, 2.0, 6.0, 10.0, 4.0, 8.0, 16.0, 29.0, 16.0, 19.0, 16.0, 22.0, 28.0, 25.0, 26.0, 29.0, 42.0, 30.0, 33.0, 34.0, 44.0, 38.0, 40.0, 35.0, 38.0, 37.0, 39.0, 40.0, 24.0, 31.0, 29.0, 34.0, 24.0, 23.0, 29.0, 18.0, 10.0, 14.0, 8.0, 3.0, 8.0, 4.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 3.0], "bins": [-22.8902530670166, -22.200899124145508, -21.511545181274414, -20.82219123840332, -20.13283920288086, -19.443485260009766, -18.754131317138672, -18.064777374267578, -17.375423431396484, -16.68606948852539, -15.996715545654297, -15.30736255645752, -14.618008613586426, -13.928654670715332, -13.239301681518555, -12.549947738647461, -11.860593795776367, -11.171239852905273, -10.48188591003418, -9.792532920837402, -9.103178977966309, -8.413825035095215, -7.724471569061279, -7.035118103027344, -6.34576416015625, -5.656410217285156, -4.967056751251221, -4.277703285217285, -3.5883493423461914, -2.8989956378936768, -2.209641933441162, -1.5202884674072266, -0.8309345245361328, -0.14158082008361816, 0.5477728843688965, 1.2371265888214111, 1.9264802932739258, 2.6158339977264404, 3.305187702178955, 3.9945411682128906, 4.683895111083984, 5.373249053955078, 6.062602519989014, 6.751955986022949, 7.441309928894043, 8.130663871765137, 8.820016860961914, 9.509370803833008, 10.198724746704102, 10.888078689575195, 11.577432632446289, 12.266785621643066, 12.95613956451416, 13.645493507385254, 14.334846496582031, 15.024200439453125, 15.713554382324219, 16.402908325195312, 17.092262268066406, 17.7816162109375, 18.470970153808594, 19.160322189331055, 19.84967613220215, 20.539030075073242, 21.228384017944336]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 6.0, 5.0, 6.0, 9.0, 11.0, 12.0, 21.0, 16.0, 17.0, 31.0, 26.0, 26.0, 27.0, 30.0, 37.0, 32.0, 43.0, 47.0, 36.0, 31.0, 45.0, 47.0, 42.0, 44.0, 38.0, 31.0, 33.0, 18.0, 34.0, 26.0, 22.0, 21.0, 19.0, 15.0, 13.0, 12.0, 15.0, 12.0, 8.0, 9.0, 5.0, 6.0, 7.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0], "bins": [-30.595733642578125, -29.736892700195312, -28.8780517578125, -28.019210815429688, -27.160369873046875, -26.301528930664062, -25.44268798828125, -24.583847045898438, -23.725006103515625, -22.866165161132812, -22.00732421875, -21.148483276367188, -20.289642333984375, -19.430801391601562, -18.57196044921875, -17.713119506835938, -16.854278564453125, -15.995437622070312, -15.1365966796875, -14.277755737304688, -13.418914794921875, -12.560073852539062, -11.70123291015625, -10.842391967773438, -9.983551025390625, -9.124710083007812, -8.265869140625, -7.4070281982421875, -6.548187255859375, -5.6893463134765625, -4.83050537109375, -3.9716644287109375, -3.112823486328125, -2.2539825439453125, -1.3951416015625, -0.5363006591796875, 0.322540283203125, 1.1813812255859375, 2.04022216796875, 2.8990631103515625, 3.757904052734375, 4.6167449951171875, 5.4755859375, 6.3344268798828125, 7.193267822265625, 8.052108764648438, 8.91094970703125, 9.769790649414062, 10.628631591796875, 11.487472534179688, 12.3463134765625, 13.205154418945312, 14.063995361328125, 14.922836303710938, 15.78167724609375, 16.640518188476562, 17.499359130859375, 18.358200073242188, 19.217041015625, 20.075881958007812, 20.934722900390625, 21.793563842773438, 22.65240478515625, 23.511245727539062, 24.370086669921875]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 5.0, 10.0, 15.0, 33.0, 33.0, 77.0, 147.0, 239.0, 410.0, 649.0, 1063.0, 1868.0, 2885.0, 4752.0, 7914.0, 12451.0, 19532.0, 30798.0, 46988.0, 70468.0, 103378.0, 145481.0, 198156.0, 258777.0, 320152.0, 374160.0, 407017.0, 413474.0, 392121.0, 345617.0, 285899.0, 223631.0, 166955.0, 119418.0, 82533.0, 55579.0, 37260.0, 23688.0, 15344.0, 9569.0, 6137.0, 3704.0, 2300.0, 1388.0, 870.0, 541.0, 329.0, 200.0, 124.0, 60.0, 45.0, 25.0, 13.0, 5.0, 7.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.453125, -16.89404296875, -16.3349609375, -15.77587890625, -15.216796875, -14.65771484375, -14.0986328125, -13.53955078125, -12.98046875, -12.42138671875, -11.8623046875, -11.30322265625, -10.744140625, -10.18505859375, -9.6259765625, -9.06689453125, -8.5078125, -7.94873046875, -7.3896484375, -6.83056640625, -6.271484375, -5.71240234375, -5.1533203125, -4.59423828125, -4.03515625, -3.47607421875, -2.9169921875, -2.35791015625, -1.798828125, -1.23974609375, -0.6806640625, -0.12158203125, 0.4375, 0.99658203125, 1.5556640625, 2.11474609375, 2.673828125, 3.23291015625, 3.7919921875, 4.35107421875, 4.91015625, 5.46923828125, 6.0283203125, 6.58740234375, 7.146484375, 7.70556640625, 8.2646484375, 8.82373046875, 9.3828125, 9.94189453125, 10.5009765625, 11.06005859375, 11.619140625, 12.17822265625, 12.7373046875, 13.29638671875, 13.85546875, 14.41455078125, 14.9736328125, 15.53271484375, 16.091796875, 16.65087890625, 17.2099609375, 17.76904296875, 18.328125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 1.0, 7.0, 3.0, 0.0, 13.0, 12.0, 17.0, 15.0, 15.0, 21.0, 17.0, 31.0, 31.0, 35.0, 28.0, 34.0, 42.0, 38.0, 51.0, 40.0, 44.0, 51.0, 43.0, 39.0, 42.0, 48.0, 37.0, 35.0, 22.0, 23.0, 23.0, 27.0, 22.0, 15.0, 8.0, 9.0, 16.0, 12.0, 13.0, 5.0, 4.0, 8.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.375, -24.631591796875, -23.88818359375, -23.144775390625, -22.4013671875, -21.657958984375, -20.91455078125, -20.171142578125, -19.427734375, -18.684326171875, -17.94091796875, -17.197509765625, -16.4541015625, -15.710693359375, -14.96728515625, -14.223876953125, -13.48046875, -12.737060546875, -11.99365234375, -11.250244140625, -10.5068359375, -9.763427734375, -9.02001953125, -8.276611328125, -7.533203125, -6.789794921875, -6.04638671875, -5.302978515625, -4.5595703125, -3.816162109375, -3.07275390625, -2.329345703125, -1.5859375, -0.842529296875, -0.09912109375, 0.644287109375, 1.3876953125, 2.131103515625, 2.87451171875, 3.617919921875, 4.361328125, 5.104736328125, 5.84814453125, 6.591552734375, 7.3349609375, 8.078369140625, 8.82177734375, 9.565185546875, 10.30859375, 11.052001953125, 11.79541015625, 12.538818359375, 13.2822265625, 14.025634765625, 14.76904296875, 15.512451171875, 16.255859375, 16.999267578125, 17.74267578125, 18.486083984375, 19.2294921875, 19.972900390625, 20.71630859375, 21.459716796875, 22.203125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [3.0, 1.0, 8.0, 8.0, 9.0, 27.0, 32.0, 48.0, 97.0, 167.0, 277.0, 451.0, 702.0, 1195.0, 1954.0, 3066.0, 5116.0, 8076.0, 12138.0, 18792.0, 28054.0, 41098.0, 60693.0, 83926.0, 116178.0, 153474.0, 196726.0, 242176.0, 286282.0, 321213.0, 346613.0, 355392.0, 345181.0, 320176.0, 283002.0, 239975.0, 194712.0, 151090.0, 114010.0, 83248.0, 59130.0, 41418.0, 27693.0, 18474.0, 11953.0, 7737.0, 4736.0, 3008.0, 1952.0, 1118.0, 662.0, 399.0, 243.0, 171.0, 84.0, 49.0, 45.0, 17.0, 13.0, 7.0, 1.0, 3.0, 3.0, 2.0], "bins": [-16.390625, -15.869873046875, -15.34912109375, -14.828369140625, -14.3076171875, -13.786865234375, -13.26611328125, -12.745361328125, -12.224609375, -11.703857421875, -11.18310546875, -10.662353515625, -10.1416015625, -9.620849609375, -9.10009765625, -8.579345703125, -8.05859375, -7.537841796875, -7.01708984375, -6.496337890625, -5.9755859375, -5.454833984375, -4.93408203125, -4.413330078125, -3.892578125, -3.371826171875, -2.85107421875, -2.330322265625, -1.8095703125, -1.288818359375, -0.76806640625, -0.247314453125, 0.2734375, 0.794189453125, 1.31494140625, 1.835693359375, 2.3564453125, 2.877197265625, 3.39794921875, 3.918701171875, 4.439453125, 4.960205078125, 5.48095703125, 6.001708984375, 6.5224609375, 7.043212890625, 7.56396484375, 8.084716796875, 8.60546875, 9.126220703125, 9.64697265625, 10.167724609375, 10.6884765625, 11.209228515625, 11.72998046875, 12.250732421875, 12.771484375, 13.292236328125, 13.81298828125, 14.333740234375, 14.8544921875, 15.375244140625, 15.89599609375, 16.416748046875, 16.9375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 4.0, 5.0, 7.0, 11.0, 12.0, 19.0, 21.0, 20.0, 37.0, 39.0, 53.0, 59.0, 70.0, 85.0, 83.0, 122.0, 111.0, 142.0, 159.0, 171.0, 189.0, 191.0, 183.0, 179.0, 206.0, 195.0, 205.0, 156.0, 168.0, 190.0, 154.0, 128.0, 109.0, 98.0, 65.0, 58.0, 67.0, 59.0, 54.0, 40.0, 33.0, 26.0, 23.0, 21.0, 7.0, 12.0, 5.0, 9.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-9.859375, -9.541015625, -9.22265625, -8.904296875, -8.5859375, -8.267578125, -7.94921875, -7.630859375, -7.3125, -6.994140625, -6.67578125, -6.357421875, -6.0390625, -5.720703125, -5.40234375, -5.083984375, -4.765625, -4.447265625, -4.12890625, -3.810546875, -3.4921875, -3.173828125, -2.85546875, -2.537109375, -2.21875, -1.900390625, -1.58203125, -1.263671875, -0.9453125, -0.626953125, -0.30859375, 0.009765625, 0.328125, 0.646484375, 0.96484375, 1.283203125, 1.6015625, 1.919921875, 2.23828125, 2.556640625, 2.875, 3.193359375, 3.51171875, 3.830078125, 4.1484375, 4.466796875, 4.78515625, 5.103515625, 5.421875, 5.740234375, 6.05859375, 6.376953125, 6.6953125, 7.013671875, 7.33203125, 7.650390625, 7.96875, 8.287109375, 8.60546875, 8.923828125, 9.2421875, 9.560546875, 9.87890625, 10.197265625, 10.515625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 2.0, 7.0, 8.0, 8.0, 11.0, 10.0, 16.0, 17.0, 21.0, 18.0, 21.0, 17.0, 20.0, 32.0, 33.0, 27.0, 35.0, 31.0, 41.0, 52.0, 40.0, 43.0, 31.0, 43.0, 41.0, 55.0, 41.0, 50.0, 26.0, 25.0, 28.0, 38.0, 27.0, 14.0, 17.0, 13.0, 13.0, 8.0, 4.0, 1.0, 5.0, 7.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.20938491821289, -23.411296844482422, -22.613208770751953, -21.81511878967285, -21.017030715942383, -20.218942642211914, -19.420852661132812, -18.622764587402344, -17.824676513671875, -17.026588439941406, -16.228500366210938, -15.430410385131836, -14.632322311401367, -13.834234237670898, -13.036145210266113, -12.238056182861328, -11.43996810913086, -10.64188003540039, -9.843791007995605, -9.04570198059082, -8.247613906860352, -7.449525356292725, -6.651436805725098, -5.853348255157471, -5.055259704589844, -4.257171154022217, -3.45908260345459, -2.660994052886963, -1.862905502319336, -1.064816951751709, -0.26672840118408203, 0.5313601493835449, 1.329446792602539, 2.127535343170166, 2.925623893737793, 3.72371244430542, 4.521800994873047, 5.319889545440674, 6.117978096008301, 6.916066646575928, 7.714155197143555, 8.512243270874023, 9.310332298278809, 10.108421325683594, 10.906509399414062, 11.704597473144531, 12.502686500549316, 13.300775527954102, 14.09886360168457, 14.896951675415039, 15.695040702819824, 16.49312973022461, 17.291217803955078, 18.089305877685547, 18.887393951416016, 19.685483932495117, 20.483572006225586, 21.281660079956055, 22.079750061035156, 22.877838134765625, 23.675926208496094, 24.474014282226562, 25.27210235595703, 26.070192337036133, 26.8682804107666]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 1.0, 8.0, 6.0, 10.0, 5.0, 10.0, 10.0, 10.0, 11.0, 21.0, 12.0, 29.0, 34.0, 24.0, 30.0, 36.0, 47.0, 35.0, 48.0, 54.0, 36.0, 32.0, 29.0, 48.0, 38.0, 35.0, 32.0, 38.0, 33.0, 32.0, 31.0, 26.0, 26.0, 18.0, 11.0, 12.0, 14.0, 12.0, 11.0, 12.0, 7.0, 11.0, 4.0, 6.0, 2.0, 2.0, 2.0, 6.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-26.185714721679688, -25.343616485595703, -24.501516342163086, -23.65941619873047, -22.817317962646484, -21.9752197265625, -21.133119583129883, -20.291019439697266, -19.44892120361328, -18.606822967529297, -17.76472282409668, -16.922622680664062, -16.080524444580078, -15.238425254821777, -14.396326065063477, -13.554226875305176, -12.712127685546875, -11.870028495788574, -11.027929306030273, -10.185830116271973, -9.343730926513672, -8.501631736755371, -7.65953254699707, -6.8174333572387695, -5.975334167480469, -5.133234977722168, -4.291135787963867, -3.4490365982055664, -2.6069374084472656, -1.7648382186889648, -0.9227390289306641, -0.08063983917236328, 0.7614574432373047, 1.6035566329956055, 2.4456558227539062, 3.287755012512207, 4.129854202270508, 4.971953392028809, 5.814052581787109, 6.65615177154541, 7.498250961303711, 8.340350151062012, 9.182449340820312, 10.024548530578613, 10.866647720336914, 11.708746910095215, 12.550846099853516, 13.392945289611816, 14.235044479370117, 15.077143669128418, 15.919242858886719, 16.761341094970703, 17.60344123840332, 18.445541381835938, 19.287639617919922, 20.129737854003906, 20.971837997436523, 21.81393814086914, 22.656036376953125, 23.49813461303711, 24.340234756469727, 25.182334899902344, 26.024433135986328, 26.866531372070312, 27.70863151550293]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 5.0, 9.0, 8.0, 11.0, 14.0, 24.0, 33.0, 48.0, 65.0, 83.0, 136.0, 205.0, 292.0, 363.0, 588.0, 784.0, 1207.0, 1843.0, 2950.0, 4857.0, 8807.0, 15969.0, 31044.0, 62481.0, 121256.0, 203566.0, 234310.0, 167236.0, 91776.0, 45669.0, 23043.0, 12088.0, 6621.0, 3868.0, 2391.0, 1548.0, 1023.0, 701.0, 519.0, 348.0, 239.0, 177.0, 99.0, 83.0, 57.0, 36.0, 26.0, 17.0, 15.0, 15.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.67578125, -7.40435791015625, -7.1329345703125, -6.86151123046875, -6.590087890625, -6.31866455078125, -6.0472412109375, -5.77581787109375, -5.50439453125, -5.23297119140625, -4.9615478515625, -4.69012451171875, -4.418701171875, -4.14727783203125, -3.8758544921875, -3.60443115234375, -3.3330078125, -3.06158447265625, -2.7901611328125, -2.51873779296875, -2.247314453125, -1.97589111328125, -1.7044677734375, -1.43304443359375, -1.16162109375, -0.89019775390625, -0.6187744140625, -0.34735107421875, -0.075927734375, 0.19549560546875, 0.4669189453125, 0.73834228515625, 1.009765625, 1.28118896484375, 1.5526123046875, 1.82403564453125, 2.095458984375, 2.36688232421875, 2.6383056640625, 2.90972900390625, 3.18115234375, 3.45257568359375, 3.7239990234375, 3.99542236328125, 4.266845703125, 4.53826904296875, 4.8096923828125, 5.08111572265625, 5.3525390625, 5.62396240234375, 5.8953857421875, 6.16680908203125, 6.438232421875, 6.70965576171875, 6.9810791015625, 7.25250244140625, 7.52392578125, 7.79534912109375, 8.0667724609375, 8.33819580078125, 8.609619140625, 8.88104248046875, 9.1524658203125, 9.42388916015625, 9.6953125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 5.0, 3.0, 10.0, 10.0, 4.0, 10.0, 14.0, 8.0, 13.0, 10.0, 23.0, 31.0, 25.0, 35.0, 46.0, 36.0, 34.0, 35.0, 39.0, 37.0, 50.0, 43.0, 33.0, 52.0, 43.0, 29.0, 40.0, 33.0, 24.0, 28.0, 27.0, 17.0, 24.0, 22.0, 16.0, 17.0, 16.0, 12.0, 11.0, 10.0, 8.0, 8.0, 4.0, 1.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.703125, -25.81396484375, -24.9248046875, -24.03564453125, -23.146484375, -22.25732421875, -21.3681640625, -20.47900390625, -19.58984375, -18.70068359375, -17.8115234375, -16.92236328125, -16.033203125, -15.14404296875, -14.2548828125, -13.36572265625, -12.4765625, -11.58740234375, -10.6982421875, -9.80908203125, -8.919921875, -8.03076171875, -7.1416015625, -6.25244140625, -5.36328125, -4.47412109375, -3.5849609375, -2.69580078125, -1.806640625, -0.91748046875, -0.0283203125, 0.86083984375, 1.75, 2.63916015625, 3.5283203125, 4.41748046875, 5.306640625, 6.19580078125, 7.0849609375, 7.97412109375, 8.86328125, 9.75244140625, 10.6416015625, 11.53076171875, 12.419921875, 13.30908203125, 14.1982421875, 15.08740234375, 15.9765625, 16.86572265625, 17.7548828125, 18.64404296875, 19.533203125, 20.42236328125, 21.3115234375, 22.20068359375, 23.08984375, 23.97900390625, 24.8681640625, 25.75732421875, 26.646484375, 27.53564453125, 28.4248046875, 29.31396484375, 30.203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 8.0, 7.0, 5.0, 6.0, 15.0, 22.0, 38.0, 44.0, 66.0, 108.0, 139.0, 235.0, 337.0, 709.0, 1272.0, 2683.0, 5841.0, 14309.0, 37961.0, 105699.0, 248703.0, 325237.0, 187677.0, 72356.0, 26196.0, 10156.0, 4243.0, 2028.0, 970.0, 575.0, 322.0, 219.0, 116.0, 75.0, 47.0, 36.0, 25.0, 25.0, 12.0, 11.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.3828125, -10.040283203125, -9.69775390625, -9.355224609375, -9.0126953125, -8.670166015625, -8.32763671875, -7.985107421875, -7.642578125, -7.300048828125, -6.95751953125, -6.614990234375, -6.2724609375, -5.929931640625, -5.58740234375, -5.244873046875, -4.90234375, -4.559814453125, -4.21728515625, -3.874755859375, -3.5322265625, -3.189697265625, -2.84716796875, -2.504638671875, -2.162109375, -1.819580078125, -1.47705078125, -1.134521484375, -0.7919921875, -0.449462890625, -0.10693359375, 0.235595703125, 0.578125, 0.920654296875, 1.26318359375, 1.605712890625, 1.9482421875, 2.290771484375, 2.63330078125, 2.975830078125, 3.318359375, 3.660888671875, 4.00341796875, 4.345947265625, 4.6884765625, 5.031005859375, 5.37353515625, 5.716064453125, 6.05859375, 6.401123046875, 6.74365234375, 7.086181640625, 7.4287109375, 7.771240234375, 8.11376953125, 8.456298828125, 8.798828125, 9.141357421875, 9.48388671875, 9.826416015625, 10.1689453125, 10.511474609375, 10.85400390625, 11.196533203125, 11.5390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 10.0, 6.0, 12.0, 11.0, 6.0, 10.0, 12.0, 10.0, 21.0, 15.0, 27.0, 27.0, 25.0, 30.0, 41.0, 35.0, 31.0, 36.0, 34.0, 38.0, 40.0, 51.0, 36.0, 45.0, 38.0, 35.0, 32.0, 35.0, 33.0, 31.0, 31.0, 27.0, 18.0, 21.0, 20.0, 8.0, 15.0, 7.0, 8.0, 6.0, 6.0, 6.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0], "bins": [-20.359375, -19.761474609375, -19.16357421875, -18.565673828125, -17.9677734375, -17.369873046875, -16.77197265625, -16.174072265625, -15.576171875, -14.978271484375, -14.38037109375, -13.782470703125, -13.1845703125, -12.586669921875, -11.98876953125, -11.390869140625, -10.79296875, -10.195068359375, -9.59716796875, -8.999267578125, -8.4013671875, -7.803466796875, -7.20556640625, -6.607666015625, -6.009765625, -5.411865234375, -4.81396484375, -4.216064453125, -3.6181640625, -3.020263671875, -2.42236328125, -1.824462890625, -1.2265625, -0.628662109375, -0.03076171875, 0.567138671875, 1.1650390625, 1.762939453125, 2.36083984375, 2.958740234375, 3.556640625, 4.154541015625, 4.75244140625, 5.350341796875, 5.9482421875, 6.546142578125, 7.14404296875, 7.741943359375, 8.33984375, 8.937744140625, 9.53564453125, 10.133544921875, 10.7314453125, 11.329345703125, 11.92724609375, 12.525146484375, 13.123046875, 13.720947265625, 14.31884765625, 14.916748046875, 15.5146484375, 16.112548828125, 16.71044921875, 17.308349609375, 17.90625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 8.0, 6.0, 10.0, 19.0, 27.0, 25.0, 44.0, 70.0, 124.0, 193.0, 305.0, 465.0, 848.0, 1408.0, 2835.0, 5667.0, 13717.0, 51693.0, 338792.0, 512880.0, 85694.0, 19174.0, 6888.0, 3375.0, 1787.0, 1003.0, 546.0, 347.0, 198.0, 125.0, 101.0, 62.0, 38.0, 17.0, 17.0, 15.0, 5.0, 10.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.546875, -3.4429931640625, -3.339111328125, -3.2352294921875, -3.13134765625, -3.0274658203125, -2.923583984375, -2.8197021484375, -2.7158203125, -2.6119384765625, -2.508056640625, -2.4041748046875, -2.30029296875, -2.1964111328125, -2.092529296875, -1.9886474609375, -1.884765625, -1.7808837890625, -1.677001953125, -1.5731201171875, -1.46923828125, -1.3653564453125, -1.261474609375, -1.1575927734375, -1.0537109375, -0.9498291015625, -0.845947265625, -0.7420654296875, -0.63818359375, -0.5343017578125, -0.430419921875, -0.3265380859375, -0.22265625, -0.1187744140625, -0.014892578125, 0.0889892578125, 0.19287109375, 0.2967529296875, 0.400634765625, 0.5045166015625, 0.6083984375, 0.7122802734375, 0.816162109375, 0.9200439453125, 1.02392578125, 1.1278076171875, 1.231689453125, 1.3355712890625, 1.439453125, 1.5433349609375, 1.647216796875, 1.7510986328125, 1.85498046875, 1.9588623046875, 2.062744140625, 2.1666259765625, 2.2705078125, 2.3743896484375, 2.478271484375, 2.5821533203125, 2.68603515625, 2.7899169921875, 2.893798828125, 2.9976806640625, 3.1015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 8.0, 10.0, 8.0, 11.0, 22.0, 26.0, 36.0, 60.0, 73.0, 136.0, 150.0, 133.0, 95.0, 75.0, 40.0, 33.0, 19.0, 7.0, 12.0, 9.0, 7.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002574920654296875, -0.00024781376123428345, -0.0002381354570388794, -0.00022845715284347534, -0.0002187788486480713, -0.00020910054445266724, -0.00019942224025726318, -0.00018974393606185913, -0.00018006563186645508, -0.00017038732767105103, -0.00016070902347564697, -0.00015103071928024292, -0.00014135241508483887, -0.00013167411088943481, -0.00012199580669403076, -0.00011231750249862671, -0.00010263919830322266, -9.29608941078186e-05, -8.328258991241455e-05, -7.36042857170105e-05, -6.392598152160645e-05, -5.424767732620239e-05, -4.456937313079834e-05, -3.489106893539429e-05, -2.5212764739990234e-05, -1.553446054458618e-05, -5.856156349182129e-06, 3.822147846221924e-06, 1.3500452041625977e-05, 2.317875623703003e-05, 3.285706043243408e-05, 4.2535364627838135e-05, 5.221366882324219e-05, 6.189197301864624e-05, 7.157027721405029e-05, 8.124858140945435e-05, 9.09268856048584e-05, 0.00010060518980026245, 0.0001102834939956665, 0.00011996179819107056, 0.0001296401023864746, 0.00013931840658187866, 0.00014899671077728271, 0.00015867501497268677, 0.00016835331916809082, 0.00017803162336349487, 0.00018770992755889893, 0.00019738823175430298, 0.00020706653594970703, 0.00021674484014511108, 0.00022642314434051514, 0.0002361014485359192, 0.00024577975273132324, 0.0002554580569267273, 0.00026513636112213135, 0.0002748146653175354, 0.00028449296951293945, 0.0002941712737083435, 0.00030384957790374756, 0.0003135278820991516, 0.00032320618629455566, 0.0003328844904899597, 0.00034256279468536377, 0.0003522410988807678, 0.0003619194030761719]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 9.0, 4.0, 7.0, 11.0, 17.0, 19.0, 34.0, 42.0, 66.0, 88.0, 117.0, 179.0, 293.0, 392.0, 591.0, 821.0, 1167.0, 1704.0, 2362.0, 3590.0, 5568.0, 8775.0, 15396.0, 29841.0, 65587.0, 153390.0, 295032.0, 245668.0, 112141.0, 48242.0, 23104.0, 12235.0, 7441.0, 4734.0, 3101.0, 2028.0, 1477.0, 982.0, 655.0, 484.0, 350.0, 245.0, 188.0, 109.0, 81.0, 62.0, 39.0, 29.0, 22.0, 19.0, 4.0, 3.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-2.6875, -2.60028076171875, -2.5130615234375, -2.42584228515625, -2.338623046875, -2.25140380859375, -2.1641845703125, -2.07696533203125, -1.98974609375, -1.90252685546875, -1.8153076171875, -1.72808837890625, -1.640869140625, -1.55364990234375, -1.4664306640625, -1.37921142578125, -1.2919921875, -1.20477294921875, -1.1175537109375, -1.03033447265625, -0.943115234375, -0.85589599609375, -0.7686767578125, -0.68145751953125, -0.59423828125, -0.50701904296875, -0.4197998046875, -0.33258056640625, -0.245361328125, -0.15814208984375, -0.0709228515625, 0.01629638671875, 0.103515625, 0.19073486328125, 0.2779541015625, 0.36517333984375, 0.452392578125, 0.53961181640625, 0.6268310546875, 0.71405029296875, 0.80126953125, 0.88848876953125, 0.9757080078125, 1.06292724609375, 1.150146484375, 1.23736572265625, 1.3245849609375, 1.41180419921875, 1.4990234375, 1.58624267578125, 1.6734619140625, 1.76068115234375, 1.847900390625, 1.93511962890625, 2.0223388671875, 2.10955810546875, 2.19677734375, 2.28399658203125, 2.3712158203125, 2.45843505859375, 2.545654296875, 2.63287353515625, 2.7200927734375, 2.80731201171875, 2.89453125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 11.0, 14.0, 11.0, 23.0, 27.0, 40.0, 63.0, 93.0, 107.0, 135.0, 125.0, 86.0, 58.0, 40.0, 28.0, 18.0, 20.0, 16.0, 9.0, 11.0, 9.0, 1.0, 4.0, 8.0, 3.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0], "bins": [-1.3076171875, -1.2754058837890625, -1.243194580078125, -1.2109832763671875, -1.17877197265625, -1.1465606689453125, -1.114349365234375, -1.0821380615234375, -1.0499267578125, -1.0177154541015625, -0.985504150390625, -0.9532928466796875, -0.92108154296875, -0.8888702392578125, -0.856658935546875, -0.8244476318359375, -0.792236328125, -0.7600250244140625, -0.727813720703125, -0.6956024169921875, -0.66339111328125, -0.6311798095703125, -0.598968505859375, -0.5667572021484375, -0.5345458984375, -0.5023345947265625, -0.470123291015625, -0.4379119873046875, -0.40570068359375, -0.3734893798828125, -0.341278076171875, -0.3090667724609375, -0.27685546875, -0.2446441650390625, -0.212432861328125, -0.1802215576171875, -0.14801025390625, -0.1157989501953125, -0.083587646484375, -0.0513763427734375, -0.0191650390625, 0.0130462646484375, 0.045257568359375, 0.0774688720703125, 0.10968017578125, 0.1418914794921875, 0.174102783203125, 0.2063140869140625, 0.238525390625, 0.2707366943359375, 0.302947998046875, 0.3351593017578125, 0.36737060546875, 0.3995819091796875, 0.431793212890625, 0.4640045166015625, 0.4962158203125, 0.5284271240234375, 0.560638427734375, 0.5928497314453125, 0.62506103515625, 0.6572723388671875, 0.689483642578125, 0.7216949462890625, 0.75390625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 5.0, 0.0, 2.0, 4.0, 5.0, 11.0, 9.0, 8.0, 8.0, 14.0, 18.0, 19.0, 21.0, 21.0, 18.0, 17.0, 21.0, 27.0, 35.0, 36.0, 35.0, 32.0, 52.0, 37.0, 36.0, 38.0, 44.0, 42.0, 47.0, 45.0, 45.0, 32.0, 29.0, 22.0, 31.0, 28.0, 26.0, 16.0, 19.0, 14.0, 11.0, 8.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.170150756835938, -22.39649200439453, -21.622833251953125, -20.84917640686035, -20.075517654418945, -19.30185890197754, -18.528202056884766, -17.75454330444336, -16.980884552001953, -16.207225799560547, -15.433568000793457, -14.659910202026367, -13.886251449584961, -13.112592697143555, -12.338934898376465, -11.565277099609375, -10.791618347167969, -10.017959594726562, -9.244301795959473, -8.470643997192383, -7.696985244750977, -6.9233269691467285, -6.1496686935424805, -5.376010417938232, -4.602352142333984, -3.8286938667297363, -3.0550355911254883, -2.2813773155212402, -1.5077190399169922, -0.7340607643127441, 0.039597511291503906, 0.813255786895752, 1.5869140625, 2.360572338104248, 3.134230613708496, 3.907888889312744, 4.681547164916992, 5.45520544052124, 6.228863716125488, 7.002521991729736, 7.776180267333984, 8.54983901977539, 9.32349681854248, 10.09715461730957, 10.870813369750977, 11.644472122192383, 12.418129920959473, 13.191787719726562, 13.965446472167969, 14.739105224609375, 15.512763023376465, 16.286420822143555, 17.06007957458496, 17.833738327026367, 18.60739517211914, 19.381053924560547, 20.154712677001953, 20.92837142944336, 21.702030181884766, 22.47568702697754, 23.249345779418945, 24.02300453186035, 24.796661376953125, 25.57032012939453, 26.343978881835938]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 7.0, 6.0, 10.0, 6.0, 10.0, 9.0, 10.0, 11.0, 18.0, 15.0, 29.0, 29.0, 27.0, 27.0, 41.0, 43.0, 35.0, 44.0, 56.0, 36.0, 37.0, 26.0, 49.0, 34.0, 38.0, 36.0, 31.0, 37.0, 33.0, 31.0, 28.0, 24.0, 19.0, 13.0, 12.0, 10.0, 16.0, 11.0, 11.0, 9.0, 10.0, 4.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-26.323423385620117, -25.48480987548828, -24.646196365356445, -23.80758285522461, -22.96896743774414, -22.130353927612305, -21.29174041748047, -20.453126907348633, -19.614513397216797, -18.77589988708496, -17.937286376953125, -17.098670959472656, -16.26005744934082, -15.421443939208984, -14.582830429077148, -13.744216918945312, -12.90560245513916, -12.066988945007324, -11.228374481201172, -10.389760971069336, -9.5511474609375, -8.712533950805664, -7.873919486999512, -7.035305976867676, -6.196691989898682, -5.3580780029296875, -4.519464492797852, -3.6808505058288574, -2.8422367572784424, -2.0036230087280273, -1.1650090217590332, -0.32639551162719727, 0.5122184753417969, 1.350832223892212, 2.189445972442627, 3.028059959411621, 3.866673707962036, 4.705287456512451, 5.543901443481445, 6.382514953613281, 7.221128940582275, 8.05974292755127, 8.898356437683105, 9.736970901489258, 10.575584411621094, 11.41419792175293, 12.252811431884766, 13.091424942016602, 13.930039405822754, 14.76865291595459, 15.607267379760742, 16.445880889892578, 17.284494400024414, 18.12310791015625, 18.96172332763672, 19.800334930419922, 20.63895034790039, 21.477563858032227, 22.316177368164062, 23.15479278564453, 23.993406295776367, 24.832019805908203, 25.67063331604004, 26.509246826171875, 27.34786033630371]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 9.0, 11.0, 18.0, 22.0, 43.0, 52.0, 74.0, 114.0, 211.0, 318.0, 475.0, 694.0, 1094.0, 1660.0, 2479.0, 3840.0, 5552.0, 8185.0, 11709.0, 16416.0, 22579.0, 30039.0, 39612.0, 50140.0, 61567.0, 71153.0, 80544.0, 85198.0, 86911.0, 84316.0, 77517.0, 68546.0, 57623.0, 47354.0, 36789.0, 27675.0, 20315.0, 14864.0, 10593.0, 7371.0, 4904.0, 3450.0, 2308.0, 1410.0, 1025.0, 638.0, 435.0, 236.0, 177.0, 109.0, 58.0, 51.0, 23.0, 20.0, 24.0, 8.0, 3.0, 5.0, 1.0, 2.0], "bins": [-14.7890625, -14.3319091796875, -13.874755859375, -13.4176025390625, -12.96044921875, -12.5032958984375, -12.046142578125, -11.5889892578125, -11.1318359375, -10.6746826171875, -10.217529296875, -9.7603759765625, -9.30322265625, -8.8460693359375, -8.388916015625, -7.9317626953125, -7.474609375, -7.0174560546875, -6.560302734375, -6.1031494140625, -5.64599609375, -5.1888427734375, -4.731689453125, -4.2745361328125, -3.8173828125, -3.3602294921875, -2.903076171875, -2.4459228515625, -1.98876953125, -1.5316162109375, -1.074462890625, -0.6173095703125, -0.16015625, 0.2969970703125, 0.754150390625, 1.2113037109375, 1.66845703125, 2.1256103515625, 2.582763671875, 3.0399169921875, 3.4970703125, 3.9542236328125, 4.411376953125, 4.8685302734375, 5.32568359375, 5.7828369140625, 6.239990234375, 6.6971435546875, 7.154296875, 7.6114501953125, 8.068603515625, 8.5257568359375, 8.98291015625, 9.4400634765625, 9.897216796875, 10.3543701171875, 10.8115234375, 11.2686767578125, 11.725830078125, 12.1829833984375, 12.64013671875, 13.0972900390625, 13.554443359375, 14.0115966796875, 14.46875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 3.0, 2.0, 10.0, 7.0, 7.0, 12.0, 11.0, 7.0, 18.0, 21.0, 22.0, 33.0, 31.0, 21.0, 38.0, 34.0, 45.0, 36.0, 41.0, 37.0, 44.0, 39.0, 45.0, 40.0, 33.0, 34.0, 33.0, 26.0, 30.0, 35.0, 29.0, 23.0, 20.0, 22.0, 20.0, 21.0, 6.0, 13.0, 14.0, 5.0, 13.0, 7.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.609375, -25.748291015625, -24.88720703125, -24.026123046875, -23.1650390625, -22.303955078125, -21.44287109375, -20.581787109375, -19.720703125, -18.859619140625, -17.99853515625, -17.137451171875, -16.2763671875, -15.415283203125, -14.55419921875, -13.693115234375, -12.83203125, -11.970947265625, -11.10986328125, -10.248779296875, -9.3876953125, -8.526611328125, -7.66552734375, -6.804443359375, -5.943359375, -5.082275390625, -4.22119140625, -3.360107421875, -2.4990234375, -1.637939453125, -0.77685546875, 0.084228515625, 0.9453125, 1.806396484375, 2.66748046875, 3.528564453125, 4.3896484375, 5.250732421875, 6.11181640625, 6.972900390625, 7.833984375, 8.695068359375, 9.55615234375, 10.417236328125, 11.2783203125, 12.139404296875, 13.00048828125, 13.861572265625, 14.72265625, 15.583740234375, 16.44482421875, 17.305908203125, 18.1669921875, 19.028076171875, 19.88916015625, 20.750244140625, 21.611328125, 22.472412109375, 23.33349609375, 24.194580078125, 25.0556640625, 25.916748046875, 26.77783203125, 27.638916015625, 28.5]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 7.0, 24.0, 29.0, 34.0, 61.0, 107.0, 162.0, 235.0, 433.0, 643.0, 978.0, 1659.0, 2520.0, 3748.0, 5635.0, 8370.0, 12309.0, 17531.0, 24684.0, 34007.0, 44932.0, 57390.0, 70304.0, 82045.0, 90693.0, 94507.0, 93042.0, 85888.0, 75195.0, 62454.0, 49902.0, 37954.0, 28192.0, 20194.0, 13992.0, 9848.0, 6513.0, 4350.0, 2912.0, 1792.0, 1189.0, 762.0, 510.0, 306.0, 193.0, 119.0, 78.0, 52.0, 28.0, 13.0, 18.0, 5.0, 6.0, 3.0, 2.0, 3.0], "bins": [-16.796875, -16.29833984375, -15.7998046875, -15.30126953125, -14.802734375, -14.30419921875, -13.8056640625, -13.30712890625, -12.80859375, -12.31005859375, -11.8115234375, -11.31298828125, -10.814453125, -10.31591796875, -9.8173828125, -9.31884765625, -8.8203125, -8.32177734375, -7.8232421875, -7.32470703125, -6.826171875, -6.32763671875, -5.8291015625, -5.33056640625, -4.83203125, -4.33349609375, -3.8349609375, -3.33642578125, -2.837890625, -2.33935546875, -1.8408203125, -1.34228515625, -0.84375, -0.34521484375, 0.1533203125, 0.65185546875, 1.150390625, 1.64892578125, 2.1474609375, 2.64599609375, 3.14453125, 3.64306640625, 4.1416015625, 4.64013671875, 5.138671875, 5.63720703125, 6.1357421875, 6.63427734375, 7.1328125, 7.63134765625, 8.1298828125, 8.62841796875, 9.126953125, 9.62548828125, 10.1240234375, 10.62255859375, 11.12109375, 11.61962890625, 12.1181640625, 12.61669921875, 13.115234375, 13.61376953125, 14.1123046875, 14.61083984375, 15.109375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 4.0, 11.0, 16.0, 18.0, 14.0, 17.0, 21.0, 27.0, 32.0, 23.0, 38.0, 33.0, 43.0, 50.0, 43.0, 50.0, 53.0, 47.0, 37.0, 46.0, 51.0, 37.0, 33.0, 44.0, 32.0, 26.0, 19.0, 23.0, 16.0, 20.0, 11.0, 11.0, 12.0, 9.0, 8.0, 7.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.828125, -16.2333984375, -15.638671875, -15.0439453125, -14.44921875, -13.8544921875, -13.259765625, -12.6650390625, -12.0703125, -11.4755859375, -10.880859375, -10.2861328125, -9.69140625, -9.0966796875, -8.501953125, -7.9072265625, -7.3125, -6.7177734375, -6.123046875, -5.5283203125, -4.93359375, -4.3388671875, -3.744140625, -3.1494140625, -2.5546875, -1.9599609375, -1.365234375, -0.7705078125, -0.17578125, 0.4189453125, 1.013671875, 1.6083984375, 2.203125, 2.7978515625, 3.392578125, 3.9873046875, 4.58203125, 5.1767578125, 5.771484375, 6.3662109375, 6.9609375, 7.5556640625, 8.150390625, 8.7451171875, 9.33984375, 9.9345703125, 10.529296875, 11.1240234375, 11.71875, 12.3134765625, 12.908203125, 13.5029296875, 14.09765625, 14.6923828125, 15.287109375, 15.8818359375, 16.4765625, 17.0712890625, 17.666015625, 18.2607421875, 18.85546875, 19.4501953125, 20.044921875, 20.6396484375, 21.234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 3.0, 3.0, 10.0, 15.0, 15.0, 22.0, 33.0, 39.0, 77.0, 92.0, 117.0, 157.0, 328.0, 455.0, 706.0, 1130.0, 1958.0, 3224.0, 5505.0, 9320.0, 16143.0, 26698.0, 42698.0, 63365.0, 87416.0, 111532.0, 126647.0, 129697.0, 118967.0, 97992.0, 72434.0, 50606.0, 32316.0, 20025.0, 11630.0, 6915.0, 4009.0, 2378.0, 1439.0, 825.0, 563.0, 350.0, 225.0, 145.0, 104.0, 66.0, 56.0, 28.0, 32.0, 16.0, 16.0, 10.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.21875, -6.979736328125, -6.74072265625, -6.501708984375, -6.2626953125, -6.023681640625, -5.78466796875, -5.545654296875, -5.306640625, -5.067626953125, -4.82861328125, -4.589599609375, -4.3505859375, -4.111572265625, -3.87255859375, -3.633544921875, -3.39453125, -3.155517578125, -2.91650390625, -2.677490234375, -2.4384765625, -2.199462890625, -1.96044921875, -1.721435546875, -1.482421875, -1.243408203125, -1.00439453125, -0.765380859375, -0.5263671875, -0.287353515625, -0.04833984375, 0.190673828125, 0.4296875, 0.668701171875, 0.90771484375, 1.146728515625, 1.3857421875, 1.624755859375, 1.86376953125, 2.102783203125, 2.341796875, 2.580810546875, 2.81982421875, 3.058837890625, 3.2978515625, 3.536865234375, 3.77587890625, 4.014892578125, 4.25390625, 4.492919921875, 4.73193359375, 4.970947265625, 5.2099609375, 5.448974609375, 5.68798828125, 5.927001953125, 6.166015625, 6.405029296875, 6.64404296875, 6.883056640625, 7.1220703125, 7.361083984375, 7.60009765625, 7.839111328125, 8.078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 10.0, 4.0, 10.0, 6.0, 17.0, 21.0, 26.0, 17.0, 27.0, 29.0, 35.0, 41.0, 48.0, 57.0, 54.0, 60.0, 61.0, 62.0, 58.0, 54.0, 40.0, 42.0, 46.0, 36.0, 26.0, 21.0, 17.0, 22.0, 8.0, 10.0, 14.0, 6.0, 5.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009469985961914062, -0.0009180232882499695, -0.0008890479803085327, -0.000860072672367096, -0.0008310973644256592, -0.0008021220564842224, -0.0007731467485427856, -0.0007441714406013489, -0.0007151961326599121, -0.0006862208247184753, -0.0006572455167770386, -0.0006282702088356018, -0.000599294900894165, -0.0005703195929527283, -0.0005413442850112915, -0.0005123689770698547, -0.00048339366912841797, -0.0004544183611869812, -0.00042544305324554443, -0.00039646774530410767, -0.0003674924373626709, -0.00033851712942123413, -0.00030954182147979736, -0.0002805665135383606, -0.00025159120559692383, -0.00022261589765548706, -0.0001936405897140503, -0.00016466528177261353, -0.00013568997383117676, -0.00010671466588973999, -7.773935794830322e-05, -4.8764050006866455e-05, -1.9788742065429688e-05, 9.18656587600708e-06, 3.816187381744385e-05, 6.713718175888062e-05, 9.611248970031738e-05, 0.00012508779764175415, 0.00015406310558319092, 0.00018303841352462769, 0.00021201372146606445, 0.00024098902940750122, 0.000269964337348938, 0.00029893964529037476, 0.0003279149532318115, 0.0003568902611732483, 0.00038586556911468506, 0.0004148408770561218, 0.0004438161849975586, 0.00047279149293899536, 0.0005017668008804321, 0.0005307421088218689, 0.0005597174167633057, 0.0005886927247047424, 0.0006176680326461792, 0.000646643340587616, 0.0006756186485290527, 0.0007045939564704895, 0.0007335692644119263, 0.000762544572353363, 0.0007915198802947998, 0.0008204951882362366, 0.0008494704961776733, 0.0008784458041191101, 0.0009074211120605469]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 7.0, 6.0, 15.0, 16.0, 17.0, 30.0, 76.0, 105.0, 178.0, 270.0, 461.0, 779.0, 1288.0, 2117.0, 3473.0, 5976.0, 9910.0, 15992.0, 26044.0, 40053.0, 59788.0, 82605.0, 105724.0, 122966.0, 127973.0, 118658.0, 99194.0, 76337.0, 53859.0, 35706.0, 22914.0, 14266.0, 8595.0, 5254.0, 3122.0, 1925.0, 1090.0, 685.0, 422.0, 273.0, 143.0, 101.0, 53.0, 40.0, 27.0, 10.0, 7.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.96484375, -7.71875, -7.47265625, -7.2265625, -6.98046875, -6.734375, -6.48828125, -6.2421875, -5.99609375, -5.75, -5.50390625, -5.2578125, -5.01171875, -4.765625, -4.51953125, -4.2734375, -4.02734375, -3.78125, -3.53515625, -3.2890625, -3.04296875, -2.796875, -2.55078125, -2.3046875, -2.05859375, -1.8125, -1.56640625, -1.3203125, -1.07421875, -0.828125, -0.58203125, -0.3359375, -0.08984375, 0.15625, 0.40234375, 0.6484375, 0.89453125, 1.140625, 1.38671875, 1.6328125, 1.87890625, 2.125, 2.37109375, 2.6171875, 2.86328125, 3.109375, 3.35546875, 3.6015625, 3.84765625, 4.09375, 4.33984375, 4.5859375, 4.83203125, 5.078125, 5.32421875, 5.5703125, 5.81640625, 6.0625, 6.30859375, 6.5546875, 6.80078125, 7.046875, 7.29296875, 7.5390625, 7.78515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 7.0, 14.0, 13.0, 13.0, 13.0, 19.0, 22.0, 30.0, 35.0, 47.0, 42.0, 74.0, 57.0, 51.0, 51.0, 75.0, 68.0, 44.0, 56.0, 34.0, 31.0, 34.0, 37.0, 35.0, 19.0, 16.0, 14.0, 15.0, 11.0, 3.0, 5.0, 4.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.314453125, -3.195648193359375, -3.07684326171875, -2.958038330078125, -2.8392333984375, -2.720428466796875, -2.60162353515625, -2.482818603515625, -2.364013671875, -2.245208740234375, -2.12640380859375, -2.007598876953125, -1.8887939453125, -1.769989013671875, -1.65118408203125, -1.532379150390625, -1.41357421875, -1.294769287109375, -1.17596435546875, -1.057159423828125, -0.9383544921875, -0.819549560546875, -0.70074462890625, -0.581939697265625, -0.463134765625, -0.344329833984375, -0.22552490234375, -0.106719970703125, 0.0120849609375, 0.130889892578125, 0.24969482421875, 0.368499755859375, 0.4873046875, 0.606109619140625, 0.72491455078125, 0.843719482421875, 0.9625244140625, 1.081329345703125, 1.20013427734375, 1.318939208984375, 1.437744140625, 1.556549072265625, 1.67535400390625, 1.794158935546875, 1.9129638671875, 2.031768798828125, 2.15057373046875, 2.269378662109375, 2.38818359375, 2.506988525390625, 2.62579345703125, 2.744598388671875, 2.8634033203125, 2.982208251953125, 3.10101318359375, 3.219818115234375, 3.338623046875, 3.457427978515625, 3.57623291015625, 3.695037841796875, 3.8138427734375, 3.932647705078125, 4.05145263671875, 4.170257568359375, 4.2890625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 10.0, 10.0, 9.0, 14.0, 14.0, 19.0, 18.0, 18.0, 27.0, 23.0, 24.0, 34.0, 31.0, 36.0, 32.0, 42.0, 44.0, 44.0, 48.0, 38.0, 46.0, 56.0, 44.0, 40.0, 44.0, 35.0, 31.0, 27.0, 28.0, 19.0, 24.0, 15.0, 12.0, 10.0, 11.0, 9.0, 2.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.026466369628906, -24.18355941772461, -23.340654373168945, -22.49774742126465, -21.654842376708984, -20.811935424804688, -19.96902847290039, -19.126121520996094, -18.28321647644043, -17.440309524536133, -16.59740447998047, -15.754497528076172, -14.911591529846191, -14.068685531616211, -13.225778579711914, -12.382872581481934, -11.539966583251953, -10.697060585021973, -9.854154586791992, -9.011247634887695, -8.168341636657715, -7.325435638427734, -6.482529163360596, -5.639622688293457, -4.796716690063477, -3.953810453414917, -3.1109042167663574, -2.267997980117798, -1.4250917434692383, -0.5821857452392578, 0.26072072982788086, 1.1036272048950195, 1.9465351104736328, 2.7894413471221924, 3.632347583770752, 4.475254058837891, 5.318160057067871, 6.161066055297852, 7.00397253036499, 7.846879005432129, 8.68978500366211, 9.53269100189209, 10.37559700012207, 11.218503952026367, 12.061409950256348, 12.904315948486328, 13.747222900390625, 14.590128898620605, 15.433034896850586, 16.275941848754883, 17.118846893310547, 17.961753845214844, 18.80466079711914, 19.647565841674805, 20.4904727935791, 21.333377838134766, 22.176284790039062, 23.01919174194336, 23.862096786499023, 24.70500373840332, 25.547908782958984, 26.39081573486328, 27.233722686767578, 28.076629638671875, 28.91953468322754]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 1.0, 3.0, 8.0, 9.0, 2.0, 6.0, 8.0, 12.0, 11.0, 21.0, 15.0, 22.0, 18.0, 21.0, 39.0, 38.0, 37.0, 27.0, 28.0, 35.0, 36.0, 34.0, 39.0, 31.0, 50.0, 45.0, 36.0, 35.0, 31.0, 34.0, 26.0, 24.0, 27.0, 21.0, 27.0, 18.0, 17.0, 14.0, 14.0, 10.0, 14.0, 8.0, 9.0, 11.0, 6.0, 5.0, 6.0, 2.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-24.079917907714844, -23.278287887573242, -22.47665786743164, -21.67502784729004, -20.873397827148438, -20.07176971435547, -19.270139694213867, -18.468509674072266, -17.666879653930664, -16.865249633789062, -16.06361961364746, -15.261990547180176, -14.460360527038574, -13.658730506896973, -12.857101440429688, -12.055471420288086, -11.253841400146484, -10.452211380004883, -9.650581359863281, -8.848952293395996, -8.047322273254395, -7.245692253112793, -6.44406270980835, -5.642433166503906, -4.840803146362305, -4.039173126220703, -3.2375435829162598, -2.4359138011932373, -1.6342840194702148, -0.8326539993286133, -0.031024456024169922, 0.7706050872802734, 1.572235107421875, 2.3738648891448975, 3.17549467086792, 3.9771244525909424, 4.778754234313965, 5.580384254455566, 6.38201379776001, 7.183643341064453, 7.985273361206055, 8.786903381347656, 9.588533401489258, 10.390162467956543, 11.191792488098145, 11.993422508239746, 12.795051574707031, 13.596681594848633, 14.398311614990234, 15.199941635131836, 16.001571655273438, 16.80320167541504, 17.60483169555664, 18.40645980834961, 19.20808982849121, 20.009719848632812, 20.811349868774414, 21.612979888916016, 22.414609909057617, 23.21623992919922, 24.017868041992188, 24.819499969482422, 25.62112808227539, 26.422758102416992, 27.224388122558594]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 15.0, 11.0, 19.0, 49.0, 87.0, 151.0, 261.0, 558.0, 853.0, 1459.0, 2455.0, 4219.0, 6808.0, 11619.0, 18463.0, 29620.0, 45870.0, 69602.0, 102628.0, 146208.0, 199866.0, 261583.0, 323799.0, 375414.0, 410932.0, 415791.0, 393196.0, 346669.0, 286609.0, 223445.0, 165663.0, 118044.0, 81390.0, 54492.0, 35954.0, 22746.0, 14524.0, 8930.0, 5569.0, 3479.0, 2083.0, 1288.0, 786.0, 456.0, 246.0, 145.0, 94.0, 60.0, 42.0, 18.0, 13.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 3.0], "bins": [-17.875, -17.302490234375, -16.72998046875, -16.157470703125, -15.5849609375, -15.012451171875, -14.43994140625, -13.867431640625, -13.294921875, -12.722412109375, -12.14990234375, -11.577392578125, -11.0048828125, -10.432373046875, -9.85986328125, -9.287353515625, -8.71484375, -8.142333984375, -7.56982421875, -6.997314453125, -6.4248046875, -5.852294921875, -5.27978515625, -4.707275390625, -4.134765625, -3.562255859375, -2.98974609375, -2.417236328125, -1.8447265625, -1.272216796875, -0.69970703125, -0.127197265625, 0.4453125, 1.017822265625, 1.59033203125, 2.162841796875, 2.7353515625, 3.307861328125, 3.88037109375, 4.452880859375, 5.025390625, 5.597900390625, 6.17041015625, 6.742919921875, 7.3154296875, 7.887939453125, 8.46044921875, 9.032958984375, 9.60546875, 10.177978515625, 10.75048828125, 11.322998046875, 11.8955078125, 12.468017578125, 13.04052734375, 13.613037109375, 14.185546875, 14.758056640625, 15.33056640625, 15.903076171875, 16.4755859375, 17.048095703125, 17.62060546875, 18.193115234375, 18.765625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 8.0, 11.0, 9.0, 12.0, 17.0, 18.0, 27.0, 20.0, 21.0, 21.0, 28.0, 28.0, 37.0, 31.0, 40.0, 31.0, 33.0, 42.0, 31.0, 45.0, 38.0, 38.0, 35.0, 34.0, 31.0, 30.0, 23.0, 18.0, 25.0, 21.0, 27.0, 19.0, 28.0, 20.0, 12.0, 10.0, 12.0, 10.0, 8.0, 10.0, 4.0, 3.0, 6.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0], "bins": [-19.4375, -18.802978515625, -18.16845703125, -17.533935546875, -16.8994140625, -16.264892578125, -15.63037109375, -14.995849609375, -14.361328125, -13.726806640625, -13.09228515625, -12.457763671875, -11.8232421875, -11.188720703125, -10.55419921875, -9.919677734375, -9.28515625, -8.650634765625, -8.01611328125, -7.381591796875, -6.7470703125, -6.112548828125, -5.47802734375, -4.843505859375, -4.208984375, -3.574462890625, -2.93994140625, -2.305419921875, -1.6708984375, -1.036376953125, -0.40185546875, 0.232666015625, 0.8671875, 1.501708984375, 2.13623046875, 2.770751953125, 3.4052734375, 4.039794921875, 4.67431640625, 5.308837890625, 5.943359375, 6.577880859375, 7.21240234375, 7.846923828125, 8.4814453125, 9.115966796875, 9.75048828125, 10.385009765625, 11.01953125, 11.654052734375, 12.28857421875, 12.923095703125, 13.5576171875, 14.192138671875, 14.82666015625, 15.461181640625, 16.095703125, 16.730224609375, 17.36474609375, 17.999267578125, 18.6337890625, 19.268310546875, 19.90283203125, 20.537353515625, 21.171875]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 11.0, 22.0, 28.0, 71.0, 121.0, 163.0, 302.0, 528.0, 962.0, 1598.0, 2725.0, 4555.0, 7244.0, 11673.0, 18836.0, 29233.0, 43836.0, 65638.0, 93710.0, 129577.0, 173174.0, 221807.0, 270559.0, 316738.0, 351335.0, 369940.0, 369272.0, 347899.0, 312081.0, 267355.0, 216958.0, 168628.0, 126759.0, 91230.0, 62903.0, 42591.0, 27752.0, 18077.0, 11193.0, 7027.0, 4246.0, 2515.0, 1407.0, 840.0, 493.0, 281.0, 188.0, 88.0, 46.0, 35.0, 13.0, 15.0, 4.0, 1.0, 2.0, 2.0, 4.0], "bins": [-18.375, -17.8173828125, -17.259765625, -16.7021484375, -16.14453125, -15.5869140625, -15.029296875, -14.4716796875, -13.9140625, -13.3564453125, -12.798828125, -12.2412109375, -11.68359375, -11.1259765625, -10.568359375, -10.0107421875, -9.453125, -8.8955078125, -8.337890625, -7.7802734375, -7.22265625, -6.6650390625, -6.107421875, -5.5498046875, -4.9921875, -4.4345703125, -3.876953125, -3.3193359375, -2.76171875, -2.2041015625, -1.646484375, -1.0888671875, -0.53125, 0.0263671875, 0.583984375, 1.1416015625, 1.69921875, 2.2568359375, 2.814453125, 3.3720703125, 3.9296875, 4.4873046875, 5.044921875, 5.6025390625, 6.16015625, 6.7177734375, 7.275390625, 7.8330078125, 8.390625, 8.9482421875, 9.505859375, 10.0634765625, 10.62109375, 11.1787109375, 11.736328125, 12.2939453125, 12.8515625, 13.4091796875, 13.966796875, 14.5244140625, 15.08203125, 15.6396484375, 16.197265625, 16.7548828125, 17.3125]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 8.0, 11.0, 12.0, 23.0, 27.0, 25.0, 48.0, 54.0, 62.0, 70.0, 75.0, 85.0, 104.0, 139.0, 137.0, 161.0, 175.0, 182.0, 183.0, 204.0, 228.0, 221.0, 209.0, 204.0, 187.0, 163.0, 161.0, 144.0, 139.0, 118.0, 102.0, 91.0, 63.0, 53.0, 44.0, 37.0, 36.0, 26.0, 16.0, 10.0, 12.0, 9.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6171875, -11.2637939453125, -10.910400390625, -10.5570068359375, -10.20361328125, -9.8502197265625, -9.496826171875, -9.1434326171875, -8.7900390625, -8.4366455078125, -8.083251953125, -7.7298583984375, -7.37646484375, -7.0230712890625, -6.669677734375, -6.3162841796875, -5.962890625, -5.6094970703125, -5.256103515625, -4.9027099609375, -4.54931640625, -4.1959228515625, -3.842529296875, -3.4891357421875, -3.1357421875, -2.7823486328125, -2.428955078125, -2.0755615234375, -1.72216796875, -1.3687744140625, -1.015380859375, -0.6619873046875, -0.30859375, 0.0447998046875, 0.398193359375, 0.7515869140625, 1.10498046875, 1.4583740234375, 1.811767578125, 2.1651611328125, 2.5185546875, 2.8719482421875, 3.225341796875, 3.5787353515625, 3.93212890625, 4.2855224609375, 4.638916015625, 4.9923095703125, 5.345703125, 5.6990966796875, 6.052490234375, 6.4058837890625, 6.75927734375, 7.1126708984375, 7.466064453125, 7.8194580078125, 8.1728515625, 8.5262451171875, 8.879638671875, 9.2330322265625, 9.58642578125, 9.9398193359375, 10.293212890625, 10.6466064453125, 11.0]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 4.0, 11.0, 9.0, 14.0, 11.0, 9.0, 14.0, 17.0, 18.0, 26.0, 22.0, 30.0, 19.0, 31.0, 44.0, 27.0, 41.0, 42.0, 34.0, 43.0, 39.0, 34.0, 37.0, 47.0, 33.0, 37.0, 41.0, 29.0, 28.0, 29.0, 28.0, 24.0, 27.0, 21.0, 19.0, 7.0, 11.0, 7.0, 9.0, 7.0, 6.0, 1.0, 6.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-24.317245483398438, -23.54956817626953, -22.781890869140625, -22.014211654663086, -21.24653434753418, -20.478857040405273, -19.711177825927734, -18.943500518798828, -18.175823211669922, -17.408145904541016, -16.64046859741211, -15.87278938293457, -15.105112075805664, -14.337434768676758, -13.569756507873535, -12.802078247070312, -12.034400939941406, -11.2667236328125, -10.499045372009277, -9.731367111206055, -8.963689804077148, -8.196012496948242, -7.4283342361450195, -6.660656452178955, -5.892978668212891, -5.125300884246826, -4.357623100280762, -3.5899453163146973, -2.822267532348633, -2.0545897483825684, -1.286911964416504, -0.5192341804504395, 0.248443603515625, 1.0161213874816895, 1.783799171447754, 2.5514769554138184, 3.319154739379883, 4.086832523345947, 4.854510307312012, 5.622188091278076, 6.389865875244141, 7.157543659210205, 7.9252214431762695, 8.692899703979492, 9.460577011108398, 10.228254318237305, 10.995932579040527, 11.76361083984375, 12.531288146972656, 13.298965454101562, 14.066643714904785, 14.834321975708008, 15.601999282836914, 16.36967658996582, 17.13735580444336, 17.905033111572266, 18.672710418701172, 19.440387725830078, 20.208065032958984, 20.975744247436523, 21.74342155456543, 22.511098861694336, 23.278778076171875, 24.04645538330078, 24.814132690429688]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 7.0, 3.0, 7.0, 13.0, 11.0, 14.0, 18.0, 15.0, 15.0, 19.0, 24.0, 26.0, 20.0, 31.0, 26.0, 32.0, 27.0, 37.0, 35.0, 28.0, 22.0, 40.0, 43.0, 38.0, 35.0, 38.0, 30.0, 40.0, 27.0, 32.0, 36.0, 20.0, 23.0, 27.0, 20.0, 22.0, 14.0, 14.0, 16.0, 8.0, 7.0, 9.0, 3.0, 6.0, 7.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.114910125732422, -19.35466766357422, -18.594425201416016, -17.834184646606445, -17.073942184448242, -16.31369972229004, -15.553458213806152, -14.793216705322266, -14.032974243164062, -13.27273178100586, -12.512490272521973, -11.752248764038086, -10.992006301879883, -10.23176383972168, -9.471522331237793, -8.711280822753906, -7.951038360595703, -7.190796375274658, -6.430554389953613, -5.670312404632568, -4.910070419311523, -4.1498284339904785, -3.3895864486694336, -2.6293444633483887, -1.8691024780273438, -1.1088604927062988, -0.3486185073852539, 0.411623477935791, 1.171865463256836, 1.9321074485778809, 2.692349433898926, 3.4525914192199707, 4.212831497192383, 4.973073482513428, 5.733315467834473, 6.493557453155518, 7.2537994384765625, 8.014041900634766, 8.774283409118652, 9.534524917602539, 10.294767379760742, 11.055009841918945, 11.815251350402832, 12.575492858886719, 13.335735321044922, 14.095977783203125, 14.856219291687012, 15.616460800170898, 16.3767032623291, 17.136945724487305, 17.897186279296875, 18.657428741455078, 19.41767120361328, 20.177913665771484, 20.938156127929688, 21.698396682739258, 22.45863914489746, 23.218881607055664, 23.979122161865234, 24.739364624023438, 25.49960708618164, 26.259849548339844, 27.020092010498047, 27.780332565307617, 28.54057502746582]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 16.0, 22.0, 52.0, 51.0, 87.0, 140.0, 208.0, 325.0, 510.0, 776.0, 1367.0, 2104.0, 3350.0, 5560.0, 8904.0, 15059.0, 24586.0, 38956.0, 61213.0, 90505.0, 125096.0, 149291.0, 147492.0, 123407.0, 89917.0, 60001.0, 38085.0, 23626.0, 14501.0, 9079.0, 5461.0, 3331.0, 1989.0, 1242.0, 788.0, 502.0, 336.0, 202.0, 143.0, 82.0, 61.0, 32.0, 36.0, 22.0, 14.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.15625, -4.0128173828125, -3.869384765625, -3.7259521484375, -3.58251953125, -3.4390869140625, -3.295654296875, -3.1522216796875, -3.0087890625, -2.8653564453125, -2.721923828125, -2.5784912109375, -2.43505859375, -2.2916259765625, -2.148193359375, -2.0047607421875, -1.861328125, -1.7178955078125, -1.574462890625, -1.4310302734375, -1.28759765625, -1.1441650390625, -1.000732421875, -0.8572998046875, -0.7138671875, -0.5704345703125, -0.427001953125, -0.2835693359375, -0.14013671875, 0.0032958984375, 0.146728515625, 0.2901611328125, 0.43359375, 0.5770263671875, 0.720458984375, 0.8638916015625, 1.00732421875, 1.1507568359375, 1.294189453125, 1.4376220703125, 1.5810546875, 1.7244873046875, 1.867919921875, 2.0113525390625, 2.15478515625, 2.2982177734375, 2.441650390625, 2.5850830078125, 2.728515625, 2.8719482421875, 3.015380859375, 3.1588134765625, 3.30224609375, 3.4456787109375, 3.589111328125, 3.7325439453125, 3.8759765625, 4.0194091796875, 4.162841796875, 4.3062744140625, 4.44970703125, 4.5931396484375, 4.736572265625, 4.8800048828125, 5.0234375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 2.0, 5.0, 7.0, 13.0, 10.0, 6.0, 12.0, 11.0, 20.0, 12.0, 18.0, 24.0, 28.0, 16.0, 33.0, 23.0, 34.0, 31.0, 30.0, 34.0, 40.0, 35.0, 45.0, 43.0, 34.0, 44.0, 33.0, 37.0, 31.0, 33.0, 27.0, 36.0, 28.0, 28.0, 11.0, 17.0, 25.0, 18.0, 13.0, 13.0, 6.0, 6.0, 4.0, 8.0, 3.0, 7.0, 7.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.921875, -21.0908203125, -20.259765625, -19.4287109375, -18.59765625, -17.7666015625, -16.935546875, -16.1044921875, -15.2734375, -14.4423828125, -13.611328125, -12.7802734375, -11.94921875, -11.1181640625, -10.287109375, -9.4560546875, -8.625, -7.7939453125, -6.962890625, -6.1318359375, -5.30078125, -4.4697265625, -3.638671875, -2.8076171875, -1.9765625, -1.1455078125, -0.314453125, 0.5166015625, 1.34765625, 2.1787109375, 3.009765625, 3.8408203125, 4.671875, 5.5029296875, 6.333984375, 7.1650390625, 7.99609375, 8.8271484375, 9.658203125, 10.4892578125, 11.3203125, 12.1513671875, 12.982421875, 13.8134765625, 14.64453125, 15.4755859375, 16.306640625, 17.1376953125, 17.96875, 18.7998046875, 19.630859375, 20.4619140625, 21.29296875, 22.1240234375, 22.955078125, 23.7861328125, 24.6171875, 25.4482421875, 26.279296875, 27.1103515625, 27.94140625, 28.7724609375, 29.603515625, 30.4345703125, 31.265625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 11.0, 7.0, 15.0, 23.0, 32.0, 50.0, 96.0, 135.0, 229.0, 361.0, 616.0, 1012.0, 1826.0, 3333.0, 6029.0, 11109.0, 21149.0, 40296.0, 74519.0, 128882.0, 188704.0, 204594.0, 156131.0, 95907.0, 53042.0, 27855.0, 14677.0, 7981.0, 4303.0, 2323.0, 1368.0, 785.0, 444.0, 270.0, 182.0, 95.0, 60.0, 39.0, 19.0, 19.0, 11.0, 6.0, 6.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.49609375, -5.3079833984375, -5.119873046875, -4.9317626953125, -4.74365234375, -4.5555419921875, -4.367431640625, -4.1793212890625, -3.9912109375, -3.8031005859375, -3.614990234375, -3.4268798828125, -3.23876953125, -3.0506591796875, -2.862548828125, -2.6744384765625, -2.486328125, -2.2982177734375, -2.110107421875, -1.9219970703125, -1.73388671875, -1.5457763671875, -1.357666015625, -1.1695556640625, -0.9814453125, -0.7933349609375, -0.605224609375, -0.4171142578125, -0.22900390625, -0.0408935546875, 0.147216796875, 0.3353271484375, 0.5234375, 0.7115478515625, 0.899658203125, 1.0877685546875, 1.27587890625, 1.4639892578125, 1.652099609375, 1.8402099609375, 2.0283203125, 2.2164306640625, 2.404541015625, 2.5926513671875, 2.78076171875, 2.9688720703125, 3.156982421875, 3.3450927734375, 3.533203125, 3.7213134765625, 3.909423828125, 4.0975341796875, 4.28564453125, 4.4737548828125, 4.661865234375, 4.8499755859375, 5.0380859375, 5.2261962890625, 5.414306640625, 5.6024169921875, 5.79052734375, 5.9786376953125, 6.166748046875, 6.3548583984375, 6.54296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 6.0, 10.0, 11.0, 6.0, 16.0, 17.0, 16.0, 26.0, 27.0, 21.0, 25.0, 32.0, 31.0, 36.0, 39.0, 44.0, 25.0, 41.0, 40.0, 43.0, 35.0, 39.0, 44.0, 45.0, 38.0, 35.0, 23.0, 37.0, 23.0, 22.0, 19.0, 15.0, 23.0, 13.0, 14.0, 14.0, 7.0, 11.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.625, -17.06689453125, -16.5087890625, -15.95068359375, -15.392578125, -14.83447265625, -14.2763671875, -13.71826171875, -13.16015625, -12.60205078125, -12.0439453125, -11.48583984375, -10.927734375, -10.36962890625, -9.8115234375, -9.25341796875, -8.6953125, -8.13720703125, -7.5791015625, -7.02099609375, -6.462890625, -5.90478515625, -5.3466796875, -4.78857421875, -4.23046875, -3.67236328125, -3.1142578125, -2.55615234375, -1.998046875, -1.43994140625, -0.8818359375, -0.32373046875, 0.234375, 0.79248046875, 1.3505859375, 1.90869140625, 2.466796875, 3.02490234375, 3.5830078125, 4.14111328125, 4.69921875, 5.25732421875, 5.8154296875, 6.37353515625, 6.931640625, 7.48974609375, 8.0478515625, 8.60595703125, 9.1640625, 9.72216796875, 10.2802734375, 10.83837890625, 11.396484375, 11.95458984375, 12.5126953125, 13.07080078125, 13.62890625, 14.18701171875, 14.7451171875, 15.30322265625, 15.861328125, 16.41943359375, 16.9775390625, 17.53564453125, 18.09375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 4.0, 2.0, 3.0, 5.0, 10.0, 9.0, 19.0, 28.0, 28.0, 46.0, 61.0, 74.0, 124.0, 155.0, 217.0, 327.0, 457.0, 710.0, 1044.0, 1753.0, 2711.0, 4366.0, 7682.0, 14728.0, 31291.0, 72272.0, 168199.0, 293914.0, 239643.0, 113444.0, 47621.0, 21769.0, 10540.0, 5733.0, 3410.0, 2010.0, 1287.0, 855.0, 565.0, 425.0, 268.0, 205.0, 151.0, 94.0, 79.0, 66.0, 37.0, 34.0, 26.0, 20.0, 15.0, 10.0, 5.0, 10.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1123046875, -1.076141357421875, -1.03997802734375, -1.003814697265625, -0.9676513671875, -0.931488037109375, -0.89532470703125, -0.859161376953125, -0.822998046875, -0.786834716796875, -0.75067138671875, -0.714508056640625, -0.6783447265625, -0.642181396484375, -0.60601806640625, -0.569854736328125, -0.53369140625, -0.497528076171875, -0.46136474609375, -0.425201416015625, -0.3890380859375, -0.352874755859375, -0.31671142578125, -0.280548095703125, -0.244384765625, -0.208221435546875, -0.17205810546875, -0.135894775390625, -0.0997314453125, -0.063568115234375, -0.02740478515625, 0.008758544921875, 0.044921875, 0.081085205078125, 0.11724853515625, 0.153411865234375, 0.1895751953125, 0.225738525390625, 0.26190185546875, 0.298065185546875, 0.334228515625, 0.370391845703125, 0.40655517578125, 0.442718505859375, 0.4788818359375, 0.515045166015625, 0.55120849609375, 0.587371826171875, 0.62353515625, 0.659698486328125, 0.69586181640625, 0.732025146484375, 0.7681884765625, 0.804351806640625, 0.84051513671875, 0.876678466796875, 0.912841796875, 0.949005126953125, 0.98516845703125, 1.021331787109375, 1.0574951171875, 1.093658447265625, 1.12982177734375, 1.165985107421875, 1.2021484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 8.0, 10.0, 10.0, 13.0, 27.0, 29.0, 38.0, 61.0, 84.0, 84.0, 108.0, 101.0, 85.0, 88.0, 71.0, 44.0, 36.0, 24.0, 20.0, 9.0, 8.0, 7.0, 11.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014495849609375, -0.00013921968638896942, -0.00013348087668418884, -0.00012774206697940826, -0.00012200325727462769, -0.00011626444756984711, -0.00011052563786506653, -0.00010478682816028595, -9.904801845550537e-05, -9.330920875072479e-05, -8.757039904594421e-05, -8.183158934116364e-05, -7.609277963638306e-05, -7.035396993160248e-05, -6.46151602268219e-05, -5.887635052204132e-05, -5.313754081726074e-05, -4.7398731112480164e-05, -4.1659921407699585e-05, -3.5921111702919006e-05, -3.0182301998138428e-05, -2.444349229335785e-05, -1.870468258857727e-05, -1.2965872883796692e-05, -7.227063179016113e-06, -1.4882534742355347e-06, 4.250556230545044e-06, 9.989365935325623e-06, 1.57281756401062e-05, 2.146698534488678e-05, 2.720579504966736e-05, 3.294460475444794e-05, 3.8683414459228516e-05, 4.4422224164009094e-05, 5.016103386878967e-05, 5.589984357357025e-05, 6.163865327835083e-05, 6.737746298313141e-05, 7.311627268791199e-05, 7.885508239269257e-05, 8.459389209747314e-05, 9.033270180225372e-05, 9.60715115070343e-05, 0.00010181032121181488, 0.00010754913091659546, 0.00011328794062137604, 0.00011902675032615662, 0.0001247655600309372, 0.00013050436973571777, 0.00013624317944049835, 0.00014198198914527893, 0.0001477207988500595, 0.0001534596085548401, 0.00015919841825962067, 0.00016493722796440125, 0.00017067603766918182, 0.0001764148473739624, 0.00018215365707874298, 0.00018789246678352356, 0.00019363127648830414, 0.00019937008619308472, 0.0002051088958978653, 0.00021084770560264587, 0.00021658651530742645, 0.00022232532501220703]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 5.0, 7.0, 9.0, 14.0, 18.0, 24.0, 40.0, 69.0, 92.0, 114.0, 152.0, 268.0, 300.0, 466.0, 668.0, 935.0, 1332.0, 1894.0, 2697.0, 4001.0, 5947.0, 8994.0, 14110.0, 22573.0, 37153.0, 62455.0, 105099.0, 163640.0, 198819.0, 159017.0, 100306.0, 59610.0, 35368.0, 21630.0, 13429.0, 8692.0, 5712.0, 3955.0, 2602.0, 1878.0, 1291.0, 934.0, 654.0, 463.0, 321.0, 234.0, 180.0, 116.0, 95.0, 51.0, 43.0, 34.0, 18.0, 16.0, 8.0, 3.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-1.271484375, -1.229736328125, -1.18798828125, -1.146240234375, -1.1044921875, -1.062744140625, -1.02099609375, -0.979248046875, -0.9375, -0.895751953125, -0.85400390625, -0.812255859375, -0.7705078125, -0.728759765625, -0.68701171875, -0.645263671875, -0.603515625, -0.561767578125, -0.52001953125, -0.478271484375, -0.4365234375, -0.394775390625, -0.35302734375, -0.311279296875, -0.26953125, -0.227783203125, -0.18603515625, -0.144287109375, -0.1025390625, -0.060791015625, -0.01904296875, 0.022705078125, 0.064453125, 0.106201171875, 0.14794921875, 0.189697265625, 0.2314453125, 0.273193359375, 0.31494140625, 0.356689453125, 0.3984375, 0.440185546875, 0.48193359375, 0.523681640625, 0.5654296875, 0.607177734375, 0.64892578125, 0.690673828125, 0.732421875, 0.774169921875, 0.81591796875, 0.857666015625, 0.8994140625, 0.941162109375, 0.98291015625, 1.024658203125, 1.06640625, 1.108154296875, 1.14990234375, 1.191650390625, 1.2333984375, 1.275146484375, 1.31689453125, 1.358642578125, 1.400390625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 3.0, 1.0, 6.0, 9.0, 10.0, 8.0, 12.0, 14.0, 19.0, 27.0, 27.0, 38.0, 52.0, 56.0, 60.0, 60.0, 71.0, 68.0, 67.0, 70.0, 39.0, 44.0, 38.0, 25.0, 28.0, 29.0, 18.0, 16.0, 14.0, 14.0, 13.0, 8.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-0.59130859375, -0.5753898620605469, -0.5594711303710938, -0.5435523986816406, -0.5276336669921875, -0.5117149353027344, -0.49579620361328125, -0.4798774719238281, -0.463958740234375, -0.4480400085449219, -0.43212127685546875, -0.4162025451660156, -0.4002838134765625, -0.3843650817871094, -0.36844635009765625, -0.3525276184082031, -0.33660888671875, -0.3206901550292969, -0.30477142333984375, -0.2888526916503906, -0.2729339599609375, -0.2570152282714844, -0.24109649658203125, -0.22517776489257812, -0.209259033203125, -0.19334030151367188, -0.17742156982421875, -0.16150283813476562, -0.1455841064453125, -0.12966537475585938, -0.11374664306640625, -0.09782791137695312, -0.0819091796875, -0.06599044799804688, -0.05007171630859375, -0.034152984619140625, -0.0182342529296875, -0.002315521240234375, 0.01360321044921875, 0.029521942138671875, 0.045440673828125, 0.061359405517578125, 0.07727813720703125, 0.09319686889648438, 0.1091156005859375, 0.12503433227539062, 0.14095306396484375, 0.15687179565429688, 0.17279052734375, 0.18870925903320312, 0.20462799072265625, 0.22054672241210938, 0.2364654541015625, 0.2523841857910156, 0.26830291748046875, 0.2842216491699219, 0.300140380859375, 0.3160591125488281, 0.33197784423828125, 0.3478965759277344, 0.3638153076171875, 0.3797340393066406, 0.39565277099609375, 0.4115715026855469, 0.427490234375]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 11.0, 4.0, 14.0, 13.0, 10.0, 13.0, 13.0, 23.0, 21.0, 26.0, 21.0, 24.0, 34.0, 23.0, 45.0, 33.0, 35.0, 40.0, 45.0, 34.0, 40.0, 33.0, 39.0, 41.0, 35.0, 43.0, 36.0, 25.0, 32.0, 27.0, 21.0, 29.0, 21.0, 17.0, 16.0, 10.0, 11.0, 8.0, 7.0, 6.0, 2.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.540283203125, -22.78327751159668, -22.02627182006836, -21.26926612854004, -20.51226043701172, -19.7552547454834, -18.998249053955078, -18.24124526977539, -17.484237670898438, -16.727231979370117, -15.970226287841797, -15.213220596313477, -14.456214904785156, -13.699209213256836, -12.942204475402832, -12.185198783874512, -11.428194046020508, -10.671188354492188, -9.914182662963867, -9.157176971435547, -8.400171279907227, -7.6431660652160645, -6.886160850524902, -6.129155158996582, -5.372149467468262, -4.615143775939941, -3.8581383228302, -3.101132869720459, -2.3441271781921387, -1.5871214866638184, -0.8301162719726562, -0.07311058044433594, 0.6838970184326172, 1.440902590751648, 2.1979081630706787, 2.95491361618042, 3.7119193077087402, 4.4689249992370605, 5.225930213928223, 5.982935905456543, 6.739941596984863, 7.496947288513184, 8.253952980041504, 9.010957717895508, 9.767963409423828, 10.524969100952148, 11.281974792480469, 12.038980484008789, 12.79598617553711, 13.55299186706543, 14.30999755859375, 15.06700325012207, 15.82400894165039, 16.58101463317871, 17.33802032470703, 18.09502410888672, 18.852031707763672, 19.609037399291992, 20.366043090820312, 21.123048782348633, 21.880054473876953, 22.637060165405273, 23.394065856933594, 24.15106964111328, 24.9080753326416]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 8.0, 4.0, 6.0, 9.0, 13.0, 14.0, 17.0, 17.0, 13.0, 21.0, 23.0, 24.0, 22.0, 28.0, 29.0, 31.0, 28.0, 32.0, 35.0, 33.0, 19.0, 41.0, 43.0, 39.0, 34.0, 39.0, 32.0, 41.0, 29.0, 24.0, 37.0, 26.0, 21.0, 23.0, 25.0, 19.0, 18.0, 15.0, 14.0, 9.0, 8.0, 6.0, 5.0, 7.0, 6.0, 7.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.398534774780273, -19.63751983642578, -18.87650489807129, -18.115488052368164, -17.354473114013672, -16.59345817565918, -15.832443237304688, -15.071427345275879, -14.31041145324707, -13.549396514892578, -12.78838062286377, -12.027365684509277, -11.266349792480469, -10.505334854125977, -9.744319915771484, -8.983304023742676, -8.222289085388184, -7.461273670196533, -6.700258255004883, -5.939243316650391, -5.178227424621582, -4.41721248626709, -3.6561970710754395, -2.895181655883789, -2.1341662406921387, -1.3731508255004883, -0.6121355295181274, 0.1488797664642334, 0.9098951816558838, 1.6709105968475342, 2.4319257736206055, 3.192941188812256, 3.9539566040039062, 4.714972019195557, 5.475987434387207, 6.237002372741699, 6.998018264770508, 7.759033203125, 8.520048141479492, 9.2810640335083, 10.04207992553711, 10.803094863891602, 11.56411075592041, 12.325125694274902, 13.086141586303711, 13.847156524658203, 14.608171463012695, 15.369187355041504, 16.130203247070312, 16.891218185424805, 17.652233123779297, 18.413249969482422, 19.174264907836914, 19.935279846191406, 20.6962947845459, 21.45730972290039, 22.218324661254883, 22.979339599609375, 23.740354537963867, 24.501371383666992, 25.262386322021484, 26.023401260375977, 26.78441619873047, 27.545433044433594, 28.306447982788086]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 14.0, 21.0, 20.0, 49.0, 56.0, 80.0, 134.0, 223.0, 378.0, 583.0, 925.0, 1540.0, 2305.0, 3523.0, 5462.0, 7999.0, 11623.0, 16566.0, 23408.0, 31575.0, 42069.0, 53219.0, 64699.0, 76336.0, 84886.0, 90499.0, 90121.0, 85599.0, 77742.0, 66809.0, 55118.0, 43482.0, 32971.0, 24297.0, 17583.0, 12210.0, 8459.0, 5471.0, 3813.0, 2433.0, 1586.0, 959.0, 669.0, 434.0, 235.0, 147.0, 116.0, 53.0, 24.0, 19.0, 15.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.765625, -14.30517578125, -13.8447265625, -13.38427734375, -12.923828125, -12.46337890625, -12.0029296875, -11.54248046875, -11.08203125, -10.62158203125, -10.1611328125, -9.70068359375, -9.240234375, -8.77978515625, -8.3193359375, -7.85888671875, -7.3984375, -6.93798828125, -6.4775390625, -6.01708984375, -5.556640625, -5.09619140625, -4.6357421875, -4.17529296875, -3.71484375, -3.25439453125, -2.7939453125, -2.33349609375, -1.873046875, -1.41259765625, -0.9521484375, -0.49169921875, -0.03125, 0.42919921875, 0.8896484375, 1.35009765625, 1.810546875, 2.27099609375, 2.7314453125, 3.19189453125, 3.65234375, 4.11279296875, 4.5732421875, 5.03369140625, 5.494140625, 5.95458984375, 6.4150390625, 6.87548828125, 7.3359375, 7.79638671875, 8.2568359375, 8.71728515625, 9.177734375, 9.63818359375, 10.0986328125, 10.55908203125, 11.01953125, 11.47998046875, 11.9404296875, 12.40087890625, 12.861328125, 13.32177734375, 13.7822265625, 14.24267578125, 14.703125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 9.0, 10.0, 11.0, 24.0, 14.0, 14.0, 12.0, 20.0, 18.0, 26.0, 28.0, 39.0, 35.0, 33.0, 28.0, 41.0, 42.0, 28.0, 35.0, 37.0, 51.0, 43.0, 33.0, 44.0, 29.0, 28.0, 36.0, 29.0, 20.0, 22.0, 17.0, 22.0, 17.0, 17.0, 15.0, 15.0, 9.0, 9.0, 12.0, 7.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.71875, -21.89013671875, -21.0615234375, -20.23291015625, -19.404296875, -18.57568359375, -17.7470703125, -16.91845703125, -16.08984375, -15.26123046875, -14.4326171875, -13.60400390625, -12.775390625, -11.94677734375, -11.1181640625, -10.28955078125, -9.4609375, -8.63232421875, -7.8037109375, -6.97509765625, -6.146484375, -5.31787109375, -4.4892578125, -3.66064453125, -2.83203125, -2.00341796875, -1.1748046875, -0.34619140625, 0.482421875, 1.31103515625, 2.1396484375, 2.96826171875, 3.796875, 4.62548828125, 5.4541015625, 6.28271484375, 7.111328125, 7.93994140625, 8.7685546875, 9.59716796875, 10.42578125, 11.25439453125, 12.0830078125, 12.91162109375, 13.740234375, 14.56884765625, 15.3974609375, 16.22607421875, 17.0546875, 17.88330078125, 18.7119140625, 19.54052734375, 20.369140625, 21.19775390625, 22.0263671875, 22.85498046875, 23.68359375, 24.51220703125, 25.3408203125, 26.16943359375, 26.998046875, 27.82666015625, 28.6552734375, 29.48388671875, 30.3125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 4.0, 7.0, 13.0, 20.0, 33.0, 38.0, 73.0, 107.0, 170.0, 276.0, 439.0, 619.0, 958.0, 1448.0, 2133.0, 3207.0, 4905.0, 6997.0, 10108.0, 14641.0, 20434.0, 28172.0, 37624.0, 48007.0, 59840.0, 72054.0, 81922.0, 88381.0, 90722.0, 87582.0, 80494.0, 70802.0, 59543.0, 47751.0, 36513.0, 27297.0, 20255.0, 14175.0, 9863.0, 6889.0, 4656.0, 3226.0, 2112.0, 1360.0, 899.0, 612.0, 424.0, 269.0, 161.0, 106.0, 83.0, 51.0, 42.0, 15.0, 13.0, 13.0, 4.0, 4.0, 2.0, 1.0], "bins": [-15.0078125, -14.5455322265625, -14.083251953125, -13.6209716796875, -13.15869140625, -12.6964111328125, -12.234130859375, -11.7718505859375, -11.3095703125, -10.8472900390625, -10.385009765625, -9.9227294921875, -9.46044921875, -8.9981689453125, -8.535888671875, -8.0736083984375, -7.611328125, -7.1490478515625, -6.686767578125, -6.2244873046875, -5.76220703125, -5.2999267578125, -4.837646484375, -4.3753662109375, -3.9130859375, -3.4508056640625, -2.988525390625, -2.5262451171875, -2.06396484375, -1.6016845703125, -1.139404296875, -0.6771240234375, -0.21484375, 0.2474365234375, 0.709716796875, 1.1719970703125, 1.63427734375, 2.0965576171875, 2.558837890625, 3.0211181640625, 3.4833984375, 3.9456787109375, 4.407958984375, 4.8702392578125, 5.33251953125, 5.7947998046875, 6.257080078125, 6.7193603515625, 7.181640625, 7.6439208984375, 8.106201171875, 8.5684814453125, 9.03076171875, 9.4930419921875, 9.955322265625, 10.4176025390625, 10.8798828125, 11.3421630859375, 11.804443359375, 12.2667236328125, 12.72900390625, 13.1912841796875, 13.653564453125, 14.1158447265625, 14.578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 1.0, 8.0, 9.0, 9.0, 13.0, 14.0, 10.0, 11.0, 14.0, 23.0, 18.0, 25.0, 24.0, 21.0, 29.0, 38.0, 36.0, 24.0, 32.0, 40.0, 28.0, 35.0, 37.0, 40.0, 27.0, 31.0, 35.0, 36.0, 31.0, 29.0, 37.0, 25.0, 29.0, 24.0, 23.0, 24.0, 11.0, 15.0, 11.0, 16.0, 6.0, 13.0, 10.0, 4.0, 6.0, 3.0, 9.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-16.515625, -16.0172119140625, -15.518798828125, -15.0203857421875, -14.52197265625, -14.0235595703125, -13.525146484375, -13.0267333984375, -12.5283203125, -12.0299072265625, -11.531494140625, -11.0330810546875, -10.53466796875, -10.0362548828125, -9.537841796875, -9.0394287109375, -8.541015625, -8.0426025390625, -7.544189453125, -7.0457763671875, -6.54736328125, -6.0489501953125, -5.550537109375, -5.0521240234375, -4.5537109375, -4.0552978515625, -3.556884765625, -3.0584716796875, -2.56005859375, -2.0616455078125, -1.563232421875, -1.0648193359375, -0.56640625, -0.0679931640625, 0.430419921875, 0.9288330078125, 1.42724609375, 1.9256591796875, 2.424072265625, 2.9224853515625, 3.4208984375, 3.9193115234375, 4.417724609375, 4.9161376953125, 5.41455078125, 5.9129638671875, 6.411376953125, 6.9097900390625, 7.408203125, 7.9066162109375, 8.405029296875, 8.9034423828125, 9.40185546875, 9.9002685546875, 10.398681640625, 10.8970947265625, 11.3955078125, 11.8939208984375, 12.392333984375, 12.8907470703125, 13.38916015625, 13.8875732421875, 14.385986328125, 14.8843994140625, 15.3828125]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 6.0, 3.0, 14.0, 21.0, 33.0, 49.0, 71.0, 92.0, 137.0, 226.0, 319.0, 493.0, 854.0, 1181.0, 1868.0, 2826.0, 4347.0, 6344.0, 9771.0, 14107.0, 20584.0, 29003.0, 39876.0, 52445.0, 66200.0, 79296.0, 90381.0, 96900.0, 96999.0, 91734.0, 81617.0, 68056.0, 54374.0, 41532.0, 30106.0, 21317.0, 15210.0, 10179.0, 6829.0, 4557.0, 2930.0, 1967.0, 1271.0, 814.0, 524.0, 395.0, 219.0, 148.0, 95.0, 79.0, 41.0, 42.0, 20.0, 26.0, 10.0, 9.0, 9.0, 3.0, 4.0, 5.0], "bins": [-5.53515625, -5.362548828125, -5.18994140625, -5.017333984375, -4.8447265625, -4.672119140625, -4.49951171875, -4.326904296875, -4.154296875, -3.981689453125, -3.80908203125, -3.636474609375, -3.4638671875, -3.291259765625, -3.11865234375, -2.946044921875, -2.7734375, -2.600830078125, -2.42822265625, -2.255615234375, -2.0830078125, -1.910400390625, -1.73779296875, -1.565185546875, -1.392578125, -1.219970703125, -1.04736328125, -0.874755859375, -0.7021484375, -0.529541015625, -0.35693359375, -0.184326171875, -0.01171875, 0.160888671875, 0.33349609375, 0.506103515625, 0.6787109375, 0.851318359375, 1.02392578125, 1.196533203125, 1.369140625, 1.541748046875, 1.71435546875, 1.886962890625, 2.0595703125, 2.232177734375, 2.40478515625, 2.577392578125, 2.75, 2.922607421875, 3.09521484375, 3.267822265625, 3.4404296875, 3.613037109375, 3.78564453125, 3.958251953125, 4.130859375, 4.303466796875, 4.47607421875, 4.648681640625, 4.8212890625, 4.993896484375, 5.16650390625, 5.339111328125, 5.51171875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 1.0, 3.0, 14.0, 9.0, 14.0, 21.0, 25.0, 30.0, 21.0, 33.0, 25.0, 46.0, 37.0, 39.0, 46.0, 48.0, 49.0, 46.0, 60.0, 40.0, 47.0, 44.0, 44.0, 36.0, 36.0, 20.0, 31.0, 23.0, 19.0, 17.0, 16.0, 21.0, 7.0, 11.0, 7.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007042884826660156, -0.0006781965494155884, -0.0006521046161651611, -0.0006260126829147339, -0.0005999207496643066, -0.0005738288164138794, -0.0005477368831634521, -0.0005216449499130249, -0.0004955530166625977, -0.0004694610834121704, -0.00044336915016174316, -0.0004172772169113159, -0.00039118528366088867, -0.0003650933504104614, -0.0003390014171600342, -0.00031290948390960693, -0.0002868175506591797, -0.00026072561740875244, -0.0002346336841583252, -0.00020854175090789795, -0.0001824498176574707, -0.00015635788440704346, -0.0001302659511566162, -0.00010417401790618896, -7.808208465576172e-05, -5.199015140533447e-05, -2.5898218154907227e-05, 1.9371509552001953e-07, 2.6285648345947266e-05, 5.237758159637451e-05, 7.846951484680176e-05, 0.000104561448097229, 0.00013065338134765625, 0.0001567453145980835, 0.00018283724784851074, 0.000208929181098938, 0.00023502111434936523, 0.0002611130475997925, 0.0002872049808502197, 0.00031329691410064697, 0.0003393888473510742, 0.00036548078060150146, 0.0003915727138519287, 0.00041766464710235596, 0.0004437565803527832, 0.00046984851360321045, 0.0004959404468536377, 0.0005220323801040649, 0.0005481243133544922, 0.0005742162466049194, 0.0006003081798553467, 0.0006264001131057739, 0.0006524920463562012, 0.0006785839796066284, 0.0007046759128570557, 0.0007307678461074829, 0.0007568597793579102, 0.0007829517126083374, 0.0008090436458587646, 0.0008351355791091919, 0.0008612275123596191, 0.0008873194456100464, 0.0009134113788604736, 0.0009395033121109009, 0.0009655952453613281]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 16.0, 32.0, 36.0, 47.0, 73.0, 143.0, 186.0, 304.0, 451.0, 687.0, 1108.0, 1627.0, 2585.0, 3990.0, 6101.0, 9616.0, 14365.0, 21375.0, 30958.0, 43028.0, 58411.0, 74361.0, 89505.0, 100723.0, 105712.0, 102670.0, 92494.0, 77680.0, 61838.0, 46505.0, 33456.0, 23200.0, 15622.0, 10432.0, 6703.0, 4429.0, 2872.0, 1877.0, 1183.0, 784.0, 461.0, 307.0, 218.0, 123.0, 88.0, 69.0, 39.0, 20.0, 22.0, 8.0, 6.0, 4.0, 4.0], "bins": [-7.16796875, -6.9666748046875, -6.765380859375, -6.5640869140625, -6.36279296875, -6.1614990234375, -5.960205078125, -5.7589111328125, -5.5576171875, -5.3563232421875, -5.155029296875, -4.9537353515625, -4.75244140625, -4.5511474609375, -4.349853515625, -4.1485595703125, -3.947265625, -3.7459716796875, -3.544677734375, -3.3433837890625, -3.14208984375, -2.9407958984375, -2.739501953125, -2.5382080078125, -2.3369140625, -2.1356201171875, -1.934326171875, -1.7330322265625, -1.53173828125, -1.3304443359375, -1.129150390625, -0.9278564453125, -0.7265625, -0.5252685546875, -0.323974609375, -0.1226806640625, 0.07861328125, 0.2799072265625, 0.481201171875, 0.6824951171875, 0.8837890625, 1.0850830078125, 1.286376953125, 1.4876708984375, 1.68896484375, 1.8902587890625, 2.091552734375, 2.2928466796875, 2.494140625, 2.6954345703125, 2.896728515625, 3.0980224609375, 3.29931640625, 3.5006103515625, 3.701904296875, 3.9031982421875, 4.1044921875, 4.3057861328125, 4.507080078125, 4.7083740234375, 4.90966796875, 5.1109619140625, 5.312255859375, 5.5135498046875, 5.71484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 8.0, 11.0, 14.0, 12.0, 17.0, 13.0, 19.0, 33.0, 22.0, 30.0, 43.0, 37.0, 39.0, 41.0, 49.0, 48.0, 59.0, 55.0, 42.0, 50.0, 43.0, 40.0, 39.0, 34.0, 33.0, 25.0, 18.0, 16.0, 18.0, 9.0, 12.0, 16.0, 10.0, 11.0, 6.0, 6.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.134307861328125, -3.03619384765625, -2.938079833984375, -2.8399658203125, -2.741851806640625, -2.64373779296875, -2.545623779296875, -2.447509765625, -2.349395751953125, -2.25128173828125, -2.153167724609375, -2.0550537109375, -1.956939697265625, -1.85882568359375, -1.760711669921875, -1.66259765625, -1.564483642578125, -1.46636962890625, -1.368255615234375, -1.2701416015625, -1.172027587890625, -1.07391357421875, -0.975799560546875, -0.877685546875, -0.779571533203125, -0.68145751953125, -0.583343505859375, -0.4852294921875, -0.387115478515625, -0.28900146484375, -0.190887451171875, -0.0927734375, 0.005340576171875, 0.10345458984375, 0.201568603515625, 0.2996826171875, 0.397796630859375, 0.49591064453125, 0.594024658203125, 0.692138671875, 0.790252685546875, 0.88836669921875, 0.986480712890625, 1.0845947265625, 1.182708740234375, 1.28082275390625, 1.378936767578125, 1.47705078125, 1.575164794921875, 1.67327880859375, 1.771392822265625, 1.8695068359375, 1.967620849609375, 2.06573486328125, 2.163848876953125, 2.261962890625, 2.360076904296875, 2.45819091796875, 2.556304931640625, 2.6544189453125, 2.752532958984375, 2.85064697265625, 2.948760986328125, 3.046875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 8.0, 6.0, 6.0, 8.0, 13.0, 12.0, 12.0, 12.0, 19.0, 25.0, 19.0, 26.0, 20.0, 22.0, 22.0, 37.0, 27.0, 45.0, 40.0, 36.0, 37.0, 41.0, 38.0, 39.0, 23.0, 31.0, 46.0, 41.0, 33.0, 24.0, 32.0, 29.0, 32.0, 17.0, 19.0, 20.0, 13.0, 16.0, 6.0, 9.0, 8.0, 6.0, 5.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.452224731445312, -20.738773345947266, -20.02532196044922, -19.31186866760254, -18.598417282104492, -17.884965896606445, -17.1715145111084, -16.45806121826172, -15.744609832763672, -15.031158447265625, -14.317706108093262, -13.604254722595215, -12.890802383422852, -12.177350997924805, -11.463899612426758, -10.750447273254395, -10.036995887756348, -9.3235445022583, -8.610092163085938, -7.896640777587891, -7.183188438415527, -6.4697370529174805, -5.756285190582275, -5.04283332824707, -4.329381465911865, -3.61592960357666, -2.902477741241455, -2.189026117324829, -1.475574254989624, -0.762122392654419, -0.04867076873779297, 0.6647810935974121, 1.3782329559326172, 2.0916848182678223, 2.8051366806030273, 3.5185883045196533, 4.2320404052734375, 4.945491790771484, 5.6589436531066895, 6.3723955154418945, 7.0858473777771, 7.799299240112305, 8.512750625610352, 9.226202964782715, 9.939654350280762, 10.653106689453125, 11.366558074951172, 12.080009460449219, 12.793461799621582, 13.506913185119629, 14.220365524291992, 14.933816909790039, 15.647269248962402, 16.360721588134766, 17.074172973632812, 17.78762435913086, 18.501075744628906, 19.214527130126953, 19.927978515625, 20.64143180847168, 21.354883193969727, 22.068334579467773, 22.78178596496582, 23.4952392578125, 24.208690643310547]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 1.0, 11.0, 12.0, 16.0, 19.0, 13.0, 17.0, 31.0, 24.0, 39.0, 24.0, 39.0, 30.0, 34.0, 44.0, 44.0, 48.0, 50.0, 43.0, 40.0, 42.0, 39.0, 38.0, 34.0, 32.0, 29.0, 23.0, 24.0, 23.0, 22.0, 18.0, 12.0, 11.0, 11.0, 13.0, 9.0, 10.0, 9.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.564584732055664, -25.62040138244629, -24.67621612548828, -23.732032775878906, -22.78784942626953, -21.843666076660156, -20.89948272705078, -19.955297470092773, -19.0111141204834, -18.066930770874023, -17.122745513916016, -16.17856216430664, -15.234378814697266, -14.29019546508789, -13.3460111618042, -12.401826858520508, -11.457643508911133, -10.513460159301758, -9.569275856018066, -8.625091552734375, -7.680908203125, -6.736724376678467, -5.792540550231934, -4.8483567237854, -3.904172897338867, -2.959989070892334, -2.015805244445801, -1.0716214179992676, -0.12743759155273438, 0.8167462348937988, 1.760930061340332, 2.7051138877868652, 3.6492996215820312, 4.5934834480285645, 5.537667274475098, 6.481851100921631, 7.426034927368164, 8.370218276977539, 9.31440258026123, 10.258586883544922, 11.202770233154297, 12.146953582763672, 13.091137886047363, 14.035322189331055, 14.97950553894043, 15.923688888549805, 16.867874145507812, 17.812057495117188, 18.756240844726562, 19.700424194335938, 20.644607543945312, 21.58879280090332, 22.532976150512695, 23.47715950012207, 24.421344757080078, 25.365528106689453, 26.309711456298828, 27.253894805908203, 28.198078155517578, 29.142263412475586, 30.08644676208496, 31.030630111694336, 31.974815368652344, 32.91899871826172, 33.863182067871094]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 24.0, 30.0, 45.0, 82.0, 159.0, 223.0, 437.0, 754.0, 1318.0, 2176.0, 3609.0, 6120.0, 9931.0, 15790.0, 25085.0, 38924.0, 58334.0, 86149.0, 122424.0, 168737.0, 221295.0, 279251.0, 333199.0, 376400.0, 396491.0, 392899.0, 364900.0, 320936.0, 265793.0, 208349.0, 156054.0, 112846.0, 78364.0, 52611.0, 34841.0, 22309.0, 14445.0, 8866.0, 5609.0, 3418.0, 2016.0, 1200.0, 695.0, 455.0, 264.0, 170.0, 110.0, 55.0, 44.0, 16.0, 19.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0], "bins": [-18.359375, -17.783447265625, -17.20751953125, -16.631591796875, -16.0556640625, -15.479736328125, -14.90380859375, -14.327880859375, -13.751953125, -13.176025390625, -12.60009765625, -12.024169921875, -11.4482421875, -10.872314453125, -10.29638671875, -9.720458984375, -9.14453125, -8.568603515625, -7.99267578125, -7.416748046875, -6.8408203125, -6.264892578125, -5.68896484375, -5.113037109375, -4.537109375, -3.961181640625, -3.38525390625, -2.809326171875, -2.2333984375, -1.657470703125, -1.08154296875, -0.505615234375, 0.0703125, 0.646240234375, 1.22216796875, 1.798095703125, 2.3740234375, 2.949951171875, 3.52587890625, 4.101806640625, 4.677734375, 5.253662109375, 5.82958984375, 6.405517578125, 6.9814453125, 7.557373046875, 8.13330078125, 8.709228515625, 9.28515625, 9.861083984375, 10.43701171875, 11.012939453125, 11.5888671875, 12.164794921875, 12.74072265625, 13.316650390625, 13.892578125, 14.468505859375, 15.04443359375, 15.620361328125, 16.1962890625, 16.772216796875, 17.34814453125, 17.924072265625, 18.5]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 8.0, 5.0, 7.0, 10.0, 8.0, 15.0, 14.0, 14.0, 14.0, 15.0, 24.0, 14.0, 35.0, 31.0, 37.0, 36.0, 46.0, 42.0, 49.0, 41.0, 33.0, 33.0, 49.0, 37.0, 39.0, 42.0, 28.0, 32.0, 30.0, 28.0, 25.0, 29.0, 23.0, 19.0, 17.0, 13.0, 12.0, 9.0, 12.0, 7.0, 10.0, 5.0, 7.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.921875, -19.17138671875, -18.4208984375, -17.67041015625, -16.919921875, -16.16943359375, -15.4189453125, -14.66845703125, -13.91796875, -13.16748046875, -12.4169921875, -11.66650390625, -10.916015625, -10.16552734375, -9.4150390625, -8.66455078125, -7.9140625, -7.16357421875, -6.4130859375, -5.66259765625, -4.912109375, -4.16162109375, -3.4111328125, -2.66064453125, -1.91015625, -1.15966796875, -0.4091796875, 0.34130859375, 1.091796875, 1.84228515625, 2.5927734375, 3.34326171875, 4.09375, 4.84423828125, 5.5947265625, 6.34521484375, 7.095703125, 7.84619140625, 8.5966796875, 9.34716796875, 10.09765625, 10.84814453125, 11.5986328125, 12.34912109375, 13.099609375, 13.85009765625, 14.6005859375, 15.35107421875, 16.1015625, 16.85205078125, 17.6025390625, 18.35302734375, 19.103515625, 19.85400390625, 20.6044921875, 21.35498046875, 22.10546875, 22.85595703125, 23.6064453125, 24.35693359375, 25.107421875, 25.85791015625, 26.6083984375, 27.35888671875, 28.109375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 11.0, 12.0, 46.0, 53.0, 115.0, 198.0, 416.0, 681.0, 1209.0, 2261.0, 3657.0, 6290.0, 10435.0, 17270.0, 27662.0, 42852.0, 65283.0, 95128.0, 134154.0, 180834.0, 234065.0, 286730.0, 335238.0, 369249.0, 385563.0, 380392.0, 354573.0, 310661.0, 259022.0, 204484.0, 155555.0, 112600.0, 77634.0, 51812.0, 34085.0, 21785.0, 13326.0, 7995.0, 4669.0, 2722.0, 1612.0, 910.0, 438.0, 275.0, 145.0, 86.0, 51.0, 23.0, 13.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.46875, -18.855224609375, -18.24169921875, -17.628173828125, -17.0146484375, -16.401123046875, -15.78759765625, -15.174072265625, -14.560546875, -13.947021484375, -13.33349609375, -12.719970703125, -12.1064453125, -11.492919921875, -10.87939453125, -10.265869140625, -9.65234375, -9.038818359375, -8.42529296875, -7.811767578125, -7.1982421875, -6.584716796875, -5.97119140625, -5.357666015625, -4.744140625, -4.130615234375, -3.51708984375, -2.903564453125, -2.2900390625, -1.676513671875, -1.06298828125, -0.449462890625, 0.1640625, 0.777587890625, 1.39111328125, 2.004638671875, 2.6181640625, 3.231689453125, 3.84521484375, 4.458740234375, 5.072265625, 5.685791015625, 6.29931640625, 6.912841796875, 7.5263671875, 8.139892578125, 8.75341796875, 9.366943359375, 9.98046875, 10.593994140625, 11.20751953125, 11.821044921875, 12.4345703125, 13.048095703125, 13.66162109375, 14.275146484375, 14.888671875, 15.502197265625, 16.11572265625, 16.729248046875, 17.3427734375, 17.956298828125, 18.56982421875, 19.183349609375, 19.796875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 5.0, 10.0, 19.0, 16.0, 19.0, 19.0, 23.0, 26.0, 42.0, 41.0, 40.0, 54.0, 79.0, 83.0, 79.0, 95.0, 151.0, 136.0, 162.0, 156.0, 169.0, 170.0, 182.0, 216.0, 177.0, 189.0, 175.0, 175.0, 151.0, 160.0, 142.0, 118.0, 116.0, 109.0, 84.0, 86.0, 59.0, 77.0, 52.0, 38.0, 38.0, 38.0, 22.0, 16.0, 17.0, 12.0, 10.0, 9.0, 1.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-10.390625, -10.0684814453125, -9.746337890625, -9.4241943359375, -9.10205078125, -8.7799072265625, -8.457763671875, -8.1356201171875, -7.8134765625, -7.4913330078125, -7.169189453125, -6.8470458984375, -6.52490234375, -6.2027587890625, -5.880615234375, -5.5584716796875, -5.236328125, -4.9141845703125, -4.592041015625, -4.2698974609375, -3.94775390625, -3.6256103515625, -3.303466796875, -2.9813232421875, -2.6591796875, -2.3370361328125, -2.014892578125, -1.6927490234375, -1.37060546875, -1.0484619140625, -0.726318359375, -0.4041748046875, -0.08203125, 0.2401123046875, 0.562255859375, 0.8843994140625, 1.20654296875, 1.5286865234375, 1.850830078125, 2.1729736328125, 2.4951171875, 2.8172607421875, 3.139404296875, 3.4615478515625, 3.78369140625, 4.1058349609375, 4.427978515625, 4.7501220703125, 5.072265625, 5.3944091796875, 5.716552734375, 6.0386962890625, 6.36083984375, 6.6829833984375, 7.005126953125, 7.3272705078125, 7.6494140625, 7.9715576171875, 8.293701171875, 8.6158447265625, 8.93798828125, 9.2601318359375, 9.582275390625, 9.9044189453125, 10.2265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 4.0, 8.0, 3.0, 13.0, 12.0, 7.0, 22.0, 15.0, 19.0, 24.0, 20.0, 17.0, 14.0, 30.0, 29.0, 39.0, 33.0, 37.0, 34.0, 43.0, 37.0, 42.0, 37.0, 42.0, 40.0, 40.0, 45.0, 39.0, 24.0, 28.0, 21.0, 11.0, 16.0, 33.0, 24.0, 21.0, 15.0, 13.0, 12.0, 8.0, 12.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-26.218730926513672, -25.436527252197266, -24.654325485229492, -23.872121810913086, -23.089920043945312, -22.307716369628906, -21.5255126953125, -20.743309020996094, -19.96110725402832, -19.178903579711914, -18.39670181274414, -17.614498138427734, -16.832294464111328, -16.050092697143555, -15.267889022827148, -14.485686302185059, -13.703483581542969, -12.921280860900879, -12.139078140258789, -11.356874465942383, -10.574671745300293, -9.792469024658203, -9.010265350341797, -8.228062629699707, -7.445859909057617, -6.663657188415527, -5.881453990936279, -5.099250793457031, -4.317048072814941, -3.5348451137542725, -2.7526421546936035, -1.9704389572143555, -1.1882381439208984, -0.4060351848602295, 0.37616777420043945, 1.1583707332611084, 1.9405736923217773, 2.7227766513824463, 3.5049796104431152, 4.287182807922363, 5.069385528564453, 5.851588249206543, 6.633791446685791, 7.415994644165039, 8.198197364807129, 8.980400085449219, 9.762603759765625, 10.544806480407715, 11.327009201049805, 12.109211921691895, 12.891414642333984, 13.67361831665039, 14.45582103729248, 15.23802375793457, 16.020227432250977, 16.80242919921875, 17.584632873535156, 18.366836547851562, 19.149038314819336, 19.931241989135742, 20.713443756103516, 21.495647430419922, 22.277851104736328, 23.060054779052734, 23.842256546020508]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 5.0, 5.0, 7.0, 12.0, 12.0, 17.0, 14.0, 14.0, 27.0, 12.0, 25.0, 21.0, 22.0, 29.0, 38.0, 32.0, 42.0, 39.0, 35.0, 34.0, 34.0, 40.0, 43.0, 36.0, 34.0, 45.0, 55.0, 40.0, 25.0, 25.0, 21.0, 20.0, 22.0, 13.0, 19.0, 13.0, 13.0, 17.0, 14.0, 5.0, 7.0, 4.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.830825805664062, -26.948915481567383, -26.067005157470703, -25.185094833374023, -24.303184509277344, -23.421274185180664, -22.539363861083984, -21.657451629638672, -20.775543212890625, -19.893632888793945, -19.011722564697266, -18.129812240600586, -17.247901916503906, -16.365991592407227, -15.48408031463623, -14.60216999053955, -13.720258712768555, -12.838348388671875, -11.956438064575195, -11.074527740478516, -10.192617416381836, -9.310707092285156, -8.42879581451416, -7.5468854904174805, -6.664975166320801, -5.783064842224121, -4.901154518127441, -4.0192437171936035, -3.137333393096924, -2.255423069000244, -1.3735122680664062, -0.49160194396972656, 0.3903064727783203, 1.2722169160842896, 2.154127359390259, 3.0360379219055176, 3.9179482460021973, 4.799858570098877, 5.681769371032715, 6.5636796951293945, 7.445590019226074, 8.327500343322754, 9.209410667419434, 10.09132194519043, 10.97323226928711, 11.855142593383789, 12.737052917480469, 13.618963241577148, 14.500873565673828, 15.382783889770508, 16.264694213867188, 17.146604537963867, 18.028514862060547, 18.910425186157227, 19.792335510253906, 20.67424774169922, 21.556156158447266, 22.438066482543945, 23.319976806640625, 24.201887130737305, 25.083797454833984, 25.965707778930664, 26.847618103027344, 27.729530334472656, 28.611440658569336]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 6.0, 5.0, 6.0, 23.0, 26.0, 38.0, 64.0, 82.0, 111.0, 177.0, 263.0, 409.0, 645.0, 935.0, 1381.0, 2055.0, 3235.0, 4850.0, 7498.0, 11061.0, 16878.0, 25113.0, 38372.0, 55552.0, 77076.0, 101115.0, 120944.0, 129356.0, 119707.0, 97734.0, 73870.0, 52699.0, 35933.0, 24160.0, 16247.0, 10574.0, 6891.0, 4632.0, 2969.0, 1991.0, 1197.0, 861.0, 594.0, 391.0, 284.0, 185.0, 125.0, 76.0, 62.0, 37.0, 15.0, 19.0, 10.0, 10.0, 4.0, 9.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.76171875, -3.63812255859375, -3.5145263671875, -3.39093017578125, -3.267333984375, -3.14373779296875, -3.0201416015625, -2.89654541015625, -2.77294921875, -2.64935302734375, -2.5257568359375, -2.40216064453125, -2.278564453125, -2.15496826171875, -2.0313720703125, -1.90777587890625, -1.7841796875, -1.66058349609375, -1.5369873046875, -1.41339111328125, -1.289794921875, -1.16619873046875, -1.0426025390625, -0.91900634765625, -0.79541015625, -0.67181396484375, -0.5482177734375, -0.42462158203125, -0.301025390625, -0.17742919921875, -0.0538330078125, 0.06976318359375, 0.193359375, 0.31695556640625, 0.4405517578125, 0.56414794921875, 0.687744140625, 0.81134033203125, 0.9349365234375, 1.05853271484375, 1.18212890625, 1.30572509765625, 1.4293212890625, 1.55291748046875, 1.676513671875, 1.80010986328125, 1.9237060546875, 2.04730224609375, 2.1708984375, 2.29449462890625, 2.4180908203125, 2.54168701171875, 2.665283203125, 2.78887939453125, 2.9124755859375, 3.03607177734375, 3.15966796875, 3.28326416015625, 3.4068603515625, 3.53045654296875, 3.654052734375, 3.77764892578125, 3.9012451171875, 4.02484130859375, 4.1484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 8.0, 6.0, 11.0, 16.0, 14.0, 15.0, 16.0, 20.0, 30.0, 25.0, 28.0, 20.0, 34.0, 36.0, 42.0, 37.0, 29.0, 39.0, 35.0, 43.0, 57.0, 38.0, 52.0, 40.0, 31.0, 36.0, 23.0, 32.0, 26.0, 22.0, 20.0, 15.0, 14.0, 16.0, 15.0, 10.0, 18.0, 8.0, 5.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.328125, -26.374755859375, -25.42138671875, -24.468017578125, -23.5146484375, -22.561279296875, -21.60791015625, -20.654541015625, -19.701171875, -18.747802734375, -17.79443359375, -16.841064453125, -15.8876953125, -14.934326171875, -13.98095703125, -13.027587890625, -12.07421875, -11.120849609375, -10.16748046875, -9.214111328125, -8.2607421875, -7.307373046875, -6.35400390625, -5.400634765625, -4.447265625, -3.493896484375, -2.54052734375, -1.587158203125, -0.6337890625, 0.319580078125, 1.27294921875, 2.226318359375, 3.1796875, 4.133056640625, 5.08642578125, 6.039794921875, 6.9931640625, 7.946533203125, 8.89990234375, 9.853271484375, 10.806640625, 11.760009765625, 12.71337890625, 13.666748046875, 14.6201171875, 15.573486328125, 16.52685546875, 17.480224609375, 18.43359375, 19.386962890625, 20.34033203125, 21.293701171875, 22.2470703125, 23.200439453125, 24.15380859375, 25.107177734375, 26.060546875, 27.013916015625, 27.96728515625, 28.920654296875, 29.8740234375, 30.827392578125, 31.78076171875, 32.734130859375, 33.6875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 9.0, 16.0, 16.0, 26.0, 30.0, 43.0, 74.0, 101.0, 185.0, 261.0, 398.0, 645.0, 1050.0, 1621.0, 2822.0, 4594.0, 7709.0, 12947.0, 21951.0, 37213.0, 61693.0, 96930.0, 137971.0, 165875.0, 159423.0, 124050.0, 82998.0, 51810.0, 30671.0, 18246.0, 10852.0, 6386.0, 3838.0, 2342.0, 1391.0, 810.0, 524.0, 366.0, 223.0, 134.0, 115.0, 58.0, 38.0, 40.0, 28.0, 11.0, 8.0, 8.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.953125, -4.79241943359375, -4.6317138671875, -4.47100830078125, -4.310302734375, -4.14959716796875, -3.9888916015625, -3.82818603515625, -3.66748046875, -3.50677490234375, -3.3460693359375, -3.18536376953125, -3.024658203125, -2.86395263671875, -2.7032470703125, -2.54254150390625, -2.3818359375, -2.22113037109375, -2.0604248046875, -1.89971923828125, -1.739013671875, -1.57830810546875, -1.4176025390625, -1.25689697265625, -1.09619140625, -0.93548583984375, -0.7747802734375, -0.61407470703125, -0.453369140625, -0.29266357421875, -0.1319580078125, 0.02874755859375, 0.189453125, 0.35015869140625, 0.5108642578125, 0.67156982421875, 0.832275390625, 0.99298095703125, 1.1536865234375, 1.31439208984375, 1.47509765625, 1.63580322265625, 1.7965087890625, 1.95721435546875, 2.117919921875, 2.27862548828125, 2.4393310546875, 2.60003662109375, 2.7607421875, 2.92144775390625, 3.0821533203125, 3.24285888671875, 3.403564453125, 3.56427001953125, 3.7249755859375, 3.88568115234375, 4.04638671875, 4.20709228515625, 4.3677978515625, 4.52850341796875, 4.689208984375, 4.84991455078125, 5.0106201171875, 5.17132568359375, 5.33203125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 2.0, 4.0, 8.0, 5.0, 10.0, 7.0, 11.0, 11.0, 14.0, 17.0, 16.0, 27.0, 26.0, 22.0, 24.0, 20.0, 41.0, 40.0, 37.0, 38.0, 25.0, 37.0, 27.0, 29.0, 33.0, 41.0, 39.0, 27.0, 35.0, 32.0, 32.0, 32.0, 31.0, 19.0, 18.0, 18.0, 24.0, 21.0, 20.0, 15.0, 14.0, 11.0, 15.0, 7.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-17.140625, -16.605224609375, -16.06982421875, -15.534423828125, -14.9990234375, -14.463623046875, -13.92822265625, -13.392822265625, -12.857421875, -12.322021484375, -11.78662109375, -11.251220703125, -10.7158203125, -10.180419921875, -9.64501953125, -9.109619140625, -8.57421875, -8.038818359375, -7.50341796875, -6.968017578125, -6.4326171875, -5.897216796875, -5.36181640625, -4.826416015625, -4.291015625, -3.755615234375, -3.22021484375, -2.684814453125, -2.1494140625, -1.614013671875, -1.07861328125, -0.543212890625, -0.0078125, 0.527587890625, 1.06298828125, 1.598388671875, 2.1337890625, 2.669189453125, 3.20458984375, 3.739990234375, 4.275390625, 4.810791015625, 5.34619140625, 5.881591796875, 6.4169921875, 6.952392578125, 7.48779296875, 8.023193359375, 8.55859375, 9.093994140625, 9.62939453125, 10.164794921875, 10.7001953125, 11.235595703125, 11.77099609375, 12.306396484375, 12.841796875, 13.377197265625, 13.91259765625, 14.447998046875, 14.9833984375, 15.518798828125, 16.05419921875, 16.589599609375, 17.125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 7.0, 11.0, 12.0, 21.0, 29.0, 35.0, 65.0, 84.0, 147.0, 210.0, 387.0, 689.0, 1190.0, 2481.0, 5359.0, 13580.0, 38566.0, 124402.0, 349906.0, 336205.0, 116505.0, 35674.0, 12493.0, 5161.0, 2442.0, 1274.0, 653.0, 376.0, 195.0, 138.0, 82.0, 46.0, 36.0, 25.0, 23.0, 12.0, 11.0, 7.0, 4.0, 5.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6396484375, -1.5883636474609375, -1.537078857421875, -1.4857940673828125, -1.43450927734375, -1.3832244873046875, -1.331939697265625, -1.2806549072265625, -1.2293701171875, -1.1780853271484375, -1.126800537109375, -1.0755157470703125, -1.02423095703125, -0.9729461669921875, -0.921661376953125, -0.8703765869140625, -0.819091796875, -0.7678070068359375, -0.716522216796875, -0.6652374267578125, -0.61395263671875, -0.5626678466796875, -0.511383056640625, -0.4600982666015625, -0.4088134765625, -0.3575286865234375, -0.306243896484375, -0.2549591064453125, -0.20367431640625, -0.1523895263671875, -0.101104736328125, -0.0498199462890625, 0.00146484375, 0.0527496337890625, 0.104034423828125, 0.1553192138671875, 0.20660400390625, 0.2578887939453125, 0.309173583984375, 0.3604583740234375, 0.4117431640625, 0.4630279541015625, 0.514312744140625, 0.5655975341796875, 0.61688232421875, 0.6681671142578125, 0.719451904296875, 0.7707366943359375, 0.822021484375, 0.8733062744140625, 0.924591064453125, 0.9758758544921875, 1.02716064453125, 1.0784454345703125, 1.129730224609375, 1.1810150146484375, 1.2322998046875, 1.2835845947265625, 1.334869384765625, 1.3861541748046875, 1.43743896484375, 1.4887237548828125, 1.540008544921875, 1.5912933349609375, 1.642578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 8.0, 6.0, 7.0, 5.0, 12.0, 7.0, 13.0, 11.0, 32.0, 21.0, 24.0, 25.0, 33.0, 48.0, 52.0, 48.0, 38.0, 57.0, 59.0, 54.0, 63.0, 47.0, 34.0, 42.0, 45.0, 36.0, 30.0, 23.0, 24.0, 19.0, 12.0, 18.0, 9.0, 4.0, 9.0, 6.0, 7.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.666515350341797e-05, -8.384697139263153e-05, -8.102878928184509e-05, -7.821060717105865e-05, -7.539242506027222e-05, -7.257424294948578e-05, -6.975606083869934e-05, -6.69378787279129e-05, -6.411969661712646e-05, -6.130151450634003e-05, -5.848333239555359e-05, -5.566515028476715e-05, -5.284696817398071e-05, -5.0028786063194275e-05, -4.721060395240784e-05, -4.43924218416214e-05, -4.157423973083496e-05, -3.875605762004852e-05, -3.5937875509262085e-05, -3.311969339847565e-05, -3.030151128768921e-05, -2.748332917690277e-05, -2.4665147066116333e-05, -2.1846964955329895e-05, -1.9028782844543457e-05, -1.621060073375702e-05, -1.3392418622970581e-05, -1.0574236512184143e-05, -7.756054401397705e-06, -4.937872290611267e-06, -2.119690179824829e-06, 6.984919309616089e-07, 3.516674041748047e-06, 6.334856152534485e-06, 9.153038263320923e-06, 1.197122037410736e-05, 1.4789402484893799e-05, 1.7607584595680237e-05, 2.0425766706466675e-05, 2.3243948817253113e-05, 2.606213092803955e-05, 2.888031303882599e-05, 3.169849514961243e-05, 3.4516677260398865e-05, 3.73348593711853e-05, 4.015304148197174e-05, 4.297122359275818e-05, 4.578940570354462e-05, 4.8607587814331055e-05, 5.142576992511749e-05, 5.424395203590393e-05, 5.706213414669037e-05, 5.988031625747681e-05, 6.269849836826324e-05, 6.551668047904968e-05, 6.833486258983612e-05, 7.115304470062256e-05, 7.3971226811409e-05, 7.678940892219543e-05, 7.960759103298187e-05, 8.242577314376831e-05, 8.524395525455475e-05, 8.806213736534119e-05, 9.088031947612762e-05, 9.369850158691406e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 10.0, 9.0, 22.0, 23.0, 36.0, 45.0, 59.0, 85.0, 109.0, 182.0, 249.0, 468.0, 687.0, 1167.0, 1996.0, 3723.0, 6929.0, 13571.0, 27314.0, 57751.0, 123364.0, 234646.0, 268297.0, 159230.0, 75871.0, 35658.0, 17408.0, 8777.0, 4629.0, 2499.0, 1443.0, 826.0, 499.0, 343.0, 181.0, 136.0, 93.0, 71.0, 44.0, 29.0, 23.0, 12.0, 14.0, 12.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.9375, -1.877288818359375, -1.81707763671875, -1.756866455078125, -1.6966552734375, -1.636444091796875, -1.57623291015625, -1.516021728515625, -1.455810546875, -1.395599365234375, -1.33538818359375, -1.275177001953125, -1.2149658203125, -1.154754638671875, -1.09454345703125, -1.034332275390625, -0.97412109375, -0.913909912109375, -0.85369873046875, -0.793487548828125, -0.7332763671875, -0.673065185546875, -0.61285400390625, -0.552642822265625, -0.492431640625, -0.432220458984375, -0.37200927734375, -0.311798095703125, -0.2515869140625, -0.191375732421875, -0.13116455078125, -0.070953369140625, -0.0107421875, 0.049468994140625, 0.10968017578125, 0.169891357421875, 0.2301025390625, 0.290313720703125, 0.35052490234375, 0.410736083984375, 0.470947265625, 0.531158447265625, 0.59136962890625, 0.651580810546875, 0.7117919921875, 0.772003173828125, 0.83221435546875, 0.892425537109375, 0.95263671875, 1.012847900390625, 1.07305908203125, 1.133270263671875, 1.1934814453125, 1.253692626953125, 1.31390380859375, 1.374114990234375, 1.434326171875, 1.494537353515625, 1.55474853515625, 1.614959716796875, 1.6751708984375, 1.735382080078125, 1.79559326171875, 1.855804443359375, 1.916015625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 8.0, 7.0, 8.0, 13.0, 9.0, 11.0, 19.0, 15.0, 27.0, 20.0, 36.0, 27.0, 49.0, 50.0, 50.0, 58.0, 68.0, 73.0, 49.0, 39.0, 37.0, 46.0, 38.0, 38.0, 36.0, 25.0, 27.0, 9.0, 18.0, 9.0, 11.0, 14.0, 10.0, 6.0, 6.0, 11.0, 3.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.33447265625, -0.32260894775390625, -0.3107452392578125, -0.29888153076171875, -0.287017822265625, -0.27515411376953125, -0.2632904052734375, -0.25142669677734375, -0.23956298828125, -0.22769927978515625, -0.2158355712890625, -0.20397186279296875, -0.192108154296875, -0.18024444580078125, -0.1683807373046875, -0.15651702880859375, -0.1446533203125, -0.13278961181640625, -0.1209259033203125, -0.10906219482421875, -0.097198486328125, -0.08533477783203125, -0.0734710693359375, -0.06160736083984375, -0.04974365234375, -0.03787994384765625, -0.0260162353515625, -0.01415252685546875, -0.002288818359375, 0.00957489013671875, 0.0214385986328125, 0.03330230712890625, 0.045166015625, 0.05702972412109375, 0.0688934326171875, 0.08075714111328125, 0.092620849609375, 0.10448455810546875, 0.1163482666015625, 0.12821197509765625, 0.14007568359375, 0.15193939208984375, 0.1638031005859375, 0.17566680908203125, 0.187530517578125, 0.19939422607421875, 0.2112579345703125, 0.22312164306640625, 0.2349853515625, 0.24684906005859375, 0.2587127685546875, 0.27057647705078125, 0.282440185546875, 0.29430389404296875, 0.3061676025390625, 0.31803131103515625, 0.32989501953125, 0.34175872802734375, 0.3536224365234375, 0.36548614501953125, 0.377349853515625, 0.38921356201171875, 0.4010772705078125, 0.41294097900390625, 0.4248046875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 6.0, 6.0, 6.0, 10.0, 10.0, 11.0, 20.0, 22.0, 23.0, 16.0, 18.0, 22.0, 16.0, 31.0, 34.0, 40.0, 43.0, 42.0, 32.0, 37.0, 51.0, 28.0, 46.0, 44.0, 44.0, 45.0, 40.0, 30.0, 23.0, 23.0, 10.0, 25.0, 28.0, 27.0, 18.0, 14.0, 18.0, 10.0, 8.0, 9.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.539588928222656, -26.726106643676758, -25.91262435913086, -25.099140167236328, -24.28565788269043, -23.47217559814453, -22.658693313598633, -21.845211029052734, -21.031726837158203, -20.218244552612305, -19.404762268066406, -18.591278076171875, -17.777795791625977, -16.964313507080078, -16.15083122253418, -15.337347984313965, -14.523865699768066, -13.710383415222168, -12.896900177001953, -12.083417892456055, -11.26993465423584, -10.456452369689941, -9.642969131469727, -8.829486846923828, -8.01600456237793, -7.202521800994873, -6.389039039611816, -5.575556755065918, -4.762073516845703, -3.9485912322998047, -3.135108470916748, -2.3216257095336914, -1.5081424713134766, -0.6946597695350647, 0.11882293224334717, 0.9323055744171143, 1.745788335800171, 2.5592708587646484, 3.372753620147705, 4.186236381530762, 4.999719142913818, 5.813201904296875, 6.626684665679932, 7.440167427062988, 8.253649711608887, 9.067132949829102, 9.880615234375, 10.694097518920898, 11.507580757141113, 12.321063041687012, 13.134546279907227, 13.948028564453125, 14.76151180267334, 15.574994087219238, 16.388477325439453, 17.20195960998535, 18.01544189453125, 18.82892417907715, 19.642406463623047, 20.455890655517578, 21.269372940063477, 22.082855224609375, 22.896337509155273, 23.709819793701172, 24.523303985595703]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 8.0, 4.0, 7.0, 11.0, 14.0, 15.0, 13.0, 16.0, 25.0, 15.0, 24.0, 21.0, 22.0, 31.0, 37.0, 35.0, 41.0, 39.0, 34.0, 33.0, 34.0, 41.0, 45.0, 33.0, 35.0, 48.0, 52.0, 39.0, 24.0, 27.0, 19.0, 18.0, 23.0, 16.0, 17.0, 12.0, 14.0, 15.0, 14.0, 5.0, 7.0, 4.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.607845306396484, -26.72903823852539, -25.850229263305664, -24.97142219543457, -24.092613220214844, -23.21380615234375, -22.334997177124023, -21.45619010925293, -20.577381134033203, -19.69857406616211, -18.819765090942383, -17.94095802307129, -17.062149047851562, -16.18334197998047, -15.304533004760742, -14.425725936889648, -13.546917915344238, -12.668109893798828, -11.789301872253418, -10.910493850708008, -10.031685829162598, -9.152877807617188, -8.274070739746094, -7.395262241363525, -6.516454219818115, -5.637646198272705, -4.758838176727295, -3.880030393600464, -3.0012223720550537, -2.1224145889282227, -1.2436065673828125, -0.36479854583740234, 0.5140094757080078, 1.392817497253418, 2.271625518798828, 3.150433301925659, 4.029241561889648, 4.9080491065979, 5.7868571281433105, 6.665665149688721, 7.544473171234131, 8.423280715942383, 9.302088737487793, 10.180896759033203, 11.059704780578613, 11.938512802124023, 12.817320823669434, 13.696128845214844, 14.574936866760254, 15.453744888305664, 16.332551956176758, 17.211360931396484, 18.090167999267578, 18.968976974487305, 19.8477840423584, 20.726593017578125, 21.60540008544922, 22.484207153320312, 23.36301612854004, 24.241823196411133, 25.12063217163086, 25.999439239501953, 26.87824821472168, 27.757055282592773, 28.6358642578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 4.0, 6.0, 5.0, 20.0, 18.0, 40.0, 61.0, 86.0, 122.0, 193.0, 314.0, 526.0, 787.0, 1217.0, 1913.0, 2756.0, 4118.0, 6061.0, 8757.0, 12657.0, 17472.0, 24140.0, 31864.0, 41121.0, 51869.0, 62204.0, 71844.0, 80007.0, 84825.0, 85046.0, 82957.0, 75697.0, 67204.0, 56202.0, 45735.0, 35989.0, 27404.0, 20330.0, 14755.0, 10256.0, 7133.0, 5028.0, 3471.0, 2235.0, 1455.0, 954.0, 638.0, 408.0, 260.0, 163.0, 86.0, 58.0, 35.0, 29.0, 15.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0], "bins": [-13.8984375, -13.4671630859375, -13.035888671875, -12.6046142578125, -12.17333984375, -11.7420654296875, -11.310791015625, -10.8795166015625, -10.4482421875, -10.0169677734375, -9.585693359375, -9.1544189453125, -8.72314453125, -8.2918701171875, -7.860595703125, -7.4293212890625, -6.998046875, -6.5667724609375, -6.135498046875, -5.7042236328125, -5.27294921875, -4.8416748046875, -4.410400390625, -3.9791259765625, -3.5478515625, -3.1165771484375, -2.685302734375, -2.2540283203125, -1.82275390625, -1.3914794921875, -0.960205078125, -0.5289306640625, -0.09765625, 0.3336181640625, 0.764892578125, 1.1961669921875, 1.62744140625, 2.0587158203125, 2.489990234375, 2.9212646484375, 3.3525390625, 3.7838134765625, 4.215087890625, 4.6463623046875, 5.07763671875, 5.5089111328125, 5.940185546875, 6.3714599609375, 6.802734375, 7.2340087890625, 7.665283203125, 8.0965576171875, 8.52783203125, 8.9591064453125, 9.390380859375, 9.8216552734375, 10.2529296875, 10.6842041015625, 11.115478515625, 11.5467529296875, 11.97802734375, 12.4093017578125, 12.840576171875, 13.2718505859375, 13.703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 10.0, 9.0, 14.0, 9.0, 11.0, 20.0, 19.0, 15.0, 24.0, 18.0, 19.0, 21.0, 25.0, 39.0, 23.0, 32.0, 43.0, 40.0, 26.0, 40.0, 30.0, 47.0, 39.0, 41.0, 33.0, 35.0, 47.0, 32.0, 27.0, 27.0, 18.0, 21.0, 24.0, 16.0, 13.0, 18.0, 14.0, 12.0, 10.0, 6.0, 11.0, 5.0, 7.0, 6.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-28.84375, -27.9677734375, -27.091796875, -26.2158203125, -25.33984375, -24.4638671875, -23.587890625, -22.7119140625, -21.8359375, -20.9599609375, -20.083984375, -19.2080078125, -18.33203125, -17.4560546875, -16.580078125, -15.7041015625, -14.828125, -13.9521484375, -13.076171875, -12.2001953125, -11.32421875, -10.4482421875, -9.572265625, -8.6962890625, -7.8203125, -6.9443359375, -6.068359375, -5.1923828125, -4.31640625, -3.4404296875, -2.564453125, -1.6884765625, -0.8125, 0.0634765625, 0.939453125, 1.8154296875, 2.69140625, 3.5673828125, 4.443359375, 5.3193359375, 6.1953125, 7.0712890625, 7.947265625, 8.8232421875, 9.69921875, 10.5751953125, 11.451171875, 12.3271484375, 13.203125, 14.0791015625, 14.955078125, 15.8310546875, 16.70703125, 17.5830078125, 18.458984375, 19.3349609375, 20.2109375, 21.0869140625, 21.962890625, 22.8388671875, 23.71484375, 24.5908203125, 25.466796875, 26.3427734375, 27.21875]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 8.0, 16.0, 40.0, 46.0, 90.0, 123.0, 193.0, 313.0, 439.0, 735.0, 1220.0, 1840.0, 2923.0, 4373.0, 6548.0, 10053.0, 14514.0, 20990.0, 29454.0, 40023.0, 51606.0, 65049.0, 77755.0, 88018.0, 94312.0, 95784.0, 90278.0, 80684.0, 68736.0, 55069.0, 43041.0, 32276.0, 23153.0, 16188.0, 11074.0, 7467.0, 5066.0, 3279.0, 2075.0, 1343.0, 902.0, 550.0, 349.0, 208.0, 141.0, 86.0, 40.0, 26.0, 17.0, 21.0, 10.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0], "bins": [-16.078125, -15.577880859375, -15.07763671875, -14.577392578125, -14.0771484375, -13.576904296875, -13.07666015625, -12.576416015625, -12.076171875, -11.575927734375, -11.07568359375, -10.575439453125, -10.0751953125, -9.574951171875, -9.07470703125, -8.574462890625, -8.07421875, -7.573974609375, -7.07373046875, -6.573486328125, -6.0732421875, -5.572998046875, -5.07275390625, -4.572509765625, -4.072265625, -3.572021484375, -3.07177734375, -2.571533203125, -2.0712890625, -1.571044921875, -1.07080078125, -0.570556640625, -0.0703125, 0.429931640625, 0.93017578125, 1.430419921875, 1.9306640625, 2.430908203125, 2.93115234375, 3.431396484375, 3.931640625, 4.431884765625, 4.93212890625, 5.432373046875, 5.9326171875, 6.432861328125, 6.93310546875, 7.433349609375, 7.93359375, 8.433837890625, 8.93408203125, 9.434326171875, 9.9345703125, 10.434814453125, 10.93505859375, 11.435302734375, 11.935546875, 12.435791015625, 12.93603515625, 13.436279296875, 13.9365234375, 14.436767578125, 14.93701171875, 15.437255859375, 15.9375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 4.0, 5.0, 7.0, 5.0, 17.0, 8.0, 8.0, 15.0, 20.0, 17.0, 29.0, 24.0, 34.0, 30.0, 32.0, 36.0, 30.0, 37.0, 36.0, 45.0, 37.0, 35.0, 42.0, 38.0, 27.0, 46.0, 44.0, 35.0, 42.0, 28.0, 26.0, 24.0, 29.0, 23.0, 10.0, 13.0, 12.0, 11.0, 7.0, 7.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.8125, -20.227294921875, -19.64208984375, -19.056884765625, -18.4716796875, -17.886474609375, -17.30126953125, -16.716064453125, -16.130859375, -15.545654296875, -14.96044921875, -14.375244140625, -13.7900390625, -13.204833984375, -12.61962890625, -12.034423828125, -11.44921875, -10.864013671875, -10.27880859375, -9.693603515625, -9.1083984375, -8.523193359375, -7.93798828125, -7.352783203125, -6.767578125, -6.182373046875, -5.59716796875, -5.011962890625, -4.4267578125, -3.841552734375, -3.25634765625, -2.671142578125, -2.0859375, -1.500732421875, -0.91552734375, -0.330322265625, 0.2548828125, 0.840087890625, 1.42529296875, 2.010498046875, 2.595703125, 3.180908203125, 3.76611328125, 4.351318359375, 4.9365234375, 5.521728515625, 6.10693359375, 6.692138671875, 7.27734375, 7.862548828125, 8.44775390625, 9.032958984375, 9.6181640625, 10.203369140625, 10.78857421875, 11.373779296875, 11.958984375, 12.544189453125, 13.12939453125, 13.714599609375, 14.2998046875, 14.885009765625, 15.47021484375, 16.055419921875, 16.640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 9.0, 16.0, 34.0, 50.0, 82.0, 154.0, 226.0, 398.0, 616.0, 1035.0, 1796.0, 3078.0, 5159.0, 8500.0, 13548.0, 21141.0, 31792.0, 46243.0, 62855.0, 80727.0, 96858.0, 107683.0, 110861.0, 106047.0, 93441.0, 76358.0, 58810.0, 42115.0, 28804.0, 19171.0, 12197.0, 7407.0, 4549.0, 2776.0, 1690.0, 910.0, 563.0, 318.0, 203.0, 119.0, 86.0, 50.0, 30.0, 16.0, 15.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-6.16015625, -5.96990966796875, -5.7796630859375, -5.58941650390625, -5.399169921875, -5.20892333984375, -5.0186767578125, -4.82843017578125, -4.63818359375, -4.44793701171875, -4.2576904296875, -4.06744384765625, -3.877197265625, -3.68695068359375, -3.4967041015625, -3.30645751953125, -3.1162109375, -2.92596435546875, -2.7357177734375, -2.54547119140625, -2.355224609375, -2.16497802734375, -1.9747314453125, -1.78448486328125, -1.59423828125, -1.40399169921875, -1.2137451171875, -1.02349853515625, -0.833251953125, -0.64300537109375, -0.4527587890625, -0.26251220703125, -0.072265625, 0.11798095703125, 0.3082275390625, 0.49847412109375, 0.688720703125, 0.87896728515625, 1.0692138671875, 1.25946044921875, 1.44970703125, 1.63995361328125, 1.8302001953125, 2.02044677734375, 2.210693359375, 2.40093994140625, 2.5911865234375, 2.78143310546875, 2.9716796875, 3.16192626953125, 3.3521728515625, 3.54241943359375, 3.732666015625, 3.92291259765625, 4.1131591796875, 4.30340576171875, 4.49365234375, 4.68389892578125, 4.8741455078125, 5.06439208984375, 5.254638671875, 5.44488525390625, 5.6351318359375, 5.82537841796875, 6.015625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 4.0, 7.0, 5.0, 10.0, 18.0, 16.0, 14.0, 23.0, 27.0, 22.0, 27.0, 25.0, 38.0, 43.0, 43.0, 40.0, 48.0, 39.0, 52.0, 29.0, 52.0, 43.0, 48.0, 34.0, 37.0, 35.0, 34.0, 20.0, 25.0, 16.0, 16.0, 21.0, 12.0, 10.0, 15.0, 11.0, 8.0, 6.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0006465911865234375, -0.0006256401538848877, -0.0006046891212463379, -0.0005837380886077881, -0.0005627870559692383, -0.0005418360233306885, -0.0005208849906921387, -0.0004999339580535889, -0.00047898292541503906, -0.00045803189277648926, -0.00043708086013793945, -0.00041612982749938965, -0.00039517879486083984, -0.00037422776222229004, -0.00035327672958374023, -0.00033232569694519043, -0.0003113746643066406, -0.0002904236316680908, -0.000269472599029541, -0.0002485215663909912, -0.0002275705337524414, -0.0002066195011138916, -0.0001856684684753418, -0.000164717435836792, -0.0001437664031982422, -0.00012281537055969238, -0.00010186433792114258, -8.091330528259277e-05, -5.996227264404297e-05, -3.9011240005493164e-05, -1.806020736694336e-05, 2.8908252716064453e-06, 2.384185791015625e-05, 4.4792890548706055e-05, 6.574392318725586e-05, 8.669495582580566e-05, 0.00010764598846435547, 0.00012859702110290527, 0.00014954805374145508, 0.00017049908638000488, 0.0001914501190185547, 0.0002124011516571045, 0.0002333521842956543, 0.0002543032169342041, 0.0002752542495727539, 0.0002962052822113037, 0.0003171563148498535, 0.0003381073474884033, 0.0003590583801269531, 0.00038000941276550293, 0.00040096044540405273, 0.00042191147804260254, 0.00044286251068115234, 0.00046381354331970215, 0.00048476457595825195, 0.0005057156085968018, 0.0005266666412353516, 0.0005476176738739014, 0.0005685687065124512, 0.000589519739151001, 0.0006104707717895508, 0.0006314218044281006, 0.0006523728370666504, 0.0006733238697052002, 0.00069427490234375]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 1.0, 8.0, 22.0, 33.0, 37.0, 63.0, 86.0, 189.0, 293.0, 467.0, 790.0, 1400.0, 2520.0, 4296.0, 7438.0, 12829.0, 21659.0, 35124.0, 54509.0, 78294.0, 102872.0, 123164.0, 132313.0, 125688.0, 107993.0, 82475.0, 58567.0, 38303.0, 23797.0, 14187.0, 8126.0, 4642.0, 2620.0, 1527.0, 886.0, 520.0, 312.0, 196.0, 126.0, 61.0, 51.0, 33.0, 16.0, 9.0, 6.0, 1.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.95703125, -6.71368408203125, -6.4703369140625, -6.22698974609375, -5.983642578125, -5.74029541015625, -5.4969482421875, -5.25360107421875, -5.01025390625, -4.76690673828125, -4.5235595703125, -4.28021240234375, -4.036865234375, -3.79351806640625, -3.5501708984375, -3.30682373046875, -3.0634765625, -2.82012939453125, -2.5767822265625, -2.33343505859375, -2.090087890625, -1.84674072265625, -1.6033935546875, -1.36004638671875, -1.11669921875, -0.87335205078125, -0.6300048828125, -0.38665771484375, -0.143310546875, 0.10003662109375, 0.3433837890625, 0.58673095703125, 0.830078125, 1.07342529296875, 1.3167724609375, 1.56011962890625, 1.803466796875, 2.04681396484375, 2.2901611328125, 2.53350830078125, 2.77685546875, 3.02020263671875, 3.2635498046875, 3.50689697265625, 3.750244140625, 3.99359130859375, 4.2369384765625, 4.48028564453125, 4.7236328125, 4.96697998046875, 5.2103271484375, 5.45367431640625, 5.697021484375, 5.94036865234375, 6.1837158203125, 6.42706298828125, 6.67041015625, 6.91375732421875, 7.1571044921875, 7.40045166015625, 7.643798828125, 7.88714599609375, 8.1304931640625, 8.37384033203125, 8.6171875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 3.0, 5.0, 13.0, 21.0, 13.0, 17.0, 20.0, 34.0, 33.0, 37.0, 49.0, 65.0, 72.0, 64.0, 79.0, 66.0, 61.0, 68.0, 58.0, 48.0, 41.0, 40.0, 25.0, 17.0, 18.0, 12.0, 4.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.34765625, -5.2008056640625, -5.053955078125, -4.9071044921875, -4.76025390625, -4.6134033203125, -4.466552734375, -4.3197021484375, -4.1728515625, -4.0260009765625, -3.879150390625, -3.7322998046875, -3.58544921875, -3.4385986328125, -3.291748046875, -3.1448974609375, -2.998046875, -2.8511962890625, -2.704345703125, -2.5574951171875, -2.41064453125, -2.2637939453125, -2.116943359375, -1.9700927734375, -1.8232421875, -1.6763916015625, -1.529541015625, -1.3826904296875, -1.23583984375, -1.0889892578125, -0.942138671875, -0.7952880859375, -0.6484375, -0.5015869140625, -0.354736328125, -0.2078857421875, -0.06103515625, 0.0858154296875, 0.232666015625, 0.3795166015625, 0.5263671875, 0.6732177734375, 0.820068359375, 0.9669189453125, 1.11376953125, 1.2606201171875, 1.407470703125, 1.5543212890625, 1.701171875, 1.8480224609375, 1.994873046875, 2.1417236328125, 2.28857421875, 2.4354248046875, 2.582275390625, 2.7291259765625, 2.8759765625, 3.0228271484375, 3.169677734375, 3.3165283203125, 3.46337890625, 3.6102294921875, 3.757080078125, 3.9039306640625, 4.05078125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 7.0, 9.0, 12.0, 7.0, 10.0, 15.0, 21.0, 7.0, 27.0, 15.0, 30.0, 31.0, 30.0, 20.0, 27.0, 45.0, 37.0, 42.0, 40.0, 47.0, 34.0, 43.0, 41.0, 29.0, 44.0, 34.0, 34.0, 39.0, 22.0, 23.0, 18.0, 23.0, 11.0, 24.0, 21.0, 19.0, 12.0, 9.0, 14.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.427213668823242, -25.63755989074707, -24.84790802001953, -24.05825424194336, -23.26860237121582, -22.47894859313965, -21.68929672241211, -20.899642944335938, -20.109989166259766, -19.320335388183594, -18.530683517456055, -17.741029739379883, -16.951377868652344, -16.161724090576172, -15.372071266174316, -14.582418441772461, -13.792766571044922, -13.003113746643066, -12.213460922241211, -11.423807144165039, -10.6341552734375, -9.844501495361328, -9.054848670959473, -8.265195846557617, -7.475543022155762, -6.685890197753906, -5.896237373352051, -5.106584072113037, -4.316931247711182, -3.527278423309326, -2.7376251220703125, -1.947972297668457, -1.1583213806152344, -0.36866843700408936, 0.42098450660705566, 1.2106375694274902, 2.0002903938293457, 2.789943218231201, 3.579596519470215, 4.36924934387207, 5.158902168273926, 5.948554992675781, 6.738207817077637, 7.52786111831665, 8.317514419555664, 9.107166290283203, 9.896820068359375, 10.68647289276123, 11.476125717163086, 12.265778541564941, 13.055431365966797, 13.845085144042969, 14.634737014770508, 15.42439079284668, 16.21404266357422, 17.00369644165039, 17.793350219726562, 18.583003997802734, 19.372655868530273, 20.162309646606445, 20.951961517333984, 21.741615295410156, 22.531269073486328, 23.320920944213867, 24.110572814941406]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 0.0, 3.0, 6.0, 5.0, 4.0, 6.0, 9.0, 15.0, 12.0, 10.0, 17.0, 22.0, 19.0, 17.0, 12.0, 20.0, 30.0, 20.0, 34.0, 30.0, 32.0, 44.0, 35.0, 22.0, 48.0, 29.0, 33.0, 39.0, 39.0, 37.0, 40.0, 25.0, 44.0, 31.0, 22.0, 18.0, 23.0, 17.0, 20.0, 20.0, 14.0, 13.0, 9.0, 14.0, 10.0, 9.0, 7.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0], "bins": [-27.040788650512695, -26.192590713500977, -25.34439468383789, -24.496196746826172, -23.647998809814453, -22.799802780151367, -21.95160484313965, -21.103408813476562, -20.255210876464844, -19.407012939453125, -18.55881690979004, -17.71061897277832, -16.862422943115234, -16.014225006103516, -15.166027069091797, -14.317830085754395, -13.469633102416992, -12.62143611907959, -11.773239135742188, -10.925041198730469, -10.076844215393066, -9.228647232055664, -8.380449295043945, -7.532252311706543, -6.684055328369141, -5.835858345031738, -4.987660884857178, -4.139463424682617, -3.291266441345215, -2.4430694580078125, -1.594871997833252, -0.7466745376586914, 0.10152053833007812, 0.9497177600860596, 1.797914981842041, 2.6461122035980225, 3.494309425354004, 4.342506408691406, 5.190703868865967, 6.038901329040527, 6.88709831237793, 7.735295295715332, 8.583492279052734, 9.431690216064453, 10.279887199401855, 11.128084182739258, 11.976282119750977, 12.824479103088379, 13.672676086425781, 14.520873069763184, 15.369070053100586, 16.217267990112305, 17.06546401977539, 17.91366195678711, 18.761859893798828, 19.610057830810547, 20.458253860473633, 21.30645179748535, 22.154647827148438, 23.002845764160156, 23.851043701171875, 24.69923973083496, 25.54743766784668, 26.395633697509766, 27.243831634521484]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 11.0, 10.0, 29.0, 35.0, 70.0, 135.0, 219.0, 421.0, 748.0, 1123.0, 1943.0, 3011.0, 5241.0, 8197.0, 13118.0, 20438.0, 31227.0, 46811.0, 68162.0, 96449.0, 134381.0, 177285.0, 226564.0, 276061.0, 322527.0, 355998.0, 372262.0, 369075.0, 344991.0, 308245.0, 260467.0, 209333.0, 161810.0, 119834.0, 86005.0, 59701.0, 40361.0, 26310.0, 17210.0, 10947.0, 6840.0, 4170.0, 2625.0, 1594.0, 969.0, 559.0, 313.0, 191.0, 103.0, 70.0, 45.0, 27.0, 8.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.453125, -17.8544921875, -17.255859375, -16.6572265625, -16.05859375, -15.4599609375, -14.861328125, -14.2626953125, -13.6640625, -13.0654296875, -12.466796875, -11.8681640625, -11.26953125, -10.6708984375, -10.072265625, -9.4736328125, -8.875, -8.2763671875, -7.677734375, -7.0791015625, -6.48046875, -5.8818359375, -5.283203125, -4.6845703125, -4.0859375, -3.4873046875, -2.888671875, -2.2900390625, -1.69140625, -1.0927734375, -0.494140625, 0.1044921875, 0.703125, 1.3017578125, 1.900390625, 2.4990234375, 3.09765625, 3.6962890625, 4.294921875, 4.8935546875, 5.4921875, 6.0908203125, 6.689453125, 7.2880859375, 7.88671875, 8.4853515625, 9.083984375, 9.6826171875, 10.28125, 10.8798828125, 11.478515625, 12.0771484375, 12.67578125, 13.2744140625, 13.873046875, 14.4716796875, 15.0703125, 15.6689453125, 16.267578125, 16.8662109375, 17.46484375, 18.0634765625, 18.662109375, 19.2607421875, 19.859375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 2.0, 9.0, 1.0, 6.0, 12.0, 11.0, 13.0, 13.0, 12.0, 19.0, 22.0, 20.0, 20.0, 27.0, 25.0, 20.0, 31.0, 33.0, 37.0, 42.0, 29.0, 40.0, 44.0, 35.0, 38.0, 41.0, 36.0, 42.0, 39.0, 27.0, 28.0, 26.0, 29.0, 20.0, 8.0, 18.0, 26.0, 22.0, 14.0, 13.0, 9.0, 7.0, 3.0, 9.0, 5.0, 4.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-24.046875, -23.3056640625, -22.564453125, -21.8232421875, -21.08203125, -20.3408203125, -19.599609375, -18.8583984375, -18.1171875, -17.3759765625, -16.634765625, -15.8935546875, -15.15234375, -14.4111328125, -13.669921875, -12.9287109375, -12.1875, -11.4462890625, -10.705078125, -9.9638671875, -9.22265625, -8.4814453125, -7.740234375, -6.9990234375, -6.2578125, -5.5166015625, -4.775390625, -4.0341796875, -3.29296875, -2.5517578125, -1.810546875, -1.0693359375, -0.328125, 0.4130859375, 1.154296875, 1.8955078125, 2.63671875, 3.3779296875, 4.119140625, 4.8603515625, 5.6015625, 6.3427734375, 7.083984375, 7.8251953125, 8.56640625, 9.3076171875, 10.048828125, 10.7900390625, 11.53125, 12.2724609375, 13.013671875, 13.7548828125, 14.49609375, 15.2373046875, 15.978515625, 16.7197265625, 17.4609375, 18.2021484375, 18.943359375, 19.6845703125, 20.42578125, 21.1669921875, 21.908203125, 22.6494140625, 23.390625]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 12.0, 20.0, 27.0, 65.0, 99.0, 172.0, 316.0, 551.0, 1016.0, 1772.0, 2883.0, 4847.0, 8182.0, 13100.0, 20800.0, 32164.0, 48395.0, 71408.0, 100836.0, 136966.0, 181598.0, 226880.0, 274677.0, 314341.0, 346614.0, 362459.0, 358773.0, 339575.0, 304291.0, 259835.0, 213387.0, 168000.0, 125982.0, 91825.0, 63586.0, 43012.0, 28474.0, 18454.0, 11455.0, 7197.0, 4321.0, 2505.0, 1428.0, 884.0, 491.0, 258.0, 157.0, 97.0, 52.0, 23.0, 19.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.03125, -18.393798828125, -17.75634765625, -17.118896484375, -16.4814453125, -15.843994140625, -15.20654296875, -14.569091796875, -13.931640625, -13.294189453125, -12.65673828125, -12.019287109375, -11.3818359375, -10.744384765625, -10.10693359375, -9.469482421875, -8.83203125, -8.194580078125, -7.55712890625, -6.919677734375, -6.2822265625, -5.644775390625, -5.00732421875, -4.369873046875, -3.732421875, -3.094970703125, -2.45751953125, -1.820068359375, -1.1826171875, -0.545166015625, 0.09228515625, 0.729736328125, 1.3671875, 2.004638671875, 2.64208984375, 3.279541015625, 3.9169921875, 4.554443359375, 5.19189453125, 5.829345703125, 6.466796875, 7.104248046875, 7.74169921875, 8.379150390625, 9.0166015625, 9.654052734375, 10.29150390625, 10.928955078125, 11.56640625, 12.203857421875, 12.84130859375, 13.478759765625, 14.1162109375, 14.753662109375, 15.39111328125, 16.028564453125, 16.666015625, 17.303466796875, 17.94091796875, 18.578369140625, 19.2158203125, 19.853271484375, 20.49072265625, 21.128173828125, 21.765625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 11.0, 16.0, 13.0, 10.0, 25.0, 36.0, 39.0, 46.0, 55.0, 61.0, 85.0, 102.0, 102.0, 139.0, 146.0, 167.0, 160.0, 178.0, 183.0, 177.0, 186.0, 205.0, 195.0, 205.0, 171.0, 184.0, 184.0, 137.0, 128.0, 121.0, 102.0, 101.0, 75.0, 69.0, 71.0, 46.0, 39.0, 18.0, 20.0, 17.0, 5.0, 22.0, 1.0, 7.0, 4.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.3984375, -12.0150146484375, -11.631591796875, -11.2481689453125, -10.86474609375, -10.4813232421875, -10.097900390625, -9.7144775390625, -9.3310546875, -8.9476318359375, -8.564208984375, -8.1807861328125, -7.79736328125, -7.4139404296875, -7.030517578125, -6.6470947265625, -6.263671875, -5.8802490234375, -5.496826171875, -5.1134033203125, -4.72998046875, -4.3465576171875, -3.963134765625, -3.5797119140625, -3.1962890625, -2.8128662109375, -2.429443359375, -2.0460205078125, -1.66259765625, -1.2791748046875, -0.895751953125, -0.5123291015625, -0.12890625, 0.2545166015625, 0.637939453125, 1.0213623046875, 1.40478515625, 1.7882080078125, 2.171630859375, 2.5550537109375, 2.9384765625, 3.3218994140625, 3.705322265625, 4.0887451171875, 4.47216796875, 4.8555908203125, 5.239013671875, 5.6224365234375, 6.005859375, 6.3892822265625, 6.772705078125, 7.1561279296875, 7.53955078125, 7.9229736328125, 8.306396484375, 8.6898193359375, 9.0732421875, 9.4566650390625, 9.840087890625, 10.2235107421875, 10.60693359375, 10.9903564453125, 11.373779296875, 11.7572021484375, 12.140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 11.0, 9.0, 7.0, 8.0, 12.0, 19.0, 13.0, 20.0, 18.0, 20.0, 21.0, 30.0, 33.0, 33.0, 30.0, 42.0, 41.0, 39.0, 34.0, 35.0, 50.0, 34.0, 33.0, 30.0, 49.0, 29.0, 35.0, 32.0, 26.0, 16.0, 27.0, 14.0, 14.0, 16.0, 20.0, 15.0, 16.0, 11.0, 8.0, 12.0, 4.0, 9.0, 4.0, 10.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-26.096071243286133, -25.275848388671875, -24.45562744140625, -23.635404586791992, -22.815183639526367, -21.99496078491211, -21.174739837646484, -20.354516983032227, -19.5342960357666, -18.714073181152344, -17.89385223388672, -17.07362937927246, -16.253408432006836, -15.433185577392578, -14.612964630126953, -13.792741775512695, -12.972519874572754, -12.152297973632812, -11.332076072692871, -10.51185417175293, -9.691632270812988, -8.871410369873047, -8.051187515258789, -7.230966091156006, -6.4107441902160645, -5.590522289276123, -4.770300388336182, -3.950078248977661, -3.1298563480377197, -2.309634208679199, -1.4894123077392578, -0.6691904067993164, 0.151031494140625, 0.9712534546852112, 1.7914754152297974, 2.6116974353790283, 3.4319193363189697, 4.25214147567749, 5.072363376617432, 5.892585277557373, 6.7128071784973145, 7.533029079437256, 8.353251457214355, 9.173473358154297, 9.993695259094238, 10.81391716003418, 11.634139060974121, 12.454360961914062, 13.274582862854004, 14.094804763793945, 14.915026664733887, 15.735248565673828, 16.555471420288086, 17.37569236755371, 18.19591522216797, 19.016136169433594, 19.83635902404785, 20.65658187866211, 21.476802825927734, 22.297025680541992, 23.117246627807617, 23.937469482421875, 24.7576904296875, 25.577913284301758, 26.398134231567383]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 11.0, 8.0, 6.0, 4.0, 12.0, 17.0, 22.0, 17.0, 26.0, 26.0, 14.0, 36.0, 31.0, 32.0, 37.0, 32.0, 41.0, 38.0, 40.0, 42.0, 36.0, 39.0, 33.0, 40.0, 29.0, 31.0, 37.0, 27.0, 31.0, 34.0, 24.0, 18.0, 19.0, 22.0, 14.0, 14.0, 12.0, 7.0, 9.0, 3.0, 6.0, 3.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0], "bins": [-28.561195373535156, -27.63642692565918, -26.711658477783203, -25.78689193725586, -24.862123489379883, -23.937355041503906, -23.012588500976562, -22.087820053100586, -21.16305160522461, -20.238283157348633, -19.313514709472656, -18.388748168945312, -17.463979721069336, -16.53921127319336, -15.6144437789917, -14.689676284790039, -13.764907836914062, -12.840139389038086, -11.915371894836426, -10.990604400634766, -10.065835952758789, -9.141067504882812, -8.216300010681152, -7.291532039642334, -6.366764068603516, -5.441996097564697, -4.517228126525879, -3.5924601554870605, -2.667692184448242, -1.7429242134094238, -0.8181562423706055, 0.10661172866821289, 1.0313777923583984, 1.9561457633972168, 2.880913734436035, 3.8056817054748535, 4.730449676513672, 5.65521764755249, 6.579985618591309, 7.504753589630127, 8.429521560668945, 9.354290008544922, 10.279057502746582, 11.203824996948242, 12.128593444824219, 13.053361892700195, 13.978129386901855, 14.902896881103516, 15.827665328979492, 16.75243377685547, 17.677200317382812, 18.60196876525879, 19.526737213134766, 20.451505661010742, 21.37627410888672, 22.301040649414062, 23.22580909729004, 24.150577545166016, 25.07534408569336, 26.000112533569336, 26.924880981445312, 27.84964942932129, 28.774417877197266, 29.69918441772461, 30.623952865600586]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 6.0, 9.0, 19.0, 22.0, 42.0, 71.0, 83.0, 166.0, 232.0, 413.0, 692.0, 1142.0, 1913.0, 3290.0, 5610.0, 9548.0, 16294.0, 26958.0, 44308.0, 70363.0, 105411.0, 140851.0, 160258.0, 147657.0, 113157.0, 76799.0, 48719.0, 30132.0, 18206.0, 10775.0, 6330.0, 3758.0, 2111.0, 1266.0, 731.0, 470.0, 274.0, 183.0, 115.0, 57.0, 43.0, 18.0, 23.0, 6.0, 9.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.7109375, -4.5570068359375, -4.403076171875, -4.2491455078125, -4.09521484375, -3.9412841796875, -3.787353515625, -3.6334228515625, -3.4794921875, -3.3255615234375, -3.171630859375, -3.0177001953125, -2.86376953125, -2.7098388671875, -2.555908203125, -2.4019775390625, -2.248046875, -2.0941162109375, -1.940185546875, -1.7862548828125, -1.63232421875, -1.4783935546875, -1.324462890625, -1.1705322265625, -1.0166015625, -0.8626708984375, -0.708740234375, -0.5548095703125, -0.40087890625, -0.2469482421875, -0.093017578125, 0.0609130859375, 0.21484375, 0.3687744140625, 0.522705078125, 0.6766357421875, 0.83056640625, 0.9844970703125, 1.138427734375, 1.2923583984375, 1.4462890625, 1.6002197265625, 1.754150390625, 1.9080810546875, 2.06201171875, 2.2159423828125, 2.369873046875, 2.5238037109375, 2.677734375, 2.8316650390625, 2.985595703125, 3.1395263671875, 3.29345703125, 3.4473876953125, 3.601318359375, 3.7552490234375, 3.9091796875, 4.0631103515625, 4.217041015625, 4.3709716796875, 4.52490234375, 4.6788330078125, 4.832763671875, 4.9866943359375, 5.140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 2.0, 7.0, 12.0, 9.0, 13.0, 18.0, 13.0, 18.0, 23.0, 20.0, 27.0, 30.0, 35.0, 34.0, 40.0, 47.0, 46.0, 46.0, 38.0, 38.0, 42.0, 44.0, 32.0, 48.0, 33.0, 26.0, 41.0, 30.0, 26.0, 27.0, 18.0, 22.0, 10.0, 22.0, 14.0, 10.0, 8.0, 4.0, 5.0, 10.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.25, -28.1884765625, -27.126953125, -26.0654296875, -25.00390625, -23.9423828125, -22.880859375, -21.8193359375, -20.7578125, -19.6962890625, -18.634765625, -17.5732421875, -16.51171875, -15.4501953125, -14.388671875, -13.3271484375, -12.265625, -11.2041015625, -10.142578125, -9.0810546875, -8.01953125, -6.9580078125, -5.896484375, -4.8349609375, -3.7734375, -2.7119140625, -1.650390625, -0.5888671875, 0.47265625, 1.5341796875, 2.595703125, 3.6572265625, 4.71875, 5.7802734375, 6.841796875, 7.9033203125, 8.96484375, 10.0263671875, 11.087890625, 12.1494140625, 13.2109375, 14.2724609375, 15.333984375, 16.3955078125, 17.45703125, 18.5185546875, 19.580078125, 20.6416015625, 21.703125, 22.7646484375, 23.826171875, 24.8876953125, 25.94921875, 27.0107421875, 28.072265625, 29.1337890625, 30.1953125, 31.2568359375, 32.318359375, 33.3798828125, 34.44140625, 35.5029296875, 36.564453125, 37.6259765625, 38.6875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 0.0, 12.0, 13.0, 13.0, 19.0, 21.0, 47.0, 74.0, 99.0, 148.0, 221.0, 362.0, 544.0, 881.0, 1403.0, 2200.0, 3383.0, 5527.0, 9097.0, 14946.0, 24913.0, 40711.0, 64082.0, 96898.0, 131393.0, 155018.0, 149274.0, 120313.0, 83862.0, 54994.0, 34160.0, 20986.0, 12571.0, 7644.0, 4746.0, 2884.0, 1832.0, 1130.0, 718.0, 506.0, 304.0, 189.0, 145.0, 102.0, 56.0, 41.0, 25.0, 20.0, 14.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.1484375, -4.9915771484375, -4.834716796875, -4.6778564453125, -4.52099609375, -4.3641357421875, -4.207275390625, -4.0504150390625, -3.8935546875, -3.7366943359375, -3.579833984375, -3.4229736328125, -3.26611328125, -3.1092529296875, -2.952392578125, -2.7955322265625, -2.638671875, -2.4818115234375, -2.324951171875, -2.1680908203125, -2.01123046875, -1.8543701171875, -1.697509765625, -1.5406494140625, -1.3837890625, -1.2269287109375, -1.070068359375, -0.9132080078125, -0.75634765625, -0.5994873046875, -0.442626953125, -0.2857666015625, -0.12890625, 0.0279541015625, 0.184814453125, 0.3416748046875, 0.49853515625, 0.6553955078125, 0.812255859375, 0.9691162109375, 1.1259765625, 1.2828369140625, 1.439697265625, 1.5965576171875, 1.75341796875, 1.9102783203125, 2.067138671875, 2.2239990234375, 2.380859375, 2.5377197265625, 2.694580078125, 2.8514404296875, 3.00830078125, 3.1651611328125, 3.322021484375, 3.4788818359375, 3.6357421875, 3.7926025390625, 3.949462890625, 4.1063232421875, 4.26318359375, 4.4200439453125, 4.576904296875, 4.7337646484375, 4.890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 10.0, 2.0, 11.0, 8.0, 19.0, 18.0, 19.0, 24.0, 20.0, 41.0, 38.0, 32.0, 33.0, 37.0, 40.0, 43.0, 42.0, 31.0, 34.0, 50.0, 48.0, 42.0, 38.0, 50.0, 37.0, 41.0, 26.0, 26.0, 21.0, 20.0, 15.0, 13.0, 8.0, 11.0, 12.0, 12.0, 7.0, 5.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.875, -24.16748046875, -23.4599609375, -22.75244140625, -22.044921875, -21.33740234375, -20.6298828125, -19.92236328125, -19.21484375, -18.50732421875, -17.7998046875, -17.09228515625, -16.384765625, -15.67724609375, -14.9697265625, -14.26220703125, -13.5546875, -12.84716796875, -12.1396484375, -11.43212890625, -10.724609375, -10.01708984375, -9.3095703125, -8.60205078125, -7.89453125, -7.18701171875, -6.4794921875, -5.77197265625, -5.064453125, -4.35693359375, -3.6494140625, -2.94189453125, -2.234375, -1.52685546875, -0.8193359375, -0.11181640625, 0.595703125, 1.30322265625, 2.0107421875, 2.71826171875, 3.42578125, 4.13330078125, 4.8408203125, 5.54833984375, 6.255859375, 6.96337890625, 7.6708984375, 8.37841796875, 9.0859375, 9.79345703125, 10.5009765625, 11.20849609375, 11.916015625, 12.62353515625, 13.3310546875, 14.03857421875, 14.74609375, 15.45361328125, 16.1611328125, 16.86865234375, 17.576171875, 18.28369140625, 18.9912109375, 19.69873046875, 20.40625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 9.0, 8.0, 12.0, 19.0, 32.0, 29.0, 51.0, 78.0, 109.0, 138.0, 237.0, 316.0, 519.0, 747.0, 1185.0, 2030.0, 3481.0, 6163.0, 11574.0, 23092.0, 47805.0, 97774.0, 183397.0, 252908.0, 198495.0, 109199.0, 53632.0, 26149.0, 12849.0, 6923.0, 3737.0, 2150.0, 1284.0, 747.0, 544.0, 351.0, 215.0, 159.0, 119.0, 85.0, 52.0, 49.0, 30.0, 19.0, 19.0, 9.0, 9.0, 5.0, 5.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0244140625, -0.991973876953125, -0.95953369140625, -0.927093505859375, -0.8946533203125, -0.862213134765625, -0.82977294921875, -0.797332763671875, -0.764892578125, -0.732452392578125, -0.70001220703125, -0.667572021484375, -0.6351318359375, -0.602691650390625, -0.57025146484375, -0.537811279296875, -0.50537109375, -0.472930908203125, -0.44049072265625, -0.408050537109375, -0.3756103515625, -0.343170166015625, -0.31072998046875, -0.278289794921875, -0.245849609375, -0.213409423828125, -0.18096923828125, -0.148529052734375, -0.1160888671875, -0.083648681640625, -0.05120849609375, -0.018768310546875, 0.013671875, 0.046112060546875, 0.07855224609375, 0.110992431640625, 0.1434326171875, 0.175872802734375, 0.20831298828125, 0.240753173828125, 0.273193359375, 0.305633544921875, 0.33807373046875, 0.370513916015625, 0.4029541015625, 0.435394287109375, 0.46783447265625, 0.500274658203125, 0.53271484375, 0.565155029296875, 0.59759521484375, 0.630035400390625, 0.6624755859375, 0.694915771484375, 0.72735595703125, 0.759796142578125, 0.792236328125, 0.824676513671875, 0.85711669921875, 0.889556884765625, 0.9219970703125, 0.954437255859375, 0.98687744140625, 1.019317626953125, 1.0517578125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 9.0, 4.0, 10.0, 16.0, 17.0, 21.0, 43.0, 46.0, 44.0, 53.0, 46.0, 57.0, 63.0, 56.0, 80.0, 69.0, 51.0, 50.0, 51.0, 38.0, 37.0, 34.0, 26.0, 12.0, 23.0, 10.0, 12.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010210275650024414, -9.870342910289764e-05, -9.530410170555115e-05, -9.190477430820465e-05, -8.850544691085815e-05, -8.510611951351166e-05, -8.170679211616516e-05, -7.830746471881866e-05, -7.490813732147217e-05, -7.150880992412567e-05, -6.810948252677917e-05, -6.471015512943268e-05, -6.131082773208618e-05, -5.7911500334739685e-05, -5.451217293739319e-05, -5.111284554004669e-05, -4.7713518142700195e-05, -4.43141907453537e-05, -4.09148633480072e-05, -3.7515535950660706e-05, -3.411620855331421e-05, -3.071688115596771e-05, -2.7317553758621216e-05, -2.391822636127472e-05, -2.0518898963928223e-05, -1.7119571566581726e-05, -1.372024416923523e-05, -1.0320916771888733e-05, -6.921589374542236e-06, -3.5222619771957397e-06, -1.2293457984924316e-07, 3.2763928174972534e-06, 6.67572021484375e-06, 1.0075047612190247e-05, 1.3474375009536743e-05, 1.687370240688324e-05, 2.0273029804229736e-05, 2.3672357201576233e-05, 2.707168459892273e-05, 3.0471011996269226e-05, 3.387033939361572e-05, 3.726966679096222e-05, 4.0668994188308716e-05, 4.406832158565521e-05, 4.746764898300171e-05, 5.0866976380348206e-05, 5.42663037776947e-05, 5.76656311750412e-05, 6.10649585723877e-05, 6.446428596973419e-05, 6.786361336708069e-05, 7.126294076442719e-05, 7.466226816177368e-05, 7.806159555912018e-05, 8.146092295646667e-05, 8.486025035381317e-05, 8.825957775115967e-05, 9.165890514850616e-05, 9.505823254585266e-05, 9.845755994319916e-05, 0.00010185688734054565, 0.00010525621473789215, 0.00010865554213523865, 0.00011205486953258514, 0.00011545419692993164]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 4.0, 9.0, 10.0, 14.0, 18.0, 19.0, 28.0, 44.0, 67.0, 89.0, 120.0, 165.0, 256.0, 302.0, 498.0, 672.0, 1054.0, 1417.0, 2201.0, 3311.0, 4975.0, 7910.0, 12469.0, 19676.0, 31990.0, 50423.0, 78788.0, 118470.0, 159318.0, 167276.0, 133652.0, 92164.0, 58687.0, 37603.0, 23354.0, 14515.0, 9306.0, 5921.0, 3831.0, 2498.0, 1633.0, 1132.0, 778.0, 588.0, 401.0, 254.0, 191.0, 154.0, 110.0, 51.0, 44.0, 29.0, 28.0, 17.0, 9.0, 6.0, 7.0, 4.0, 3.0, 4.0], "bins": [-1.21484375, -1.17822265625, -1.1416015625, -1.10498046875, -1.068359375, -1.03173828125, -0.9951171875, -0.95849609375, -0.921875, -0.88525390625, -0.8486328125, -0.81201171875, -0.775390625, -0.73876953125, -0.7021484375, -0.66552734375, -0.62890625, -0.59228515625, -0.5556640625, -0.51904296875, -0.482421875, -0.44580078125, -0.4091796875, -0.37255859375, -0.3359375, -0.29931640625, -0.2626953125, -0.22607421875, -0.189453125, -0.15283203125, -0.1162109375, -0.07958984375, -0.04296875, -0.00634765625, 0.0302734375, 0.06689453125, 0.103515625, 0.14013671875, 0.1767578125, 0.21337890625, 0.25, 0.28662109375, 0.3232421875, 0.35986328125, 0.396484375, 0.43310546875, 0.4697265625, 0.50634765625, 0.54296875, 0.57958984375, 0.6162109375, 0.65283203125, 0.689453125, 0.72607421875, 0.7626953125, 0.79931640625, 0.8359375, 0.87255859375, 0.9091796875, 0.94580078125, 0.982421875, 1.01904296875, 1.0556640625, 1.09228515625, 1.12890625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 7.0, 11.0, 5.0, 21.0, 16.0, 21.0, 26.0, 22.0, 28.0, 40.0, 42.0, 41.0, 52.0, 45.0, 53.0, 53.0, 66.0, 51.0, 42.0, 61.0, 50.0, 43.0, 31.0, 31.0, 21.0, 21.0, 13.0, 13.0, 14.0, 10.0, 5.0, 6.0, 7.0, 3.0, 7.0, 4.0, 3.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.560546875, -0.5445823669433594, -0.5286178588867188, -0.5126533508300781, -0.4966888427734375, -0.4807243347167969, -0.46475982666015625, -0.4487953186035156, -0.432830810546875, -0.4168663024902344, -0.40090179443359375, -0.3849372863769531, -0.3689727783203125, -0.3530082702636719, -0.33704376220703125, -0.3210792541503906, -0.30511474609375, -0.2891502380371094, -0.27318572998046875, -0.2572212219238281, -0.2412567138671875, -0.22529220581054688, -0.20932769775390625, -0.19336318969726562, -0.177398681640625, -0.16143417358398438, -0.14546966552734375, -0.12950515747070312, -0.1135406494140625, -0.09757614135742188, -0.08161163330078125, -0.06564712524414062, -0.0496826171875, -0.033718109130859375, -0.01775360107421875, -0.001789093017578125, 0.0141754150390625, 0.030139923095703125, 0.04610443115234375, 0.062068939208984375, 0.078033447265625, 0.09399795532226562, 0.10996246337890625, 0.12592697143554688, 0.1418914794921875, 0.15785598754882812, 0.17382049560546875, 0.18978500366210938, 0.20574951171875, 0.22171401977539062, 0.23767852783203125, 0.2536430358886719, 0.2696075439453125, 0.2855720520019531, 0.30153656005859375, 0.3175010681152344, 0.333465576171875, 0.3494300842285156, 0.36539459228515625, 0.3813591003417969, 0.3973236083984375, 0.4132881164550781, 0.42925262451171875, 0.4452171325683594, 0.461181640625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 9.0, 10.0, 7.0, 8.0, 19.0, 15.0, 14.0, 18.0, 20.0, 21.0, 24.0, 32.0, 35.0, 34.0, 37.0, 40.0, 31.0, 41.0, 39.0, 42.0, 41.0, 36.0, 36.0, 34.0, 39.0, 38.0, 26.0, 33.0, 24.0, 17.0, 21.0, 14.0, 16.0, 20.0, 14.0, 19.0, 10.0, 11.0, 8.0, 10.0, 6.0, 8.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.874074935913086, -25.047775268554688, -24.221477508544922, -23.395177841186523, -22.568880081176758, -21.74258041381836, -20.916282653808594, -20.089982986450195, -19.26368522644043, -18.43738555908203, -17.611087799072266, -16.784788131713867, -15.958490371704102, -15.132190704345703, -14.305892944335938, -13.479593276977539, -12.653294563293457, -11.826995849609375, -11.000697135925293, -10.174398422241211, -9.348099708557129, -8.521800994873047, -7.695501804351807, -6.869203090667725, -6.042904376983643, -5.2166056632995605, -4.3903069496154785, -3.5640079975128174, -2.7377092838287354, -1.9114103317260742, -1.0851116180419922, -0.25881290435791016, 0.5674858093261719, 1.393784523010254, 2.220083236694336, 3.046382188796997, 3.872680902481079, 4.69897985458374, 5.525278568267822, 6.351577281951904, 7.177875995635986, 8.004175186157227, 8.830473899841309, 9.65677261352539, 10.483071327209473, 11.309370040893555, 12.135668754577637, 12.961967468261719, 13.7882661819458, 14.614564895629883, 15.440863609313965, 16.267162322998047, 17.093461990356445, 17.91975975036621, 18.74605941772461, 19.572357177734375, 20.398656845092773, 21.224956512451172, 22.051254272460938, 22.877553939819336, 23.7038516998291, 24.5301513671875, 25.356449127197266, 26.182748794555664, 27.00904655456543]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 2.0, 4.0, 13.0, 6.0, 6.0, 4.0, 11.0, 17.0, 23.0, 17.0, 23.0, 29.0, 15.0, 36.0, 32.0, 32.0, 40.0, 26.0, 43.0, 38.0, 46.0, 36.0, 37.0, 34.0, 37.0, 40.0, 29.0, 33.0, 35.0, 28.0, 32.0, 31.0, 24.0, 21.0, 20.0, 19.0, 14.0, 15.0, 10.0, 8.0, 8.0, 3.0, 6.0, 3.0, 4.0, 5.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-28.726627349853516, -27.802722930908203, -26.878816604614258, -25.954912185668945, -25.031005859375, -24.107101440429688, -23.183197021484375, -22.25929069519043, -21.335384368896484, -20.411479949951172, -19.487573623657227, -18.563669204711914, -17.63976287841797, -16.715858459472656, -15.791953086853027, -14.868047714233398, -13.944143295288086, -13.020237922668457, -12.096332550048828, -11.172428131103516, -10.24852180480957, -9.324617385864258, -8.400712013244629, -7.476806640625, -6.552901268005371, -5.628995895385742, -4.705090522766113, -3.7811856269836426, -2.8572802543640137, -1.9333748817443848, -1.009469985961914, -0.08556461334228516, 0.8383426666259766, 1.762247920036316, 2.6861531734466553, 3.610058307647705, 4.533963680267334, 5.457869052886963, 6.381773948669434, 7.3056793212890625, 8.229584693908691, 9.15349006652832, 10.07739543914795, 11.001300811767578, 11.92520523071289, 12.849111557006836, 13.773015975952148, 14.696921348571777, 15.620826721191406, 16.54473114013672, 17.468637466430664, 18.392541885375977, 19.316448211669922, 20.240352630615234, 21.164257049560547, 22.088163375854492, 23.012069702148438, 23.93597412109375, 24.859880447387695, 25.783784866333008, 26.707691192626953, 27.631595611572266, 28.555500030517578, 29.479406356811523, 30.403310775756836]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 4.0, 14.0, 17.0, 34.0, 51.0, 89.0, 136.0, 250.0, 331.0, 574.0, 892.0, 1369.0, 2025.0, 3053.0, 4586.0, 6659.0, 9603.0, 13780.0, 19007.0, 25736.0, 33629.0, 43077.0, 53346.0, 63328.0, 73103.0, 80407.0, 83923.0, 83709.0, 80621.0, 74100.0, 65040.0, 54865.0, 44640.0, 35045.0, 26474.0, 19793.0, 14229.0, 10027.0, 7014.0, 4835.0, 3135.0, 2111.0, 1367.0, 960.0, 564.0, 367.0, 251.0, 156.0, 99.0, 61.0, 35.0, 21.0, 13.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.8125, -13.3677978515625, -12.923095703125, -12.4783935546875, -12.03369140625, -11.5889892578125, -11.144287109375, -10.6995849609375, -10.2548828125, -9.8101806640625, -9.365478515625, -8.9207763671875, -8.47607421875, -8.0313720703125, -7.586669921875, -7.1419677734375, -6.697265625, -6.2525634765625, -5.807861328125, -5.3631591796875, -4.91845703125, -4.4737548828125, -4.029052734375, -3.5843505859375, -3.1396484375, -2.6949462890625, -2.250244140625, -1.8055419921875, -1.36083984375, -0.9161376953125, -0.471435546875, -0.0267333984375, 0.41796875, 0.8626708984375, 1.307373046875, 1.7520751953125, 2.19677734375, 2.6414794921875, 3.086181640625, 3.5308837890625, 3.9755859375, 4.4202880859375, 4.864990234375, 5.3096923828125, 5.75439453125, 6.1990966796875, 6.643798828125, 7.0885009765625, 7.533203125, 7.9779052734375, 8.422607421875, 8.8673095703125, 9.31201171875, 9.7567138671875, 10.201416015625, 10.6461181640625, 11.0908203125, 11.5355224609375, 11.980224609375, 12.4249267578125, 12.86962890625, 13.3143310546875, 13.759033203125, 14.2037353515625, 14.6484375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 6.0, 6.0, 5.0, 12.0, 5.0, 7.0, 12.0, 13.0, 16.0, 19.0, 9.0, 22.0, 25.0, 29.0, 37.0, 35.0, 31.0, 27.0, 35.0, 43.0, 47.0, 34.0, 34.0, 33.0, 34.0, 29.0, 44.0, 40.0, 35.0, 41.0, 18.0, 27.0, 31.0, 31.0, 22.0, 14.0, 15.0, 15.0, 13.0, 13.0, 8.0, 5.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.71875, -25.783203125, -24.84765625, -23.912109375, -22.9765625, -22.041015625, -21.10546875, -20.169921875, -19.234375, -18.298828125, -17.36328125, -16.427734375, -15.4921875, -14.556640625, -13.62109375, -12.685546875, -11.75, -10.814453125, -9.87890625, -8.943359375, -8.0078125, -7.072265625, -6.13671875, -5.201171875, -4.265625, -3.330078125, -2.39453125, -1.458984375, -0.5234375, 0.412109375, 1.34765625, 2.283203125, 3.21875, 4.154296875, 5.08984375, 6.025390625, 6.9609375, 7.896484375, 8.83203125, 9.767578125, 10.703125, 11.638671875, 12.57421875, 13.509765625, 14.4453125, 15.380859375, 16.31640625, 17.251953125, 18.1875, 19.123046875, 20.05859375, 20.994140625, 21.9296875, 22.865234375, 23.80078125, 24.736328125, 25.671875, 26.607421875, 27.54296875, 28.478515625, 29.4140625, 30.349609375, 31.28515625, 32.220703125, 33.15625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 6.0, 5.0, 20.0, 31.0, 42.0, 82.0, 130.0, 196.0, 331.0, 485.0, 851.0, 1299.0, 2156.0, 3262.0, 5113.0, 7788.0, 11715.0, 17291.0, 24647.0, 34423.0, 45852.0, 59222.0, 71842.0, 85043.0, 93231.0, 97698.0, 94089.0, 87430.0, 75287.0, 61809.0, 48943.0, 36751.0, 26471.0, 18707.0, 12513.0, 8367.0, 5468.0, 3692.0, 2353.0, 1501.0, 910.0, 554.0, 364.0, 237.0, 129.0, 80.0, 69.0, 28.0, 18.0, 12.0, 14.0, 4.0, 4.0, 1.0, 1.0], "bins": [-18.15625, -17.631591796875, -17.10693359375, -16.582275390625, -16.0576171875, -15.532958984375, -15.00830078125, -14.483642578125, -13.958984375, -13.434326171875, -12.90966796875, -12.385009765625, -11.8603515625, -11.335693359375, -10.81103515625, -10.286376953125, -9.76171875, -9.237060546875, -8.71240234375, -8.187744140625, -7.6630859375, -7.138427734375, -6.61376953125, -6.089111328125, -5.564453125, -5.039794921875, -4.51513671875, -3.990478515625, -3.4658203125, -2.941162109375, -2.41650390625, -1.891845703125, -1.3671875, -0.842529296875, -0.31787109375, 0.206787109375, 0.7314453125, 1.256103515625, 1.78076171875, 2.305419921875, 2.830078125, 3.354736328125, 3.87939453125, 4.404052734375, 4.9287109375, 5.453369140625, 5.97802734375, 6.502685546875, 7.02734375, 7.552001953125, 8.07666015625, 8.601318359375, 9.1259765625, 9.650634765625, 10.17529296875, 10.699951171875, 11.224609375, 11.749267578125, 12.27392578125, 12.798583984375, 13.3232421875, 13.847900390625, 14.37255859375, 14.897216796875, 15.421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 6.0, 6.0, 7.0, 13.0, 11.0, 25.0, 31.0, 22.0, 25.0, 21.0, 30.0, 25.0, 32.0, 32.0, 34.0, 34.0, 38.0, 53.0, 44.0, 37.0, 39.0, 41.0, 33.0, 27.0, 30.0, 33.0, 27.0, 29.0, 24.0, 23.0, 22.0, 25.0, 22.0, 20.0, 8.0, 13.0, 9.0, 9.0, 9.0, 5.0, 4.0, 4.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.703125, -18.066650390625, -17.43017578125, -16.793701171875, -16.1572265625, -15.520751953125, -14.88427734375, -14.247802734375, -13.611328125, -12.974853515625, -12.33837890625, -11.701904296875, -11.0654296875, -10.428955078125, -9.79248046875, -9.156005859375, -8.51953125, -7.883056640625, -7.24658203125, -6.610107421875, -5.9736328125, -5.337158203125, -4.70068359375, -4.064208984375, -3.427734375, -2.791259765625, -2.15478515625, -1.518310546875, -0.8818359375, -0.245361328125, 0.39111328125, 1.027587890625, 1.6640625, 2.300537109375, 2.93701171875, 3.573486328125, 4.2099609375, 4.846435546875, 5.48291015625, 6.119384765625, 6.755859375, 7.392333984375, 8.02880859375, 8.665283203125, 9.3017578125, 9.938232421875, 10.57470703125, 11.211181640625, 11.84765625, 12.484130859375, 13.12060546875, 13.757080078125, 14.3935546875, 15.030029296875, 15.66650390625, 16.302978515625, 16.939453125, 17.575927734375, 18.21240234375, 18.848876953125, 19.4853515625, 20.121826171875, 20.75830078125, 21.394775390625, 22.03125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 7.0, 5.0, 13.0, 13.0, 23.0, 30.0, 61.0, 89.0, 155.0, 291.0, 449.0, 775.0, 1344.0, 2216.0, 3765.0, 5955.0, 9781.0, 14989.0, 22818.0, 33121.0, 45601.0, 60484.0, 75419.0, 89967.0, 98891.0, 102447.0, 99983.0, 91041.0, 77892.0, 62582.0, 47429.0, 34379.0, 24126.0, 15945.0, 10175.0, 6403.0, 4015.0, 2428.0, 1422.0, 797.0, 488.0, 296.0, 185.0, 105.0, 69.0, 38.0, 21.0, 7.0, 12.0, 5.0, 9.0, 3.0, 2.0, 1.0, 2.0], "bins": [-6.39453125, -6.20953369140625, -6.0245361328125, -5.83953857421875, -5.654541015625, -5.46954345703125, -5.2845458984375, -5.09954833984375, -4.91455078125, -4.72955322265625, -4.5445556640625, -4.35955810546875, -4.174560546875, -3.98956298828125, -3.8045654296875, -3.61956787109375, -3.4345703125, -3.24957275390625, -3.0645751953125, -2.87957763671875, -2.694580078125, -2.50958251953125, -2.3245849609375, -2.13958740234375, -1.95458984375, -1.76959228515625, -1.5845947265625, -1.39959716796875, -1.214599609375, -1.02960205078125, -0.8446044921875, -0.65960693359375, -0.474609375, -0.28961181640625, -0.1046142578125, 0.08038330078125, 0.265380859375, 0.45037841796875, 0.6353759765625, 0.82037353515625, 1.00537109375, 1.19036865234375, 1.3753662109375, 1.56036376953125, 1.745361328125, 1.93035888671875, 2.1153564453125, 2.30035400390625, 2.4853515625, 2.67034912109375, 2.8553466796875, 3.04034423828125, 3.225341796875, 3.41033935546875, 3.5953369140625, 3.78033447265625, 3.96533203125, 4.15032958984375, 4.3353271484375, 4.52032470703125, 4.705322265625, 4.89031982421875, 5.0753173828125, 5.26031494140625, 5.4453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 11.0, 8.0, 6.0, 8.0, 12.0, 15.0, 22.0, 21.0, 16.0, 19.0, 27.0, 38.0, 29.0, 32.0, 37.0, 43.0, 29.0, 31.0, 38.0, 41.0, 44.0, 44.0, 40.0, 36.0, 45.0, 39.0, 34.0, 31.0, 32.0, 27.0, 24.0, 22.0, 15.0, 23.0, 14.0, 8.0, 4.0, 4.0, 7.0, 5.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.0006084442138671875, -0.0005877465009689331, -0.0005670487880706787, -0.0005463510751724243, -0.0005256533622741699, -0.0005049556493759155, -0.00048425793647766113, -0.00046356022357940674, -0.00044286251068115234, -0.00042216479778289795, -0.00040146708488464355, -0.00038076937198638916, -0.00036007165908813477, -0.00033937394618988037, -0.000318676233291626, -0.0002979785203933716, -0.0002772808074951172, -0.0002565830945968628, -0.0002358853816986084, -0.000215187668800354, -0.0001944899559020996, -0.00017379224300384521, -0.00015309453010559082, -0.00013239681720733643, -0.00011169910430908203, -9.100139141082764e-05, -7.030367851257324e-05, -4.960596561431885e-05, -2.8908252716064453e-05, -8.210539817810059e-06, 1.2487173080444336e-05, 3.318488597869873e-05, 5.3882598876953125e-05, 7.458031177520752e-05, 9.527802467346191e-05, 0.00011597573757171631, 0.0001366734504699707, 0.0001573711633682251, 0.0001780688762664795, 0.0001987665891647339, 0.00021946430206298828, 0.00024016201496124268, 0.00026085972785949707, 0.00028155744075775146, 0.00030225515365600586, 0.00032295286655426025, 0.00034365057945251465, 0.00036434829235076904, 0.00038504600524902344, 0.00040574371814727783, 0.0004264414310455322, 0.0004471391439437866, 0.000467836856842041, 0.0004885345697402954, 0.0005092322826385498, 0.0005299299955368042, 0.0005506277084350586, 0.000571325421333313, 0.0005920231342315674, 0.0006127208471298218, 0.0006334185600280762, 0.0006541162729263306, 0.000674813985824585, 0.0006955116987228394, 0.0007162094116210938]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 10.0, 15.0, 26.0, 30.0, 68.0, 93.0, 149.0, 247.0, 370.0, 571.0, 885.0, 1438.0, 2126.0, 3405.0, 5243.0, 7977.0, 12052.0, 17651.0, 24826.0, 34757.0, 46595.0, 58556.0, 71905.0, 83055.0, 91261.0, 95113.0, 92480.0, 85898.0, 75408.0, 62319.0, 49924.0, 37862.0, 27660.0, 19707.0, 13443.0, 8826.0, 5952.0, 3743.0, 2553.0, 1571.0, 1029.0, 600.0, 416.0, 277.0, 181.0, 112.0, 61.0, 44.0, 29.0, 15.0, 8.0, 10.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-5.85546875, -5.67608642578125, -5.4967041015625, -5.31732177734375, -5.137939453125, -4.95855712890625, -4.7791748046875, -4.59979248046875, -4.42041015625, -4.24102783203125, -4.0616455078125, -3.88226318359375, -3.702880859375, -3.52349853515625, -3.3441162109375, -3.16473388671875, -2.9853515625, -2.80596923828125, -2.6265869140625, -2.44720458984375, -2.267822265625, -2.08843994140625, -1.9090576171875, -1.72967529296875, -1.55029296875, -1.37091064453125, -1.1915283203125, -1.01214599609375, -0.832763671875, -0.65338134765625, -0.4739990234375, -0.29461669921875, -0.115234375, 0.06414794921875, 0.2435302734375, 0.42291259765625, 0.602294921875, 0.78167724609375, 0.9610595703125, 1.14044189453125, 1.31982421875, 1.49920654296875, 1.6785888671875, 1.85797119140625, 2.037353515625, 2.21673583984375, 2.3961181640625, 2.57550048828125, 2.7548828125, 2.93426513671875, 3.1136474609375, 3.29302978515625, 3.472412109375, 3.65179443359375, 3.8311767578125, 4.01055908203125, 4.18994140625, 4.36932373046875, 4.5487060546875, 4.72808837890625, 4.907470703125, 5.08685302734375, 5.2662353515625, 5.44561767578125, 5.625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 3.0, 1.0, 3.0, 5.0, 6.0, 6.0, 18.0, 15.0, 15.0, 18.0, 23.0, 30.0, 24.0, 36.0, 33.0, 36.0, 46.0, 33.0, 38.0, 45.0, 40.0, 44.0, 39.0, 43.0, 45.0, 38.0, 32.0, 40.0, 40.0, 33.0, 24.0, 18.0, 22.0, 17.0, 25.0, 14.0, 7.0, 10.0, 6.0, 8.0, 4.0, 9.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.794921875, -2.708770751953125, -2.62261962890625, -2.536468505859375, -2.4503173828125, -2.364166259765625, -2.27801513671875, -2.191864013671875, -2.105712890625, -2.019561767578125, -1.93341064453125, -1.847259521484375, -1.7611083984375, -1.674957275390625, -1.58880615234375, -1.502655029296875, -1.41650390625, -1.330352783203125, -1.24420166015625, -1.158050537109375, -1.0718994140625, -0.985748291015625, -0.89959716796875, -0.813446044921875, -0.727294921875, -0.641143798828125, -0.55499267578125, -0.468841552734375, -0.3826904296875, -0.296539306640625, -0.21038818359375, -0.124237060546875, -0.0380859375, 0.048065185546875, 0.13421630859375, 0.220367431640625, 0.3065185546875, 0.392669677734375, 0.47882080078125, 0.564971923828125, 0.651123046875, 0.737274169921875, 0.82342529296875, 0.909576416015625, 0.9957275390625, 1.081878662109375, 1.16802978515625, 1.254180908203125, 1.34033203125, 1.426483154296875, 1.51263427734375, 1.598785400390625, 1.6849365234375, 1.771087646484375, 1.85723876953125, 1.943389892578125, 2.029541015625, 2.115692138671875, 2.20184326171875, 2.287994384765625, 2.3741455078125, 2.460296630859375, 2.54644775390625, 2.632598876953125, 2.71875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 4.0, 14.0, 9.0, 15.0, 19.0, 24.0, 19.0, 20.0, 18.0, 32.0, 34.0, 34.0, 46.0, 46.0, 52.0, 40.0, 38.0, 47.0, 34.0, 42.0, 32.0, 38.0, 50.0, 35.0, 32.0, 17.0, 23.0, 19.0, 22.0, 19.0, 16.0, 20.0, 11.0, 14.0, 9.0, 12.0, 10.0, 3.0, 6.0, 1.0, 1.0, 10.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.839197158813477, -26.94318199157715, -26.047168731689453, -25.151153564453125, -24.255138397216797, -23.3591251373291, -22.463109970092773, -21.567096710205078, -20.67108154296875, -19.775066375732422, -18.879053115844727, -17.9830379486084, -17.087024688720703, -16.191009521484375, -15.294994354248047, -14.398980140686035, -13.502965927124023, -12.606951713562012, -11.7109375, -10.814922332763672, -9.91890811920166, -9.022893905639648, -8.12687873840332, -7.230864524841309, -6.334850311279297, -5.438836097717285, -4.542821407318115, -3.6468069553375244, -2.7507925033569336, -1.8547782897949219, -0.958763599395752, -0.06274890899658203, 0.8332653045654297, 1.7292797565460205, 2.6252942085266113, 3.521308660507202, 4.417323112487793, 5.313337326049805, 6.209352016448975, 7.1053667068481445, 8.001380920410156, 8.897395133972168, 9.79340934753418, 10.689424514770508, 11.58543872833252, 12.481452941894531, 13.37746810913086, 14.273482322692871, 15.169496536254883, 16.06551170349121, 16.961524963378906, 17.857540130615234, 18.753555297851562, 19.649568557739258, 20.545583724975586, 21.44159698486328, 22.33761215209961, 23.233627319335938, 24.129640579223633, 25.02565574645996, 25.921669006347656, 26.817684173583984, 27.713699340820312, 28.60971450805664, 29.505727767944336]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 4.0, 12.0, 6.0, 13.0, 7.0, 16.0, 14.0, 17.0, 21.0, 18.0, 24.0, 29.0, 31.0, 30.0, 26.0, 37.0, 39.0, 38.0, 36.0, 33.0, 23.0, 45.0, 39.0, 37.0, 31.0, 30.0, 41.0, 33.0, 40.0, 24.0, 35.0, 28.0, 19.0, 17.0, 14.0, 15.0, 15.0, 10.0, 6.0, 6.0, 9.0, 7.0, 2.0, 5.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-32.157630920410156, -31.153738021850586, -30.149845123291016, -29.145950317382812, -28.142057418823242, -27.138164520263672, -26.1342716217041, -25.13037872314453, -24.126483917236328, -23.122591018676758, -22.118698120117188, -21.114803314208984, -20.110910415649414, -19.107017517089844, -18.103124618530273, -17.099231719970703, -16.095338821411133, -15.091445922851562, -14.087552070617676, -13.083659172058105, -12.079765319824219, -11.075872421264648, -10.071979522705078, -9.068086624145508, -8.064192771911621, -7.060299396514893, -6.056406021118164, -5.052513122558594, -4.048619747161865, -3.0447263717651367, -2.0408334732055664, -1.036940097808838, -0.033046722412109375, 0.9708465337753296, 1.9747397899627686, 2.978632926940918, 3.9825263023376465, 4.986419677734375, 5.990312576293945, 6.994205951690674, 7.998099327087402, 9.001992225646973, 10.00588607788086, 11.00977897644043, 12.013671875, 13.017565727233887, 14.021458625793457, 15.025352478027344, 16.029245376586914, 17.033138275146484, 18.037031173706055, 19.040924072265625, 20.044818878173828, 21.0487117767334, 22.05260467529297, 23.05649757385254, 24.06039047241211, 25.06428337097168, 26.06817626953125, 27.072071075439453, 28.075963973999023, 29.079856872558594, 30.083749771118164, 31.087642669677734, 32.09153747558594]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 8.0, 8.0, 14.0, 47.0, 63.0, 111.0, 181.0, 329.0, 547.0, 920.0, 1536.0, 2393.0, 3974.0, 6179.0, 9805.0, 15433.0, 23073.0, 34938.0, 50284.0, 71667.0, 98933.0, 132272.0, 172187.0, 215002.0, 258732.0, 298868.0, 329597.0, 346264.0, 347508.0, 332179.0, 303680.0, 264815.0, 220957.0, 179074.0, 137422.0, 103347.0, 74315.0, 52486.0, 36188.0, 24613.0, 16111.0, 10451.0, 6690.0, 4194.0, 2635.0, 1686.0, 1027.0, 616.0, 365.0, 232.0, 141.0, 78.0, 42.0, 38.0, 19.0, 10.0, 6.0, 5.0, 2.0, 2.0], "bins": [-20.671875, -20.027587890625, -19.38330078125, -18.739013671875, -18.0947265625, -17.450439453125, -16.80615234375, -16.161865234375, -15.517578125, -14.873291015625, -14.22900390625, -13.584716796875, -12.9404296875, -12.296142578125, -11.65185546875, -11.007568359375, -10.36328125, -9.718994140625, -9.07470703125, -8.430419921875, -7.7861328125, -7.141845703125, -6.49755859375, -5.853271484375, -5.208984375, -4.564697265625, -3.92041015625, -3.276123046875, -2.6318359375, -1.987548828125, -1.34326171875, -0.698974609375, -0.0546875, 0.589599609375, 1.23388671875, 1.878173828125, 2.5224609375, 3.166748046875, 3.81103515625, 4.455322265625, 5.099609375, 5.743896484375, 6.38818359375, 7.032470703125, 7.6767578125, 8.321044921875, 8.96533203125, 9.609619140625, 10.25390625, 10.898193359375, 11.54248046875, 12.186767578125, 12.8310546875, 13.475341796875, 14.11962890625, 14.763916015625, 15.408203125, 16.052490234375, 16.69677734375, 17.341064453125, 17.9853515625, 18.629638671875, 19.27392578125, 19.918212890625, 20.5625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 3.0, 2.0, 8.0, 5.0, 7.0, 16.0, 11.0, 11.0, 16.0, 22.0, 21.0, 23.0, 27.0, 33.0, 22.0, 34.0, 32.0, 41.0, 36.0, 35.0, 29.0, 22.0, 44.0, 39.0, 22.0, 47.0, 41.0, 30.0, 37.0, 39.0, 28.0, 32.0, 25.0, 15.0, 23.0, 16.0, 12.0, 14.0, 11.0, 7.0, 11.0, 10.0, 9.0, 6.0, 7.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0], "bins": [-27.96875, -27.11083984375, -26.2529296875, -25.39501953125, -24.537109375, -23.67919921875, -22.8212890625, -21.96337890625, -21.10546875, -20.24755859375, -19.3896484375, -18.53173828125, -17.673828125, -16.81591796875, -15.9580078125, -15.10009765625, -14.2421875, -13.38427734375, -12.5263671875, -11.66845703125, -10.810546875, -9.95263671875, -9.0947265625, -8.23681640625, -7.37890625, -6.52099609375, -5.6630859375, -4.80517578125, -3.947265625, -3.08935546875, -2.2314453125, -1.37353515625, -0.515625, 0.34228515625, 1.2001953125, 2.05810546875, 2.916015625, 3.77392578125, 4.6318359375, 5.48974609375, 6.34765625, 7.20556640625, 8.0634765625, 8.92138671875, 9.779296875, 10.63720703125, 11.4951171875, 12.35302734375, 13.2109375, 14.06884765625, 14.9267578125, 15.78466796875, 16.642578125, 17.50048828125, 18.3583984375, 19.21630859375, 20.07421875, 20.93212890625, 21.7900390625, 22.64794921875, 23.505859375, 24.36376953125, 25.2216796875, 26.07958984375, 26.9375]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 12.0, 32.0, 43.0, 75.0, 147.0, 248.0, 491.0, 927.0, 1662.0, 3022.0, 5181.0, 9158.0, 15639.0, 26344.0, 41817.0, 65980.0, 98571.0, 141613.0, 195492.0, 255479.0, 314962.0, 364596.0, 399752.0, 408325.0, 392928.0, 354043.0, 301228.0, 240798.0, 181857.0, 131700.0, 89898.0, 59527.0, 37406.0, 23146.0, 13864.0, 8171.0, 4621.0, 2472.0, 1391.0, 753.0, 449.0, 221.0, 104.0, 74.0, 32.0, 14.0, 14.0, 2.0, 4.0, 4.0], "bins": [-31.3125, -30.474853515625, -29.63720703125, -28.799560546875, -27.9619140625, -27.124267578125, -26.28662109375, -25.448974609375, -24.611328125, -23.773681640625, -22.93603515625, -22.098388671875, -21.2607421875, -20.423095703125, -19.58544921875, -18.747802734375, -17.91015625, -17.072509765625, -16.23486328125, -15.397216796875, -14.5595703125, -13.721923828125, -12.88427734375, -12.046630859375, -11.208984375, -10.371337890625, -9.53369140625, -8.696044921875, -7.8583984375, -7.020751953125, -6.18310546875, -5.345458984375, -4.5078125, -3.670166015625, -2.83251953125, -1.994873046875, -1.1572265625, -0.319580078125, 0.51806640625, 1.355712890625, 2.193359375, 3.031005859375, 3.86865234375, 4.706298828125, 5.5439453125, 6.381591796875, 7.21923828125, 8.056884765625, 8.89453125, 9.732177734375, 10.56982421875, 11.407470703125, 12.2451171875, 13.082763671875, 13.92041015625, 14.758056640625, 15.595703125, 16.433349609375, 17.27099609375, 18.108642578125, 18.9462890625, 19.783935546875, 20.62158203125, 21.459228515625, 22.296875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 9.0, 10.0, 13.0, 18.0, 20.0, 28.0, 25.0, 29.0, 41.0, 41.0, 49.0, 56.0, 64.0, 83.0, 88.0, 97.0, 110.0, 136.0, 142.0, 153.0, 158.0, 164.0, 175.0, 183.0, 176.0, 162.0, 160.0, 170.0, 148.0, 138.0, 151.0, 143.0, 132.0, 111.0, 88.0, 89.0, 72.0, 69.0, 67.0, 58.0, 41.0, 44.0, 36.0, 20.0, 18.0, 20.0, 15.0, 15.0, 12.0, 5.0, 6.0, 5.0, 4.0, 6.0, 0.0, 4.0, 0.0, 1.0], "bins": [-11.7578125, -11.374267578125, -10.99072265625, -10.607177734375, -10.2236328125, -9.840087890625, -9.45654296875, -9.072998046875, -8.689453125, -8.305908203125, -7.92236328125, -7.538818359375, -7.1552734375, -6.771728515625, -6.38818359375, -6.004638671875, -5.62109375, -5.237548828125, -4.85400390625, -4.470458984375, -4.0869140625, -3.703369140625, -3.31982421875, -2.936279296875, -2.552734375, -2.169189453125, -1.78564453125, -1.402099609375, -1.0185546875, -0.635009765625, -0.25146484375, 0.132080078125, 0.515625, 0.899169921875, 1.28271484375, 1.666259765625, 2.0498046875, 2.433349609375, 2.81689453125, 3.200439453125, 3.583984375, 3.967529296875, 4.35107421875, 4.734619140625, 5.1181640625, 5.501708984375, 5.88525390625, 6.268798828125, 6.65234375, 7.035888671875, 7.41943359375, 7.802978515625, 8.1865234375, 8.570068359375, 8.95361328125, 9.337158203125, 9.720703125, 10.104248046875, 10.48779296875, 10.871337890625, 11.2548828125, 11.638427734375, 12.02197265625, 12.405517578125, 12.7890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 5.0, 8.0, 8.0, 17.0, 15.0, 10.0, 17.0, 30.0, 30.0, 15.0, 37.0, 24.0, 32.0, 29.0, 33.0, 39.0, 43.0, 41.0, 38.0, 37.0, 54.0, 44.0, 31.0, 33.0, 33.0, 34.0, 35.0, 34.0, 26.0, 24.0, 17.0, 16.0, 10.0, 19.0, 17.0, 7.0, 8.0, 5.0, 11.0, 7.0, 2.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.37582015991211, -29.334218978881836, -28.292619705200195, -27.251018524169922, -26.20941925048828, -25.167818069458008, -24.126216888427734, -23.084617614746094, -22.04301643371582, -21.001415252685547, -19.959815979003906, -18.918214797973633, -17.87661361694336, -16.83501434326172, -15.793413162231445, -14.751812934875488, -13.710212707519531, -12.668612480163574, -11.627012252807617, -10.585411071777344, -9.543810844421387, -8.50221061706543, -7.4606099128723145, -6.419009208679199, -5.377408981323242, -4.335808753967285, -3.29420804977417, -2.252607583999634, -1.2110071182250977, -0.16940689086914062, 0.8721938133239746, 1.9137945175170898, 2.9553985595703125, 3.9969990253448486, 5.038599491119385, 6.0802001953125, 7.121800422668457, 8.163400650024414, 9.205001831054688, 10.246602058410645, 11.288202285766602, 12.329802513122559, 13.371402740478516, 14.413003921508789, 15.454604148864746, 16.496204376220703, 17.537805557250977, 18.57940673828125, 19.62100601196289, 20.662607192993164, 21.704206466674805, 22.745807647705078, 23.78740692138672, 24.829008102416992, 25.870609283447266, 26.912208557128906, 27.95380973815918, 28.995410919189453, 30.037010192871094, 31.078611373901367, 32.12021255493164, 33.16181182861328, 34.20341110229492, 35.24501419067383, 36.28661346435547]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 4.0, 7.0, 7.0, 13.0, 10.0, 26.0, 15.0, 17.0, 23.0, 24.0, 34.0, 41.0, 37.0, 28.0, 41.0, 41.0, 39.0, 44.0, 43.0, 47.0, 47.0, 49.0, 34.0, 41.0, 47.0, 29.0, 22.0, 27.0, 27.0, 27.0, 23.0, 18.0, 15.0, 8.0, 13.0, 6.0, 5.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.401611328125, -34.16838836669922, -32.93516159057617, -31.70193862915039, -30.46871566772461, -29.235490798950195, -28.00226593017578, -26.76904296875, -25.535818099975586, -24.302593231201172, -23.06937026977539, -21.836145401000977, -20.602920532226562, -19.36969757080078, -18.136472702026367, -16.903247833251953, -15.670024871826172, -14.436800956726074, -13.203577041625977, -11.970352172851562, -10.737128257751465, -9.503904342651367, -8.270679473876953, -7.0374555587768555, -5.804231643676758, -4.57100772857666, -3.3377833366394043, -2.1045591831207275, -0.8713350296020508, 0.3618888854980469, 1.5951132774353027, 2.8283376693725586, 4.061561584472656, 5.294785499572754, 6.52800989151001, 7.761234283447266, 8.994458198547363, 10.227682113647461, 11.460906982421875, 12.694130897521973, 13.92735481262207, 15.160578727722168, 16.393802642822266, 17.62702751159668, 18.860252380371094, 20.093475341796875, 21.32670021057129, 22.559925079345703, 23.793148040771484, 25.0263729095459, 26.25959587097168, 27.492820739746094, 28.726043701171875, 29.95926856994629, 31.192493438720703, 32.425716400146484, 33.65894317626953, 34.89216613769531, 36.12539291381836, 37.35861587524414, 38.59183883666992, 39.82506561279297, 41.05828857421875, 42.29151153564453, 43.52473449707031]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 11.0, 12.0, 20.0, 31.0, 41.0, 69.0, 127.0, 142.0, 218.0, 338.0, 505.0, 843.0, 1326.0, 2101.0, 3236.0, 5248.0, 8367.0, 13515.0, 21893.0, 35227.0, 54864.0, 82203.0, 113623.0, 140268.0, 148513.0, 129380.0, 99063.0, 67912.0, 44540.0, 28186.0, 17693.0, 10953.0, 6703.0, 4235.0, 2555.0, 1646.0, 1041.0, 652.0, 470.0, 281.0, 167.0, 122.0, 73.0, 50.0, 29.0, 20.0, 15.0, 10.0, 4.0, 2.0, 7.0, 4.0, 1.0, 2.0], "bins": [-5.5859375, -5.42291259765625, -5.2598876953125, -5.09686279296875, -4.933837890625, -4.77081298828125, -4.6077880859375, -4.44476318359375, -4.28173828125, -4.11871337890625, -3.9556884765625, -3.79266357421875, -3.629638671875, -3.46661376953125, -3.3035888671875, -3.14056396484375, -2.9775390625, -2.81451416015625, -2.6514892578125, -2.48846435546875, -2.325439453125, -2.16241455078125, -1.9993896484375, -1.83636474609375, -1.67333984375, -1.51031494140625, -1.3472900390625, -1.18426513671875, -1.021240234375, -0.85821533203125, -0.6951904296875, -0.53216552734375, -0.369140625, -0.20611572265625, -0.0430908203125, 0.11993408203125, 0.282958984375, 0.44598388671875, 0.6090087890625, 0.77203369140625, 0.93505859375, 1.09808349609375, 1.2611083984375, 1.42413330078125, 1.587158203125, 1.75018310546875, 1.9132080078125, 2.07623291015625, 2.2392578125, 2.40228271484375, 2.5653076171875, 2.72833251953125, 2.891357421875, 3.05438232421875, 3.2174072265625, 3.38043212890625, 3.54345703125, 3.70648193359375, 3.8695068359375, 4.03253173828125, 4.195556640625, 4.35858154296875, 4.5216064453125, 4.68463134765625, 4.84765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 1.0, 5.0, 7.0, 12.0, 7.0, 7.0, 14.0, 19.0, 30.0, 14.0, 26.0, 27.0, 28.0, 34.0, 31.0, 40.0, 37.0, 36.0, 39.0, 45.0, 61.0, 56.0, 33.0, 37.0, 52.0, 38.0, 35.0, 33.0, 28.0, 23.0, 25.0, 29.0, 13.0, 12.0, 10.0, 11.0, 11.0, 12.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.53125, -32.2587890625, -30.986328125, -29.7138671875, -28.44140625, -27.1689453125, -25.896484375, -24.6240234375, -23.3515625, -22.0791015625, -20.806640625, -19.5341796875, -18.26171875, -16.9892578125, -15.716796875, -14.4443359375, -13.171875, -11.8994140625, -10.626953125, -9.3544921875, -8.08203125, -6.8095703125, -5.537109375, -4.2646484375, -2.9921875, -1.7197265625, -0.447265625, 0.8251953125, 2.09765625, 3.3701171875, 4.642578125, 5.9150390625, 7.1875, 8.4599609375, 9.732421875, 11.0048828125, 12.27734375, 13.5498046875, 14.822265625, 16.0947265625, 17.3671875, 18.6396484375, 19.912109375, 21.1845703125, 22.45703125, 23.7294921875, 25.001953125, 26.2744140625, 27.546875, 28.8193359375, 30.091796875, 31.3642578125, 32.63671875, 33.9091796875, 35.181640625, 36.4541015625, 37.7265625, 38.9990234375, 40.271484375, 41.5439453125, 42.81640625, 44.0888671875, 45.361328125, 46.6337890625, 47.90625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 7.0, 15.0, 18.0, 28.0, 42.0, 79.0, 84.0, 184.0, 292.0, 456.0, 815.0, 1394.0, 2274.0, 3952.0, 7367.0, 13227.0, 23916.0, 42727.0, 73601.0, 120781.0, 171806.0, 189673.0, 154606.0, 101995.0, 60739.0, 34740.0, 19197.0, 10675.0, 5808.0, 3329.0, 1911.0, 1115.0, 659.0, 393.0, 244.0, 156.0, 90.0, 59.0, 40.0, 24.0, 20.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.72265625, -7.49761962890625, -7.2725830078125, -7.04754638671875, -6.822509765625, -6.59747314453125, -6.3724365234375, -6.14739990234375, -5.92236328125, -5.69732666015625, -5.4722900390625, -5.24725341796875, -5.022216796875, -4.79718017578125, -4.5721435546875, -4.34710693359375, -4.1220703125, -3.89703369140625, -3.6719970703125, -3.44696044921875, -3.221923828125, -2.99688720703125, -2.7718505859375, -2.54681396484375, -2.32177734375, -2.09674072265625, -1.8717041015625, -1.64666748046875, -1.421630859375, -1.19659423828125, -0.9715576171875, -0.74652099609375, -0.521484375, -0.29644775390625, -0.0714111328125, 0.15362548828125, 0.378662109375, 0.60369873046875, 0.8287353515625, 1.05377197265625, 1.27880859375, 1.50384521484375, 1.7288818359375, 1.95391845703125, 2.178955078125, 2.40399169921875, 2.6290283203125, 2.85406494140625, 3.0791015625, 3.30413818359375, 3.5291748046875, 3.75421142578125, 3.979248046875, 4.20428466796875, 4.4293212890625, 4.65435791015625, 4.87939453125, 5.10443115234375, 5.3294677734375, 5.55450439453125, 5.779541015625, 6.00457763671875, 6.2296142578125, 6.45465087890625, 6.6796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 4.0, 3.0, 2.0, 1.0, 5.0, 5.0, 7.0, 6.0, 4.0, 9.0, 13.0, 15.0, 19.0, 22.0, 24.0, 20.0, 27.0, 15.0, 24.0, 35.0, 29.0, 29.0, 31.0, 39.0, 33.0, 52.0, 46.0, 39.0, 44.0, 41.0, 22.0, 34.0, 43.0, 22.0, 37.0, 26.0, 26.0, 23.0, 21.0, 18.0, 17.0, 16.0, 8.0, 10.0, 10.0, 7.0, 10.0, 4.0, 3.0, 4.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-19.34375, -18.637939453125, -17.93212890625, -17.226318359375, -16.5205078125, -15.814697265625, -15.10888671875, -14.403076171875, -13.697265625, -12.991455078125, -12.28564453125, -11.579833984375, -10.8740234375, -10.168212890625, -9.46240234375, -8.756591796875, -8.05078125, -7.344970703125, -6.63916015625, -5.933349609375, -5.2275390625, -4.521728515625, -3.81591796875, -3.110107421875, -2.404296875, -1.698486328125, -0.99267578125, -0.286865234375, 0.4189453125, 1.124755859375, 1.83056640625, 2.536376953125, 3.2421875, 3.947998046875, 4.65380859375, 5.359619140625, 6.0654296875, 6.771240234375, 7.47705078125, 8.182861328125, 8.888671875, 9.594482421875, 10.30029296875, 11.006103515625, 11.7119140625, 12.417724609375, 13.12353515625, 13.829345703125, 14.53515625, 15.240966796875, 15.94677734375, 16.652587890625, 17.3583984375, 18.064208984375, 18.77001953125, 19.475830078125, 20.181640625, 20.887451171875, 21.59326171875, 22.299072265625, 23.0048828125, 23.710693359375, 24.41650390625, 25.122314453125, 25.828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 4.0, 20.0, 20.0, 23.0, 29.0, 61.0, 68.0, 112.0, 175.0, 263.0, 401.0, 686.0, 1177.0, 2120.0, 4001.0, 8348.0, 18638.0, 43074.0, 101222.0, 211693.0, 290066.0, 199938.0, 93504.0, 39512.0, 16967.0, 7738.0, 3797.0, 1936.0, 1121.0, 624.0, 421.0, 287.0, 156.0, 91.0, 78.0, 55.0, 31.0, 27.0, 22.0, 15.0, 7.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0537109375, -1.0166778564453125, -0.979644775390625, -0.9426116943359375, -0.90557861328125, -0.8685455322265625, -0.831512451171875, -0.7944793701171875, -0.7574462890625, -0.7204132080078125, -0.683380126953125, -0.6463470458984375, -0.60931396484375, -0.5722808837890625, -0.535247802734375, -0.4982147216796875, -0.461181640625, -0.4241485595703125, -0.387115478515625, -0.3500823974609375, -0.31304931640625, -0.2760162353515625, -0.238983154296875, -0.2019500732421875, -0.1649169921875, -0.1278839111328125, -0.090850830078125, -0.0538177490234375, -0.01678466796875, 0.0202484130859375, 0.057281494140625, 0.0943145751953125, 0.13134765625, 0.1683807373046875, 0.205413818359375, 0.2424468994140625, 0.27947998046875, 0.3165130615234375, 0.353546142578125, 0.3905792236328125, 0.4276123046875, 0.4646453857421875, 0.501678466796875, 0.5387115478515625, 0.57574462890625, 0.6127777099609375, 0.649810791015625, 0.6868438720703125, 0.723876953125, 0.7609100341796875, 0.797943115234375, 0.8349761962890625, 0.87200927734375, 0.9090423583984375, 0.946075439453125, 0.9831085205078125, 1.0201416015625, 1.0571746826171875, 1.094207763671875, 1.1312408447265625, 1.16827392578125, 1.2053070068359375, 1.242340087890625, 1.2793731689453125, 1.31640625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 6.0, 6.0, 3.0, 11.0, 14.0, 29.0, 25.0, 26.0, 46.0, 38.0, 48.0, 46.0, 58.0, 59.0, 64.0, 60.0, 62.0, 56.0, 49.0, 46.0, 51.0, 31.0, 37.0, 29.0, 24.0, 20.0, 16.0, 10.0, 16.0, 4.0, 4.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001023411750793457, -9.90256667137146e-05, -9.57101583480835e-05, -9.239464998245239e-05, -8.907914161682129e-05, -8.576363325119019e-05, -8.244812488555908e-05, -7.913261651992798e-05, -7.581710815429688e-05, -7.250159978866577e-05, -6.918609142303467e-05, -6.587058305740356e-05, -6.255507469177246e-05, -5.923956632614136e-05, -5.5924057960510254e-05, -5.260854959487915e-05, -4.929304122924805e-05, -4.597753286361694e-05, -4.266202449798584e-05, -3.9346516132354736e-05, -3.603100776672363e-05, -3.271549940109253e-05, -2.9399991035461426e-05, -2.6084482669830322e-05, -2.276897430419922e-05, -1.9453465938568115e-05, -1.6137957572937012e-05, -1.2822449207305908e-05, -9.506940841674805e-06, -6.191432476043701e-06, -2.8759241104125977e-06, 4.3958425521850586e-07, 3.7550926208496094e-06, 7.070600986480713e-06, 1.0386109352111816e-05, 1.370161771774292e-05, 1.7017126083374023e-05, 2.0332634449005127e-05, 2.364814281463623e-05, 2.6963651180267334e-05, 3.0279159545898438e-05, 3.359466791152954e-05, 3.6910176277160645e-05, 4.022568464279175e-05, 4.354119300842285e-05, 4.6856701374053955e-05, 5.017220973968506e-05, 5.348771810531616e-05, 5.6803226470947266e-05, 6.011873483657837e-05, 6.343424320220947e-05, 6.674975156784058e-05, 7.006525993347168e-05, 7.338076829910278e-05, 7.669627666473389e-05, 8.001178503036499e-05, 8.33272933959961e-05, 8.66428017616272e-05, 8.99583101272583e-05, 9.32738184928894e-05, 9.658932685852051e-05, 9.990483522415161e-05, 0.00010322034358978271, 0.00010653585195541382, 0.00010985136032104492]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 13.0, 18.0, 31.0, 38.0, 63.0, 84.0, 119.0, 160.0, 227.0, 314.0, 415.0, 688.0, 874.0, 1301.0, 1953.0, 3005.0, 4692.0, 7300.0, 11657.0, 19819.0, 33247.0, 56441.0, 94377.0, 148807.0, 193370.0, 173366.0, 117360.0, 71045.0, 42295.0, 24872.0, 14945.0, 8991.0, 5556.0, 3604.0, 2265.0, 1613.0, 1063.0, 766.0, 547.0, 364.0, 279.0, 203.0, 122.0, 101.0, 63.0, 42.0, 26.0, 18.0, 10.0, 11.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.3046875, -1.2622222900390625, -1.219757080078125, -1.1772918701171875, -1.13482666015625, -1.0923614501953125, -1.049896240234375, -1.0074310302734375, -0.9649658203125, -0.9225006103515625, -0.880035400390625, -0.8375701904296875, -0.79510498046875, -0.7526397705078125, -0.710174560546875, -0.6677093505859375, -0.625244140625, -0.5827789306640625, -0.540313720703125, -0.4978485107421875, -0.45538330078125, -0.4129180908203125, -0.370452880859375, -0.3279876708984375, -0.2855224609375, -0.2430572509765625, -0.200592041015625, -0.1581268310546875, -0.11566162109375, -0.0731964111328125, -0.030731201171875, 0.0117340087890625, 0.05419921875, 0.0966644287109375, 0.139129638671875, 0.1815948486328125, 0.22406005859375, 0.2665252685546875, 0.308990478515625, 0.3514556884765625, 0.3939208984375, 0.4363861083984375, 0.478851318359375, 0.5213165283203125, 0.56378173828125, 0.6062469482421875, 0.648712158203125, 0.6911773681640625, 0.733642578125, 0.7761077880859375, 0.818572998046875, 0.8610382080078125, 0.90350341796875, 0.9459686279296875, 0.988433837890625, 1.0308990478515625, 1.0733642578125, 1.1158294677734375, 1.158294677734375, 1.2007598876953125, 1.24322509765625, 1.2856903076171875, 1.328155517578125, 1.3706207275390625, 1.4130859375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 6.0, 5.0, 7.0, 4.0, 5.0, 9.0, 8.0, 9.0, 6.0, 17.0, 20.0, 22.0, 15.0, 25.0, 43.0, 37.0, 36.0, 41.0, 52.0, 45.0, 54.0, 57.0, 70.0, 45.0, 46.0, 44.0, 37.0, 35.0, 38.0, 26.0, 19.0, 20.0, 17.0, 18.0, 11.0, 9.0, 12.0, 9.0, 6.0, 10.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.4677734375, -0.4536399841308594, -0.43950653076171875, -0.4253730773925781, -0.4112396240234375, -0.3971061706542969, -0.38297271728515625, -0.3688392639160156, -0.354705810546875, -0.3405723571777344, -0.32643890380859375, -0.3123054504394531, -0.2981719970703125, -0.2840385437011719, -0.26990509033203125, -0.2557716369628906, -0.24163818359375, -0.22750473022460938, -0.21337127685546875, -0.19923782348632812, -0.1851043701171875, -0.17097091674804688, -0.15683746337890625, -0.14270401000976562, -0.128570556640625, -0.11443710327148438, -0.10030364990234375, -0.08617019653320312, -0.0720367431640625, -0.057903289794921875, -0.04376983642578125, -0.029636383056640625, -0.0155029296875, -0.001369476318359375, 0.01276397705078125, 0.026897430419921875, 0.0410308837890625, 0.055164337158203125, 0.06929779052734375, 0.08343124389648438, 0.097564697265625, 0.11169815063476562, 0.12583160400390625, 0.13996505737304688, 0.1540985107421875, 0.16823196411132812, 0.18236541748046875, 0.19649887084960938, 0.21063232421875, 0.22476577758789062, 0.23889923095703125, 0.2530326843261719, 0.2671661376953125, 0.2812995910644531, 0.29543304443359375, 0.3095664978027344, 0.323699951171875, 0.3378334045410156, 0.35196685791015625, 0.3661003112792969, 0.3802337646484375, 0.3943672180175781, 0.40850067138671875, 0.4226341247558594, 0.436767578125]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 8.0, 6.0, 6.0, 10.0, 16.0, 12.0, 10.0, 19.0, 33.0, 27.0, 21.0, 33.0, 22.0, 34.0, 23.0, 40.0, 42.0, 45.0, 38.0, 31.0, 49.0, 40.0, 42.0, 33.0, 37.0, 33.0, 30.0, 37.0, 30.0, 26.0, 26.0, 18.0, 15.0, 13.0, 16.0, 16.0, 6.0, 12.0, 5.0, 11.0, 4.0, 3.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.883255004882812, -28.85761070251465, -27.831966400146484, -26.80632209777832, -25.780677795410156, -24.755033493041992, -23.729389190673828, -22.703746795654297, -21.6781005859375, -20.652456283569336, -19.626811981201172, -18.601167678833008, -17.575523376464844, -16.54987907409668, -15.524235725402832, -14.498591423034668, -13.47294807434082, -12.447303771972656, -11.421659469604492, -10.396015167236328, -9.370370864868164, -8.3447265625, -7.319083213806152, -6.293438911437988, -5.267794609069824, -4.24215030670166, -3.216506242752075, -2.1908621788024902, -1.1652178764343262, -0.1395735740661621, 0.8860702514648438, 1.9117145538330078, 2.937358856201172, 3.963003158569336, 4.9886474609375, 6.014291286468506, 7.03993558883667, 8.065580368041992, 9.09122371673584, 10.116868019104004, 11.142512321472168, 12.168156623840332, 13.193800926208496, 14.219444274902344, 15.245088577270508, 16.270732879638672, 17.296377182006836, 18.322021484375, 19.347665786743164, 20.373310089111328, 21.398954391479492, 22.424598693847656, 23.45024299621582, 24.475887298583984, 25.501529693603516, 26.527175903320312, 27.552818298339844, 28.578462600708008, 29.604106903076172, 30.629751205444336, 31.6553955078125, 32.68103790283203, 33.70668411254883, 34.73232650756836, 35.757972717285156]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 4.0, 7.0, 9.0, 11.0, 9.0, 26.0, 17.0, 16.0, 24.0, 27.0, 35.0, 36.0, 41.0, 24.0, 47.0, 38.0, 43.0, 45.0, 36.0, 47.0, 50.0, 50.0, 33.0, 44.0, 46.0, 26.0, 23.0, 26.0, 28.0, 25.0, 24.0, 19.0, 13.0, 8.0, 11.0, 6.0, 6.0, 2.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.287620544433594, -34.051116943359375, -32.814613342285156, -31.578107833862305, -30.341602325439453, -29.105098724365234, -27.868595123291016, -26.632091522216797, -25.395586013793945, -24.159082412719727, -22.922576904296875, -21.686073303222656, -20.449569702148438, -19.213064193725586, -17.976560592651367, -16.740055084228516, -15.503551483154297, -14.267046928405762, -13.030542373657227, -11.794038772583008, -10.557534217834473, -9.321029663085938, -8.084526062011719, -6.848021507263184, -5.611516952514648, -4.375012397766113, -3.1385083198547363, -1.9020040035247803, -0.6654996871948242, 0.5710048675537109, 1.807508945465088, 3.044013023376465, 4.280513763427734, 5.5170183181762695, 6.7535223960876465, 7.990026473999023, 9.226531028747559, 10.463035583496094, 11.699539184570312, 12.936043739318848, 14.172548294067383, 15.409052848815918, 16.645557403564453, 17.882061004638672, 19.11856460571289, 20.355070114135742, 21.59157371520996, 22.828079223632812, 24.06458282470703, 25.30108642578125, 26.5375919342041, 27.77409553527832, 29.010601043701172, 30.24710464477539, 31.48360824584961, 32.72011184692383, 33.95661926269531, 35.19312286376953, 36.42962646484375, 37.666133880615234, 38.90263748168945, 40.13914108276367, 41.37564468383789, 42.61214828491211, 43.84865188598633]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 15.0, 22.0, 45.0, 74.0, 113.0, 203.0, 315.0, 504.0, 784.0, 1284.0, 1958.0, 3073.0, 4587.0, 6883.0, 9971.0, 14144.0, 20162.0, 27051.0, 35815.0, 46010.0, 56099.0, 66439.0, 75504.0, 82655.0, 85804.0, 85363.0, 80498.0, 72788.0, 62901.0, 52907.0, 41923.0, 32267.0, 24521.0, 17519.0, 12627.0, 8919.0, 5819.0, 3808.0, 2616.0, 1702.0, 1024.0, 714.0, 430.0, 280.0, 146.0, 98.0, 77.0, 42.0, 25.0, 11.0, 11.0, 4.0, 0.0, 1.0, 3.0], "bins": [-17.0625, -16.5579833984375, -16.053466796875, -15.5489501953125, -15.04443359375, -14.5399169921875, -14.035400390625, -13.5308837890625, -13.0263671875, -12.5218505859375, -12.017333984375, -11.5128173828125, -11.00830078125, -10.5037841796875, -9.999267578125, -9.4947509765625, -8.990234375, -8.4857177734375, -7.981201171875, -7.4766845703125, -6.97216796875, -6.4676513671875, -5.963134765625, -5.4586181640625, -4.9541015625, -4.4495849609375, -3.945068359375, -3.4405517578125, -2.93603515625, -2.4315185546875, -1.927001953125, -1.4224853515625, -0.91796875, -0.4134521484375, 0.091064453125, 0.5955810546875, 1.10009765625, 1.6046142578125, 2.109130859375, 2.6136474609375, 3.1181640625, 3.6226806640625, 4.127197265625, 4.6317138671875, 5.13623046875, 5.6407470703125, 6.145263671875, 6.6497802734375, 7.154296875, 7.6588134765625, 8.163330078125, 8.6678466796875, 9.17236328125, 9.6768798828125, 10.181396484375, 10.6859130859375, 11.1904296875, 11.6949462890625, 12.199462890625, 12.7039794921875, 13.20849609375, 13.7130126953125, 14.217529296875, 14.7220458984375, 15.2265625]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 7.0, 7.0, 7.0, 10.0, 19.0, 15.0, 20.0, 23.0, 24.0, 24.0, 35.0, 36.0, 35.0, 37.0, 35.0, 36.0, 40.0, 42.0, 44.0, 47.0, 36.0, 38.0, 42.0, 34.0, 37.0, 42.0, 28.0, 22.0, 26.0, 32.0, 24.0, 23.0, 23.0, 8.0, 11.0, 4.0, 7.0, 0.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25, -34.02685546875, -32.8037109375, -31.58056640625, -30.357421875, -29.13427734375, -27.9111328125, -26.68798828125, -25.46484375, -24.24169921875, -23.0185546875, -21.79541015625, -20.572265625, -19.34912109375, -18.1259765625, -16.90283203125, -15.6796875, -14.45654296875, -13.2333984375, -12.01025390625, -10.787109375, -9.56396484375, -8.3408203125, -7.11767578125, -5.89453125, -4.67138671875, -3.4482421875, -2.22509765625, -1.001953125, 0.22119140625, 1.4443359375, 2.66748046875, 3.890625, 5.11376953125, 6.3369140625, 7.56005859375, 8.783203125, 10.00634765625, 11.2294921875, 12.45263671875, 13.67578125, 14.89892578125, 16.1220703125, 17.34521484375, 18.568359375, 19.79150390625, 21.0146484375, 22.23779296875, 23.4609375, 24.68408203125, 25.9072265625, 27.13037109375, 28.353515625, 29.57666015625, 30.7998046875, 32.02294921875, 33.24609375, 34.46923828125, 35.6923828125, 36.91552734375, 38.138671875, 39.36181640625, 40.5849609375, 41.80810546875, 43.03125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 7.0, 8.0, 16.0, 11.0, 22.0, 32.0, 69.0, 76.0, 135.0, 212.0, 369.0, 534.0, 844.0, 1295.0, 1869.0, 2870.0, 4304.0, 6263.0, 9374.0, 13320.0, 18927.0, 25823.0, 34755.0, 44481.0, 55747.0, 66369.0, 76799.0, 83823.0, 87047.0, 86446.0, 82317.0, 73883.0, 64474.0, 52546.0, 41952.0, 32340.0, 23973.0, 17293.0, 12059.0, 8498.0, 5864.0, 4006.0, 2582.0, 1712.0, 1103.0, 736.0, 467.0, 308.0, 224.0, 124.0, 84.0, 69.0, 46.0, 12.0, 14.0, 12.0, 12.0, 5.0, 4.0, 2.0], "bins": [-17.609375, -17.07373046875, -16.5380859375, -16.00244140625, -15.466796875, -14.93115234375, -14.3955078125, -13.85986328125, -13.32421875, -12.78857421875, -12.2529296875, -11.71728515625, -11.181640625, -10.64599609375, -10.1103515625, -9.57470703125, -9.0390625, -8.50341796875, -7.9677734375, -7.43212890625, -6.896484375, -6.36083984375, -5.8251953125, -5.28955078125, -4.75390625, -4.21826171875, -3.6826171875, -3.14697265625, -2.611328125, -2.07568359375, -1.5400390625, -1.00439453125, -0.46875, 0.06689453125, 0.6025390625, 1.13818359375, 1.673828125, 2.20947265625, 2.7451171875, 3.28076171875, 3.81640625, 4.35205078125, 4.8876953125, 5.42333984375, 5.958984375, 6.49462890625, 7.0302734375, 7.56591796875, 8.1015625, 8.63720703125, 9.1728515625, 9.70849609375, 10.244140625, 10.77978515625, 11.3154296875, 11.85107421875, 12.38671875, 12.92236328125, 13.4580078125, 13.99365234375, 14.529296875, 15.06494140625, 15.6005859375, 16.13623046875, 16.671875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 7.0, 7.0, 11.0, 10.0, 9.0, 11.0, 16.0, 19.0, 19.0, 18.0, 27.0, 24.0, 15.0, 40.0, 28.0, 46.0, 30.0, 38.0, 35.0, 36.0, 45.0, 50.0, 38.0, 39.0, 42.0, 42.0, 45.0, 33.0, 33.0, 25.0, 26.0, 20.0, 21.0, 22.0, 11.0, 10.0, 14.0, 8.0, 9.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.4375, -23.658447265625, -22.87939453125, -22.100341796875, -21.3212890625, -20.542236328125, -19.76318359375, -18.984130859375, -18.205078125, -17.426025390625, -16.64697265625, -15.867919921875, -15.0888671875, -14.309814453125, -13.53076171875, -12.751708984375, -11.97265625, -11.193603515625, -10.41455078125, -9.635498046875, -8.8564453125, -8.077392578125, -7.29833984375, -6.519287109375, -5.740234375, -4.961181640625, -4.18212890625, -3.403076171875, -2.6240234375, -1.844970703125, -1.06591796875, -0.286865234375, 0.4921875, 1.271240234375, 2.05029296875, 2.829345703125, 3.6083984375, 4.387451171875, 5.16650390625, 5.945556640625, 6.724609375, 7.503662109375, 8.28271484375, 9.061767578125, 9.8408203125, 10.619873046875, 11.39892578125, 12.177978515625, 12.95703125, 13.736083984375, 14.51513671875, 15.294189453125, 16.0732421875, 16.852294921875, 17.63134765625, 18.410400390625, 19.189453125, 19.968505859375, 20.74755859375, 21.526611328125, 22.3056640625, 23.084716796875, 23.86376953125, 24.642822265625, 25.421875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 7.0, 3.0, 7.0, 8.0, 15.0, 38.0, 44.0, 85.0, 109.0, 205.0, 295.0, 453.0, 647.0, 1001.0, 1675.0, 2361.0, 3453.0, 5270.0, 7475.0, 10788.0, 15100.0, 21362.0, 28402.0, 36810.0, 46685.0, 56833.0, 66858.0, 75087.0, 81151.0, 83486.0, 83117.0, 78028.0, 70702.0, 61922.0, 51497.0, 41561.0, 32314.0, 24619.0, 18272.0, 12863.0, 9139.0, 6226.0, 4269.0, 2903.0, 1868.0, 1245.0, 779.0, 558.0, 339.0, 205.0, 147.0, 98.0, 64.0, 35.0, 25.0, 32.0, 11.0, 9.0, 4.0, 3.0, 4.0], "bins": [-6.26171875, -6.07049560546875, -5.8792724609375, -5.68804931640625, -5.496826171875, -5.30560302734375, -5.1143798828125, -4.92315673828125, -4.73193359375, -4.54071044921875, -4.3494873046875, -4.15826416015625, -3.967041015625, -3.77581787109375, -3.5845947265625, -3.39337158203125, -3.2021484375, -3.01092529296875, -2.8197021484375, -2.62847900390625, -2.437255859375, -2.24603271484375, -2.0548095703125, -1.86358642578125, -1.67236328125, -1.48114013671875, -1.2899169921875, -1.09869384765625, -0.907470703125, -0.71624755859375, -0.5250244140625, -0.33380126953125, -0.142578125, 0.04864501953125, 0.2398681640625, 0.43109130859375, 0.622314453125, 0.81353759765625, 1.0047607421875, 1.19598388671875, 1.38720703125, 1.57843017578125, 1.7696533203125, 1.96087646484375, 2.152099609375, 2.34332275390625, 2.5345458984375, 2.72576904296875, 2.9169921875, 3.10821533203125, 3.2994384765625, 3.49066162109375, 3.681884765625, 3.87310791015625, 4.0643310546875, 4.25555419921875, 4.44677734375, 4.63800048828125, 4.8292236328125, 5.02044677734375, 5.211669921875, 5.40289306640625, 5.5941162109375, 5.78533935546875, 5.9765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 6.0, 4.0, 10.0, 8.0, 18.0, 15.0, 13.0, 16.0, 17.0, 30.0, 22.0, 31.0, 28.0, 37.0, 40.0, 46.0, 45.0, 40.0, 55.0, 45.0, 40.0, 45.0, 42.0, 37.0, 36.0, 33.0, 41.0, 34.0, 28.0, 22.0, 21.0, 24.0, 18.0, 10.0, 5.0, 11.0, 6.0, 7.0, 8.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009441375732421875, -0.0009143650531768799, -0.0008845925331115723, -0.0008548200130462646, -0.000825047492980957, -0.0007952749729156494, -0.0007655024528503418, -0.0007357299327850342, -0.0007059574127197266, -0.0006761848926544189, -0.0006464123725891113, -0.0006166398525238037, -0.0005868673324584961, -0.0005570948123931885, -0.0005273222923278809, -0.0004975497722625732, -0.0004677772521972656, -0.000438004732131958, -0.0004082322120666504, -0.0003784596920013428, -0.00034868717193603516, -0.00031891465187072754, -0.0002891421318054199, -0.0002593696117401123, -0.0002295970916748047, -0.00019982457160949707, -0.00017005205154418945, -0.00014027953147888184, -0.00011050701141357422, -8.07344913482666e-05, -5.0961971282958984e-05, -2.1189451217651367e-05, 8.58306884765625e-06, 3.835558891296387e-05, 6.812810897827148e-05, 9.79006290435791e-05, 0.00012767314910888672, 0.00015744566917419434, 0.00018721818923950195, 0.00021699070930480957, 0.0002467632293701172, 0.0002765357494354248, 0.0003063082695007324, 0.00033608078956604004, 0.00036585330963134766, 0.0003956258296966553, 0.0004253983497619629, 0.0004551708698272705, 0.0004849433898925781, 0.0005147159099578857, 0.0005444884300231934, 0.000574260950088501, 0.0006040334701538086, 0.0006338059902191162, 0.0006635785102844238, 0.0006933510303497314, 0.0007231235504150391, 0.0007528960704803467, 0.0007826685905456543, 0.0008124411106109619, 0.0008422136306762695, 0.0008719861507415771, 0.0009017586708068848, 0.0009315311908721924, 0.0009613037109375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 12.0, 16.0, 29.0, 39.0, 63.0, 111.0, 150.0, 232.0, 363.0, 635.0, 963.0, 1535.0, 2448.0, 3877.0, 5923.0, 9022.0, 13848.0, 20084.0, 28824.0, 39891.0, 53558.0, 67445.0, 81671.0, 92332.0, 98720.0, 98803.0, 93045.0, 81615.0, 68516.0, 54119.0, 40884.0, 29510.0, 20568.0, 13893.0, 9219.0, 6072.0, 3845.0, 2412.0, 1547.0, 997.0, 637.0, 417.0, 261.0, 147.0, 108.0, 61.0, 41.0, 19.0, 18.0, 11.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.7109375, -7.47015380859375, -7.2293701171875, -6.98858642578125, -6.747802734375, -6.50701904296875, -6.2662353515625, -6.02545166015625, -5.78466796875, -5.54388427734375, -5.3031005859375, -5.06231689453125, -4.821533203125, -4.58074951171875, -4.3399658203125, -4.09918212890625, -3.8583984375, -3.61761474609375, -3.3768310546875, -3.13604736328125, -2.895263671875, -2.65447998046875, -2.4136962890625, -2.17291259765625, -1.93212890625, -1.69134521484375, -1.4505615234375, -1.20977783203125, -0.968994140625, -0.72821044921875, -0.4874267578125, -0.24664306640625, -0.005859375, 0.23492431640625, 0.4757080078125, 0.71649169921875, 0.957275390625, 1.19805908203125, 1.4388427734375, 1.67962646484375, 1.92041015625, 2.16119384765625, 2.4019775390625, 2.64276123046875, 2.883544921875, 3.12432861328125, 3.3651123046875, 3.60589599609375, 3.8466796875, 4.08746337890625, 4.3282470703125, 4.56903076171875, 4.809814453125, 5.05059814453125, 5.2913818359375, 5.53216552734375, 5.77294921875, 6.01373291015625, 6.2545166015625, 6.49530029296875, 6.736083984375, 6.97686767578125, 7.2176513671875, 7.45843505859375, 7.69921875]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 5.0, 10.0, 9.0, 7.0, 8.0, 9.0, 12.0, 14.0, 20.0, 28.0, 20.0, 27.0, 34.0, 27.0, 30.0, 45.0, 46.0, 38.0, 43.0, 36.0, 41.0, 37.0, 50.0, 46.0, 36.0, 36.0, 33.0, 31.0, 28.0, 29.0, 37.0, 22.0, 11.0, 15.0, 14.0, 12.0, 5.0, 12.0, 8.0, 4.0, 3.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0], "bins": [-3.625, -3.5166015625, -3.408203125, -3.2998046875, -3.19140625, -3.0830078125, -2.974609375, -2.8662109375, -2.7578125, -2.6494140625, -2.541015625, -2.4326171875, -2.32421875, -2.2158203125, -2.107421875, -1.9990234375, -1.890625, -1.7822265625, -1.673828125, -1.5654296875, -1.45703125, -1.3486328125, -1.240234375, -1.1318359375, -1.0234375, -0.9150390625, -0.806640625, -0.6982421875, -0.58984375, -0.4814453125, -0.373046875, -0.2646484375, -0.15625, -0.0478515625, 0.060546875, 0.1689453125, 0.27734375, 0.3857421875, 0.494140625, 0.6025390625, 0.7109375, 0.8193359375, 0.927734375, 1.0361328125, 1.14453125, 1.2529296875, 1.361328125, 1.4697265625, 1.578125, 1.6865234375, 1.794921875, 1.9033203125, 2.01171875, 2.1201171875, 2.228515625, 2.3369140625, 2.4453125, 2.5537109375, 2.662109375, 2.7705078125, 2.87890625, 2.9873046875, 3.095703125, 3.2041015625, 3.3125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 3.0, 13.0, 7.0, 19.0, 13.0, 16.0, 19.0, 21.0, 28.0, 26.0, 31.0, 28.0, 33.0, 39.0, 45.0, 37.0, 56.0, 59.0, 46.0, 47.0, 35.0, 47.0, 52.0, 28.0, 35.0, 36.0, 32.0, 27.0, 13.0, 11.0, 18.0, 17.0, 13.0, 6.0, 9.0, 6.0, 10.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.935272216796875, -35.74992752075195, -34.56458282470703, -33.37923812866211, -32.19389343261719, -31.008546829223633, -29.823200225830078, -28.637855529785156, -27.452510833740234, -26.267166137695312, -25.08182144165039, -23.896474838256836, -22.711130142211914, -21.525785446166992, -20.340438842773438, -19.155094146728516, -17.969749450683594, -16.784404754638672, -15.599059104919434, -14.413713455200195, -13.228368759155273, -12.043024063110352, -10.857678413391113, -9.672332763671875, -8.486988067626953, -7.301642894744873, -6.116297721862793, -4.930952548980713, -3.745607376098633, -2.5602622032165527, -1.3749170303344727, -0.18957138061523438, 0.9957771301269531, 2.181122303009033, 3.3664674758911133, 4.551812648773193, 5.737157821655273, 6.9225029945373535, 8.107848167419434, 9.293193817138672, 10.478538513183594, 11.663883209228516, 12.849228858947754, 14.034574508666992, 15.219919204711914, 16.405263900756836, 17.59061050415039, 18.775955200195312, 19.961299896240234, 21.146644592285156, 22.331989288330078, 23.517335891723633, 24.702680587768555, 25.888025283813477, 27.07337188720703, 28.258716583251953, 29.444061279296875, 30.629405975341797, 31.81475067138672, 33.00009536743164, 34.18544006347656, 35.37078857421875, 36.55613327026367, 37.741477966308594, 38.926822662353516]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 12.0, 12.0, 8.0, 16.0, 16.0, 23.0, 23.0, 31.0, 30.0, 46.0, 38.0, 36.0, 33.0, 34.0, 49.0, 46.0, 48.0, 28.0, 45.0, 43.0, 39.0, 59.0, 41.0, 36.0, 34.0, 35.0, 17.0, 26.0, 22.0, 9.0, 17.0, 12.0, 11.0, 3.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.25132751464844, -40.81850814819336, -39.38568878173828, -37.9528694152832, -36.520050048828125, -35.08723068237305, -33.65441131591797, -32.221595764160156, -30.788774490356445, -29.355955123901367, -27.92313575744629, -26.490318298339844, -25.057498931884766, -23.624679565429688, -22.19186019897461, -20.75904083251953, -19.326221466064453, -17.893402099609375, -16.460582733154297, -15.027764320373535, -13.594944953918457, -12.162125587463379, -10.729307174682617, -9.296487808227539, -7.863668441772461, -6.430849075317383, -4.998030185699463, -3.565211296081543, -2.132391929626465, -0.6995725631713867, 0.733245849609375, 2.166065216064453, 3.5988845825195312, 5.031703948974609, 6.464522838592529, 7.897341728210449, 9.330161094665527, 10.762980461120605, 12.195798873901367, 13.628618240356445, 15.061437606811523, 16.4942569732666, 17.92707633972168, 19.359893798828125, 20.792713165283203, 22.22553253173828, 23.65835189819336, 25.091171264648438, 26.523990631103516, 27.956809997558594, 29.389629364013672, 30.82244873046875, 32.25526809692383, 33.688087463378906, 35.12090301513672, 36.55372619628906, 37.986541748046875, 39.41936111450195, 40.85218048095703, 42.28499984741211, 43.71781921386719, 45.150638580322266, 46.583457946777344, 48.016273498535156, 49.4490966796875]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [3.0, 14.0, 11.0, 19.0, 25.0, 54.0, 84.0, 142.0, 221.0, 370.0, 557.0, 916.0, 1530.0, 2302.0, 3497.0, 5439.0, 8434.0, 12306.0, 18511.0, 26811.0, 38447.0, 54175.0, 75005.0, 99963.0, 132461.0, 167132.0, 206725.0, 244937.0, 280860.0, 308619.0, 325407.0, 330308.0, 318000.0, 296064.0, 263961.0, 225580.0, 187133.0, 147743.0, 114878.0, 86603.0, 63796.0, 45592.0, 32333.0, 22043.0, 15227.0, 10215.0, 7048.0, 4489.0, 2884.0, 1952.0, 1241.0, 808.0, 530.0, 336.0, 232.0, 123.0, 75.0, 52.0, 33.0, 16.0, 18.0, 7.0, 5.0, 2.0], "bins": [-23.625, -22.869140625, -22.11328125, -21.357421875, -20.6015625, -19.845703125, -19.08984375, -18.333984375, -17.578125, -16.822265625, -16.06640625, -15.310546875, -14.5546875, -13.798828125, -13.04296875, -12.287109375, -11.53125, -10.775390625, -10.01953125, -9.263671875, -8.5078125, -7.751953125, -6.99609375, -6.240234375, -5.484375, -4.728515625, -3.97265625, -3.216796875, -2.4609375, -1.705078125, -0.94921875, -0.193359375, 0.5625, 1.318359375, 2.07421875, 2.830078125, 3.5859375, 4.341796875, 5.09765625, 5.853515625, 6.609375, 7.365234375, 8.12109375, 8.876953125, 9.6328125, 10.388671875, 11.14453125, 11.900390625, 12.65625, 13.412109375, 14.16796875, 14.923828125, 15.6796875, 16.435546875, 17.19140625, 17.947265625, 18.703125, 19.458984375, 20.21484375, 20.970703125, 21.7265625, 22.482421875, 23.23828125, 23.994140625, 24.75]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 4.0, 3.0, 4.0, 12.0, 10.0, 11.0, 15.0, 30.0, 25.0, 24.0, 29.0, 34.0, 47.0, 41.0, 50.0, 38.0, 42.0, 38.0, 46.0, 39.0, 55.0, 42.0, 33.0, 43.0, 48.0, 32.0, 29.0, 39.0, 26.0, 27.0, 18.0, 21.0, 6.0, 11.0, 8.0, 5.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.21875, -38.82568359375, -37.4326171875, -36.03955078125, -34.646484375, -33.25341796875, -31.8603515625, -30.46728515625, -29.07421875, -27.68115234375, -26.2880859375, -24.89501953125, -23.501953125, -22.10888671875, -20.7158203125, -19.32275390625, -17.9296875, -16.53662109375, -15.1435546875, -13.75048828125, -12.357421875, -10.96435546875, -9.5712890625, -8.17822265625, -6.78515625, -5.39208984375, -3.9990234375, -2.60595703125, -1.212890625, 0.18017578125, 1.5732421875, 2.96630859375, 4.359375, 5.75244140625, 7.1455078125, 8.53857421875, 9.931640625, 11.32470703125, 12.7177734375, 14.11083984375, 15.50390625, 16.89697265625, 18.2900390625, 19.68310546875, 21.076171875, 22.46923828125, 23.8623046875, 25.25537109375, 26.6484375, 28.04150390625, 29.4345703125, 30.82763671875, 32.220703125, 33.61376953125, 35.0068359375, 36.39990234375, 37.79296875, 39.18603515625, 40.5791015625, 41.97216796875, 43.365234375, 44.75830078125, 46.1513671875, 47.54443359375, 48.9375]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 9.0, 7.0, 22.0, 33.0, 52.0, 101.0, 195.0, 335.0, 613.0, 1176.0, 2123.0, 3734.0, 6502.0, 11439.0, 19120.0, 32274.0, 52148.0, 81254.0, 122102.0, 174636.0, 236404.0, 304919.0, 364503.0, 409665.0, 427608.0, 417532.0, 378398.0, 321869.0, 255505.0, 192704.0, 136198.0, 91395.0, 58871.0, 37299.0, 22367.0, 13303.0, 7797.0, 4468.0, 2489.0, 1397.0, 779.0, 409.0, 243.0, 127.0, 75.0, 31.0, 27.0, 25.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.0, -34.8623046875, -33.724609375, -32.5869140625, -31.44921875, -30.3115234375, -29.173828125, -28.0361328125, -26.8984375, -25.7607421875, -24.623046875, -23.4853515625, -22.34765625, -21.2099609375, -20.072265625, -18.9345703125, -17.796875, -16.6591796875, -15.521484375, -14.3837890625, -13.24609375, -12.1083984375, -10.970703125, -9.8330078125, -8.6953125, -7.5576171875, -6.419921875, -5.2822265625, -4.14453125, -3.0068359375, -1.869140625, -0.7314453125, 0.40625, 1.5439453125, 2.681640625, 3.8193359375, 4.95703125, 6.0947265625, 7.232421875, 8.3701171875, 9.5078125, 10.6455078125, 11.783203125, 12.9208984375, 14.05859375, 15.1962890625, 16.333984375, 17.4716796875, 18.609375, 19.7470703125, 20.884765625, 22.0224609375, 23.16015625, 24.2978515625, 25.435546875, 26.5732421875, 27.7109375, 28.8486328125, 29.986328125, 31.1240234375, 32.26171875, 33.3994140625, 34.537109375, 35.6748046875, 36.8125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 8.0, 6.0, 10.0, 7.0, 15.0, 17.0, 27.0, 25.0, 35.0, 30.0, 41.0, 73.0, 93.0, 109.0, 109.0, 140.0, 140.0, 164.0, 176.0, 188.0, 201.0, 203.0, 202.0, 230.0, 203.0, 182.0, 187.0, 189.0, 155.0, 129.0, 115.0, 135.0, 93.0, 98.0, 66.0, 65.0, 55.0, 38.0, 35.0, 23.0, 18.0, 20.0, 8.0, 5.0, 4.0, 3.0, 5.0, 4.0, 3.0], "bins": [-23.359375, -22.739501953125, -22.11962890625, -21.499755859375, -20.8798828125, -20.260009765625, -19.64013671875, -19.020263671875, -18.400390625, -17.780517578125, -17.16064453125, -16.540771484375, -15.9208984375, -15.301025390625, -14.68115234375, -14.061279296875, -13.44140625, -12.821533203125, -12.20166015625, -11.581787109375, -10.9619140625, -10.342041015625, -9.72216796875, -9.102294921875, -8.482421875, -7.862548828125, -7.24267578125, -6.622802734375, -6.0029296875, -5.383056640625, -4.76318359375, -4.143310546875, -3.5234375, -2.903564453125, -2.28369140625, -1.663818359375, -1.0439453125, -0.424072265625, 0.19580078125, 0.815673828125, 1.435546875, 2.055419921875, 2.67529296875, 3.295166015625, 3.9150390625, 4.534912109375, 5.15478515625, 5.774658203125, 6.39453125, 7.014404296875, 7.63427734375, 8.254150390625, 8.8740234375, 9.493896484375, 10.11376953125, 10.733642578125, 11.353515625, 11.973388671875, 12.59326171875, 13.213134765625, 13.8330078125, 14.452880859375, 15.07275390625, 15.692626953125, 16.3125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 3.0, 4.0, 5.0, 6.0, 12.0, 13.0, 15.0, 28.0, 19.0, 21.0, 16.0, 36.0, 33.0, 38.0, 43.0, 43.0, 62.0, 57.0, 47.0, 48.0, 59.0, 40.0, 37.0, 34.0, 34.0, 41.0, 24.0, 26.0, 31.0, 18.0, 20.0, 18.0, 11.0, 10.0, 11.0, 6.0, 7.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-57.164886474609375, -55.528656005859375, -53.892425537109375, -52.25619125366211, -50.61996078491211, -48.98373031616211, -47.347496032714844, -45.711265563964844, -44.075035095214844, -42.438804626464844, -40.802574157714844, -39.16633987426758, -37.53010940551758, -35.89387893676758, -34.25764465332031, -32.62141418457031, -30.985183715820312, -29.348953247070312, -27.71272087097168, -26.076488494873047, -24.440258026123047, -22.804027557373047, -21.167795181274414, -19.53156280517578, -17.89533233642578, -16.25910186767578, -14.622869491577148, -12.986638069152832, -11.350406646728516, -9.7141752243042, -8.077943801879883, -6.441712379455566, -4.80548095703125, -3.1692495346069336, -1.5330181121826172, 0.10321331024169922, 1.7394447326660156, 3.375676155090332, 5.011907577514648, 6.648138999938965, 8.284370422363281, 9.920601844787598, 11.556833267211914, 13.19306468963623, 14.829296112060547, 16.465526580810547, 18.10175895690918, 19.737991333007812, 21.374221801757812, 23.010452270507812, 24.646684646606445, 26.282917022705078, 27.919147491455078, 29.555377960205078, 31.19161033630371, 32.827842712402344, 34.464073181152344, 36.100303649902344, 37.736534118652344, 39.37276840209961, 41.00899887084961, 42.64522933959961, 44.281463623046875, 45.917694091796875, 47.553924560546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 8.0, 12.0, 10.0, 12.0, 20.0, 17.0, 13.0, 21.0, 24.0, 26.0, 30.0, 49.0, 37.0, 43.0, 38.0, 50.0, 36.0, 50.0, 40.0, 46.0, 54.0, 38.0, 50.0, 45.0, 37.0, 35.0, 30.0, 22.0, 27.0, 18.0, 10.0, 12.0, 11.0, 10.0, 5.0, 4.0, 5.0, 1.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.53180694580078, -53.77714920043945, -52.022491455078125, -50.26783752441406, -48.513179779052734, -46.758522033691406, -45.00386428833008, -43.24920654296875, -41.49454879760742, -39.739891052246094, -37.985233306884766, -36.23057556152344, -34.475921630859375, -32.72126388549805, -30.96660614013672, -29.21194839477539, -27.457292556762695, -25.702634811401367, -23.947978973388672, -22.193321228027344, -20.438663482666016, -18.684005737304688, -16.929349899291992, -15.174692153930664, -13.420035362243652, -11.66537857055664, -9.910720825195312, -8.1560640335083, -6.401406764984131, -4.646749496459961, -2.892092704772949, -1.137434959411621, 0.6172218322753906, 2.3718791007995605, 4.1265363693237305, 5.881193161010742, 7.635850429534912, 9.390507698059082, 11.145164489746094, 12.899822235107422, 14.654479026794434, 16.409135818481445, 18.163793563842773, 19.91844940185547, 21.673107147216797, 23.427764892578125, 25.182422637939453, 26.93708038330078, 28.691736221313477, 30.446393966674805, 32.2010498046875, 33.95570755004883, 35.710365295410156, 37.465023040771484, 39.21968078613281, 40.974334716796875, 42.7289924621582, 44.48365020751953, 46.23830795288086, 47.99296569824219, 49.74761962890625, 51.50227737426758, 53.256935119628906, 55.011592864990234, 56.76625061035156]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 13.0, 16.0, 49.0, 42.0, 53.0, 94.0, 135.0, 201.0, 289.0, 452.0, 706.0, 1112.0, 1557.0, 2543.0, 3829.0, 5839.0, 9310.0, 14902.0, 23269.0, 36531.0, 56100.0, 82515.0, 114099.0, 138189.0, 143347.0, 126019.0, 96425.0, 67221.0, 44701.0, 28626.0, 18124.0, 11495.0, 7311.0, 4640.0, 3039.0, 2035.0, 1232.0, 839.0, 515.0, 365.0, 250.0, 194.0, 107.0, 75.0, 57.0, 40.0, 13.0, 11.0, 11.0, 3.0, 3.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.78125, -6.5640869140625, -6.346923828125, -6.1297607421875, -5.91259765625, -5.6954345703125, -5.478271484375, -5.2611083984375, -5.0439453125, -4.8267822265625, -4.609619140625, -4.3924560546875, -4.17529296875, -3.9581298828125, -3.740966796875, -3.5238037109375, -3.306640625, -3.0894775390625, -2.872314453125, -2.6551513671875, -2.43798828125, -2.2208251953125, -2.003662109375, -1.7864990234375, -1.5693359375, -1.3521728515625, -1.135009765625, -0.9178466796875, -0.70068359375, -0.4835205078125, -0.266357421875, -0.0491943359375, 0.16796875, 0.3851318359375, 0.602294921875, 0.8194580078125, 1.03662109375, 1.2537841796875, 1.470947265625, 1.6881103515625, 1.9052734375, 2.1224365234375, 2.339599609375, 2.5567626953125, 2.77392578125, 2.9910888671875, 3.208251953125, 3.4254150390625, 3.642578125, 3.8597412109375, 4.076904296875, 4.2940673828125, 4.51123046875, 4.7283935546875, 4.945556640625, 5.1627197265625, 5.3798828125, 5.5970458984375, 5.814208984375, 6.0313720703125, 6.24853515625, 6.4656982421875, 6.682861328125, 6.9000244140625, 7.1171875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 8.0, 6.0, 13.0, 9.0, 13.0, 13.0, 9.0, 16.0, 22.0, 18.0, 15.0, 27.0, 28.0, 37.0, 36.0, 34.0, 37.0, 25.0, 45.0, 33.0, 45.0, 37.0, 41.0, 47.0, 36.0, 40.0, 42.0, 31.0, 22.0, 22.0, 25.0, 23.0, 25.0, 19.0, 23.0, 15.0, 11.0, 6.0, 14.0, 6.0, 0.0, 9.0, 0.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.21875, -44.666015625, -43.11328125, -41.560546875, -40.0078125, -38.455078125, -36.90234375, -35.349609375, -33.796875, -32.244140625, -30.69140625, -29.138671875, -27.5859375, -26.033203125, -24.48046875, -22.927734375, -21.375, -19.822265625, -18.26953125, -16.716796875, -15.1640625, -13.611328125, -12.05859375, -10.505859375, -8.953125, -7.400390625, -5.84765625, -4.294921875, -2.7421875, -1.189453125, 0.36328125, 1.916015625, 3.46875, 5.021484375, 6.57421875, 8.126953125, 9.6796875, 11.232421875, 12.78515625, 14.337890625, 15.890625, 17.443359375, 18.99609375, 20.548828125, 22.1015625, 23.654296875, 25.20703125, 26.759765625, 28.3125, 29.865234375, 31.41796875, 32.970703125, 34.5234375, 36.076171875, 37.62890625, 39.181640625, 40.734375, 42.287109375, 43.83984375, 45.392578125, 46.9453125, 48.498046875, 50.05078125, 51.603515625, 53.15625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 7.0, 16.0, 17.0, 30.0, 45.0, 74.0, 111.0, 179.0, 302.0, 515.0, 802.0, 1309.0, 2351.0, 3983.0, 7066.0, 12593.0, 22085.0, 39185.0, 68192.0, 110313.0, 159828.0, 185231.0, 161237.0, 112624.0, 68505.0, 39576.0, 22451.0, 12793.0, 7182.0, 4072.0, 2415.0, 1316.0, 830.0, 532.0, 279.0, 197.0, 109.0, 78.0, 42.0, 33.0, 17.0, 15.0, 11.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.796875, -8.5177001953125, -8.238525390625, -7.9593505859375, -7.68017578125, -7.4010009765625, -7.121826171875, -6.8426513671875, -6.5634765625, -6.2843017578125, -6.005126953125, -5.7259521484375, -5.44677734375, -5.1676025390625, -4.888427734375, -4.6092529296875, -4.330078125, -4.0509033203125, -3.771728515625, -3.4925537109375, -3.21337890625, -2.9342041015625, -2.655029296875, -2.3758544921875, -2.0966796875, -1.8175048828125, -1.538330078125, -1.2591552734375, -0.97998046875, -0.7008056640625, -0.421630859375, -0.1424560546875, 0.13671875, 0.4158935546875, 0.695068359375, 0.9742431640625, 1.25341796875, 1.5325927734375, 1.811767578125, 2.0909423828125, 2.3701171875, 2.6492919921875, 2.928466796875, 3.2076416015625, 3.48681640625, 3.7659912109375, 4.045166015625, 4.3243408203125, 4.603515625, 4.8826904296875, 5.161865234375, 5.4410400390625, 5.72021484375, 5.9993896484375, 6.278564453125, 6.5577392578125, 6.8369140625, 7.1160888671875, 7.395263671875, 7.6744384765625, 7.95361328125, 8.2327880859375, 8.511962890625, 8.7911376953125, 9.0703125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 4.0, 6.0, 8.0, 1.0, 5.0, 6.0, 16.0, 11.0, 10.0, 16.0, 15.0, 15.0, 29.0, 26.0, 22.0, 23.0, 39.0, 54.0, 50.0, 24.0, 38.0, 31.0, 44.0, 46.0, 44.0, 38.0, 35.0, 34.0, 35.0, 31.0, 25.0, 23.0, 34.0, 31.0, 20.0, 14.0, 15.0, 13.0, 14.0, 14.0, 8.0, 7.0, 6.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0], "bins": [-31.328125, -30.367919921875, -29.40771484375, -28.447509765625, -27.4873046875, -26.527099609375, -25.56689453125, -24.606689453125, -23.646484375, -22.686279296875, -21.72607421875, -20.765869140625, -19.8056640625, -18.845458984375, -17.88525390625, -16.925048828125, -15.96484375, -15.004638671875, -14.04443359375, -13.084228515625, -12.1240234375, -11.163818359375, -10.20361328125, -9.243408203125, -8.283203125, -7.322998046875, -6.36279296875, -5.402587890625, -4.4423828125, -3.482177734375, -2.52197265625, -1.561767578125, -0.6015625, 0.358642578125, 1.31884765625, 2.279052734375, 3.2392578125, 4.199462890625, 5.15966796875, 6.119873046875, 7.080078125, 8.040283203125, 9.00048828125, 9.960693359375, 10.9208984375, 11.881103515625, 12.84130859375, 13.801513671875, 14.76171875, 15.721923828125, 16.68212890625, 17.642333984375, 18.6025390625, 19.562744140625, 20.52294921875, 21.483154296875, 22.443359375, 23.403564453125, 24.36376953125, 25.323974609375, 26.2841796875, 27.244384765625, 28.20458984375, 29.164794921875, 30.125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 5.0, 8.0, 8.0, 14.0, 12.0, 22.0, 35.0, 42.0, 72.0, 100.0, 143.0, 200.0, 307.0, 464.0, 673.0, 1096.0, 1886.0, 3221.0, 5569.0, 10178.0, 19075.0, 36435.0, 68869.0, 124002.0, 193172.0, 216490.0, 160888.0, 94473.0, 51086.0, 27193.0, 14327.0, 7676.0, 4362.0, 2449.0, 1479.0, 891.0, 537.0, 324.0, 255.0, 149.0, 103.0, 80.0, 56.0, 31.0, 38.0, 19.0, 15.0, 12.0, 10.0, 6.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2216796875, -1.179931640625, -1.13818359375, -1.096435546875, -1.0546875, -1.012939453125, -0.97119140625, -0.929443359375, -0.8876953125, -0.845947265625, -0.80419921875, -0.762451171875, -0.720703125, -0.678955078125, -0.63720703125, -0.595458984375, -0.5537109375, -0.511962890625, -0.47021484375, -0.428466796875, -0.38671875, -0.344970703125, -0.30322265625, -0.261474609375, -0.2197265625, -0.177978515625, -0.13623046875, -0.094482421875, -0.052734375, -0.010986328125, 0.03076171875, 0.072509765625, 0.1142578125, 0.156005859375, 0.19775390625, 0.239501953125, 0.28125, 0.322998046875, 0.36474609375, 0.406494140625, 0.4482421875, 0.489990234375, 0.53173828125, 0.573486328125, 0.615234375, 0.656982421875, 0.69873046875, 0.740478515625, 0.7822265625, 0.823974609375, 0.86572265625, 0.907470703125, 0.94921875, 0.990966796875, 1.03271484375, 1.074462890625, 1.1162109375, 1.157958984375, 1.19970703125, 1.241455078125, 1.283203125, 1.324951171875, 1.36669921875, 1.408447265625, 1.4501953125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 10.0, 5.0, 6.0, 12.0, 7.0, 12.0, 18.0, 6.0, 15.0, 19.0, 17.0, 21.0, 20.0, 29.0, 29.0, 30.0, 47.0, 35.0, 34.0, 33.0, 53.0, 38.0, 36.0, 54.0, 44.0, 36.0, 39.0, 37.0, 23.0, 31.0, 32.0, 30.0, 23.0, 19.0, 15.0, 19.0, 10.0, 6.0, 9.0, 7.0, 2.0, 8.0, 9.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.00010484457015991211, -0.00010163150727748871, -9.841844439506531e-05, -9.52053815126419e-05, -9.19923186302185e-05, -8.87792557477951e-05, -8.55661928653717e-05, -8.23531299829483e-05, -7.91400671005249e-05, -7.59270042181015e-05, -7.27139413356781e-05, -6.95008784532547e-05, -6.62878155708313e-05, -6.30747526884079e-05, -5.98616898059845e-05, -5.6648626923561096e-05, -5.3435564041137695e-05, -5.0222501158714294e-05, -4.7009438276290894e-05, -4.379637539386749e-05, -4.058331251144409e-05, -3.737024962902069e-05, -3.415718674659729e-05, -3.094412386417389e-05, -2.7731060981750488e-05, -2.4517998099327087e-05, -2.1304935216903687e-05, -1.8091872334480286e-05, -1.4878809452056885e-05, -1.1665746569633484e-05, -8.452683687210083e-06, -5.239620804786682e-06, -2.0265579223632812e-06, 1.1865049600601196e-06, 4.3995678424835205e-06, 7.612630724906921e-06, 1.0825693607330322e-05, 1.4038756489753723e-05, 1.7251819372177124e-05, 2.0464882254600525e-05, 2.3677945137023926e-05, 2.6891008019447327e-05, 3.0104070901870728e-05, 3.331713378429413e-05, 3.653019666671753e-05, 3.974325954914093e-05, 4.295632243156433e-05, 4.616938531398773e-05, 4.938244819641113e-05, 5.2595511078834534e-05, 5.5808573961257935e-05, 5.9021636843681335e-05, 6.223469972610474e-05, 6.544776260852814e-05, 6.866082549095154e-05, 7.187388837337494e-05, 7.508695125579834e-05, 7.830001413822174e-05, 8.151307702064514e-05, 8.472613990306854e-05, 8.793920278549194e-05, 9.115226566791534e-05, 9.436532855033875e-05, 9.757839143276215e-05, 0.00010079145431518555]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 9.0, 16.0, 17.0, 35.0, 53.0, 53.0, 88.0, 110.0, 180.0, 278.0, 364.0, 621.0, 840.0, 1328.0, 1968.0, 3073.0, 4799.0, 7393.0, 12016.0, 19239.0, 32285.0, 52732.0, 85821.0, 135501.0, 183883.0, 177617.0, 124874.0, 78745.0, 47734.0, 28872.0, 17517.0, 10952.0, 6790.0, 4453.0, 2711.0, 1860.0, 1251.0, 770.0, 566.0, 357.0, 237.0, 173.0, 108.0, 83.0, 54.0, 38.0, 28.0, 19.0, 15.0, 10.0, 8.0, 3.0, 3.0, 3.0, 2.0], "bins": [-2.193359375, -2.128662109375, -2.06396484375, -1.999267578125, -1.9345703125, -1.869873046875, -1.80517578125, -1.740478515625, -1.67578125, -1.611083984375, -1.54638671875, -1.481689453125, -1.4169921875, -1.352294921875, -1.28759765625, -1.222900390625, -1.158203125, -1.093505859375, -1.02880859375, -0.964111328125, -0.8994140625, -0.834716796875, -0.77001953125, -0.705322265625, -0.640625, -0.575927734375, -0.51123046875, -0.446533203125, -0.3818359375, -0.317138671875, -0.25244140625, -0.187744140625, -0.123046875, -0.058349609375, 0.00634765625, 0.071044921875, 0.1357421875, 0.200439453125, 0.26513671875, 0.329833984375, 0.39453125, 0.459228515625, 0.52392578125, 0.588623046875, 0.6533203125, 0.718017578125, 0.78271484375, 0.847412109375, 0.912109375, 0.976806640625, 1.04150390625, 1.106201171875, 1.1708984375, 1.235595703125, 1.30029296875, 1.364990234375, 1.4296875, 1.494384765625, 1.55908203125, 1.623779296875, 1.6884765625, 1.753173828125, 1.81787109375, 1.882568359375, 1.947265625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 5.0, 7.0, 9.0, 10.0, 9.0, 20.0, 22.0, 17.0, 30.0, 27.0, 41.0, 40.0, 61.0, 61.0, 72.0, 80.0, 83.0, 68.0, 63.0, 48.0, 49.0, 38.0, 32.0, 25.0, 18.0, 21.0, 11.0, 14.0, 6.0, 8.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71337890625, -0.6857070922851562, -0.6580352783203125, -0.6303634643554688, -0.602691650390625, -0.5750198364257812, -0.5473480224609375, -0.5196762084960938, -0.49200439453125, -0.46433258056640625, -0.4366607666015625, -0.40898895263671875, -0.381317138671875, -0.35364532470703125, -0.3259735107421875, -0.29830169677734375, -0.2706298828125, -0.24295806884765625, -0.2152862548828125, -0.18761444091796875, -0.159942626953125, -0.13227081298828125, -0.1045989990234375, -0.07692718505859375, -0.04925537109375, -0.02158355712890625, 0.0060882568359375, 0.03376007080078125, 0.061431884765625, 0.08910369873046875, 0.1167755126953125, 0.14444732666015625, 0.172119140625, 0.19979095458984375, 0.2274627685546875, 0.25513458251953125, 0.282806396484375, 0.31047821044921875, 0.3381500244140625, 0.36582183837890625, 0.39349365234375, 0.42116546630859375, 0.4488372802734375, 0.47650909423828125, 0.504180908203125, 0.5318527221679688, 0.5595245361328125, 0.5871963500976562, 0.6148681640625, 0.6425399780273438, 0.6702117919921875, 0.6978836059570312, 0.725555419921875, 0.7532272338867188, 0.7808990478515625, 0.8085708618164062, 0.83624267578125, 0.8639144897460938, 0.8915863037109375, 0.9192581176757812, 0.946929931640625, 0.9746017456054688, 1.0022735595703125, 1.0299453735351562, 1.0576171875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 2.0, 4.0, 4.0, 8.0, 9.0, 13.0, 16.0, 21.0, 24.0, 19.0, 17.0, 34.0, 32.0, 35.0, 48.0, 39.0, 63.0, 60.0, 45.0, 42.0, 55.0, 52.0, 34.0, 32.0, 41.0, 40.0, 27.0, 23.0, 33.0, 19.0, 17.0, 19.0, 17.0, 8.0, 7.0, 11.0, 6.0, 5.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-57.571441650390625, -55.9372673034668, -54.30309295654297, -52.66891860961914, -51.03474426269531, -49.400569915771484, -47.766395568847656, -46.132225036621094, -44.498046875, -42.86387252807617, -41.229698181152344, -39.595523834228516, -37.96134948730469, -36.32717514038086, -34.69300079345703, -33.05883026123047, -31.42465591430664, -29.790481567382812, -28.156307220458984, -26.522132873535156, -24.887958526611328, -23.2537841796875, -21.619611740112305, -19.985437393188477, -18.35126304626465, -16.71708869934082, -15.082914352416992, -13.44874095916748, -11.814566612243652, -10.180392265319824, -8.546218872070312, -6.912044525146484, -5.277873992919922, -3.643699884414673, -2.009525775909424, -0.3753519058227539, 1.2588224411010742, 2.8929967880249023, 4.527170181274414, 6.161344528198242, 7.79551887512207, 9.429693222045898, 11.063867568969727, 12.698040962219238, 14.332215309143066, 15.966389656066895, 17.600563049316406, 19.234737396240234, 20.868911743164062, 22.50308609008789, 24.13726043701172, 25.771434783935547, 27.405609130859375, 29.039783477783203, 30.6739559173584, 32.308128356933594, 33.94230651855469, 35.576480865478516, 37.210655212402344, 38.84482955932617, 40.47900390625, 42.11317825317383, 43.747352600097656, 45.38152313232422, 47.01569747924805]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 13.0, 8.0, 13.0, 20.0, 17.0, 14.0, 18.0, 29.0, 24.0, 31.0, 49.0, 35.0, 45.0, 38.0, 50.0, 36.0, 52.0, 39.0, 47.0, 51.0, 39.0, 49.0, 46.0, 38.0, 34.0, 32.0, 19.0, 30.0, 16.0, 10.0, 10.0, 12.0, 9.0, 5.0, 5.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.09373092651367, -54.33269500732422, -52.571659088134766, -50.81062316894531, -49.049591064453125, -47.28855514526367, -45.52751922607422, -43.766483306884766, -42.00544738769531, -40.24441146850586, -38.483375549316406, -36.72234344482422, -34.961307525634766, -33.20027160644531, -31.43923568725586, -29.678199768066406, -27.91716766357422, -26.156131744384766, -24.395097732543945, -22.634061813354492, -20.873027801513672, -19.11199188232422, -17.350955963134766, -15.589920997619629, -13.828886032104492, -12.067851066589355, -10.306816101074219, -8.545780181884766, -6.784745216369629, -5.023710250854492, -3.262674331665039, -1.5016393661499023, 0.2593955993652344, 2.02043080329895, 3.781466007232666, 5.542501449584961, 7.303536415100098, 9.064571380615234, 10.825607299804688, 12.586642265319824, 14.347677230834961, 16.108713150024414, 17.869747161865234, 19.630783081054688, 21.39181900024414, 23.15285301208496, 24.913888931274414, 26.674922943115234, 28.435958862304688, 30.19699478149414, 31.95802879333496, 33.71906280517578, 35.480098724365234, 37.24113464355469, 39.00217056274414, 40.763206481933594, 42.52423858642578, 44.285274505615234, 46.04631042480469, 47.807342529296875, 49.56837844848633, 51.32941436767578, 53.090450286865234, 54.85148620605469, 56.61252212524414]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 12.0, 22.0, 51.0, 87.0, 127.0, 196.0, 333.0, 566.0, 919.0, 1516.0, 2474.0, 3760.0, 6025.0, 9551.0, 14535.0, 21571.0, 30723.0, 42543.0, 56514.0, 71576.0, 85019.0, 96656.0, 101366.0, 100010.0, 92359.0, 79701.0, 65271.0, 50505.0, 36997.0, 26568.0, 18029.0, 12052.0, 7652.0, 4997.0, 3245.0, 1974.0, 1216.0, 738.0, 417.0, 268.0, 154.0, 110.0, 64.0, 30.0, 22.0, 11.0, 10.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.34375, -23.5263671875, -22.708984375, -21.8916015625, -21.07421875, -20.2568359375, -19.439453125, -18.6220703125, -17.8046875, -16.9873046875, -16.169921875, -15.3525390625, -14.53515625, -13.7177734375, -12.900390625, -12.0830078125, -11.265625, -10.4482421875, -9.630859375, -8.8134765625, -7.99609375, -7.1787109375, -6.361328125, -5.5439453125, -4.7265625, -3.9091796875, -3.091796875, -2.2744140625, -1.45703125, -0.6396484375, 0.177734375, 0.9951171875, 1.8125, 2.6298828125, 3.447265625, 4.2646484375, 5.08203125, 5.8994140625, 6.716796875, 7.5341796875, 8.3515625, 9.1689453125, 9.986328125, 10.8037109375, 11.62109375, 12.4384765625, 13.255859375, 14.0732421875, 14.890625, 15.7080078125, 16.525390625, 17.3427734375, 18.16015625, 18.9775390625, 19.794921875, 20.6123046875, 21.4296875, 22.2470703125, 23.064453125, 23.8818359375, 24.69921875, 25.5166015625, 26.333984375, 27.1513671875, 27.96875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 6.0, 10.0, 5.0, 10.0, 6.0, 10.0, 18.0, 14.0, 17.0, 23.0, 28.0, 34.0, 37.0, 30.0, 39.0, 41.0, 42.0, 41.0, 54.0, 45.0, 41.0, 46.0, 41.0, 42.0, 50.0, 47.0, 37.0, 26.0, 26.0, 21.0, 24.0, 10.0, 14.0, 11.0, 16.0, 14.0, 2.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.03125, -52.3818359375, -50.732421875, -49.0830078125, -47.43359375, -45.7841796875, -44.134765625, -42.4853515625, -40.8359375, -39.1865234375, -37.537109375, -35.8876953125, -34.23828125, -32.5888671875, -30.939453125, -29.2900390625, -27.640625, -25.9912109375, -24.341796875, -22.6923828125, -21.04296875, -19.3935546875, -17.744140625, -16.0947265625, -14.4453125, -12.7958984375, -11.146484375, -9.4970703125, -7.84765625, -6.1982421875, -4.548828125, -2.8994140625, -1.25, 0.3994140625, 2.048828125, 3.6982421875, 5.34765625, 6.9970703125, 8.646484375, 10.2958984375, 11.9453125, 13.5947265625, 15.244140625, 16.8935546875, 18.54296875, 20.1923828125, 21.841796875, 23.4912109375, 25.140625, 26.7900390625, 28.439453125, 30.0888671875, 31.73828125, 33.3876953125, 35.037109375, 36.6865234375, 38.3359375, 39.9853515625, 41.634765625, 43.2841796875, 44.93359375, 46.5830078125, 48.232421875, 49.8818359375, 51.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 14.0, 16.0, 23.0, 29.0, 67.0, 99.0, 137.0, 243.0, 342.0, 545.0, 822.0, 1270.0, 1928.0, 2865.0, 4457.0, 6630.0, 9839.0, 14633.0, 21082.0, 30221.0, 41777.0, 55117.0, 69928.0, 83714.0, 94793.0, 101026.0, 99316.0, 91615.0, 79307.0, 64797.0, 50538.0, 37021.0, 26753.0, 18866.0, 12893.0, 8877.0, 5857.0, 3774.0, 2587.0, 1728.0, 1023.0, 667.0, 451.0, 301.0, 193.0, 124.0, 81.0, 59.0, 38.0, 34.0, 16.0, 12.0, 9.0, 1.0, 3.0, 2.0, 1.0], "bins": [-30.484375, -29.555908203125, -28.62744140625, -27.698974609375, -26.7705078125, -25.842041015625, -24.91357421875, -23.985107421875, -23.056640625, -22.128173828125, -21.19970703125, -20.271240234375, -19.3427734375, -18.414306640625, -17.48583984375, -16.557373046875, -15.62890625, -14.700439453125, -13.77197265625, -12.843505859375, -11.9150390625, -10.986572265625, -10.05810546875, -9.129638671875, -8.201171875, -7.272705078125, -6.34423828125, -5.415771484375, -4.4873046875, -3.558837890625, -2.63037109375, -1.701904296875, -0.7734375, 0.155029296875, 1.08349609375, 2.011962890625, 2.9404296875, 3.868896484375, 4.79736328125, 5.725830078125, 6.654296875, 7.582763671875, 8.51123046875, 9.439697265625, 10.3681640625, 11.296630859375, 12.22509765625, 13.153564453125, 14.08203125, 15.010498046875, 15.93896484375, 16.867431640625, 17.7958984375, 18.724365234375, 19.65283203125, 20.581298828125, 21.509765625, 22.438232421875, 23.36669921875, 24.295166015625, 25.2236328125, 26.152099609375, 27.08056640625, 28.009033203125, 28.9375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 9.0, 8.0, 11.0, 9.0, 21.0, 24.0, 19.0, 25.0, 22.0, 37.0, 29.0, 39.0, 34.0, 34.0, 39.0, 43.0, 42.0, 46.0, 46.0, 44.0, 41.0, 40.0, 32.0, 35.0, 31.0, 29.0, 44.0, 21.0, 27.0, 23.0, 14.0, 12.0, 10.0, 11.0, 9.0, 6.0, 4.0, 5.0, 8.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.375, -30.36181640625, -29.3486328125, -28.33544921875, -27.322265625, -26.30908203125, -25.2958984375, -24.28271484375, -23.26953125, -22.25634765625, -21.2431640625, -20.22998046875, -19.216796875, -18.20361328125, -17.1904296875, -16.17724609375, -15.1640625, -14.15087890625, -13.1376953125, -12.12451171875, -11.111328125, -10.09814453125, -9.0849609375, -8.07177734375, -7.05859375, -6.04541015625, -5.0322265625, -4.01904296875, -3.005859375, -1.99267578125, -0.9794921875, 0.03369140625, 1.046875, 2.06005859375, 3.0732421875, 4.08642578125, 5.099609375, 6.11279296875, 7.1259765625, 8.13916015625, 9.15234375, 10.16552734375, 11.1787109375, 12.19189453125, 13.205078125, 14.21826171875, 15.2314453125, 16.24462890625, 17.2578125, 18.27099609375, 19.2841796875, 20.29736328125, 21.310546875, 22.32373046875, 23.3369140625, 24.35009765625, 25.36328125, 26.37646484375, 27.3896484375, 28.40283203125, 29.416015625, 30.42919921875, 31.4423828125, 32.45556640625, 33.46875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 7.0, 22.0, 18.0, 24.0, 34.0, 71.0, 116.0, 202.0, 286.0, 432.0, 674.0, 1113.0, 1688.0, 2869.0, 4303.0, 6724.0, 10529.0, 15685.0, 22967.0, 33097.0, 45950.0, 61141.0, 76392.0, 89980.0, 99748.0, 103050.0, 99843.0, 89890.0, 75691.0, 60655.0, 45790.0, 32844.0, 22704.0, 15604.0, 10102.0, 6568.0, 4313.0, 2706.0, 1800.0, 1040.0, 686.0, 394.0, 293.0, 186.0, 127.0, 68.0, 57.0, 24.0, 19.0, 15.0, 10.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-11.46875, -11.1044921875, -10.740234375, -10.3759765625, -10.01171875, -9.6474609375, -9.283203125, -8.9189453125, -8.5546875, -8.1904296875, -7.826171875, -7.4619140625, -7.09765625, -6.7333984375, -6.369140625, -6.0048828125, -5.640625, -5.2763671875, -4.912109375, -4.5478515625, -4.18359375, -3.8193359375, -3.455078125, -3.0908203125, -2.7265625, -2.3623046875, -1.998046875, -1.6337890625, -1.26953125, -0.9052734375, -0.541015625, -0.1767578125, 0.1875, 0.5517578125, 0.916015625, 1.2802734375, 1.64453125, 2.0087890625, 2.373046875, 2.7373046875, 3.1015625, 3.4658203125, 3.830078125, 4.1943359375, 4.55859375, 4.9228515625, 5.287109375, 5.6513671875, 6.015625, 6.3798828125, 6.744140625, 7.1083984375, 7.47265625, 7.8369140625, 8.201171875, 8.5654296875, 8.9296875, 9.2939453125, 9.658203125, 10.0224609375, 10.38671875, 10.7509765625, 11.115234375, 11.4794921875, 11.84375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 7.0, 4.0, 4.0, 6.0, 6.0, 11.0, 9.0, 18.0, 24.0, 24.0, 27.0, 34.0, 35.0, 28.0, 52.0, 52.0, 64.0, 47.0, 65.0, 53.0, 50.0, 56.0, 56.0, 44.0, 40.0, 44.0, 31.0, 22.0, 24.0, 7.0, 10.0, 10.0, 12.0, 9.0, 7.0, 3.0, 6.0, 1.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016155242919921875, -0.0015586018562316895, -0.0015016794204711914, -0.0014447569847106934, -0.0013878345489501953, -0.0013309121131896973, -0.0012739896774291992, -0.0012170672416687012, -0.0011601448059082031, -0.001103222370147705, -0.001046299934387207, -0.000989377498626709, -0.0009324550628662109, -0.0008755326271057129, -0.0008186101913452148, -0.0007616877555847168, -0.0007047653198242188, -0.0006478428840637207, -0.0005909204483032227, -0.0005339980125427246, -0.00047707557678222656, -0.0004201531410217285, -0.00036323070526123047, -0.0003063082695007324, -0.0002493858337402344, -0.00019246339797973633, -0.00013554096221923828, -7.861852645874023e-05, -2.1696090698242188e-05, 3.522634506225586e-05, 9.21487808227539e-05, 0.00014907121658325195, 0.00020599365234375, 0.00026291608810424805, 0.0003198385238647461, 0.00037676095962524414, 0.0004336833953857422, 0.0004906058311462402, 0.0005475282669067383, 0.0006044507026672363, 0.0006613731384277344, 0.0007182955741882324, 0.0007752180099487305, 0.0008321404457092285, 0.0008890628814697266, 0.0009459853172302246, 0.0010029077529907227, 0.0010598301887512207, 0.0011167526245117188, 0.0011736750602722168, 0.0012305974960327148, 0.0012875199317932129, 0.001344442367553711, 0.001401364803314209, 0.001458287239074707, 0.001515209674835205, 0.0015721321105957031, 0.0016290545463562012, 0.0016859769821166992, 0.0017428994178771973, 0.0017998218536376953, 0.0018567442893981934, 0.0019136667251586914, 0.0019705891609191895, 0.0020275115966796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 4.0, 16.0, 6.0, 21.0, 61.0, 74.0, 119.0, 186.0, 277.0, 461.0, 762.0, 1197.0, 1860.0, 2985.0, 4678.0, 7410.0, 11167.0, 17272.0, 25328.0, 36564.0, 50568.0, 66479.0, 82600.0, 95939.0, 104702.0, 105123.0, 98783.0, 86175.0, 70799.0, 54149.0, 39997.0, 28222.0, 19148.0, 12677.0, 8277.0, 5364.0, 3290.0, 2211.0, 1380.0, 834.0, 505.0, 332.0, 199.0, 129.0, 81.0, 55.0, 42.0, 21.0, 12.0, 12.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.421875, -12.0352783203125, -11.648681640625, -11.2620849609375, -10.87548828125, -10.4888916015625, -10.102294921875, -9.7156982421875, -9.3291015625, -8.9425048828125, -8.555908203125, -8.1693115234375, -7.78271484375, -7.3961181640625, -7.009521484375, -6.6229248046875, -6.236328125, -5.8497314453125, -5.463134765625, -5.0765380859375, -4.68994140625, -4.3033447265625, -3.916748046875, -3.5301513671875, -3.1435546875, -2.7569580078125, -2.370361328125, -1.9837646484375, -1.59716796875, -1.2105712890625, -0.823974609375, -0.4373779296875, -0.05078125, 0.3358154296875, 0.722412109375, 1.1090087890625, 1.49560546875, 1.8822021484375, 2.268798828125, 2.6553955078125, 3.0419921875, 3.4285888671875, 3.815185546875, 4.2017822265625, 4.58837890625, 4.9749755859375, 5.361572265625, 5.7481689453125, 6.134765625, 6.5213623046875, 6.907958984375, 7.2945556640625, 7.68115234375, 8.0677490234375, 8.454345703125, 8.8409423828125, 9.2275390625, 9.6141357421875, 10.000732421875, 10.3873291015625, 10.77392578125, 11.1605224609375, 11.547119140625, 11.9337158203125, 12.3203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 10.0, 4.0, 10.0, 8.0, 10.0, 17.0, 14.0, 16.0, 14.0, 18.0, 24.0, 34.0, 29.0, 23.0, 25.0, 40.0, 30.0, 39.0, 38.0, 37.0, 37.0, 38.0, 45.0, 29.0, 43.0, 35.0, 33.0, 33.0, 29.0, 27.0, 29.0, 22.0, 21.0, 17.0, 13.0, 11.0, 12.0, 8.0, 10.0, 14.0, 10.0, 12.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-5.32421875, -5.1627197265625, -5.001220703125, -4.8397216796875, -4.67822265625, -4.5167236328125, -4.355224609375, -4.1937255859375, -4.0322265625, -3.8707275390625, -3.709228515625, -3.5477294921875, -3.38623046875, -3.2247314453125, -3.063232421875, -2.9017333984375, -2.740234375, -2.5787353515625, -2.417236328125, -2.2557373046875, -2.09423828125, -1.9327392578125, -1.771240234375, -1.6097412109375, -1.4482421875, -1.2867431640625, -1.125244140625, -0.9637451171875, -0.80224609375, -0.6407470703125, -0.479248046875, -0.3177490234375, -0.15625, 0.0052490234375, 0.166748046875, 0.3282470703125, 0.48974609375, 0.6512451171875, 0.812744140625, 0.9742431640625, 1.1357421875, 1.2972412109375, 1.458740234375, 1.6202392578125, 1.78173828125, 1.9432373046875, 2.104736328125, 2.2662353515625, 2.427734375, 2.5892333984375, 2.750732421875, 2.9122314453125, 3.07373046875, 3.2352294921875, 3.396728515625, 3.5582275390625, 3.7197265625, 3.8812255859375, 4.042724609375, 4.2042236328125, 4.36572265625, 4.5272216796875, 4.688720703125, 4.8502197265625, 5.01171875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 8.0, 7.0, 6.0, 6.0, 12.0, 7.0, 19.0, 18.0, 28.0, 31.0, 20.0, 27.0, 43.0, 43.0, 56.0, 41.0, 49.0, 43.0, 51.0, 62.0, 50.0, 47.0, 39.0, 33.0, 43.0, 29.0, 22.0, 40.0, 21.0, 17.0, 12.0, 13.0, 12.0, 10.0, 10.0, 8.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-60.628501892089844, -58.87873840332031, -57.12897872924805, -55.379215240478516, -53.62945556640625, -51.87969207763672, -50.12992858886719, -48.380165100097656, -46.63040542602539, -44.88064193725586, -43.130882263183594, -41.38111877441406, -39.63135528564453, -37.881595611572266, -36.131832122802734, -34.38207244873047, -32.63230895996094, -30.88254737854004, -29.13278579711914, -27.38302230834961, -25.63326072692871, -23.883499145507812, -22.13373565673828, -20.383974075317383, -18.634212493896484, -16.884450912475586, -15.134688377380371, -13.384925842285156, -11.635164260864258, -9.88540267944336, -8.135640144348145, -6.38587760925293, -4.636112213134766, -2.886350154876709, -1.1365880966186523, 0.6131739616394043, 2.362936019897461, 4.112697601318359, 5.862460136413574, 7.612222671508789, 9.361984252929688, 11.111745834350586, 12.8615083694458, 14.611270904541016, 16.361032485961914, 18.110794067382812, 19.860557556152344, 21.610319137573242, 23.36008071899414, 25.10984230041504, 26.859603881835938, 28.60936737060547, 30.359128952026367, 32.108890533447266, 33.8586540222168, 35.60841369628906, 37.358177185058594, 39.107940673828125, 40.85770034790039, 42.60746383666992, 44.35722351074219, 46.10698699951172, 47.85675048828125, 49.60651397705078, 51.35627365112305]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 4.0, 7.0, 4.0, 6.0, 10.0, 12.0, 17.0, 9.0, 14.0, 18.0, 21.0, 22.0, 17.0, 24.0, 27.0, 42.0, 40.0, 40.0, 33.0, 55.0, 45.0, 34.0, 41.0, 43.0, 51.0, 37.0, 31.0, 41.0, 32.0, 22.0, 26.0, 18.0, 29.0, 21.0, 16.0, 20.0, 10.0, 8.0, 10.0, 13.0, 9.0, 6.0, 0.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0], "bins": [-58.50265121459961, -56.67827224731445, -54.85389709472656, -53.029518127441406, -51.20513916015625, -49.380760192871094, -47.5563850402832, -45.73200607299805, -43.907630920410156, -42.083251953125, -40.25887680053711, -38.43449783325195, -36.6101188659668, -34.785743713378906, -32.96136474609375, -31.136985778808594, -29.312606811523438, -27.488229751586914, -25.663850784301758, -23.839473724365234, -22.015094757080078, -20.190717697143555, -18.36634063720703, -16.541961669921875, -14.717584609985352, -12.893206596374512, -11.068828582763672, -9.244451522827148, -7.420073509216309, -5.595695495605469, -3.7713184356689453, -1.9469404220581055, -0.12255859375, 1.7018191814422607, 3.5261969566345215, 5.350574493408203, 7.174952507019043, 8.999330520629883, 10.823707580566406, 12.648085594177246, 14.472463607788086, 16.29684066772461, 18.121219635009766, 19.94559669494629, 21.769973754882812, 23.59435272216797, 25.418729782104492, 27.243106842041016, 29.067485809326172, 30.891862869262695, 32.71623992919922, 34.540618896484375, 36.36499786376953, 38.18937683105469, 40.01375198364258, 41.838130950927734, 43.662506103515625, 45.48688507080078, 47.31126022338867, 49.13563919067383, 50.960018157958984, 52.784393310546875, 54.60877227783203, 56.43315124511719, 58.257530212402344]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 14.0, 17.0, 15.0, 28.0, 55.0, 68.0, 94.0, 132.0, 178.0, 237.0, 337.0, 474.0, 639.0, 821.0, 1188.0, 1516.0, 1887.0, 2581.0, 3189.0, 4227.0, 6303.0, 997455.0, 7945.0, 5431.0, 3668.0, 2981.0, 2193.0, 1769.0, 1343.0, 1102.0, 775.0, 540.0, 376.0, 289.0, 212.0, 153.0, 93.0, 82.0, 60.0, 36.0, 34.0, 19.0, 11.0, 9.0, 11.0, 4.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-523.710693359375, -508.21435546875, -492.718017578125, -477.2217102050781, -461.7253723144531, -446.2290344238281, -430.7326965332031, -415.23638916015625, -399.74005126953125, -384.24371337890625, -368.74737548828125, -353.2510681152344, -337.7547302246094, -322.2583923339844, -306.7620544433594, -291.2657470703125, -275.7694091796875, -260.2730712890625, -244.77674865722656, -229.28041076660156, -213.78408813476562, -198.28775024414062, -182.79141235351562, -167.2950897216797, -151.79873657226562, -136.30239868164062, -120.80607604980469, -105.30973815917969, -89.81341552734375, -74.31707763671875, -58.82074737548828, -43.32441711425781, -27.828094482421875, -12.33176326751709, 3.1645679473876953, 18.660900115966797, 34.157230377197266, 49.653564453125, 65.14989471435547, 80.64622497558594, 96.1425552368164, 111.63888549804688, 127.13521575927734, 142.6315460205078, 158.1278839111328, 173.62420654296875, 189.12054443359375, 204.61688232421875, 220.1132049560547, 235.6095428466797, 251.10586547851562, 266.6022033691406, 282.0985412597656, 297.5948486328125, 313.0911865234375, 328.5875244140625, 344.0838623046875, 359.5802001953125, 375.0765380859375, 390.5728454589844, 406.0691833496094, 421.5655212402344, 437.0618591308594, 452.55816650390625, 468.05450439453125]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 8.0, 12.0, 12.0, 19.0, 29.0, 41.0, 77.0, 108.0, 125.0, 203.0, 314.0, 413.0, 638.0, 1020.0, 1646.0, 2551.0, 4466.0, 7486.0, 11797.0, 18430.0, 26933.0, 48969.0, 51201664.0, 62414.0, 29003.0, 19525.0, 12665.0, 7963.0, 4876.0, 2846.0, 1754.0, 1129.0, 742.0, 447.0, 323.0, 209.0, 130.0, 120.0, 74.0, 54.0, 30.0, 28.0, 23.0, 9.0, 11.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-671.0728149414062, -652.2144775390625, -633.3560791015625, -614.4976806640625, -595.6393432617188, -576.781005859375, -557.922607421875, -539.064208984375, -520.2058715820312, -501.3475036621094, -482.4891357421875, -463.6307678222656, -444.77239990234375, -425.9140319824219, -407.0556640625, -388.1972961425781, -369.33892822265625, -350.4805603027344, -331.6221923828125, -312.7638244628906, -293.90545654296875, -275.0470886230469, -256.188720703125, -237.33035278320312, -218.47198486328125, -199.61361694335938, -180.7552490234375, -161.89688110351562, -143.03851318359375, -124.18014526367188, -105.32177734375, -86.46340942382812, -67.6051025390625, -48.746734619140625, -29.88836669921875, -11.029998779296875, 7.828369140625, 26.686737060546875, 45.54510498046875, 64.40347290039062, 83.2618408203125, 102.12020874023438, 120.97857666015625, 139.83694458007812, 158.6953125, 177.55368041992188, 196.41204833984375, 215.27041625976562, 234.1287841796875, 252.98715209960938, 271.84552001953125, 290.7038879394531, 309.562255859375, 328.4206237792969, 347.27899169921875, 366.1373596191406, 384.9957275390625, 403.8540954589844, 422.71246337890625, 441.5708312988281, 460.42919921875, 479.2875671386719, 498.14593505859375, 517.0042724609375, 535.8626708984375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 6.0, 6.0, 10.0, 20.0, 33.0, 37.0, 49.0, 88.0, 137.0, 252.0, 327.0, 560.0, 952.0, 1634.0, 2688.0, 4351.0, 7376.0, 12192.0, 20207.0, 33627.0, 56659.0, 93429.0, 152521.0, 250886.0, 428531.0, 950910.0, 2266198.0, 947666.0, 428124.0, 249244.0, 151735.0, 92349.0, 55448.0, 33094.0, 19942.0, 11947.0, 7121.0, 4271.0, 2669.0, 1581.0, 959.0, 590.0, 391.0, 233.0, 136.0, 97.0, 54.0, 36.0, 25.0, 21.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-9.875, -9.5511474609375, -9.227294921875, -8.9034423828125, -8.57958984375, -8.2557373046875, -7.931884765625, -7.6080322265625, -7.2841796875, -6.9603271484375, -6.636474609375, -6.3126220703125, -5.98876953125, -5.6649169921875, -5.341064453125, -5.0172119140625, -4.693359375, -4.3695068359375, -4.045654296875, -3.7218017578125, -3.39794921875, -3.0740966796875, -2.750244140625, -2.4263916015625, -2.1025390625, -1.7786865234375, -1.454833984375, -1.1309814453125, -0.80712890625, -0.4832763671875, -0.159423828125, 0.1644287109375, 0.48828125, 0.8121337890625, 1.135986328125, 1.4598388671875, 1.78369140625, 2.1075439453125, 2.431396484375, 2.7552490234375, 3.0791015625, 3.4029541015625, 3.726806640625, 4.0506591796875, 4.37451171875, 4.6983642578125, 5.022216796875, 5.3460693359375, 5.669921875, 5.9937744140625, 6.317626953125, 6.6414794921875, 6.96533203125, 7.2891845703125, 7.613037109375, 7.9368896484375, 8.2607421875, 8.5845947265625, 8.908447265625, 9.2322998046875, 9.55615234375, 9.8800048828125, 10.203857421875, 10.5277099609375, 10.8515625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 7.0, 4.0, 4.0, 4.0, 8.0, 6.0, 16.0, 5.0, 8.0, 19.0, 9.0, 19.0, 23.0, 15.0, 24.0, 35.0, 35.0, 30.0, 41.0, 46.0, 49.0, 87.0, 199.0, 354.0, 361.0, 145.0, 56.0, 43.0, 32.0, 32.0, 49.0, 33.0, 34.0, 21.0, 22.0, 19.0, 23.0, 18.0, 15.0, 16.0, 10.0, 14.0, 8.0, 6.0, 7.0, 3.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-34.84375, -33.75830078125, -32.6728515625, -31.58740234375, -30.501953125, -29.41650390625, -28.3310546875, -27.24560546875, -26.16015625, -25.07470703125, -23.9892578125, -22.90380859375, -21.818359375, -20.73291015625, -19.6474609375, -18.56201171875, -17.4765625, -16.39111328125, -15.3056640625, -14.22021484375, -13.134765625, -12.04931640625, -10.9638671875, -9.87841796875, -8.79296875, -7.70751953125, -6.6220703125, -5.53662109375, -4.451171875, -3.36572265625, -2.2802734375, -1.19482421875, -0.109375, 0.97607421875, 2.0615234375, 3.14697265625, 4.232421875, 5.31787109375, 6.4033203125, 7.48876953125, 8.57421875, 9.65966796875, 10.7451171875, 11.83056640625, 12.916015625, 14.00146484375, 15.0869140625, 16.17236328125, 17.2578125, 18.34326171875, 19.4287109375, 20.51416015625, 21.599609375, 22.68505859375, 23.7705078125, 24.85595703125, 25.94140625, 27.02685546875, 28.1123046875, 29.19775390625, 30.283203125, 31.36865234375, 32.4541015625, 33.53955078125, 34.625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 3.0, 6.0, 8.0, 24.0, 34.0, 44.0, 95.0, 154.0, 266.0, 466.0, 817.0, 1450.0, 2442.0, 4272.0, 7893.0, 13934.0, 24792.0, 43255.0, 74332.0, 126022.0, 208800.0, 334919.0, 646842.0, 2752526.0, 1040173.0, 400537.0, 246183.0, 150989.0, 90207.0, 51521.0, 29778.0, 16807.0, 9778.0, 5296.0, 2904.0, 1596.0, 914.0, 576.0, 315.0, 177.0, 109.0, 70.0, 37.0, 34.0, 12.0, 19.0, 6.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.4296875, -10.1199951171875, -9.810302734375, -9.5006103515625, -9.19091796875, -8.8812255859375, -8.571533203125, -8.2618408203125, -7.9521484375, -7.6424560546875, -7.332763671875, -7.0230712890625, -6.71337890625, -6.4036865234375, -6.093994140625, -5.7843017578125, -5.474609375, -5.1649169921875, -4.855224609375, -4.5455322265625, -4.23583984375, -3.9261474609375, -3.616455078125, -3.3067626953125, -2.9970703125, -2.6873779296875, -2.377685546875, -2.0679931640625, -1.75830078125, -1.4486083984375, -1.138916015625, -0.8292236328125, -0.51953125, -0.2098388671875, 0.099853515625, 0.4095458984375, 0.71923828125, 1.0289306640625, 1.338623046875, 1.6483154296875, 1.9580078125, 2.2677001953125, 2.577392578125, 2.8870849609375, 3.19677734375, 3.5064697265625, 3.816162109375, 4.1258544921875, 4.435546875, 4.7452392578125, 5.054931640625, 5.3646240234375, 5.67431640625, 5.9840087890625, 6.293701171875, 6.6033935546875, 6.9130859375, 7.2227783203125, 7.532470703125, 7.8421630859375, 8.15185546875, 8.4615478515625, 8.771240234375, 9.0809326171875, 9.390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 7.0, 7.0, 6.0, 1.0, 5.0, 10.0, 8.0, 17.0, 10.0, 13.0, 21.0, 17.0, 20.0, 27.0, 20.0, 30.0, 27.0, 31.0, 34.0, 33.0, 39.0, 86.0, 194.0, 513.0, 312.0, 95.0, 53.0, 34.0, 32.0, 37.0, 43.0, 35.0, 23.0, 25.0, 23.0, 29.0, 17.0, 13.0, 10.0, 10.0, 11.0, 10.0, 12.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-38.78125, -37.48291015625, -36.1845703125, -34.88623046875, -33.587890625, -32.28955078125, -30.9912109375, -29.69287109375, -28.39453125, -27.09619140625, -25.7978515625, -24.49951171875, -23.201171875, -21.90283203125, -20.6044921875, -19.30615234375, -18.0078125, -16.70947265625, -15.4111328125, -14.11279296875, -12.814453125, -11.51611328125, -10.2177734375, -8.91943359375, -7.62109375, -6.32275390625, -5.0244140625, -3.72607421875, -2.427734375, -1.12939453125, 0.1689453125, 1.46728515625, 2.765625, 4.06396484375, 5.3623046875, 6.66064453125, 7.958984375, 9.25732421875, 10.5556640625, 11.85400390625, 13.15234375, 14.45068359375, 15.7490234375, 17.04736328125, 18.345703125, 19.64404296875, 20.9423828125, 22.24072265625, 23.5390625, 24.83740234375, 26.1357421875, 27.43408203125, 28.732421875, 30.03076171875, 31.3291015625, 32.62744140625, 33.92578125, 35.22412109375, 36.5224609375, 37.82080078125, 39.119140625, 40.41748046875, 41.7158203125, 43.01416015625, 44.3125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 7.0, 6.0, 12.0, 11.0, 17.0, 25.0, 40.0, 54.0, 70.0, 102.0, 136.0, 234.0, 283.0, 474.0, 620.0, 912.0, 1301.0, 1977.0, 2969.0, 4372.0, 6650.0, 10072.0, 15180.0, 23323.0, 36299.0, 59569.0, 110446.0, 5058934.0, 688596.0, 106428.0, 57757.0, 36137.0, 23169.0, 14896.0, 9649.0, 6570.0, 4570.0, 3017.0, 1981.0, 1462.0, 954.0, 662.0, 453.0, 326.0, 227.0, 169.0, 84.0, 79.0, 37.0, 34.0, 25.0, 27.0, 10.0, 8.0, 13.0, 9.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-24.84375, -24.04150390625, -23.2392578125, -22.43701171875, -21.634765625, -20.83251953125, -20.0302734375, -19.22802734375, -18.42578125, -17.62353515625, -16.8212890625, -16.01904296875, -15.216796875, -14.41455078125, -13.6123046875, -12.81005859375, -12.0078125, -11.20556640625, -10.4033203125, -9.60107421875, -8.798828125, -7.99658203125, -7.1943359375, -6.39208984375, -5.58984375, -4.78759765625, -3.9853515625, -3.18310546875, -2.380859375, -1.57861328125, -0.7763671875, 0.02587890625, 0.828125, 1.63037109375, 2.4326171875, 3.23486328125, 4.037109375, 4.83935546875, 5.6416015625, 6.44384765625, 7.24609375, 8.04833984375, 8.8505859375, 9.65283203125, 10.455078125, 11.25732421875, 12.0595703125, 12.86181640625, 13.6640625, 14.46630859375, 15.2685546875, 16.07080078125, 16.873046875, 17.67529296875, 18.4775390625, 19.27978515625, 20.08203125, 20.88427734375, 21.6865234375, 22.48876953125, 23.291015625, 24.09326171875, 24.8955078125, 25.69775390625, 26.5]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 7.0, 10.0, 20.0, 14.0, 13.0, 13.0, 17.0, 17.0, 18.0, 32.0, 28.0, 35.0, 45.0, 39.0, 49.0, 54.0, 202.0, 737.0, 201.0, 57.0, 58.0, 37.0, 46.0, 39.0, 26.0, 39.0, 22.0, 28.0, 18.0, 24.0, 15.0, 14.0, 12.0, 6.0, 6.0, 4.0, 9.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-69.3125, -67.1865234375, -65.060546875, -62.9345703125, -60.80859375, -58.6826171875, -56.556640625, -54.4306640625, -52.3046875, -50.1787109375, -48.052734375, -45.9267578125, -43.80078125, -41.6748046875, -39.548828125, -37.4228515625, -35.296875, -33.1708984375, -31.044921875, -28.9189453125, -26.79296875, -24.6669921875, -22.541015625, -20.4150390625, -18.2890625, -16.1630859375, -14.037109375, -11.9111328125, -9.78515625, -7.6591796875, -5.533203125, -3.4072265625, -1.28125, 0.8447265625, 2.970703125, 5.0966796875, 7.22265625, 9.3486328125, 11.474609375, 13.6005859375, 15.7265625, 17.8525390625, 19.978515625, 22.1044921875, 24.23046875, 26.3564453125, 28.482421875, 30.6083984375, 32.734375, 34.8603515625, 36.986328125, 39.1123046875, 41.23828125, 43.3642578125, 45.490234375, 47.6162109375, 49.7421875, 51.8681640625, 53.994140625, 56.1201171875, 58.24609375, 60.3720703125, 62.498046875, 64.6240234375, 66.75]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 8.0, 5.0, 10.0, 19.0, 36.0, 42.0, 122.0, 489.0, 133.0, 58.0, 24.0, 23.0, 9.0, 4.0, 5.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-973.1376953125, -944.1845092773438, -915.2312622070312, -886.278076171875, -857.3248901367188, -828.3717041015625, -799.41845703125, -770.4652709960938, -741.5120849609375, -712.5588989257812, -683.6056518554688, -654.6524658203125, -625.6992797851562, -596.74609375, -567.7928466796875, -538.8396606445312, -509.8864440917969, -480.9332275390625, -451.98004150390625, -423.0268249511719, -394.0736389160156, -365.12042236328125, -336.167236328125, -307.2140197753906, -278.26080322265625, -249.30760192871094, -220.35440063476562, -191.40118408203125, -162.447998046875, -133.49478149414062, -104.54158020019531, -75.58837890625, -46.63519287109375, -17.681989669799805, 11.27121353149414, 40.22441864013672, 69.17761993408203, 98.13082885742188, 127.08403015136719, 156.0372314453125, 184.9904327392578, 213.94363403320312, 242.89683532714844, 271.85003662109375, 300.8032531738281, 329.7564697265625, 358.70965576171875, 387.662841796875, 416.6160583496094, 445.56927490234375, 474.5224609375, 503.4756774902344, 532.4288940429688, 561.382080078125, 590.3352661132812, 619.2884521484375, 648.24169921875, 677.1948852539062, 706.1481323242188, 735.101318359375, 764.0545043945312, 793.0076904296875, 821.9609375, 850.9141235351562, 879.8673095703125]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 7.0, 10.0, 11.0, 17.0, 18.0, 30.0, 50.0, 82.0, 231.0, 263.0, 66.0, 63.0, 31.0, 23.0, 13.0, 9.0, 5.0, 10.0, 10.0, 5.0, 6.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-990.4898681640625, -958.5414428710938, -926.593017578125, -894.64453125, -862.6961059570312, -830.7476806640625, -798.7992553710938, -766.850830078125, -734.90234375, -702.9539184570312, -671.0054931640625, -639.0570068359375, -607.1085815429688, -575.16015625, -543.2117309570312, -511.2633056640625, -479.31488037109375, -447.366455078125, -415.4179992675781, -383.4695739746094, -351.5211181640625, -319.57269287109375, -287.624267578125, -255.6758270263672, -223.72738647460938, -191.77894592285156, -159.83050537109375, -127.882080078125, -95.93363952636719, -63.985198974609375, -32.036773681640625, -0.0883331298828125, 31.860107421875, 63.80854415893555, 95.7569808959961, 127.70541381835938, 159.6538543701172, 191.602294921875, 223.55072021484375, 255.49916076660156, 287.4476013183594, 319.3960266113281, 351.344482421875, 383.29290771484375, 415.2413330078125, 447.1897888183594, 479.1382141113281, 511.086669921875, 543.0350952148438, 574.9835205078125, 606.9319458007812, 638.88037109375, 670.828857421875, 702.7772827148438, 734.7257080078125, 766.6741333007812, 798.62255859375, 830.5709838867188, 862.5194091796875, 894.4678955078125, 926.4163208007812, 958.36474609375, 990.3131713867188, 1022.2615966796875, 1054.2100830078125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 13.0, 9.0, 30.0, 29.0, 52.0, 76.0, 120.0, 179.0, 266.0, 336.0, 579.0, 978.0, 1482.0, 2341.0, 3889.0, 6932.0, 13450.0, 27790.0, 69558.0, 355910.0, 3479609.0, 126428.0, 48347.0, 23413.0, 12720.0, 7195.0, 4493.0, 2645.0, 1795.0, 1130.0, 743.0, 561.0, 362.0, 220.0, 169.0, 147.0, 77.0, 57.0, 33.0, 28.0, 32.0, 17.0, 13.0, 10.0, 6.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.44140625, -4.28955078125, -4.1376953125, -3.98583984375, -3.833984375, -3.68212890625, -3.5302734375, -3.37841796875, -3.2265625, -3.07470703125, -2.9228515625, -2.77099609375, -2.619140625, -2.46728515625, -2.3154296875, -2.16357421875, -2.01171875, -1.85986328125, -1.7080078125, -1.55615234375, -1.404296875, -1.25244140625, -1.1005859375, -0.94873046875, -0.796875, -0.64501953125, -0.4931640625, -0.34130859375, -0.189453125, -0.03759765625, 0.1142578125, 0.26611328125, 0.41796875, 0.56982421875, 0.7216796875, 0.87353515625, 1.025390625, 1.17724609375, 1.3291015625, 1.48095703125, 1.6328125, 1.78466796875, 1.9365234375, 2.08837890625, 2.240234375, 2.39208984375, 2.5439453125, 2.69580078125, 2.84765625, 2.99951171875, 3.1513671875, 3.30322265625, 3.455078125, 3.60693359375, 3.7587890625, 3.91064453125, 4.0625, 4.21435546875, 4.3662109375, 4.51806640625, 4.669921875, 4.82177734375, 4.9736328125, 5.12548828125, 5.27734375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 3.0, 5.0, 3.0, 5.0, 9.0, 10.0, 9.0, 10.0, 23.0, 23.0, 44.0, 656.0, 73.0, 25.0, 13.0, 14.0, 9.0, 5.0, 8.0, 8.0, 6.0, 3.0, 1.0, 5.0, 5.0, 6.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.40234375, -1.351898193359375, -1.30145263671875, -1.251007080078125, -1.2005615234375, -1.150115966796875, -1.09967041015625, -1.049224853515625, -0.998779296875, -0.948333740234375, -0.89788818359375, -0.847442626953125, -0.7969970703125, -0.746551513671875, -0.69610595703125, -0.645660400390625, -0.59521484375, -0.544769287109375, -0.49432373046875, -0.443878173828125, -0.3934326171875, -0.342987060546875, -0.29254150390625, -0.242095947265625, -0.191650390625, -0.141204833984375, -0.09075927734375, -0.040313720703125, 0.0101318359375, 0.060577392578125, 0.11102294921875, 0.161468505859375, 0.2119140625, 0.262359619140625, 0.31280517578125, 0.363250732421875, 0.4136962890625, 0.464141845703125, 0.51458740234375, 0.565032958984375, 0.615478515625, 0.665924072265625, 0.71636962890625, 0.766815185546875, 0.8172607421875, 0.867706298828125, 0.91815185546875, 0.968597412109375, 1.01904296875, 1.069488525390625, 1.11993408203125, 1.170379638671875, 1.2208251953125, 1.271270751953125, 1.32171630859375, 1.372161865234375, 1.422607421875, 1.473052978515625, 1.52349853515625, 1.573944091796875, 1.6243896484375, 1.674835205078125, 1.72528076171875, 1.775726318359375, 1.826171875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 18.0, 24.0, 39.0, 50.0, 61.0, 101.0, 101.0, 184.0, 318.0, 449.0, 776.0, 1450.0, 2611.0, 5263.0, 11767.0, 28612.0, 79701.0, 266181.0, 1261261.0, 1972261.0, 385226.0, 108581.0, 38550.0, 15617.0, 7137.0, 3511.0, 1796.0, 952.0, 586.0, 362.0, 230.0, 155.0, 109.0, 64.0, 52.0, 37.0, 28.0, 12.0, 14.0, 7.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.744140625, -3.627655029296875, -3.51116943359375, -3.394683837890625, -3.2781982421875, -3.161712646484375, -3.04522705078125, -2.928741455078125, -2.812255859375, -2.695770263671875, -2.57928466796875, -2.462799072265625, -2.3463134765625, -2.229827880859375, -2.11334228515625, -1.996856689453125, -1.88037109375, -1.763885498046875, -1.64739990234375, -1.530914306640625, -1.4144287109375, -1.297943115234375, -1.18145751953125, -1.064971923828125, -0.948486328125, -0.832000732421875, -0.71551513671875, -0.599029541015625, -0.4825439453125, -0.366058349609375, -0.24957275390625, -0.133087158203125, -0.0166015625, 0.099884033203125, 0.21636962890625, 0.332855224609375, 0.4493408203125, 0.565826416015625, 0.68231201171875, 0.798797607421875, 0.915283203125, 1.031768798828125, 1.14825439453125, 1.264739990234375, 1.3812255859375, 1.497711181640625, 1.61419677734375, 1.730682373046875, 1.84716796875, 1.963653564453125, 2.08013916015625, 2.196624755859375, 2.3131103515625, 2.429595947265625, 2.54608154296875, 2.662567138671875, 2.779052734375, 2.895538330078125, 3.01202392578125, 3.128509521484375, 3.2449951171875, 3.361480712890625, 3.47796630859375, 3.594451904296875, 3.7109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 3.0, 5.0, 9.0, 7.0, 14.0, 10.0, 25.0, 24.0, 30.0, 37.0, 48.0, 56.0, 77.0, 83.0, 103.0, 151.0, 195.0, 264.0, 350.0, 460.0, 573.0, 360.0, 279.0, 187.0, 168.0, 108.0, 79.0, 74.0, 45.0, 36.0, 36.0, 24.0, 36.0, 30.0, 15.0, 17.0, 13.0, 9.0, 9.0, 5.0, 3.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.326171875, -1.2774658203125, -1.228759765625, -1.1800537109375, -1.13134765625, -1.0826416015625, -1.033935546875, -0.9852294921875, -0.9365234375, -0.8878173828125, -0.839111328125, -0.7904052734375, -0.74169921875, -0.6929931640625, -0.644287109375, -0.5955810546875, -0.546875, -0.4981689453125, -0.449462890625, -0.4007568359375, -0.35205078125, -0.3033447265625, -0.254638671875, -0.2059326171875, -0.1572265625, -0.1085205078125, -0.059814453125, -0.0111083984375, 0.03759765625, 0.0863037109375, 0.135009765625, 0.1837158203125, 0.232421875, 0.2811279296875, 0.329833984375, 0.3785400390625, 0.42724609375, 0.4759521484375, 0.524658203125, 0.5733642578125, 0.6220703125, 0.6707763671875, 0.719482421875, 0.7681884765625, 0.81689453125, 0.8656005859375, 0.914306640625, 0.9630126953125, 1.01171875, 1.0604248046875, 1.109130859375, 1.1578369140625, 1.20654296875, 1.2552490234375, 1.303955078125, 1.3526611328125, 1.4013671875, 1.4500732421875, 1.498779296875, 1.5474853515625, 1.59619140625, 1.6448974609375, 1.693603515625, 1.7423095703125, 1.791015625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 7.0, 9.0, 16.0, 40.0, 65.0, 111.0, 181.0, 211.0, 150.0, 106.0, 45.0, 23.0, 12.0, 9.0, 4.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.602636337280273, -23.034021377563477, -22.46540641784668, -21.896791458129883, -21.328176498413086, -20.75956153869629, -20.190946578979492, -19.622333526611328, -19.05371856689453, -18.485103607177734, -17.916488647460938, -17.34787368774414, -16.779258728027344, -16.210643768310547, -15.642029762268066, -15.07341480255127, -14.504798889160156, -13.93618392944336, -13.367568969726562, -12.798954010009766, -12.230339050292969, -11.661724090576172, -11.093110084533691, -10.524495124816895, -9.955880165100098, -9.3872652053833, -8.818650245666504, -8.250035285949707, -7.681420803070068, -7.1128058433532715, -6.544191360473633, -5.975576400756836, -5.4069623947143555, -4.838347434997559, -4.269732475280762, -3.701117992401123, -3.132503032684326, -2.5638880729675293, -1.9952733516693115, -1.4266586303710938, -0.8580436706542969, -0.28942883014678955, 0.2791860103607178, 0.8478008508682251, 1.4164156913757324, 1.9850306510925293, 2.553645372390747, 3.122260093688965, 3.6908750534057617, 4.259490013122559, 4.8281049728393555, 5.396719455718994, 5.965334415435791, 6.533949375152588, 7.102563858032227, 7.671178817749023, 8.23979377746582, 8.808408737182617, 9.377023696899414, 9.945638656616211, 10.514253616333008, 11.082868576049805, 11.651482582092285, 12.220097541809082, 12.788712501525879]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 3.0, 6.0, 12.0, 12.0, 15.0, 17.0, 23.0, 20.0, 28.0, 33.0, 34.0, 50.0, 43.0, 49.0, 45.0, 49.0, 52.0, 58.0, 51.0, 51.0, 53.0, 55.0, 26.0, 35.0, 41.0, 30.0, 22.0, 16.0, 10.0, 19.0, 10.0, 6.0, 5.0, 4.0, 4.0, 1.0, 6.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4104642868042, -9.095338821411133, -8.78021240234375, -8.465086936950684, -8.1499605178833, -7.834834575653076, -7.519708633422852, -7.204583168029785, -6.889456748962402, -6.574330806732178, -6.259204864501953, -5.9440789222717285, -5.628952980041504, -5.313827037811279, -4.998701095581055, -4.683575630187988, -4.368449687957764, -4.053323745727539, -3.7381978034973145, -3.42307186126709, -3.1079459190368652, -2.7928199768066406, -2.477694272994995, -2.1625683307647705, -1.847442388534546, -1.5323164463043213, -1.2171905040740967, -0.9020646810531616, -0.586938738822937, -0.2718127965927124, 0.043313026428222656, 0.35843896865844727, 0.6735649108886719, 0.9886908531188965, 1.303816795349121, 1.6189426183700562, 1.9340685606002808, 2.249194622039795, 2.5643203258514404, 2.879446268081665, 3.1945722103118896, 3.5096981525421143, 3.824824094772339, 4.139949798583984, 4.455075740814209, 4.770201683044434, 5.085327625274658, 5.400453567504883, 5.715579509735107, 6.030705451965332, 6.345831394195557, 6.660957336425781, 6.976083278656006, 7.2912092208862305, 7.606334686279297, 7.92146110534668, 8.236586570739746, 8.551712036132812, 8.866838455200195, 9.181963920593262, 9.497090339660645, 9.812215805053711, 10.127342224121094, 10.44246768951416, 10.757594108581543]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 6.0, 9.0, 15.0, 22.0, 36.0, 31.0, 56.0, 58.0, 100.0, 148.0, 171.0, 309.0, 421.0, 591.0, 960.0, 1423.0, 2303.0, 3656.0, 5781.0, 10277.0, 18446.0, 39971.0, 410275.0, 465898.0, 41551.0, 18900.0, 10369.0, 6204.0, 3797.0, 2302.0, 1427.0, 976.0, 650.0, 436.0, 298.0, 184.0, 143.0, 118.0, 57.0, 55.0, 34.0, 23.0, 24.0, 20.0, 9.0, 9.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.6796875, -4.5379638671875, -4.396240234375, -4.2545166015625, -4.11279296875, -3.9710693359375, -3.829345703125, -3.6876220703125, -3.5458984375, -3.4041748046875, -3.262451171875, -3.1207275390625, -2.97900390625, -2.8372802734375, -2.695556640625, -2.5538330078125, -2.412109375, -2.2703857421875, -2.128662109375, -1.9869384765625, -1.84521484375, -1.7034912109375, -1.561767578125, -1.4200439453125, -1.2783203125, -1.1365966796875, -0.994873046875, -0.8531494140625, -0.71142578125, -0.5697021484375, -0.427978515625, -0.2862548828125, -0.14453125, -0.0028076171875, 0.138916015625, 0.2806396484375, 0.42236328125, 0.5640869140625, 0.705810546875, 0.8475341796875, 0.9892578125, 1.1309814453125, 1.272705078125, 1.4144287109375, 1.55615234375, 1.6978759765625, 1.839599609375, 1.9813232421875, 2.123046875, 2.2647705078125, 2.406494140625, 2.5482177734375, 2.68994140625, 2.8316650390625, 2.973388671875, 3.1151123046875, 3.2568359375, 3.3985595703125, 3.540283203125, 3.6820068359375, 3.82373046875, 3.9654541015625, 4.107177734375, 4.2489013671875, 4.390625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 2.0, 4.0, 7.0, 1.0, 3.0, 7.0, 8.0, 9.0, 14.0, 27.0, 50.0, 160.0, 328.0, 204.0, 55.0, 24.0, 14.0, 12.0, 14.0, 6.0, 7.0, 5.0, 4.0, 6.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5087890625, -1.458251953125, -1.40771484375, -1.357177734375, -1.306640625, -1.256103515625, -1.20556640625, -1.155029296875, -1.1044921875, -1.053955078125, -1.00341796875, -0.952880859375, -0.90234375, -0.851806640625, -0.80126953125, -0.750732421875, -0.7001953125, -0.649658203125, -0.59912109375, -0.548583984375, -0.498046875, -0.447509765625, -0.39697265625, -0.346435546875, -0.2958984375, -0.245361328125, -0.19482421875, -0.144287109375, -0.09375, -0.043212890625, 0.00732421875, 0.057861328125, 0.1083984375, 0.158935546875, 0.20947265625, 0.260009765625, 0.310546875, 0.361083984375, 0.41162109375, 0.462158203125, 0.5126953125, 0.563232421875, 0.61376953125, 0.664306640625, 0.71484375, 0.765380859375, 0.81591796875, 0.866455078125, 0.9169921875, 0.967529296875, 1.01806640625, 1.068603515625, 1.119140625, 1.169677734375, 1.22021484375, 1.270751953125, 1.3212890625, 1.371826171875, 1.42236328125, 1.472900390625, 1.5234375, 1.573974609375, 1.62451171875, 1.675048828125, 1.7255859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 8.0, 12.0, 11.0, 26.0, 29.0, 39.0, 87.0, 143.0, 379.0, 1302.0, 6247.0, 38724.0, 391215.0, 544776.0, 54972.0, 7896.0, 1773.0, 504.0, 182.0, 70.0, 49.0, 32.0, 19.0, 17.0, 8.0, 9.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-11.6640625, -11.288818359375, -10.91357421875, -10.538330078125, -10.1630859375, -9.787841796875, -9.41259765625, -9.037353515625, -8.662109375, -8.286865234375, -7.91162109375, -7.536376953125, -7.1611328125, -6.785888671875, -6.41064453125, -6.035400390625, -5.66015625, -5.284912109375, -4.90966796875, -4.534423828125, -4.1591796875, -3.783935546875, -3.40869140625, -3.033447265625, -2.658203125, -2.282958984375, -1.90771484375, -1.532470703125, -1.1572265625, -0.781982421875, -0.40673828125, -0.031494140625, 0.34375, 0.718994140625, 1.09423828125, 1.469482421875, 1.8447265625, 2.219970703125, 2.59521484375, 2.970458984375, 3.345703125, 3.720947265625, 4.09619140625, 4.471435546875, 4.8466796875, 5.221923828125, 5.59716796875, 5.972412109375, 6.34765625, 6.722900390625, 7.09814453125, 7.473388671875, 7.8486328125, 8.223876953125, 8.59912109375, 8.974365234375, 9.349609375, 9.724853515625, 10.10009765625, 10.475341796875, 10.8505859375, 11.225830078125, 11.60107421875, 11.976318359375, 12.3515625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 2.0, 9.0, 7.0, 5.0, 9.0, 19.0, 16.0, 22.0, 25.0, 29.0, 30.0, 26.0, 30.0, 36.0, 43.0, 37.0, 52.0, 37.0, 45.0, 48.0, 41.0, 46.0, 31.0, 48.0, 36.0, 36.0, 30.0, 26.0, 25.0, 32.0, 21.0, 18.0, 19.0, 14.0, 10.0, 11.0, 6.0, 3.0, 5.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-7.21875, -7.01922607421875, -6.8197021484375, -6.62017822265625, -6.420654296875, -6.22113037109375, -6.0216064453125, -5.82208251953125, -5.62255859375, -5.42303466796875, -5.2235107421875, -5.02398681640625, -4.824462890625, -4.62493896484375, -4.4254150390625, -4.22589111328125, -4.0263671875, -3.82684326171875, -3.6273193359375, -3.42779541015625, -3.228271484375, -3.02874755859375, -2.8292236328125, -2.62969970703125, -2.43017578125, -2.23065185546875, -2.0311279296875, -1.83160400390625, -1.632080078125, -1.43255615234375, -1.2330322265625, -1.03350830078125, -0.833984375, -0.63446044921875, -0.4349365234375, -0.23541259765625, -0.035888671875, 0.16363525390625, 0.3631591796875, 0.56268310546875, 0.76220703125, 0.96173095703125, 1.1612548828125, 1.36077880859375, 1.560302734375, 1.75982666015625, 1.9593505859375, 2.15887451171875, 2.3583984375, 2.55792236328125, 2.7574462890625, 2.95697021484375, 3.156494140625, 3.35601806640625, 3.5555419921875, 3.75506591796875, 3.95458984375, 4.15411376953125, 4.3536376953125, 4.55316162109375, 4.752685546875, 4.95220947265625, 5.1517333984375, 5.35125732421875, 5.55078125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 6.0, 10.0, 10.0, 15.0, 19.0, 33.0, 40.0, 78.0, 133.0, 253.0, 545.0, 1582.0, 7334.0, 255132.0, 769470.0, 10494.0, 2047.0, 697.0, 269.0, 144.0, 78.0, 51.0, 33.0, 22.0, 19.0, 10.0, 15.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3984375, -13.8858642578125, -13.373291015625, -12.8607177734375, -12.34814453125, -11.8355712890625, -11.322998046875, -10.8104248046875, -10.2978515625, -9.7852783203125, -9.272705078125, -8.7601318359375, -8.24755859375, -7.7349853515625, -7.222412109375, -6.7098388671875, -6.197265625, -5.6846923828125, -5.172119140625, -4.6595458984375, -4.14697265625, -3.6343994140625, -3.121826171875, -2.6092529296875, -2.0966796875, -1.5841064453125, -1.071533203125, -0.5589599609375, -0.04638671875, 0.4661865234375, 0.978759765625, 1.4913330078125, 2.00390625, 2.5164794921875, 3.029052734375, 3.5416259765625, 4.05419921875, 4.5667724609375, 5.079345703125, 5.5919189453125, 6.1044921875, 6.6170654296875, 7.129638671875, 7.6422119140625, 8.15478515625, 8.6673583984375, 9.179931640625, 9.6925048828125, 10.205078125, 10.7176513671875, 11.230224609375, 11.7427978515625, 12.25537109375, 12.7679443359375, 13.280517578125, 13.7930908203125, 14.3056640625, 14.8182373046875, 15.330810546875, 15.8433837890625, 16.35595703125, 16.8685302734375, 17.381103515625, 17.8936767578125, 18.40625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 9.0, 6.0, 5.0, 5.0, 8.0, 17.0, 23.0, 21.0, 30.0, 45.0, 50.0, 58.0, 65.0, 93.0, 58.0, 90.0, 93.0, 73.0, 57.0, 43.0, 32.0, 27.0, 26.0, 18.0, 12.0, 11.0, 7.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00022339820861816406, -0.00021733343601226807, -0.00021126866340637207, -0.00020520389080047607, -0.00019913911819458008, -0.00019307434558868408, -0.00018700957298278809, -0.0001809448003768921, -0.0001748800277709961, -0.0001688152551651001, -0.0001627504825592041, -0.0001566857099533081, -0.0001506209373474121, -0.0001445561647415161, -0.00013849139213562012, -0.00013242661952972412, -0.00012636184692382812, -0.00012029707431793213, -0.00011423230171203613, -0.00010816752910614014, -0.00010210275650024414, -9.603798389434814e-05, -8.997321128845215e-05, -8.390843868255615e-05, -7.784366607666016e-05, -7.177889347076416e-05, -6.571412086486816e-05, -5.964934825897217e-05, -5.358457565307617e-05, -4.7519803047180176e-05, -4.145503044128418e-05, -3.5390257835388184e-05, -2.9325485229492188e-05, -2.326071262359619e-05, -1.7195940017700195e-05, -1.11311674118042e-05, -5.066394805908203e-06, 9.98377799987793e-07, 7.063150405883789e-06, 1.3127923011779785e-05, 1.919269561767578e-05, 2.5257468223571777e-05, 3.1322240829467773e-05, 3.738701343536377e-05, 4.3451786041259766e-05, 4.951655864715576e-05, 5.558133125305176e-05, 6.164610385894775e-05, 6.771087646484375e-05, 7.377564907073975e-05, 7.984042167663574e-05, 8.590519428253174e-05, 9.196996688842773e-05, 9.803473949432373e-05, 0.00010409951210021973, 0.00011016428470611572, 0.00011622905731201172, 0.00012229382991790771, 0.0001283586025238037, 0.0001344233751296997, 0.0001404881477355957, 0.0001465529203414917, 0.0001526176929473877, 0.0001586824655532837, 0.0001647472381591797]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 8.0, 20.0, 20.0, 23.0, 41.0, 47.0, 78.0, 98.0, 166.0, 267.0, 408.0, 690.0, 1239.0, 2408.0, 5085.0, 12348.0, 39309.0, 193371.0, 593964.0, 146467.0, 32322.0, 10891.0, 4429.0, 2107.0, 1115.0, 633.0, 335.0, 206.0, 148.0, 99.0, 62.0, 46.0, 26.0, 21.0, 16.0, 10.0, 12.0, 10.0, 0.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.03009033203125, -3.8883056640625, -3.74652099609375, -3.604736328125, -3.46295166015625, -3.3211669921875, -3.17938232421875, -3.03759765625, -2.89581298828125, -2.7540283203125, -2.61224365234375, -2.470458984375, -2.32867431640625, -2.1868896484375, -2.04510498046875, -1.9033203125, -1.76153564453125, -1.6197509765625, -1.47796630859375, -1.336181640625, -1.19439697265625, -1.0526123046875, -0.91082763671875, -0.76904296875, -0.62725830078125, -0.4854736328125, -0.34368896484375, -0.201904296875, -0.06011962890625, 0.0816650390625, 0.22344970703125, 0.365234375, 0.50701904296875, 0.6488037109375, 0.79058837890625, 0.932373046875, 1.07415771484375, 1.2159423828125, 1.35772705078125, 1.49951171875, 1.64129638671875, 1.7830810546875, 1.92486572265625, 2.066650390625, 2.20843505859375, 2.3502197265625, 2.49200439453125, 2.6337890625, 2.77557373046875, 2.9173583984375, 3.05914306640625, 3.200927734375, 3.34271240234375, 3.4844970703125, 3.62628173828125, 3.76806640625, 3.90985107421875, 4.0516357421875, 4.19342041015625, 4.335205078125, 4.47698974609375, 4.6187744140625, 4.76055908203125, 4.90234375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 6.0, 2.0, 7.0, 7.0, 13.0, 28.0, 16.0, 43.0, 40.0, 47.0, 73.0, 98.0, 75.0, 66.0, 92.0, 75.0, 73.0, 59.0, 45.0, 25.0, 27.0, 22.0, 13.0, 10.0, 6.0, 7.0, 7.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.76171875, -5.6019287109375, -5.442138671875, -5.2823486328125, -5.12255859375, -4.9627685546875, -4.802978515625, -4.6431884765625, -4.4833984375, -4.3236083984375, -4.163818359375, -4.0040283203125, -3.84423828125, -3.6844482421875, -3.524658203125, -3.3648681640625, -3.205078125, -3.0452880859375, -2.885498046875, -2.7257080078125, -2.56591796875, -2.4061279296875, -2.246337890625, -2.0865478515625, -1.9267578125, -1.7669677734375, -1.607177734375, -1.4473876953125, -1.28759765625, -1.1278076171875, -0.968017578125, -0.8082275390625, -0.6484375, -0.4886474609375, -0.328857421875, -0.1690673828125, -0.00927734375, 0.1505126953125, 0.310302734375, 0.4700927734375, 0.6298828125, 0.7896728515625, 0.949462890625, 1.1092529296875, 1.26904296875, 1.4288330078125, 1.588623046875, 1.7484130859375, 1.908203125, 2.0679931640625, 2.227783203125, 2.3875732421875, 2.54736328125, 2.7071533203125, 2.866943359375, 3.0267333984375, 3.1865234375, 3.3463134765625, 3.506103515625, 3.6658935546875, 3.82568359375, 3.9854736328125, 4.145263671875, 4.3050537109375, 4.46484375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 4.0, 8.0, 8.0, 17.0, 35.0, 73.0, 105.0, 216.0, 251.0, 140.0, 55.0, 32.0, 17.0, 8.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-83.91691589355469, -81.30899810791016, -78.70108032226562, -76.0931625366211, -73.48524475097656, -70.87732696533203, -68.2694091796875, -65.66148376464844, -63.05356979370117, -60.44565200805664, -57.83773422241211, -55.22981643676758, -52.62189483642578, -50.01397705078125, -47.40605926513672, -44.79814147949219, -42.190223693847656, -39.582305908203125, -36.974388122558594, -34.36647033691406, -31.7585506439209, -29.150632858276367, -26.542713165283203, -23.934795379638672, -21.32687759399414, -18.71895980834961, -16.111042022705078, -13.503122329711914, -10.895204544067383, -8.287286758422852, -5.679368019104004, -3.0714492797851562, -0.463531494140625, 2.1443867683410645, 4.752305030822754, 7.360223293304443, 9.968141555786133, 12.576059341430664, 15.183978080749512, 17.79189682006836, 20.39981460571289, 23.007732391357422, 25.615650177001953, 28.223569869995117, 30.83148765563965, 33.43940734863281, 36.047325134277344, 38.655242919921875, 41.263160705566406, 43.87107849121094, 46.47899627685547, 49.0869140625, 51.69483184814453, 54.30274963378906, 56.91067123413086, 59.51858901977539, 62.12650680541992, 64.73442840576172, 67.34234619140625, 69.95026397705078, 72.55818176269531, 75.16609954833984, 77.77401733398438, 80.3819351196289, 82.98985290527344]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 6.0, 6.0, 9.0, 7.0, 7.0, 11.0, 33.0, 69.0, 110.0, 180.0, 171.0, 132.0, 93.0, 46.0, 37.0, 17.0, 10.0, 8.0, 7.0, 5.0, 7.0, 3.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-161.29098510742188, -157.19085693359375, -153.09072875976562, -148.99058532714844, -144.8904571533203, -140.7903289794922, -136.69020080566406, -132.59005737304688, -128.48992919921875, -124.38980102539062, -120.28966522216797, -116.18953704833984, -112.08940124511719, -107.98927307128906, -103.88914489746094, -99.78900909423828, -95.68888092041016, -91.58875274658203, -87.48861694335938, -83.38848876953125, -79.2883529663086, -75.18822479248047, -71.08808898925781, -66.98796081542969, -62.8878288269043, -58.787696838378906, -54.687564849853516, -50.587432861328125, -46.4873046875, -42.387168884277344, -38.28704071044922, -34.18690872192383, -30.086776733398438, -25.986644744873047, -21.886512756347656, -17.7863826751709, -13.686250686645508, -9.586118698120117, -5.485988616943359, -1.3858566284179688, 2.714275360107422, 6.814406871795654, 10.914538383483887, 15.014669418334961, 19.11480140686035, 23.214933395385742, 27.3150634765625, 31.41519546508789, 35.51532745361328, 39.61545944213867, 43.71559143066406, 47.81571960449219, 51.915855407714844, 56.01598358154297, 60.11611557006836, 64.21624755859375, 68.31637573242188, 72.41650390625, 76.51663970947266, 80.61676788330078, 84.71690368652344, 88.81703186035156, 92.91716003417969, 97.01729583740234, 101.117431640625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 14.0, 17.0, 19.0, 34.0, 35.0, 55.0, 66.0, 121.0, 211.0, 326.0, 567.0, 1065.0, 2156.0, 5061.0, 15492.0, 78502.0, 3841301.0, 206277.0, 26945.0, 8507.0, 3570.0, 1697.0, 888.0, 521.0, 270.0, 192.0, 95.0, 72.0, 48.0, 38.0, 31.0, 17.0, 13.0, 6.0, 13.0, 5.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.984375, -20.379150390625, -19.77392578125, -19.168701171875, -18.5634765625, -17.958251953125, -17.35302734375, -16.747802734375, -16.142578125, -15.537353515625, -14.93212890625, -14.326904296875, -13.7216796875, -13.116455078125, -12.51123046875, -11.906005859375, -11.30078125, -10.695556640625, -10.09033203125, -9.485107421875, -8.8798828125, -8.274658203125, -7.66943359375, -7.064208984375, -6.458984375, -5.853759765625, -5.24853515625, -4.643310546875, -4.0380859375, -3.432861328125, -2.82763671875, -2.222412109375, -1.6171875, -1.011962890625, -0.40673828125, 0.198486328125, 0.8037109375, 1.408935546875, 2.01416015625, 2.619384765625, 3.224609375, 3.829833984375, 4.43505859375, 5.040283203125, 5.6455078125, 6.250732421875, 6.85595703125, 7.461181640625, 8.06640625, 8.671630859375, 9.27685546875, 9.882080078125, 10.4873046875, 11.092529296875, 11.69775390625, 12.302978515625, 12.908203125, 13.513427734375, 14.11865234375, 14.723876953125, 15.3291015625, 15.934326171875, 16.53955078125, 17.144775390625, 17.75]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 6.0, 4.0, 4.0, 5.0, 6.0, 12.0, 14.0, 15.0, 15.0, 32.0, 58.0, 154.0, 209.0, 157.0, 112.0, 56.0, 44.0, 16.0, 9.0, 10.0, 12.0, 8.0, 11.0, 5.0, 3.0, 8.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.7060546875, -1.660064697265625, -1.61407470703125, -1.568084716796875, -1.5220947265625, -1.476104736328125, -1.43011474609375, -1.384124755859375, -1.338134765625, -1.292144775390625, -1.24615478515625, -1.200164794921875, -1.1541748046875, -1.108184814453125, -1.06219482421875, -1.016204833984375, -0.97021484375, -0.924224853515625, -0.87823486328125, -0.832244873046875, -0.7862548828125, -0.740264892578125, -0.69427490234375, -0.648284912109375, -0.602294921875, -0.556304931640625, -0.51031494140625, -0.464324951171875, -0.4183349609375, -0.372344970703125, -0.32635498046875, -0.280364990234375, -0.234375, -0.188385009765625, -0.14239501953125, -0.096405029296875, -0.0504150390625, -0.004425048828125, 0.04156494140625, 0.087554931640625, 0.133544921875, 0.179534912109375, 0.22552490234375, 0.271514892578125, 0.3175048828125, 0.363494873046875, 0.40948486328125, 0.455474853515625, 0.50146484375, 0.547454833984375, 0.59344482421875, 0.639434814453125, 0.6854248046875, 0.731414794921875, 0.77740478515625, 0.823394775390625, 0.869384765625, 0.915374755859375, 0.96136474609375, 1.007354736328125, 1.0533447265625, 1.099334716796875, 1.14532470703125, 1.191314697265625, 1.2373046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 5.0, 21.0, 21.0, 22.0, 29.0, 56.0, 97.0, 98.0, 166.0, 300.0, 445.0, 700.0, 1216.0, 2175.0, 4348.0, 9663.0, 24559.0, 77554.0, 398960.0, 3105888.0, 441558.0, 81715.0, 25364.0, 9693.0, 4451.0, 2239.0, 1210.0, 655.0, 385.0, 223.0, 145.0, 104.0, 73.0, 36.0, 30.0, 26.0, 14.0, 8.0, 10.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0], "bins": [-10.1015625, -9.83935546875, -9.5771484375, -9.31494140625, -9.052734375, -8.79052734375, -8.5283203125, -8.26611328125, -8.00390625, -7.74169921875, -7.4794921875, -7.21728515625, -6.955078125, -6.69287109375, -6.4306640625, -6.16845703125, -5.90625, -5.64404296875, -5.3818359375, -5.11962890625, -4.857421875, -4.59521484375, -4.3330078125, -4.07080078125, -3.80859375, -3.54638671875, -3.2841796875, -3.02197265625, -2.759765625, -2.49755859375, -2.2353515625, -1.97314453125, -1.7109375, -1.44873046875, -1.1865234375, -0.92431640625, -0.662109375, -0.39990234375, -0.1376953125, 0.12451171875, 0.38671875, 0.64892578125, 0.9111328125, 1.17333984375, 1.435546875, 1.69775390625, 1.9599609375, 2.22216796875, 2.484375, 2.74658203125, 3.0087890625, 3.27099609375, 3.533203125, 3.79541015625, 4.0576171875, 4.31982421875, 4.58203125, 4.84423828125, 5.1064453125, 5.36865234375, 5.630859375, 5.89306640625, 6.1552734375, 6.41748046875, 6.6796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 6.0, 5.0, 7.0, 7.0, 4.0, 18.0, 24.0, 33.0, 54.0, 71.0, 116.0, 198.0, 413.0, 995.0, 1229.0, 402.0, 191.0, 106.0, 60.0, 42.0, 18.0, 28.0, 15.0, 7.0, 4.0, 3.0, 8.0, 3.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.671875, -2.603515625, -2.53515625, -2.466796875, -2.3984375, -2.330078125, -2.26171875, -2.193359375, -2.125, -2.056640625, -1.98828125, -1.919921875, -1.8515625, -1.783203125, -1.71484375, -1.646484375, -1.578125, -1.509765625, -1.44140625, -1.373046875, -1.3046875, -1.236328125, -1.16796875, -1.099609375, -1.03125, -0.962890625, -0.89453125, -0.826171875, -0.7578125, -0.689453125, -0.62109375, -0.552734375, -0.484375, -0.416015625, -0.34765625, -0.279296875, -0.2109375, -0.142578125, -0.07421875, -0.005859375, 0.0625, 0.130859375, 0.19921875, 0.267578125, 0.3359375, 0.404296875, 0.47265625, 0.541015625, 0.609375, 0.677734375, 0.74609375, 0.814453125, 0.8828125, 0.951171875, 1.01953125, 1.087890625, 1.15625, 1.224609375, 1.29296875, 1.361328125, 1.4296875, 1.498046875, 1.56640625, 1.634765625, 1.703125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 9.0, 20.0, 29.0, 54.0, 118.0, 228.0, 253.0, 174.0, 62.0, 27.0, 9.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.096309661865234, -29.46102523803711, -28.825742721557617, -28.190458297729492, -27.555173873901367, -26.919889450073242, -26.28460693359375, -25.649322509765625, -25.0140380859375, -24.378753662109375, -23.743471145629883, -23.108186721801758, -22.472902297973633, -21.837617874145508, -21.202335357666016, -20.56705093383789, -19.931766510009766, -19.29648208618164, -18.66119956970215, -18.025915145874023, -17.3906307220459, -16.755346298217773, -16.12006378173828, -15.484779357910156, -14.849496841430664, -14.214213371276855, -13.57892894744873, -12.943645477294922, -12.308361053466797, -11.673077583312988, -11.03779411315918, -10.402509689331055, -9.767226219177246, -9.131942749023438, -8.496658325195312, -7.861374855041504, -7.226090431213379, -6.59080696105957, -5.9555230140686035, -5.320239067077637, -4.68495512008667, -4.049671173095703, -3.4143872261047363, -2.7791035175323486, -2.143819570541382, -1.508535623550415, -0.8732519149780273, -0.23796796798706055, 0.39731597900390625, 1.032599925994873, 1.6678837537765503, 2.3031675815582275, 2.9384515285491943, 3.573735475540161, 4.209019184112549, 4.844303131103516, 5.479587078094482, 6.114871025085449, 6.750154972076416, 7.385438919067383, 8.020722389221191, 8.656006813049316, 9.291290283203125, 9.92657470703125, 10.561858177185059]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 3.0, 9.0, 15.0, 10.0, 21.0, 25.0, 41.0, 43.0, 57.0, 67.0, 84.0, 82.0, 106.0, 82.0, 71.0, 65.0, 51.0, 38.0, 39.0, 21.0, 14.0, 8.0, 14.0, 9.0, 4.0, 5.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.332693099975586, -9.962347030639648, -9.592000007629395, -9.221653938293457, -8.851306915283203, -8.480960845947266, -8.110613822937012, -7.740267753601074, -7.36992073059082, -6.999574184417725, -6.629227638244629, -6.258881092071533, -5.8885345458984375, -5.518187999725342, -5.147841453552246, -4.777495384216309, -4.407148838043213, -4.036802291870117, -3.6664557456970215, -3.296109199523926, -2.92576265335083, -2.5554161071777344, -2.1850697994232178, -1.814723253250122, -1.4443767070770264, -1.0740301609039307, -0.7036836743354797, -0.3333371877670288, 0.037009358406066895, 0.4073559045791626, 0.7777023315429688, 1.1480488777160645, 1.5183954238891602, 1.8887419700622559, 2.2590885162353516, 2.6294350624084473, 2.999781608581543, 3.3701281547546387, 3.7404744625091553, 4.110820770263672, 4.481167793273926, 4.8515143394470215, 5.221860885620117, 5.592207431793213, 5.962553977966309, 6.332900524139404, 6.7032470703125, 7.0735931396484375, 7.443939685821533, 7.814286231994629, 8.184632301330566, 8.55497932434082, 8.925325393676758, 9.295672416687012, 9.66601848602295, 10.036365509033203, 10.40671157836914, 10.777057647705078, 11.147404670715332, 11.51775074005127, 11.888097763061523, 12.258443832397461, 12.628790855407715, 12.999136924743652, 13.369483947753906]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 8.0, 11.0, 16.0, 31.0, 50.0, 110.0, 176.0, 387.0, 1032.0, 3137.0, 15404.0, 220528.0, 766906.0, 32970.0, 5289.0, 1460.0, 531.0, 220.0, 113.0, 70.0, 47.0, 20.0, 12.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.765625, -22.07958984375, -21.3935546875, -20.70751953125, -20.021484375, -19.33544921875, -18.6494140625, -17.96337890625, -17.27734375, -16.59130859375, -15.9052734375, -15.21923828125, -14.533203125, -13.84716796875, -13.1611328125, -12.47509765625, -11.7890625, -11.10302734375, -10.4169921875, -9.73095703125, -9.044921875, -8.35888671875, -7.6728515625, -6.98681640625, -6.30078125, -5.61474609375, -4.9287109375, -4.24267578125, -3.556640625, -2.87060546875, -2.1845703125, -1.49853515625, -0.8125, -0.12646484375, 0.5595703125, 1.24560546875, 1.931640625, 2.61767578125, 3.3037109375, 3.98974609375, 4.67578125, 5.36181640625, 6.0478515625, 6.73388671875, 7.419921875, 8.10595703125, 8.7919921875, 9.47802734375, 10.1640625, 10.85009765625, 11.5361328125, 12.22216796875, 12.908203125, 13.59423828125, 14.2802734375, 14.96630859375, 15.65234375, 16.33837890625, 17.0244140625, 17.71044921875, 18.396484375, 19.08251953125, 19.7685546875, 20.45458984375, 21.140625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 8.0, 6.0, 10.0, 12.0, 10.0, 13.0, 22.0, 43.0, 87.0, 125.0, 154.0, 171.0, 122.0, 73.0, 50.0, 28.0, 16.0, 15.0, 11.0, 8.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3896484375, -1.3437347412109375, -1.297821044921875, -1.2519073486328125, -1.20599365234375, -1.1600799560546875, -1.114166259765625, -1.0682525634765625, -1.0223388671875, -0.9764251708984375, -0.930511474609375, -0.8845977783203125, -0.83868408203125, -0.7927703857421875, -0.746856689453125, -0.7009429931640625, -0.655029296875, -0.6091156005859375, -0.563201904296875, -0.5172882080078125, -0.47137451171875, -0.4254608154296875, -0.379547119140625, -0.3336334228515625, -0.2877197265625, -0.2418060302734375, -0.195892333984375, -0.1499786376953125, -0.10406494140625, -0.0581512451171875, -0.012237548828125, 0.0336761474609375, 0.07958984375, 0.1255035400390625, 0.171417236328125, 0.2173309326171875, 0.26324462890625, 0.3091583251953125, 0.355072021484375, 0.4009857177734375, 0.4468994140625, 0.4928131103515625, 0.538726806640625, 0.5846405029296875, 0.63055419921875, 0.6764678955078125, 0.722381591796875, 0.7682952880859375, 0.814208984375, 0.8601226806640625, 0.906036376953125, 0.9519500732421875, 0.99786376953125, 1.0437774658203125, 1.089691162109375, 1.1356048583984375, 1.1815185546875, 1.2274322509765625, 1.273345947265625, 1.3192596435546875, 1.36517333984375, 1.4110870361328125, 1.457000732421875, 1.5029144287109375, 1.548828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 7.0, 4.0, 8.0, 13.0, 33.0, 107.0, 531.0, 3834.0, 62807.0, 866760.0, 108090.0, 5394.0, 711.0, 146.0, 41.0, 13.0, 10.0, 8.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.953125, -18.371337890625, -17.78955078125, -17.207763671875, -16.6259765625, -16.044189453125, -15.46240234375, -14.880615234375, -14.298828125, -13.717041015625, -13.13525390625, -12.553466796875, -11.9716796875, -11.389892578125, -10.80810546875, -10.226318359375, -9.64453125, -9.062744140625, -8.48095703125, -7.899169921875, -7.3173828125, -6.735595703125, -6.15380859375, -5.572021484375, -4.990234375, -4.408447265625, -3.82666015625, -3.244873046875, -2.6630859375, -2.081298828125, -1.49951171875, -0.917724609375, -0.3359375, 0.245849609375, 0.82763671875, 1.409423828125, 1.9912109375, 2.572998046875, 3.15478515625, 3.736572265625, 4.318359375, 4.900146484375, 5.48193359375, 6.063720703125, 6.6455078125, 7.227294921875, 7.80908203125, 8.390869140625, 8.97265625, 9.554443359375, 10.13623046875, 10.718017578125, 11.2998046875, 11.881591796875, 12.46337890625, 13.045166015625, 13.626953125, 14.208740234375, 14.79052734375, 15.372314453125, 15.9541015625, 16.535888671875, 17.11767578125, 17.699462890625, 18.28125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 10.0, 10.0, 13.0, 11.0, 15.0, 21.0, 14.0, 28.0, 36.0, 28.0, 33.0, 30.0, 47.0, 41.0, 46.0, 56.0, 56.0, 51.0, 56.0, 50.0, 52.0, 48.0, 46.0, 33.0, 33.0, 25.0, 21.0, 21.0, 18.0, 14.0, 6.0, 5.0, 3.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -3.97772216796875, -3.8343505859375, -3.69097900390625, -3.547607421875, -3.40423583984375, -3.2608642578125, -3.11749267578125, -2.97412109375, -2.83074951171875, -2.6873779296875, -2.54400634765625, -2.400634765625, -2.25726318359375, -2.1138916015625, -1.97052001953125, -1.8271484375, -1.68377685546875, -1.5404052734375, -1.39703369140625, -1.253662109375, -1.11029052734375, -0.9669189453125, -0.82354736328125, -0.68017578125, -0.53680419921875, -0.3934326171875, -0.25006103515625, -0.106689453125, 0.03668212890625, 0.1800537109375, 0.32342529296875, 0.466796875, 0.61016845703125, 0.7535400390625, 0.89691162109375, 1.040283203125, 1.18365478515625, 1.3270263671875, 1.47039794921875, 1.61376953125, 1.75714111328125, 1.9005126953125, 2.04388427734375, 2.187255859375, 2.33062744140625, 2.4739990234375, 2.61737060546875, 2.7607421875, 2.90411376953125, 3.0474853515625, 3.19085693359375, 3.334228515625, 3.47760009765625, 3.6209716796875, 3.76434326171875, 3.90771484375, 4.05108642578125, 4.1944580078125, 4.33782958984375, 4.481201171875, 4.62457275390625, 4.7679443359375, 4.91131591796875, 5.0546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 11.0, 15.0, 30.0, 76.0, 185.0, 733.0, 4037.0, 155385.0, 878791.0, 7775.0, 1009.0, 265.0, 116.0, 47.0, 27.0, 15.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.25, -30.79296875, -29.3359375, -27.87890625, -26.421875, -24.96484375, -23.5078125, -22.05078125, -20.59375, -19.13671875, -17.6796875, -16.22265625, -14.765625, -13.30859375, -11.8515625, -10.39453125, -8.9375, -7.48046875, -6.0234375, -4.56640625, -3.109375, -1.65234375, -0.1953125, 1.26171875, 2.71875, 4.17578125, 5.6328125, 7.08984375, 8.546875, 10.00390625, 11.4609375, 12.91796875, 14.375, 15.83203125, 17.2890625, 18.74609375, 20.203125, 21.66015625, 23.1171875, 24.57421875, 26.03125, 27.48828125, 28.9453125, 30.40234375, 31.859375, 33.31640625, 34.7734375, 36.23046875, 37.6875, 39.14453125, 40.6015625, 42.05859375, 43.515625, 44.97265625, 46.4296875, 47.88671875, 49.34375, 50.80078125, 52.2578125, 53.71484375, 55.171875, 56.62890625, 58.0859375, 59.54296875, 61.0]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 2.0, 0.0, 7.0, 7.0, 1.0, 8.0, 14.0, 17.0, 29.0, 49.0, 79.0, 143.0, 241.0, 173.0, 87.0, 60.0, 27.0, 18.0, 13.0, 9.0, 6.0, 7.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012063980102539062, -0.0011773556470870972, -0.001148313283920288, -0.001119270920753479, -0.00109022855758667, -0.0010611861944198608, -0.0010321438312530518, -0.0010031014680862427, -0.0009740591049194336, -0.0009450167417526245, -0.0009159743785858154, -0.0008869320154190063, -0.0008578896522521973, -0.0008288472890853882, -0.0007998049259185791, -0.00077076256275177, -0.0007417201995849609, -0.0007126778364181519, -0.0006836354732513428, -0.0006545931100845337, -0.0006255507469177246, -0.0005965083837509155, -0.0005674660205841064, -0.0005384236574172974, -0.0005093812942504883, -0.0004803389310836792, -0.0004512965679168701, -0.00042225420475006104, -0.00039321184158325195, -0.00036416947841644287, -0.0003351271152496338, -0.0003060847520828247, -0.0002770423889160156, -0.00024800002574920654, -0.00021895766258239746, -0.00018991529941558838, -0.0001608729362487793, -0.00013183057308197021, -0.00010278820991516113, -7.374584674835205e-05, -4.470348358154297e-05, -1.5661120414733887e-05, 1.3381242752075195e-05, 4.242360591888428e-05, 7.146596908569336e-05, 0.00010050833225250244, 0.00012955069541931152, 0.0001585930585861206, 0.0001876354217529297, 0.00021667778491973877, 0.00024572014808654785, 0.00027476251125335693, 0.000303804874420166, 0.0003328472375869751, 0.0003618896007537842, 0.00039093196392059326, 0.00041997432708740234, 0.0004490166902542114, 0.0004780590534210205, 0.0005071014165878296, 0.0005361437797546387, 0.0005651861429214478, 0.0005942285060882568, 0.0006232708692550659, 0.000652313232421875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 8.0, 5.0, 7.0, 18.0, 27.0, 45.0, 68.0, 130.0, 164.0, 272.0, 403.0, 686.0, 1204.0, 2242.0, 4320.0, 9727.0, 27851.0, 127414.0, 617365.0, 196164.0, 36843.0, 12159.0, 5148.0, 2682.0, 1410.0, 808.0, 493.0, 337.0, 197.0, 112.0, 75.0, 52.0, 40.0, 22.0, 22.0, 11.0, 3.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.203125, -9.88037109375, -9.5576171875, -9.23486328125, -8.912109375, -8.58935546875, -8.2666015625, -7.94384765625, -7.62109375, -7.29833984375, -6.9755859375, -6.65283203125, -6.330078125, -6.00732421875, -5.6845703125, -5.36181640625, -5.0390625, -4.71630859375, -4.3935546875, -4.07080078125, -3.748046875, -3.42529296875, -3.1025390625, -2.77978515625, -2.45703125, -2.13427734375, -1.8115234375, -1.48876953125, -1.166015625, -0.84326171875, -0.5205078125, -0.19775390625, 0.125, 0.44775390625, 0.7705078125, 1.09326171875, 1.416015625, 1.73876953125, 2.0615234375, 2.38427734375, 2.70703125, 3.02978515625, 3.3525390625, 3.67529296875, 3.998046875, 4.32080078125, 4.6435546875, 4.96630859375, 5.2890625, 5.61181640625, 5.9345703125, 6.25732421875, 6.580078125, 6.90283203125, 7.2255859375, 7.54833984375, 7.87109375, 8.19384765625, 8.5166015625, 8.83935546875, 9.162109375, 9.48486328125, 9.8076171875, 10.13037109375, 10.453125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 8.0, 6.0, 12.0, 19.0, 38.0, 73.0, 87.0, 136.0, 151.0, 156.0, 97.0, 72.0, 53.0, 24.0, 12.0, 10.0, 8.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.859375, -10.505859375, -10.15234375, -9.798828125, -9.4453125, -9.091796875, -8.73828125, -8.384765625, -8.03125, -7.677734375, -7.32421875, -6.970703125, -6.6171875, -6.263671875, -5.91015625, -5.556640625, -5.203125, -4.849609375, -4.49609375, -4.142578125, -3.7890625, -3.435546875, -3.08203125, -2.728515625, -2.375, -2.021484375, -1.66796875, -1.314453125, -0.9609375, -0.607421875, -0.25390625, 0.099609375, 0.453125, 0.806640625, 1.16015625, 1.513671875, 1.8671875, 2.220703125, 2.57421875, 2.927734375, 3.28125, 3.634765625, 3.98828125, 4.341796875, 4.6953125, 5.048828125, 5.40234375, 5.755859375, 6.109375, 6.462890625, 6.81640625, 7.169921875, 7.5234375, 7.876953125, 8.23046875, 8.583984375, 8.9375, 9.291015625, 9.64453125, 9.998046875, 10.3515625, 10.705078125, 11.05859375, 11.412109375, 11.765625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 18.0, 60.0, 166.0, 346.0, 254.0, 91.0, 37.0, 13.0, 3.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.65475463867188, -130.00514221191406, -126.35552215576172, -122.7059097290039, -119.05628967285156, -115.40667724609375, -111.75706481933594, -108.1074447631836, -104.45782470703125, -100.80821228027344, -97.1585922241211, -93.50897979736328, -89.85935974121094, -86.20974731445312, -82.56013488769531, -78.91051483154297, -75.26090240478516, -71.61128997802734, -67.961669921875, -64.31205749511719, -60.662437438964844, -57.01282501220703, -53.36320877075195, -49.713592529296875, -46.0639762878418, -42.41436004638672, -38.76474380493164, -35.11512756347656, -31.465513229370117, -27.81589698791504, -24.166282653808594, -20.516666412353516, -16.867050170898438, -13.21743392944336, -9.567818641662598, -5.918203353881836, -2.268587112426758, 1.3810291290283203, 5.030643463134766, 8.680259704589844, 12.329875946044922, 15.9794921875, 19.629108428955078, 23.278722763061523, 26.9283390045166, 30.57795524597168, 34.227569580078125, 37.8771858215332, 41.52680206298828, 45.17641830444336, 48.82603454589844, 52.47564697265625, 56.125267028808594, 59.774879455566406, 63.424495697021484, 67.07411193847656, 70.72372436523438, 74.37333679199219, 78.02295684814453, 81.67256927490234, 85.32218933105469, 88.9718017578125, 92.62141418457031, 96.27103424072266, 99.920654296875]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 1.0, 6.0, 3.0, 8.0, 7.0, 19.0, 20.0, 23.0, 45.0, 57.0, 36.0, 64.0, 93.0, 82.0, 91.0, 82.0, 73.0, 61.0, 64.0, 41.0, 39.0, 23.0, 22.0, 11.0, 9.0, 6.0, 9.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-66.91558074951172, -65.18614196777344, -63.456703186035156, -61.727264404296875, -59.997825622558594, -58.26838684082031, -56.53894805908203, -54.80950927734375, -53.08007049560547, -51.35063171386719, -49.621192932128906, -47.891754150390625, -46.162315368652344, -44.43287658691406, -42.70343780517578, -40.9739990234375, -39.24456024169922, -37.51512145996094, -35.785682678222656, -34.056243896484375, -32.326805114746094, -30.597366333007812, -28.86792755126953, -27.13848876953125, -25.409046173095703, -23.679607391357422, -21.95016860961914, -20.22072982788086, -18.491291046142578, -16.761852264404297, -15.0324125289917, -13.302973747253418, -11.573535919189453, -9.844097137451172, -8.11465835571289, -6.385219097137451, -4.65578031539917, -2.9263410568237305, -1.1969022750854492, 0.532536506652832, 2.2619752883911133, 3.9914140701293945, 5.720852851867676, 7.450292110443115, 9.179731369018555, 10.909170150756836, 12.638608932495117, 14.368047714233398, 16.09748649597168, 17.82692527770996, 19.556364059448242, 21.285802841186523, 23.015241622924805, 24.74468231201172, 26.47412109375, 28.20355987548828, 29.932998657226562, 31.662437438964844, 33.391876220703125, 35.121315002441406, 36.85075378417969, 38.58019256591797, 40.30963134765625, 42.03907012939453, 43.76850891113281]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 11.0, 12.0, 15.0, 18.0, 21.0, 37.0, 37.0, 63.0, 87.0, 131.0, 216.0, 432.0, 753.0, 1428.0, 3189.0, 8415.0, 32362.0, 420418.0, 3619435.0, 80148.0, 15984.0, 5430.0, 2398.0, 1249.0, 661.0, 405.0, 245.0, 172.0, 121.0, 81.0, 57.0, 64.0, 44.0, 23.0, 22.0, 21.0, 19.0, 14.0, 5.0, 10.0, 7.0, 4.0, 5.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.734375, -20.025146484375, -19.31591796875, -18.606689453125, -17.8974609375, -17.188232421875, -16.47900390625, -15.769775390625, -15.060546875, -14.351318359375, -13.64208984375, -12.932861328125, -12.2236328125, -11.514404296875, -10.80517578125, -10.095947265625, -9.38671875, -8.677490234375, -7.96826171875, -7.259033203125, -6.5498046875, -5.840576171875, -5.13134765625, -4.422119140625, -3.712890625, -3.003662109375, -2.29443359375, -1.585205078125, -0.8759765625, -0.166748046875, 0.54248046875, 1.251708984375, 1.9609375, 2.670166015625, 3.37939453125, 4.088623046875, 4.7978515625, 5.507080078125, 6.21630859375, 6.925537109375, 7.634765625, 8.343994140625, 9.05322265625, 9.762451171875, 10.4716796875, 11.180908203125, 11.89013671875, 12.599365234375, 13.30859375, 14.017822265625, 14.72705078125, 15.436279296875, 16.1455078125, 16.854736328125, 17.56396484375, 18.273193359375, 18.982421875, 19.691650390625, 20.40087890625, 21.110107421875, 21.8193359375, 22.528564453125, 23.23779296875, 23.947021484375, 24.65625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 1.0, 6.0, 14.0, 16.0, 17.0, 23.0, 37.0, 48.0, 72.0, 125.0, 115.0, 121.0, 106.0, 91.0, 56.0, 59.0, 29.0, 17.0, 11.0, 10.0, 11.0, 4.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.24609375, -1.2022857666015625, -1.158477783203125, -1.1146697998046875, -1.07086181640625, -1.0270538330078125, -0.983245849609375, -0.9394378662109375, -0.8956298828125, -0.8518218994140625, -0.808013916015625, -0.7642059326171875, -0.72039794921875, -0.6765899658203125, -0.632781982421875, -0.5889739990234375, -0.545166015625, -0.5013580322265625, -0.457550048828125, -0.4137420654296875, -0.36993408203125, -0.3261260986328125, -0.282318115234375, -0.2385101318359375, -0.1947021484375, -0.1508941650390625, -0.107086181640625, -0.0632781982421875, -0.01947021484375, 0.0243377685546875, 0.068145751953125, 0.1119537353515625, 0.15576171875, 0.1995697021484375, 0.243377685546875, 0.2871856689453125, 0.33099365234375, 0.3748016357421875, 0.418609619140625, 0.4624176025390625, 0.5062255859375, 0.5500335693359375, 0.593841552734375, 0.6376495361328125, 0.68145751953125, 0.7252655029296875, 0.769073486328125, 0.8128814697265625, 0.856689453125, 0.9004974365234375, 0.944305419921875, 0.9881134033203125, 1.03192138671875, 1.0757293701171875, 1.119537353515625, 1.1633453369140625, 1.2071533203125, 1.2509613037109375, 1.294769287109375, 1.3385772705078125, 1.38238525390625, 1.4261932373046875, 1.470001220703125, 1.5138092041015625, 1.5576171875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 6.0, 8.0, 14.0, 13.0, 12.0, 24.0, 29.0, 66.0, 83.0, 175.0, 558.0, 7848.0, 4049973.0, 132920.0, 1924.0, 307.0, 135.0, 72.0, 38.0, 15.0, 20.0, 10.0, 11.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.34375, -49.49462890625, -47.6455078125, -45.79638671875, -43.947265625, -42.09814453125, -40.2490234375, -38.39990234375, -36.55078125, -34.70166015625, -32.8525390625, -31.00341796875, -29.154296875, -27.30517578125, -25.4560546875, -23.60693359375, -21.7578125, -19.90869140625, -18.0595703125, -16.21044921875, -14.361328125, -12.51220703125, -10.6630859375, -8.81396484375, -6.96484375, -5.11572265625, -3.2666015625, -1.41748046875, 0.431640625, 2.28076171875, 4.1298828125, 5.97900390625, 7.828125, 9.67724609375, 11.5263671875, 13.37548828125, 15.224609375, 17.07373046875, 18.9228515625, 20.77197265625, 22.62109375, 24.47021484375, 26.3193359375, 28.16845703125, 30.017578125, 31.86669921875, 33.7158203125, 35.56494140625, 37.4140625, 39.26318359375, 41.1123046875, 42.96142578125, 44.810546875, 46.65966796875, 48.5087890625, 50.35791015625, 52.20703125, 54.05615234375, 55.9052734375, 57.75439453125, 59.603515625, 61.45263671875, 63.3017578125, 65.15087890625, 67.0]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 3.0, 2.0, 5.0, 6.0, 12.0, 15.0, 12.0, 26.0, 37.0, 66.0, 106.0, 187.0, 349.0, 866.0, 1206.0, 534.0, 233.0, 132.0, 87.0, 63.0, 37.0, 24.0, 14.0, 17.0, 15.0, 4.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.327728271484375, -2.24530029296875, -2.162872314453125, -2.0804443359375, -1.998016357421875, -1.91558837890625, -1.833160400390625, -1.750732421875, -1.668304443359375, -1.58587646484375, -1.503448486328125, -1.4210205078125, -1.338592529296875, -1.25616455078125, -1.173736572265625, -1.09130859375, -1.008880615234375, -0.92645263671875, -0.844024658203125, -0.7615966796875, -0.679168701171875, -0.59674072265625, -0.514312744140625, -0.431884765625, -0.349456787109375, -0.26702880859375, -0.184600830078125, -0.1021728515625, -0.019744873046875, 0.06268310546875, 0.145111083984375, 0.2275390625, 0.309967041015625, 0.39239501953125, 0.474822998046875, 0.5572509765625, 0.639678955078125, 0.72210693359375, 0.804534912109375, 0.886962890625, 0.969390869140625, 1.05181884765625, 1.134246826171875, 1.2166748046875, 1.299102783203125, 1.38153076171875, 1.463958740234375, 1.54638671875, 1.628814697265625, 1.71124267578125, 1.793670654296875, 1.8760986328125, 1.958526611328125, 2.04095458984375, 2.123382568359375, 2.205810546875, 2.288238525390625, 2.37066650390625, 2.453094482421875, 2.5355224609375, 2.617950439453125, 2.70037841796875, 2.782806396484375, 2.865234375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 12.0, 29.0, 113.0, 236.0, 295.0, 188.0, 76.0, 32.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.84351348876953, -23.994565963745117, -23.145618438720703, -22.29667091369629, -21.447723388671875, -20.598773956298828, -19.749828338623047, -18.90087890625, -18.051931381225586, -17.202983856201172, -16.354036331176758, -15.505088806152344, -14.656140327453613, -13.8071928024292, -12.958245277404785, -12.109296798706055, -11.260350227355957, -10.411402702331543, -9.562455177307129, -8.713506698608398, -7.864559173583984, -7.01561164855957, -6.166664123535156, -5.317716121673584, -4.46876859664917, -3.6198208332061768, -2.7708730697631836, -1.9219255447387695, -1.0729777812957764, -0.2240300178527832, 0.6249175071716309, 1.4738655090332031, 2.322813034057617, 3.1717607975006104, 4.0207085609436035, 4.869656085968018, 5.71860408782959, 6.567551612854004, 7.416499137878418, 8.265447616577148, 9.114395141601562, 9.963342666625977, 10.81229019165039, 11.661237716674805, 12.510186195373535, 13.35913372039795, 14.208081245422363, 15.057029724121094, 15.905976295471191, 16.754924774169922, 17.603872299194336, 18.45281982421875, 19.301767349243164, 20.150714874267578, 20.999662399291992, 21.848609924316406, 22.69755744934082, 23.546504974365234, 24.39545249938965, 25.244400024414062, 26.093347549438477, 26.94229507446289, 27.791244506835938, 28.64019203186035, 29.489139556884766]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 0.0, 3.0, 3.0, 2.0, 5.0, 8.0, 13.0, 15.0, 18.0, 20.0, 22.0, 37.0, 30.0, 60.0, 51.0, 50.0, 51.0, 74.0, 79.0, 74.0, 76.0, 63.0, 59.0, 43.0, 32.0, 27.0, 21.0, 23.0, 14.0, 9.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.948840141296387, -9.580921173095703, -9.21300220489502, -8.845083236694336, -8.477164268493652, -8.109245300292969, -7.741326332092285, -7.373407363891602, -7.005488395690918, -6.637569427490234, -6.269650459289551, -5.901731491088867, -5.533812522888184, -5.1658935546875, -4.797974586486816, -4.430055618286133, -4.062136650085449, -3.6942176818847656, -3.326298713684082, -2.9583797454833984, -2.590460777282715, -2.2225418090820312, -1.8546228408813477, -1.486703872680664, -1.1187849044799805, -0.7508659362792969, -0.3829469680786133, -0.015027999877929688, 0.3528909683227539, 0.7208099365234375, 1.088728904724121, 1.4566478729248047, 1.8245658874511719, 2.1924848556518555, 2.560403823852539, 2.9283227920532227, 3.2962417602539062, 3.66416072845459, 4.032079696655273, 4.399998664855957, 4.767917633056641, 5.135836601257324, 5.503755569458008, 5.871674537658691, 6.239593505859375, 6.607512474060059, 6.975431442260742, 7.343350410461426, 7.711269378662109, 8.079188346862793, 8.447107315063477, 8.81502628326416, 9.182945251464844, 9.550864219665527, 9.918783187866211, 10.286702156066895, 10.654621124267578, 11.022540092468262, 11.390459060668945, 11.758378028869629, 12.126296997070312, 12.494215965270996, 12.86213493347168, 13.230053901672363, 13.597972869873047]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 2.0, 6.0, 5.0, 11.0, 8.0, 6.0, 10.0, 12.0, 26.0, 19.0, 30.0, 33.0, 53.0, 66.0, 109.0, 191.0, 334.0, 669.0, 1509.0, 4855.0, 24701.0, 241548.0, 652006.0, 103899.0, 12809.0, 3157.0, 1170.0, 487.0, 270.0, 156.0, 106.0, 60.0, 43.0, 37.0, 35.0, 22.0, 24.0, 13.0, 12.0, 11.0, 6.0, 6.0, 2.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.078125, -13.642578125, -13.20703125, -12.771484375, -12.3359375, -11.900390625, -11.46484375, -11.029296875, -10.59375, -10.158203125, -9.72265625, -9.287109375, -8.8515625, -8.416015625, -7.98046875, -7.544921875, -7.109375, -6.673828125, -6.23828125, -5.802734375, -5.3671875, -4.931640625, -4.49609375, -4.060546875, -3.625, -3.189453125, -2.75390625, -2.318359375, -1.8828125, -1.447265625, -1.01171875, -0.576171875, -0.140625, 0.294921875, 0.73046875, 1.166015625, 1.6015625, 2.037109375, 2.47265625, 2.908203125, 3.34375, 3.779296875, 4.21484375, 4.650390625, 5.0859375, 5.521484375, 5.95703125, 6.392578125, 6.828125, 7.263671875, 7.69921875, 8.134765625, 8.5703125, 9.005859375, 9.44140625, 9.876953125, 10.3125, 10.748046875, 11.18359375, 11.619140625, 12.0546875, 12.490234375, 12.92578125, 13.361328125, 13.796875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 17.0, 28.0, 37.0, 93.0, 108.0, 146.0, 168.0, 140.0, 103.0, 71.0, 38.0, 25.0, 11.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4296875, -2.3681640625, -2.306640625, -2.2451171875, -2.18359375, -2.1220703125, -2.060546875, -1.9990234375, -1.9375, -1.8759765625, -1.814453125, -1.7529296875, -1.69140625, -1.6298828125, -1.568359375, -1.5068359375, -1.4453125, -1.3837890625, -1.322265625, -1.2607421875, -1.19921875, -1.1376953125, -1.076171875, -1.0146484375, -0.953125, -0.8916015625, -0.830078125, -0.7685546875, -0.70703125, -0.6455078125, -0.583984375, -0.5224609375, -0.4609375, -0.3994140625, -0.337890625, -0.2763671875, -0.21484375, -0.1533203125, -0.091796875, -0.0302734375, 0.03125, 0.0927734375, 0.154296875, 0.2158203125, 0.27734375, 0.3388671875, 0.400390625, 0.4619140625, 0.5234375, 0.5849609375, 0.646484375, 0.7080078125, 0.76953125, 0.8310546875, 0.892578125, 0.9541015625, 1.015625, 1.0771484375, 1.138671875, 1.2001953125, 1.26171875, 1.3232421875, 1.384765625, 1.4462890625, 1.5078125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 11.0, 9.0, 17.0, 23.0, 19.0, 28.0, 37.0, 48.0, 72.0, 117.0, 145.0, 198.0, 314.0, 411.0, 669.0, 1048.0, 1906.0, 3445.0, 6630.0, 14205.0, 32300.0, 74746.0, 165110.0, 276588.0, 243224.0, 125076.0, 54878.0, 24028.0, 10801.0, 5299.0, 2756.0, 1609.0, 926.0, 558.0, 377.0, 262.0, 194.0, 133.0, 118.0, 70.0, 36.0, 39.0, 20.0, 10.0, 13.0, 7.0, 8.0, 8.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.78125, -5.59954833984375, -5.4178466796875, -5.23614501953125, -5.054443359375, -4.87274169921875, -4.6910400390625, -4.50933837890625, -4.32763671875, -4.14593505859375, -3.9642333984375, -3.78253173828125, -3.600830078125, -3.41912841796875, -3.2374267578125, -3.05572509765625, -2.8740234375, -2.69232177734375, -2.5106201171875, -2.32891845703125, -2.147216796875, -1.96551513671875, -1.7838134765625, -1.60211181640625, -1.42041015625, -1.23870849609375, -1.0570068359375, -0.87530517578125, -0.693603515625, -0.51190185546875, -0.3302001953125, -0.14849853515625, 0.033203125, 0.21490478515625, 0.3966064453125, 0.57830810546875, 0.760009765625, 0.94171142578125, 1.1234130859375, 1.30511474609375, 1.48681640625, 1.66851806640625, 1.8502197265625, 2.03192138671875, 2.213623046875, 2.39532470703125, 2.5770263671875, 2.75872802734375, 2.9404296875, 3.12213134765625, 3.3038330078125, 3.48553466796875, 3.667236328125, 3.84893798828125, 4.0306396484375, 4.21234130859375, 4.39404296875, 4.57574462890625, 4.7574462890625, 4.93914794921875, 5.120849609375, 5.30255126953125, 5.4842529296875, 5.66595458984375, 5.84765625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 11.0, 8.0, 9.0, 10.0, 12.0, 16.0, 15.0, 21.0, 27.0, 36.0, 39.0, 29.0, 48.0, 36.0, 44.0, 38.0, 37.0, 29.0, 53.0, 48.0, 37.0, 44.0, 45.0, 44.0, 32.0, 29.0, 23.0, 31.0, 24.0, 23.0, 17.0, 14.0, 10.0, 14.0, 12.0, 8.0, 9.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66796875, -4.50732421875, -4.3466796875, -4.18603515625, -4.025390625, -3.86474609375, -3.7041015625, -3.54345703125, -3.3828125, -3.22216796875, -3.0615234375, -2.90087890625, -2.740234375, -2.57958984375, -2.4189453125, -2.25830078125, -2.09765625, -1.93701171875, -1.7763671875, -1.61572265625, -1.455078125, -1.29443359375, -1.1337890625, -0.97314453125, -0.8125, -0.65185546875, -0.4912109375, -0.33056640625, -0.169921875, -0.00927734375, 0.1513671875, 0.31201171875, 0.47265625, 0.63330078125, 0.7939453125, 0.95458984375, 1.115234375, 1.27587890625, 1.4365234375, 1.59716796875, 1.7578125, 1.91845703125, 2.0791015625, 2.23974609375, 2.400390625, 2.56103515625, 2.7216796875, 2.88232421875, 3.04296875, 3.20361328125, 3.3642578125, 3.52490234375, 3.685546875, 3.84619140625, 4.0068359375, 4.16748046875, 4.328125, 4.48876953125, 4.6494140625, 4.81005859375, 4.970703125, 5.13134765625, 5.2919921875, 5.45263671875, 5.61328125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 15.0, 12.0, 24.0, 51.0, 59.0, 92.0, 150.0, 314.0, 571.0, 1093.0, 2366.0, 5590.0, 15140.0, 49947.0, 199039.0, 472469.0, 219869.0, 54501.0, 16211.0, 5950.0, 2563.0, 1181.0, 573.0, 323.0, 170.0, 110.0, 61.0, 33.0, 24.0, 13.0, 6.0, 5.0, 6.0, 8.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.109375, -8.85302734375, -8.5966796875, -8.34033203125, -8.083984375, -7.82763671875, -7.5712890625, -7.31494140625, -7.05859375, -6.80224609375, -6.5458984375, -6.28955078125, -6.033203125, -5.77685546875, -5.5205078125, -5.26416015625, -5.0078125, -4.75146484375, -4.4951171875, -4.23876953125, -3.982421875, -3.72607421875, -3.4697265625, -3.21337890625, -2.95703125, -2.70068359375, -2.4443359375, -2.18798828125, -1.931640625, -1.67529296875, -1.4189453125, -1.16259765625, -0.90625, -0.64990234375, -0.3935546875, -0.13720703125, 0.119140625, 0.37548828125, 0.6318359375, 0.88818359375, 1.14453125, 1.40087890625, 1.6572265625, 1.91357421875, 2.169921875, 2.42626953125, 2.6826171875, 2.93896484375, 3.1953125, 3.45166015625, 3.7080078125, 3.96435546875, 4.220703125, 4.47705078125, 4.7333984375, 4.98974609375, 5.24609375, 5.50244140625, 5.7587890625, 6.01513671875, 6.271484375, 6.52783203125, 6.7841796875, 7.04052734375, 7.296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 6.0, 5.0, 8.0, 15.0, 27.0, 32.0, 26.0, 31.0, 45.0, 57.0, 73.0, 73.0, 102.0, 87.0, 90.0, 62.0, 53.0, 41.0, 28.0, 31.0, 29.0, 10.0, 12.0, 10.0, 11.0, 5.0, 8.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0008268356323242188, -0.0007970333099365234, -0.0007672309875488281, -0.0007374286651611328, -0.0007076263427734375, -0.0006778240203857422, -0.0006480216979980469, -0.0006182193756103516, -0.0005884170532226562, -0.0005586147308349609, -0.0005288124084472656, -0.0004990100860595703, -0.000469207763671875, -0.0004394054412841797, -0.0004096031188964844, -0.00037980079650878906, -0.00034999847412109375, -0.00032019615173339844, -0.0002903938293457031, -0.0002605915069580078, -0.0002307891845703125, -0.0002009868621826172, -0.00017118453979492188, -0.00014138221740722656, -0.00011157989501953125, -8.177757263183594e-05, -5.1975250244140625e-05, -2.2172927856445312e-05, 7.62939453125e-06, 3.743171691894531e-05, 6.723403930664062e-05, 9.703636169433594e-05, 0.00012683868408203125, 0.00015664100646972656, 0.00018644332885742188, 0.0002162456512451172, 0.0002460479736328125, 0.0002758502960205078, 0.0003056526184082031, 0.00033545494079589844, 0.00036525726318359375, 0.00039505958557128906, 0.0004248619079589844, 0.0004546642303466797, 0.000484466552734375, 0.0005142688751220703, 0.0005440711975097656, 0.0005738735198974609, 0.0006036758422851562, 0.0006334781646728516, 0.0006632804870605469, 0.0006930828094482422, 0.0007228851318359375, 0.0007526874542236328, 0.0007824897766113281, 0.0008122920989990234, 0.0008420944213867188, 0.0008718967437744141, 0.0009016990661621094, 0.0009315013885498047, 0.0009613037109375, 0.0009911060333251953, 0.0010209083557128906, 0.001050710678100586, 0.0010805130004882812]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 9.0, 9.0, 11.0, 26.0, 23.0, 38.0, 62.0, 78.0, 145.0, 267.0, 512.0, 1005.0, 2257.0, 5951.0, 21560.0, 129201.0, 648739.0, 196573.0, 29294.0, 7616.0, 2704.0, 1174.0, 547.0, 302.0, 169.0, 96.0, 66.0, 46.0, 17.0, 19.0, 16.0, 6.0, 4.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2421875, -13.83056640625, -13.4189453125, -13.00732421875, -12.595703125, -12.18408203125, -11.7724609375, -11.36083984375, -10.94921875, -10.53759765625, -10.1259765625, -9.71435546875, -9.302734375, -8.89111328125, -8.4794921875, -8.06787109375, -7.65625, -7.24462890625, -6.8330078125, -6.42138671875, -6.009765625, -5.59814453125, -5.1865234375, -4.77490234375, -4.36328125, -3.95166015625, -3.5400390625, -3.12841796875, -2.716796875, -2.30517578125, -1.8935546875, -1.48193359375, -1.0703125, -0.65869140625, -0.2470703125, 0.16455078125, 0.576171875, 0.98779296875, 1.3994140625, 1.81103515625, 2.22265625, 2.63427734375, 3.0458984375, 3.45751953125, 3.869140625, 4.28076171875, 4.6923828125, 5.10400390625, 5.515625, 5.92724609375, 6.3388671875, 6.75048828125, 7.162109375, 7.57373046875, 7.9853515625, 8.39697265625, 8.80859375, 9.22021484375, 9.6318359375, 10.04345703125, 10.455078125, 10.86669921875, 11.2783203125, 11.68994140625, 12.1015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 11.0, 17.0, 19.0, 36.0, 46.0, 63.0, 77.0, 114.0, 122.0, 111.0, 112.0, 76.0, 53.0, 37.0, 31.0, 19.0, 14.0, 11.0, 4.0, 2.0, 5.0, 5.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-10.234375, -9.98455810546875, -9.7347412109375, -9.48492431640625, -9.235107421875, -8.98529052734375, -8.7354736328125, -8.48565673828125, -8.23583984375, -7.98602294921875, -7.7362060546875, -7.48638916015625, -7.236572265625, -6.98675537109375, -6.7369384765625, -6.48712158203125, -6.2373046875, -5.98748779296875, -5.7376708984375, -5.48785400390625, -5.238037109375, -4.98822021484375, -4.7384033203125, -4.48858642578125, -4.23876953125, -3.98895263671875, -3.7391357421875, -3.48931884765625, -3.239501953125, -2.98968505859375, -2.7398681640625, -2.49005126953125, -2.240234375, -1.99041748046875, -1.7406005859375, -1.49078369140625, -1.240966796875, -0.99114990234375, -0.7413330078125, -0.49151611328125, -0.24169921875, 0.00811767578125, 0.2579345703125, 0.50775146484375, 0.757568359375, 1.00738525390625, 1.2572021484375, 1.50701904296875, 1.7568359375, 2.00665283203125, 2.2564697265625, 2.50628662109375, 2.756103515625, 3.00592041015625, 3.2557373046875, 3.50555419921875, 3.75537109375, 4.00518798828125, 4.2550048828125, 4.50482177734375, 4.754638671875, 5.00445556640625, 5.2542724609375, 5.50408935546875, 5.75390625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 12.0, 33.0, 51.0, 102.0, 189.0, 197.0, 167.0, 105.0, 62.0, 30.0, 16.0, 10.0, 3.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-86.81666564941406, -84.31334686279297, -81.81002807617188, -79.30670166015625, -76.80338287353516, -74.30006408691406, -71.79674530029297, -69.29342651367188, -66.79010009765625, -64.28678131103516, -61.7834587097168, -59.2801399230957, -56.776817321777344, -54.27349853515625, -51.770179748535156, -49.26686096191406, -46.76354217529297, -44.260223388671875, -41.756900787353516, -39.25358200073242, -36.75025939941406, -34.24694061279297, -31.743621826171875, -29.24030113220215, -26.736980438232422, -24.233659744262695, -21.73033905029297, -19.227020263671875, -16.72369956970215, -14.220378875732422, -11.717059135437012, -9.213739395141602, -6.710411071777344, -4.207090854644775, -1.703770637512207, 0.7995495796203613, 3.3028697967529297, 5.806190490722656, 8.309510231018066, 10.812829971313477, 13.316150665283203, 15.81947135925293, 18.322792053222656, 20.82611083984375, 23.329431533813477, 25.832752227783203, 28.336071014404297, 30.839391708374023, 33.34271240234375, 35.846031188964844, 38.3493537902832, 40.8526725769043, 43.355995178222656, 45.85931396484375, 48.362632751464844, 50.86595153808594, 53.3692741394043, 55.87259292602539, 58.37591552734375, 60.879234313964844, 63.38255310058594, 65.88587951660156, 68.38919830322266, 70.89251708984375, 73.39583587646484]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 3.0, 9.0, 9.0, 17.0, 15.0, 33.0, 34.0, 27.0, 43.0, 51.0, 56.0, 70.0, 71.0, 69.0, 73.0, 49.0, 60.0, 63.0, 52.0, 40.0, 40.0, 37.0, 32.0, 16.0, 13.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.86215209960938, -64.96086120605469, -63.0595703125, -61.15827941894531, -59.25699234008789, -57.3557014465332, -55.454410552978516, -53.55311965942383, -51.651832580566406, -49.75054168701172, -47.84925079345703, -45.947959899902344, -44.04667282104492, -42.145381927490234, -40.24409103393555, -38.34280014038086, -36.44150924682617, -34.540218353271484, -32.6389274597168, -30.737638473510742, -28.836349487304688, -26.93505859375, -25.033767700195312, -23.132476806640625, -21.23118782043457, -19.329896926879883, -17.428607940673828, -15.52731704711914, -13.62602710723877, -11.724737167358398, -9.823446273803711, -7.92215633392334, -6.020870208740234, -4.119580268859863, -2.218289852142334, -0.3169994354248047, 1.5842905044555664, 3.4855804443359375, 5.386871337890625, 7.288161277770996, 9.189451217651367, 11.090741157531738, 12.99203109741211, 14.893321990966797, 16.794612884521484, 18.69590187072754, 20.597192764282227, 22.49848175048828, 24.39977264404297, 26.301063537597656, 28.20235252380371, 30.1036434173584, 32.00493240356445, 33.90622329711914, 35.80751419067383, 37.708805084228516, 39.61009216308594, 41.511383056640625, 43.41267395019531, 45.31396484375, 47.21525192260742, 49.11654281616211, 51.0178337097168, 52.919124603271484, 54.82041549682617]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 11.0, 9.0, 18.0, 24.0, 34.0, 58.0, 83.0, 118.0, 202.0, 411.0, 980.0, 3208.0, 21349.0, 3292826.0, 852016.0, 17218.0, 3393.0, 1132.0, 504.0, 267.0, 159.0, 79.0, 62.0, 34.0, 22.0, 14.0, 18.0, 6.0, 6.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-38.21875, -36.94189453125, -35.6650390625, -34.38818359375, -33.111328125, -31.83447265625, -30.5576171875, -29.28076171875, -28.00390625, -26.72705078125, -25.4501953125, -24.17333984375, -22.896484375, -21.61962890625, -20.3427734375, -19.06591796875, -17.7890625, -16.51220703125, -15.2353515625, -13.95849609375, -12.681640625, -11.40478515625, -10.1279296875, -8.85107421875, -7.57421875, -6.29736328125, -5.0205078125, -3.74365234375, -2.466796875, -1.18994140625, 0.0869140625, 1.36376953125, 2.640625, 3.91748046875, 5.1943359375, 6.47119140625, 7.748046875, 9.02490234375, 10.3017578125, 11.57861328125, 12.85546875, 14.13232421875, 15.4091796875, 16.68603515625, 17.962890625, 19.23974609375, 20.5166015625, 21.79345703125, 23.0703125, 24.34716796875, 25.6240234375, 26.90087890625, 28.177734375, 29.45458984375, 30.7314453125, 32.00830078125, 33.28515625, 34.56201171875, 35.8388671875, 37.11572265625, 38.392578125, 39.66943359375, 40.9462890625, 42.22314453125, 43.5]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 7.0, 6.0, 19.0, 22.0, 43.0, 43.0, 63.0, 69.0, 88.0, 102.0, 85.0, 95.0, 74.0, 70.0, 56.0, 51.0, 35.0, 19.0, 15.0, 7.0, 7.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-1.7880859375, -1.731353759765625, -1.67462158203125, -1.617889404296875, -1.5611572265625, -1.504425048828125, -1.44769287109375, -1.390960693359375, -1.334228515625, -1.277496337890625, -1.22076416015625, -1.164031982421875, -1.1072998046875, -1.050567626953125, -0.99383544921875, -0.937103271484375, -0.88037109375, -0.823638916015625, -0.76690673828125, -0.710174560546875, -0.6534423828125, -0.596710205078125, -0.53997802734375, -0.483245849609375, -0.426513671875, -0.369781494140625, -0.31304931640625, -0.256317138671875, -0.1995849609375, -0.142852783203125, -0.08612060546875, -0.029388427734375, 0.02734375, 0.084075927734375, 0.14080810546875, 0.197540283203125, 0.2542724609375, 0.311004638671875, 0.36773681640625, 0.424468994140625, 0.481201171875, 0.537933349609375, 0.59466552734375, 0.651397705078125, 0.7081298828125, 0.764862060546875, 0.82159423828125, 0.878326416015625, 0.93505859375, 0.991790771484375, 1.04852294921875, 1.105255126953125, 1.1619873046875, 1.218719482421875, 1.27545166015625, 1.332183837890625, 1.388916015625, 1.445648193359375, 1.50238037109375, 1.559112548828125, 1.6158447265625, 1.672576904296875, 1.72930908203125, 1.786041259765625, 1.8427734375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 16.0, 9.0, 24.0, 27.0, 39.0, 69.0, 98.0, 105.0, 174.0, 279.0, 997.0, 284819.0, 3904130.0, 2591.0, 360.0, 166.0, 111.0, 81.0, 64.0, 41.0, 28.0, 22.0, 12.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0], "bins": [-120.0625, -117.51513671875, -114.9677734375, -112.42041015625, -109.873046875, -107.32568359375, -104.7783203125, -102.23095703125, -99.68359375, -97.13623046875, -94.5888671875, -92.04150390625, -89.494140625, -86.94677734375, -84.3994140625, -81.85205078125, -79.3046875, -76.75732421875, -74.2099609375, -71.66259765625, -69.115234375, -66.56787109375, -64.0205078125, -61.47314453125, -58.92578125, -56.37841796875, -53.8310546875, -51.28369140625, -48.736328125, -46.18896484375, -43.6416015625, -41.09423828125, -38.546875, -35.99951171875, -33.4521484375, -30.90478515625, -28.357421875, -25.81005859375, -23.2626953125, -20.71533203125, -18.16796875, -15.62060546875, -13.0732421875, -10.52587890625, -7.978515625, -5.43115234375, -2.8837890625, -0.33642578125, 2.2109375, 4.75830078125, 7.3056640625, 9.85302734375, 12.400390625, 14.94775390625, 17.4951171875, 20.04248046875, 22.58984375, 25.13720703125, 27.6845703125, 30.23193359375, 32.779296875, 35.32666015625, 37.8740234375, 40.42138671875, 42.96875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 16.0, 33.0, 58.0, 140.0, 369.0, 1557.0, 1325.0, 338.0, 130.0, 55.0, 22.0, 18.0, 11.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.3203125, -11.10235595703125, -10.8843994140625, -10.66644287109375, -10.448486328125, -10.23052978515625, -10.0125732421875, -9.79461669921875, -9.57666015625, -9.35870361328125, -9.1407470703125, -8.92279052734375, -8.704833984375, -8.48687744140625, -8.2689208984375, -8.05096435546875, -7.8330078125, -7.61505126953125, -7.3970947265625, -7.17913818359375, -6.961181640625, -6.74322509765625, -6.5252685546875, -6.30731201171875, -6.08935546875, -5.87139892578125, -5.6534423828125, -5.43548583984375, -5.217529296875, -4.99957275390625, -4.7816162109375, -4.56365966796875, -4.345703125, -4.12774658203125, -3.9097900390625, -3.69183349609375, -3.473876953125, -3.25592041015625, -3.0379638671875, -2.82000732421875, -2.60205078125, -2.38409423828125, -2.1661376953125, -1.94818115234375, -1.730224609375, -1.51226806640625, -1.2943115234375, -1.07635498046875, -0.8583984375, -0.64044189453125, -0.4224853515625, -0.20452880859375, 0.013427734375, 0.23138427734375, 0.4493408203125, 0.66729736328125, 0.88525390625, 1.10321044921875, 1.3211669921875, 1.53912353515625, 1.757080078125, 1.97503662109375, 2.1929931640625, 2.41094970703125, 2.62890625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 110.0, 824.0, 66.0, 7.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-185.94189453125, -177.99920654296875, -170.0565185546875, -162.11383056640625, -154.171142578125, -146.22845458984375, -138.2857666015625, -130.34307861328125, -122.40038299560547, -114.45769500732422, -106.51500701904297, -98.57231140136719, -90.62962341308594, -82.68693542480469, -74.74424743652344, -66.80155944824219, -58.85887145996094, -50.91618347167969, -42.97349548339844, -35.03080368041992, -27.088115692138672, -19.145427703857422, -11.202735900878906, -3.2600479125976562, 4.682640075683594, 12.62532901763916, 20.568017959594727, 28.51070785522461, 36.45339584350586, 44.39608383178711, 52.338775634765625, 60.281463623046875, 68.22415161132812, 76.16683959960938, 84.10952758789062, 92.05221557617188, 99.99490356445312, 107.93759155273438, 115.88028717041016, 123.8229751586914, 131.76565551757812, 139.70834350585938, 147.65103149414062, 155.59371948242188, 163.53640747070312, 171.47909545898438, 179.42178344726562, 187.36447143554688, 195.3071746826172, 203.24986267089844, 211.1925506591797, 219.13523864746094, 227.0779266357422, 235.02061462402344, 242.96331787109375, 250.906005859375, 258.84869384765625, 266.7913818359375, 274.73406982421875, 282.6767578125, 290.61944580078125, 298.5621337890625, 306.50482177734375, 314.447509765625, 322.39019775390625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 13.0, 24.0, 21.0, 35.0, 51.0, 70.0, 80.0, 97.0, 106.0, 92.0, 98.0, 67.0, 60.0, 59.0, 45.0, 26.0, 22.0, 12.0, 5.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.453672409057617, -27.52790069580078, -26.602128982543945, -25.67635726928711, -24.75058364868164, -23.824811935424805, -22.89904022216797, -21.973268508911133, -21.047496795654297, -20.12172508239746, -19.195953369140625, -18.270179748535156, -17.34440803527832, -16.418636322021484, -15.492864608764648, -14.567092895507812, -13.641319274902344, -12.715547561645508, -11.789774894714355, -10.86400318145752, -9.938230514526367, -9.012458801269531, -8.086687088012695, -7.160914897918701, -6.235142707824707, -5.309370517730713, -4.383598327636719, -3.457826614379883, -2.5320544242858887, -1.6062822341918945, -0.6805105209350586, 0.24526166915893555, 1.1710319519042969, 2.096804141998291, 3.022576093673706, 3.948348045349121, 4.874120235443115, 5.799892425537109, 6.725664138793945, 7.6514363288879395, 8.577208518981934, 9.50298023223877, 10.428752899169922, 11.354524612426758, 12.280296325683594, 13.206068992614746, 14.131840705871582, 15.057613372802734, 15.98338508605957, 16.909156799316406, 17.834928512573242, 18.760700225830078, 19.686473846435547, 20.612245559692383, 21.53801727294922, 22.463788986206055, 23.38956069946289, 24.315332412719727, 25.241104125976562, 26.16687774658203, 27.092649459838867, 28.018421173095703, 28.94419288635254, 29.869964599609375, 30.795738220214844]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 4.0, 6.0, 7.0, 10.0, 5.0, 12.0, 13.0, 12.0, 17.0, 42.0, 58.0, 88.0, 153.0, 250.0, 500.0, 956.0, 2486.0, 7635.0, 44403.0, 381318.0, 521750.0, 72469.0, 10856.0, 3049.0, 1205.0, 529.0, 278.0, 147.0, 108.0, 65.0, 27.0, 26.0, 17.0, 11.0, 13.0, 9.0, 4.0, 8.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.828125, -21.188232421875, -20.54833984375, -19.908447265625, -19.2685546875, -18.628662109375, -17.98876953125, -17.348876953125, -16.708984375, -16.069091796875, -15.42919921875, -14.789306640625, -14.1494140625, -13.509521484375, -12.86962890625, -12.229736328125, -11.58984375, -10.949951171875, -10.31005859375, -9.670166015625, -9.0302734375, -8.390380859375, -7.75048828125, -7.110595703125, -6.470703125, -5.830810546875, -5.19091796875, -4.551025390625, -3.9111328125, -3.271240234375, -2.63134765625, -1.991455078125, -1.3515625, -0.711669921875, -0.07177734375, 0.568115234375, 1.2080078125, 1.847900390625, 2.48779296875, 3.127685546875, 3.767578125, 4.407470703125, 5.04736328125, 5.687255859375, 6.3271484375, 6.967041015625, 7.60693359375, 8.246826171875, 8.88671875, 9.526611328125, 10.16650390625, 10.806396484375, 11.4462890625, 12.086181640625, 12.72607421875, 13.365966796875, 14.005859375, 14.645751953125, 15.28564453125, 15.925537109375, 16.5654296875, 17.205322265625, 17.84521484375, 18.485107421875, 19.125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 8.0, 12.0, 22.0, 31.0, 45.0, 79.0, 91.0, 111.0, 117.0, 117.0, 108.0, 85.0, 62.0, 43.0, 24.0, 12.0, 15.0, 1.0, 3.0, 4.0, 1.0, 0.0, 6.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.33203125, -3.246185302734375, -3.16033935546875, -3.074493408203125, -2.9886474609375, -2.902801513671875, -2.81695556640625, -2.731109619140625, -2.645263671875, -2.559417724609375, -2.47357177734375, -2.387725830078125, -2.3018798828125, -2.216033935546875, -2.13018798828125, -2.044342041015625, -1.95849609375, -1.872650146484375, -1.78680419921875, -1.700958251953125, -1.6151123046875, -1.529266357421875, -1.44342041015625, -1.357574462890625, -1.271728515625, -1.185882568359375, -1.10003662109375, -1.014190673828125, -0.9283447265625, -0.842498779296875, -0.75665283203125, -0.670806884765625, -0.5849609375, -0.499114990234375, -0.41326904296875, -0.327423095703125, -0.2415771484375, -0.155731201171875, -0.06988525390625, 0.015960693359375, 0.101806640625, 0.187652587890625, 0.27349853515625, 0.359344482421875, 0.4451904296875, 0.531036376953125, 0.61688232421875, 0.702728271484375, 0.78857421875, 0.874420166015625, 0.96026611328125, 1.046112060546875, 1.1319580078125, 1.217803955078125, 1.30364990234375, 1.389495849609375, 1.475341796875, 1.561187744140625, 1.64703369140625, 1.732879638671875, 1.8187255859375, 1.904571533203125, 1.99041748046875, 2.076263427734375, 2.162109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 7.0, 5.0, 15.0, 13.0, 26.0, 20.0, 38.0, 51.0, 64.0, 99.0, 145.0, 212.0, 271.0, 444.0, 681.0, 1186.0, 2093.0, 4235.0, 9549.0, 24911.0, 69597.0, 186457.0, 328423.0, 251996.0, 105221.0, 36795.0, 13591.0, 5724.0, 2790.0, 1451.0, 840.0, 530.0, 312.0, 202.0, 154.0, 141.0, 70.0, 57.0, 35.0, 27.0, 17.0, 19.0, 7.0, 11.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-9.34375, -9.074462890625, -8.80517578125, -8.535888671875, -8.2666015625, -7.997314453125, -7.72802734375, -7.458740234375, -7.189453125, -6.920166015625, -6.65087890625, -6.381591796875, -6.1123046875, -5.843017578125, -5.57373046875, -5.304443359375, -5.03515625, -4.765869140625, -4.49658203125, -4.227294921875, -3.9580078125, -3.688720703125, -3.41943359375, -3.150146484375, -2.880859375, -2.611572265625, -2.34228515625, -2.072998046875, -1.8037109375, -1.534423828125, -1.26513671875, -0.995849609375, -0.7265625, -0.457275390625, -0.18798828125, 0.081298828125, 0.3505859375, 0.619873046875, 0.88916015625, 1.158447265625, 1.427734375, 1.697021484375, 1.96630859375, 2.235595703125, 2.5048828125, 2.774169921875, 3.04345703125, 3.312744140625, 3.58203125, 3.851318359375, 4.12060546875, 4.389892578125, 4.6591796875, 4.928466796875, 5.19775390625, 5.467041015625, 5.736328125, 6.005615234375, 6.27490234375, 6.544189453125, 6.8134765625, 7.082763671875, 7.35205078125, 7.621337890625, 7.890625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 3.0, 5.0, 6.0, 12.0, 9.0, 13.0, 14.0, 17.0, 18.0, 19.0, 27.0, 29.0, 38.0, 35.0, 39.0, 49.0, 51.0, 45.0, 54.0, 54.0, 56.0, 43.0, 37.0, 41.0, 50.0, 34.0, 30.0, 24.0, 22.0, 21.0, 30.0, 13.0, 10.0, 9.0, 13.0, 6.0, 6.0, 5.0, 7.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.0234375, -7.77581787109375, -7.5281982421875, -7.28057861328125, -7.032958984375, -6.78533935546875, -6.5377197265625, -6.29010009765625, -6.04248046875, -5.79486083984375, -5.5472412109375, -5.29962158203125, -5.052001953125, -4.80438232421875, -4.5567626953125, -4.30914306640625, -4.0615234375, -3.81390380859375, -3.5662841796875, -3.31866455078125, -3.071044921875, -2.82342529296875, -2.5758056640625, -2.32818603515625, -2.08056640625, -1.83294677734375, -1.5853271484375, -1.33770751953125, -1.090087890625, -0.84246826171875, -0.5948486328125, -0.34722900390625, -0.099609375, 0.14801025390625, 0.3956298828125, 0.64324951171875, 0.890869140625, 1.13848876953125, 1.3861083984375, 1.63372802734375, 1.88134765625, 2.12896728515625, 2.3765869140625, 2.62420654296875, 2.871826171875, 3.11944580078125, 3.3670654296875, 3.61468505859375, 3.8623046875, 4.10992431640625, 4.3575439453125, 4.60516357421875, 4.852783203125, 5.10040283203125, 5.3480224609375, 5.59564208984375, 5.84326171875, 6.09088134765625, 6.3385009765625, 6.58612060546875, 6.833740234375, 7.08135986328125, 7.3289794921875, 7.57659912109375, 7.82421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 6.0, 6.0, 3.0, 9.0, 12.0, 19.0, 27.0, 30.0, 66.0, 116.0, 213.0, 469.0, 1358.0, 4852.0, 27945.0, 271324.0, 626333.0, 99358.0, 12275.0, 2565.0, 844.0, 313.0, 147.0, 88.0, 58.0, 41.0, 26.0, 14.0, 16.0, 6.0, 4.0, 2.0, 7.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.265625, -9.804931640625, -9.34423828125, -8.883544921875, -8.4228515625, -7.962158203125, -7.50146484375, -7.040771484375, -6.580078125, -6.119384765625, -5.65869140625, -5.197998046875, -4.7373046875, -4.276611328125, -3.81591796875, -3.355224609375, -2.89453125, -2.433837890625, -1.97314453125, -1.512451171875, -1.0517578125, -0.591064453125, -0.13037109375, 0.330322265625, 0.791015625, 1.251708984375, 1.71240234375, 2.173095703125, 2.6337890625, 3.094482421875, 3.55517578125, 4.015869140625, 4.4765625, 4.937255859375, 5.39794921875, 5.858642578125, 6.3193359375, 6.780029296875, 7.24072265625, 7.701416015625, 8.162109375, 8.622802734375, 9.08349609375, 9.544189453125, 10.0048828125, 10.465576171875, 10.92626953125, 11.386962890625, 11.84765625, 12.308349609375, 12.76904296875, 13.229736328125, 13.6904296875, 14.151123046875, 14.61181640625, 15.072509765625, 15.533203125, 15.993896484375, 16.45458984375, 16.915283203125, 17.3759765625, 17.836669921875, 18.29736328125, 18.758056640625, 19.21875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 7.0, 7.0, 12.0, 10.0, 12.0, 11.0, 17.0, 16.0, 31.0, 29.0, 36.0, 62.0, 54.0, 61.0, 71.0, 71.0, 74.0, 57.0, 63.0, 52.0, 36.0, 37.0, 26.0, 28.0, 26.0, 20.0, 12.0, 14.0, 7.0, 11.0, 10.0, 8.0, 3.0, 3.0, 4.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009431838989257812, -0.0009156465530395508, -0.0008881092071533203, -0.0008605718612670898, -0.0008330345153808594, -0.0008054971694946289, -0.0007779598236083984, -0.000750422477722168, -0.0007228851318359375, -0.000695347785949707, -0.0006678104400634766, -0.0006402730941772461, -0.0006127357482910156, -0.0005851984024047852, -0.0005576610565185547, -0.0005301237106323242, -0.0005025863647460938, -0.0004750490188598633, -0.0004475116729736328, -0.00041997432708740234, -0.0003924369812011719, -0.0003648996353149414, -0.00033736228942871094, -0.00030982494354248047, -0.00028228759765625, -0.00025475025177001953, -0.00022721290588378906, -0.0001996755599975586, -0.00017213821411132812, -0.00014460086822509766, -0.00011706352233886719, -8.952617645263672e-05, -6.198883056640625e-05, -3.445148468017578e-05, -6.9141387939453125e-06, 2.0623207092285156e-05, 4.8160552978515625e-05, 7.56978988647461e-05, 0.00010323524475097656, 0.00013077259063720703, 0.0001583099365234375, 0.00018584728240966797, 0.00021338462829589844, 0.0002409219741821289, 0.0002684593200683594, 0.00029599666595458984, 0.0003235340118408203, 0.0003510713577270508, 0.00037860870361328125, 0.0004061460494995117, 0.0004336833953857422, 0.00046122074127197266, 0.0004887580871582031, 0.0005162954330444336, 0.0005438327789306641, 0.0005713701248168945, 0.000598907470703125, 0.0006264448165893555, 0.0006539821624755859, 0.0006815195083618164, 0.0007090568542480469, 0.0007365942001342773, 0.0007641315460205078, 0.0007916688919067383, 0.0008192062377929688]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 8.0, 9.0, 6.0, 14.0, 29.0, 30.0, 61.0, 95.0, 152.0, 293.0, 613.0, 1323.0, 3401.0, 11868.0, 60745.0, 384877.0, 479444.0, 83254.0, 15173.0, 4095.0, 1518.0, 658.0, 340.0, 207.0, 120.0, 66.0, 38.0, 34.0, 14.0, 14.0, 14.0, 7.0, 5.0, 8.0, 2.0, 4.0, 5.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.125, -10.698486328125, -10.27197265625, -9.845458984375, -9.4189453125, -8.992431640625, -8.56591796875, -8.139404296875, -7.712890625, -7.286376953125, -6.85986328125, -6.433349609375, -6.0068359375, -5.580322265625, -5.15380859375, -4.727294921875, -4.30078125, -3.874267578125, -3.44775390625, -3.021240234375, -2.5947265625, -2.168212890625, -1.74169921875, -1.315185546875, -0.888671875, -0.462158203125, -0.03564453125, 0.390869140625, 0.8173828125, 1.243896484375, 1.67041015625, 2.096923828125, 2.5234375, 2.949951171875, 3.37646484375, 3.802978515625, 4.2294921875, 4.656005859375, 5.08251953125, 5.509033203125, 5.935546875, 6.362060546875, 6.78857421875, 7.215087890625, 7.6416015625, 8.068115234375, 8.49462890625, 8.921142578125, 9.34765625, 9.774169921875, 10.20068359375, 10.627197265625, 11.0537109375, 11.480224609375, 11.90673828125, 12.333251953125, 12.759765625, 13.186279296875, 13.61279296875, 14.039306640625, 14.4658203125, 14.892333984375, 15.31884765625, 15.745361328125, 16.171875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 15.0, 15.0, 30.0, 55.0, 56.0, 111.0, 115.0, 128.0, 113.0, 115.0, 91.0, 40.0, 30.0, 19.0, 35.0, 9.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.04296875, -5.71893310546875, -5.3948974609375, -5.07086181640625, -4.746826171875, -4.42279052734375, -4.0987548828125, -3.77471923828125, -3.45068359375, -3.12664794921875, -2.8026123046875, -2.47857666015625, -2.154541015625, -1.83050537109375, -1.5064697265625, -1.18243408203125, -0.8583984375, -0.53436279296875, -0.2103271484375, 0.11370849609375, 0.437744140625, 0.76177978515625, 1.0858154296875, 1.40985107421875, 1.73388671875, 2.05792236328125, 2.3819580078125, 2.70599365234375, 3.030029296875, 3.35406494140625, 3.6781005859375, 4.00213623046875, 4.326171875, 4.65020751953125, 4.9742431640625, 5.29827880859375, 5.622314453125, 5.94635009765625, 6.2703857421875, 6.59442138671875, 6.91845703125, 7.24249267578125, 7.5665283203125, 7.89056396484375, 8.214599609375, 8.53863525390625, 8.8626708984375, 9.18670654296875, 9.5107421875, 9.83477783203125, 10.1588134765625, 10.48284912109375, 10.806884765625, 11.13092041015625, 11.4549560546875, 11.77899169921875, 12.10302734375, 12.42706298828125, 12.7510986328125, 13.07513427734375, 13.399169921875, 13.72320556640625, 14.0472412109375, 14.37127685546875, 14.6953125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 11.0, 35.0, 82.0, 202.0, 303.0, 216.0, 90.0, 32.0, 17.0, 8.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-225.82984924316406, -220.74945068359375, -215.66903686523438, -210.588623046875, -205.5082244873047, -200.42782592773438, -195.347412109375, -190.26699829101562, -185.1865997314453, -180.106201171875, -175.02578735351562, -169.94537353515625, -164.86497497558594, -159.78457641601562, -154.70416259765625, -149.62374877929688, -144.54335021972656, -139.46295166015625, -134.38253784179688, -129.3021240234375, -124.22172546386719, -119.14131927490234, -114.0609130859375, -108.98050689697266, -103.90010070800781, -98.81969451904297, -93.73928833007812, -88.65888214111328, -83.57847595214844, -78.4980697631836, -73.41766357421875, -68.3372573852539, -63.256858825683594, -58.17645263671875, -53.096046447753906, -48.01564025878906, -42.93523406982422, -37.854827880859375, -32.77442169189453, -27.694015502929688, -22.613609313964844, -17.533203125, -12.452796936035156, -7.3723907470703125, -2.2919845581054688, 2.788421630859375, 7.868827819824219, 12.949234008789062, 18.029640197753906, 23.11004638671875, 28.190452575683594, 33.27085876464844, 38.35126495361328, 43.431671142578125, 48.51207733154297, 53.59248352050781, 58.672889709472656, 63.7532958984375, 68.83370208740234, 73.91410827636719, 78.99451446533203, 84.07492065429688, 89.15532684326172, 94.23573303222656, 99.3161392211914]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 6.0, 10.0, 7.0, 12.0, 19.0, 24.0, 29.0, 27.0, 33.0, 41.0, 39.0, 51.0, 63.0, 53.0, 52.0, 51.0, 53.0, 48.0, 54.0, 42.0, 38.0, 42.0, 35.0, 30.0, 24.0, 22.0, 14.0, 14.0, 10.0, 15.0, 9.0, 10.0, 5.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-77.57233428955078, -75.47307586669922, -73.37381744384766, -71.2745590209961, -69.17530059814453, -67.07604217529297, -64.9767837524414, -62.877525329589844, -60.77826690673828, -58.67900848388672, -56.579750061035156, -54.480491638183594, -52.38123321533203, -50.28197479248047, -48.182716369628906, -46.083457946777344, -43.98419952392578, -41.88494110107422, -39.785682678222656, -37.686424255371094, -35.58716583251953, -33.48790740966797, -31.388648986816406, -29.289390563964844, -27.19013214111328, -25.09087371826172, -22.991615295410156, -20.892356872558594, -18.79309844970703, -16.69384002685547, -14.594581604003906, -12.495323181152344, -10.396072387695312, -8.29681396484375, -6.1975555419921875, -4.098297119140625, -1.9990386962890625, 0.1002197265625, 2.1994781494140625, 4.298736572265625, 6.3979949951171875, 8.49725341796875, 10.596511840820312, 12.695770263671875, 14.795028686523438, 16.894287109375, 18.993545532226562, 21.092803955078125, 23.192062377929688, 25.29132080078125, 27.390579223632812, 29.489837646484375, 31.589096069335938, 33.6883544921875, 35.78761291503906, 37.886871337890625, 39.98612976074219, 42.08538818359375, 44.18464660644531, 46.283905029296875, 48.38316345214844, 50.482421875, 52.58168029785156, 54.680938720703125, 56.78019714355469]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 5.0, 8.0, 16.0, 10.0, 11.0, 22.0, 22.0, 38.0, 39.0, 37.0, 93.0, 135.0, 221.0, 379.0, 705.0, 1517.0, 3936.0, 15207.0, 101104.0, 3651623.0, 373664.0, 33619.0, 7446.0, 2408.0, 983.0, 436.0, 236.0, 145.0, 66.0, 46.0, 30.0, 17.0, 17.0, 11.0, 11.0, 7.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.078125, -30.254150390625, -29.43017578125, -28.606201171875, -27.7822265625, -26.958251953125, -26.13427734375, -25.310302734375, -24.486328125, -23.662353515625, -22.83837890625, -22.014404296875, -21.1904296875, -20.366455078125, -19.54248046875, -18.718505859375, -17.89453125, -17.070556640625, -16.24658203125, -15.422607421875, -14.5986328125, -13.774658203125, -12.95068359375, -12.126708984375, -11.302734375, -10.478759765625, -9.65478515625, -8.830810546875, -8.0068359375, -7.182861328125, -6.35888671875, -5.534912109375, -4.7109375, -3.886962890625, -3.06298828125, -2.239013671875, -1.4150390625, -0.591064453125, 0.23291015625, 1.056884765625, 1.880859375, 2.704833984375, 3.52880859375, 4.352783203125, 5.1767578125, 6.000732421875, 6.82470703125, 7.648681640625, 8.47265625, 9.296630859375, 10.12060546875, 10.944580078125, 11.7685546875, 12.592529296875, 13.41650390625, 14.240478515625, 15.064453125, 15.888427734375, 16.71240234375, 17.536376953125, 18.3603515625, 19.184326171875, 20.00830078125, 20.832275390625, 21.65625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 17.0, 7.0, 12.0, 23.0, 38.0, 56.0, 51.0, 73.0, 49.0, 77.0, 72.0, 84.0, 83.0, 78.0, 55.0, 50.0, 47.0, 40.0, 25.0, 25.0, 9.0, 7.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.503265380859375, -2.42254638671875, -2.341827392578125, -2.2611083984375, -2.180389404296875, -2.09967041015625, -2.018951416015625, -1.938232421875, -1.857513427734375, -1.77679443359375, -1.696075439453125, -1.6153564453125, -1.534637451171875, -1.45391845703125, -1.373199462890625, -1.29248046875, -1.211761474609375, -1.13104248046875, -1.050323486328125, -0.9696044921875, -0.888885498046875, -0.80816650390625, -0.727447509765625, -0.646728515625, -0.566009521484375, -0.48529052734375, -0.404571533203125, -0.3238525390625, -0.243133544921875, -0.16241455078125, -0.081695556640625, -0.0009765625, 0.079742431640625, 0.16046142578125, 0.241180419921875, 0.3218994140625, 0.402618408203125, 0.48333740234375, 0.564056396484375, 0.644775390625, 0.725494384765625, 0.80621337890625, 0.886932373046875, 0.9676513671875, 1.048370361328125, 1.12908935546875, 1.209808349609375, 1.29052734375, 1.371246337890625, 1.45196533203125, 1.532684326171875, 1.6134033203125, 1.694122314453125, 1.77484130859375, 1.855560302734375, 1.936279296875, 2.016998291015625, 2.09771728515625, 2.178436279296875, 2.2591552734375, 2.339874267578125, 2.42059326171875, 2.501312255859375, 2.58203125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 11.0, 15.0, 25.0, 35.0, 54.0, 91.0, 121.0, 179.0, 385.0, 843.0, 3254.0, 324884.0, 3856394.0, 5998.0, 1052.0, 427.0, 204.0, 121.0, 64.0, 48.0, 38.0, 22.0, 9.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-108.3125, -105.8583984375, -103.404296875, -100.9501953125, -98.49609375, -96.0419921875, -93.587890625, -91.1337890625, -88.6796875, -86.2255859375, -83.771484375, -81.3173828125, -78.86328125, -76.4091796875, -73.955078125, -71.5009765625, -69.046875, -66.5927734375, -64.138671875, -61.6845703125, -59.23046875, -56.7763671875, -54.322265625, -51.8681640625, -49.4140625, -46.9599609375, -44.505859375, -42.0517578125, -39.59765625, -37.1435546875, -34.689453125, -32.2353515625, -29.78125, -27.3271484375, -24.873046875, -22.4189453125, -19.96484375, -17.5107421875, -15.056640625, -12.6025390625, -10.1484375, -7.6943359375, -5.240234375, -2.7861328125, -0.33203125, 2.1220703125, 4.576171875, 7.0302734375, 9.484375, 11.9384765625, 14.392578125, 16.8466796875, 19.30078125, 21.7548828125, 24.208984375, 26.6630859375, 29.1171875, 31.5712890625, 34.025390625, 36.4794921875, 38.93359375, 41.3876953125, 43.841796875, 46.2958984375, 48.75]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 8.0, 28.0, 49.0, 123.0, 377.0, 1977.0, 1136.0, 234.0, 79.0, 42.0, 12.0, 9.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-17.578125, -17.239013671875, -16.89990234375, -16.560791015625, -16.2216796875, -15.882568359375, -15.54345703125, -15.204345703125, -14.865234375, -14.526123046875, -14.18701171875, -13.847900390625, -13.5087890625, -13.169677734375, -12.83056640625, -12.491455078125, -12.15234375, -11.813232421875, -11.47412109375, -11.135009765625, -10.7958984375, -10.456787109375, -10.11767578125, -9.778564453125, -9.439453125, -9.100341796875, -8.76123046875, -8.422119140625, -8.0830078125, -7.743896484375, -7.40478515625, -7.065673828125, -6.7265625, -6.387451171875, -6.04833984375, -5.709228515625, -5.3701171875, -5.031005859375, -4.69189453125, -4.352783203125, -4.013671875, -3.674560546875, -3.33544921875, -2.996337890625, -2.6572265625, -2.318115234375, -1.97900390625, -1.639892578125, -1.30078125, -0.961669921875, -0.62255859375, -0.283447265625, 0.0556640625, 0.394775390625, 0.73388671875, 1.072998046875, 1.412109375, 1.751220703125, 2.09033203125, 2.429443359375, 2.7685546875, 3.107666015625, 3.44677734375, 3.785888671875, 4.125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 8.0, 18.0, 30.0, 123.0, 289.0, 314.0, 136.0, 43.0, 23.0, 15.0, 2.0, 0.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.5068130493164, -98.84917449951172, -96.1915283203125, -93.53388977050781, -90.87625122070312, -88.21861267089844, -85.56097412109375, -82.90332794189453, -80.24568939208984, -77.58805084228516, -74.93040466308594, -72.27276611328125, -69.61512756347656, -66.95748901367188, -64.29985046386719, -61.64220428466797, -58.98456573486328, -56.326927185058594, -53.66928482055664, -51.01164245605469, -48.35400390625, -45.69636535644531, -43.03872299194336, -40.381080627441406, -37.72344207763672, -35.06580352783203, -32.40816116333008, -29.750520706176758, -27.092880249023438, -24.435239791870117, -21.777599334716797, -19.119958877563477, -16.462326049804688, -13.804685592651367, -11.147045135498047, -8.489404678344727, -5.831764221191406, -3.174123764038086, -0.5164833068847656, 2.1411571502685547, 4.798797607421875, 7.456438064575195, 10.114078521728516, 12.771718978881836, 15.429359436035156, 18.086999893188477, 20.744640350341797, 23.402280807495117, 26.059921264648438, 28.717561721801758, 31.375202178955078, 34.03284454345703, 36.69048309326172, 39.348121643066406, 42.00576400756836, 44.66340637207031, 47.321044921875, 49.97868347167969, 52.63632583618164, 55.293968200683594, 57.95160675048828, 60.60924530029297, 63.26688766479492, 65.92453002929688, 68.58216857910156]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 4.0, 1.0, 3.0, 5.0, 12.0, 13.0, 19.0, 34.0, 34.0, 45.0, 43.0, 55.0, 66.0, 62.0, 62.0, 78.0, 80.0, 66.0, 68.0, 65.0, 47.0, 32.0, 29.0, 24.0, 17.0, 8.0, 8.0, 13.0, 2.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.922222137451172, -30.00249481201172, -29.082765579223633, -28.16303825378418, -27.243309020996094, -26.32358169555664, -25.403854370117188, -24.4841251373291, -23.564395904541016, -22.644668579101562, -21.724939346313477, -20.805212020874023, -19.885482788085938, -18.965755462646484, -18.04602813720703, -17.126298904418945, -16.206571578979492, -15.286843299865723, -14.367115020751953, -13.4473876953125, -12.527658462524414, -11.607931137084961, -10.688202857971191, -9.768474578857422, -8.848746299743652, -7.929018020629883, -7.009289741516113, -6.089561939239502, -5.169833660125732, -4.250105381011963, -3.3303775787353516, -2.410649299621582, -1.4909210205078125, -0.5711928606033325, 0.34853529930114746, 1.268263339996338, 2.1879916191101074, 3.107719898223877, 4.027447700500488, 4.947175979614258, 5.866904258728027, 6.786632537841797, 7.706360816955566, 8.626089096069336, 9.545816421508789, 10.465545654296875, 11.385272979736328, 12.305001258850098, 13.224729537963867, 14.144457817077637, 15.064186096191406, 15.98391342163086, 16.903642654418945, 17.8233699798584, 18.743099212646484, 19.662826538085938, 20.58255386352539, 21.502281188964844, 22.42201042175293, 23.341737747192383, 24.26146697998047, 25.181194305419922, 26.100921630859375, 27.02065086364746, 27.940380096435547]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 10.0, 11.0, 15.0, 38.0, 54.0, 110.0, 136.0, 259.0, 436.0, 871.0, 1904.0, 5426.0, 20251.0, 102728.0, 446840.0, 370878.0, 75164.0, 15480.0, 4461.0, 1676.0, 818.0, 418.0, 214.0, 141.0, 84.0, 45.0, 29.0, 17.0, 17.0, 9.0, 9.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.71875, -17.211181640625, -16.70361328125, -16.196044921875, -15.6884765625, -15.180908203125, -14.67333984375, -14.165771484375, -13.658203125, -13.150634765625, -12.64306640625, -12.135498046875, -11.6279296875, -11.120361328125, -10.61279296875, -10.105224609375, -9.59765625, -9.090087890625, -8.58251953125, -8.074951171875, -7.5673828125, -7.059814453125, -6.55224609375, -6.044677734375, -5.537109375, -5.029541015625, -4.52197265625, -4.014404296875, -3.5068359375, -2.999267578125, -2.49169921875, -1.984130859375, -1.4765625, -0.968994140625, -0.46142578125, 0.046142578125, 0.5537109375, 1.061279296875, 1.56884765625, 2.076416015625, 2.583984375, 3.091552734375, 3.59912109375, 4.106689453125, 4.6142578125, 5.121826171875, 5.62939453125, 6.136962890625, 6.64453125, 7.152099609375, 7.65966796875, 8.167236328125, 8.6748046875, 9.182373046875, 9.68994140625, 10.197509765625, 10.705078125, 11.212646484375, 11.72021484375, 12.227783203125, 12.7353515625, 13.242919921875, 13.75048828125, 14.258056640625, 14.765625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 3.0, 3.0, 7.0, 14.0, 19.0, 25.0, 42.0, 47.0, 52.0, 55.0, 61.0, 83.0, 77.0, 80.0, 70.0, 75.0, 67.0, 51.0, 51.0, 33.0, 17.0, 14.0, 21.0, 6.0, 5.0, 5.0, 4.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.25390625, -3.160919189453125, -3.06793212890625, -2.974945068359375, -2.8819580078125, -2.788970947265625, -2.69598388671875, -2.602996826171875, -2.510009765625, -2.417022705078125, -2.32403564453125, -2.231048583984375, -2.1380615234375, -2.045074462890625, -1.95208740234375, -1.859100341796875, -1.76611328125, -1.673126220703125, -1.58013916015625, -1.487152099609375, -1.3941650390625, -1.301177978515625, -1.20819091796875, -1.115203857421875, -1.022216796875, -0.929229736328125, -0.83624267578125, -0.743255615234375, -0.6502685546875, -0.557281494140625, -0.46429443359375, -0.371307373046875, -0.2783203125, -0.185333251953125, -0.09234619140625, 0.000640869140625, 0.0936279296875, 0.186614990234375, 0.27960205078125, 0.372589111328125, 0.465576171875, 0.558563232421875, 0.65155029296875, 0.744537353515625, 0.8375244140625, 0.930511474609375, 1.02349853515625, 1.116485595703125, 1.20947265625, 1.302459716796875, 1.39544677734375, 1.488433837890625, 1.5814208984375, 1.674407958984375, 1.76739501953125, 1.860382080078125, 1.953369140625, 2.046356201171875, 2.13934326171875, 2.232330322265625, 2.3253173828125, 2.418304443359375, 2.51129150390625, 2.604278564453125, 2.697265625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 5.0, 2.0, 4.0, 5.0, 10.0, 11.0, 14.0, 31.0, 27.0, 43.0, 56.0, 87.0, 103.0, 196.0, 276.0, 449.0, 812.0, 1776.0, 3973.0, 10439.0, 31431.0, 105631.0, 305083.0, 368524.0, 150565.0, 44627.0, 14557.0, 5156.0, 2155.0, 1053.0, 520.0, 316.0, 208.0, 119.0, 76.0, 57.0, 50.0, 27.0, 22.0, 22.0, 14.0, 13.0, 9.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.28955078125, -7.9462890625, -7.60302734375, -7.259765625, -6.91650390625, -6.5732421875, -6.22998046875, -5.88671875, -5.54345703125, -5.2001953125, -4.85693359375, -4.513671875, -4.17041015625, -3.8271484375, -3.48388671875, -3.140625, -2.79736328125, -2.4541015625, -2.11083984375, -1.767578125, -1.42431640625, -1.0810546875, -0.73779296875, -0.39453125, -0.05126953125, 0.2919921875, 0.63525390625, 0.978515625, 1.32177734375, 1.6650390625, 2.00830078125, 2.3515625, 2.69482421875, 3.0380859375, 3.38134765625, 3.724609375, 4.06787109375, 4.4111328125, 4.75439453125, 5.09765625, 5.44091796875, 5.7841796875, 6.12744140625, 6.470703125, 6.81396484375, 7.1572265625, 7.50048828125, 7.84375, 8.18701171875, 8.5302734375, 8.87353515625, 9.216796875, 9.56005859375, 9.9033203125, 10.24658203125, 10.58984375, 10.93310546875, 11.2763671875, 11.61962890625, 11.962890625, 12.30615234375, 12.6494140625, 12.99267578125, 13.3359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 6.0, 11.0, 6.0, 7.0, 11.0, 10.0, 12.0, 17.0, 15.0, 19.0, 24.0, 26.0, 27.0, 38.0, 52.0, 33.0, 45.0, 41.0, 40.0, 47.0, 50.0, 31.0, 44.0, 40.0, 34.0, 38.0, 31.0, 35.0, 37.0, 20.0, 25.0, 22.0, 18.0, 17.0, 13.0, 10.0, 12.0, 5.0, 7.0, 7.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.8671875, -8.573486328125, -8.27978515625, -7.986083984375, -7.6923828125, -7.398681640625, -7.10498046875, -6.811279296875, -6.517578125, -6.223876953125, -5.93017578125, -5.636474609375, -5.3427734375, -5.049072265625, -4.75537109375, -4.461669921875, -4.16796875, -3.874267578125, -3.58056640625, -3.286865234375, -2.9931640625, -2.699462890625, -2.40576171875, -2.112060546875, -1.818359375, -1.524658203125, -1.23095703125, -0.937255859375, -0.6435546875, -0.349853515625, -0.05615234375, 0.237548828125, 0.53125, 0.824951171875, 1.11865234375, 1.412353515625, 1.7060546875, 1.999755859375, 2.29345703125, 2.587158203125, 2.880859375, 3.174560546875, 3.46826171875, 3.761962890625, 4.0556640625, 4.349365234375, 4.64306640625, 4.936767578125, 5.23046875, 5.524169921875, 5.81787109375, 6.111572265625, 6.4052734375, 6.698974609375, 6.99267578125, 7.286376953125, 7.580078125, 7.873779296875, 8.16748046875, 8.461181640625, 8.7548828125, 9.048583984375, 9.34228515625, 9.635986328125, 9.9296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 8.0, 3.0, 15.0, 15.0, 18.0, 42.0, 67.0, 161.0, 298.0, 844.0, 3158.0, 18366.0, 153419.0, 651189.0, 192975.0, 22496.0, 3832.0, 954.0, 351.0, 160.0, 71.0, 36.0, 29.0, 16.0, 7.0, 9.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.0625, -8.72119140625, -8.3798828125, -8.03857421875, -7.697265625, -7.35595703125, -7.0146484375, -6.67333984375, -6.33203125, -5.99072265625, -5.6494140625, -5.30810546875, -4.966796875, -4.62548828125, -4.2841796875, -3.94287109375, -3.6015625, -3.26025390625, -2.9189453125, -2.57763671875, -2.236328125, -1.89501953125, -1.5537109375, -1.21240234375, -0.87109375, -0.52978515625, -0.1884765625, 0.15283203125, 0.494140625, 0.83544921875, 1.1767578125, 1.51806640625, 1.859375, 2.20068359375, 2.5419921875, 2.88330078125, 3.224609375, 3.56591796875, 3.9072265625, 4.24853515625, 4.58984375, 4.93115234375, 5.2724609375, 5.61376953125, 5.955078125, 6.29638671875, 6.6376953125, 6.97900390625, 7.3203125, 7.66162109375, 8.0029296875, 8.34423828125, 8.685546875, 9.02685546875, 9.3681640625, 9.70947265625, 10.05078125, 10.39208984375, 10.7333984375, 11.07470703125, 11.416015625, 11.75732421875, 12.0986328125, 12.43994140625, 12.78125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 6.0, 1.0, 2.0, 2.0, 6.0, 5.0, 8.0, 6.0, 13.0, 9.0, 18.0, 10.0, 15.0, 26.0, 23.0, 28.0, 29.0, 42.0, 52.0, 70.0, 62.0, 73.0, 74.0, 51.0, 41.0, 48.0, 61.0, 33.0, 35.0, 23.0, 20.0, 24.0, 14.0, 18.0, 14.0, 8.0, 6.0, 7.0, 9.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0008306503295898438, -0.0008045434951782227, -0.0007784366607666016, -0.0007523298263549805, -0.0007262229919433594, -0.0007001161575317383, -0.0006740093231201172, -0.0006479024887084961, -0.000621795654296875, -0.0005956888198852539, -0.0005695819854736328, -0.0005434751510620117, -0.0005173683166503906, -0.0004912614822387695, -0.00046515464782714844, -0.00043904781341552734, -0.00041294097900390625, -0.00038683414459228516, -0.00036072731018066406, -0.00033462047576904297, -0.0003085136413574219, -0.0002824068069458008, -0.0002562999725341797, -0.0002301931381225586, -0.0002040863037109375, -0.0001779794692993164, -0.0001518726348876953, -0.00012576580047607422, -9.965896606445312e-05, -7.355213165283203e-05, -4.744529724121094e-05, -2.1338462829589844e-05, 4.76837158203125e-06, 3.0875205993652344e-05, 5.698204040527344e-05, 8.308887481689453e-05, 0.00010919570922851562, 0.00013530254364013672, 0.0001614093780517578, 0.0001875162124633789, 0.000213623046875, 0.0002397298812866211, 0.0002658367156982422, 0.0002919435501098633, 0.0003180503845214844, 0.00034415721893310547, 0.00037026405334472656, 0.00039637088775634766, 0.00042247772216796875, 0.00044858455657958984, 0.00047469139099121094, 0.000500798225402832, 0.0005269050598144531, 0.0005530118942260742, 0.0005791187286376953, 0.0006052255630493164, 0.0006313323974609375, 0.0006574392318725586, 0.0006835460662841797, 0.0007096529006958008, 0.0007357597351074219, 0.000761866569519043, 0.0007879734039306641, 0.0008140802383422852, 0.0008401870727539062]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 5.0, 8.0, 10.0, 11.0, 8.0, 29.0, 45.0, 54.0, 57.0, 110.0, 161.0, 299.0, 591.0, 1177.0, 2526.0, 6698.0, 19450.0, 68759.0, 265063.0, 461088.0, 160046.0, 41498.0, 12557.0, 4538.0, 1818.0, 854.0, 416.0, 241.0, 156.0, 88.0, 46.0, 41.0, 33.0, 19.0, 10.0, 10.0, 12.0, 8.0, 2.0, 7.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.15625, -7.91851806640625, -7.6807861328125, -7.44305419921875, -7.205322265625, -6.96759033203125, -6.7298583984375, -6.49212646484375, -6.25439453125, -6.01666259765625, -5.7789306640625, -5.54119873046875, -5.303466796875, -5.06573486328125, -4.8280029296875, -4.59027099609375, -4.3525390625, -4.11480712890625, -3.8770751953125, -3.63934326171875, -3.401611328125, -3.16387939453125, -2.9261474609375, -2.68841552734375, -2.45068359375, -2.21295166015625, -1.9752197265625, -1.73748779296875, -1.499755859375, -1.26202392578125, -1.0242919921875, -0.78656005859375, -0.548828125, -0.31109619140625, -0.0733642578125, 0.16436767578125, 0.402099609375, 0.63983154296875, 0.8775634765625, 1.11529541015625, 1.35302734375, 1.59075927734375, 1.8284912109375, 2.06622314453125, 2.303955078125, 2.54168701171875, 2.7794189453125, 3.01715087890625, 3.2548828125, 3.49261474609375, 3.7303466796875, 3.96807861328125, 4.205810546875, 4.44354248046875, 4.6812744140625, 4.91900634765625, 5.15673828125, 5.39447021484375, 5.6322021484375, 5.86993408203125, 6.107666015625, 6.34539794921875, 6.5831298828125, 6.82086181640625, 7.05859375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 4.0, 3.0, 4.0, 8.0, 18.0, 10.0, 7.0, 21.0, 13.0, 24.0, 24.0, 29.0, 41.0, 34.0, 40.0, 36.0, 54.0, 51.0, 66.0, 41.0, 51.0, 48.0, 49.0, 48.0, 28.0, 43.0, 36.0, 25.0, 24.0, 24.0, 18.0, 14.0, 13.0, 9.0, 8.0, 10.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.490234375, -3.371246337890625, -3.25225830078125, -3.133270263671875, -3.0142822265625, -2.895294189453125, -2.77630615234375, -2.657318115234375, -2.538330078125, -2.419342041015625, -2.30035400390625, -2.181365966796875, -2.0623779296875, -1.943389892578125, -1.82440185546875, -1.705413818359375, -1.58642578125, -1.467437744140625, -1.34844970703125, -1.229461669921875, -1.1104736328125, -0.991485595703125, -0.87249755859375, -0.753509521484375, -0.634521484375, -0.515533447265625, -0.39654541015625, -0.277557373046875, -0.1585693359375, -0.039581298828125, 0.07940673828125, 0.198394775390625, 0.3173828125, 0.436370849609375, 0.55535888671875, 0.674346923828125, 0.7933349609375, 0.912322998046875, 1.03131103515625, 1.150299072265625, 1.269287109375, 1.388275146484375, 1.50726318359375, 1.626251220703125, 1.7452392578125, 1.864227294921875, 1.98321533203125, 2.102203369140625, 2.22119140625, 2.340179443359375, 2.45916748046875, 2.578155517578125, 2.6971435546875, 2.816131591796875, 2.93511962890625, 3.054107666015625, 3.173095703125, 3.292083740234375, 3.41107177734375, 3.530059814453125, 3.6490478515625, 3.768035888671875, 3.88702392578125, 4.006011962890625, 4.125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 4.0, 4.0, 16.0, 22.0, 27.0, 55.0, 57.0, 94.0, 113.0, 132.0, 126.0, 96.0, 72.0, 58.0, 49.0, 21.0, 16.0, 9.0, 15.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.24492645263672, -87.00086975097656, -84.7568130493164, -82.51275634765625, -80.26869201660156, -78.0246353149414, -75.78057861328125, -73.5365219116211, -71.29246520996094, -69.04840850830078, -66.80435180664062, -64.56029510498047, -62.31623458862305, -60.07217788696289, -57.82811737060547, -55.58406066894531, -53.340003967285156, -51.095947265625, -48.851890563964844, -46.60783004760742, -44.363773345947266, -42.11971664428711, -39.87565612792969, -37.63159942626953, -35.387542724609375, -33.14348602294922, -30.89942741394043, -28.65536880493164, -26.411312103271484, -24.167255401611328, -21.92319679260254, -19.67913818359375, -17.435077667236328, -15.191020011901855, -12.946962356567383, -10.70290470123291, -8.458847045898438, -6.214789390563965, -3.970731735229492, -1.7266740798950195, 0.5173835754394531, 2.761441230773926, 5.005498886108398, 7.249556541442871, 9.493614196777344, 11.737671852111816, 13.981729507446289, 16.225788116455078, 18.469844818115234, 20.71390151977539, 22.95796012878418, 25.20201873779297, 27.446075439453125, 29.69013214111328, 31.93419075012207, 34.17824935913086, 36.422306060791016, 38.66636276245117, 40.910423278808594, 43.15447998046875, 45.398536682128906, 47.64259338378906, 49.88665008544922, 52.13071060180664, 54.3747673034668]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 9.0, 3.0, 18.0, 12.0, 13.0, 21.0, 20.0, 22.0, 35.0, 34.0, 54.0, 53.0, 61.0, 54.0, 75.0, 70.0, 70.0, 60.0, 49.0, 43.0, 42.0, 36.0, 29.0, 27.0, 24.0, 16.0, 9.0, 14.0, 6.0, 8.0, 3.0, 8.0, 2.0, 0.0, 3.0, 3.0], "bins": [-111.98564147949219, -109.38790130615234, -106.79015350341797, -104.19241333007812, -101.59466552734375, -98.9969253540039, -96.39917755126953, -93.80143737792969, -91.20368957519531, -88.60594940185547, -86.0082015991211, -83.41046142578125, -80.81271362304688, -78.21497344970703, -75.61722564697266, -73.01948547363281, -70.42173767089844, -67.8239974975586, -65.22624969482422, -62.62850570678711, -60.03076171875, -57.43301773071289, -54.83527374267578, -52.23753356933594, -49.639793395996094, -47.042049407958984, -44.444305419921875, -41.846561431884766, -39.248817443847656, -36.65107345581055, -34.05332946777344, -31.45558738708496, -28.85784149169922, -26.26009750366211, -23.662353515625, -21.06460952758789, -18.46686553955078, -15.869122505187988, -13.271379470825195, -10.673635482788086, -8.075891494750977, -5.478147506713867, -2.880403995513916, -0.28266048431396484, 2.3150835037231445, 4.912827491760254, 7.510570526123047, 10.108314514160156, 12.706058502197266, 15.303802490234375, 17.901546478271484, 20.499290466308594, 23.097034454345703, 25.694778442382812, 28.29252052307129, 30.8902645111084, 33.488006591796875, 36.085750579833984, 38.683494567871094, 41.2812385559082, 43.87898254394531, 46.47672653198242, 49.07447052001953, 51.672210693359375, 54.26995849609375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 10.0, 7.0, 19.0, 19.0, 23.0, 51.0, 54.0, 105.0, 181.0, 321.0, 668.0, 1886.0, 7921.0, 73054.0, 4006669.0, 90985.0, 9103.0, 1994.0, 620.0, 249.0, 145.0, 79.0, 30.0, 23.0, 20.0, 14.0, 7.0, 7.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.375, -40.21044921875, -39.0458984375, -37.88134765625, -36.716796875, -35.55224609375, -34.3876953125, -33.22314453125, -32.05859375, -30.89404296875, -29.7294921875, -28.56494140625, -27.400390625, -26.23583984375, -25.0712890625, -23.90673828125, -22.7421875, -21.57763671875, -20.4130859375, -19.24853515625, -18.083984375, -16.91943359375, -15.7548828125, -14.59033203125, -13.42578125, -12.26123046875, -11.0966796875, -9.93212890625, -8.767578125, -7.60302734375, -6.4384765625, -5.27392578125, -4.109375, -2.94482421875, -1.7802734375, -0.61572265625, 0.548828125, 1.71337890625, 2.8779296875, 4.04248046875, 5.20703125, 6.37158203125, 7.5361328125, 8.70068359375, 9.865234375, 11.02978515625, 12.1943359375, 13.35888671875, 14.5234375, 15.68798828125, 16.8525390625, 18.01708984375, 19.181640625, 20.34619140625, 21.5107421875, 22.67529296875, 23.83984375, 25.00439453125, 26.1689453125, 27.33349609375, 28.498046875, 29.66259765625, 30.8271484375, 31.99169921875, 33.15625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 9.0, 10.0, 15.0, 18.0, 30.0, 37.0, 53.0, 72.0, 59.0, 73.0, 93.0, 91.0, 90.0, 73.0, 70.0, 54.0, 49.0, 35.0, 24.0, 12.0, 12.0, 6.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.48828125, -4.37396240234375, -4.2596435546875, -4.14532470703125, -4.031005859375, -3.91668701171875, -3.8023681640625, -3.68804931640625, -3.57373046875, -3.45941162109375, -3.3450927734375, -3.23077392578125, -3.116455078125, -3.00213623046875, -2.8878173828125, -2.77349853515625, -2.6591796875, -2.54486083984375, -2.4305419921875, -2.31622314453125, -2.201904296875, -2.08758544921875, -1.9732666015625, -1.85894775390625, -1.74462890625, -1.63031005859375, -1.5159912109375, -1.40167236328125, -1.287353515625, -1.17303466796875, -1.0587158203125, -0.94439697265625, -0.830078125, -0.71575927734375, -0.6014404296875, -0.48712158203125, -0.372802734375, -0.25848388671875, -0.1441650390625, -0.02984619140625, 0.08447265625, 0.19879150390625, 0.3131103515625, 0.42742919921875, 0.541748046875, 0.65606689453125, 0.7703857421875, 0.88470458984375, 0.9990234375, 1.11334228515625, 1.2276611328125, 1.34197998046875, 1.456298828125, 1.57061767578125, 1.6849365234375, 1.79925537109375, 1.91357421875, 2.02789306640625, 2.1422119140625, 2.25653076171875, 2.370849609375, 2.48516845703125, 2.5994873046875, 2.71380615234375, 2.828125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 9.0, 19.0, 26.0, 21.0, 38.0, 65.0, 95.0, 135.0, 253.0, 570.0, 1373.0, 4479.0, 20799.0, 261151.0, 3796117.0, 92048.0, 11907.0, 2865.0, 1135.0, 513.0, 263.0, 135.0, 93.0, 46.0, 47.0, 19.0, 19.0, 12.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.28125, -33.337890625, -32.39453125, -31.451171875, -30.5078125, -29.564453125, -28.62109375, -27.677734375, -26.734375, -25.791015625, -24.84765625, -23.904296875, -22.9609375, -22.017578125, -21.07421875, -20.130859375, -19.1875, -18.244140625, -17.30078125, -16.357421875, -15.4140625, -14.470703125, -13.52734375, -12.583984375, -11.640625, -10.697265625, -9.75390625, -8.810546875, -7.8671875, -6.923828125, -5.98046875, -5.037109375, -4.09375, -3.150390625, -2.20703125, -1.263671875, -0.3203125, 0.623046875, 1.56640625, 2.509765625, 3.453125, 4.396484375, 5.33984375, 6.283203125, 7.2265625, 8.169921875, 9.11328125, 10.056640625, 11.0, 11.943359375, 12.88671875, 13.830078125, 14.7734375, 15.716796875, 16.66015625, 17.603515625, 18.546875, 19.490234375, 20.43359375, 21.376953125, 22.3203125, 23.263671875, 24.20703125, 25.150390625, 26.09375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 6.0, 5.0, 8.0, 11.0, 9.0, 13.0, 22.0, 45.0, 53.0, 87.0, 152.0, 317.0, 884.0, 1445.0, 492.0, 194.0, 118.0, 57.0, 44.0, 36.0, 16.0, 19.0, 11.0, 10.0, 4.0, 1.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.953125, -4.78924560546875, -4.6253662109375, -4.46148681640625, -4.297607421875, -4.13372802734375, -3.9698486328125, -3.80596923828125, -3.64208984375, -3.47821044921875, -3.3143310546875, -3.15045166015625, -2.986572265625, -2.82269287109375, -2.6588134765625, -2.49493408203125, -2.3310546875, -2.16717529296875, -2.0032958984375, -1.83941650390625, -1.675537109375, -1.51165771484375, -1.3477783203125, -1.18389892578125, -1.02001953125, -0.85614013671875, -0.6922607421875, -0.52838134765625, -0.364501953125, -0.20062255859375, -0.0367431640625, 0.12713623046875, 0.291015625, 0.45489501953125, 0.6187744140625, 0.78265380859375, 0.946533203125, 1.11041259765625, 1.2742919921875, 1.43817138671875, 1.60205078125, 1.76593017578125, 1.9298095703125, 2.09368896484375, 2.257568359375, 2.42144775390625, 2.5853271484375, 2.74920654296875, 2.9130859375, 3.07696533203125, 3.2408447265625, 3.40472412109375, 3.568603515625, 3.73248291015625, 3.8963623046875, 4.06024169921875, 4.22412109375, 4.38800048828125, 4.5518798828125, 4.71575927734375, 4.879638671875, 5.04351806640625, 5.2073974609375, 5.37127685546875, 5.53515625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 20.0, 79.0, 250.0, 420.0, 171.0, 54.0, 17.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.04430389404297, -35.18310546875, -32.32190704345703, -29.460708618164062, -26.599510192871094, -23.738311767578125, -20.877113342285156, -18.015914916992188, -15.154716491699219, -12.29351806640625, -9.432319641113281, -6.5711212158203125, -3.7099227905273438, -0.848724365234375, 2.0124740600585938, 4.8736724853515625, 7.734870910644531, 10.5960693359375, 13.457267761230469, 16.318466186523438, 19.179664611816406, 22.040863037109375, 24.902061462402344, 27.763259887695312, 30.62445831298828, 33.48565673828125, 36.34685516357422, 39.20805358886719, 42.069252014160156, 44.930450439453125, 47.791648864746094, 50.65284729003906, 53.5140380859375, 56.37523651123047, 59.23643493652344, 62.097633361816406, 64.95883178710938, 67.82003021240234, 70.68122863769531, 73.54242706298828, 76.40362548828125, 79.26482391357422, 82.12602233886719, 84.98722076416016, 87.84841918945312, 90.7096176147461, 93.57081604003906, 96.43201446533203, 99.293212890625, 102.15441131591797, 105.01560974121094, 107.8768081665039, 110.73800659179688, 113.59920501708984, 116.46040344238281, 119.32160186767578, 122.18280029296875, 125.04399871826172, 127.90519714355469, 130.76638793945312, 133.62759399414062, 136.48880004882812, 139.34999084472656, 142.211181640625, 145.0723876953125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 0.0, 9.0, 8.0, 5.0, 10.0, 13.0, 27.0, 25.0, 26.0, 36.0, 42.0, 39.0, 39.0, 73.0, 55.0, 62.0, 78.0, 73.0, 67.0, 54.0, 52.0, 39.0, 38.0, 33.0, 28.0, 20.0, 16.0, 9.0, 9.0, 6.0, 7.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.02696418762207, -14.356404304504395, -13.685843467712402, -13.015283584594727, -12.344722747802734, -11.674162864685059, -11.003602981567383, -10.33304214477539, -9.662482261657715, -8.991922378540039, -8.321361541748047, -7.650801658630371, -6.980241298675537, -6.309680938720703, -5.639121055603027, -4.968560695648193, -4.298000335693359, -3.6274399757385254, -2.9568798542022705, -2.2863197326660156, -1.6157593727111816, -0.9451990127563477, -0.2746391296386719, 0.3959212303161621, 1.066481590270996, 1.7370418310165405, 2.407602071762085, 3.07816219329834, 3.748722553253174, 4.419282913208008, 5.089842796325684, 5.760403156280518, 6.430961608886719, 7.101521968841553, 7.772082328796387, 8.442642211914062, 9.113203048706055, 9.78376293182373, 10.454322814941406, 11.124883651733398, 11.795443534851074, 12.46600341796875, 13.136564254760742, 13.807124137878418, 14.477684020996094, 15.148244857788086, 15.818804740905762, 16.489364624023438, 17.15992546081543, 17.830486297607422, 18.50104522705078, 19.171606063842773, 19.842166900634766, 20.512725830078125, 21.183286666870117, 21.85384750366211, 22.52440643310547, 23.19496726989746, 23.86552619934082, 24.536087036132812, 25.206647872924805, 25.877208709716797, 26.547767639160156, 27.21832847595215, 27.88888931274414]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 7.0, 7.0, 3.0, 11.0, 7.0, 12.0, 27.0, 29.0, 39.0, 46.0, 58.0, 114.0, 140.0, 229.0, 371.0, 694.0, 1288.0, 2707.0, 6335.0, 18966.0, 72624.0, 289164.0, 446956.0, 152175.0, 37231.0, 10946.0, 4162.0, 1890.0, 888.0, 533.0, 325.0, 188.0, 112.0, 78.0, 36.0, 45.0, 26.0, 22.0, 8.0, 13.0, 13.0, 5.0, 7.0, 3.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0], "bins": [-14.875, -14.4407958984375, -14.006591796875, -13.5723876953125, -13.13818359375, -12.7039794921875, -12.269775390625, -11.8355712890625, -11.4013671875, -10.9671630859375, -10.532958984375, -10.0987548828125, -9.66455078125, -9.2303466796875, -8.796142578125, -8.3619384765625, -7.927734375, -7.4935302734375, -7.059326171875, -6.6251220703125, -6.19091796875, -5.7567138671875, -5.322509765625, -4.8883056640625, -4.4541015625, -4.0198974609375, -3.585693359375, -3.1514892578125, -2.71728515625, -2.2830810546875, -1.848876953125, -1.4146728515625, -0.98046875, -0.5462646484375, -0.112060546875, 0.3221435546875, 0.75634765625, 1.1905517578125, 1.624755859375, 2.0589599609375, 2.4931640625, 2.9273681640625, 3.361572265625, 3.7957763671875, 4.22998046875, 4.6641845703125, 5.098388671875, 5.5325927734375, 5.966796875, 6.4010009765625, 6.835205078125, 7.2694091796875, 7.70361328125, 8.1378173828125, 8.572021484375, 9.0062255859375, 9.4404296875, 9.8746337890625, 10.308837890625, 10.7430419921875, 11.17724609375, 11.6114501953125, 12.045654296875, 12.4798583984375, 12.9140625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 10.0, 10.0, 16.0, 21.0, 24.0, 31.0, 49.0, 51.0, 61.0, 65.0, 78.0, 85.0, 68.0, 71.0, 61.0, 54.0, 41.0, 53.0, 39.0, 27.0, 20.0, 23.0, 12.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.568359375, -3.469635009765625, -3.37091064453125, -3.272186279296875, -3.1734619140625, -3.074737548828125, -2.97601318359375, -2.877288818359375, -2.778564453125, -2.679840087890625, -2.58111572265625, -2.482391357421875, -2.3836669921875, -2.284942626953125, -2.18621826171875, -2.087493896484375, -1.98876953125, -1.890045166015625, -1.79132080078125, -1.692596435546875, -1.5938720703125, -1.495147705078125, -1.39642333984375, -1.297698974609375, -1.198974609375, -1.100250244140625, -1.00152587890625, -0.902801513671875, -0.8040771484375, -0.705352783203125, -0.60662841796875, -0.507904052734375, -0.4091796875, -0.310455322265625, -0.21173095703125, -0.113006591796875, -0.0142822265625, 0.084442138671875, 0.18316650390625, 0.281890869140625, 0.380615234375, 0.479339599609375, 0.57806396484375, 0.676788330078125, 0.7755126953125, 0.874237060546875, 0.97296142578125, 1.071685791015625, 1.17041015625, 1.269134521484375, 1.36785888671875, 1.466583251953125, 1.5653076171875, 1.664031982421875, 1.76275634765625, 1.861480712890625, 1.960205078125, 2.058929443359375, 2.15765380859375, 2.256378173828125, 2.3551025390625, 2.453826904296875, 2.55255126953125, 2.651275634765625, 2.75]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 3.0, 8.0, 11.0, 12.0, 14.0, 24.0, 30.0, 39.0, 55.0, 116.0, 185.0, 323.0, 601.0, 1299.0, 3195.0, 11056.0, 58278.0, 371118.0, 490866.0, 88745.0, 15452.0, 4010.0, 1498.0, 716.0, 326.0, 218.0, 112.0, 70.0, 41.0, 40.0, 19.0, 17.0, 8.0, 8.0, 9.0, 11.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.140625, -17.57568359375, -17.0107421875, -16.44580078125, -15.880859375, -15.31591796875, -14.7509765625, -14.18603515625, -13.62109375, -13.05615234375, -12.4912109375, -11.92626953125, -11.361328125, -10.79638671875, -10.2314453125, -9.66650390625, -9.1015625, -8.53662109375, -7.9716796875, -7.40673828125, -6.841796875, -6.27685546875, -5.7119140625, -5.14697265625, -4.58203125, -4.01708984375, -3.4521484375, -2.88720703125, -2.322265625, -1.75732421875, -1.1923828125, -0.62744140625, -0.0625, 0.50244140625, 1.0673828125, 1.63232421875, 2.197265625, 2.76220703125, 3.3271484375, 3.89208984375, 4.45703125, 5.02197265625, 5.5869140625, 6.15185546875, 6.716796875, 7.28173828125, 7.8466796875, 8.41162109375, 8.9765625, 9.54150390625, 10.1064453125, 10.67138671875, 11.236328125, 11.80126953125, 12.3662109375, 12.93115234375, 13.49609375, 14.06103515625, 14.6259765625, 15.19091796875, 15.755859375, 16.32080078125, 16.8857421875, 17.45068359375, 18.015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 5.0, 7.0, 3.0, 8.0, 4.0, 6.0, 13.0, 15.0, 22.0, 35.0, 20.0, 38.0, 39.0, 37.0, 37.0, 55.0, 50.0, 57.0, 46.0, 54.0, 66.0, 51.0, 29.0, 39.0, 43.0, 37.0, 32.0, 23.0, 24.0, 25.0, 14.0, 13.0, 11.0, 10.0, 8.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.7421875, -12.3714599609375, -12.000732421875, -11.6300048828125, -11.25927734375, -10.8885498046875, -10.517822265625, -10.1470947265625, -9.7763671875, -9.4056396484375, -9.034912109375, -8.6641845703125, -8.29345703125, -7.9227294921875, -7.552001953125, -7.1812744140625, -6.810546875, -6.4398193359375, -6.069091796875, -5.6983642578125, -5.32763671875, -4.9569091796875, -4.586181640625, -4.2154541015625, -3.8447265625, -3.4739990234375, -3.103271484375, -2.7325439453125, -2.36181640625, -1.9910888671875, -1.620361328125, -1.2496337890625, -0.87890625, -0.5081787109375, -0.137451171875, 0.2332763671875, 0.60400390625, 0.9747314453125, 1.345458984375, 1.7161865234375, 2.0869140625, 2.4576416015625, 2.828369140625, 3.1990966796875, 3.56982421875, 3.9405517578125, 4.311279296875, 4.6820068359375, 5.052734375, 5.4234619140625, 5.794189453125, 6.1649169921875, 6.53564453125, 6.9063720703125, 7.277099609375, 7.6478271484375, 8.0185546875, 8.3892822265625, 8.760009765625, 9.1307373046875, 9.50146484375, 9.8721923828125, 10.242919921875, 10.6136474609375, 10.984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 6.0, 10.0, 16.0, 18.0, 34.0, 67.0, 110.0, 197.0, 437.0, 1191.0, 4167.0, 17999.0, 126777.0, 645932.0, 215863.0, 27332.0, 5618.0, 1648.0, 594.0, 246.0, 102.0, 72.0, 26.0, 33.0, 14.0, 13.0, 9.0, 7.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.765625, -8.4593505859375, -8.153076171875, -7.8468017578125, -7.54052734375, -7.2342529296875, -6.927978515625, -6.6217041015625, -6.3154296875, -6.0091552734375, -5.702880859375, -5.3966064453125, -5.09033203125, -4.7840576171875, -4.477783203125, -4.1715087890625, -3.865234375, -3.5589599609375, -3.252685546875, -2.9464111328125, -2.64013671875, -2.3338623046875, -2.027587890625, -1.7213134765625, -1.4150390625, -1.1087646484375, -0.802490234375, -0.4962158203125, -0.18994140625, 0.1163330078125, 0.422607421875, 0.7288818359375, 1.03515625, 1.3414306640625, 1.647705078125, 1.9539794921875, 2.26025390625, 2.5665283203125, 2.872802734375, 3.1790771484375, 3.4853515625, 3.7916259765625, 4.097900390625, 4.4041748046875, 4.71044921875, 5.0167236328125, 5.322998046875, 5.6292724609375, 5.935546875, 6.2418212890625, 6.548095703125, 6.8543701171875, 7.16064453125, 7.4669189453125, 7.773193359375, 8.0794677734375, 8.3857421875, 8.6920166015625, 8.998291015625, 9.3045654296875, 9.61083984375, 9.9171142578125, 10.223388671875, 10.5296630859375, 10.8359375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 8.0, 4.0, 8.0, 7.0, 17.0, 13.0, 27.0, 39.0, 43.0, 56.0, 63.0, 91.0, 90.0, 107.0, 101.0, 86.0, 67.0, 41.0, 26.0, 30.0, 19.0, 12.0, 15.0, 6.0, 7.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010395050048828125, -0.0010012388229370117, -0.0009629726409912109, -0.0009247064590454102, -0.0008864402770996094, -0.0008481740951538086, -0.0008099079132080078, -0.000771641731262207, -0.0007333755493164062, -0.0006951093673706055, -0.0006568431854248047, -0.0006185770034790039, -0.0005803108215332031, -0.0005420446395874023, -0.0005037784576416016, -0.0004655122756958008, -0.00042724609375, -0.0003889799118041992, -0.00035071372985839844, -0.00031244754791259766, -0.0002741813659667969, -0.0002359151840209961, -0.0001976490020751953, -0.00015938282012939453, -0.00012111663818359375, -8.285045623779297e-05, -4.458427429199219e-05, -6.318092346191406e-06, 3.1948089599609375e-05, 7.021427154541016e-05, 0.00010848045349121094, 0.00014674663543701172, 0.0001850128173828125, 0.00022327899932861328, 0.00026154518127441406, 0.00029981136322021484, 0.0003380775451660156, 0.0003763437271118164, 0.0004146099090576172, 0.00045287609100341797, 0.0004911422729492188, 0.0005294084548950195, 0.0005676746368408203, 0.0006059408187866211, 0.0006442070007324219, 0.0006824731826782227, 0.0007207393646240234, 0.0007590055465698242, 0.000797271728515625, 0.0008355379104614258, 0.0008738040924072266, 0.0009120702743530273, 0.0009503364562988281, 0.000988602638244629, 0.0010268688201904297, 0.0010651350021362305, 0.0011034011840820312, 0.001141667366027832, 0.0011799335479736328, 0.0012181997299194336, 0.0012564659118652344, 0.0012947320938110352, 0.001332998275756836, 0.0013712644577026367, 0.0014095306396484375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 2.0, 4.0, 6.0, 16.0, 18.0, 37.0, 47.0, 116.0, 188.0, 465.0, 1181.0, 4350.0, 30477.0, 430308.0, 534977.0, 38944.0, 5151.0, 1290.0, 485.0, 229.0, 105.0, 71.0, 32.0, 24.0, 5.0, 4.0, 10.0, 6.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4921875, -13.083984375, -12.67578125, -12.267578125, -11.859375, -11.451171875, -11.04296875, -10.634765625, -10.2265625, -9.818359375, -9.41015625, -9.001953125, -8.59375, -8.185546875, -7.77734375, -7.369140625, -6.9609375, -6.552734375, -6.14453125, -5.736328125, -5.328125, -4.919921875, -4.51171875, -4.103515625, -3.6953125, -3.287109375, -2.87890625, -2.470703125, -2.0625, -1.654296875, -1.24609375, -0.837890625, -0.4296875, -0.021484375, 0.38671875, 0.794921875, 1.203125, 1.611328125, 2.01953125, 2.427734375, 2.8359375, 3.244140625, 3.65234375, 4.060546875, 4.46875, 4.876953125, 5.28515625, 5.693359375, 6.1015625, 6.509765625, 6.91796875, 7.326171875, 7.734375, 8.142578125, 8.55078125, 8.958984375, 9.3671875, 9.775390625, 10.18359375, 10.591796875, 11.0, 11.408203125, 11.81640625, 12.224609375, 12.6328125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 7.0, 5.0, 5.0, 18.0, 23.0, 33.0, 46.0, 56.0, 67.0, 73.0, 99.0, 101.0, 84.0, 84.0, 66.0, 62.0, 52.0, 26.0, 24.0, 14.0, 20.0, 7.0, 5.0, 5.0, 8.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.4140625, -5.21759033203125, -5.0211181640625, -4.82464599609375, -4.628173828125, -4.43170166015625, -4.2352294921875, -4.03875732421875, -3.84228515625, -3.64581298828125, -3.4493408203125, -3.25286865234375, -3.056396484375, -2.85992431640625, -2.6634521484375, -2.46697998046875, -2.2705078125, -2.07403564453125, -1.8775634765625, -1.68109130859375, -1.484619140625, -1.28814697265625, -1.0916748046875, -0.89520263671875, -0.69873046875, -0.50225830078125, -0.3057861328125, -0.10931396484375, 0.087158203125, 0.28363037109375, 0.4801025390625, 0.67657470703125, 0.873046875, 1.06951904296875, 1.2659912109375, 1.46246337890625, 1.658935546875, 1.85540771484375, 2.0518798828125, 2.24835205078125, 2.44482421875, 2.64129638671875, 2.8377685546875, 3.03424072265625, 3.230712890625, 3.42718505859375, 3.6236572265625, 3.82012939453125, 4.0166015625, 4.21307373046875, 4.4095458984375, 4.60601806640625, 4.802490234375, 4.99896240234375, 5.1954345703125, 5.39190673828125, 5.58837890625, 5.78485107421875, 5.9813232421875, 6.17779541015625, 6.374267578125, 6.57073974609375, 6.7672119140625, 6.96368408203125, 7.16015625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 13.0, 48.0, 184.0, 400.0, 256.0, 76.0, 23.0, 9.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.12338256835938, -157.109130859375, -149.09487915039062, -141.08062744140625, -133.06637573242188, -125.05211639404297, -117.03785705566406, -109.02360534667969, -101.00935363769531, -92.99510192871094, -84.98085021972656, -76.96659088134766, -68.95233917236328, -60.938087463378906, -52.923831939697266, -44.909576416015625, -36.89532470703125, -28.881071090698242, -20.866817474365234, -12.852563858032227, -4.838310241699219, 3.1759414672851562, 11.190196990966797, 19.204452514648438, 27.218704223632812, 35.23295593261719, 43.24721145629883, 51.26146697998047, 59.275718688964844, 67.28997039794922, 75.30422973632812, 83.3184814453125, 91.332763671875, 99.34701538085938, 107.36126708984375, 115.37552642822266, 123.38977813720703, 131.40402221679688, 139.4182891845703, 147.4325408935547, 155.44679260253906, 163.46104431152344, 171.4752960205078, 179.4895477294922, 187.50381469726562, 195.51806640625, 203.53231811523438, 211.54656982421875, 219.56082153320312, 227.5750732421875, 235.58932495117188, 243.60357666015625, 251.61782836914062, 259.632080078125, 267.6463317871094, 275.66058349609375, 283.67486572265625, 291.6891174316406, 299.703369140625, 307.7176208496094, 315.73187255859375, 323.7461242675781, 331.7603759765625, 339.774658203125, 347.78887939453125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 7.0, 5.0, 17.0, 10.0, 16.0, 7.0, 15.0, 22.0, 17.0, 28.0, 32.0, 34.0, 38.0, 37.0, 52.0, 46.0, 50.0, 45.0, 57.0, 49.0, 42.0, 51.0, 36.0, 47.0, 44.0, 28.0, 25.0, 19.0, 21.0, 16.0, 16.0, 14.0, 12.0, 7.0, 10.0, 9.0, 1.0, 2.0, 4.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-66.31913757324219, -64.38018798828125, -62.44123840332031, -60.502288818359375, -58.56333923339844, -56.6243896484375, -54.68544006347656, -52.746490478515625, -50.80754089355469, -48.86859130859375, -46.92964172363281, -44.990692138671875, -43.05174255371094, -41.11279296875, -39.17384338378906, -37.234893798828125, -35.29594802856445, -33.356998443603516, -31.418048858642578, -29.47909927368164, -27.540149688720703, -25.601200103759766, -23.66225242614746, -21.723302841186523, -19.784353256225586, -17.84540367126465, -15.906454086303711, -13.96750545501709, -12.028555870056152, -10.089606285095215, -8.150657653808594, -6.211708068847656, -4.272762298583984, -2.333812952041626, -0.3948636054992676, 1.5440855026245117, 3.483035087585449, 5.421984672546387, 7.360933303833008, 9.299882888793945, 11.238832473754883, 13.17778205871582, 15.116731643676758, 17.055679321289062, 18.99462890625, 20.933578491210938, 22.872528076171875, 24.811477661132812, 26.75042724609375, 28.689376831054688, 30.628326416015625, 32.56727600097656, 34.5062255859375, 36.44517517089844, 38.384124755859375, 40.32307434082031, 42.26202392578125, 44.20097351074219, 46.139923095703125, 48.07887268066406, 50.017822265625, 51.95677185058594, 53.895721435546875, 55.83467102050781, 57.773616790771484]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 9.0, 4.0, 6.0, 9.0, 12.0, 14.0, 21.0, 17.0, 27.0, 39.0, 43.0, 64.0, 87.0, 122.0, 142.0, 248.0, 375.0, 648.0, 1261.0, 2689.0, 6780.0, 22266.0, 128284.0, 3675742.0, 303522.0, 35211.0, 9738.0, 3599.0, 1588.0, 710.0, 418.0, 190.0, 132.0, 91.0, 46.0, 42.0, 21.0, 22.0, 8.0, 8.0, 8.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.203125, -22.533447265625, -21.86376953125, -21.194091796875, -20.5244140625, -19.854736328125, -19.18505859375, -18.515380859375, -17.845703125, -17.176025390625, -16.50634765625, -15.836669921875, -15.1669921875, -14.497314453125, -13.82763671875, -13.157958984375, -12.48828125, -11.818603515625, -11.14892578125, -10.479248046875, -9.8095703125, -9.139892578125, -8.47021484375, -7.800537109375, -7.130859375, -6.461181640625, -5.79150390625, -5.121826171875, -4.4521484375, -3.782470703125, -3.11279296875, -2.443115234375, -1.7734375, -1.103759765625, -0.43408203125, 0.235595703125, 0.9052734375, 1.574951171875, 2.24462890625, 2.914306640625, 3.583984375, 4.253662109375, 4.92333984375, 5.593017578125, 6.2626953125, 6.932373046875, 7.60205078125, 8.271728515625, 8.94140625, 9.611083984375, 10.28076171875, 10.950439453125, 11.6201171875, 12.289794921875, 12.95947265625, 13.629150390625, 14.298828125, 14.968505859375, 15.63818359375, 16.307861328125, 16.9775390625, 17.647216796875, 18.31689453125, 18.986572265625, 19.65625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 11.0, 14.0, 13.0, 12.0, 23.0, 24.0, 38.0, 35.0, 38.0, 57.0, 56.0, 62.0, 67.0, 82.0, 67.0, 67.0, 48.0, 60.0, 38.0, 48.0, 38.0, 19.0, 17.0, 13.0, 14.0, 12.0, 8.0, 6.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.021484375, -2.92877197265625, -2.8360595703125, -2.74334716796875, -2.650634765625, -2.55792236328125, -2.4652099609375, -2.37249755859375, -2.27978515625, -2.18707275390625, -2.0943603515625, -2.00164794921875, -1.908935546875, -1.81622314453125, -1.7235107421875, -1.63079833984375, -1.5380859375, -1.44537353515625, -1.3526611328125, -1.25994873046875, -1.167236328125, -1.07452392578125, -0.9818115234375, -0.88909912109375, -0.79638671875, -0.70367431640625, -0.6109619140625, -0.51824951171875, -0.425537109375, -0.33282470703125, -0.2401123046875, -0.14739990234375, -0.0546875, 0.03802490234375, 0.1307373046875, 0.22344970703125, 0.316162109375, 0.40887451171875, 0.5015869140625, 0.59429931640625, 0.68701171875, 0.77972412109375, 0.8724365234375, 0.96514892578125, 1.057861328125, 1.15057373046875, 1.2432861328125, 1.33599853515625, 1.4287109375, 1.52142333984375, 1.6141357421875, 1.70684814453125, 1.799560546875, 1.89227294921875, 1.9849853515625, 2.07769775390625, 2.17041015625, 2.26312255859375, 2.3558349609375, 2.44854736328125, 2.541259765625, 2.63397216796875, 2.7266845703125, 2.81939697265625, 2.912109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 10.0, 17.0, 21.0, 26.0, 51.0, 79.0, 151.0, 260.0, 544.0, 1201.0, 4048.0, 51707.0, 4067581.0, 62413.0, 4071.0, 1151.0, 444.0, 207.0, 118.0, 71.0, 43.0, 25.0, 12.0, 14.0, 3.0, 9.0, 0.0, 4.0, 2.0], "bins": [-83.5625, -81.80419921875, -80.0458984375, -78.28759765625, -76.529296875, -74.77099609375, -73.0126953125, -71.25439453125, -69.49609375, -67.73779296875, -65.9794921875, -64.22119140625, -62.462890625, -60.70458984375, -58.9462890625, -57.18798828125, -55.4296875, -53.67138671875, -51.9130859375, -50.15478515625, -48.396484375, -46.63818359375, -44.8798828125, -43.12158203125, -41.36328125, -39.60498046875, -37.8466796875, -36.08837890625, -34.330078125, -32.57177734375, -30.8134765625, -29.05517578125, -27.296875, -25.53857421875, -23.7802734375, -22.02197265625, -20.263671875, -18.50537109375, -16.7470703125, -14.98876953125, -13.23046875, -11.47216796875, -9.7138671875, -7.95556640625, -6.197265625, -4.43896484375, -2.6806640625, -0.92236328125, 0.8359375, 2.59423828125, 4.3525390625, 6.11083984375, 7.869140625, 9.62744140625, 11.3857421875, 13.14404296875, 14.90234375, 16.66064453125, 18.4189453125, 20.17724609375, 21.935546875, 23.69384765625, 25.4521484375, 27.21044921875, 28.96875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 5.0, 8.0, 16.0, 28.0, 51.0, 137.0, 396.0, 1584.0, 1302.0, 307.0, 122.0, 50.0, 32.0, 17.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-20.515625, -20.11285400390625, -19.7100830078125, -19.30731201171875, -18.904541015625, -18.50177001953125, -18.0989990234375, -17.69622802734375, -17.29345703125, -16.89068603515625, -16.4879150390625, -16.08514404296875, -15.682373046875, -15.27960205078125, -14.8768310546875, -14.47406005859375, -14.0712890625, -13.66851806640625, -13.2657470703125, -12.86297607421875, -12.460205078125, -12.05743408203125, -11.6546630859375, -11.25189208984375, -10.84912109375, -10.44635009765625, -10.0435791015625, -9.64080810546875, -9.238037109375, -8.83526611328125, -8.4324951171875, -8.02972412109375, -7.626953125, -7.22418212890625, -6.8214111328125, -6.41864013671875, -6.015869140625, -5.61309814453125, -5.2103271484375, -4.80755615234375, -4.40478515625, -4.00201416015625, -3.5992431640625, -3.19647216796875, -2.793701171875, -2.39093017578125, -1.9881591796875, -1.58538818359375, -1.1826171875, -0.77984619140625, -0.3770751953125, 0.02569580078125, 0.428466796875, 0.83123779296875, 1.2340087890625, 1.63677978515625, 2.03955078125, 2.44232177734375, 2.8450927734375, 3.24786376953125, 3.650634765625, 4.05340576171875, 4.4561767578125, 4.85894775390625, 5.26171875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 9.0, 43.0, 210.0, 443.0, 235.0, 48.0, 10.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.90866088867188, -76.64916229248047, -71.38965606689453, -66.13015747070312, -60.87065505981445, -55.61115264892578, -50.351654052734375, -45.0921516418457, -39.83264923095703, -34.57314682006836, -29.31364631652832, -24.05414581298828, -18.79464340209961, -13.535140991210938, -8.275640487670898, -3.0161399841308594, 2.2433624267578125, 7.502863883972168, 12.762365341186523, 18.021865844726562, 23.281368255615234, 28.540870666503906, 33.80036926269531, 39.059871673583984, 44.319374084472656, 49.57887649536133, 54.83837890625, 60.097877502441406, 65.35737609863281, 70.61688232421875, 75.87638092041016, 81.13587951660156, 86.3953857421875, 91.6548843383789, 96.91439056396484, 102.17388916015625, 107.43339538574219, 112.6928939819336, 117.952392578125, 123.21189880371094, 128.47140502929688, 133.7309112548828, 138.9904022216797, 144.24990844726562, 149.50941467285156, 154.7689208984375, 160.02841186523438, 165.2879180908203, 170.5474090576172, 175.80691528320312, 181.06640625, 186.32591247558594, 191.58541870117188, 196.84490966796875, 202.1044158935547, 207.36392211914062, 212.6234130859375, 217.88291931152344, 223.1424102783203, 228.40191650390625, 233.6614227294922, 238.92092895507812, 244.180419921875, 249.43992614746094, 254.69943237304688]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 12.0, 15.0, 27.0, 39.0, 78.0, 79.0, 94.0, 85.0, 86.0, 84.0, 108.0, 65.0, 64.0, 50.0, 36.0, 24.0, 21.0, 7.0, 7.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.94160079956055, -53.329349517822266, -51.71709442138672, -50.10484313964844, -48.49258804321289, -46.88033676147461, -45.26808166503906, -43.65583038330078, -42.0435791015625, -40.43132781982422, -38.81907272338867, -37.20682144165039, -35.594566345214844, -33.98231506347656, -32.37006378173828, -30.757808685302734, -29.14555549621582, -27.533302307128906, -25.921049118041992, -24.308795928955078, -22.696544647216797, -21.084291458129883, -19.47203826904297, -17.859786987304688, -16.24753189086914, -14.635278701782227, -13.023026466369629, -11.410773277282715, -9.798521041870117, -8.186267852783203, -6.574014663696289, -4.961762428283691, -3.3495101928710938, -1.7372573614120483, -0.12500452995300293, 1.487248420715332, 3.099501132965088, 4.711753845214844, 6.324007034301758, 7.9362592697143555, 9.54851245880127, 11.160765647888184, 12.773017883300781, 14.385271072387695, 15.99752426147461, 17.60977554321289, 19.222030639648438, 20.83428192138672, 22.446535110473633, 24.058788299560547, 25.67104148864746, 27.283294677734375, 28.895545959472656, 30.50779914855957, 32.120052337646484, 33.732303619384766, 35.34455871582031, 36.956809997558594, 38.56906509399414, 40.18131637573242, 41.79357147216797, 43.40582275390625, 45.01807403564453, 46.63032913208008, 48.24258041381836]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 12.0, 5.0, 15.0, 18.0, 24.0, 26.0, 44.0, 44.0, 87.0, 100.0, 146.0, 232.0, 365.0, 570.0, 998.0, 1831.0, 3952.0, 10338.0, 35349.0, 142456.0, 449018.0, 297128.0, 73669.0, 19455.0, 6495.0, 2731.0, 1294.0, 751.0, 431.0, 306.0, 212.0, 117.0, 91.0, 54.0, 46.0, 40.0, 25.0, 22.0, 23.0, 8.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.328125, -15.8446044921875, -15.361083984375, -14.8775634765625, -14.39404296875, -13.9105224609375, -13.427001953125, -12.9434814453125, -12.4599609375, -11.9764404296875, -11.492919921875, -11.0093994140625, -10.52587890625, -10.0423583984375, -9.558837890625, -9.0753173828125, -8.591796875, -8.1082763671875, -7.624755859375, -7.1412353515625, -6.65771484375, -6.1741943359375, -5.690673828125, -5.2071533203125, -4.7236328125, -4.2401123046875, -3.756591796875, -3.2730712890625, -2.78955078125, -2.3060302734375, -1.822509765625, -1.3389892578125, -0.85546875, -0.3719482421875, 0.111572265625, 0.5950927734375, 1.07861328125, 1.5621337890625, 2.045654296875, 2.5291748046875, 3.0126953125, 3.4962158203125, 3.979736328125, 4.4632568359375, 4.94677734375, 5.4302978515625, 5.913818359375, 6.3973388671875, 6.880859375, 7.3643798828125, 7.847900390625, 8.3314208984375, 8.81494140625, 9.2984619140625, 9.781982421875, 10.2655029296875, 10.7490234375, 11.2325439453125, 11.716064453125, 12.1995849609375, 12.68310546875, 13.1666259765625, 13.650146484375, 14.1336669921875, 14.6171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 12.0, 16.0, 16.0, 23.0, 26.0, 53.0, 58.0, 77.0, 104.0, 113.0, 102.0, 93.0, 74.0, 63.0, 57.0, 43.0, 22.0, 19.0, 10.0, 6.0, 1.0, 0.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9296875, -4.7889404296875, -4.648193359375, -4.5074462890625, -4.36669921875, -4.2259521484375, -4.085205078125, -3.9444580078125, -3.8037109375, -3.6629638671875, -3.522216796875, -3.3814697265625, -3.24072265625, -3.0999755859375, -2.959228515625, -2.8184814453125, -2.677734375, -2.5369873046875, -2.396240234375, -2.2554931640625, -2.11474609375, -1.9739990234375, -1.833251953125, -1.6925048828125, -1.5517578125, -1.4110107421875, -1.270263671875, -1.1295166015625, -0.98876953125, -0.8480224609375, -0.707275390625, -0.5665283203125, -0.42578125, -0.2850341796875, -0.144287109375, -0.0035400390625, 0.13720703125, 0.2779541015625, 0.418701171875, 0.5594482421875, 0.7001953125, 0.8409423828125, 0.981689453125, 1.1224365234375, 1.26318359375, 1.4039306640625, 1.544677734375, 1.6854248046875, 1.826171875, 1.9669189453125, 2.107666015625, 2.2484130859375, 2.38916015625, 2.5299072265625, 2.670654296875, 2.8114013671875, 2.9521484375, 3.0928955078125, 3.233642578125, 3.3743896484375, 3.51513671875, 3.6558837890625, 3.796630859375, 3.9373779296875, 4.078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 12.0, 11.0, 20.0, 43.0, 44.0, 62.0, 130.0, 235.0, 429.0, 1005.0, 2800.0, 9882.0, 44276.0, 203357.0, 507439.0, 215596.0, 47549.0, 10729.0, 2871.0, 1023.0, 432.0, 246.0, 144.0, 69.0, 37.0, 36.0, 17.0, 15.0, 8.0, 9.0, 7.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.140625, -10.7041015625, -10.267578125, -9.8310546875, -9.39453125, -8.9580078125, -8.521484375, -8.0849609375, -7.6484375, -7.2119140625, -6.775390625, -6.3388671875, -5.90234375, -5.4658203125, -5.029296875, -4.5927734375, -4.15625, -3.7197265625, -3.283203125, -2.8466796875, -2.41015625, -1.9736328125, -1.537109375, -1.1005859375, -0.6640625, -0.2275390625, 0.208984375, 0.6455078125, 1.08203125, 1.5185546875, 1.955078125, 2.3916015625, 2.828125, 3.2646484375, 3.701171875, 4.1376953125, 4.57421875, 5.0107421875, 5.447265625, 5.8837890625, 6.3203125, 6.7568359375, 7.193359375, 7.6298828125, 8.06640625, 8.5029296875, 8.939453125, 9.3759765625, 9.8125, 10.2490234375, 10.685546875, 11.1220703125, 11.55859375, 11.9951171875, 12.431640625, 12.8681640625, 13.3046875, 13.7412109375, 14.177734375, 14.6142578125, 15.05078125, 15.4873046875, 15.923828125, 16.3603515625, 16.796875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 9.0, 5.0, 6.0, 9.0, 9.0, 16.0, 16.0, 11.0, 23.0, 23.0, 25.0, 22.0, 30.0, 34.0, 45.0, 41.0, 41.0, 55.0, 45.0, 43.0, 37.0, 45.0, 40.0, 41.0, 42.0, 44.0, 39.0, 40.0, 26.0, 26.0, 27.0, 18.0, 20.0, 7.0, 9.0, 12.0, 5.0, 7.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7578125, -9.443603515625, -9.12939453125, -8.815185546875, -8.5009765625, -8.186767578125, -7.87255859375, -7.558349609375, -7.244140625, -6.929931640625, -6.61572265625, -6.301513671875, -5.9873046875, -5.673095703125, -5.35888671875, -5.044677734375, -4.73046875, -4.416259765625, -4.10205078125, -3.787841796875, -3.4736328125, -3.159423828125, -2.84521484375, -2.531005859375, -2.216796875, -1.902587890625, -1.58837890625, -1.274169921875, -0.9599609375, -0.645751953125, -0.33154296875, -0.017333984375, 0.296875, 0.611083984375, 0.92529296875, 1.239501953125, 1.5537109375, 1.867919921875, 2.18212890625, 2.496337890625, 2.810546875, 3.124755859375, 3.43896484375, 3.753173828125, 4.0673828125, 4.381591796875, 4.69580078125, 5.010009765625, 5.32421875, 5.638427734375, 5.95263671875, 6.266845703125, 6.5810546875, 6.895263671875, 7.20947265625, 7.523681640625, 7.837890625, 8.152099609375, 8.46630859375, 8.780517578125, 9.0947265625, 9.408935546875, 9.72314453125, 10.037353515625, 10.3515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 2.0, 4.0, 8.0, 22.0, 48.0, 72.0, 171.0, 377.0, 1068.0, 3311.0, 14149.0, 80415.0, 585067.0, 311690.0, 40511.0, 8211.0, 2162.0, 725.0, 258.0, 137.0, 64.0, 30.0, 14.0, 10.0, 7.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.453125, -12.13232421875, -11.8115234375, -11.49072265625, -11.169921875, -10.84912109375, -10.5283203125, -10.20751953125, -9.88671875, -9.56591796875, -9.2451171875, -8.92431640625, -8.603515625, -8.28271484375, -7.9619140625, -7.64111328125, -7.3203125, -6.99951171875, -6.6787109375, -6.35791015625, -6.037109375, -5.71630859375, -5.3955078125, -5.07470703125, -4.75390625, -4.43310546875, -4.1123046875, -3.79150390625, -3.470703125, -3.14990234375, -2.8291015625, -2.50830078125, -2.1875, -1.86669921875, -1.5458984375, -1.22509765625, -0.904296875, -0.58349609375, -0.2626953125, 0.05810546875, 0.37890625, 0.69970703125, 1.0205078125, 1.34130859375, 1.662109375, 1.98291015625, 2.3037109375, 2.62451171875, 2.9453125, 3.26611328125, 3.5869140625, 3.90771484375, 4.228515625, 4.54931640625, 4.8701171875, 5.19091796875, 5.51171875, 5.83251953125, 6.1533203125, 6.47412109375, 6.794921875, 7.11572265625, 7.4365234375, 7.75732421875, 8.078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 8.0, 2.0, 9.0, 5.0, 9.0, 6.0, 14.0, 14.0, 26.0, 34.0, 40.0, 42.0, 109.0, 157.0, 144.0, 112.0, 70.0, 46.0, 34.0, 24.0, 25.0, 9.0, 12.0, 7.0, 8.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0015668869018554688, -0.0015235096216201782, -0.0014801323413848877, -0.0014367550611495972, -0.0013933777809143066, -0.0013500005006790161, -0.0013066232204437256, -0.001263245940208435, -0.0012198686599731445, -0.001176491379737854, -0.0011331140995025635, -0.001089736819267273, -0.0010463595390319824, -0.001002982258796692, -0.0009596049785614014, -0.0009162276983261108, -0.0008728504180908203, -0.0008294731378555298, -0.0007860958576202393, -0.0007427185773849487, -0.0006993412971496582, -0.0006559640169143677, -0.0006125867366790771, -0.0005692094564437866, -0.0005258321762084961, -0.00048245489597320557, -0.00043907761573791504, -0.0003957003355026245, -0.000352323055267334, -0.00030894577503204346, -0.00026556849479675293, -0.0002221912145614624, -0.00017881393432617188, -0.00013543665409088135, -9.205937385559082e-05, -4.868209362030029e-05, -5.304813385009766e-06, 3.807246685028076e-05, 8.144974708557129e-05, 0.00012482702732086182, 0.00016820430755615234, 0.00021158158779144287, 0.0002549588680267334, 0.0002983361482620239, 0.00034171342849731445, 0.000385090708732605, 0.0004284679889678955, 0.00047184526920318604, 0.0005152225494384766, 0.0005585998296737671, 0.0006019771099090576, 0.0006453543901443481, 0.0006887316703796387, 0.0007321089506149292, 0.0007754862308502197, 0.0008188635110855103, 0.0008622407913208008, 0.0009056180715560913, 0.0009489953517913818, 0.0009923726320266724, 0.0010357499122619629, 0.0010791271924972534, 0.001122504472732544, 0.0011658817529678345, 0.001209259033203125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 7.0, 15.0, 17.0, 20.0, 33.0, 42.0, 63.0, 122.0, 209.0, 374.0, 758.0, 1497.0, 3504.0, 9351.0, 28071.0, 104424.0, 455035.0, 335412.0, 75278.0, 21540.0, 7265.0, 2959.0, 1235.0, 579.0, 272.0, 179.0, 100.0, 50.0, 47.0, 20.0, 17.0, 10.0, 12.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.5625, -6.33526611328125, -6.1080322265625, -5.88079833984375, -5.653564453125, -5.42633056640625, -5.1990966796875, -4.97186279296875, -4.74462890625, -4.51739501953125, -4.2901611328125, -4.06292724609375, -3.835693359375, -3.60845947265625, -3.3812255859375, -3.15399169921875, -2.9267578125, -2.69952392578125, -2.4722900390625, -2.24505615234375, -2.017822265625, -1.79058837890625, -1.5633544921875, -1.33612060546875, -1.10888671875, -0.88165283203125, -0.6544189453125, -0.42718505859375, -0.199951171875, 0.02728271484375, 0.2545166015625, 0.48175048828125, 0.708984375, 0.93621826171875, 1.1634521484375, 1.39068603515625, 1.617919921875, 1.84515380859375, 2.0723876953125, 2.29962158203125, 2.52685546875, 2.75408935546875, 2.9813232421875, 3.20855712890625, 3.435791015625, 3.66302490234375, 3.8902587890625, 4.11749267578125, 4.3447265625, 4.57196044921875, 4.7991943359375, 5.02642822265625, 5.253662109375, 5.48089599609375, 5.7081298828125, 5.93536376953125, 6.16259765625, 6.38983154296875, 6.6170654296875, 6.84429931640625, 7.071533203125, 7.29876708984375, 7.5260009765625, 7.75323486328125, 7.98046875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 10.0, 13.0, 8.0, 16.0, 23.0, 17.0, 35.0, 31.0, 46.0, 60.0, 71.0, 95.0, 95.0, 95.0, 87.0, 54.0, 47.0, 44.0, 34.0, 27.0, 20.0, 13.0, 13.0, 10.0, 6.0, 7.0, 3.0, 7.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.3828125, -6.20013427734375, -6.0174560546875, -5.83477783203125, -5.652099609375, -5.46942138671875, -5.2867431640625, -5.10406494140625, -4.92138671875, -4.73870849609375, -4.5560302734375, -4.37335205078125, -4.190673828125, -4.00799560546875, -3.8253173828125, -3.64263916015625, -3.4599609375, -3.27728271484375, -3.0946044921875, -2.91192626953125, -2.729248046875, -2.54656982421875, -2.3638916015625, -2.18121337890625, -1.99853515625, -1.81585693359375, -1.6331787109375, -1.45050048828125, -1.267822265625, -1.08514404296875, -0.9024658203125, -0.71978759765625, -0.537109375, -0.35443115234375, -0.1717529296875, 0.01092529296875, 0.193603515625, 0.37628173828125, 0.5589599609375, 0.74163818359375, 0.92431640625, 1.10699462890625, 1.2896728515625, 1.47235107421875, 1.655029296875, 1.83770751953125, 2.0203857421875, 2.20306396484375, 2.3857421875, 2.56842041015625, 2.7510986328125, 2.93377685546875, 3.116455078125, 3.29913330078125, 3.4818115234375, 3.66448974609375, 3.84716796875, 4.02984619140625, 4.2125244140625, 4.39520263671875, 4.577880859375, 4.76055908203125, 4.9432373046875, 5.12591552734375, 5.30859375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 2.0, 9.0, 11.0, 27.0, 50.0, 114.0, 149.0, 215.0, 193.0, 121.0, 66.0, 32.0, 13.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.51082229614258, -43.41568374633789, -39.32054901123047, -35.22541046142578, -31.130271911621094, -27.035133361816406, -22.93999671936035, -18.844860076904297, -14.74972152709961, -10.654583930969238, -6.559446334838867, -2.464308738708496, 1.630828857421875, 5.7259674072265625, 9.821104049682617, 13.916240692138672, 18.01137924194336, 22.106517791748047, 26.2016544342041, 30.296791076660156, 34.391929626464844, 38.48706817626953, 42.58220672607422, 46.67734146118164, 50.77248001098633, 54.867618560791016, 58.96275329589844, 63.057891845703125, 67.15303039550781, 71.2481689453125, 75.34330749511719, 79.43844604492188, 83.5335693359375, 87.62870788574219, 91.72384643554688, 95.81898498535156, 99.91412353515625, 104.00926208496094, 108.1043930053711, 112.19953155517578, 116.29467010498047, 120.38980865478516, 124.48494720458984, 128.580078125, 132.6752166748047, 136.77035522460938, 140.86549377441406, 144.96063232421875, 149.05577087402344, 153.15090942382812, 157.2460479736328, 161.3411865234375, 165.4363250732422, 169.53146362304688, 173.62660217285156, 177.72174072265625, 181.81686401367188, 185.91200256347656, 190.00714111328125, 194.10227966308594, 198.19741821289062, 202.2925567626953, 206.3876953125, 210.48281860351562, 214.57797241210938]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 8.0, 5.0, 15.0, 11.0, 17.0, 16.0, 22.0, 19.0, 26.0, 28.0, 24.0, 42.0, 37.0, 37.0, 48.0, 44.0, 50.0, 45.0, 52.0, 47.0, 36.0, 43.0, 50.0, 34.0, 33.0, 36.0, 22.0, 34.0, 25.0, 17.0, 12.0, 14.0, 10.0, 14.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-60.47914505004883, -58.56175994873047, -56.644371032714844, -54.72698211669922, -52.80959701538086, -50.8922119140625, -48.974822998046875, -47.05743408203125, -45.14004898071289, -43.22266387939453, -41.305274963378906, -39.38788604736328, -37.47050094604492, -35.55311584472656, -33.63572692871094, -31.718339920043945, -29.800952911376953, -27.88356590270996, -25.96617889404297, -24.048791885375977, -22.131404876708984, -20.214017868041992, -18.296630859375, -16.379243850708008, -14.461856842041016, -12.544469833374023, -10.627082824707031, -8.709695816040039, -6.792308807373047, -4.874921798706055, -2.9575347900390625, -1.0401477813720703, 0.8772392272949219, 2.794626235961914, 4.712013244628906, 6.629400253295898, 8.54678726196289, 10.464174270629883, 12.381561279296875, 14.298948287963867, 16.21633529663086, 18.13372230529785, 20.051109313964844, 21.968496322631836, 23.885883331298828, 25.80327033996582, 27.720657348632812, 29.638044357299805, 31.555431365966797, 33.472816467285156, 35.39020538330078, 37.307594299316406, 39.224979400634766, 41.142364501953125, 43.05975341796875, 44.977142333984375, 46.894527435302734, 48.811912536621094, 50.72930145263672, 52.646690368652344, 54.5640754699707, 56.48146057128906, 58.39884948730469, 60.31623840332031, 62.23362350463867]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 8.0, 9.0, 8.0, 13.0, 17.0, 23.0, 38.0, 44.0, 59.0, 88.0, 151.0, 240.0, 486.0, 1195.0, 3148.0, 12557.0, 127580.0, 3990754.0, 46275.0, 7669.0, 2256.0, 792.0, 368.0, 190.0, 100.0, 67.0, 34.0, 27.0, 22.0, 17.0, 12.0, 9.0, 5.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.84375, -24.8623046875, -23.880859375, -22.8994140625, -21.91796875, -20.9365234375, -19.955078125, -18.9736328125, -17.9921875, -17.0107421875, -16.029296875, -15.0478515625, -14.06640625, -13.0849609375, -12.103515625, -11.1220703125, -10.140625, -9.1591796875, -8.177734375, -7.1962890625, -6.21484375, -5.2333984375, -4.251953125, -3.2705078125, -2.2890625, -1.3076171875, -0.326171875, 0.6552734375, 1.63671875, 2.6181640625, 3.599609375, 4.5810546875, 5.5625, 6.5439453125, 7.525390625, 8.5068359375, 9.48828125, 10.4697265625, 11.451171875, 12.4326171875, 13.4140625, 14.3955078125, 15.376953125, 16.3583984375, 17.33984375, 18.3212890625, 19.302734375, 20.2841796875, 21.265625, 22.2470703125, 23.228515625, 24.2099609375, 25.19140625, 26.1728515625, 27.154296875, 28.1357421875, 29.1171875, 30.0986328125, 31.080078125, 32.0615234375, 33.04296875, 34.0244140625, 35.005859375, 35.9873046875, 36.96875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 9.0, 10.0, 12.0, 16.0, 25.0, 34.0, 40.0, 56.0, 64.0, 83.0, 69.0, 79.0, 82.0, 73.0, 88.0, 62.0, 51.0, 53.0, 27.0, 19.0, 13.0, 9.0, 6.0, 7.0, 3.0, 2.0, 1.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.349609375, -3.224456787109375, -3.09930419921875, -2.974151611328125, -2.8489990234375, -2.723846435546875, -2.59869384765625, -2.473541259765625, -2.348388671875, -2.223236083984375, -2.09808349609375, -1.972930908203125, -1.8477783203125, -1.722625732421875, -1.59747314453125, -1.472320556640625, -1.34716796875, -1.222015380859375, -1.09686279296875, -0.971710205078125, -0.8465576171875, -0.721405029296875, -0.59625244140625, -0.471099853515625, -0.345947265625, -0.220794677734375, -0.09564208984375, 0.029510498046875, 0.1546630859375, 0.279815673828125, 0.40496826171875, 0.530120849609375, 0.6552734375, 0.780426025390625, 0.90557861328125, 1.030731201171875, 1.1558837890625, 1.281036376953125, 1.40618896484375, 1.531341552734375, 1.656494140625, 1.781646728515625, 1.90679931640625, 2.031951904296875, 2.1571044921875, 2.282257080078125, 2.40740966796875, 2.532562255859375, 2.65771484375, 2.782867431640625, 2.90802001953125, 3.033172607421875, 3.1583251953125, 3.283477783203125, 3.40863037109375, 3.533782958984375, 3.658935546875, 3.784088134765625, 3.90924072265625, 4.034393310546875, 4.1595458984375, 4.284698486328125, 4.40985107421875, 4.535003662109375, 4.66015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 4.0, 14.0, 28.0, 34.0, 58.0, 93.0, 159.0, 297.0, 569.0, 1244.0, 3063.0, 8400.0, 29320.0, 174179.0, 3619857.0, 301014.0, 38700.0, 10596.0, 3605.0, 1483.0, 696.0, 348.0, 191.0, 116.0, 68.0, 48.0, 25.0, 15.0, 14.0, 11.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.515625, -14.008056640625, -13.50048828125, -12.992919921875, -12.4853515625, -11.977783203125, -11.47021484375, -10.962646484375, -10.455078125, -9.947509765625, -9.43994140625, -8.932373046875, -8.4248046875, -7.917236328125, -7.40966796875, -6.902099609375, -6.39453125, -5.886962890625, -5.37939453125, -4.871826171875, -4.3642578125, -3.856689453125, -3.34912109375, -2.841552734375, -2.333984375, -1.826416015625, -1.31884765625, -0.811279296875, -0.3037109375, 0.203857421875, 0.71142578125, 1.218994140625, 1.7265625, 2.234130859375, 2.74169921875, 3.249267578125, 3.7568359375, 4.264404296875, 4.77197265625, 5.279541015625, 5.787109375, 6.294677734375, 6.80224609375, 7.309814453125, 7.8173828125, 8.324951171875, 8.83251953125, 9.340087890625, 9.84765625, 10.355224609375, 10.86279296875, 11.370361328125, 11.8779296875, 12.385498046875, 12.89306640625, 13.400634765625, 13.908203125, 14.415771484375, 14.92333984375, 15.430908203125, 15.9384765625, 16.446044921875, 16.95361328125, 17.461181640625, 17.96875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 2.0, 9.0, 10.0, 18.0, 19.0, 15.0, 31.0, 45.0, 38.0, 61.0, 111.0, 186.0, 363.0, 883.0, 1237.0, 431.0, 211.0, 128.0, 73.0, 51.0, 36.0, 23.0, 14.0, 10.0, 8.0, 8.0, 10.0, 4.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.345703125, -3.226837158203125, -3.10797119140625, -2.989105224609375, -2.8702392578125, -2.751373291015625, -2.63250732421875, -2.513641357421875, -2.394775390625, -2.275909423828125, -2.15704345703125, -2.038177490234375, -1.9193115234375, -1.800445556640625, -1.68157958984375, -1.562713623046875, -1.44384765625, -1.324981689453125, -1.20611572265625, -1.087249755859375, -0.9683837890625, -0.849517822265625, -0.73065185546875, -0.611785888671875, -0.492919921875, -0.374053955078125, -0.25518798828125, -0.136322021484375, -0.0174560546875, 0.101409912109375, 0.22027587890625, 0.339141845703125, 0.4580078125, 0.576873779296875, 0.69573974609375, 0.814605712890625, 0.9334716796875, 1.052337646484375, 1.17120361328125, 1.290069580078125, 1.408935546875, 1.527801513671875, 1.64666748046875, 1.765533447265625, 1.8843994140625, 2.003265380859375, 2.12213134765625, 2.240997314453125, 2.35986328125, 2.478729248046875, 2.59759521484375, 2.716461181640625, 2.8353271484375, 2.954193115234375, 3.07305908203125, 3.191925048828125, 3.310791015625, 3.429656982421875, 3.54852294921875, 3.667388916015625, 3.7862548828125, 3.905120849609375, 4.02398681640625, 4.142852783203125, 4.26171875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 0.0, 3.0, 3.0, 5.0, 12.0, 32.0, 42.0, 80.0, 113.0, 158.0, 151.0, 154.0, 113.0, 56.0, 29.0, 30.0, 13.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.488037109375, -33.311302185058594, -32.13457107543945, -30.957836151123047, -29.78110122680664, -28.604368209838867, -27.427635192871094, -26.250900268554688, -25.074167251586914, -23.89743423461914, -22.720699310302734, -21.54396629333496, -20.367233276367188, -19.19049835205078, -18.013765335083008, -16.837032318115234, -15.660297393798828, -14.483563423156738, -13.306829452514648, -12.130096435546875, -10.953362464904785, -9.776628494262695, -8.599895477294922, -7.423161506652832, -6.246427536010742, -5.069693565368652, -3.8929600715637207, -2.71622633934021, -1.5394926071166992, -0.3627586364746094, 0.8139748573303223, 1.990708351135254, 3.1674423217773438, 4.344176292419434, 5.520909786224365, 6.697643280029297, 7.874377250671387, 9.051111221313477, 10.22784423828125, 11.40457820892334, 12.58131217956543, 13.75804615020752, 14.93478012084961, 16.111513137817383, 17.288246154785156, 18.464981079101562, 19.641714096069336, 20.81844711303711, 21.995182037353516, 23.17191505432129, 24.348649978637695, 25.52538299560547, 26.702117919921875, 27.87885093688965, 29.055583953857422, 30.232318878173828, 31.4090518951416, 32.585784912109375, 33.76251983642578, 34.93925476074219, 36.11598587036133, 37.292720794677734, 38.46945571899414, 39.64618682861328, 40.82292175292969]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 9.0, 7.0, 4.0, 12.0, 12.0, 15.0, 20.0, 17.0, 17.0, 27.0, 25.0, 30.0, 37.0, 37.0, 29.0, 32.0, 39.0, 36.0, 24.0, 48.0, 39.0, 43.0, 50.0, 43.0, 55.0, 39.0, 34.0, 39.0, 20.0, 20.0, 20.0, 24.0, 15.0, 17.0, 8.0, 12.0, 8.0, 7.0, 6.0, 8.0, 7.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-15.179865837097168, -14.753652572631836, -14.327439308166504, -13.901226043701172, -13.475011825561523, -13.048799514770508, -12.62258529663086, -12.196372032165527, -11.770158767700195, -11.343945503234863, -10.917732238769531, -10.4915189743042, -10.065305709838867, -9.639091491699219, -9.212878227233887, -8.786664962768555, -8.360451698303223, -7.934238433837891, -7.508025169372559, -7.081811428070068, -6.655598163604736, -6.229384899139404, -5.803171157836914, -5.376957893371582, -4.95074462890625, -4.524531364440918, -4.098318099975586, -3.6721043586730957, -3.2458910942077637, -2.8196778297424316, -2.3934643268585205, -1.9672508239746094, -1.541036605834961, -1.1148232221603394, -0.6886098384857178, -0.2623964548110962, 0.1638169288635254, 0.5900301933288574, 1.0162436962127686, 1.4424571990966797, 1.8686704635620117, 2.2948837280273438, 2.721097230911255, 3.147310733795166, 3.573523998260498, 3.99973726272583, 4.42595100402832, 4.852164268493652, 5.278377532958984, 5.704590797424316, 6.130804061889648, 6.557017803192139, 6.983231067657471, 7.409444332122803, 7.835658073425293, 8.261871337890625, 8.688084602355957, 9.114297866821289, 9.540511131286621, 9.966724395751953, 10.392938613891602, 10.819150924682617, 11.245365142822266, 11.671578407287598, 12.09779167175293]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 12.0, 12.0, 14.0, 18.0, 17.0, 32.0, 62.0, 100.0, 161.0, 259.0, 569.0, 1288.0, 3066.0, 10585.0, 53753.0, 361881.0, 509613.0, 84609.0, 15371.0, 4138.0, 1484.0, 659.0, 349.0, 167.0, 110.0, 74.0, 48.0, 31.0, 19.0, 13.0, 15.0, 4.0, 9.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.328125, -18.615478515625, -17.90283203125, -17.190185546875, -16.4775390625, -15.764892578125, -15.05224609375, -14.339599609375, -13.626953125, -12.914306640625, -12.20166015625, -11.489013671875, -10.7763671875, -10.063720703125, -9.35107421875, -8.638427734375, -7.92578125, -7.213134765625, -6.50048828125, -5.787841796875, -5.0751953125, -4.362548828125, -3.64990234375, -2.937255859375, -2.224609375, -1.511962890625, -0.79931640625, -0.086669921875, 0.6259765625, 1.338623046875, 2.05126953125, 2.763916015625, 3.4765625, 4.189208984375, 4.90185546875, 5.614501953125, 6.3271484375, 7.039794921875, 7.75244140625, 8.465087890625, 9.177734375, 9.890380859375, 10.60302734375, 11.315673828125, 12.0283203125, 12.740966796875, 13.45361328125, 14.166259765625, 14.87890625, 15.591552734375, 16.30419921875, 17.016845703125, 17.7294921875, 18.442138671875, 19.15478515625, 19.867431640625, 20.580078125, 21.292724609375, 22.00537109375, 22.718017578125, 23.4306640625, 24.143310546875, 24.85595703125, 25.568603515625, 26.28125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 8.0, 6.0, 5.0, 14.0, 21.0, 23.0, 33.0, 46.0, 59.0, 71.0, 83.0, 114.0, 86.0, 97.0, 90.0, 76.0, 53.0, 48.0, 22.0, 15.0, 13.0, 7.0, 9.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75390625, -4.61041259765625, -4.4669189453125, -4.32342529296875, -4.179931640625, -4.03643798828125, -3.8929443359375, -3.74945068359375, -3.60595703125, -3.46246337890625, -3.3189697265625, -3.17547607421875, -3.031982421875, -2.88848876953125, -2.7449951171875, -2.60150146484375, -2.4580078125, -2.31451416015625, -2.1710205078125, -2.02752685546875, -1.884033203125, -1.74053955078125, -1.5970458984375, -1.45355224609375, -1.31005859375, -1.16656494140625, -1.0230712890625, -0.87957763671875, -0.736083984375, -0.59259033203125, -0.4490966796875, -0.30560302734375, -0.162109375, -0.01861572265625, 0.1248779296875, 0.26837158203125, 0.411865234375, 0.55535888671875, 0.6988525390625, 0.84234619140625, 0.98583984375, 1.12933349609375, 1.2728271484375, 1.41632080078125, 1.559814453125, 1.70330810546875, 1.8468017578125, 1.99029541015625, 2.1337890625, 2.27728271484375, 2.4207763671875, 2.56427001953125, 2.707763671875, 2.85125732421875, 2.9947509765625, 3.13824462890625, 3.28173828125, 3.42523193359375, 3.5687255859375, 3.71221923828125, 3.855712890625, 3.99920654296875, 4.1427001953125, 4.28619384765625, 4.4296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 8.0, 9.0, 12.0, 17.0, 23.0, 39.0, 42.0, 45.0, 57.0, 96.0, 159.0, 218.0, 341.0, 577.0, 1151.0, 2538.0, 7040.0, 24858.0, 96218.0, 330007.0, 399907.0, 134704.0, 34396.0, 9565.0, 3288.0, 1375.0, 692.0, 388.0, 243.0, 158.0, 101.0, 78.0, 53.0, 37.0, 33.0, 28.0, 17.0, 10.0, 8.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.640625, -11.2666015625, -10.892578125, -10.5185546875, -10.14453125, -9.7705078125, -9.396484375, -9.0224609375, -8.6484375, -8.2744140625, -7.900390625, -7.5263671875, -7.15234375, -6.7783203125, -6.404296875, -6.0302734375, -5.65625, -5.2822265625, -4.908203125, -4.5341796875, -4.16015625, -3.7861328125, -3.412109375, -3.0380859375, -2.6640625, -2.2900390625, -1.916015625, -1.5419921875, -1.16796875, -0.7939453125, -0.419921875, -0.0458984375, 0.328125, 0.7021484375, 1.076171875, 1.4501953125, 1.82421875, 2.1982421875, 2.572265625, 2.9462890625, 3.3203125, 3.6943359375, 4.068359375, 4.4423828125, 4.81640625, 5.1904296875, 5.564453125, 5.9384765625, 6.3125, 6.6865234375, 7.060546875, 7.4345703125, 7.80859375, 8.1826171875, 8.556640625, 8.9306640625, 9.3046875, 9.6787109375, 10.052734375, 10.4267578125, 10.80078125, 11.1748046875, 11.548828125, 11.9228515625, 12.296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 4.0, 2.0, 6.0, 7.0, 10.0, 10.0, 17.0, 9.0, 22.0, 26.0, 32.0, 28.0, 26.0, 32.0, 38.0, 33.0, 34.0, 44.0, 37.0, 50.0, 39.0, 44.0, 47.0, 46.0, 39.0, 39.0, 33.0, 31.0, 29.0, 26.0, 20.0, 21.0, 23.0, 19.0, 21.0, 13.0, 11.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.25, -9.9447021484375, -9.639404296875, -9.3341064453125, -9.02880859375, -8.7235107421875, -8.418212890625, -8.1129150390625, -7.8076171875, -7.5023193359375, -7.197021484375, -6.8917236328125, -6.58642578125, -6.2811279296875, -5.975830078125, -5.6705322265625, -5.365234375, -5.0599365234375, -4.754638671875, -4.4493408203125, -4.14404296875, -3.8387451171875, -3.533447265625, -3.2281494140625, -2.9228515625, -2.6175537109375, -2.312255859375, -2.0069580078125, -1.70166015625, -1.3963623046875, -1.091064453125, -0.7857666015625, -0.48046875, -0.1751708984375, 0.130126953125, 0.4354248046875, 0.74072265625, 1.0460205078125, 1.351318359375, 1.6566162109375, 1.9619140625, 2.2672119140625, 2.572509765625, 2.8778076171875, 3.18310546875, 3.4884033203125, 3.793701171875, 4.0989990234375, 4.404296875, 4.7095947265625, 5.014892578125, 5.3201904296875, 5.62548828125, 5.9307861328125, 6.236083984375, 6.5413818359375, 6.8466796875, 7.1519775390625, 7.457275390625, 7.7625732421875, 8.06787109375, 8.3731689453125, 8.678466796875, 8.9837646484375, 9.2890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 5.0, 10.0, 5.0, 12.0, 17.0, 21.0, 40.0, 62.0, 86.0, 134.0, 255.0, 478.0, 841.0, 1546.0, 3385.0, 7363.0, 17405.0, 46455.0, 153734.0, 445150.0, 256217.0, 71102.0, 24857.0, 10302.0, 4512.0, 2121.0, 1036.0, 576.0, 308.0, 209.0, 108.0, 73.0, 46.0, 26.0, 12.0, 11.0, 10.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.63446044921875, -5.4447021484375, -5.25494384765625, -5.065185546875, -4.87542724609375, -4.6856689453125, -4.49591064453125, -4.30615234375, -4.11639404296875, -3.9266357421875, -3.73687744140625, -3.547119140625, -3.35736083984375, -3.1676025390625, -2.97784423828125, -2.7880859375, -2.59832763671875, -2.4085693359375, -2.21881103515625, -2.029052734375, -1.83929443359375, -1.6495361328125, -1.45977783203125, -1.27001953125, -1.08026123046875, -0.8905029296875, -0.70074462890625, -0.510986328125, -0.32122802734375, -0.1314697265625, 0.05828857421875, 0.248046875, 0.43780517578125, 0.6275634765625, 0.81732177734375, 1.007080078125, 1.19683837890625, 1.3865966796875, 1.57635498046875, 1.76611328125, 1.95587158203125, 2.1456298828125, 2.33538818359375, 2.525146484375, 2.71490478515625, 2.9046630859375, 3.09442138671875, 3.2841796875, 3.47393798828125, 3.6636962890625, 3.85345458984375, 4.043212890625, 4.23297119140625, 4.4227294921875, 4.61248779296875, 4.80224609375, 4.99200439453125, 5.1817626953125, 5.37152099609375, 5.561279296875, 5.75103759765625, 5.9407958984375, 6.13055419921875, 6.3203125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 7.0, 15.0, 14.0, 15.0, 27.0, 43.0, 29.0, 52.0, 71.0, 101.0, 146.0, 121.0, 93.0, 83.0, 50.0, 29.0, 14.0, 24.0, 15.0, 7.0, 5.0, 5.0, 5.0, 4.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011701583862304688, -0.0011246204376220703, -0.0010790824890136719, -0.0010335445404052734, -0.000988006591796875, -0.0009424686431884766, -0.0008969306945800781, -0.0008513927459716797, -0.0008058547973632812, -0.0007603168487548828, -0.0007147789001464844, -0.0006692409515380859, -0.0006237030029296875, -0.0005781650543212891, -0.0005326271057128906, -0.0004870891571044922, -0.00044155120849609375, -0.0003960132598876953, -0.0003504753112792969, -0.00030493736267089844, -0.0002593994140625, -0.00021386146545410156, -0.00016832351684570312, -0.0001227855682373047, -7.724761962890625e-05, -3.170967102050781e-05, 1.3828277587890625e-05, 5.936622619628906e-05, 0.0001049041748046875, 0.00015044212341308594, 0.00019598007202148438, 0.0002415180206298828, 0.00028705596923828125, 0.0003325939178466797, 0.0003781318664550781, 0.00042366981506347656, 0.000469207763671875, 0.0005147457122802734, 0.0005602836608886719, 0.0006058216094970703, 0.0006513595581054688, 0.0006968975067138672, 0.0007424354553222656, 0.0007879734039306641, 0.0008335113525390625, 0.0008790493011474609, 0.0009245872497558594, 0.0009701251983642578, 0.0010156631469726562, 0.0010612010955810547, 0.0011067390441894531, 0.0011522769927978516, 0.00119781494140625, 0.0012433528900146484, 0.0012888908386230469, 0.0013344287872314453, 0.0013799667358398438, 0.0014255046844482422, 0.0014710426330566406, 0.001516580581665039, 0.0015621185302734375, 0.001607656478881836, 0.0016531944274902344, 0.0016987323760986328, 0.0017442703247070312]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 9.0, 14.0, 19.0, 13.0, 25.0, 44.0, 83.0, 132.0, 239.0, 440.0, 914.0, 1975.0, 5627.0, 19134.0, 87900.0, 586963.0, 283151.0, 44286.0, 11114.0, 3634.0, 1410.0, 645.0, 335.0, 190.0, 70.0, 71.0, 33.0, 22.0, 11.0, 14.0, 5.0, 5.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.506103515625, -8.17626953125, -7.846435546875, -7.5166015625, -7.186767578125, -6.85693359375, -6.527099609375, -6.197265625, -5.867431640625, -5.53759765625, -5.207763671875, -4.8779296875, -4.548095703125, -4.21826171875, -3.888427734375, -3.55859375, -3.228759765625, -2.89892578125, -2.569091796875, -2.2392578125, -1.909423828125, -1.57958984375, -1.249755859375, -0.919921875, -0.590087890625, -0.26025390625, 0.069580078125, 0.3994140625, 0.729248046875, 1.05908203125, 1.388916015625, 1.71875, 2.048583984375, 2.37841796875, 2.708251953125, 3.0380859375, 3.367919921875, 3.69775390625, 4.027587890625, 4.357421875, 4.687255859375, 5.01708984375, 5.346923828125, 5.6767578125, 6.006591796875, 6.33642578125, 6.666259765625, 6.99609375, 7.325927734375, 7.65576171875, 7.985595703125, 8.3154296875, 8.645263671875, 8.97509765625, 9.304931640625, 9.634765625, 9.964599609375, 10.29443359375, 10.624267578125, 10.9541015625, 11.283935546875, 11.61376953125, 11.943603515625, 12.2734375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 6.0, 3.0, 5.0, 4.0, 7.0, 17.0, 19.0, 29.0, 34.0, 36.0, 66.0, 104.0, 125.0, 135.0, 116.0, 87.0, 52.0, 49.0, 28.0, 20.0, 13.0, 11.0, 9.0, 7.0, 3.0, 8.0, 6.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.65411376953125, -8.3941650390625, -8.13421630859375, -7.874267578125, -7.61431884765625, -7.3543701171875, -7.09442138671875, -6.83447265625, -6.57452392578125, -6.3145751953125, -6.05462646484375, -5.794677734375, -5.53472900390625, -5.2747802734375, -5.01483154296875, -4.7548828125, -4.49493408203125, -4.2349853515625, -3.97503662109375, -3.715087890625, -3.45513916015625, -3.1951904296875, -2.93524169921875, -2.67529296875, -2.41534423828125, -2.1553955078125, -1.89544677734375, -1.635498046875, -1.37554931640625, -1.1156005859375, -0.85565185546875, -0.595703125, -0.33575439453125, -0.0758056640625, 0.18414306640625, 0.444091796875, 0.70404052734375, 0.9639892578125, 1.22393798828125, 1.48388671875, 1.74383544921875, 2.0037841796875, 2.26373291015625, 2.523681640625, 2.78363037109375, 3.0435791015625, 3.30352783203125, 3.5634765625, 3.82342529296875, 4.0833740234375, 4.34332275390625, 4.603271484375, 4.86322021484375, 5.1231689453125, 5.38311767578125, 5.64306640625, 5.90301513671875, 6.1629638671875, 6.42291259765625, 6.682861328125, 6.94281005859375, 7.2027587890625, 7.46270751953125, 7.72265625]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 18.0, 84.0, 162.0, 277.0, 253.0, 125.0, 49.0, 22.0, 9.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.2959976196289, -99.06365203857422, -92.83130645751953, -86.59896850585938, -80.36662292480469, -74.13427734375, -67.90193176269531, -61.669586181640625, -55.43724060058594, -49.20489501953125, -42.97254943847656, -36.74020767211914, -30.507862091064453, -24.275516510009766, -18.043174743652344, -11.810829162597656, -5.578483581542969, 0.6538610458374023, 6.886205673217773, 13.118549346923828, 19.350894927978516, 25.583240509033203, 31.815582275390625, 38.04792785644531, 44.2802734375, 50.51261901855469, 56.744964599609375, 62.9773063659668, 69.20965576171875, 75.44200134277344, 81.6743392944336, 87.90668487548828, 94.1390380859375, 100.37138366699219, 106.60372924804688, 112.83607482910156, 119.06842041015625, 125.30076599121094, 131.53311157226562, 137.76544189453125, 143.997802734375, 150.2301483154297, 156.46249389648438, 162.69483947753906, 168.92718505859375, 175.15953063964844, 181.39187622070312, 187.62420654296875, 193.85655212402344, 200.08889770507812, 206.3212432861328, 212.5535888671875, 218.7859344482422, 225.01828002929688, 231.2506103515625, 237.48297119140625, 243.71530151367188, 249.94764709472656, 256.17999267578125, 262.4123229980469, 268.6446838378906, 274.87701416015625, 281.109375, 287.3417053222656, 293.5740661621094]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 2.0, 7.0, 4.0, 8.0, 7.0, 10.0, 12.0, 15.0, 14.0, 20.0, 24.0, 27.0, 28.0, 35.0, 37.0, 45.0, 30.0, 44.0, 48.0, 56.0, 41.0, 56.0, 54.0, 43.0, 43.0, 41.0, 27.0, 35.0, 35.0, 21.0, 22.0, 22.0, 17.0, 18.0, 5.0, 10.0, 5.0, 11.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.64113235473633, -59.731319427490234, -57.82150650024414, -55.91168975830078, -54.00187683105469, -52.092063903808594, -50.1822509765625, -48.272438049316406, -46.36262512207031, -44.45281219482422, -42.542999267578125, -40.63318634033203, -38.72336959838867, -36.81355667114258, -34.903743743896484, -32.99393081665039, -31.08411407470703, -29.174301147460938, -27.26448631286621, -25.354673385620117, -23.44485855102539, -21.535045623779297, -19.625232696533203, -17.71541976928711, -15.805604934692383, -13.895791053771973, -11.985977172851562, -10.076164245605469, -8.166350364685059, -6.256536483764648, -4.346723556518555, -2.4369096755981445, -0.527099609375, 1.382714033126831, 3.292527675628662, 5.202341079711914, 7.112154960632324, 9.021968841552734, 10.931781768798828, 12.841595649719238, 14.751409530639648, 16.661222457885742, 18.57103729248047, 20.480850219726562, 22.390663146972656, 24.300477981567383, 26.210290908813477, 28.120105743408203, 30.029918670654297, 31.93973159790039, 33.849544525146484, 35.759361267089844, 37.66917419433594, 39.57898712158203, 41.488800048828125, 43.39861297607422, 45.30842590332031, 47.218238830566406, 49.1280517578125, 51.037864685058594, 52.94768142700195, 54.85749435424805, 56.76730728149414, 58.677120208740234, 60.586936950683594]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 4.0, 4.0, 8.0, 6.0, 11.0, 14.0, 14.0, 30.0, 40.0, 57.0, 62.0, 100.0, 185.0, 291.0, 731.0, 1951.0, 9190.0, 144859.0, 4001618.0, 29260.0, 4092.0, 1015.0, 370.0, 161.0, 73.0, 49.0, 23.0, 28.0, 7.0, 9.0, 6.0, 9.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.3125, -51.80078125, -50.2890625, -48.77734375, -47.265625, -45.75390625, -44.2421875, -42.73046875, -41.21875, -39.70703125, -38.1953125, -36.68359375, -35.171875, -33.66015625, -32.1484375, -30.63671875, -29.125, -27.61328125, -26.1015625, -24.58984375, -23.078125, -21.56640625, -20.0546875, -18.54296875, -17.03125, -15.51953125, -14.0078125, -12.49609375, -10.984375, -9.47265625, -7.9609375, -6.44921875, -4.9375, -3.42578125, -1.9140625, -0.40234375, 1.109375, 2.62109375, 4.1328125, 5.64453125, 7.15625, 8.66796875, 10.1796875, 11.69140625, 13.203125, 14.71484375, 16.2265625, 17.73828125, 19.25, 20.76171875, 22.2734375, 23.78515625, 25.296875, 26.80859375, 28.3203125, 29.83203125, 31.34375, 32.85546875, 34.3671875, 35.87890625, 37.390625, 38.90234375, 40.4140625, 41.92578125, 43.4375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 11.0, 17.0, 16.0, 18.0, 33.0, 43.0, 67.0, 81.0, 70.0, 100.0, 100.0, 104.0, 85.0, 85.0, 52.0, 27.0, 32.0, 21.0, 17.0, 7.0, 7.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.609375, -4.45709228515625, -4.3048095703125, -4.15252685546875, -4.000244140625, -3.84796142578125, -3.6956787109375, -3.54339599609375, -3.39111328125, -3.23883056640625, -3.0865478515625, -2.93426513671875, -2.781982421875, -2.62969970703125, -2.4774169921875, -2.32513427734375, -2.1728515625, -2.02056884765625, -1.8682861328125, -1.71600341796875, -1.563720703125, -1.41143798828125, -1.2591552734375, -1.10687255859375, -0.95458984375, -0.80230712890625, -0.6500244140625, -0.49774169921875, -0.345458984375, -0.19317626953125, -0.0408935546875, 0.11138916015625, 0.263671875, 0.41595458984375, 0.5682373046875, 0.72052001953125, 0.872802734375, 1.02508544921875, 1.1773681640625, 1.32965087890625, 1.48193359375, 1.63421630859375, 1.7864990234375, 1.93878173828125, 2.091064453125, 2.24334716796875, 2.3956298828125, 2.54791259765625, 2.7001953125, 2.85247802734375, 3.0047607421875, 3.15704345703125, 3.309326171875, 3.46160888671875, 3.6138916015625, 3.76617431640625, 3.91845703125, 4.07073974609375, 4.2230224609375, 4.37530517578125, 4.527587890625, 4.67987060546875, 4.8321533203125, 4.98443603515625, 5.13671875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 7.0, 10.0, 11.0, 17.0, 33.0, 56.0, 102.0, 171.0, 307.0, 687.0, 1341.0, 3230.0, 8703.0, 29657.0, 185380.0, 3655641.0, 258028.0, 34653.0, 9886.0, 3508.0, 1490.0, 636.0, 299.0, 173.0, 113.0, 52.0, 22.0, 26.0, 13.0, 10.0, 4.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.84375, -20.22265625, -19.6015625, -18.98046875, -18.359375, -17.73828125, -17.1171875, -16.49609375, -15.875, -15.25390625, -14.6328125, -14.01171875, -13.390625, -12.76953125, -12.1484375, -11.52734375, -10.90625, -10.28515625, -9.6640625, -9.04296875, -8.421875, -7.80078125, -7.1796875, -6.55859375, -5.9375, -5.31640625, -4.6953125, -4.07421875, -3.453125, -2.83203125, -2.2109375, -1.58984375, -0.96875, -0.34765625, 0.2734375, 0.89453125, 1.515625, 2.13671875, 2.7578125, 3.37890625, 4.0, 4.62109375, 5.2421875, 5.86328125, 6.484375, 7.10546875, 7.7265625, 8.34765625, 8.96875, 9.58984375, 10.2109375, 10.83203125, 11.453125, 12.07421875, 12.6953125, 13.31640625, 13.9375, 14.55859375, 15.1796875, 15.80078125, 16.421875, 17.04296875, 17.6640625, 18.28515625, 18.90625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 8.0, 6.0, 19.0, 11.0, 16.0, 23.0, 26.0, 29.0, 48.0, 71.0, 112.0, 165.0, 325.0, 770.0, 1258.0, 520.0, 249.0, 127.0, 63.0, 46.0, 29.0, 25.0, 28.0, 15.0, 13.0, 9.0, 8.0, 10.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.875, -5.70843505859375, -5.5418701171875, -5.37530517578125, -5.208740234375, -5.04217529296875, -4.8756103515625, -4.70904541015625, -4.54248046875, -4.37591552734375, -4.2093505859375, -4.04278564453125, -3.876220703125, -3.70965576171875, -3.5430908203125, -3.37652587890625, -3.2099609375, -3.04339599609375, -2.8768310546875, -2.71026611328125, -2.543701171875, -2.37713623046875, -2.2105712890625, -2.04400634765625, -1.87744140625, -1.71087646484375, -1.5443115234375, -1.37774658203125, -1.211181640625, -1.04461669921875, -0.8780517578125, -0.71148681640625, -0.544921875, -0.37835693359375, -0.2117919921875, -0.04522705078125, 0.121337890625, 0.28790283203125, 0.4544677734375, 0.62103271484375, 0.78759765625, 0.95416259765625, 1.1207275390625, 1.28729248046875, 1.453857421875, 1.62042236328125, 1.7869873046875, 1.95355224609375, 2.1201171875, 2.28668212890625, 2.4532470703125, 2.61981201171875, 2.786376953125, 2.95294189453125, 3.1195068359375, 3.28607177734375, 3.45263671875, 3.61920166015625, 3.7857666015625, 3.95233154296875, 4.118896484375, 4.28546142578125, 4.4520263671875, 4.61859130859375, 4.78515625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 11.0, 12.0, 57.0, 198.0, 342.0, 249.0, 96.0, 29.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-195.0822296142578, -191.45753479003906, -187.83285522460938, -184.20816040039062, -180.58346557617188, -176.95877075195312, -173.33407592773438, -169.7093963623047, -166.08470153808594, -162.4600067138672, -158.8353271484375, -155.21063232421875, -151.5859375, -147.96124267578125, -144.3365478515625, -140.7118682861328, -137.08717346191406, -133.4624786376953, -129.83779907226562, -126.21310424804688, -122.58840942382812, -118.96371459960938, -115.33902740478516, -111.71434020996094, -108.08964538574219, -104.46495056152344, -100.84026336669922, -97.215576171875, -93.59088134765625, -89.9661865234375, -86.34149932861328, -82.71681213378906, -79.09212493896484, -75.46743774414062, -71.84274291992188, -68.21804809570312, -64.5933609008789, -60.96866989135742, -57.34397888183594, -53.71928787231445, -50.09459686279297, -46.469905853271484, -42.84521484375, -39.220523834228516, -35.59583282470703, -31.971141815185547, -28.346450805664062, -24.721759796142578, -21.097068786621094, -17.47237777709961, -13.847686767578125, -10.22299575805664, -6.598304748535156, -2.973613739013672, 0.6510772705078125, 4.275768280029297, 7.900459289550781, 11.525150299072266, 15.14984130859375, 18.774532318115234, 22.39922332763672, 26.023914337158203, 29.648605346679688, 33.27329635620117, 36.897987365722656]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 2.0, 9.0, 10.0, 10.0, 12.0, 14.0, 34.0, 31.0, 22.0, 43.0, 43.0, 34.0, 45.0, 53.0, 42.0, 51.0, 42.0, 53.0, 51.0, 44.0, 58.0, 33.0, 52.0, 28.0, 23.0, 29.0, 21.0, 22.0, 27.0, 13.0, 12.0, 10.0, 8.0, 5.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.670917510986328, -20.9078311920166, -20.144746780395508, -19.38166046142578, -18.618576049804688, -17.85548973083496, -17.092403411865234, -16.32931900024414, -15.566232681274414, -14.803147315979004, -14.040061950683594, -13.276975631713867, -12.513890266418457, -11.750804901123047, -10.98771858215332, -10.22463321685791, -9.4615478515625, -8.69846248626709, -7.9353766441345215, -7.172290802001953, -6.409205436706543, -5.646120071411133, -4.8830342292785645, -4.119948387145996, -3.356863021850586, -2.5937774181365967, -1.8306918144226074, -1.0676062107086182, -0.3045206069946289, 0.45856499671936035, 1.2216506004333496, 1.984736442565918, 2.747821807861328, 3.5109074115753174, 4.273993015289307, 5.037078857421875, 5.800164222717285, 6.563249588012695, 7.326335430145264, 8.089421272277832, 8.852506637573242, 9.615592002868652, 10.378677368164062, 11.141763687133789, 11.9048490524292, 12.66793441772461, 13.431020736694336, 14.194106101989746, 14.957191467285156, 15.720276832580566, 16.483362197875977, 17.246448516845703, 18.009532928466797, 18.772619247436523, 19.53570556640625, 20.298789978027344, 21.06187629699707, 21.824962615966797, 22.58804702758789, 23.351133346557617, 24.114219665527344, 24.877304077148438, 25.640390396118164, 26.40347671508789, 27.166561126708984]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 13.0, 19.0, 22.0, 34.0, 32.0, 53.0, 91.0, 142.0, 233.0, 481.0, 951.0, 2289.0, 6852.0, 26121.0, 140616.0, 640266.0, 185362.0, 31831.0, 8235.0, 2766.0, 985.0, 468.0, 248.0, 151.0, 92.0, 66.0, 34.0, 24.0, 26.0, 20.0, 6.0, 3.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.351318359375, -18.71826171875, -18.085205078125, -17.4521484375, -16.819091796875, -16.18603515625, -15.552978515625, -14.919921875, -14.286865234375, -13.65380859375, -13.020751953125, -12.3876953125, -11.754638671875, -11.12158203125, -10.488525390625, -9.85546875, -9.222412109375, -8.58935546875, -7.956298828125, -7.3232421875, -6.690185546875, -6.05712890625, -5.424072265625, -4.791015625, -4.157958984375, -3.52490234375, -2.891845703125, -2.2587890625, -1.625732421875, -0.99267578125, -0.359619140625, 0.2734375, 0.906494140625, 1.53955078125, 2.172607421875, 2.8056640625, 3.438720703125, 4.07177734375, 4.704833984375, 5.337890625, 5.970947265625, 6.60400390625, 7.237060546875, 7.8701171875, 8.503173828125, 9.13623046875, 9.769287109375, 10.40234375, 11.035400390625, 11.66845703125, 12.301513671875, 12.9345703125, 13.567626953125, 14.20068359375, 14.833740234375, 15.466796875, 16.099853515625, 16.73291015625, 17.365966796875, 17.9990234375, 18.632080078125, 19.26513671875, 19.898193359375, 20.53125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 10.0, 11.0, 14.0, 25.0, 28.0, 46.0, 53.0, 80.0, 101.0, 111.0, 102.0, 99.0, 91.0, 82.0, 49.0, 33.0, 22.0, 23.0, 8.0, 7.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4609375, -5.29595947265625, -5.1309814453125, -4.96600341796875, -4.801025390625, -4.63604736328125, -4.4710693359375, -4.30609130859375, -4.14111328125, -3.97613525390625, -3.8111572265625, -3.64617919921875, -3.481201171875, -3.31622314453125, -3.1512451171875, -2.98626708984375, -2.8212890625, -2.65631103515625, -2.4913330078125, -2.32635498046875, -2.161376953125, -1.99639892578125, -1.8314208984375, -1.66644287109375, -1.50146484375, -1.33648681640625, -1.1715087890625, -1.00653076171875, -0.841552734375, -0.67657470703125, -0.5115966796875, -0.34661865234375, -0.181640625, -0.01666259765625, 0.1483154296875, 0.31329345703125, 0.478271484375, 0.64324951171875, 0.8082275390625, 0.97320556640625, 1.13818359375, 1.30316162109375, 1.4681396484375, 1.63311767578125, 1.798095703125, 1.96307373046875, 2.1280517578125, 2.29302978515625, 2.4580078125, 2.62298583984375, 2.7879638671875, 2.95294189453125, 3.117919921875, 3.28289794921875, 3.4478759765625, 3.61285400390625, 3.77783203125, 3.94281005859375, 4.1077880859375, 4.27276611328125, 4.437744140625, 4.60272216796875, 4.7677001953125, 4.93267822265625, 5.09765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 18.0, 17.0, 30.0, 41.0, 60.0, 97.0, 205.0, 433.0, 1013.0, 3495.0, 17659.0, 143821.0, 703502.0, 153752.0, 18777.0, 3680.0, 1040.0, 438.0, 195.0, 105.0, 54.0, 33.0, 26.0, 13.0, 11.0, 11.0, 7.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.921875, -16.28369140625, -15.6455078125, -15.00732421875, -14.369140625, -13.73095703125, -13.0927734375, -12.45458984375, -11.81640625, -11.17822265625, -10.5400390625, -9.90185546875, -9.263671875, -8.62548828125, -7.9873046875, -7.34912109375, -6.7109375, -6.07275390625, -5.4345703125, -4.79638671875, -4.158203125, -3.52001953125, -2.8818359375, -2.24365234375, -1.60546875, -0.96728515625, -0.3291015625, 0.30908203125, 0.947265625, 1.58544921875, 2.2236328125, 2.86181640625, 3.5, 4.13818359375, 4.7763671875, 5.41455078125, 6.052734375, 6.69091796875, 7.3291015625, 7.96728515625, 8.60546875, 9.24365234375, 9.8818359375, 10.52001953125, 11.158203125, 11.79638671875, 12.4345703125, 13.07275390625, 13.7109375, 14.34912109375, 14.9873046875, 15.62548828125, 16.263671875, 16.90185546875, 17.5400390625, 18.17822265625, 18.81640625, 19.45458984375, 20.0927734375, 20.73095703125, 21.369140625, 22.00732421875, 22.6455078125, 23.28369140625, 23.921875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 4.0, 4.0, 7.0, 12.0, 14.0, 13.0, 9.0, 8.0, 18.0, 28.0, 22.0, 37.0, 41.0, 29.0, 55.0, 54.0, 41.0, 55.0, 49.0, 47.0, 41.0, 47.0, 45.0, 55.0, 58.0, 34.0, 36.0, 20.0, 17.0, 20.0, 13.0, 15.0, 14.0, 11.0, 5.0, 10.0, 4.0, 1.0, 6.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5859375, -11.215576171875, -10.84521484375, -10.474853515625, -10.1044921875, -9.734130859375, -9.36376953125, -8.993408203125, -8.623046875, -8.252685546875, -7.88232421875, -7.511962890625, -7.1416015625, -6.771240234375, -6.40087890625, -6.030517578125, -5.66015625, -5.289794921875, -4.91943359375, -4.549072265625, -4.1787109375, -3.808349609375, -3.43798828125, -3.067626953125, -2.697265625, -2.326904296875, -1.95654296875, -1.586181640625, -1.2158203125, -0.845458984375, -0.47509765625, -0.104736328125, 0.265625, 0.635986328125, 1.00634765625, 1.376708984375, 1.7470703125, 2.117431640625, 2.48779296875, 2.858154296875, 3.228515625, 3.598876953125, 3.96923828125, 4.339599609375, 4.7099609375, 5.080322265625, 5.45068359375, 5.821044921875, 6.19140625, 6.561767578125, 6.93212890625, 7.302490234375, 7.6728515625, 8.043212890625, 8.41357421875, 8.783935546875, 9.154296875, 9.524658203125, 9.89501953125, 10.265380859375, 10.6357421875, 11.006103515625, 11.37646484375, 11.746826171875, 12.1171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 13.0, 30.0, 47.0, 105.0, 225.0, 482.0, 1397.0, 4684.0, 20669.0, 159413.0, 761525.0, 81609.0, 13318.0, 3340.0, 1016.0, 360.0, 155.0, 74.0, 46.0, 19.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6875, -13.348388671875, -13.00927734375, -12.670166015625, -12.3310546875, -11.991943359375, -11.65283203125, -11.313720703125, -10.974609375, -10.635498046875, -10.29638671875, -9.957275390625, -9.6181640625, -9.279052734375, -8.93994140625, -8.600830078125, -8.26171875, -7.922607421875, -7.58349609375, -7.244384765625, -6.9052734375, -6.566162109375, -6.22705078125, -5.887939453125, -5.548828125, -5.209716796875, -4.87060546875, -4.531494140625, -4.1923828125, -3.853271484375, -3.51416015625, -3.175048828125, -2.8359375, -2.496826171875, -2.15771484375, -1.818603515625, -1.4794921875, -1.140380859375, -0.80126953125, -0.462158203125, -0.123046875, 0.216064453125, 0.55517578125, 0.894287109375, 1.2333984375, 1.572509765625, 1.91162109375, 2.250732421875, 2.58984375, 2.928955078125, 3.26806640625, 3.607177734375, 3.9462890625, 4.285400390625, 4.62451171875, 4.963623046875, 5.302734375, 5.641845703125, 5.98095703125, 6.320068359375, 6.6591796875, 6.998291015625, 7.33740234375, 7.676513671875, 8.015625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 8.0, 3.0, 7.0, 9.0, 12.0, 8.0, 17.0, 33.0, 50.0, 92.0, 207.0, 243.0, 125.0, 65.0, 35.0, 18.0, 14.0, 15.0, 8.0, 7.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00214385986328125, -0.002083003520965576, -0.0020221471786499023, -0.0019612908363342285, -0.0019004344940185547, -0.0018395781517028809, -0.001778721809387207, -0.0017178654670715332, -0.0016570091247558594, -0.0015961527824401855, -0.0015352964401245117, -0.0014744400978088379, -0.001413583755493164, -0.0013527274131774902, -0.0012918710708618164, -0.0012310147285461426, -0.0011701583862304688, -0.001109302043914795, -0.001048445701599121, -0.0009875893592834473, -0.0009267330169677734, -0.0008658766746520996, -0.0008050203323364258, -0.000744163990020752, -0.0006833076477050781, -0.0006224513053894043, -0.0005615949630737305, -0.0005007386207580566, -0.0004398822784423828, -0.000379025936126709, -0.00031816959381103516, -0.00025731325149536133, -0.0001964569091796875, -0.00013560056686401367, -7.474422454833984e-05, -1.3887882232666016e-05, 4.696846008300781e-05, 0.00010782480239868164, 0.00016868114471435547, 0.0002295374870300293, 0.0002903938293457031, 0.00035125017166137695, 0.0004121065139770508, 0.0004729628562927246, 0.0005338191986083984, 0.0005946755409240723, 0.0006555318832397461, 0.0007163882255554199, 0.0007772445678710938, 0.0008381009101867676, 0.0008989572525024414, 0.0009598135948181152, 0.001020669937133789, 0.0010815262794494629, 0.0011423826217651367, 0.0012032389640808105, 0.0012640953063964844, 0.0013249516487121582, 0.001385807991027832, 0.0014466643333435059, 0.0015075206756591797, 0.0015683770179748535, 0.0016292333602905273, 0.0016900897026062012, 0.001750946044921875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 7.0, 8.0, 11.0, 14.0, 27.0, 28.0, 45.0, 74.0, 138.0, 245.0, 446.0, 1140.0, 2693.0, 7920.0, 25196.0, 103417.0, 704934.0, 154465.0, 32021.0, 9880.0, 3329.0, 1261.0, 584.0, 286.0, 127.0, 89.0, 55.0, 40.0, 14.0, 14.0, 12.0, 11.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.7109375, -8.4437255859375, -8.176513671875, -7.9093017578125, -7.64208984375, -7.3748779296875, -7.107666015625, -6.8404541015625, -6.5732421875, -6.3060302734375, -6.038818359375, -5.7716064453125, -5.50439453125, -5.2371826171875, -4.969970703125, -4.7027587890625, -4.435546875, -4.1683349609375, -3.901123046875, -3.6339111328125, -3.36669921875, -3.0994873046875, -2.832275390625, -2.5650634765625, -2.2978515625, -2.0306396484375, -1.763427734375, -1.4962158203125, -1.22900390625, -0.9617919921875, -0.694580078125, -0.4273681640625, -0.16015625, 0.1070556640625, 0.374267578125, 0.6414794921875, 0.90869140625, 1.1759033203125, 1.443115234375, 1.7103271484375, 1.9775390625, 2.2447509765625, 2.511962890625, 2.7791748046875, 3.04638671875, 3.3135986328125, 3.580810546875, 3.8480224609375, 4.115234375, 4.3824462890625, 4.649658203125, 4.9168701171875, 5.18408203125, 5.4512939453125, 5.718505859375, 5.9857177734375, 6.2529296875, 6.5201416015625, 6.787353515625, 7.0545654296875, 7.32177734375, 7.5889892578125, 7.856201171875, 8.1234130859375, 8.390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 6.0, 5.0, 3.0, 6.0, 8.0, 15.0, 22.0, 23.0, 31.0, 63.0, 107.0, 143.0, 175.0, 128.0, 88.0, 61.0, 35.0, 24.0, 10.0, 12.0, 11.0, 4.0, 8.0, 2.0, 7.0, 5.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40234375, -7.1671142578125, -6.931884765625, -6.6966552734375, -6.46142578125, -6.2261962890625, -5.990966796875, -5.7557373046875, -5.5205078125, -5.2852783203125, -5.050048828125, -4.8148193359375, -4.57958984375, -4.3443603515625, -4.109130859375, -3.8739013671875, -3.638671875, -3.4034423828125, -3.168212890625, -2.9329833984375, -2.69775390625, -2.4625244140625, -2.227294921875, -1.9920654296875, -1.7568359375, -1.5216064453125, -1.286376953125, -1.0511474609375, -0.81591796875, -0.5806884765625, -0.345458984375, -0.1102294921875, 0.125, 0.3602294921875, 0.595458984375, 0.8306884765625, 1.06591796875, 1.3011474609375, 1.536376953125, 1.7716064453125, 2.0068359375, 2.2420654296875, 2.477294921875, 2.7125244140625, 2.94775390625, 3.1829833984375, 3.418212890625, 3.6534423828125, 3.888671875, 4.1239013671875, 4.359130859375, 4.5943603515625, 4.82958984375, 5.0648193359375, 5.300048828125, 5.5352783203125, 5.7705078125, 6.0057373046875, 6.240966796875, 6.4761962890625, 6.71142578125, 6.9466552734375, 7.181884765625, 7.4171142578125, 7.65234375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 8.0, 19.0, 17.0, 29.0, 73.0, 96.0, 144.0, 147.0, 129.0, 137.0, 90.0, 52.0, 28.0, 10.0, 11.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-95.45228576660156, -92.02389526367188, -88.59550476074219, -85.1671142578125, -81.73873138427734, -78.31034088134766, -74.88195037841797, -71.45355987548828, -68.02517700195312, -64.59678649902344, -61.168399810791016, -57.74000930786133, -54.311622619628906, -50.88323211669922, -47.45484161376953, -44.026451110839844, -40.598060607910156, -37.16967010498047, -33.74128341674805, -30.31289291381836, -26.884504318237305, -23.45611572265625, -20.027725219726562, -16.599336624145508, -13.170948028564453, -9.742559432983398, -6.314169883728027, -2.8857803344726562, 0.5426082611083984, 3.970996856689453, 7.399387359619141, 10.827775955200195, 14.25616455078125, 17.684553146362305, 21.11294174194336, 24.541332244873047, 27.9697208404541, 31.398109436035156, 34.826499938964844, 38.25489044189453, 41.68327713012695, 45.11166763305664, 48.54005432128906, 51.96844482421875, 55.39683532714844, 58.82522201538086, 62.25361251831055, 65.68199920654297, 69.11038970947266, 72.53878021240234, 75.96717071533203, 79.39555358886719, 82.82394409179688, 86.25233459472656, 89.68072509765625, 93.10911560058594, 96.53750610351562, 99.96589660644531, 103.394287109375, 106.82267761230469, 110.25106048583984, 113.67945098876953, 117.10784149169922, 120.5362319946289, 123.96461486816406]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 6.0, 7.0, 12.0, 12.0, 11.0, 8.0, 11.0, 22.0, 24.0, 23.0, 26.0, 33.0, 33.0, 37.0, 36.0, 54.0, 44.0, 49.0, 46.0, 38.0, 40.0, 46.0, 37.0, 32.0, 36.0, 38.0, 35.0, 25.0, 32.0, 27.0, 16.0, 9.0, 13.0, 16.0, 9.0, 12.0, 10.0, 6.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0], "bins": [-66.17778015136719, -64.39293670654297, -62.60809326171875, -60.82324981689453, -59.03840637207031, -57.253562927246094, -55.468719482421875, -53.683876037597656, -51.89903259277344, -50.11418914794922, -48.329345703125, -46.54450225830078, -44.75965881347656, -42.974815368652344, -41.189971923828125, -39.405128479003906, -37.62028503417969, -35.83544158935547, -34.05059814453125, -32.26575469970703, -30.480911254882812, -28.696067810058594, -26.911224365234375, -25.126380920410156, -23.341537475585938, -21.55669403076172, -19.7718505859375, -17.98700714111328, -16.202163696289062, -14.417320251464844, -12.632476806640625, -10.847633361816406, -9.062793731689453, -7.277950286865234, -5.493106842041016, -3.708263397216797, -1.9234199523925781, -0.13857650756835938, 1.6462669372558594, 3.431110382080078, 5.215953826904297, 7.000797271728516, 8.785640716552734, 10.570484161376953, 12.355327606201172, 14.14017105102539, 15.92501449584961, 17.709857940673828, 19.494701385498047, 21.279544830322266, 23.064388275146484, 24.849231719970703, 26.634075164794922, 28.41891860961914, 30.20376205444336, 31.988605499267578, 33.7734489440918, 35.558292388916016, 37.343135833740234, 39.12797927856445, 40.91282272338867, 42.69766616821289, 44.48250961303711, 46.26735305786133, 48.05219650268555]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 8.0, 7.0, 6.0, 16.0, 16.0, 22.0, 31.0, 73.0, 113.0, 234.0, 563.0, 1840.0, 10884.0, 1135923.0, 3029488.0, 12081.0, 1988.0, 548.0, 191.0, 109.0, 66.0, 24.0, 17.0, 11.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.625, -57.9697265625, -56.314453125, -54.6591796875, -53.00390625, -51.3486328125, -49.693359375, -48.0380859375, -46.3828125, -44.7275390625, -43.072265625, -41.4169921875, -39.76171875, -38.1064453125, -36.451171875, -34.7958984375, -33.140625, -31.4853515625, -29.830078125, -28.1748046875, -26.51953125, -24.8642578125, -23.208984375, -21.5537109375, -19.8984375, -18.2431640625, -16.587890625, -14.9326171875, -13.27734375, -11.6220703125, -9.966796875, -8.3115234375, -6.65625, -5.0009765625, -3.345703125, -1.6904296875, -0.03515625, 1.6201171875, 3.275390625, 4.9306640625, 6.5859375, 8.2412109375, 9.896484375, 11.5517578125, 13.20703125, 14.8623046875, 16.517578125, 18.1728515625, 19.828125, 21.4833984375, 23.138671875, 24.7939453125, 26.44921875, 28.1044921875, 29.759765625, 31.4150390625, 33.0703125, 34.7255859375, 36.380859375, 38.0361328125, 39.69140625, 41.3466796875, 43.001953125, 44.6572265625, 46.3125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 7.0, 6.0, 13.0, 18.0, 19.0, 40.0, 47.0, 59.0, 72.0, 78.0, 71.0, 91.0, 74.0, 84.0, 66.0, 57.0, 49.0, 42.0, 30.0, 21.0, 22.0, 8.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.94921875, -3.807373046875, -3.66552734375, -3.523681640625, -3.3818359375, -3.239990234375, -3.09814453125, -2.956298828125, -2.814453125, -2.672607421875, -2.53076171875, -2.388916015625, -2.2470703125, -2.105224609375, -1.96337890625, -1.821533203125, -1.6796875, -1.537841796875, -1.39599609375, -1.254150390625, -1.1123046875, -0.970458984375, -0.82861328125, -0.686767578125, -0.544921875, -0.403076171875, -0.26123046875, -0.119384765625, 0.0224609375, 0.164306640625, 0.30615234375, 0.447998046875, 0.58984375, 0.731689453125, 0.87353515625, 1.015380859375, 1.1572265625, 1.299072265625, 1.44091796875, 1.582763671875, 1.724609375, 1.866455078125, 2.00830078125, 2.150146484375, 2.2919921875, 2.433837890625, 2.57568359375, 2.717529296875, 2.859375, 3.001220703125, 3.14306640625, 3.284912109375, 3.4267578125, 3.568603515625, 3.71044921875, 3.852294921875, 3.994140625, 4.135986328125, 4.27783203125, 4.419677734375, 4.5615234375, 4.703369140625, 4.84521484375, 4.987060546875, 5.12890625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 9.0, 19.0, 38.0, 66.0, 134.0, 244.0, 722.0, 2228.0, 9519.0, 72417.0, 3926300.0, 163070.0, 14908.0, 3048.0, 935.0, 316.0, 151.0, 58.0, 39.0, 21.0, 9.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.59375, -43.547607421875, -42.50146484375, -41.455322265625, -40.4091796875, -39.363037109375, -38.31689453125, -37.270751953125, -36.224609375, -35.178466796875, -34.13232421875, -33.086181640625, -32.0400390625, -30.993896484375, -29.94775390625, -28.901611328125, -27.85546875, -26.809326171875, -25.76318359375, -24.717041015625, -23.6708984375, -22.624755859375, -21.57861328125, -20.532470703125, -19.486328125, -18.440185546875, -17.39404296875, -16.347900390625, -15.3017578125, -14.255615234375, -13.20947265625, -12.163330078125, -11.1171875, -10.071044921875, -9.02490234375, -7.978759765625, -6.9326171875, -5.886474609375, -4.84033203125, -3.794189453125, -2.748046875, -1.701904296875, -0.65576171875, 0.390380859375, 1.4365234375, 2.482666015625, 3.52880859375, 4.574951171875, 5.62109375, 6.667236328125, 7.71337890625, 8.759521484375, 9.8056640625, 10.851806640625, 11.89794921875, 12.944091796875, 13.990234375, 15.036376953125, 16.08251953125, 17.128662109375, 18.1748046875, 19.220947265625, 20.26708984375, 21.313232421875, 22.359375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 4.0, 10.0, 10.0, 18.0, 24.0, 15.0, 37.0, 66.0, 106.0, 267.0, 913.0, 1720.0, 437.0, 165.0, 92.0, 56.0, 26.0, 25.0, 22.0, 19.0, 5.0, 8.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-9.3515625, -9.1298828125, -8.908203125, -8.6865234375, -8.46484375, -8.2431640625, -8.021484375, -7.7998046875, -7.578125, -7.3564453125, -7.134765625, -6.9130859375, -6.69140625, -6.4697265625, -6.248046875, -6.0263671875, -5.8046875, -5.5830078125, -5.361328125, -5.1396484375, -4.91796875, -4.6962890625, -4.474609375, -4.2529296875, -4.03125, -3.8095703125, -3.587890625, -3.3662109375, -3.14453125, -2.9228515625, -2.701171875, -2.4794921875, -2.2578125, -2.0361328125, -1.814453125, -1.5927734375, -1.37109375, -1.1494140625, -0.927734375, -0.7060546875, -0.484375, -0.2626953125, -0.041015625, 0.1806640625, 0.40234375, 0.6240234375, 0.845703125, 1.0673828125, 1.2890625, 1.5107421875, 1.732421875, 1.9541015625, 2.17578125, 2.3974609375, 2.619140625, 2.8408203125, 3.0625, 3.2841796875, 3.505859375, 3.7275390625, 3.94921875, 4.1708984375, 4.392578125, 4.6142578125, 4.8359375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 24.0, 46.0, 102.0, 183.0, 257.0, 194.0, 111.0, 48.0, 24.0, 6.0, 6.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.7572021484375, -53.34828567504883, -50.93936538696289, -48.53044891357422, -46.12153244018555, -43.712615966796875, -41.30369567871094, -38.894779205322266, -36.485862731933594, -34.07694625854492, -31.668027877807617, -29.259109497070312, -26.85019302368164, -24.441274642944336, -22.03235626220703, -19.62343978881836, -17.214519500732422, -14.805602073669434, -12.396684646606445, -9.98776626586914, -7.578848838806152, -5.169931411743164, -2.7610130310058594, -0.3520965576171875, 2.056821823120117, 4.4657392501831055, 6.874657154083252, 9.283575057983398, 11.692492485046387, 14.101409912109375, 16.51032829284668, 18.91924476623535, 21.328163146972656, 23.73708152770996, 26.145998001098633, 28.554916381835938, 30.96383285522461, 33.37274932861328, 35.78166961669922, 38.19058609008789, 40.59950256347656, 43.008419036865234, 45.41733932495117, 47.826255798339844, 50.235172271728516, 52.64408874511719, 55.053009033203125, 57.4619255065918, 59.870845794677734, 62.279762268066406, 64.68868255615234, 67.09759521484375, 69.50651550292969, 71.91543579101562, 74.32435607910156, 76.73326873779297, 79.1421890258789, 81.55110931396484, 83.96002197265625, 86.36894226074219, 88.77786254882812, 91.18677520751953, 93.59569549560547, 96.00460815429688, 98.41352844238281]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 6.0, 7.0, 9.0, 10.0, 9.0, 17.0, 27.0, 33.0, 32.0, 38.0, 34.0, 36.0, 55.0, 42.0, 46.0, 44.0, 41.0, 55.0, 49.0, 38.0, 40.0, 51.0, 42.0, 47.0, 28.0, 30.0, 26.0, 32.0, 16.0, 19.0, 11.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.991661071777344, -25.238811492919922, -24.485963821411133, -23.73311424255371, -22.980266571044922, -22.2274169921875, -21.474567413330078, -20.72171974182129, -19.968870162963867, -19.216020584106445, -18.463172912597656, -17.710323333740234, -16.957475662231445, -16.204626083374023, -15.451777458190918, -14.698928833007812, -13.946080207824707, -13.193231582641602, -12.440382957458496, -11.68753433227539, -10.934684753417969, -10.181836128234863, -9.428987503051758, -8.676137924194336, -7.923289775848389, -7.170441150665283, -6.4175920486450195, -5.664743423461914, -4.911894798278809, -4.159045696258545, -3.4061970710754395, -2.653347969055176, -1.9004993438720703, -1.1476504802703857, -0.3948017358779907, 0.3580470085144043, 1.1108958721160889, 1.8637447357177734, 2.616593360900879, 3.3694424629211426, 4.122291088104248, 4.8751397132873535, 5.627988815307617, 6.380837440490723, 7.133686065673828, 7.886535167694092, 8.639383316040039, 9.392232894897461, 10.145081520080566, 10.897930145263672, 11.650778770446777, 12.403627395629883, 13.156476974487305, 13.90932559967041, 14.662174224853516, 15.415023803710938, 16.167871475219727, 16.92072105407715, 17.673568725585938, 18.42641830444336, 19.17926597595215, 19.93211555480957, 20.68496322631836, 21.43781280517578, 22.190662384033203]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 8.0, 0.0, 1.0, 4.0, 1.0, 9.0, 13.0, 15.0, 21.0, 31.0, 46.0, 94.0, 163.0, 278.0, 462.0, 956.0, 2205.0, 6003.0, 18568.0, 66088.0, 282279.0, 485859.0, 133863.0, 34722.0, 10366.0, 3565.0, 1464.0, 608.0, 351.0, 208.0, 119.0, 69.0, 48.0, 18.0, 25.0, 13.0, 15.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.75, -11.24462890625, -10.7392578125, -10.23388671875, -9.728515625, -9.22314453125, -8.7177734375, -8.21240234375, -7.70703125, -7.20166015625, -6.6962890625, -6.19091796875, -5.685546875, -5.18017578125, -4.6748046875, -4.16943359375, -3.6640625, -3.15869140625, -2.6533203125, -2.14794921875, -1.642578125, -1.13720703125, -0.6318359375, -0.12646484375, 0.37890625, 0.88427734375, 1.3896484375, 1.89501953125, 2.400390625, 2.90576171875, 3.4111328125, 3.91650390625, 4.421875, 4.92724609375, 5.4326171875, 5.93798828125, 6.443359375, 6.94873046875, 7.4541015625, 7.95947265625, 8.46484375, 8.97021484375, 9.4755859375, 9.98095703125, 10.486328125, 10.99169921875, 11.4970703125, 12.00244140625, 12.5078125, 13.01318359375, 13.5185546875, 14.02392578125, 14.529296875, 15.03466796875, 15.5400390625, 16.04541015625, 16.55078125, 17.05615234375, 17.5615234375, 18.06689453125, 18.572265625, 19.07763671875, 19.5830078125, 20.08837890625, 20.59375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 15.0, 13.0, 15.0, 32.0, 33.0, 54.0, 55.0, 72.0, 84.0, 66.0, 85.0, 84.0, 61.0, 65.0, 59.0, 59.0, 40.0, 26.0, 23.0, 16.0, 17.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6484375, -4.50189208984375, -4.3553466796875, -4.20880126953125, -4.062255859375, -3.91571044921875, -3.7691650390625, -3.62261962890625, -3.47607421875, -3.32952880859375, -3.1829833984375, -3.03643798828125, -2.889892578125, -2.74334716796875, -2.5968017578125, -2.45025634765625, -2.3037109375, -2.15716552734375, -2.0106201171875, -1.86407470703125, -1.717529296875, -1.57098388671875, -1.4244384765625, -1.27789306640625, -1.13134765625, -0.98480224609375, -0.8382568359375, -0.69171142578125, -0.545166015625, -0.39862060546875, -0.2520751953125, -0.10552978515625, 0.041015625, 0.18756103515625, 0.3341064453125, 0.48065185546875, 0.627197265625, 0.77374267578125, 0.9202880859375, 1.06683349609375, 1.21337890625, 1.35992431640625, 1.5064697265625, 1.65301513671875, 1.799560546875, 1.94610595703125, 2.0926513671875, 2.23919677734375, 2.3857421875, 2.53228759765625, 2.6788330078125, 2.82537841796875, 2.971923828125, 3.11846923828125, 3.2650146484375, 3.41156005859375, 3.55810546875, 3.70465087890625, 3.8511962890625, 3.99774169921875, 4.144287109375, 4.29083251953125, 4.4373779296875, 4.58392333984375, 4.73046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 2.0, 6.0, 4.0, 6.0, 11.0, 18.0, 38.0, 42.0, 66.0, 160.0, 291.0, 735.0, 2155.0, 7722.0, 37144.0, 220886.0, 607693.0, 138647.0, 24506.0, 5634.0, 1660.0, 572.0, 246.0, 118.0, 65.0, 35.0, 19.0, 17.0, 7.0, 11.0, 5.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.671875, -17.108642578125, -16.54541015625, -15.982177734375, -15.4189453125, -14.855712890625, -14.29248046875, -13.729248046875, -13.166015625, -12.602783203125, -12.03955078125, -11.476318359375, -10.9130859375, -10.349853515625, -9.78662109375, -9.223388671875, -8.66015625, -8.096923828125, -7.53369140625, -6.970458984375, -6.4072265625, -5.843994140625, -5.28076171875, -4.717529296875, -4.154296875, -3.591064453125, -3.02783203125, -2.464599609375, -1.9013671875, -1.338134765625, -0.77490234375, -0.211669921875, 0.3515625, 0.914794921875, 1.47802734375, 2.041259765625, 2.6044921875, 3.167724609375, 3.73095703125, 4.294189453125, 4.857421875, 5.420654296875, 5.98388671875, 6.547119140625, 7.1103515625, 7.673583984375, 8.23681640625, 8.800048828125, 9.36328125, 9.926513671875, 10.48974609375, 11.052978515625, 11.6162109375, 12.179443359375, 12.74267578125, 13.305908203125, 13.869140625, 14.432373046875, 14.99560546875, 15.558837890625, 16.1220703125, 16.685302734375, 17.24853515625, 17.811767578125, 18.375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 4.0, 12.0, 15.0, 19.0, 17.0, 25.0, 30.0, 33.0, 39.0, 36.0, 32.0, 44.0, 48.0, 49.0, 51.0, 60.0, 51.0, 37.0, 38.0, 58.0, 53.0, 47.0, 34.0, 30.0, 22.0, 21.0, 14.0, 22.0, 10.0, 15.0, 9.0, 5.0, 4.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.609375, -11.18701171875, -10.7646484375, -10.34228515625, -9.919921875, -9.49755859375, -9.0751953125, -8.65283203125, -8.23046875, -7.80810546875, -7.3857421875, -6.96337890625, -6.541015625, -6.11865234375, -5.6962890625, -5.27392578125, -4.8515625, -4.42919921875, -4.0068359375, -3.58447265625, -3.162109375, -2.73974609375, -2.3173828125, -1.89501953125, -1.47265625, -1.05029296875, -0.6279296875, -0.20556640625, 0.216796875, 0.63916015625, 1.0615234375, 1.48388671875, 1.90625, 2.32861328125, 2.7509765625, 3.17333984375, 3.595703125, 4.01806640625, 4.4404296875, 4.86279296875, 5.28515625, 5.70751953125, 6.1298828125, 6.55224609375, 6.974609375, 7.39697265625, 7.8193359375, 8.24169921875, 8.6640625, 9.08642578125, 9.5087890625, 9.93115234375, 10.353515625, 10.77587890625, 11.1982421875, 11.62060546875, 12.04296875, 12.46533203125, 12.8876953125, 13.31005859375, 13.732421875, 14.15478515625, 14.5771484375, 14.99951171875, 15.421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 2.0, 6.0, 11.0, 12.0, 19.0, 28.0, 53.0, 54.0, 102.0, 137.0, 212.0, 402.0, 878.0, 2234.0, 10209.0, 116679.0, 870219.0, 38852.0, 5378.0, 1552.0, 663.0, 329.0, 191.0, 99.0, 77.0, 44.0, 23.0, 28.0, 13.0, 13.0, 5.0, 9.0, 7.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.921875, -23.28076171875, -22.6396484375, -21.99853515625, -21.357421875, -20.71630859375, -20.0751953125, -19.43408203125, -18.79296875, -18.15185546875, -17.5107421875, -16.86962890625, -16.228515625, -15.58740234375, -14.9462890625, -14.30517578125, -13.6640625, -13.02294921875, -12.3818359375, -11.74072265625, -11.099609375, -10.45849609375, -9.8173828125, -9.17626953125, -8.53515625, -7.89404296875, -7.2529296875, -6.61181640625, -5.970703125, -5.32958984375, -4.6884765625, -4.04736328125, -3.40625, -2.76513671875, -2.1240234375, -1.48291015625, -0.841796875, -0.20068359375, 0.4404296875, 1.08154296875, 1.72265625, 2.36376953125, 3.0048828125, 3.64599609375, 4.287109375, 4.92822265625, 5.5693359375, 6.21044921875, 6.8515625, 7.49267578125, 8.1337890625, 8.77490234375, 9.416015625, 10.05712890625, 10.6982421875, 11.33935546875, 11.98046875, 12.62158203125, 13.2626953125, 13.90380859375, 14.544921875, 15.18603515625, 15.8271484375, 16.46826171875, 17.109375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 7.0, 3.0, 9.0, 5.0, 19.0, 15.0, 34.0, 42.0, 39.0, 85.0, 224.0, 206.0, 117.0, 66.0, 35.0, 28.0, 22.0, 12.0, 10.0, 9.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.002765655517578125, -0.002699941396713257, -0.0026342272758483887, -0.0025685131549835205, -0.0025027990341186523, -0.002437084913253784, -0.002371370792388916, -0.002305656671524048, -0.0022399425506591797, -0.0021742284297943115, -0.0021085143089294434, -0.002042800188064575, -0.001977086067199707, -0.0019113719463348389, -0.0018456578254699707, -0.0017799437046051025, -0.0017142295837402344, -0.0016485154628753662, -0.001582801342010498, -0.0015170872211456299, -0.0014513731002807617, -0.0013856589794158936, -0.0013199448585510254, -0.0012542307376861572, -0.001188516616821289, -0.001122802495956421, -0.0010570883750915527, -0.0009913742542266846, -0.0009256601333618164, -0.0008599460124969482, -0.0007942318916320801, -0.0007285177707672119, -0.0006628036499023438, -0.0005970895290374756, -0.0005313754081726074, -0.00046566128730773926, -0.0003999471664428711, -0.00033423304557800293, -0.00026851892471313477, -0.0002028048038482666, -0.00013709068298339844, -7.137656211853027e-05, -5.662441253662109e-06, 6.0051679611206055e-05, 0.00012576580047607422, 0.00019147992134094238, 0.00025719404220581055, 0.0003229081630706787, 0.0003886222839355469, 0.00045433640480041504, 0.0005200505256652832, 0.0005857646465301514, 0.0006514787673950195, 0.0007171928882598877, 0.0007829070091247559, 0.000848621129989624, 0.0009143352508544922, 0.0009800493717193604, 0.0010457634925842285, 0.0011114776134490967, 0.0011771917343139648, 0.001242905855178833, 0.0013086199760437012, 0.0013743340969085693, 0.0014400482177734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 9.0, 17.0, 18.0, 28.0, 57.0, 122.0, 282.0, 1091.0, 6676.0, 126394.0, 893892.0, 17107.0, 2007.0, 497.0, 179.0, 80.0, 43.0, 20.0, 15.0, 8.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-43.0625, -42.109619140625, -41.15673828125, -40.203857421875, -39.2509765625, -38.298095703125, -37.34521484375, -36.392333984375, -35.439453125, -34.486572265625, -33.53369140625, -32.580810546875, -31.6279296875, -30.675048828125, -29.72216796875, -28.769287109375, -27.81640625, -26.863525390625, -25.91064453125, -24.957763671875, -24.0048828125, -23.052001953125, -22.09912109375, -21.146240234375, -20.193359375, -19.240478515625, -18.28759765625, -17.334716796875, -16.3818359375, -15.428955078125, -14.47607421875, -13.523193359375, -12.5703125, -11.617431640625, -10.66455078125, -9.711669921875, -8.7587890625, -7.805908203125, -6.85302734375, -5.900146484375, -4.947265625, -3.994384765625, -3.04150390625, -2.088623046875, -1.1357421875, -0.182861328125, 0.77001953125, 1.722900390625, 2.67578125, 3.628662109375, 4.58154296875, 5.534423828125, 6.4873046875, 7.440185546875, 8.39306640625, 9.345947265625, 10.298828125, 11.251708984375, 12.20458984375, 13.157470703125, 14.1103515625, 15.063232421875, 16.01611328125, 16.968994140625, 17.921875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 3.0, 9.0, 20.0, 23.0, 34.0, 83.0, 196.0, 314.0, 144.0, 64.0, 40.0, 21.0, 23.0, 2.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.21875, -18.7305908203125, -18.242431640625, -17.7542724609375, -17.26611328125, -16.7779541015625, -16.289794921875, -15.8016357421875, -15.3134765625, -14.8253173828125, -14.337158203125, -13.8489990234375, -13.36083984375, -12.8726806640625, -12.384521484375, -11.8963623046875, -11.408203125, -10.9200439453125, -10.431884765625, -9.9437255859375, -9.45556640625, -8.9674072265625, -8.479248046875, -7.9910888671875, -7.5029296875, -7.0147705078125, -6.526611328125, -6.0384521484375, -5.55029296875, -5.0621337890625, -4.573974609375, -4.0858154296875, -3.59765625, -3.1094970703125, -2.621337890625, -2.1331787109375, -1.64501953125, -1.1568603515625, -0.668701171875, -0.1805419921875, 0.3076171875, 0.7957763671875, 1.283935546875, 1.7720947265625, 2.26025390625, 2.7484130859375, 3.236572265625, 3.7247314453125, 4.212890625, 4.7010498046875, 5.189208984375, 5.6773681640625, 6.16552734375, 6.6536865234375, 7.141845703125, 7.6300048828125, 8.1181640625, 8.6063232421875, 9.094482421875, 9.5826416015625, 10.07080078125, 10.5589599609375, 11.047119140625, 11.5352783203125, 12.0234375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 10.0, 37.0, 62.0, 118.0, 227.0, 262.0, 179.0, 71.0, 30.0, 7.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.67164611816406, -156.66128540039062, -149.6509246826172, -142.64056396484375, -135.63021850585938, -128.61984252929688, -121.6094970703125, -114.59913635253906, -107.58877563476562, -100.57841491699219, -93.56805419921875, -86.55770111083984, -79.5473403930664, -72.53697967529297, -65.52662658691406, -58.516265869140625, -51.50590515136719, -44.49554443359375, -37.48518753051758, -30.474828720092773, -23.46446990966797, -16.45410919189453, -9.44375228881836, -2.4333953857421875, 4.57696533203125, 11.587324142456055, 18.59768295288086, 25.608041763305664, 32.61840057373047, 39.628761291503906, 46.63911819458008, 53.64947509765625, 60.659820556640625, 67.67018127441406, 74.6805419921875, 81.6908950805664, 88.70125579833984, 95.71161651611328, 102.72196960449219, 109.73233032226562, 116.74269104003906, 123.7530517578125, 130.76341247558594, 137.77377319335938, 144.78411865234375, 151.79449462890625, 158.80484008789062, 165.81520080566406, 172.8255615234375, 179.83592224121094, 186.84628295898438, 193.8566436767578, 200.86700439453125, 207.87734985351562, 214.88771057128906, 221.8980712890625, 228.90843200683594, 235.91879272460938, 242.9291534423828, 249.93951416015625, 256.9498596191406, 263.9602355957031, 270.9705810546875, 277.98095703125, 284.9913024902344]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 8.0, 9.0, 9.0, 14.0, 22.0, 18.0, 12.0, 18.0, 24.0, 30.0, 26.0, 30.0, 34.0, 39.0, 39.0, 44.0, 48.0, 52.0, 38.0, 46.0, 36.0, 39.0, 41.0, 31.0, 39.0, 29.0, 25.0, 25.0, 21.0, 19.0, 26.0, 27.0, 16.0, 12.0, 12.0, 3.0, 5.0, 5.0, 7.0, 4.0, 3.0, 3.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-52.840850830078125, -51.15983963012695, -49.478824615478516, -47.797813415527344, -46.116798400878906, -44.435787200927734, -42.7547721862793, -41.073760986328125, -39.39274597167969, -37.711734771728516, -36.03071975708008, -34.349708557128906, -32.66869354248047, -30.987682342529297, -29.30666732788086, -27.625656127929688, -25.944643020629883, -24.263629913330078, -22.582616806030273, -20.90160369873047, -19.220590591430664, -17.53957748413086, -15.858565330505371, -14.177552223205566, -12.496539115905762, -10.815526008605957, -9.134512901306152, -7.453500270843506, -5.772487163543701, -4.091474533081055, -2.41046142578125, -0.7294483184814453, 0.9515647888183594, 2.632577896118164, 4.313591003417969, 5.994603633880615, 7.67561674118042, 9.356629371643066, 11.037642478942871, 12.718655586242676, 14.39966869354248, 16.08068084716797, 17.761693954467773, 19.442707061767578, 21.123720169067383, 22.804733276367188, 24.485746383666992, 26.166759490966797, 27.8477725982666, 29.528785705566406, 31.20979881286621, 32.890811920166016, 34.57182312011719, 36.252838134765625, 37.9338493347168, 39.614864349365234, 41.295875549316406, 42.97688674926758, 44.657901763916016, 46.33891296386719, 48.019927978515625, 49.7009391784668, 51.381954193115234, 53.062965393066406, 54.743980407714844]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 5.0, 11.0, 3.0, 7.0, 12.0, 9.0, 13.0, 19.0, 41.0, 67.0, 65.0, 112.0, 220.0, 354.0, 674.0, 1412.0, 3272.0, 9423.0, 39588.0, 3373648.0, 719151.0, 31855.0, 8368.0, 3075.0, 1273.0, 696.0, 345.0, 194.0, 136.0, 69.0, 54.0, 32.0, 17.0, 8.0, 17.0, 6.0, 9.0, 4.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-41.53125, -40.464599609375, -39.39794921875, -38.331298828125, -37.2646484375, -36.197998046875, -35.13134765625, -34.064697265625, -32.998046875, -31.931396484375, -30.86474609375, -29.798095703125, -28.7314453125, -27.664794921875, -26.59814453125, -25.531494140625, -24.46484375, -23.398193359375, -22.33154296875, -21.264892578125, -20.1982421875, -19.131591796875, -18.06494140625, -16.998291015625, -15.931640625, -14.864990234375, -13.79833984375, -12.731689453125, -11.6650390625, -10.598388671875, -9.53173828125, -8.465087890625, -7.3984375, -6.331787109375, -5.26513671875, -4.198486328125, -3.1318359375, -2.065185546875, -0.99853515625, 0.068115234375, 1.134765625, 2.201416015625, 3.26806640625, 4.334716796875, 5.4013671875, 6.468017578125, 7.53466796875, 8.601318359375, 9.66796875, 10.734619140625, 11.80126953125, 12.867919921875, 13.9345703125, 15.001220703125, 16.06787109375, 17.134521484375, 18.201171875, 19.267822265625, 20.33447265625, 21.401123046875, 22.4677734375, 23.534423828125, 24.60107421875, 25.667724609375, 26.734375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 14.0, 25.0, 41.0, 56.0, 79.0, 78.0, 103.0, 105.0, 104.0, 93.0, 69.0, 76.0, 47.0, 43.0, 34.0, 14.0, 7.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.328125, -7.1243896484375, -6.920654296875, -6.7169189453125, -6.51318359375, -6.3094482421875, -6.105712890625, -5.9019775390625, -5.6982421875, -5.4945068359375, -5.290771484375, -5.0870361328125, -4.88330078125, -4.6795654296875, -4.475830078125, -4.2720947265625, -4.068359375, -3.8646240234375, -3.660888671875, -3.4571533203125, -3.25341796875, -3.0496826171875, -2.845947265625, -2.6422119140625, -2.4384765625, -2.2347412109375, -2.031005859375, -1.8272705078125, -1.62353515625, -1.4197998046875, -1.216064453125, -1.0123291015625, -0.80859375, -0.6048583984375, -0.401123046875, -0.1973876953125, 0.00634765625, 0.2100830078125, 0.413818359375, 0.6175537109375, 0.8212890625, 1.0250244140625, 1.228759765625, 1.4324951171875, 1.63623046875, 1.8399658203125, 2.043701171875, 2.2474365234375, 2.451171875, 2.6549072265625, 2.858642578125, 3.0623779296875, 3.26611328125, 3.4698486328125, 3.673583984375, 3.8773193359375, 4.0810546875, 4.2847900390625, 4.488525390625, 4.6922607421875, 4.89599609375, 5.0997314453125, 5.303466796875, 5.5072021484375, 5.7109375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 13.0, 11.0, 29.0, 35.0, 77.0, 164.0, 297.0, 607.0, 1663.0, 7909.0, 82297.0, 4016711.0, 74208.0, 7473.0, 1629.0, 578.0, 290.0, 145.0, 60.0, 38.0, 23.0, 10.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.75, -64.1650390625, -62.580078125, -60.9951171875, -59.41015625, -57.8251953125, -56.240234375, -54.6552734375, -53.0703125, -51.4853515625, -49.900390625, -48.3154296875, -46.73046875, -45.1455078125, -43.560546875, -41.9755859375, -40.390625, -38.8056640625, -37.220703125, -35.6357421875, -34.05078125, -32.4658203125, -30.880859375, -29.2958984375, -27.7109375, -26.1259765625, -24.541015625, -22.9560546875, -21.37109375, -19.7861328125, -18.201171875, -16.6162109375, -15.03125, -13.4462890625, -11.861328125, -10.2763671875, -8.69140625, -7.1064453125, -5.521484375, -3.9365234375, -2.3515625, -0.7666015625, 0.818359375, 2.4033203125, 3.98828125, 5.5732421875, 7.158203125, 8.7431640625, 10.328125, 11.9130859375, 13.498046875, 15.0830078125, 16.66796875, 18.2529296875, 19.837890625, 21.4228515625, 23.0078125, 24.5927734375, 26.177734375, 27.7626953125, 29.34765625, 30.9326171875, 32.517578125, 34.1025390625, 35.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 3.0, 9.0, 13.0, 17.0, 30.0, 30.0, 58.0, 145.0, 479.0, 2597.0, 412.0, 124.0, 63.0, 32.0, 15.0, 19.0, 7.0, 11.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.109375, -15.7296142578125, -15.349853515625, -14.9700927734375, -14.59033203125, -14.2105712890625, -13.830810546875, -13.4510498046875, -13.0712890625, -12.6915283203125, -12.311767578125, -11.9320068359375, -11.55224609375, -11.1724853515625, -10.792724609375, -10.4129638671875, -10.033203125, -9.6534423828125, -9.273681640625, -8.8939208984375, -8.51416015625, -8.1343994140625, -7.754638671875, -7.3748779296875, -6.9951171875, -6.6153564453125, -6.235595703125, -5.8558349609375, -5.47607421875, -5.0963134765625, -4.716552734375, -4.3367919921875, -3.95703125, -3.5772705078125, -3.197509765625, -2.8177490234375, -2.43798828125, -2.0582275390625, -1.678466796875, -1.2987060546875, -0.9189453125, -0.5391845703125, -0.159423828125, 0.2203369140625, 0.60009765625, 0.9798583984375, 1.359619140625, 1.7393798828125, 2.119140625, 2.4989013671875, 2.878662109375, 3.2584228515625, 3.63818359375, 4.0179443359375, 4.397705078125, 4.7774658203125, 5.1572265625, 5.5369873046875, 5.916748046875, 6.2965087890625, 6.67626953125, 7.0560302734375, 7.435791015625, 7.8155517578125, 8.1953125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 8.0, 7.0, 7.0, 23.0, 19.0, 49.0, 75.0, 125.0, 174.0, 170.0, 135.0, 90.0, 56.0, 30.0, 16.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.50460052490234, -65.521728515625, -63.538856506347656, -61.55598449707031, -59.5731086730957, -57.59023666381836, -55.607364654541016, -53.62449264526367, -51.64162063598633, -49.658748626708984, -47.67587661743164, -45.69300079345703, -43.71012878417969, -41.727256774902344, -39.744384765625, -37.761512756347656, -35.77864074707031, -33.79576873779297, -31.812894821166992, -29.83002281188965, -27.847150802612305, -25.864276885986328, -23.881404876708984, -21.89853286743164, -19.91565704345703, -17.932785034179688, -15.949912071228027, -13.967039108276367, -11.984167098999023, -10.001294136047363, -8.018421173095703, -6.035549163818359, -4.052677154541016, -2.0698046684265137, -0.08693194389343262, 1.8959407806396484, 3.8788132667541504, 5.861685752868652, 7.8445587158203125, 9.827430725097656, 11.810303688049316, 13.793176651000977, 15.77604866027832, 17.758922576904297, 19.74179458618164, 21.724666595458984, 23.707538604736328, 25.690410614013672, 27.67328453063965, 29.656156539916992, 31.63903045654297, 33.62190246582031, 35.604774475097656, 37.587646484375, 39.570518493652344, 41.55339050292969, 43.5362663269043, 45.51913833618164, 47.502010345458984, 49.484886169433594, 51.46775817871094, 53.45063018798828, 55.433502197265625, 57.41637420654297, 59.39924621582031]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 4.0, 8.0, 12.0, 13.0, 14.0, 25.0, 23.0, 28.0, 28.0, 38.0, 51.0, 36.0, 42.0, 43.0, 50.0, 55.0, 55.0, 55.0, 52.0, 49.0, 38.0, 37.0, 28.0, 36.0, 24.0, 30.0, 21.0, 18.0, 21.0, 14.0, 6.0, 9.0, 10.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.11056137084961, -31.223161697387695, -30.33576202392578, -29.448360443115234, -28.56096076965332, -27.673561096191406, -26.786161422729492, -25.898761749267578, -25.011362075805664, -24.12396240234375, -23.236562728881836, -22.349163055419922, -21.461761474609375, -20.57436180114746, -19.686962127685547, -18.799562454223633, -17.91216278076172, -17.024763107299805, -16.13736343383789, -15.24996280670166, -14.362563133239746, -13.475162506103516, -12.587762832641602, -11.700363159179688, -10.81296157836914, -9.925561904907227, -9.038161277770996, -8.150761604309082, -7.263361930847168, -6.375961780548096, -5.488561630249023, -4.601161956787109, -3.7137622833251953, -2.826362371444702, -1.9389623403549194, -1.0515623092651367, -0.16416239738464355, 0.7232375144958496, 1.6106376647949219, 2.498037338256836, 3.385437488555908, 4.2728376388549805, 5.1602373123168945, 6.047637462615967, 6.935037612915039, 7.822437286376953, 8.709836959838867, 9.597236633300781, 10.484637260437012, 11.372036933898926, 12.259437561035156, 13.14683723449707, 14.034236907958984, 14.921636581420898, 15.809037208557129, 16.69643783569336, 17.583837509155273, 18.471237182617188, 19.3586368560791, 20.246036529541016, 21.133438110351562, 22.020837783813477, 22.90823745727539, 23.795637130737305, 24.68303680419922]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 9.0, 12.0, 12.0, 17.0, 25.0, 37.0, 44.0, 93.0, 157.0, 231.0, 476.0, 805.0, 1836.0, 4356.0, 12676.0, 41471.0, 155843.0, 485498.0, 250641.0, 64398.0, 18677.0, 6359.0, 2489.0, 1076.0, 554.0, 295.0, 170.0, 91.0, 58.0, 53.0, 31.0, 15.0, 10.0, 12.0, 6.0, 3.0, 1.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.4375, -19.792236328125, -19.14697265625, -18.501708984375, -17.8564453125, -17.211181640625, -16.56591796875, -15.920654296875, -15.275390625, -14.630126953125, -13.98486328125, -13.339599609375, -12.6943359375, -12.049072265625, -11.40380859375, -10.758544921875, -10.11328125, -9.468017578125, -8.82275390625, -8.177490234375, -7.5322265625, -6.886962890625, -6.24169921875, -5.596435546875, -4.951171875, -4.305908203125, -3.66064453125, -3.015380859375, -2.3701171875, -1.724853515625, -1.07958984375, -0.434326171875, 0.2109375, 0.856201171875, 1.50146484375, 2.146728515625, 2.7919921875, 3.437255859375, 4.08251953125, 4.727783203125, 5.373046875, 6.018310546875, 6.66357421875, 7.308837890625, 7.9541015625, 8.599365234375, 9.24462890625, 9.889892578125, 10.53515625, 11.180419921875, 11.82568359375, 12.470947265625, 13.1162109375, 13.761474609375, 14.40673828125, 15.052001953125, 15.697265625, 16.342529296875, 16.98779296875, 17.633056640625, 18.2783203125, 18.923583984375, 19.56884765625, 20.214111328125, 20.859375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 5.0, 13.0, 8.0, 24.0, 18.0, 28.0, 27.0, 41.0, 39.0, 47.0, 66.0, 70.0, 80.0, 74.0, 83.0, 53.0, 62.0, 54.0, 47.0, 39.0, 33.0, 23.0, 20.0, 11.0, 13.0, 12.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.90234375, -4.7408447265625, -4.579345703125, -4.4178466796875, -4.25634765625, -4.0948486328125, -3.933349609375, -3.7718505859375, -3.6103515625, -3.4488525390625, -3.287353515625, -3.1258544921875, -2.96435546875, -2.8028564453125, -2.641357421875, -2.4798583984375, -2.318359375, -2.1568603515625, -1.995361328125, -1.8338623046875, -1.67236328125, -1.5108642578125, -1.349365234375, -1.1878662109375, -1.0263671875, -0.8648681640625, -0.703369140625, -0.5418701171875, -0.38037109375, -0.2188720703125, -0.057373046875, 0.1041259765625, 0.265625, 0.4271240234375, 0.588623046875, 0.7501220703125, 0.91162109375, 1.0731201171875, 1.234619140625, 1.3961181640625, 1.5576171875, 1.7191162109375, 1.880615234375, 2.0421142578125, 2.20361328125, 2.3651123046875, 2.526611328125, 2.6881103515625, 2.849609375, 3.0111083984375, 3.172607421875, 3.3341064453125, 3.49560546875, 3.6571044921875, 3.818603515625, 3.9801025390625, 4.1416015625, 4.3031005859375, 4.464599609375, 4.6260986328125, 4.78759765625, 4.9490966796875, 5.110595703125, 5.2720947265625, 5.43359375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 13.0, 15.0, 24.0, 28.0, 46.0, 77.0, 103.0, 162.0, 287.0, 547.0, 1284.0, 4486.0, 26410.0, 281310.0, 655671.0, 65503.0, 8841.0, 2091.0, 719.0, 367.0, 173.0, 134.0, 79.0, 56.0, 46.0, 30.0, 15.0, 7.0, 6.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.34375, -30.33935546875, -29.3349609375, -28.33056640625, -27.326171875, -26.32177734375, -25.3173828125, -24.31298828125, -23.30859375, -22.30419921875, -21.2998046875, -20.29541015625, -19.291015625, -18.28662109375, -17.2822265625, -16.27783203125, -15.2734375, -14.26904296875, -13.2646484375, -12.26025390625, -11.255859375, -10.25146484375, -9.2470703125, -8.24267578125, -7.23828125, -6.23388671875, -5.2294921875, -4.22509765625, -3.220703125, -2.21630859375, -1.2119140625, -0.20751953125, 0.796875, 1.80126953125, 2.8056640625, 3.81005859375, 4.814453125, 5.81884765625, 6.8232421875, 7.82763671875, 8.83203125, 9.83642578125, 10.8408203125, 11.84521484375, 12.849609375, 13.85400390625, 14.8583984375, 15.86279296875, 16.8671875, 17.87158203125, 18.8759765625, 19.88037109375, 20.884765625, 21.88916015625, 22.8935546875, 23.89794921875, 24.90234375, 25.90673828125, 26.9111328125, 27.91552734375, 28.919921875, 29.92431640625, 30.9287109375, 31.93310546875, 32.9375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 3.0, 6.0, 6.0, 11.0, 6.0, 9.0, 16.0, 21.0, 17.0, 28.0, 33.0, 35.0, 29.0, 45.0, 53.0, 56.0, 38.0, 59.0, 57.0, 53.0, 49.0, 47.0, 42.0, 49.0, 45.0, 35.0, 17.0, 24.0, 17.0, 21.0, 10.0, 14.0, 10.0, 10.0, 5.0, 5.0, 6.0, 3.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.842529296875, -18.18505859375, -17.527587890625, -16.8701171875, -16.212646484375, -15.55517578125, -14.897705078125, -14.240234375, -13.582763671875, -12.92529296875, -12.267822265625, -11.6103515625, -10.952880859375, -10.29541015625, -9.637939453125, -8.98046875, -8.322998046875, -7.66552734375, -7.008056640625, -6.3505859375, -5.693115234375, -5.03564453125, -4.378173828125, -3.720703125, -3.063232421875, -2.40576171875, -1.748291015625, -1.0908203125, -0.433349609375, 0.22412109375, 0.881591796875, 1.5390625, 2.196533203125, 2.85400390625, 3.511474609375, 4.1689453125, 4.826416015625, 5.48388671875, 6.141357421875, 6.798828125, 7.456298828125, 8.11376953125, 8.771240234375, 9.4287109375, 10.086181640625, 10.74365234375, 11.401123046875, 12.05859375, 12.716064453125, 13.37353515625, 14.031005859375, 14.6884765625, 15.345947265625, 16.00341796875, 16.660888671875, 17.318359375, 17.975830078125, 18.63330078125, 19.290771484375, 19.9482421875, 20.605712890625, 21.26318359375, 21.920654296875, 22.578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 6.0, 10.0, 11.0, 19.0, 18.0, 27.0, 46.0, 59.0, 103.0, 150.0, 237.0, 377.0, 675.0, 1146.0, 2430.0, 5623.0, 16325.0, 78042.0, 746649.0, 157618.0, 24650.0, 7635.0, 3172.0, 1478.0, 835.0, 424.0, 256.0, 186.0, 117.0, 74.0, 49.0, 24.0, 32.0, 14.0, 9.0, 6.0, 6.0, 8.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.390625, -18.796875, -18.203125, -17.609375, -17.015625, -16.421875, -15.828125, -15.234375, -14.640625, -14.046875, -13.453125, -12.859375, -12.265625, -11.671875, -11.078125, -10.484375, -9.890625, -9.296875, -8.703125, -8.109375, -7.515625, -6.921875, -6.328125, -5.734375, -5.140625, -4.546875, -3.953125, -3.359375, -2.765625, -2.171875, -1.578125, -0.984375, -0.390625, 0.203125, 0.796875, 1.390625, 1.984375, 2.578125, 3.171875, 3.765625, 4.359375, 4.953125, 5.546875, 6.140625, 6.734375, 7.328125, 7.921875, 8.515625, 9.109375, 9.703125, 10.296875, 10.890625, 11.484375, 12.078125, 12.671875, 13.265625, 13.859375, 14.453125, 15.046875, 15.640625, 16.234375, 16.828125, 17.421875, 18.015625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 8.0, 10.0, 21.0, 19.0, 39.0, 68.0, 121.0, 347.0, 174.0, 83.0, 37.0, 20.0, 17.0, 4.0, 5.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0052947998046875, -0.005122542381286621, -0.004950284957885742, -0.004778027534484863, -0.004605770111083984, -0.0044335126876831055, -0.0042612552642822266, -0.004088997840881348, -0.003916740417480469, -0.00374448299407959, -0.003572225570678711, -0.003399968147277832, -0.003227710723876953, -0.0030554533004760742, -0.0028831958770751953, -0.0027109384536743164, -0.0025386810302734375, -0.0023664236068725586, -0.0021941661834716797, -0.0020219087600708008, -0.0018496513366699219, -0.001677393913269043, -0.001505136489868164, -0.0013328790664672852, -0.0011606216430664062, -0.0009883642196655273, -0.0008161067962646484, -0.0006438493728637695, -0.0004715919494628906, -0.0002993345260620117, -0.0001270771026611328, 4.5180320739746094e-05, 0.000217437744140625, 0.0003896951675415039, 0.0005619525909423828, 0.0007342100143432617, 0.0009064674377441406, 0.0010787248611450195, 0.0012509822845458984, 0.0014232397079467773, 0.0015954971313476562, 0.0017677545547485352, 0.001940011978149414, 0.002112269401550293, 0.002284526824951172, 0.0024567842483520508, 0.0026290416717529297, 0.0028012990951538086, 0.0029735565185546875, 0.0031458139419555664, 0.0033180713653564453, 0.0034903287887573242, 0.003662586212158203, 0.003834843635559082, 0.004007101058959961, 0.00417935848236084, 0.004351615905761719, 0.004523873329162598, 0.0046961307525634766, 0.0048683881759643555, 0.005040645599365234, 0.005212903022766113, 0.005385160446166992, 0.005557417869567871, 0.00572967529296875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 12.0, 11.0, 17.0, 25.0, 38.0, 60.0, 124.0, 215.0, 409.0, 877.0, 2291.0, 8689.0, 67458.0, 896661.0, 59562.0, 8058.0, 2276.0, 838.0, 407.0, 213.0, 130.0, 64.0, 49.0, 24.0, 9.0, 9.0, 9.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.125, -36.951171875, -35.77734375, -34.603515625, -33.4296875, -32.255859375, -31.08203125, -29.908203125, -28.734375, -27.560546875, -26.38671875, -25.212890625, -24.0390625, -22.865234375, -21.69140625, -20.517578125, -19.34375, -18.169921875, -16.99609375, -15.822265625, -14.6484375, -13.474609375, -12.30078125, -11.126953125, -9.953125, -8.779296875, -7.60546875, -6.431640625, -5.2578125, -4.083984375, -2.91015625, -1.736328125, -0.5625, 0.611328125, 1.78515625, 2.958984375, 4.1328125, 5.306640625, 6.48046875, 7.654296875, 8.828125, 10.001953125, 11.17578125, 12.349609375, 13.5234375, 14.697265625, 15.87109375, 17.044921875, 18.21875, 19.392578125, 20.56640625, 21.740234375, 22.9140625, 24.087890625, 25.26171875, 26.435546875, 27.609375, 28.783203125, 29.95703125, 31.130859375, 32.3046875, 33.478515625, 34.65234375, 35.826171875, 37.0]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 5.0, 2.0, 1.0, 3.0, 9.0, 11.0, 12.0, 17.0, 9.0, 21.0, 20.0, 46.0, 80.0, 164.0, 233.0, 140.0, 78.0, 45.0, 29.0, 26.0, 9.0, 8.0, 9.0, 9.0, 4.0, 3.0, 3.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.859375, -22.19287109375, -21.5263671875, -20.85986328125, -20.193359375, -19.52685546875, -18.8603515625, -18.19384765625, -17.52734375, -16.86083984375, -16.1943359375, -15.52783203125, -14.861328125, -14.19482421875, -13.5283203125, -12.86181640625, -12.1953125, -11.52880859375, -10.8623046875, -10.19580078125, -9.529296875, -8.86279296875, -8.1962890625, -7.52978515625, -6.86328125, -6.19677734375, -5.5302734375, -4.86376953125, -4.197265625, -3.53076171875, -2.8642578125, -2.19775390625, -1.53125, -0.86474609375, -0.1982421875, 0.46826171875, 1.134765625, 1.80126953125, 2.4677734375, 3.13427734375, 3.80078125, 4.46728515625, 5.1337890625, 5.80029296875, 6.466796875, 7.13330078125, 7.7998046875, 8.46630859375, 9.1328125, 9.79931640625, 10.4658203125, 11.13232421875, 11.798828125, 12.46533203125, 13.1318359375, 13.79833984375, 14.46484375, 15.13134765625, 15.7978515625, 16.46435546875, 17.130859375, 17.79736328125, 18.4638671875, 19.13037109375, 19.796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 8.0, 20.0, 34.0, 51.0, 103.0, 133.0, 165.0, 165.0, 143.0, 99.0, 45.0, 14.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.7103729248047, -228.84329223632812, -220.9761962890625, -213.10911560058594, -205.24203491210938, -197.37493896484375, -189.5078582763672, -181.64077758789062, -173.773681640625, -165.90660095214844, -158.0395050048828, -150.17242431640625, -142.30532836914062, -134.43824768066406, -126.5711669921875, -118.7040786743164, -110.83699035644531, -102.96990203857422, -95.10281372070312, -87.23573303222656, -79.36864471435547, -71.50155639648438, -63.63447189331055, -55.76738739013672, -47.900299072265625, -40.03321075439453, -32.1661262512207, -24.299039840698242, -16.43195343017578, -8.564865112304688, -0.6977806091308594, 7.169303894042969, 15.036376953125, 22.90346336364746, 30.770549774169922, 38.63763427734375, 46.504722595214844, 54.37181091308594, 62.238895416259766, 70.1059799194336, 77.97306823730469, 85.84015655517578, 93.70724487304688, 101.57432556152344, 109.44141387939453, 117.30850219726562, 125.17558288574219, 133.04266357421875, 140.90975952148438, 148.77684020996094, 156.64393615722656, 164.51101684570312, 172.37811279296875, 180.2451934814453, 188.11227416992188, 195.9793701171875, 203.84645080566406, 211.71353149414062, 219.58062744140625, 227.4477081298828, 235.31478881835938, 243.181884765625, 251.04896545410156, 258.9160461425781, 266.78314208984375]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 2.0, 2.0, 10.0, 7.0, 8.0, 21.0, 11.0, 22.0, 30.0, 22.0, 41.0, 46.0, 43.0, 47.0, 59.0, 49.0, 60.0, 59.0, 62.0, 47.0, 50.0, 41.0, 44.0, 29.0, 35.0, 18.0, 27.0, 17.0, 21.0, 13.0, 18.0, 9.0, 12.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.8802490234375, -138.69435119628906, -134.50845336914062, -130.3225555419922, -126.13665771484375, -121.95075988769531, -117.7648696899414, -113.57897186279297, -109.39307403564453, -105.2071762084961, -101.02127838134766, -96.83538055419922, -92.64949035644531, -88.46359252929688, -84.27769470214844, -80.091796875, -75.90589904785156, -71.72000122070312, -67.53410339355469, -63.348209381103516, -59.16231155395508, -54.97641372680664, -50.79051971435547, -46.60462188720703, -42.418724060058594, -38.232826232910156, -34.04692840576172, -29.861034393310547, -25.67513656616211, -21.489238739013672, -17.303342819213867, -13.117446899414062, -8.931533813476562, -4.745636940002441, -0.5597400665283203, 3.626156806945801, 7.812053680419922, 11.99795150756836, 16.183847427368164, 20.36974334716797, 24.555641174316406, 28.741539001464844, 32.92743682861328, 37.11333084106445, 41.29922866821289, 45.48512649536133, 49.6710205078125, 53.85691833496094, 58.042816162109375, 62.22871398925781, 66.41461181640625, 70.60050964355469, 74.78640747070312, 78.97230529785156, 83.15819549560547, 87.3440933227539, 91.52999114990234, 95.71588897705078, 99.90178680419922, 104.08768463134766, 108.27357482910156, 112.45947265625, 116.64537048339844, 120.83126831054688, 125.01716613769531]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 0.0, 6.0, 8.0, 5.0, 9.0, 8.0, 15.0, 15.0, 36.0, 54.0, 99.0, 120.0, 247.0, 437.0, 809.0, 1666.0, 3920.0, 11271.0, 46863.0, 1233827.0, 2818863.0, 55056.0, 12698.0, 4404.0, 1848.0, 871.0, 485.0, 242.0, 162.0, 84.0, 58.0, 30.0, 29.0, 15.0, 7.0, 7.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.609375, -30.707275390625, -29.80517578125, -28.903076171875, -28.0009765625, -27.098876953125, -26.19677734375, -25.294677734375, -24.392578125, -23.490478515625, -22.58837890625, -21.686279296875, -20.7841796875, -19.882080078125, -18.97998046875, -18.077880859375, -17.17578125, -16.273681640625, -15.37158203125, -14.469482421875, -13.5673828125, -12.665283203125, -11.76318359375, -10.861083984375, -9.958984375, -9.056884765625, -8.15478515625, -7.252685546875, -6.3505859375, -5.448486328125, -4.54638671875, -3.644287109375, -2.7421875, -1.840087890625, -0.93798828125, -0.035888671875, 0.8662109375, 1.768310546875, 2.67041015625, 3.572509765625, 4.474609375, 5.376708984375, 6.27880859375, 7.180908203125, 8.0830078125, 8.985107421875, 9.88720703125, 10.789306640625, 11.69140625, 12.593505859375, 13.49560546875, 14.397705078125, 15.2998046875, 16.201904296875, 17.10400390625, 18.006103515625, 18.908203125, 19.810302734375, 20.71240234375, 21.614501953125, 22.5166015625, 23.418701171875, 24.32080078125, 25.222900390625, 26.125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 4.0, 3.0, 5.0, 8.0, 11.0, 14.0, 15.0, 15.0, 26.0, 21.0, 27.0, 34.0, 29.0, 41.0, 50.0, 66.0, 51.0, 64.0, 51.0, 45.0, 48.0, 58.0, 45.0, 42.0, 43.0, 33.0, 28.0, 32.0, 17.0, 20.0, 17.0, 11.0, 11.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.05078125, -3.90283203125, -3.7548828125, -3.60693359375, -3.458984375, -3.31103515625, -3.1630859375, -3.01513671875, -2.8671875, -2.71923828125, -2.5712890625, -2.42333984375, -2.275390625, -2.12744140625, -1.9794921875, -1.83154296875, -1.68359375, -1.53564453125, -1.3876953125, -1.23974609375, -1.091796875, -0.94384765625, -0.7958984375, -0.64794921875, -0.5, -0.35205078125, -0.2041015625, -0.05615234375, 0.091796875, 0.23974609375, 0.3876953125, 0.53564453125, 0.68359375, 0.83154296875, 0.9794921875, 1.12744140625, 1.275390625, 1.42333984375, 1.5712890625, 1.71923828125, 1.8671875, 2.01513671875, 2.1630859375, 2.31103515625, 2.458984375, 2.60693359375, 2.7548828125, 2.90283203125, 3.05078125, 3.19873046875, 3.3466796875, 3.49462890625, 3.642578125, 3.79052734375, 3.9384765625, 4.08642578125, 4.234375, 4.38232421875, 4.5302734375, 4.67822265625, 4.826171875, 4.97412109375, 5.1220703125, 5.27001953125, 5.41796875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 22.0, 24.0, 50.0, 80.0, 142.0, 303.0, 625.0, 1560.0, 4400.0, 16885.0, 132740.0, 3859938.0, 152037.0, 17973.0, 4636.0, 1615.0, 665.0, 273.0, 132.0, 77.0, 38.0, 22.0, 11.0, 8.0, 10.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.6875, -44.4365234375, -43.185546875, -41.9345703125, -40.68359375, -39.4326171875, -38.181640625, -36.9306640625, -35.6796875, -34.4287109375, -33.177734375, -31.9267578125, -30.67578125, -29.4248046875, -28.173828125, -26.9228515625, -25.671875, -24.4208984375, -23.169921875, -21.9189453125, -20.66796875, -19.4169921875, -18.166015625, -16.9150390625, -15.6640625, -14.4130859375, -13.162109375, -11.9111328125, -10.66015625, -9.4091796875, -8.158203125, -6.9072265625, -5.65625, -4.4052734375, -3.154296875, -1.9033203125, -0.65234375, 0.5986328125, 1.849609375, 3.1005859375, 4.3515625, 5.6025390625, 6.853515625, 8.1044921875, 9.35546875, 10.6064453125, 11.857421875, 13.1083984375, 14.359375, 15.6103515625, 16.861328125, 18.1123046875, 19.36328125, 20.6142578125, 21.865234375, 23.1162109375, 24.3671875, 25.6181640625, 26.869140625, 28.1201171875, 29.37109375, 30.6220703125, 31.873046875, 33.1240234375, 34.375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 2.0, 6.0, 10.0, 15.0, 18.0, 24.0, 37.0, 75.0, 136.0, 327.0, 1267.0, 1464.0, 323.0, 144.0, 77.0, 43.0, 27.0, 19.0, 10.0, 12.0, 7.0, 4.0, 2.0, 8.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-15.8984375, -15.4693603515625, -15.040283203125, -14.6112060546875, -14.18212890625, -13.7530517578125, -13.323974609375, -12.8948974609375, -12.4658203125, -12.0367431640625, -11.607666015625, -11.1785888671875, -10.74951171875, -10.3204345703125, -9.891357421875, -9.4622802734375, -9.033203125, -8.6041259765625, -8.175048828125, -7.7459716796875, -7.31689453125, -6.8878173828125, -6.458740234375, -6.0296630859375, -5.6005859375, -5.1715087890625, -4.742431640625, -4.3133544921875, -3.88427734375, -3.4552001953125, -3.026123046875, -2.5970458984375, -2.16796875, -1.7388916015625, -1.309814453125, -0.8807373046875, -0.45166015625, -0.0225830078125, 0.406494140625, 0.8355712890625, 1.2646484375, 1.6937255859375, 2.122802734375, 2.5518798828125, 2.98095703125, 3.4100341796875, 3.839111328125, 4.2681884765625, 4.697265625, 5.1263427734375, 5.555419921875, 5.9844970703125, 6.41357421875, 6.8426513671875, 7.271728515625, 7.7008056640625, 8.1298828125, 8.5589599609375, 8.988037109375, 9.4171142578125, 9.84619140625, 10.2752685546875, 10.704345703125, 11.1334228515625, 11.5625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 7.0, 19.0, 48.0, 145.0, 253.0, 236.0, 163.0, 76.0, 37.0, 12.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.12347412109375, -35.10445785522461, -30.085437774658203, -25.066421508789062, -20.04740333557129, -15.028385162353516, -10.009368896484375, -4.990348815917969, 0.028667449951171875, 5.047685146331787, 10.066702842712402, 15.08572006225586, 20.104738235473633, 25.123756408691406, 30.142772674560547, 35.16179275512695, 40.180809020996094, 45.199825286865234, 50.21884536743164, 55.23786163330078, 60.25688171386719, 65.27589416503906, 70.29491424560547, 75.31393432617188, 80.33294677734375, 85.35196685791016, 90.37097930908203, 95.38999938964844, 100.40901947021484, 105.42803955078125, 110.44705200195312, 115.46607208251953, 120.48509216308594, 125.50411224365234, 130.52313232421875, 135.54214477539062, 140.5611572265625, 145.58018493652344, 150.5991973876953, 155.61822509765625, 160.63723754882812, 165.65625, 170.67527770996094, 175.6942901611328, 180.7133026123047, 185.73233032226562, 190.7513427734375, 195.77035522460938, 200.78936767578125, 205.80838012695312, 210.82740783691406, 215.84642028808594, 220.8654327392578, 225.88446044921875, 230.90347290039062, 235.9224853515625, 240.94151306152344, 245.9605255126953, 250.97955322265625, 255.99856567382812, 261.017578125, 266.0365905761719, 271.05560302734375, 276.07464599609375, 281.0936584472656]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 5.0, 14.0, 13.0, 17.0, 13.0, 17.0, 25.0, 29.0, 25.0, 36.0, 38.0, 38.0, 39.0, 49.0, 57.0, 70.0, 54.0, 52.0, 37.0, 46.0, 37.0, 39.0, 37.0, 40.0, 36.0, 32.0, 20.0, 12.0, 15.0, 6.0, 15.0, 9.0, 5.0, 6.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.758644104003906, -43.33696746826172, -41.91529083251953, -40.493614196777344, -39.07193374633789, -37.6502571105957, -36.228580474853516, -34.80690383911133, -33.38522720336914, -31.963550567626953, -30.541872024536133, -29.120195388793945, -27.698518753051758, -26.276840209960938, -24.85516357421875, -23.433486938476562, -22.011808395385742, -20.590131759643555, -19.168453216552734, -17.746776580810547, -16.32509994506836, -14.903422355651855, -13.481744766235352, -12.060068130493164, -10.63839054107666, -9.216712951660156, -7.795036315917969, -6.373358726501465, -4.951681613922119, -3.5300045013427734, -2.1083269119262695, -0.686650276184082, 0.7350273132324219, 2.1567044258117676, 3.5783817768096924, 5.000059127807617, 6.421736240386963, 7.843413352966309, 9.265090942382812, 10.686767578125, 12.108445167541504, 13.530122756958008, 14.951799392700195, 16.373477935791016, 17.795154571533203, 19.21683120727539, 20.638507843017578, 22.060184478759766, 23.481863021850586, 24.903539657592773, 26.325218200683594, 27.74689483642578, 29.16857147216797, 30.590248107910156, 32.011924743652344, 33.43360137939453, 34.855281829833984, 36.27695846557617, 37.69863510131836, 39.12031555175781, 40.5419921875, 41.96366882324219, 43.385345458984375, 44.80702209472656, 46.22869873046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 11.0, 14.0, 15.0, 43.0, 64.0, 111.0, 166.0, 312.0, 492.0, 859.0, 1579.0, 2927.0, 5874.0, 11935.0, 25822.0, 57106.0, 124942.0, 233918.0, 268005.0, 166730.0, 79505.0, 35538.0, 16343.0, 7741.0, 3825.0, 2025.0, 1138.0, 594.0, 378.0, 197.0, 119.0, 80.0, 50.0, 33.0, 21.0, 11.0, 14.0, 6.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5625, -10.2008056640625, -9.839111328125, -9.4774169921875, -9.11572265625, -8.7540283203125, -8.392333984375, -8.0306396484375, -7.6689453125, -7.3072509765625, -6.945556640625, -6.5838623046875, -6.22216796875, -5.8604736328125, -5.498779296875, -5.1370849609375, -4.775390625, -4.4136962890625, -4.052001953125, -3.6903076171875, -3.32861328125, -2.9669189453125, -2.605224609375, -2.2435302734375, -1.8818359375, -1.5201416015625, -1.158447265625, -0.7967529296875, -0.43505859375, -0.0733642578125, 0.288330078125, 0.6500244140625, 1.01171875, 1.3734130859375, 1.735107421875, 2.0968017578125, 2.45849609375, 2.8201904296875, 3.181884765625, 3.5435791015625, 3.9052734375, 4.2669677734375, 4.628662109375, 4.9903564453125, 5.35205078125, 5.7137451171875, 6.075439453125, 6.4371337890625, 6.798828125, 7.1605224609375, 7.522216796875, 7.8839111328125, 8.24560546875, 8.6072998046875, 8.968994140625, 9.3306884765625, 9.6923828125, 10.0540771484375, 10.415771484375, 10.7774658203125, 11.13916015625, 11.5008544921875, 11.862548828125, 12.2242431640625, 12.5859375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 5.0, 4.0, 8.0, 7.0, 11.0, 13.0, 14.0, 22.0, 20.0, 26.0, 29.0, 27.0, 34.0, 32.0, 40.0, 49.0, 39.0, 62.0, 61.0, 45.0, 55.0, 49.0, 47.0, 36.0, 46.0, 38.0, 36.0, 20.0, 21.0, 24.0, 17.0, 13.0, 11.0, 8.0, 8.0, 10.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8515625, -4.70721435546875, -4.5628662109375, -4.41851806640625, -4.274169921875, -4.12982177734375, -3.9854736328125, -3.84112548828125, -3.69677734375, -3.55242919921875, -3.4080810546875, -3.26373291015625, -3.119384765625, -2.97503662109375, -2.8306884765625, -2.68634033203125, -2.5419921875, -2.39764404296875, -2.2532958984375, -2.10894775390625, -1.964599609375, -1.82025146484375, -1.6759033203125, -1.53155517578125, -1.38720703125, -1.24285888671875, -1.0985107421875, -0.95416259765625, -0.809814453125, -0.66546630859375, -0.5211181640625, -0.37677001953125, -0.232421875, -0.08807373046875, 0.0562744140625, 0.20062255859375, 0.344970703125, 0.48931884765625, 0.6336669921875, 0.77801513671875, 0.92236328125, 1.06671142578125, 1.2110595703125, 1.35540771484375, 1.499755859375, 1.64410400390625, 1.7884521484375, 1.93280029296875, 2.0771484375, 2.22149658203125, 2.3658447265625, 2.51019287109375, 2.654541015625, 2.79888916015625, 2.9432373046875, 3.08758544921875, 3.23193359375, 3.37628173828125, 3.5206298828125, 3.66497802734375, 3.809326171875, 3.95367431640625, 4.0980224609375, 4.24237060546875, 4.38671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 6.0, 8.0, 7.0, 5.0, 13.0, 24.0, 24.0, 32.0, 71.0, 103.0, 155.0, 277.0, 456.0, 1044.0, 3263.0, 18416.0, 187609.0, 696671.0, 122744.0, 13157.0, 2587.0, 860.0, 384.0, 216.0, 148.0, 90.0, 67.0, 41.0, 30.0, 14.0, 15.0, 10.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.140625, -29.079833984375, -28.01904296875, -26.958251953125, -25.8974609375, -24.836669921875, -23.77587890625, -22.715087890625, -21.654296875, -20.593505859375, -19.53271484375, -18.471923828125, -17.4111328125, -16.350341796875, -15.28955078125, -14.228759765625, -13.16796875, -12.107177734375, -11.04638671875, -9.985595703125, -8.9248046875, -7.864013671875, -6.80322265625, -5.742431640625, -4.681640625, -3.620849609375, -2.56005859375, -1.499267578125, -0.4384765625, 0.622314453125, 1.68310546875, 2.743896484375, 3.8046875, 4.865478515625, 5.92626953125, 6.987060546875, 8.0478515625, 9.108642578125, 10.16943359375, 11.230224609375, 12.291015625, 13.351806640625, 14.41259765625, 15.473388671875, 16.5341796875, 17.594970703125, 18.65576171875, 19.716552734375, 20.77734375, 21.838134765625, 22.89892578125, 23.959716796875, 25.0205078125, 26.081298828125, 27.14208984375, 28.202880859375, 29.263671875, 30.324462890625, 31.38525390625, 32.446044921875, 33.5068359375, 34.567626953125, 35.62841796875, 36.689208984375, 37.75]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 8.0, 5.0, 8.0, 11.0, 13.0, 15.0, 23.0, 17.0, 26.0, 30.0, 29.0, 36.0, 45.0, 49.0, 45.0, 44.0, 47.0, 33.0, 58.0, 54.0, 41.0, 33.0, 44.0, 44.0, 35.0, 30.0, 31.0, 24.0, 22.0, 14.0, 18.0, 13.0, 11.0, 13.0, 8.0, 4.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.921875, -28.095703125, -27.26953125, -26.443359375, -25.6171875, -24.791015625, -23.96484375, -23.138671875, -22.3125, -21.486328125, -20.66015625, -19.833984375, -19.0078125, -18.181640625, -17.35546875, -16.529296875, -15.703125, -14.876953125, -14.05078125, -13.224609375, -12.3984375, -11.572265625, -10.74609375, -9.919921875, -9.09375, -8.267578125, -7.44140625, -6.615234375, -5.7890625, -4.962890625, -4.13671875, -3.310546875, -2.484375, -1.658203125, -0.83203125, -0.005859375, 0.8203125, 1.646484375, 2.47265625, 3.298828125, 4.125, 4.951171875, 5.77734375, 6.603515625, 7.4296875, 8.255859375, 9.08203125, 9.908203125, 10.734375, 11.560546875, 12.38671875, 13.212890625, 14.0390625, 14.865234375, 15.69140625, 16.517578125, 17.34375, 18.169921875, 18.99609375, 19.822265625, 20.6484375, 21.474609375, 22.30078125, 23.126953125, 23.953125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 9.0, 11.0, 24.0, 25.0, 47.0, 51.0, 79.0, 120.0, 171.0, 241.0, 462.0, 938.0, 1821.0, 3967.0, 10048.0, 32669.0, 151021.0, 530675.0, 242995.0, 49681.0, 13654.0, 5016.0, 2189.0, 1061.0, 606.0, 323.0, 245.0, 130.0, 77.0, 63.0, 42.0, 29.0, 20.0, 13.0, 11.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.65625, -10.25634765625, -9.8564453125, -9.45654296875, -9.056640625, -8.65673828125, -8.2568359375, -7.85693359375, -7.45703125, -7.05712890625, -6.6572265625, -6.25732421875, -5.857421875, -5.45751953125, -5.0576171875, -4.65771484375, -4.2578125, -3.85791015625, -3.4580078125, -3.05810546875, -2.658203125, -2.25830078125, -1.8583984375, -1.45849609375, -1.05859375, -0.65869140625, -0.2587890625, 0.14111328125, 0.541015625, 0.94091796875, 1.3408203125, 1.74072265625, 2.140625, 2.54052734375, 2.9404296875, 3.34033203125, 3.740234375, 4.14013671875, 4.5400390625, 4.93994140625, 5.33984375, 5.73974609375, 6.1396484375, 6.53955078125, 6.939453125, 7.33935546875, 7.7392578125, 8.13916015625, 8.5390625, 8.93896484375, 9.3388671875, 9.73876953125, 10.138671875, 10.53857421875, 10.9384765625, 11.33837890625, 11.73828125, 12.13818359375, 12.5380859375, 12.93798828125, 13.337890625, 13.73779296875, 14.1376953125, 14.53759765625, 14.9375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 11.0, 8.0, 12.0, 11.0, 18.0, 31.0, 44.0, 42.0, 61.0, 77.0, 83.0, 96.0, 98.0, 75.0, 71.0, 64.0, 49.0, 43.0, 26.0, 21.0, 6.0, 14.0, 13.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002208709716796875, -0.002134382724761963, -0.0020600557327270508, -0.0019857287406921387, -0.0019114017486572266, -0.0018370747566223145, -0.0017627477645874023, -0.0016884207725524902, -0.0016140937805175781, -0.001539766788482666, -0.001465439796447754, -0.0013911128044128418, -0.0013167858123779297, -0.0012424588203430176, -0.0011681318283081055, -0.0010938048362731934, -0.0010194778442382812, -0.0009451508522033691, -0.000870823860168457, -0.0007964968681335449, -0.0007221698760986328, -0.0006478428840637207, -0.0005735158920288086, -0.0004991888999938965, -0.0004248619079589844, -0.00035053491592407227, -0.00027620792388916016, -0.00020188093185424805, -0.00012755393981933594, -5.322694778442383e-05, 2.110004425048828e-05, 9.542703628540039e-05, 0.0001697540283203125, 0.0002440810203552246, 0.0003184080123901367, 0.00039273500442504883, 0.00046706199645996094, 0.000541388988494873, 0.0006157159805297852, 0.0006900429725646973, 0.0007643699645996094, 0.0008386969566345215, 0.0009130239486694336, 0.0009873509407043457, 0.0010616779327392578, 0.00113600492477417, 0.001210331916809082, 0.0012846589088439941, 0.0013589859008789062, 0.0014333128929138184, 0.0015076398849487305, 0.0015819668769836426, 0.0016562938690185547, 0.0017306208610534668, 0.001804947853088379, 0.001879274845123291, 0.001953601837158203, 0.0020279288291931152, 0.0021022558212280273, 0.0021765828132629395, 0.0022509098052978516, 0.0023252367973327637, 0.0023995637893676758, 0.002473890781402588, 0.0025482177734375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 9.0, 15.0, 20.0, 36.0, 43.0, 95.0, 161.0, 368.0, 1153.0, 5222.0, 48510.0, 783902.0, 193852.0, 11885.0, 2156.0, 578.0, 242.0, 123.0, 74.0, 55.0, 21.0, 14.0, 9.0, 5.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.609375, -27.613037109375, -26.61669921875, -25.620361328125, -24.6240234375, -23.627685546875, -22.63134765625, -21.635009765625, -20.638671875, -19.642333984375, -18.64599609375, -17.649658203125, -16.6533203125, -15.656982421875, -14.66064453125, -13.664306640625, -12.66796875, -11.671630859375, -10.67529296875, -9.678955078125, -8.6826171875, -7.686279296875, -6.68994140625, -5.693603515625, -4.697265625, -3.700927734375, -2.70458984375, -1.708251953125, -0.7119140625, 0.284423828125, 1.28076171875, 2.277099609375, 3.2734375, 4.269775390625, 5.26611328125, 6.262451171875, 7.2587890625, 8.255126953125, 9.25146484375, 10.247802734375, 11.244140625, 12.240478515625, 13.23681640625, 14.233154296875, 15.2294921875, 16.225830078125, 17.22216796875, 18.218505859375, 19.21484375, 20.211181640625, 21.20751953125, 22.203857421875, 23.2001953125, 24.196533203125, 25.19287109375, 26.189208984375, 27.185546875, 28.181884765625, 29.17822265625, 30.174560546875, 31.1708984375, 32.167236328125, 33.16357421875, 34.159912109375, 35.15625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 6.0, 6.0, 6.0, 18.0, 19.0, 14.0, 30.0, 31.0, 43.0, 53.0, 41.0, 81.0, 84.0, 75.0, 105.0, 81.0, 60.0, 51.0, 36.0, 32.0, 27.0, 17.0, 18.0, 16.0, 6.0, 1.0, 7.0, 6.0, 3.0, 4.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.4453125, -12.068115234375, -11.69091796875, -11.313720703125, -10.9365234375, -10.559326171875, -10.18212890625, -9.804931640625, -9.427734375, -9.050537109375, -8.67333984375, -8.296142578125, -7.9189453125, -7.541748046875, -7.16455078125, -6.787353515625, -6.41015625, -6.032958984375, -5.65576171875, -5.278564453125, -4.9013671875, -4.524169921875, -4.14697265625, -3.769775390625, -3.392578125, -3.015380859375, -2.63818359375, -2.260986328125, -1.8837890625, -1.506591796875, -1.12939453125, -0.752197265625, -0.375, 0.002197265625, 0.37939453125, 0.756591796875, 1.1337890625, 1.510986328125, 1.88818359375, 2.265380859375, 2.642578125, 3.019775390625, 3.39697265625, 3.774169921875, 4.1513671875, 4.528564453125, 4.90576171875, 5.282958984375, 5.66015625, 6.037353515625, 6.41455078125, 6.791748046875, 7.1689453125, 7.546142578125, 7.92333984375, 8.300537109375, 8.677734375, 9.054931640625, 9.43212890625, 9.809326171875, 10.1865234375, 10.563720703125, 10.94091796875, 11.318115234375, 11.6953125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 20.0, 58.0, 140.0, 218.0, 228.0, 180.0, 75.0, 43.0, 15.0, 12.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-314.6690979003906, -304.8736572265625, -295.0782165527344, -285.28277587890625, -275.4873352050781, -265.69189453125, -255.89646911621094, -246.1010284423828, -236.3055877685547, -226.51014709472656, -216.71470642089844, -206.9192657470703, -197.12384033203125, -187.32839965820312, -177.532958984375, -167.73751831054688, -157.94207763671875, -148.14663696289062, -138.3511962890625, -128.55575561523438, -118.76032257080078, -108.96488189697266, -99.16944885253906, -89.37400817871094, -79.57856750488281, -69.78312683105469, -59.98768997192383, -50.19225311279297, -40.396812438964844, -30.60137176513672, -20.80593490600586, -11.010498046875, -1.215057373046875, 8.580381393432617, 18.37582015991211, 28.1712589263916, 37.966697692871094, 47.76213836669922, 57.55757522583008, 67.35301208496094, 77.14845275878906, 86.94389343261719, 96.73933410644531, 106.5347671508789, 116.33020782470703, 126.12564849853516, 135.92108154296875, 145.71652221679688, 155.511962890625, 165.30740356445312, 175.10284423828125, 184.89828491210938, 194.6937255859375, 204.48916625976562, 214.2845916748047, 224.0800323486328, 233.87547302246094, 243.67091369628906, 253.4663543701172, 263.26177978515625, 273.0572204589844, 282.8526611328125, 292.6481018066406, 302.44354248046875, 312.2389831542969]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 6.0, 9.0, 3.0, 10.0, 9.0, 13.0, 14.0, 15.0, 19.0, 13.0, 22.0, 29.0, 29.0, 28.0, 30.0, 26.0, 39.0, 37.0, 34.0, 41.0, 31.0, 47.0, 39.0, 34.0, 40.0, 29.0, 32.0, 32.0, 32.0, 42.0, 37.0, 16.0, 19.0, 23.0, 22.0, 16.0, 16.0, 7.0, 11.0, 8.0, 10.0, 6.0, 7.0, 2.0, 7.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-115.05525970458984, -111.67643737792969, -108.297607421875, -104.91878509521484, -101.53996276855469, -98.16114044189453, -94.78231811523438, -91.40348815917969, -88.02466583251953, -84.64584350585938, -81.26701354980469, -77.88819122314453, -74.50936889648438, -71.13054656982422, -67.75172424316406, -64.37289428710938, -60.99407196044922, -57.61524963378906, -54.23642349243164, -50.85759735107422, -47.47877502441406, -44.099952697753906, -40.721126556396484, -37.34230041503906, -33.963478088378906, -30.584653854370117, -27.205829620361328, -23.82700538635254, -20.44818115234375, -17.06935691833496, -13.690532684326172, -10.311708450317383, -6.932891845703125, -3.554067611694336, -0.17524337768554688, 3.203580856323242, 6.582405090332031, 9.96122932434082, 13.34005355834961, 16.7188777923584, 20.097702026367188, 23.476526260375977, 26.855350494384766, 30.234174728393555, 33.612998962402344, 36.9918212890625, 40.37064743041992, 43.749473571777344, 47.1282958984375, 50.507118225097656, 53.88594436645508, 57.2647705078125, 60.643592834472656, 64.02241516113281, 67.4012451171875, 70.78006744384766, 74.15888977050781, 77.53771209716797, 80.91653442382812, 84.29536437988281, 87.67418670654297, 91.05300903320312, 94.43183898925781, 97.81066131591797, 101.18948364257812]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 4.0, 2.0, 5.0, 10.0, 15.0, 24.0, 44.0, 61.0, 133.0, 274.0, 695.0, 2459.0, 31858.0, 4146004.0, 10202.0, 1525.0, 497.0, 215.0, 108.0, 52.0, 36.0, 26.0, 19.0, 8.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.625, -89.8466796875, -87.068359375, -84.2900390625, -81.51171875, -78.7333984375, -75.955078125, -73.1767578125, -70.3984375, -67.6201171875, -64.841796875, -62.0634765625, -59.28515625, -56.5068359375, -53.728515625, -50.9501953125, -48.171875, -45.3935546875, -42.615234375, -39.8369140625, -37.05859375, -34.2802734375, -31.501953125, -28.7236328125, -25.9453125, -23.1669921875, -20.388671875, -17.6103515625, -14.83203125, -12.0537109375, -9.275390625, -6.4970703125, -3.71875, -0.9404296875, 1.837890625, 4.6162109375, 7.39453125, 10.1728515625, 12.951171875, 15.7294921875, 18.5078125, 21.2861328125, 24.064453125, 26.8427734375, 29.62109375, 32.3994140625, 35.177734375, 37.9560546875, 40.734375, 43.5126953125, 46.291015625, 49.0693359375, 51.84765625, 54.6259765625, 57.404296875, 60.1826171875, 62.9609375, 65.7392578125, 68.517578125, 71.2958984375, 74.07421875, 76.8525390625, 79.630859375, 82.4091796875, 85.1875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 4.0, 5.0, 12.0, 10.0, 28.0, 23.0, 27.0, 20.0, 21.0, 27.0, 27.0, 52.0, 52.0, 42.0, 43.0, 55.0, 47.0, 59.0, 38.0, 37.0, 44.0, 38.0, 38.0, 32.0, 35.0, 31.0, 23.0, 32.0, 17.0, 16.0, 15.0, 7.0, 6.0, 5.0, 7.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.93212890625, -4.7666015625, -4.60107421875, -4.435546875, -4.27001953125, -4.1044921875, -3.93896484375, -3.7734375, -3.60791015625, -3.4423828125, -3.27685546875, -3.111328125, -2.94580078125, -2.7802734375, -2.61474609375, -2.44921875, -2.28369140625, -2.1181640625, -1.95263671875, -1.787109375, -1.62158203125, -1.4560546875, -1.29052734375, -1.125, -0.95947265625, -0.7939453125, -0.62841796875, -0.462890625, -0.29736328125, -0.1318359375, 0.03369140625, 0.19921875, 0.36474609375, 0.5302734375, 0.69580078125, 0.861328125, 1.02685546875, 1.1923828125, 1.35791015625, 1.5234375, 1.68896484375, 1.8544921875, 2.02001953125, 2.185546875, 2.35107421875, 2.5166015625, 2.68212890625, 2.84765625, 3.01318359375, 3.1787109375, 3.34423828125, 3.509765625, 3.67529296875, 3.8408203125, 4.00634765625, 4.171875, 4.33740234375, 4.5029296875, 4.66845703125, 4.833984375, 4.99951171875, 5.1650390625, 5.33056640625, 5.49609375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 8.0, 6.0, 11.0, 16.0, 27.0, 25.0, 48.0, 37.0, 75.0, 81.0, 97.0, 149.0, 196.0, 236.0, 384.0, 484.0, 720.0, 1214.0, 2233.0, 4351.0, 10921.0, 42043.0, 3687348.0, 399094.0, 26787.0, 8546.0, 3647.0, 1959.0, 1141.0, 697.0, 456.0, 325.0, 225.0, 178.0, 110.0, 100.0, 76.0, 41.0, 47.0, 21.0, 24.0, 17.0, 14.0, 17.0, 12.0, 8.0, 5.0, 3.0, 5.0, 2.0, 0.0, 4.0, 1.0, 1.0], "bins": [-26.9375, -26.117919921875, -25.29833984375, -24.478759765625, -23.6591796875, -22.839599609375, -22.02001953125, -21.200439453125, -20.380859375, -19.561279296875, -18.74169921875, -17.922119140625, -17.1025390625, -16.282958984375, -15.46337890625, -14.643798828125, -13.82421875, -13.004638671875, -12.18505859375, -11.365478515625, -10.5458984375, -9.726318359375, -8.90673828125, -8.087158203125, -7.267578125, -6.447998046875, -5.62841796875, -4.808837890625, -3.9892578125, -3.169677734375, -2.35009765625, -1.530517578125, -0.7109375, 0.108642578125, 0.92822265625, 1.747802734375, 2.5673828125, 3.386962890625, 4.20654296875, 5.026123046875, 5.845703125, 6.665283203125, 7.48486328125, 8.304443359375, 9.1240234375, 9.943603515625, 10.76318359375, 11.582763671875, 12.40234375, 13.221923828125, 14.04150390625, 14.861083984375, 15.6806640625, 16.500244140625, 17.31982421875, 18.139404296875, 18.958984375, 19.778564453125, 20.59814453125, 21.417724609375, 22.2373046875, 23.056884765625, 23.87646484375, 24.696044921875, 25.515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 10.0, 9.0, 22.0, 43.0, 122.0, 1500.0, 2106.0, 130.0, 51.0, 15.0, 19.0, 8.0, 3.0, 3.0, 4.0, 9.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.94342041015625, -7.7227783203125, -7.50213623046875, -7.281494140625, -7.06085205078125, -6.8402099609375, -6.61956787109375, -6.39892578125, -6.17828369140625, -5.9576416015625, -5.73699951171875, -5.516357421875, -5.29571533203125, -5.0750732421875, -4.85443115234375, -4.6337890625, -4.41314697265625, -4.1925048828125, -3.97186279296875, -3.751220703125, -3.53057861328125, -3.3099365234375, -3.08929443359375, -2.86865234375, -2.64801025390625, -2.4273681640625, -2.20672607421875, -1.986083984375, -1.76544189453125, -1.5447998046875, -1.32415771484375, -1.103515625, -0.88287353515625, -0.6622314453125, -0.44158935546875, -0.220947265625, -0.00030517578125, 0.2203369140625, 0.44097900390625, 0.66162109375, 0.88226318359375, 1.1029052734375, 1.32354736328125, 1.544189453125, 1.76483154296875, 1.9854736328125, 2.20611572265625, 2.4267578125, 2.64739990234375, 2.8680419921875, 3.08868408203125, 3.309326171875, 3.52996826171875, 3.7506103515625, 3.97125244140625, 4.19189453125, 4.41253662109375, 4.6331787109375, 4.85382080078125, 5.074462890625, 5.29510498046875, 5.5157470703125, 5.73638916015625, 5.95703125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 10.0, 19.0, 51.0, 106.0, 169.0, 201.0, 191.0, 118.0, 67.0, 37.0, 16.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.04270935058594, -50.791961669921875, -49.54121398925781, -48.290462493896484, -47.03971481323242, -45.78896713256836, -44.5382194519043, -43.28746795654297, -42.036720275878906, -40.785972595214844, -39.53522491455078, -38.28447341918945, -37.03372573852539, -35.78297805786133, -34.532230377197266, -33.28147888183594, -32.030731201171875, -30.779983520507812, -29.529233932495117, -28.278486251831055, -27.02773666381836, -25.776988983154297, -24.526241302490234, -23.27549171447754, -22.02474594116211, -20.773998260498047, -19.52324867248535, -18.27250099182129, -17.021751403808594, -15.771003723144531, -14.520255088806152, -13.269506454467773, -12.018754959106445, -10.768006324768066, -9.517257690429688, -8.266510009765625, -7.015760898590088, -5.765012264251709, -4.514264106750488, -3.2635154724121094, -2.0127668380737305, -0.7620183229446411, 0.48873019218444824, 1.739478588104248, 2.990227222442627, 4.240975856781006, 5.491724014282227, 6.7424726486206055, 7.993221282958984, 9.243969917297363, 10.494718551635742, 11.745466232299805, 12.9962158203125, 14.246963500976562, 15.497712135314941, 16.74846076965332, 17.999210357666016, 19.249958038330078, 20.500707626342773, 21.751455307006836, 23.00220489501953, 24.252952575683594, 25.503700256347656, 26.75444984436035, 28.005197525024414]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 7.0, 3.0, 6.0, 12.0, 5.0, 15.0, 20.0, 16.0, 22.0, 17.0, 17.0, 26.0, 15.0, 31.0, 34.0, 38.0, 28.0, 34.0, 31.0, 38.0, 38.0, 46.0, 44.0, 47.0, 37.0, 35.0, 35.0, 26.0, 38.0, 27.0, 17.0, 25.0, 31.0, 34.0, 24.0, 8.0, 13.0, 16.0, 15.0, 8.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.579087257385254, -10.251937866210938, -9.924788475036621, -9.597639083862305, -9.270489692687988, -8.943340301513672, -8.616190910339355, -8.289041519165039, -7.961892604827881, -7.6347432136535645, -7.307593822479248, -6.980444431304932, -6.653295516967773, -6.326146125793457, -5.998996734619141, -5.671847343444824, -5.344697952270508, -5.017548561096191, -4.690399169921875, -4.363249778747559, -4.036100387573242, -3.708951234817505, -3.3818020820617676, -3.054652690887451, -2.7275032997131348, -2.4003539085388184, -2.073204517364502, -1.7460553646087646, -1.4189059734344482, -1.0917565822601318, -0.764607310295105, -0.4374580383300781, -0.11030769348144531, 0.21684163808822632, 0.543990969657898, 0.8711403012275696, 1.1982896327972412, 1.5254390239715576, 1.8525882959365845, 2.1797375679016113, 2.5068869590759277, 2.834036350250244, 3.1611857414245605, 3.488334894180298, 3.8154842853546143, 4.142633438110352, 4.469782829284668, 4.796932220458984, 5.124081611633301, 5.451231002807617, 5.778380393981934, 6.10552978515625, 6.432679176330566, 6.759828567504883, 7.086977481842041, 7.414126873016357, 7.741276264190674, 8.068425178527832, 8.395574569702148, 8.722723960876465, 9.049873352050781, 9.377022743225098, 9.704172134399414, 10.03132152557373, 10.358470916748047]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 7.0, 11.0, 13.0, 16.0, 18.0, 36.0, 74.0, 92.0, 143.0, 222.0, 395.0, 655.0, 1242.0, 2133.0, 3922.0, 7653.0, 14354.0, 28558.0, 56546.0, 109120.0, 187260.0, 233706.0, 183607.0, 106152.0, 54677.0, 27822.0, 14109.0, 7201.0, 4015.0, 2063.0, 1155.0, 593.0, 394.0, 199.0, 124.0, 83.0, 56.0, 37.0, 27.0, 18.0, 18.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.2607421875, -8.935546875, -8.6103515625, -8.28515625, -7.9599609375, -7.634765625, -7.3095703125, -6.984375, -6.6591796875, -6.333984375, -6.0087890625, -5.68359375, -5.3583984375, -5.033203125, -4.7080078125, -4.3828125, -4.0576171875, -3.732421875, -3.4072265625, -3.08203125, -2.7568359375, -2.431640625, -2.1064453125, -1.78125, -1.4560546875, -1.130859375, -0.8056640625, -0.48046875, -0.1552734375, 0.169921875, 0.4951171875, 0.8203125, 1.1455078125, 1.470703125, 1.7958984375, 2.12109375, 2.4462890625, 2.771484375, 3.0966796875, 3.421875, 3.7470703125, 4.072265625, 4.3974609375, 4.72265625, 5.0478515625, 5.373046875, 5.6982421875, 6.0234375, 6.3486328125, 6.673828125, 6.9990234375, 7.32421875, 7.6494140625, 7.974609375, 8.2998046875, 8.625, 8.9501953125, 9.275390625, 9.6005859375, 9.92578125, 10.2509765625, 10.576171875, 10.9013671875, 11.2265625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 7.0, 16.0, 16.0, 15.0, 21.0, 24.0, 23.0, 33.0, 29.0, 29.0, 45.0, 45.0, 44.0, 48.0, 52.0, 40.0, 53.0, 42.0, 44.0, 34.0, 46.0, 43.0, 35.0, 28.0, 29.0, 25.0, 29.0, 13.0, 15.0, 11.0, 11.0, 8.0, 6.0, 11.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41796875, -5.2421875, -5.06640625, -4.890625, -4.71484375, -4.5390625, -4.36328125, -4.1875, -4.01171875, -3.8359375, -3.66015625, -3.484375, -3.30859375, -3.1328125, -2.95703125, -2.78125, -2.60546875, -2.4296875, -2.25390625, -2.078125, -1.90234375, -1.7265625, -1.55078125, -1.375, -1.19921875, -1.0234375, -0.84765625, -0.671875, -0.49609375, -0.3203125, -0.14453125, 0.03125, 0.20703125, 0.3828125, 0.55859375, 0.734375, 0.91015625, 1.0859375, 1.26171875, 1.4375, 1.61328125, 1.7890625, 1.96484375, 2.140625, 2.31640625, 2.4921875, 2.66796875, 2.84375, 3.01953125, 3.1953125, 3.37109375, 3.546875, 3.72265625, 3.8984375, 4.07421875, 4.25, 4.42578125, 4.6015625, 4.77734375, 4.953125, 5.12890625, 5.3046875, 5.48046875, 5.65625, 5.83203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 2.0, 10.0, 5.0, 4.0, 17.0, 15.0, 14.0, 20.0, 40.0, 59.0, 74.0, 99.0, 144.0, 194.0, 286.0, 413.0, 688.0, 1390.0, 3278.0, 10574.0, 43762.0, 221674.0, 548174.0, 168803.0, 34223.0, 8580.0, 2855.0, 1232.0, 619.0, 380.0, 235.0, 170.0, 116.0, 98.0, 68.0, 52.0, 33.0, 40.0, 19.0, 19.0, 12.0, 9.0, 12.0, 8.0, 4.0, 6.0, 5.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-21.078125, -20.4072265625, -19.736328125, -19.0654296875, -18.39453125, -17.7236328125, -17.052734375, -16.3818359375, -15.7109375, -15.0400390625, -14.369140625, -13.6982421875, -13.02734375, -12.3564453125, -11.685546875, -11.0146484375, -10.34375, -9.6728515625, -9.001953125, -8.3310546875, -7.66015625, -6.9892578125, -6.318359375, -5.6474609375, -4.9765625, -4.3056640625, -3.634765625, -2.9638671875, -2.29296875, -1.6220703125, -0.951171875, -0.2802734375, 0.390625, 1.0615234375, 1.732421875, 2.4033203125, 3.07421875, 3.7451171875, 4.416015625, 5.0869140625, 5.7578125, 6.4287109375, 7.099609375, 7.7705078125, 8.44140625, 9.1123046875, 9.783203125, 10.4541015625, 11.125, 11.7958984375, 12.466796875, 13.1376953125, 13.80859375, 14.4794921875, 15.150390625, 15.8212890625, 16.4921875, 17.1630859375, 17.833984375, 18.5048828125, 19.17578125, 19.8466796875, 20.517578125, 21.1884765625, 21.859375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 6.0, 5.0, 3.0, 1.0, 4.0, 9.0, 8.0, 12.0, 12.0, 12.0, 19.0, 28.0, 21.0, 23.0, 31.0, 32.0, 21.0, 42.0, 35.0, 43.0, 45.0, 32.0, 42.0, 53.0, 42.0, 33.0, 42.0, 42.0, 47.0, 30.0, 34.0, 26.0, 25.0, 19.0, 21.0, 13.0, 20.0, 12.0, 13.0, 16.0, 10.0, 4.0, 6.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.59375, -26.818603515625, -26.04345703125, -25.268310546875, -24.4931640625, -23.718017578125, -22.94287109375, -22.167724609375, -21.392578125, -20.617431640625, -19.84228515625, -19.067138671875, -18.2919921875, -17.516845703125, -16.74169921875, -15.966552734375, -15.19140625, -14.416259765625, -13.64111328125, -12.865966796875, -12.0908203125, -11.315673828125, -10.54052734375, -9.765380859375, -8.990234375, -8.215087890625, -7.43994140625, -6.664794921875, -5.8896484375, -5.114501953125, -4.33935546875, -3.564208984375, -2.7890625, -2.013916015625, -1.23876953125, -0.463623046875, 0.3115234375, 1.086669921875, 1.86181640625, 2.636962890625, 3.412109375, 4.187255859375, 4.96240234375, 5.737548828125, 6.5126953125, 7.287841796875, 8.06298828125, 8.838134765625, 9.61328125, 10.388427734375, 11.16357421875, 11.938720703125, 12.7138671875, 13.489013671875, 14.26416015625, 15.039306640625, 15.814453125, 16.589599609375, 17.36474609375, 18.139892578125, 18.9150390625, 19.690185546875, 20.46533203125, 21.240478515625, 22.015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 7.0, 8.0, 6.0, 11.0, 15.0, 18.0, 32.0, 45.0, 65.0, 91.0, 165.0, 253.0, 398.0, 680.0, 1301.0, 2474.0, 5652.0, 16066.0, 59726.0, 283070.0, 501843.0, 129656.0, 29915.0, 9364.0, 3662.0, 1798.0, 852.0, 504.0, 296.0, 202.0, 129.0, 92.0, 48.0, 34.0, 19.0, 17.0, 11.0, 12.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.1640625, -9.8673095703125, -9.570556640625, -9.2738037109375, -8.97705078125, -8.6802978515625, -8.383544921875, -8.0867919921875, -7.7900390625, -7.4932861328125, -7.196533203125, -6.8997802734375, -6.60302734375, -6.3062744140625, -6.009521484375, -5.7127685546875, -5.416015625, -5.1192626953125, -4.822509765625, -4.5257568359375, -4.22900390625, -3.9322509765625, -3.635498046875, -3.3387451171875, -3.0419921875, -2.7452392578125, -2.448486328125, -2.1517333984375, -1.85498046875, -1.5582275390625, -1.261474609375, -0.9647216796875, -0.66796875, -0.3712158203125, -0.074462890625, 0.2222900390625, 0.51904296875, 0.8157958984375, 1.112548828125, 1.4093017578125, 1.7060546875, 2.0028076171875, 2.299560546875, 2.5963134765625, 2.89306640625, 3.1898193359375, 3.486572265625, 3.7833251953125, 4.080078125, 4.3768310546875, 4.673583984375, 4.9703369140625, 5.26708984375, 5.5638427734375, 5.860595703125, 6.1573486328125, 6.4541015625, 6.7508544921875, 7.047607421875, 7.3443603515625, 7.64111328125, 7.9378662109375, 8.234619140625, 8.5313720703125, 8.828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 10.0, 9.0, 10.0, 28.0, 34.0, 68.0, 73.0, 98.0, 129.0, 135.0, 116.0, 100.0, 59.0, 53.0, 19.0, 16.0, 13.0, 8.0, 5.0, 7.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002246856689453125, -0.002157449722290039, -0.002068042755126953, -0.001978635787963867, -0.0018892288208007812, -0.0017998218536376953, -0.0017104148864746094, -0.0016210079193115234, -0.0015316009521484375, -0.0014421939849853516, -0.0013527870178222656, -0.0012633800506591797, -0.0011739730834960938, -0.0010845661163330078, -0.0009951591491699219, -0.0009057521820068359, -0.00081634521484375, -0.0007269382476806641, -0.0006375312805175781, -0.0005481243133544922, -0.00045871734619140625, -0.0003693103790283203, -0.0002799034118652344, -0.00019049644470214844, -0.0001010894775390625, -1.1682510375976562e-05, 7.772445678710938e-05, 0.0001671314239501953, 0.00025653839111328125, 0.0003459453582763672, 0.0004353523254394531, 0.0005247592926025391, 0.000614166259765625, 0.0007035732269287109, 0.0007929801940917969, 0.0008823871612548828, 0.0009717941284179688, 0.0010612010955810547, 0.0011506080627441406, 0.0012400150299072266, 0.0013294219970703125, 0.0014188289642333984, 0.0015082359313964844, 0.0015976428985595703, 0.0016870498657226562, 0.0017764568328857422, 0.0018658638000488281, 0.001955270767211914, 0.002044677734375, 0.002134084701538086, 0.002223491668701172, 0.002312898635864258, 0.0024023056030273438, 0.0024917125701904297, 0.0025811195373535156, 0.0026705265045166016, 0.0027599334716796875, 0.0028493404388427734, 0.0029387474060058594, 0.0030281543731689453, 0.0031175613403320312, 0.003206968307495117, 0.003296375274658203, 0.003385782241821289, 0.003475189208984375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 4.0, 2.0, 7.0, 9.0, 11.0, 15.0, 29.0, 26.0, 56.0, 87.0, 128.0, 268.0, 556.0, 1381.0, 4383.0, 22641.0, 274300.0, 670402.0, 61790.0, 8431.0, 2269.0, 876.0, 390.0, 194.0, 113.0, 85.0, 39.0, 24.0, 9.0, 14.0, 9.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.078125, -17.51708984375, -16.9560546875, -16.39501953125, -15.833984375, -15.27294921875, -14.7119140625, -14.15087890625, -13.58984375, -13.02880859375, -12.4677734375, -11.90673828125, -11.345703125, -10.78466796875, -10.2236328125, -9.66259765625, -9.1015625, -8.54052734375, -7.9794921875, -7.41845703125, -6.857421875, -6.29638671875, -5.7353515625, -5.17431640625, -4.61328125, -4.05224609375, -3.4912109375, -2.93017578125, -2.369140625, -1.80810546875, -1.2470703125, -0.68603515625, -0.125, 0.43603515625, 0.9970703125, 1.55810546875, 2.119140625, 2.68017578125, 3.2412109375, 3.80224609375, 4.36328125, 4.92431640625, 5.4853515625, 6.04638671875, 6.607421875, 7.16845703125, 7.7294921875, 8.29052734375, 8.8515625, 9.41259765625, 9.9736328125, 10.53466796875, 11.095703125, 11.65673828125, 12.2177734375, 12.77880859375, 13.33984375, 13.90087890625, 14.4619140625, 15.02294921875, 15.583984375, 16.14501953125, 16.7060546875, 17.26708984375, 17.828125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 1.0, 2.0, 2.0, 6.0, 8.0, 11.0, 14.0, 15.0, 32.0, 24.0, 43.0, 61.0, 66.0, 66.0, 84.0, 95.0, 78.0, 73.0, 75.0, 53.0, 46.0, 33.0, 29.0, 21.0, 22.0, 19.0, 6.0, 6.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7421875, -12.36279296875, -11.9833984375, -11.60400390625, -11.224609375, -10.84521484375, -10.4658203125, -10.08642578125, -9.70703125, -9.32763671875, -8.9482421875, -8.56884765625, -8.189453125, -7.81005859375, -7.4306640625, -7.05126953125, -6.671875, -6.29248046875, -5.9130859375, -5.53369140625, -5.154296875, -4.77490234375, -4.3955078125, -4.01611328125, -3.63671875, -3.25732421875, -2.8779296875, -2.49853515625, -2.119140625, -1.73974609375, -1.3603515625, -0.98095703125, -0.6015625, -0.22216796875, 0.1572265625, 0.53662109375, 0.916015625, 1.29541015625, 1.6748046875, 2.05419921875, 2.43359375, 2.81298828125, 3.1923828125, 3.57177734375, 3.951171875, 4.33056640625, 4.7099609375, 5.08935546875, 5.46875, 5.84814453125, 6.2275390625, 6.60693359375, 6.986328125, 7.36572265625, 7.7451171875, 8.12451171875, 8.50390625, 8.88330078125, 9.2626953125, 9.64208984375, 10.021484375, 10.40087890625, 10.7802734375, 11.15966796875, 11.5390625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [7.0, 4.0, 10.0, 25.0, 50.0, 82.0, 148.0, 203.0, 180.0, 146.0, 82.0, 49.0, 10.0, 9.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.85733795166016, -56.6220703125, -48.386802673339844, -40.15153884887695, -31.916271209716797, -23.68100357055664, -15.44573974609375, -7.210472106933594, 1.0247955322265625, 9.260062217712402, 17.495328903198242, 25.730594635009766, 33.96586227416992, 42.20112991333008, 50.43639373779297, 58.671661376953125, 66.90692901611328, 75.14219665527344, 83.3774642944336, 91.61273193359375, 99.84799194335938, 108.08326721191406, 116.31852722167969, 124.55379486083984, 132.7890625, 141.02432250976562, 149.2595977783203, 157.49485778808594, 165.73013305664062, 173.96539306640625, 182.20065307617188, 190.43592834472656, 198.67120361328125, 206.90646362304688, 215.14173889160156, 223.3769989013672, 231.61227416992188, 239.8475341796875, 248.08279418945312, 256.31805419921875, 264.5533447265625, 272.7886047363281, 281.02386474609375, 289.2591552734375, 297.4944152832031, 305.72967529296875, 313.9649353027344, 322.2001953125, 330.43548583984375, 338.6707458496094, 346.906005859375, 355.14129638671875, 363.3765563964844, 371.61181640625, 379.8470764160156, 388.08233642578125, 396.3175964355469, 404.5528564453125, 412.7881164550781, 421.0234069824219, 429.2586669921875, 437.4939270019531, 445.72918701171875, 453.9644775390625, 462.1997375488281]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 7.0, 5.0, 4.0, 12.0, 12.0, 7.0, 16.0, 14.0, 29.0, 20.0, 30.0, 28.0, 29.0, 26.0, 49.0, 37.0, 40.0, 62.0, 62.0, 51.0, 53.0, 49.0, 51.0, 43.0, 31.0, 34.0, 28.0, 24.0, 29.0, 17.0, 21.0, 16.0, 18.0, 9.0, 12.0, 14.0, 1.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-119.9652099609375, -115.71774291992188, -111.47027587890625, -107.22280883789062, -102.975341796875, -98.72787475585938, -94.48041534423828, -90.23294830322266, -85.98548126220703, -81.7380142211914, -77.49054718017578, -73.24308013916016, -68.99562072753906, -64.74815368652344, -60.50068664550781, -56.25321960449219, -52.00575256347656, -47.75828552246094, -43.51081848144531, -39.26335525512695, -35.01588821411133, -30.768421173095703, -26.52095603942871, -22.27349090576172, -18.026023864746094, -13.778557777404785, -9.531091690063477, -5.283625602722168, -1.0361595153808594, 3.2113075256347656, 7.458772659301758, 11.70623779296875, 15.953704833984375, 20.201171875, 24.448637008666992, 28.696102142333984, 32.94356918334961, 37.191036224365234, 41.438499450683594, 45.68596649169922, 49.933433532714844, 54.18090057373047, 58.428367614746094, 62.67583084106445, 66.92329406738281, 71.17076110839844, 75.41822814941406, 79.66569519042969, 83.91316223144531, 88.16062927246094, 92.40809631347656, 96.65556335449219, 100.90303039550781, 105.15049743652344, 109.39795684814453, 113.64542388916016, 117.89289093017578, 122.1403579711914, 126.38782501220703, 130.63528442382812, 134.88275146484375, 139.13021850585938, 143.377685546875, 147.62515258789062, 151.87261962890625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 9.0, 8.0, 22.0, 26.0, 41.0, 77.0, 111.0, 193.0, 348.0, 745.0, 1875.0, 6522.0, 69007.0, 4080368.0, 28075.0, 4264.0, 1357.0, 544.0, 279.0, 153.0, 87.0, 59.0, 37.0, 20.0, 24.0, 12.0, 11.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-49.9375, -48.668701171875, -47.39990234375, -46.131103515625, -44.8623046875, -43.593505859375, -42.32470703125, -41.055908203125, -39.787109375, -38.518310546875, -37.24951171875, -35.980712890625, -34.7119140625, -33.443115234375, -32.17431640625, -30.905517578125, -29.63671875, -28.367919921875, -27.09912109375, -25.830322265625, -24.5615234375, -23.292724609375, -22.02392578125, -20.755126953125, -19.486328125, -18.217529296875, -16.94873046875, -15.679931640625, -14.4111328125, -13.142333984375, -11.87353515625, -10.604736328125, -9.3359375, -8.067138671875, -6.79833984375, -5.529541015625, -4.2607421875, -2.991943359375, -1.72314453125, -0.454345703125, 0.814453125, 2.083251953125, 3.35205078125, 4.620849609375, 5.8896484375, 7.158447265625, 8.42724609375, 9.696044921875, 10.96484375, 12.233642578125, 13.50244140625, 14.771240234375, 16.0400390625, 17.308837890625, 18.57763671875, 19.846435546875, 21.115234375, 22.384033203125, 23.65283203125, 24.921630859375, 26.1904296875, 27.459228515625, 28.72802734375, 29.996826171875, 31.265625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 13.0, 16.0, 15.0, 18.0, 14.0, 27.0, 21.0, 32.0, 32.0, 36.0, 37.0, 59.0, 47.0, 47.0, 36.0, 41.0, 56.0, 47.0, 55.0, 57.0, 41.0, 41.0, 30.0, 37.0, 36.0, 20.0, 20.0, 15.0, 13.0, 6.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.3671875, -6.1876220703125, -6.008056640625, -5.8284912109375, -5.64892578125, -5.4693603515625, -5.289794921875, -5.1102294921875, -4.9306640625, -4.7510986328125, -4.571533203125, -4.3919677734375, -4.21240234375, -4.0328369140625, -3.853271484375, -3.6737060546875, -3.494140625, -3.3145751953125, -3.135009765625, -2.9554443359375, -2.77587890625, -2.5963134765625, -2.416748046875, -2.2371826171875, -2.0576171875, -1.8780517578125, -1.698486328125, -1.5189208984375, -1.33935546875, -1.1597900390625, -0.980224609375, -0.8006591796875, -0.62109375, -0.4415283203125, -0.261962890625, -0.0823974609375, 0.09716796875, 0.2767333984375, 0.456298828125, 0.6358642578125, 0.8154296875, 0.9949951171875, 1.174560546875, 1.3541259765625, 1.53369140625, 1.7132568359375, 1.892822265625, 2.0723876953125, 2.251953125, 2.4315185546875, 2.611083984375, 2.7906494140625, 2.97021484375, 3.1497802734375, 3.329345703125, 3.5089111328125, 3.6884765625, 3.8680419921875, 4.047607421875, 4.2271728515625, 4.40673828125, 4.5863037109375, 4.765869140625, 4.9454345703125, 5.125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 10.0, 11.0, 9.0, 12.0, 17.0, 26.0, 30.0, 33.0, 56.0, 86.0, 82.0, 126.0, 164.0, 241.0, 352.0, 491.0, 886.0, 1587.0, 3464.0, 10685.0, 62933.0, 3924109.0, 161728.0, 17404.0, 4775.0, 1957.0, 1040.0, 644.0, 339.0, 264.0, 175.0, 131.0, 102.0, 66.0, 61.0, 45.0, 41.0, 27.0, 18.0, 15.0, 10.0, 10.0, 6.0, 4.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-29.515625, -28.6640625, -27.8125, -26.9609375, -26.109375, -25.2578125, -24.40625, -23.5546875, -22.703125, -21.8515625, -21.0, -20.1484375, -19.296875, -18.4453125, -17.59375, -16.7421875, -15.890625, -15.0390625, -14.1875, -13.3359375, -12.484375, -11.6328125, -10.78125, -9.9296875, -9.078125, -8.2265625, -7.375, -6.5234375, -5.671875, -4.8203125, -3.96875, -3.1171875, -2.265625, -1.4140625, -0.5625, 0.2890625, 1.140625, 1.9921875, 2.84375, 3.6953125, 4.546875, 5.3984375, 6.25, 7.1015625, 7.953125, 8.8046875, 9.65625, 10.5078125, 11.359375, 12.2109375, 13.0625, 13.9140625, 14.765625, 15.6171875, 16.46875, 17.3203125, 18.171875, 19.0234375, 19.875, 20.7265625, 21.578125, 22.4296875, 23.28125, 24.1328125, 24.984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 7.0, 10.0, 16.0, 32.0, 79.0, 258.0, 3087.0, 368.0, 107.0, 39.0, 28.0, 11.0, 10.0, 2.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6875, -5.435546875, -5.18359375, -4.931640625, -4.6796875, -4.427734375, -4.17578125, -3.923828125, -3.671875, -3.419921875, -3.16796875, -2.916015625, -2.6640625, -2.412109375, -2.16015625, -1.908203125, -1.65625, -1.404296875, -1.15234375, -0.900390625, -0.6484375, -0.396484375, -0.14453125, 0.107421875, 0.359375, 0.611328125, 0.86328125, 1.115234375, 1.3671875, 1.619140625, 1.87109375, 2.123046875, 2.375, 2.626953125, 2.87890625, 3.130859375, 3.3828125, 3.634765625, 3.88671875, 4.138671875, 4.390625, 4.642578125, 4.89453125, 5.146484375, 5.3984375, 5.650390625, 5.90234375, 6.154296875, 6.40625, 6.658203125, 6.91015625, 7.162109375, 7.4140625, 7.666015625, 7.91796875, 8.169921875, 8.421875, 8.673828125, 8.92578125, 9.177734375, 9.4296875, 9.681640625, 9.93359375, 10.185546875, 10.4375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 23.0, 60.0, 178.0, 282.0, 257.0, 118.0, 49.0, 21.0, 6.0, 4.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.32489776611328, -32.373016357421875, -30.421138763427734, -28.46925926208496, -26.517379760742188, -24.56549835205078, -22.61362075805664, -20.661739349365234, -18.709861755371094, -16.75798225402832, -14.806102752685547, -12.854223251342773, -10.90234375, -8.95046329498291, -6.998583793640137, -5.046704292297363, -3.0948238372802734, -1.1429442167282104, 0.8089354038238525, 2.760815143585205, 4.7126946449279785, 6.66457462310791, 8.616454124450684, 10.568333625793457, 12.52021312713623, 14.472092628479004, 16.423973083496094, 18.375852584838867, 20.32773208618164, 22.279611587524414, 24.231491088867188, 26.18337059020996, 28.135250091552734, 30.087129592895508, 32.03900909423828, 33.99089050292969, 35.94276809692383, 37.894649505615234, 39.846527099609375, 41.79840850830078, 43.75028610229492, 45.70216751098633, 47.65404510498047, 49.605926513671875, 51.557804107666016, 53.50968551635742, 55.46156311035156, 57.41344451904297, 59.365325927734375, 61.31720733642578, 63.26908493041992, 65.22096252441406, 67.17284393310547, 69.12472534179688, 71.07660675048828, 73.02848052978516, 74.98036193847656, 76.93224334716797, 78.88412475585938, 80.83599853515625, 82.78787994384766, 84.73976135253906, 86.69164276123047, 88.64351654052734, 90.59539794921875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 12.0, 10.0, 14.0, 21.0, 24.0, 22.0, 24.0, 23.0, 32.0, 23.0, 38.0, 40.0, 40.0, 46.0, 55.0, 50.0, 36.0, 44.0, 36.0, 32.0, 41.0, 52.0, 31.0, 28.0, 32.0, 25.0, 29.0, 26.0, 16.0, 14.0, 10.0, 13.0, 11.0, 10.0, 10.0, 7.0, 2.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.948797225952148, -12.477943420410156, -12.00709056854248, -11.536236763000488, -11.065382957458496, -10.59453010559082, -10.123676300048828, -9.652822494506836, -9.181968688964844, -8.711114883422852, -8.240262031555176, -7.769408226013184, -7.298554420471191, -6.827701091766357, -6.356847763061523, -5.885993957519531, -5.4151411056518555, -4.9442877769470215, -4.473433971405029, -4.002580642700195, -3.5317270755767822, -3.060873508453369, -2.590020179748535, -2.119166612625122, -1.648313045501709, -1.177459478378296, -0.7066060304641724, -0.23575258255004883, 0.23510098457336426, 0.7059545516967773, 1.1768078804016113, 1.6476614475250244, 2.1185150146484375, 2.5893685817718506, 3.0602221488952637, 3.5310754776000977, 4.00192928314209, 4.472782611846924, 4.943635940551758, 5.41448974609375, 5.885343074798584, 6.356196403503418, 6.82705020904541, 7.297903537750244, 7.768756866455078, 8.23961067199707, 8.710464477539062, 9.181317329406738, 9.65217113494873, 10.123024940490723, 10.593877792358398, 11.06473159790039, 11.535585403442383, 12.006439208984375, 12.47729206085205, 12.948145866394043, 13.418998718261719, 13.889852523803711, 14.360705375671387, 14.831559181213379, 15.302412986755371, 15.773265838623047, 16.24411964416504, 16.71497344970703, 17.185827255249023]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 6.0, 16.0, 12.0, 25.0, 31.0, 53.0, 81.0, 130.0, 192.0, 338.0, 605.0, 1036.0, 1869.0, 3532.0, 6872.0, 13764.0, 28289.0, 59235.0, 118521.0, 200710.0, 237319.0, 179865.0, 99815.0, 48818.0, 23209.0, 11400.0, 5865.0, 3082.0, 1534.0, 956.0, 507.0, 312.0, 207.0, 132.0, 65.0, 38.0, 31.0, 25.0, 20.0, 13.0, 8.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-8.3671875, -8.0916748046875, -7.816162109375, -7.5406494140625, -7.26513671875, -6.9896240234375, -6.714111328125, -6.4385986328125, -6.1630859375, -5.8875732421875, -5.612060546875, -5.3365478515625, -5.06103515625, -4.7855224609375, -4.510009765625, -4.2344970703125, -3.958984375, -3.6834716796875, -3.407958984375, -3.1324462890625, -2.85693359375, -2.5814208984375, -2.305908203125, -2.0303955078125, -1.7548828125, -1.4793701171875, -1.203857421875, -0.9283447265625, -0.65283203125, -0.3773193359375, -0.101806640625, 0.1737060546875, 0.44921875, 0.7247314453125, 1.000244140625, 1.2757568359375, 1.55126953125, 1.8267822265625, 2.102294921875, 2.3778076171875, 2.6533203125, 2.9288330078125, 3.204345703125, 3.4798583984375, 3.75537109375, 4.0308837890625, 4.306396484375, 4.5819091796875, 4.857421875, 5.1329345703125, 5.408447265625, 5.6839599609375, 5.95947265625, 6.2349853515625, 6.510498046875, 6.7860107421875, 7.0615234375, 7.3370361328125, 7.612548828125, 7.8880615234375, 8.16357421875, 8.4390869140625, 8.714599609375, 8.9901123046875, 9.265625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 8.0, 3.0, 8.0, 5.0, 6.0, 14.0, 13.0, 21.0, 25.0, 22.0, 30.0, 36.0, 43.0, 40.0, 51.0, 44.0, 57.0, 55.0, 59.0, 53.0, 50.0, 43.0, 49.0, 51.0, 35.0, 38.0, 29.0, 16.0, 24.0, 20.0, 9.0, 10.0, 8.0, 10.0, 7.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.78125, -6.584228515625, -6.38720703125, -6.190185546875, -5.9931640625, -5.796142578125, -5.59912109375, -5.402099609375, -5.205078125, -5.008056640625, -4.81103515625, -4.614013671875, -4.4169921875, -4.219970703125, -4.02294921875, -3.825927734375, -3.62890625, -3.431884765625, -3.23486328125, -3.037841796875, -2.8408203125, -2.643798828125, -2.44677734375, -2.249755859375, -2.052734375, -1.855712890625, -1.65869140625, -1.461669921875, -1.2646484375, -1.067626953125, -0.87060546875, -0.673583984375, -0.4765625, -0.279541015625, -0.08251953125, 0.114501953125, 0.3115234375, 0.508544921875, 0.70556640625, 0.902587890625, 1.099609375, 1.296630859375, 1.49365234375, 1.690673828125, 1.8876953125, 2.084716796875, 2.28173828125, 2.478759765625, 2.67578125, 2.872802734375, 3.06982421875, 3.266845703125, 3.4638671875, 3.660888671875, 3.85791015625, 4.054931640625, 4.251953125, 4.448974609375, 4.64599609375, 4.843017578125, 5.0400390625, 5.237060546875, 5.43408203125, 5.631103515625, 5.828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 13.0, 11.0, 12.0, 13.0, 13.0, 18.0, 35.0, 41.0, 57.0, 68.0, 81.0, 116.0, 169.0, 238.0, 307.0, 485.0, 671.0, 1245.0, 2602.0, 6763.0, 24494.0, 115928.0, 473553.0, 328080.0, 68125.0, 15451.0, 4707.0, 2045.0, 1057.0, 642.0, 408.0, 313.0, 198.0, 157.0, 113.0, 79.0, 59.0, 45.0, 33.0, 24.0, 15.0, 19.0, 12.0, 10.0, 7.0, 4.0, 5.0, 2.0, 9.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-17.171875, -16.64892578125, -16.1259765625, -15.60302734375, -15.080078125, -14.55712890625, -14.0341796875, -13.51123046875, -12.98828125, -12.46533203125, -11.9423828125, -11.41943359375, -10.896484375, -10.37353515625, -9.8505859375, -9.32763671875, -8.8046875, -8.28173828125, -7.7587890625, -7.23583984375, -6.712890625, -6.18994140625, -5.6669921875, -5.14404296875, -4.62109375, -4.09814453125, -3.5751953125, -3.05224609375, -2.529296875, -2.00634765625, -1.4833984375, -0.96044921875, -0.4375, 0.08544921875, 0.6083984375, 1.13134765625, 1.654296875, 2.17724609375, 2.7001953125, 3.22314453125, 3.74609375, 4.26904296875, 4.7919921875, 5.31494140625, 5.837890625, 6.36083984375, 6.8837890625, 7.40673828125, 7.9296875, 8.45263671875, 8.9755859375, 9.49853515625, 10.021484375, 10.54443359375, 11.0673828125, 11.59033203125, 12.11328125, 12.63623046875, 13.1591796875, 13.68212890625, 14.205078125, 14.72802734375, 15.2509765625, 15.77392578125, 16.296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 13.0, 15.0, 18.0, 17.0, 15.0, 30.0, 28.0, 38.0, 31.0, 38.0, 36.0, 53.0, 48.0, 49.0, 62.0, 41.0, 50.0, 44.0, 43.0, 43.0, 41.0, 37.0, 41.0, 35.0, 28.0, 21.0, 11.0, 13.0, 11.0, 5.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.265625, -25.43359375, -24.6015625, -23.76953125, -22.9375, -22.10546875, -21.2734375, -20.44140625, -19.609375, -18.77734375, -17.9453125, -17.11328125, -16.28125, -15.44921875, -14.6171875, -13.78515625, -12.953125, -12.12109375, -11.2890625, -10.45703125, -9.625, -8.79296875, -7.9609375, -7.12890625, -6.296875, -5.46484375, -4.6328125, -3.80078125, -2.96875, -2.13671875, -1.3046875, -0.47265625, 0.359375, 1.19140625, 2.0234375, 2.85546875, 3.6875, 4.51953125, 5.3515625, 6.18359375, 7.015625, 7.84765625, 8.6796875, 9.51171875, 10.34375, 11.17578125, 12.0078125, 12.83984375, 13.671875, 14.50390625, 15.3359375, 16.16796875, 17.0, 17.83203125, 18.6640625, 19.49609375, 20.328125, 21.16015625, 21.9921875, 22.82421875, 23.65625, 24.48828125, 25.3203125, 26.15234375, 26.984375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 1.0, 12.0, 11.0, 17.0, 11.0, 25.0, 30.0, 33.0, 42.0, 76.0, 157.0, 248.0, 482.0, 1088.0, 2846.0, 9708.0, 50884.0, 451359.0, 464040.0, 52417.0, 9844.0, 2923.0, 1134.0, 491.0, 211.0, 143.0, 104.0, 57.0, 44.0, 28.0, 19.0, 15.0, 8.0, 8.0, 12.0, 2.0, 2.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.390625, -10.9979248046875, -10.605224609375, -10.2125244140625, -9.81982421875, -9.4271240234375, -9.034423828125, -8.6417236328125, -8.2490234375, -7.8563232421875, -7.463623046875, -7.0709228515625, -6.67822265625, -6.2855224609375, -5.892822265625, -5.5001220703125, -5.107421875, -4.7147216796875, -4.322021484375, -3.9293212890625, -3.53662109375, -3.1439208984375, -2.751220703125, -2.3585205078125, -1.9658203125, -1.5731201171875, -1.180419921875, -0.7877197265625, -0.39501953125, -0.0023193359375, 0.390380859375, 0.7830810546875, 1.17578125, 1.5684814453125, 1.961181640625, 2.3538818359375, 2.74658203125, 3.1392822265625, 3.531982421875, 3.9246826171875, 4.3173828125, 4.7100830078125, 5.102783203125, 5.4954833984375, 5.88818359375, 6.2808837890625, 6.673583984375, 7.0662841796875, 7.458984375, 7.8516845703125, 8.244384765625, 8.6370849609375, 9.02978515625, 9.4224853515625, 9.815185546875, 10.2078857421875, 10.6005859375, 10.9932861328125, 11.385986328125, 11.7786865234375, 12.17138671875, 12.5640869140625, 12.956787109375, 13.3494873046875, 13.7421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 8.0, 7.0, 9.0, 8.0, 3.0, 14.0, 20.0, 30.0, 40.0, 32.0, 61.0, 67.0, 64.0, 75.0, 96.0, 93.0, 89.0, 79.0, 44.0, 30.0, 27.0, 22.0, 22.0, 15.0, 9.0, 16.0, 6.0, 6.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018682479858398438, -0.0018123835325241089, -0.001756519079208374, -0.0017006546258926392, -0.0016447901725769043, -0.0015889257192611694, -0.0015330612659454346, -0.0014771968126296997, -0.0014213323593139648, -0.00136546790599823, -0.0013096034526824951, -0.0012537389993667603, -0.0011978745460510254, -0.0011420100927352905, -0.0010861456394195557, -0.0010302811861038208, -0.0009744167327880859, -0.0009185522794723511, -0.0008626878261566162, -0.0008068233728408813, -0.0007509589195251465, -0.0006950944662094116, -0.0006392300128936768, -0.0005833655595779419, -0.000527501106262207, -0.00047163665294647217, -0.0004157721996307373, -0.00035990774631500244, -0.0003040432929992676, -0.0002481788396835327, -0.00019231438636779785, -0.000136449933052063, -8.058547973632812e-05, -2.4721026420593262e-05, 3.11434268951416e-05, 8.700788021087646e-05, 0.00014287233352661133, 0.0001987367868423462, 0.00025460124015808105, 0.0003104656934738159, 0.0003663301467895508, 0.00042219460010528564, 0.0004780590534210205, 0.0005339235067367554, 0.0005897879600524902, 0.0006456524133682251, 0.00070151686668396, 0.0007573813199996948, 0.0008132457733154297, 0.0008691102266311646, 0.0009249746799468994, 0.0009808391332626343, 0.0010367035865783691, 0.001092568039894104, 0.0011484324932098389, 0.0012042969465255737, 0.0012601613998413086, 0.0013160258531570435, 0.0013718903064727783, 0.0014277547597885132, 0.001483619213104248, 0.001539483666419983, 0.0015953481197357178, 0.0016512125730514526, 0.0017070770263671875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 6.0, 9.0, 14.0, 52.0, 85.0, 174.0, 448.0, 1431.0, 6982.0, 124925.0, 862803.0, 45853.0, 4080.0, 1051.0, 346.0, 152.0, 67.0, 32.0, 16.0, 12.0, 8.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.453125, -24.690185546875, -23.92724609375, -23.164306640625, -22.4013671875, -21.638427734375, -20.87548828125, -20.112548828125, -19.349609375, -18.586669921875, -17.82373046875, -17.060791015625, -16.2978515625, -15.534912109375, -14.77197265625, -14.009033203125, -13.24609375, -12.483154296875, -11.72021484375, -10.957275390625, -10.1943359375, -9.431396484375, -8.66845703125, -7.905517578125, -7.142578125, -6.379638671875, -5.61669921875, -4.853759765625, -4.0908203125, -3.327880859375, -2.56494140625, -1.802001953125, -1.0390625, -0.276123046875, 0.48681640625, 1.249755859375, 2.0126953125, 2.775634765625, 3.53857421875, 4.301513671875, 5.064453125, 5.827392578125, 6.59033203125, 7.353271484375, 8.1162109375, 8.879150390625, 9.64208984375, 10.405029296875, 11.16796875, 11.930908203125, 12.69384765625, 13.456787109375, 14.2197265625, 14.982666015625, 15.74560546875, 16.508544921875, 17.271484375, 18.034423828125, 18.79736328125, 19.560302734375, 20.3232421875, 21.086181640625, 21.84912109375, 22.612060546875, 23.375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 1.0, 5.0, 5.0, 9.0, 17.0, 29.0, 29.0, 38.0, 50.0, 58.0, 63.0, 67.0, 77.0, 71.0, 83.0, 64.0, 66.0, 67.0, 40.0, 38.0, 34.0, 23.0, 20.0, 14.0, 9.0, 6.0, 3.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6484375, -10.313720703125, -9.97900390625, -9.644287109375, -9.3095703125, -8.974853515625, -8.64013671875, -8.305419921875, -7.970703125, -7.635986328125, -7.30126953125, -6.966552734375, -6.6318359375, -6.297119140625, -5.96240234375, -5.627685546875, -5.29296875, -4.958251953125, -4.62353515625, -4.288818359375, -3.9541015625, -3.619384765625, -3.28466796875, -2.949951171875, -2.615234375, -2.280517578125, -1.94580078125, -1.611083984375, -1.2763671875, -0.941650390625, -0.60693359375, -0.272216796875, 0.0625, 0.397216796875, 0.73193359375, 1.066650390625, 1.4013671875, 1.736083984375, 2.07080078125, 2.405517578125, 2.740234375, 3.074951171875, 3.40966796875, 3.744384765625, 4.0791015625, 4.413818359375, 4.74853515625, 5.083251953125, 5.41796875, 5.752685546875, 6.08740234375, 6.422119140625, 6.7568359375, 7.091552734375, 7.42626953125, 7.760986328125, 8.095703125, 8.430419921875, 8.76513671875, 9.099853515625, 9.4345703125, 9.769287109375, 10.10400390625, 10.438720703125, 10.7734375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 17.0, 59.0, 217.0, 412.0, 203.0, 67.0, 14.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.0657958984375, -149.918701171875, -135.77159118652344, -121.62449645996094, -107.47738647460938, -93.33029174804688, -79.18318939208984, -65.03608703613281, -50.88898468017578, -36.74188232421875, -22.59478187561035, -8.447681427001953, 5.699420928955078, 19.846519470214844, 33.993621826171875, 48.140724182128906, 62.28782653808594, 76.43492889404297, 90.58203125, 104.7291259765625, 118.87623596191406, 133.02333068847656, 147.17044067382812, 161.31753540039062, 175.46463012695312, 189.61172485351562, 203.7588348388672, 217.9059295654297, 232.05303955078125, 246.20013427734375, 260.34722900390625, 274.49432373046875, 288.6414489746094, 302.7885437011719, 316.9356384277344, 331.082763671875, 345.2298583984375, 359.376953125, 373.5240478515625, 387.671142578125, 401.8182678222656, 415.9653625488281, 430.1124572753906, 444.25958251953125, 458.40667724609375, 472.55377197265625, 486.70086669921875, 500.84796142578125, 514.9950561523438, 529.1421508789062, 543.2892456054688, 557.4363403320312, 571.5834350585938, 585.7305908203125, 599.877685546875, 614.0247802734375, 628.171875, 642.3189697265625, 656.466064453125, 670.6131591796875, 684.76025390625, 698.9073486328125, 713.0545043945312, 727.2015991210938, 741.3486938476562]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 5.0, 7.0, 12.0, 14.0, 13.0, 28.0, 18.0, 25.0, 30.0, 32.0, 43.0, 35.0, 34.0, 55.0, 51.0, 49.0, 62.0, 52.0, 54.0, 48.0, 39.0, 44.0, 38.0, 30.0, 26.0, 33.0, 23.0, 19.0, 12.0, 9.0, 11.0, 8.0, 7.0, 5.0, 4.0, 4.0, 1.0, 7.0, 1.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.40972137451172, -119.37999725341797, -115.35027313232422, -111.320556640625, -107.29083251953125, -103.2611083984375, -99.23138427734375, -95.20166015625, -91.17193603515625, -87.1422119140625, -83.11248779296875, -79.082763671875, -75.05304718017578, -71.02332305908203, -66.99359893798828, -62.96387481689453, -58.93415832519531, -54.90443420410156, -50.87471389770508, -46.84498977661133, -42.815269470214844, -38.785545349121094, -34.755821228027344, -30.726099014282227, -26.69637680053711, -22.666654586791992, -18.636932373046875, -14.607208251953125, -10.577486038208008, -6.547763824462891, -2.5180397033691406, 1.5116825103759766, 5.541412353515625, 9.571134567260742, 13.600857734680176, 17.63058090209961, 21.660303115844727, 25.690025329589844, 29.719749450683594, 33.749473571777344, 37.77919387817383, 41.80891799926758, 45.83863830566406, 49.86836242675781, 53.89808654785156, 57.92780685424805, 61.9575309753418, 65.98725128173828, 70.01697540283203, 74.04669952392578, 78.07642364501953, 82.10614013671875, 86.1358642578125, 90.16558837890625, 94.1953125, 98.22503662109375, 102.2547607421875, 106.28448486328125, 110.314208984375, 114.34393310546875, 118.37364959716797, 122.40337371826172, 126.43309783935547, 130.4628143310547, 134.49253845214844]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 3.0, 3.0, 6.0, 9.0, 7.0, 31.0, 51.0, 79.0, 138.0, 290.0, 955.0, 7995.0, 4165280.0, 17421.0, 1271.0, 370.0, 182.0, 65.0, 47.0, 27.0, 18.0, 15.0, 10.0, 8.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.8125, -79.4482421875, -77.083984375, -74.7197265625, -72.35546875, -69.9912109375, -67.626953125, -65.2626953125, -62.8984375, -60.5341796875, -58.169921875, -55.8056640625, -53.44140625, -51.0771484375, -48.712890625, -46.3486328125, -43.984375, -41.6201171875, -39.255859375, -36.8916015625, -34.52734375, -32.1630859375, -29.798828125, -27.4345703125, -25.0703125, -22.7060546875, -20.341796875, -17.9775390625, -15.61328125, -13.2490234375, -10.884765625, -8.5205078125, -6.15625, -3.7919921875, -1.427734375, 0.9365234375, 3.30078125, 5.6650390625, 8.029296875, 10.3935546875, 12.7578125, 15.1220703125, 17.486328125, 19.8505859375, 22.21484375, 24.5791015625, 26.943359375, 29.3076171875, 31.671875, 34.0361328125, 36.400390625, 38.7646484375, 41.12890625, 43.4931640625, 45.857421875, 48.2216796875, 50.5859375, 52.9501953125, 55.314453125, 57.6787109375, 60.04296875, 62.4072265625, 64.771484375, 67.1357421875, 69.5]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 8.0, 4.0, 12.0, 10.0, 13.0, 17.0, 14.0, 27.0, 29.0, 40.0, 44.0, 65.0, 57.0, 52.0, 69.0, 64.0, 69.0, 55.0, 49.0, 54.0, 47.0, 37.0, 35.0, 30.0, 16.0, 23.0, 14.0, 13.0, 5.0, 6.0, 7.0, 3.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.890625, -8.66607666015625, -8.4415283203125, -8.21697998046875, -7.992431640625, -7.76788330078125, -7.5433349609375, -7.31878662109375, -7.09423828125, -6.86968994140625, -6.6451416015625, -6.42059326171875, -6.196044921875, -5.97149658203125, -5.7469482421875, -5.52239990234375, -5.2978515625, -5.07330322265625, -4.8487548828125, -4.62420654296875, -4.399658203125, -4.17510986328125, -3.9505615234375, -3.72601318359375, -3.50146484375, -3.27691650390625, -3.0523681640625, -2.82781982421875, -2.603271484375, -2.37872314453125, -2.1541748046875, -1.92962646484375, -1.705078125, -1.48052978515625, -1.2559814453125, -1.03143310546875, -0.806884765625, -0.58233642578125, -0.3577880859375, -0.13323974609375, 0.09130859375, 0.31585693359375, 0.5404052734375, 0.76495361328125, 0.989501953125, 1.21405029296875, 1.4385986328125, 1.66314697265625, 1.8876953125, 2.11224365234375, 2.3367919921875, 2.56134033203125, 2.785888671875, 3.01043701171875, 3.2349853515625, 3.45953369140625, 3.68408203125, 3.90863037109375, 4.1331787109375, 4.35772705078125, 4.582275390625, 4.80682373046875, 5.0313720703125, 5.25592041015625, 5.48046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 4.0, 17.0, 11.0, 12.0, 23.0, 26.0, 35.0, 57.0, 70.0, 100.0, 147.0, 210.0, 308.0, 513.0, 807.0, 1303.0, 2182.0, 3682.0, 7881.0, 21216.0, 107319.0, 3873390.0, 132598.0, 23664.0, 8589.0, 3988.0, 2275.0, 1373.0, 881.0, 517.0, 341.0, 213.0, 153.0, 87.0, 84.0, 50.0, 38.0, 24.0, 19.0, 16.0, 20.0, 10.0, 4.0, 5.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0], "bins": [-15.125, -14.699462890625, -14.27392578125, -13.848388671875, -13.4228515625, -12.997314453125, -12.57177734375, -12.146240234375, -11.720703125, -11.295166015625, -10.86962890625, -10.444091796875, -10.0185546875, -9.593017578125, -9.16748046875, -8.741943359375, -8.31640625, -7.890869140625, -7.46533203125, -7.039794921875, -6.6142578125, -6.188720703125, -5.76318359375, -5.337646484375, -4.912109375, -4.486572265625, -4.06103515625, -3.635498046875, -3.2099609375, -2.784423828125, -2.35888671875, -1.933349609375, -1.5078125, -1.082275390625, -0.65673828125, -0.231201171875, 0.1943359375, 0.619873046875, 1.04541015625, 1.470947265625, 1.896484375, 2.322021484375, 2.74755859375, 3.173095703125, 3.5986328125, 4.024169921875, 4.44970703125, 4.875244140625, 5.30078125, 5.726318359375, 6.15185546875, 6.577392578125, 7.0029296875, 7.428466796875, 7.85400390625, 8.279541015625, 8.705078125, 9.130615234375, 9.55615234375, 9.981689453125, 10.4072265625, 10.832763671875, 11.25830078125, 11.683837890625, 12.109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 2.0, 6.0, 6.0, 8.0, 12.0, 20.0, 50.0, 95.0, 296.0, 3092.0, 260.0, 91.0, 41.0, 26.0, 15.0, 12.0, 7.0, 5.0, 6.0, 2.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.05078125, -3.929656982421875, -3.80853271484375, -3.687408447265625, -3.5662841796875, -3.445159912109375, -3.32403564453125, -3.202911376953125, -3.081787109375, -2.960662841796875, -2.83953857421875, -2.718414306640625, -2.5972900390625, -2.476165771484375, -2.35504150390625, -2.233917236328125, -2.11279296875, -1.991668701171875, -1.87054443359375, -1.749420166015625, -1.6282958984375, -1.507171630859375, -1.38604736328125, -1.264923095703125, -1.143798828125, -1.022674560546875, -0.90155029296875, -0.780426025390625, -0.6593017578125, -0.538177490234375, -0.41705322265625, -0.295928955078125, -0.1748046875, -0.053680419921875, 0.06744384765625, 0.188568115234375, 0.3096923828125, 0.430816650390625, 0.55194091796875, 0.673065185546875, 0.794189453125, 0.915313720703125, 1.03643798828125, 1.157562255859375, 1.2786865234375, 1.399810791015625, 1.52093505859375, 1.642059326171875, 1.76318359375, 1.884307861328125, 2.00543212890625, 2.126556396484375, 2.2476806640625, 2.368804931640625, 2.48992919921875, 2.611053466796875, 2.732177734375, 2.853302001953125, 2.97442626953125, 3.095550537109375, 3.2166748046875, 3.337799072265625, 3.45892333984375, 3.580047607421875, 3.701171875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 8.0, 34.0, 51.0, 153.0, 217.0, 247.0, 143.0, 77.0, 41.0, 15.0, 11.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.020355224609375, -41.02103805541992, -40.021724700927734, -39.02240753173828, -38.023094177246094, -37.02377700805664, -36.02445983886719, -35.025146484375, -34.02582931518555, -33.026512145996094, -32.027198791503906, -31.027881622314453, -30.028566360473633, -29.029251098632812, -28.029935836791992, -27.030620574951172, -26.031307220458984, -25.031991958618164, -24.032676696777344, -23.03335952758789, -22.03404426574707, -21.03472900390625, -20.03541374206543, -19.03609848022461, -18.036781311035156, -17.037466049194336, -16.038150787353516, -15.038834571838379, -14.039519309997559, -13.040203094482422, -12.040887832641602, -11.041572570800781, -10.042257308959961, -9.04294204711914, -8.043625831604004, -7.044310569763184, -6.044995307922363, -5.045679569244385, -4.046363830566406, -3.047048568725586, -2.0477328300476074, -1.048417329788208, -0.04910171031951904, 0.9502139091491699, 1.9495294094085693, 2.9488449096679688, 3.9481606483459473, 4.947475910186768, 5.946791648864746, 6.946107387542725, 7.945422649383545, 8.944738388061523, 9.944053649902344, 10.943368911743164, 11.9426851272583, 12.942000389099121, 13.941316604614258, 14.940631866455078, 15.939948081970215, 16.93926239013672, 17.938579559326172, 18.937894821166992, 19.937210083007812, 20.936525344848633, 21.935840606689453]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 8.0, 5.0, 5.0, 7.0, 13.0, 12.0, 12.0, 20.0, 14.0, 21.0, 21.0, 25.0, 22.0, 30.0, 24.0, 28.0, 33.0, 29.0, 38.0, 33.0, 42.0, 44.0, 29.0, 38.0, 34.0, 43.0, 38.0, 41.0, 43.0, 29.0, 36.0, 23.0, 15.0, 16.0, 16.0, 14.0, 9.0, 10.0, 12.0, 15.0, 9.0, 9.0, 5.0, 8.0, 6.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-6.314723014831543, -6.115884780883789, -5.917046070098877, -5.718207836151123, -5.519369125366211, -5.320530891418457, -5.121692657470703, -4.922853946685791, -4.724015235900879, -4.525177001953125, -4.326338291168213, -4.127500057220459, -3.928661346435547, -3.729823112487793, -3.53098464012146, -3.332146167755127, -3.133307933807373, -2.93446946144104, -2.735630989074707, -2.536792755126953, -2.337954044342041, -2.139115810394287, -1.940277338027954, -1.741438865661621, -1.542600393295288, -1.343761920928955, -1.144923448562622, -0.9460850954055786, -0.7472466230392456, -0.5484081506729126, -0.34956979751586914, -0.15073132514953613, 0.04810762405395508, 0.2469460666179657, 0.4457845091819763, 0.6446229219436646, 0.8434613943099976, 1.0422998666763306, 1.241138219833374, 1.439976692199707, 1.63881516456604, 1.837653636932373, 2.036492109298706, 2.235330581665039, 2.434168815612793, 2.633007526397705, 2.831845760345459, 3.030684232711792, 3.229522705078125, 3.428361177444458, 3.627199649810791, 3.826037883758545, 4.024876594543457, 4.223714828491211, 4.422553062438965, 4.621391773223877, 4.820230484008789, 5.019068717956543, 5.217907428741455, 5.416745662689209, 5.615584373474121, 5.814422607421875, 6.013260841369629, 6.212099552154541, 6.410937786102295]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 5.0, 9.0, 6.0, 21.0, 37.0, 33.0, 65.0, 125.0, 213.0, 368.0, 627.0, 1176.0, 2224.0, 4520.0, 9545.0, 20496.0, 44412.0, 94831.0, 184226.0, 263943.0, 209214.0, 111884.0, 53235.0, 24527.0, 11509.0, 5516.0, 2669.0, 1355.0, 743.0, 433.0, 212.0, 136.0, 87.0, 56.0, 25.0, 24.0, 10.0, 12.0, 11.0, 2.0, 7.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0859375, -7.8302001953125, -7.574462890625, -7.3187255859375, -7.06298828125, -6.8072509765625, -6.551513671875, -6.2957763671875, -6.0400390625, -5.7843017578125, -5.528564453125, -5.2728271484375, -5.01708984375, -4.7613525390625, -4.505615234375, -4.2498779296875, -3.994140625, -3.7384033203125, -3.482666015625, -3.2269287109375, -2.97119140625, -2.7154541015625, -2.459716796875, -2.2039794921875, -1.9482421875, -1.6925048828125, -1.436767578125, -1.1810302734375, -0.92529296875, -0.6695556640625, -0.413818359375, -0.1580810546875, 0.09765625, 0.3533935546875, 0.609130859375, 0.8648681640625, 1.12060546875, 1.3763427734375, 1.632080078125, 1.8878173828125, 2.1435546875, 2.3992919921875, 2.655029296875, 2.9107666015625, 3.16650390625, 3.4222412109375, 3.677978515625, 3.9337158203125, 4.189453125, 4.4451904296875, 4.700927734375, 4.9566650390625, 5.21240234375, 5.4681396484375, 5.723876953125, 5.9796142578125, 6.2353515625, 6.4910888671875, 6.746826171875, 7.0025634765625, 7.25830078125, 7.5140380859375, 7.769775390625, 8.0255126953125, 8.28125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 2.0, 6.0, 11.0, 15.0, 21.0, 24.0, 16.0, 35.0, 28.0, 29.0, 56.0, 54.0, 69.0, 48.0, 61.0, 62.0, 54.0, 48.0, 58.0, 52.0, 43.0, 34.0, 26.0, 23.0, 24.0, 16.0, 20.0, 13.0, 15.0, 6.0, 6.0, 7.0, 1.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.64453125, -7.43341064453125, -7.2222900390625, -7.01116943359375, -6.800048828125, -6.58892822265625, -6.3778076171875, -6.16668701171875, -5.95556640625, -5.74444580078125, -5.5333251953125, -5.32220458984375, -5.111083984375, -4.89996337890625, -4.6888427734375, -4.47772216796875, -4.2666015625, -4.05548095703125, -3.8443603515625, -3.63323974609375, -3.422119140625, -3.21099853515625, -2.9998779296875, -2.78875732421875, -2.57763671875, -2.36651611328125, -2.1553955078125, -1.94427490234375, -1.733154296875, -1.52203369140625, -1.3109130859375, -1.09979248046875, -0.888671875, -0.67755126953125, -0.4664306640625, -0.25531005859375, -0.044189453125, 0.16693115234375, 0.3780517578125, 0.58917236328125, 0.80029296875, 1.01141357421875, 1.2225341796875, 1.43365478515625, 1.644775390625, 1.85589599609375, 2.0670166015625, 2.27813720703125, 2.4892578125, 2.70037841796875, 2.9114990234375, 3.12261962890625, 3.333740234375, 3.54486083984375, 3.7559814453125, 3.96710205078125, 4.17822265625, 4.38934326171875, 4.6004638671875, 4.81158447265625, 5.022705078125, 5.23382568359375, 5.4449462890625, 5.65606689453125, 5.8671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 6.0, 11.0, 14.0, 13.0, 25.0, 41.0, 73.0, 128.0, 283.0, 610.0, 1512.0, 7372.0, 190279.0, 811117.0, 32220.0, 2985.0, 990.0, 409.0, 206.0, 97.0, 51.0, 23.0, 25.0, 15.0, 10.0, 5.0, 9.0, 2.0, 4.0, 5.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.28125, -35.1904296875, -34.099609375, -33.0087890625, -31.91796875, -30.8271484375, -29.736328125, -28.6455078125, -27.5546875, -26.4638671875, -25.373046875, -24.2822265625, -23.19140625, -22.1005859375, -21.009765625, -19.9189453125, -18.828125, -17.7373046875, -16.646484375, -15.5556640625, -14.46484375, -13.3740234375, -12.283203125, -11.1923828125, -10.1015625, -9.0107421875, -7.919921875, -6.8291015625, -5.73828125, -4.6474609375, -3.556640625, -2.4658203125, -1.375, -0.2841796875, 0.806640625, 1.8974609375, 2.98828125, 4.0791015625, 5.169921875, 6.2607421875, 7.3515625, 8.4423828125, 9.533203125, 10.6240234375, 11.71484375, 12.8056640625, 13.896484375, 14.9873046875, 16.078125, 17.1689453125, 18.259765625, 19.3505859375, 20.44140625, 21.5322265625, 22.623046875, 23.7138671875, 24.8046875, 25.8955078125, 26.986328125, 28.0771484375, 29.16796875, 30.2587890625, 31.349609375, 32.4404296875, 33.53125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 14.0, 6.0, 8.0, 10.0, 12.0, 23.0, 19.0, 23.0, 24.0, 36.0, 30.0, 26.0, 56.0, 45.0, 45.0, 35.0, 50.0, 51.0, 48.0, 46.0, 44.0, 39.0, 43.0, 45.0, 32.0, 36.0, 40.0, 24.0, 11.0, 20.0, 15.0, 10.0, 8.0, 6.0, 2.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-30.859375, -30.01025390625, -29.1611328125, -28.31201171875, -27.462890625, -26.61376953125, -25.7646484375, -24.91552734375, -24.06640625, -23.21728515625, -22.3681640625, -21.51904296875, -20.669921875, -19.82080078125, -18.9716796875, -18.12255859375, -17.2734375, -16.42431640625, -15.5751953125, -14.72607421875, -13.876953125, -13.02783203125, -12.1787109375, -11.32958984375, -10.48046875, -9.63134765625, -8.7822265625, -7.93310546875, -7.083984375, -6.23486328125, -5.3857421875, -4.53662109375, -3.6875, -2.83837890625, -1.9892578125, -1.14013671875, -0.291015625, 0.55810546875, 1.4072265625, 2.25634765625, 3.10546875, 3.95458984375, 4.8037109375, 5.65283203125, 6.501953125, 7.35107421875, 8.2001953125, 9.04931640625, 9.8984375, 10.74755859375, 11.5966796875, 12.44580078125, 13.294921875, 14.14404296875, 14.9931640625, 15.84228515625, 16.69140625, 17.54052734375, 18.3896484375, 19.23876953125, 20.087890625, 20.93701171875, 21.7861328125, 22.63525390625, 23.484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 4.0, 4.0, 3.0, 11.0, 15.0, 12.0, 31.0, 57.0, 68.0, 122.0, 234.0, 541.0, 1401.0, 6667.0, 119121.0, 873957.0, 40647.0, 3786.0, 995.0, 415.0, 185.0, 92.0, 66.0, 52.0, 25.0, 12.0, 11.0, 6.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.171875, -22.6114501953125, -22.051025390625, -21.4906005859375, -20.93017578125, -20.3697509765625, -19.809326171875, -19.2489013671875, -18.6884765625, -18.1280517578125, -17.567626953125, -17.0072021484375, -16.44677734375, -15.8863525390625, -15.325927734375, -14.7655029296875, -14.205078125, -13.6446533203125, -13.084228515625, -12.5238037109375, -11.96337890625, -11.4029541015625, -10.842529296875, -10.2821044921875, -9.7216796875, -9.1612548828125, -8.600830078125, -8.0404052734375, -7.47998046875, -6.9195556640625, -6.359130859375, -5.7987060546875, -5.23828125, -4.6778564453125, -4.117431640625, -3.5570068359375, -2.99658203125, -2.4361572265625, -1.875732421875, -1.3153076171875, -0.7548828125, -0.1944580078125, 0.365966796875, 0.9263916015625, 1.48681640625, 2.0472412109375, 2.607666015625, 3.1680908203125, 3.728515625, 4.2889404296875, 4.849365234375, 5.4097900390625, 5.97021484375, 6.5306396484375, 7.091064453125, 7.6514892578125, 8.2119140625, 8.7723388671875, 9.332763671875, 9.8931884765625, 10.45361328125, 11.0140380859375, 11.574462890625, 12.1348876953125, 12.6953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 5.0, 5.0, 14.0, 12.0, 19.0, 22.0, 20.0, 39.0, 30.0, 39.0, 73.0, 90.0, 113.0, 87.0, 92.0, 79.0, 56.0, 41.0, 25.0, 31.0, 23.0, 19.0, 17.0, 12.0, 7.0, 8.0, 2.0, 7.0, 7.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014171600341796875, -0.0013687461614608765, -0.0013203322887420654, -0.0012719184160232544, -0.0012235045433044434, -0.0011750906705856323, -0.0011266767978668213, -0.0010782629251480103, -0.0010298490524291992, -0.0009814351797103882, -0.0009330213069915771, -0.0008846074342727661, -0.0008361935615539551, -0.000787779688835144, -0.000739365816116333, -0.000690951943397522, -0.0006425380706787109, -0.0005941241979598999, -0.0005457103252410889, -0.0004972964525222778, -0.0004488825798034668, -0.00040046870708465576, -0.0003520548343658447, -0.0003036409616470337, -0.00025522708892822266, -0.00020681321620941162, -0.00015839934349060059, -0.00010998547077178955, -6.157159805297852e-05, -1.315772533416748e-05, 3.5256147384643555e-05, 8.367002010345459e-05, 0.00013208389282226562, 0.00018049776554107666, 0.0002289116382598877, 0.00027732551097869873, 0.00032573938369750977, 0.0003741532564163208, 0.00042256712913513184, 0.00047098100185394287, 0.0005193948745727539, 0.0005678087472915649, 0.000616222620010376, 0.000664636492729187, 0.000713050365447998, 0.0007614642381668091, 0.0008098781108856201, 0.0008582919836044312, 0.0009067058563232422, 0.0009551197290420532, 0.0010035336017608643, 0.0010519474744796753, 0.0011003613471984863, 0.0011487752199172974, 0.0011971890926361084, 0.0012456029653549194, 0.0012940168380737305, 0.0013424307107925415, 0.0013908445835113525, 0.0014392584562301636, 0.0014876723289489746, 0.0015360862016677856, 0.0015845000743865967, 0.0016329139471054077, 0.0016813278198242188]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 8.0, 7.0, 18.0, 24.0, 33.0, 62.0, 112.0, 231.0, 434.0, 1127.0, 3291.0, 17682.0, 278770.0, 699393.0, 39126.0, 5405.0, 1634.0, 617.0, 256.0, 128.0, 90.0, 43.0, 20.0, 13.0, 8.0, 10.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.265625, -13.776611328125, -13.28759765625, -12.798583984375, -12.3095703125, -11.820556640625, -11.33154296875, -10.842529296875, -10.353515625, -9.864501953125, -9.37548828125, -8.886474609375, -8.3974609375, -7.908447265625, -7.41943359375, -6.930419921875, -6.44140625, -5.952392578125, -5.46337890625, -4.974365234375, -4.4853515625, -3.996337890625, -3.50732421875, -3.018310546875, -2.529296875, -2.040283203125, -1.55126953125, -1.062255859375, -0.5732421875, -0.084228515625, 0.40478515625, 0.893798828125, 1.3828125, 1.871826171875, 2.36083984375, 2.849853515625, 3.3388671875, 3.827880859375, 4.31689453125, 4.805908203125, 5.294921875, 5.783935546875, 6.27294921875, 6.761962890625, 7.2509765625, 7.739990234375, 8.22900390625, 8.718017578125, 9.20703125, 9.696044921875, 10.18505859375, 10.674072265625, 11.1630859375, 11.652099609375, 12.14111328125, 12.630126953125, 13.119140625, 13.608154296875, 14.09716796875, 14.586181640625, 15.0751953125, 15.564208984375, 16.05322265625, 16.542236328125, 17.03125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 5.0, 8.0, 14.0, 12.0, 20.0, 34.0, 25.0, 40.0, 64.0, 80.0, 91.0, 110.0, 104.0, 82.0, 83.0, 60.0, 49.0, 31.0, 21.0, 19.0, 18.0, 5.0, 8.0, 6.0, 2.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5078125, -13.1597900390625, -12.811767578125, -12.4637451171875, -12.11572265625, -11.7677001953125, -11.419677734375, -11.0716552734375, -10.7236328125, -10.3756103515625, -10.027587890625, -9.6795654296875, -9.33154296875, -8.9835205078125, -8.635498046875, -8.2874755859375, -7.939453125, -7.5914306640625, -7.243408203125, -6.8953857421875, -6.54736328125, -6.1993408203125, -5.851318359375, -5.5032958984375, -5.1552734375, -4.8072509765625, -4.459228515625, -4.1112060546875, -3.76318359375, -3.4151611328125, -3.067138671875, -2.7191162109375, -2.37109375, -2.0230712890625, -1.675048828125, -1.3270263671875, -0.97900390625, -0.6309814453125, -0.282958984375, 0.0650634765625, 0.4130859375, 0.7611083984375, 1.109130859375, 1.4571533203125, 1.80517578125, 2.1531982421875, 2.501220703125, 2.8492431640625, 3.197265625, 3.5452880859375, 3.893310546875, 4.2413330078125, 4.58935546875, 4.9373779296875, 5.285400390625, 5.6334228515625, 5.9814453125, 6.3294677734375, 6.677490234375, 7.0255126953125, 7.37353515625, 7.7215576171875, 8.069580078125, 8.4176025390625, 8.765625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 8.0, 9.0, 36.0, 62.0, 199.0, 273.0, 228.0, 127.0, 41.0, 14.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-301.7027587890625, -293.015380859375, -284.3280029296875, -275.640625, -266.9532470703125, -258.265869140625, -249.5784912109375, -240.89111328125, -232.2037353515625, -223.516357421875, -214.8289794921875, -206.1416015625, -197.4542236328125, -188.766845703125, -180.0794677734375, -171.39208984375, -162.7047119140625, -154.017333984375, -145.3299560546875, -136.642578125, -127.9552001953125, -119.267822265625, -110.5804443359375, -101.89306640625, -93.2056884765625, -84.518310546875, -75.8309326171875, -67.1435546875, -58.4561767578125, -49.768798828125, -41.0814208984375, -32.39404296875, -23.706634521484375, -15.019256591796875, -6.331878662109375, 2.355499267578125, 11.042877197265625, 19.730255126953125, 28.417633056640625, 37.105010986328125, 45.792388916015625, 54.479766845703125, 63.167144775390625, 71.85452270507812, 80.54190063476562, 89.22927856445312, 97.91665649414062, 106.60403442382812, 115.29141235351562, 123.97879028320312, 132.66616821289062, 141.35354614257812, 150.04092407226562, 158.72830200195312, 167.41567993164062, 176.10305786132812, 184.79043579101562, 193.47781372070312, 202.16519165039062, 210.85256958007812, 219.53994750976562, 228.22732543945312, 236.91470336914062, 245.60208129882812, 254.28945922851562]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 6.0, 3.0, 7.0, 13.0, 24.0, 21.0, 13.0, 18.0, 29.0, 38.0, 22.0, 32.0, 43.0, 49.0, 42.0, 50.0, 56.0, 64.0, 59.0, 49.0, 52.0, 38.0, 34.0, 47.0, 32.0, 19.0, 25.0, 19.0, 18.0, 14.0, 13.0, 8.0, 9.0, 8.0, 8.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.3512954711914, -123.29072570800781, -119.23015594482422, -115.16958618164062, -111.1090087890625, -107.04844665527344, -102.98786926269531, -98.92729949951172, -94.86672973632812, -90.80615997314453, -86.74559020996094, -82.68502044677734, -78.62445068359375, -74.56387329101562, -70.50330352783203, -66.44273376464844, -62.382164001464844, -58.32159423828125, -54.261024475097656, -50.2004508972168, -46.1398811340332, -42.07931137084961, -38.01873779296875, -33.958168029785156, -29.897598266601562, -25.83702850341797, -21.776456832885742, -17.715885162353516, -13.655315399169922, -9.594745635986328, -5.534173965454102, -1.473602294921875, 2.5869598388671875, 6.647530555725098, 10.708101272583008, 14.768671989440918, 18.829242706298828, 22.889812469482422, 26.95038414001465, 31.010955810546875, 35.07152557373047, 39.13209533691406, 43.192665100097656, 47.253238677978516, 51.31380844116211, 55.3743782043457, 59.43495178222656, 63.495521545410156, 67.55609130859375, 71.61666107177734, 75.67723083496094, 79.73780059814453, 83.79837036132812, 87.85894775390625, 91.91951751708984, 95.98008728027344, 100.04065704345703, 104.10122680664062, 108.16179656982422, 112.22236633300781, 116.28294372558594, 120.343505859375, 124.40408325195312, 128.46466064453125, 132.5252227783203]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 2.0, 13.0, 20.0, 30.0, 43.0, 48.0, 108.0, 144.0, 270.0, 482.0, 888.0, 2019.0, 5119.0, 17727.0, 156354.0, 3935763.0, 57589.0, 10910.0, 3543.0, 1482.0, 706.0, 410.0, 220.0, 124.0, 89.0, 56.0, 33.0, 20.0, 15.0, 10.0, 11.0, 12.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.5625, -23.88623046875, -23.2099609375, -22.53369140625, -21.857421875, -21.18115234375, -20.5048828125, -19.82861328125, -19.15234375, -18.47607421875, -17.7998046875, -17.12353515625, -16.447265625, -15.77099609375, -15.0947265625, -14.41845703125, -13.7421875, -13.06591796875, -12.3896484375, -11.71337890625, -11.037109375, -10.36083984375, -9.6845703125, -9.00830078125, -8.33203125, -7.65576171875, -6.9794921875, -6.30322265625, -5.626953125, -4.95068359375, -4.2744140625, -3.59814453125, -2.921875, -2.24560546875, -1.5693359375, -0.89306640625, -0.216796875, 0.45947265625, 1.1357421875, 1.81201171875, 2.48828125, 3.16455078125, 3.8408203125, 4.51708984375, 5.193359375, 5.86962890625, 6.5458984375, 7.22216796875, 7.8984375, 8.57470703125, 9.2509765625, 9.92724609375, 10.603515625, 11.27978515625, 11.9560546875, 12.63232421875, 13.30859375, 13.98486328125, 14.6611328125, 15.33740234375, 16.013671875, 16.68994140625, 17.3662109375, 18.04248046875, 18.71875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 7.0, 9.0, 5.0, 11.0, 15.0, 19.0, 16.0, 19.0, 24.0, 37.0, 30.0, 45.0, 36.0, 48.0, 60.0, 75.0, 60.0, 72.0, 52.0, 43.0, 48.0, 59.0, 32.0, 25.0, 27.0, 35.0, 24.0, 12.0, 12.0, 8.0, 5.0, 11.0, 7.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.27734375, -7.07220458984375, -6.8670654296875, -6.66192626953125, -6.456787109375, -6.25164794921875, -6.0465087890625, -5.84136962890625, -5.63623046875, -5.43109130859375, -5.2259521484375, -5.02081298828125, -4.815673828125, -4.61053466796875, -4.4053955078125, -4.20025634765625, -3.9951171875, -3.78997802734375, -3.5848388671875, -3.37969970703125, -3.174560546875, -2.96942138671875, -2.7642822265625, -2.55914306640625, -2.35400390625, -2.14886474609375, -1.9437255859375, -1.73858642578125, -1.533447265625, -1.32830810546875, -1.1231689453125, -0.91802978515625, -0.712890625, -0.50775146484375, -0.3026123046875, -0.09747314453125, 0.107666015625, 0.31280517578125, 0.5179443359375, 0.72308349609375, 0.92822265625, 1.13336181640625, 1.3385009765625, 1.54364013671875, 1.748779296875, 1.95391845703125, 2.1590576171875, 2.36419677734375, 2.5693359375, 2.77447509765625, 2.9796142578125, 3.18475341796875, 3.389892578125, 3.59503173828125, 3.8001708984375, 4.00531005859375, 4.21044921875, 4.41558837890625, 4.6207275390625, 4.82586669921875, 5.031005859375, 5.23614501953125, 5.4412841796875, 5.64642333984375, 5.8515625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 4.0, 9.0, 15.0, 19.0, 30.0, 42.0, 60.0, 80.0, 132.0, 188.0, 257.0, 476.0, 722.0, 1187.0, 2148.0, 4588.0, 11468.0, 41736.0, 662319.0, 3386632.0, 57131.0, 13983.0, 5201.0, 2445.0, 1282.0, 768.0, 451.0, 285.0, 180.0, 139.0, 109.0, 64.0, 39.0, 26.0, 19.0, 13.0, 11.0, 9.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.09375, -17.56298828125, -17.0322265625, -16.50146484375, -15.970703125, -15.43994140625, -14.9091796875, -14.37841796875, -13.84765625, -13.31689453125, -12.7861328125, -12.25537109375, -11.724609375, -11.19384765625, -10.6630859375, -10.13232421875, -9.6015625, -9.07080078125, -8.5400390625, -8.00927734375, -7.478515625, -6.94775390625, -6.4169921875, -5.88623046875, -5.35546875, -4.82470703125, -4.2939453125, -3.76318359375, -3.232421875, -2.70166015625, -2.1708984375, -1.64013671875, -1.109375, -0.57861328125, -0.0478515625, 0.48291015625, 1.013671875, 1.54443359375, 2.0751953125, 2.60595703125, 3.13671875, 3.66748046875, 4.1982421875, 4.72900390625, 5.259765625, 5.79052734375, 6.3212890625, 6.85205078125, 7.3828125, 7.91357421875, 8.4443359375, 8.97509765625, 9.505859375, 10.03662109375, 10.5673828125, 11.09814453125, 11.62890625, 12.15966796875, 12.6904296875, 13.22119140625, 13.751953125, 14.28271484375, 14.8134765625, 15.34423828125, 15.875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 5.0, 14.0, 9.0, 12.0, 20.0, 35.0, 58.0, 129.0, 312.0, 2594.0, 518.0, 160.0, 58.0, 43.0, 25.0, 20.0, 17.0, 9.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80859375, -7.576416015625, -7.34423828125, -7.112060546875, -6.8798828125, -6.647705078125, -6.41552734375, -6.183349609375, -5.951171875, -5.718994140625, -5.48681640625, -5.254638671875, -5.0224609375, -4.790283203125, -4.55810546875, -4.325927734375, -4.09375, -3.861572265625, -3.62939453125, -3.397216796875, -3.1650390625, -2.932861328125, -2.70068359375, -2.468505859375, -2.236328125, -2.004150390625, -1.77197265625, -1.539794921875, -1.3076171875, -1.075439453125, -0.84326171875, -0.611083984375, -0.37890625, -0.146728515625, 0.08544921875, 0.317626953125, 0.5498046875, 0.781982421875, 1.01416015625, 1.246337890625, 1.478515625, 1.710693359375, 1.94287109375, 2.175048828125, 2.4072265625, 2.639404296875, 2.87158203125, 3.103759765625, 3.3359375, 3.568115234375, 3.80029296875, 4.032470703125, 4.2646484375, 4.496826171875, 4.72900390625, 4.961181640625, 5.193359375, 5.425537109375, 5.65771484375, 5.889892578125, 6.1220703125, 6.354248046875, 6.58642578125, 6.818603515625, 7.05078125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 12.0, 31.0, 72.0, 193.0, 260.0, 197.0, 125.0, 59.0, 19.0, 13.0, 4.0, 1.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.33196258544922, -45.96194839477539, -43.59193420410156, -41.221920013427734, -38.851905822753906, -36.481895446777344, -34.111881256103516, -31.741867065429688, -29.37185287475586, -27.00183868408203, -24.631824493408203, -22.261812210083008, -19.89179801940918, -17.52178382873535, -15.15177059173584, -12.781757354736328, -10.4117431640625, -8.041728973388672, -5.67171573638916, -3.3017020225524902, -0.9316883087158203, 1.4383258819580078, 3.8083391189575195, 6.178352355957031, 8.54836654663086, 10.918380737304688, 13.2883939743042, 15.658407211303711, 18.02842140197754, 20.398435592651367, 22.768447875976562, 25.13846206665039, 27.508468627929688, 29.878482818603516, 32.248497009277344, 34.61851119995117, 36.988525390625, 39.35853576660156, 41.72854995727539, 44.09856414794922, 46.46857833862305, 48.838592529296875, 51.2086067199707, 53.57862091064453, 55.948631286621094, 58.31864929199219, 60.68865966796875, 63.05867385864258, 65.4286880493164, 67.79869842529297, 70.16871643066406, 72.53872680664062, 74.90874481201172, 77.27875518798828, 79.64877319335938, 82.01878356933594, 84.3887939453125, 86.75880432128906, 89.12882232666016, 91.49883270263672, 93.86885070800781, 96.23886108398438, 98.60887908935547, 100.97888946533203, 103.34890747070312]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 4.0, 5.0, 5.0, 6.0, 11.0, 10.0, 18.0, 22.0, 19.0, 20.0, 30.0, 38.0, 43.0, 43.0, 42.0, 46.0, 56.0, 55.0, 44.0, 54.0, 52.0, 48.0, 44.0, 43.0, 35.0, 48.0, 31.0, 28.0, 21.0, 15.0, 20.0, 14.0, 2.0, 11.0, 8.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.09188461303711, -18.37574005126953, -17.659595489501953, -16.943450927734375, -16.227306365966797, -15.511161804199219, -14.795016288757324, -14.078871726989746, -13.362727165222168, -12.64658260345459, -11.930438041687012, -11.214292526245117, -10.498147964477539, -9.782003402709961, -9.065858840942383, -8.349714279174805, -7.633569717407227, -6.917425155639648, -6.20128059387207, -5.485135555267334, -4.768990993499756, -4.052846431732178, -3.3367013931274414, -2.6205568313598633, -1.9044122695922852, -1.1882675886154175, -0.4721229076385498, 0.24402189254760742, 0.9601664543151855, 1.6763110160827637, 2.3924560546875, 3.108600616455078, 3.8247451782226562, 4.540889739990234, 5.2570343017578125, 5.973179340362549, 6.689323902130127, 7.405468463897705, 8.121613502502441, 8.83775806427002, 9.553902626037598, 10.270047187805176, 10.986191749572754, 11.702337265014648, 12.418481826782227, 13.134626388549805, 13.850770950317383, 14.566915512084961, 15.283060073852539, 15.999204635620117, 16.715349197387695, 17.431493759155273, 18.14763832092285, 18.86378288269043, 19.57992935180664, 20.29607391357422, 21.012218475341797, 21.728363037109375, 22.444507598876953, 23.16065216064453, 23.87679672241211, 24.592941284179688, 25.309085845947266, 26.025230407714844, 26.741374969482422]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 10.0, 7.0, 17.0, 26.0, 25.0, 70.0, 116.0, 176.0, 331.0, 535.0, 1029.0, 1967.0, 4409.0, 10151.0, 25252.0, 67966.0, 184712.0, 357084.0, 243136.0, 92905.0, 34179.0, 13356.0, 5745.0, 2523.0, 1290.0, 658.0, 367.0, 190.0, 114.0, 61.0, 52.0, 35.0, 23.0, 10.0, 12.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.3671875, -10.017578125, -9.66796875, -9.318359375, -8.96875, -8.619140625, -8.26953125, -7.919921875, -7.5703125, -7.220703125, -6.87109375, -6.521484375, -6.171875, -5.822265625, -5.47265625, -5.123046875, -4.7734375, -4.423828125, -4.07421875, -3.724609375, -3.375, -3.025390625, -2.67578125, -2.326171875, -1.9765625, -1.626953125, -1.27734375, -0.927734375, -0.578125, -0.228515625, 0.12109375, 0.470703125, 0.8203125, 1.169921875, 1.51953125, 1.869140625, 2.21875, 2.568359375, 2.91796875, 3.267578125, 3.6171875, 3.966796875, 4.31640625, 4.666015625, 5.015625, 5.365234375, 5.71484375, 6.064453125, 6.4140625, 6.763671875, 7.11328125, 7.462890625, 7.8125, 8.162109375, 8.51171875, 8.861328125, 9.2109375, 9.560546875, 9.91015625, 10.259765625, 10.609375, 10.958984375, 11.30859375, 11.658203125, 12.0078125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 0.0, 4.0, 6.0, 6.0, 4.0, 11.0, 10.0, 22.0, 6.0, 15.0, 17.0, 22.0, 37.0, 31.0, 43.0, 50.0, 58.0, 42.0, 58.0, 58.0, 54.0, 53.0, 60.0, 54.0, 46.0, 37.0, 24.0, 33.0, 24.0, 29.0, 22.0, 15.0, 10.0, 11.0, 10.0, 8.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.96484375, -6.760009765625, -6.55517578125, -6.350341796875, -6.1455078125, -5.940673828125, -5.73583984375, -5.531005859375, -5.326171875, -5.121337890625, -4.91650390625, -4.711669921875, -4.5068359375, -4.302001953125, -4.09716796875, -3.892333984375, -3.6875, -3.482666015625, -3.27783203125, -3.072998046875, -2.8681640625, -2.663330078125, -2.45849609375, -2.253662109375, -2.048828125, -1.843994140625, -1.63916015625, -1.434326171875, -1.2294921875, -1.024658203125, -0.81982421875, -0.614990234375, -0.41015625, -0.205322265625, -0.00048828125, 0.204345703125, 0.4091796875, 0.614013671875, 0.81884765625, 1.023681640625, 1.228515625, 1.433349609375, 1.63818359375, 1.843017578125, 2.0478515625, 2.252685546875, 2.45751953125, 2.662353515625, 2.8671875, 3.072021484375, 3.27685546875, 3.481689453125, 3.6865234375, 3.891357421875, 4.09619140625, 4.301025390625, 4.505859375, 4.710693359375, 4.91552734375, 5.120361328125, 5.3251953125, 5.530029296875, 5.73486328125, 5.939697265625, 6.14453125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 10.0, 12.0, 4.0, 19.0, 19.0, 25.0, 45.0, 55.0, 118.0, 183.0, 297.0, 561.0, 1365.0, 4655.0, 45907.0, 834003.0, 148664.0, 9006.0, 1931.0, 751.0, 342.0, 192.0, 126.0, 84.0, 44.0, 35.0, 22.0, 19.0, 12.0, 15.0, 5.0, 13.0, 2.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-38.3125, -37.238525390625, -36.16455078125, -35.090576171875, -34.0166015625, -32.942626953125, -31.86865234375, -30.794677734375, -29.720703125, -28.646728515625, -27.57275390625, -26.498779296875, -25.4248046875, -24.350830078125, -23.27685546875, -22.202880859375, -21.12890625, -20.054931640625, -18.98095703125, -17.906982421875, -16.8330078125, -15.759033203125, -14.68505859375, -13.611083984375, -12.537109375, -11.463134765625, -10.38916015625, -9.315185546875, -8.2412109375, -7.167236328125, -6.09326171875, -5.019287109375, -3.9453125, -2.871337890625, -1.79736328125, -0.723388671875, 0.3505859375, 1.424560546875, 2.49853515625, 3.572509765625, 4.646484375, 5.720458984375, 6.79443359375, 7.868408203125, 8.9423828125, 10.016357421875, 11.09033203125, 12.164306640625, 13.23828125, 14.312255859375, 15.38623046875, 16.460205078125, 17.5341796875, 18.608154296875, 19.68212890625, 20.756103515625, 21.830078125, 22.904052734375, 23.97802734375, 25.052001953125, 26.1259765625, 27.199951171875, 28.27392578125, 29.347900390625, 30.421875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 5.0, 3.0, 3.0, 6.0, 7.0, 8.0, 15.0, 15.0, 18.0, 13.0, 20.0, 19.0, 22.0, 43.0, 28.0, 31.0, 28.0, 48.0, 37.0, 33.0, 37.0, 53.0, 52.0, 48.0, 41.0, 35.0, 48.0, 40.0, 42.0, 20.0, 32.0, 21.0, 21.0, 15.0, 19.0, 20.0, 9.0, 9.0, 8.0, 4.0, 9.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-23.28125, -22.603515625, -21.92578125, -21.248046875, -20.5703125, -19.892578125, -19.21484375, -18.537109375, -17.859375, -17.181640625, -16.50390625, -15.826171875, -15.1484375, -14.470703125, -13.79296875, -13.115234375, -12.4375, -11.759765625, -11.08203125, -10.404296875, -9.7265625, -9.048828125, -8.37109375, -7.693359375, -7.015625, -6.337890625, -5.66015625, -4.982421875, -4.3046875, -3.626953125, -2.94921875, -2.271484375, -1.59375, -0.916015625, -0.23828125, 0.439453125, 1.1171875, 1.794921875, 2.47265625, 3.150390625, 3.828125, 4.505859375, 5.18359375, 5.861328125, 6.5390625, 7.216796875, 7.89453125, 8.572265625, 9.25, 9.927734375, 10.60546875, 11.283203125, 11.9609375, 12.638671875, 13.31640625, 13.994140625, 14.671875, 15.349609375, 16.02734375, 16.705078125, 17.3828125, 18.060546875, 18.73828125, 19.416015625, 20.09375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 10.0, 15.0, 17.0, 32.0, 38.0, 68.0, 84.0, 151.0, 256.0, 425.0, 882.0, 2161.0, 6475.0, 29529.0, 262538.0, 658604.0, 69607.0, 11583.0, 3385.0, 1263.0, 583.0, 319.0, 198.0, 116.0, 52.0, 54.0, 32.0, 19.0, 15.0, 9.0, 6.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7109375, -9.4185791015625, -9.126220703125, -8.8338623046875, -8.54150390625, -8.2491455078125, -7.956787109375, -7.6644287109375, -7.3720703125, -7.0797119140625, -6.787353515625, -6.4949951171875, -6.20263671875, -5.9102783203125, -5.617919921875, -5.3255615234375, -5.033203125, -4.7408447265625, -4.448486328125, -4.1561279296875, -3.86376953125, -3.5714111328125, -3.279052734375, -2.9866943359375, -2.6943359375, -2.4019775390625, -2.109619140625, -1.8172607421875, -1.52490234375, -1.2325439453125, -0.940185546875, -0.6478271484375, -0.35546875, -0.0631103515625, 0.229248046875, 0.5216064453125, 0.81396484375, 1.1063232421875, 1.398681640625, 1.6910400390625, 1.9833984375, 2.2757568359375, 2.568115234375, 2.8604736328125, 3.15283203125, 3.4451904296875, 3.737548828125, 4.0299072265625, 4.322265625, 4.6146240234375, 4.906982421875, 5.1993408203125, 5.49169921875, 5.7840576171875, 6.076416015625, 6.3687744140625, 6.6611328125, 6.9534912109375, 7.245849609375, 7.5382080078125, 7.83056640625, 8.1229248046875, 8.415283203125, 8.7076416015625, 9.0]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 5.0, 7.0, 4.0, 9.0, 8.0, 18.0, 22.0, 30.0, 42.0, 54.0, 61.0, 99.0, 135.0, 162.0, 72.0, 59.0, 49.0, 34.0, 32.0, 19.0, 15.0, 16.0, 15.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.002811431884765625, -0.0027356743812561035, -0.002659916877746582, -0.0025841593742370605, -0.002508401870727539, -0.0024326443672180176, -0.002356886863708496, -0.0022811293601989746, -0.002205371856689453, -0.0021296143531799316, -0.00205385684967041, -0.0019780993461608887, -0.0019023418426513672, -0.0018265843391418457, -0.0017508268356323242, -0.0016750693321228027, -0.0015993118286132812, -0.0015235543251037598, -0.0014477968215942383, -0.0013720393180847168, -0.0012962818145751953, -0.0012205243110656738, -0.0011447668075561523, -0.0010690093040466309, -0.0009932518005371094, -0.0009174942970275879, -0.0008417367935180664, -0.0007659792900085449, -0.0006902217864990234, -0.000614464282989502, -0.0005387067794799805, -0.000462949275970459, -0.0003871917724609375, -0.000311434268951416, -0.00023567676544189453, -0.00015991926193237305, -8.416175842285156e-05, -8.404254913330078e-06, 6.73532485961914e-05, 0.0001431107521057129, 0.00021886825561523438, 0.00029462575912475586, 0.00037038326263427734, 0.00044614076614379883, 0.0005218982696533203, 0.0005976557731628418, 0.0006734132766723633, 0.0007491707801818848, 0.0008249282836914062, 0.0009006857872009277, 0.0009764432907104492, 0.0010522007942199707, 0.0011279582977294922, 0.0012037158012390137, 0.0012794733047485352, 0.0013552308082580566, 0.0014309883117675781, 0.0015067458152770996, 0.001582503318786621, 0.0016582608222961426, 0.001734018325805664, 0.0018097758293151855, 0.001885533332824707, 0.0019612908363342285, 0.00203704833984375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 7.0, 12.0, 34.0, 36.0, 54.0, 58.0, 125.0, 244.0, 392.0, 980.0, 2605.0, 10110.0, 75216.0, 751212.0, 182943.0, 18088.0, 3859.0, 1316.0, 537.0, 275.0, 157.0, 108.0, 58.0, 45.0, 28.0, 14.0, 13.0, 8.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.09375, -14.7132568359375, -14.332763671875, -13.9522705078125, -13.57177734375, -13.1912841796875, -12.810791015625, -12.4302978515625, -12.0498046875, -11.6693115234375, -11.288818359375, -10.9083251953125, -10.52783203125, -10.1473388671875, -9.766845703125, -9.3863525390625, -9.005859375, -8.6253662109375, -8.244873046875, -7.8643798828125, -7.48388671875, -7.1033935546875, -6.722900390625, -6.3424072265625, -5.9619140625, -5.5814208984375, -5.200927734375, -4.8204345703125, -4.43994140625, -4.0594482421875, -3.678955078125, -3.2984619140625, -2.91796875, -2.5374755859375, -2.156982421875, -1.7764892578125, -1.39599609375, -1.0155029296875, -0.635009765625, -0.2545166015625, 0.1259765625, 0.5064697265625, 0.886962890625, 1.2674560546875, 1.64794921875, 2.0284423828125, 2.408935546875, 2.7894287109375, 3.169921875, 3.5504150390625, 3.930908203125, 4.3114013671875, 4.69189453125, 5.0723876953125, 5.452880859375, 5.8333740234375, 6.2138671875, 6.5943603515625, 6.974853515625, 7.3553466796875, 7.73583984375, 8.1163330078125, 8.496826171875, 8.8773193359375, 9.2578125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 4.0, 7.0, 10.0, 9.0, 10.0, 22.0, 26.0, 26.0, 36.0, 45.0, 58.0, 82.0, 71.0, 71.0, 79.0, 87.0, 68.0, 52.0, 52.0, 37.0, 30.0, 32.0, 11.0, 15.0, 12.0, 10.0, 9.0, 5.0, 4.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.546875, -7.31866455078125, -7.0904541015625, -6.86224365234375, -6.634033203125, -6.40582275390625, -6.1776123046875, -5.94940185546875, -5.72119140625, -5.49298095703125, -5.2647705078125, -5.03656005859375, -4.808349609375, -4.58013916015625, -4.3519287109375, -4.12371826171875, -3.8955078125, -3.66729736328125, -3.4390869140625, -3.21087646484375, -2.982666015625, -2.75445556640625, -2.5262451171875, -2.29803466796875, -2.06982421875, -1.84161376953125, -1.6134033203125, -1.38519287109375, -1.156982421875, -0.92877197265625, -0.7005615234375, -0.47235107421875, -0.244140625, -0.01593017578125, 0.2122802734375, 0.44049072265625, 0.668701171875, 0.89691162109375, 1.1251220703125, 1.35333251953125, 1.58154296875, 1.80975341796875, 2.0379638671875, 2.26617431640625, 2.494384765625, 2.72259521484375, 2.9508056640625, 3.17901611328125, 3.4072265625, 3.63543701171875, 3.8636474609375, 4.09185791015625, 4.320068359375, 4.54827880859375, 4.7764892578125, 5.00469970703125, 5.23291015625, 5.46112060546875, 5.6893310546875, 5.91754150390625, 6.145751953125, 6.37396240234375, 6.6021728515625, 6.83038330078125, 7.05859375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 6.0, 10.0, 27.0, 79.0, 187.0, 236.0, 226.0, 130.0, 56.0, 18.0, 11.0, 4.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-213.1764678955078, -205.19822692871094, -197.22000122070312, -189.24176025390625, -181.26351928710938, -173.2852783203125, -165.3070526123047, -157.3288116455078, -149.3505859375, -141.37234497070312, -133.3941192626953, -125.41587829589844, -117.43763732910156, -109.45940399169922, -101.48117065429688, -93.5029296875, -85.52468872070312, -77.54645538330078, -69.5682144165039, -61.58998107910156, -53.61174392700195, -45.633506774902344, -37.6552734375, -29.67703628540039, -21.69879913330078, -13.720562934875488, -5.742326736450195, 2.2359085083007812, 10.21414566040039, 18.1923828125, 26.170616149902344, 34.14885330200195, 42.1270751953125, 50.10531234741211, 58.08354949951172, 66.06178283691406, 74.04002380371094, 82.01825714111328, 89.99649047851562, 97.9747314453125, 105.95296478271484, 113.93119812011719, 121.90943908691406, 129.88766479492188, 137.86590576171875, 145.84414672851562, 153.8223876953125, 161.8006134033203, 169.7788543701172, 177.75709533691406, 185.73532104492188, 193.71356201171875, 201.69180297851562, 209.6700439453125, 217.6482696533203, 225.6265106201172, 233.604736328125, 241.58297729492188, 249.5612030029297, 257.5394287109375, 265.5176696777344, 273.49591064453125, 281.4741516113281, 289.452392578125, 297.4306335449219]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 3.0, 8.0, 13.0, 9.0, 12.0, 15.0, 9.0, 25.0, 14.0, 26.0, 29.0, 39.0, 36.0, 31.0, 38.0, 33.0, 50.0, 42.0, 51.0, 50.0, 45.0, 42.0, 55.0, 32.0, 46.0, 35.0, 29.0, 28.0, 19.0, 24.0, 27.0, 15.0, 9.0, 14.0, 16.0, 5.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.564453125, -96.45973205566406, -93.35501098632812, -90.25028991699219, -87.14556884765625, -84.04084777832031, -80.93612670898438, -77.83140563964844, -74.7266845703125, -71.62196350097656, -68.51724243164062, -65.41252136230469, -62.30780029296875, -59.20307922363281, -56.09835433959961, -52.99363327026367, -49.88890838623047, -46.78418731689453, -43.679466247558594, -40.574745178222656, -37.47002410888672, -34.36530303955078, -31.260578155517578, -28.15585708618164, -25.051136016845703, -21.946414947509766, -18.841693878173828, -15.736970901489258, -12.63224983215332, -9.527528762817383, -6.4228057861328125, -3.318084716796875, -0.21337127685546875, 2.891350269317627, 5.996071815490723, 9.100793838500977, 12.205514907836914, 15.310235977172852, 18.414958953857422, 21.51968002319336, 24.624401092529297, 27.729122161865234, 30.833843231201172, 33.938568115234375, 37.04328918457031, 40.14801025390625, 43.25273132324219, 46.357452392578125, 49.46217346191406, 52.56689453125, 55.67161560058594, 58.776336669921875, 61.88105773925781, 64.98577880859375, 68.09049987792969, 71.19522094726562, 74.29994201660156, 77.4046630859375, 80.50938415527344, 83.61410522460938, 86.71882629394531, 89.82354736328125, 92.92826843261719, 96.03298950195312, 99.1377182006836]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 6.0, 4.0, 5.0, 8.0, 6.0, 14.0, 25.0, 32.0, 41.0, 76.0, 145.0, 263.0, 470.0, 922.0, 1879.0, 4429.0, 11849.0, 41558.0, 323744.0, 3332786.0, 406817.0, 46950.0, 13188.0, 4865.0, 2031.0, 962.0, 528.0, 285.0, 156.0, 92.0, 58.0, 31.0, 14.0, 16.0, 9.0, 5.0, 6.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.03125, -14.619873046875, -14.20849609375, -13.797119140625, -13.3857421875, -12.974365234375, -12.56298828125, -12.151611328125, -11.740234375, -11.328857421875, -10.91748046875, -10.506103515625, -10.0947265625, -9.683349609375, -9.27197265625, -8.860595703125, -8.44921875, -8.037841796875, -7.62646484375, -7.215087890625, -6.8037109375, -6.392333984375, -5.98095703125, -5.569580078125, -5.158203125, -4.746826171875, -4.33544921875, -3.924072265625, -3.5126953125, -3.101318359375, -2.68994140625, -2.278564453125, -1.8671875, -1.455810546875, -1.04443359375, -0.633056640625, -0.2216796875, 0.189697265625, 0.60107421875, 1.012451171875, 1.423828125, 1.835205078125, 2.24658203125, 2.657958984375, 3.0693359375, 3.480712890625, 3.89208984375, 4.303466796875, 4.71484375, 5.126220703125, 5.53759765625, 5.948974609375, 6.3603515625, 6.771728515625, 7.18310546875, 7.594482421875, 8.005859375, 8.417236328125, 8.82861328125, 9.239990234375, 9.6513671875, 10.062744140625, 10.47412109375, 10.885498046875, 11.296875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 10.0, 5.0, 10.0, 11.0, 18.0, 16.0, 14.0, 22.0, 27.0, 41.0, 45.0, 47.0, 60.0, 59.0, 48.0, 54.0, 57.0, 52.0, 58.0, 51.0, 47.0, 50.0, 37.0, 30.0, 31.0, 19.0, 23.0, 14.0, 13.0, 10.0, 6.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.234375, -6.0400390625, -5.845703125, -5.6513671875, -5.45703125, -5.2626953125, -5.068359375, -4.8740234375, -4.6796875, -4.4853515625, -4.291015625, -4.0966796875, -3.90234375, -3.7080078125, -3.513671875, -3.3193359375, -3.125, -2.9306640625, -2.736328125, -2.5419921875, -2.34765625, -2.1533203125, -1.958984375, -1.7646484375, -1.5703125, -1.3759765625, -1.181640625, -0.9873046875, -0.79296875, -0.5986328125, -0.404296875, -0.2099609375, -0.015625, 0.1787109375, 0.373046875, 0.5673828125, 0.76171875, 0.9560546875, 1.150390625, 1.3447265625, 1.5390625, 1.7333984375, 1.927734375, 2.1220703125, 2.31640625, 2.5107421875, 2.705078125, 2.8994140625, 3.09375, 3.2880859375, 3.482421875, 3.6767578125, 3.87109375, 4.0654296875, 4.259765625, 4.4541015625, 4.6484375, 4.8427734375, 5.037109375, 5.2314453125, 5.42578125, 5.6201171875, 5.814453125, 6.0087890625, 6.203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 7.0, 5.0, 1.0, 6.0, 9.0, 9.0, 8.0, 16.0, 17.0, 30.0, 43.0, 63.0, 133.0, 251.0, 513.0, 1282.0, 3896.0, 14903.0, 96726.0, 3548930.0, 482343.0, 33976.0, 7449.0, 2177.0, 750.0, 298.0, 175.0, 83.0, 55.0, 41.0, 18.0, 17.0, 14.0, 12.0, 5.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-24.171875, -23.45556640625, -22.7392578125, -22.02294921875, -21.306640625, -20.59033203125, -19.8740234375, -19.15771484375, -18.44140625, -17.72509765625, -17.0087890625, -16.29248046875, -15.576171875, -14.85986328125, -14.1435546875, -13.42724609375, -12.7109375, -11.99462890625, -11.2783203125, -10.56201171875, -9.845703125, -9.12939453125, -8.4130859375, -7.69677734375, -6.98046875, -6.26416015625, -5.5478515625, -4.83154296875, -4.115234375, -3.39892578125, -2.6826171875, -1.96630859375, -1.25, -0.53369140625, 0.1826171875, 0.89892578125, 1.615234375, 2.33154296875, 3.0478515625, 3.76416015625, 4.48046875, 5.19677734375, 5.9130859375, 6.62939453125, 7.345703125, 8.06201171875, 8.7783203125, 9.49462890625, 10.2109375, 10.92724609375, 11.6435546875, 12.35986328125, 13.076171875, 13.79248046875, 14.5087890625, 15.22509765625, 15.94140625, 16.65771484375, 17.3740234375, 18.09033203125, 18.806640625, 19.52294921875, 20.2392578125, 20.95556640625, 21.671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 5.0, 3.0, 10.0, 8.0, 9.0, 5.0, 19.0, 15.0, 24.0, 39.0, 49.0, 60.0, 124.0, 252.0, 485.0, 905.0, 879.0, 516.0, 244.0, 119.0, 94.0, 56.0, 38.0, 30.0, 21.0, 14.0, 9.0, 8.0, 11.0, 1.0, 4.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.328125, -11.83447265625, -11.3408203125, -10.84716796875, -10.353515625, -9.85986328125, -9.3662109375, -8.87255859375, -8.37890625, -7.88525390625, -7.3916015625, -6.89794921875, -6.404296875, -5.91064453125, -5.4169921875, -4.92333984375, -4.4296875, -3.93603515625, -3.4423828125, -2.94873046875, -2.455078125, -1.96142578125, -1.4677734375, -0.97412109375, -0.48046875, 0.01318359375, 0.5068359375, 1.00048828125, 1.494140625, 1.98779296875, 2.4814453125, 2.97509765625, 3.46875, 3.96240234375, 4.4560546875, 4.94970703125, 5.443359375, 5.93701171875, 6.4306640625, 6.92431640625, 7.41796875, 7.91162109375, 8.4052734375, 8.89892578125, 9.392578125, 9.88623046875, 10.3798828125, 10.87353515625, 11.3671875, 11.86083984375, 12.3544921875, 12.84814453125, 13.341796875, 13.83544921875, 14.3291015625, 14.82275390625, 15.31640625, 15.81005859375, 16.3037109375, 16.79736328125, 17.291015625, 17.78466796875, 18.2783203125, 18.77197265625, 19.265625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 9.0, 9.0, 34.0, 61.0, 113.0, 176.0, 196.0, 170.0, 93.0, 66.0, 26.0, 21.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-206.44546508789062, -200.82093811035156, -195.1964111328125, -189.57186889648438, -183.9473419189453, -178.32281494140625, -172.69827270507812, -167.07374572753906, -161.44921875, -155.82469177246094, -150.20016479492188, -144.57562255859375, -138.9510955810547, -133.32656860351562, -127.70203399658203, -122.07749938964844, -116.45297241210938, -110.82844543457031, -105.20391082763672, -99.57937622070312, -93.95484924316406, -88.330322265625, -82.7057876586914, -77.08125305175781, -71.45672607421875, -65.83219909667969, -60.207664489746094, -54.583133697509766, -48.95860290527344, -43.33407211303711, -37.70954132080078, -32.08501052856445, -26.460479736328125, -20.835948944091797, -15.211418151855469, -9.58688735961914, -3.9623565673828125, 1.6621742248535156, 7.286705017089844, 12.911235809326172, 18.5357666015625, 24.160297393798828, 29.784828186035156, 35.409358978271484, 41.03388977050781, 46.65842056274414, 52.28295135498047, 57.9074821472168, 63.532012939453125, 69.15653991699219, 74.78107452392578, 80.40560913085938, 86.03013610839844, 91.6546630859375, 97.2791976928711, 102.90373229980469, 108.52825927734375, 114.15278625488281, 119.7773208618164, 125.40185546875, 131.02638244628906, 136.65090942382812, 142.27545166015625, 147.8999786376953, 153.52450561523438]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 9.0, 11.0, 8.0, 22.0, 22.0, 17.0, 34.0, 32.0, 33.0, 45.0, 54.0, 43.0, 60.0, 53.0, 52.0, 63.0, 62.0, 56.0, 42.0, 48.0, 35.0, 43.0, 36.0, 25.0, 20.0, 14.0, 16.0, 11.0, 5.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.94668579101562, -70.21439361572266, -67.48210144042969, -64.74980926513672, -62.01751708984375, -59.28522491455078, -56.55292892456055, -53.82063674926758, -51.08834457397461, -48.35605239868164, -45.62376022338867, -42.89146423339844, -40.15917205810547, -37.4268798828125, -34.69458770751953, -31.962295532226562, -29.230003356933594, -26.497711181640625, -23.765419006347656, -21.033124923706055, -18.300832748413086, -15.568540573120117, -12.836246490478516, -10.103954315185547, -7.371662139892578, -4.639369487762451, -1.9070768356323242, 0.8252162933349609, 3.5575084686279297, 6.289800643920898, 9.0220947265625, 11.754386901855469, 14.486679077148438, 17.218971252441406, 19.951263427734375, 22.683557510375977, 25.415849685668945, 28.148141860961914, 30.880435943603516, 33.612728118896484, 36.34502029418945, 39.07731246948242, 41.80960464477539, 44.541900634765625, 47.274192810058594, 50.00648498535156, 52.73877716064453, 55.4710693359375, 58.20336151123047, 60.93565368652344, 63.667945861816406, 66.40023803710938, 69.13253021240234, 71.86482238769531, 74.59712219238281, 77.32940673828125, 80.06170654296875, 82.79399871826172, 85.52629089355469, 88.25858306884766, 90.99087524414062, 93.7231674194336, 96.45545959472656, 99.18775939941406, 101.9200439453125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 5.0, 7.0, 9.0, 8.0, 21.0, 30.0, 41.0, 59.0, 100.0, 157.0, 255.0, 409.0, 695.0, 1216.0, 2151.0, 4282.0, 8832.0, 19162.0, 42858.0, 102329.0, 244536.0, 330661.0, 166154.0, 68541.0, 29242.0, 13388.0, 6136.0, 3174.0, 1698.0, 962.0, 573.0, 323.0, 189.0, 120.0, 71.0, 54.0, 31.0, 23.0, 12.0, 9.0, 9.0, 6.0, 3.0, 7.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.234375, -8.9293212890625, -8.624267578125, -8.3192138671875, -8.01416015625, -7.7091064453125, -7.404052734375, -7.0989990234375, -6.7939453125, -6.4888916015625, -6.183837890625, -5.8787841796875, -5.57373046875, -5.2686767578125, -4.963623046875, -4.6585693359375, -4.353515625, -4.0484619140625, -3.743408203125, -3.4383544921875, -3.13330078125, -2.8282470703125, -2.523193359375, -2.2181396484375, -1.9130859375, -1.6080322265625, -1.302978515625, -0.9979248046875, -0.69287109375, -0.3878173828125, -0.082763671875, 0.2222900390625, 0.52734375, 0.8323974609375, 1.137451171875, 1.4425048828125, 1.74755859375, 2.0526123046875, 2.357666015625, 2.6627197265625, 2.9677734375, 3.2728271484375, 3.577880859375, 3.8829345703125, 4.18798828125, 4.4930419921875, 4.798095703125, 5.1031494140625, 5.408203125, 5.7132568359375, 6.018310546875, 6.3233642578125, 6.62841796875, 6.9334716796875, 7.238525390625, 7.5435791015625, 7.8486328125, 8.1536865234375, 8.458740234375, 8.7637939453125, 9.06884765625, 9.3739013671875, 9.678955078125, 9.9840087890625, 10.2890625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 4.0, 2.0, 1.0, 6.0, 4.0, 6.0, 11.0, 10.0, 16.0, 17.0, 26.0, 29.0, 22.0, 33.0, 33.0, 36.0, 46.0, 59.0, 55.0, 50.0, 58.0, 46.0, 51.0, 42.0, 46.0, 40.0, 37.0, 39.0, 29.0, 23.0, 20.0, 26.0, 14.0, 20.0, 10.0, 5.0, 10.0, 6.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.09765625, -4.9151611328125, -4.732666015625, -4.5501708984375, -4.36767578125, -4.1851806640625, -4.002685546875, -3.8201904296875, -3.6376953125, -3.4552001953125, -3.272705078125, -3.0902099609375, -2.90771484375, -2.7252197265625, -2.542724609375, -2.3602294921875, -2.177734375, -1.9952392578125, -1.812744140625, -1.6302490234375, -1.44775390625, -1.2652587890625, -1.082763671875, -0.9002685546875, -0.7177734375, -0.5352783203125, -0.352783203125, -0.1702880859375, 0.01220703125, 0.1947021484375, 0.377197265625, 0.5596923828125, 0.7421875, 0.9246826171875, 1.107177734375, 1.2896728515625, 1.47216796875, 1.6546630859375, 1.837158203125, 2.0196533203125, 2.2021484375, 2.3846435546875, 2.567138671875, 2.7496337890625, 2.93212890625, 3.1146240234375, 3.297119140625, 3.4796142578125, 3.662109375, 3.8446044921875, 4.027099609375, 4.2095947265625, 4.39208984375, 4.5745849609375, 4.757080078125, 4.9395751953125, 5.1220703125, 5.3045654296875, 5.487060546875, 5.6695556640625, 5.85205078125, 6.0345458984375, 6.217041015625, 6.3995361328125, 6.58203125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 9.0, 7.0, 12.0, 18.0, 25.0, 32.0, 68.0, 92.0, 148.0, 277.0, 515.0, 1322.0, 4650.0, 73431.0, 925864.0, 36399.0, 3535.0, 1045.0, 485.0, 243.0, 142.0, 78.0, 42.0, 34.0, 18.0, 16.0, 11.0, 8.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-52.03125, -50.60205078125, -49.1728515625, -47.74365234375, -46.314453125, -44.88525390625, -43.4560546875, -42.02685546875, -40.59765625, -39.16845703125, -37.7392578125, -36.31005859375, -34.880859375, -33.45166015625, -32.0224609375, -30.59326171875, -29.1640625, -27.73486328125, -26.3056640625, -24.87646484375, -23.447265625, -22.01806640625, -20.5888671875, -19.15966796875, -17.73046875, -16.30126953125, -14.8720703125, -13.44287109375, -12.013671875, -10.58447265625, -9.1552734375, -7.72607421875, -6.296875, -4.86767578125, -3.4384765625, -2.00927734375, -0.580078125, 0.84912109375, 2.2783203125, 3.70751953125, 5.13671875, 6.56591796875, 7.9951171875, 9.42431640625, 10.853515625, 12.28271484375, 13.7119140625, 15.14111328125, 16.5703125, 17.99951171875, 19.4287109375, 20.85791015625, 22.287109375, 23.71630859375, 25.1455078125, 26.57470703125, 28.00390625, 29.43310546875, 30.8623046875, 32.29150390625, 33.720703125, 35.14990234375, 36.5791015625, 38.00830078125, 39.4375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 4.0, 11.0, 5.0, 6.0, 8.0, 10.0, 19.0, 22.0, 19.0, 31.0, 33.0, 52.0, 40.0, 38.0, 55.0, 51.0, 64.0, 49.0, 47.0, 63.0, 45.0, 44.0, 43.0, 45.0, 33.0, 31.0, 29.0, 22.0, 14.0, 13.0, 16.0, 8.0, 7.0, 10.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-34.53125, -33.63330078125, -32.7353515625, -31.83740234375, -30.939453125, -30.04150390625, -29.1435546875, -28.24560546875, -27.34765625, -26.44970703125, -25.5517578125, -24.65380859375, -23.755859375, -22.85791015625, -21.9599609375, -21.06201171875, -20.1640625, -19.26611328125, -18.3681640625, -17.47021484375, -16.572265625, -15.67431640625, -14.7763671875, -13.87841796875, -12.98046875, -12.08251953125, -11.1845703125, -10.28662109375, -9.388671875, -8.49072265625, -7.5927734375, -6.69482421875, -5.796875, -4.89892578125, -4.0009765625, -3.10302734375, -2.205078125, -1.30712890625, -0.4091796875, 0.48876953125, 1.38671875, 2.28466796875, 3.1826171875, 4.08056640625, 4.978515625, 5.87646484375, 6.7744140625, 7.67236328125, 8.5703125, 9.46826171875, 10.3662109375, 11.26416015625, 12.162109375, 13.06005859375, 13.9580078125, 14.85595703125, 15.75390625, 16.65185546875, 17.5498046875, 18.44775390625, 19.345703125, 20.24365234375, 21.1416015625, 22.03955078125, 22.9375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 15.0, 18.0, 35.0, 56.0, 86.0, 141.0, 353.0, 965.0, 3620.0, 39267.0, 923369.0, 73647.0, 4979.0, 1106.0, 412.0, 206.0, 108.0, 57.0, 30.0, 19.0, 13.0, 12.0, 4.0, 3.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.765625, -23.097900390625, -22.43017578125, -21.762451171875, -21.0947265625, -20.427001953125, -19.75927734375, -19.091552734375, -18.423828125, -17.756103515625, -17.08837890625, -16.420654296875, -15.7529296875, -15.085205078125, -14.41748046875, -13.749755859375, -13.08203125, -12.414306640625, -11.74658203125, -11.078857421875, -10.4111328125, -9.743408203125, -9.07568359375, -8.407958984375, -7.740234375, -7.072509765625, -6.40478515625, -5.737060546875, -5.0693359375, -4.401611328125, -3.73388671875, -3.066162109375, -2.3984375, -1.730712890625, -1.06298828125, -0.395263671875, 0.2724609375, 0.940185546875, 1.60791015625, 2.275634765625, 2.943359375, 3.611083984375, 4.27880859375, 4.946533203125, 5.6142578125, 6.281982421875, 6.94970703125, 7.617431640625, 8.28515625, 8.952880859375, 9.62060546875, 10.288330078125, 10.9560546875, 11.623779296875, 12.29150390625, 12.959228515625, 13.626953125, 14.294677734375, 14.96240234375, 15.630126953125, 16.2978515625, 16.965576171875, 17.63330078125, 18.301025390625, 18.96875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 7.0, 15.0, 13.0, 18.0, 28.0, 30.0, 31.0, 62.0, 73.0, 163.0, 197.0, 124.0, 73.0, 36.0, 26.0, 29.0, 19.0, 12.0, 11.0, 9.0, 6.0, 4.0, 1.0, 9.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034656524658203125, -0.003367602825164795, -0.0032695531845092773, -0.0031715035438537598, -0.003073453903198242, -0.0029754042625427246, -0.002877354621887207, -0.0027793049812316895, -0.002681255340576172, -0.0025832056999206543, -0.0024851560592651367, -0.002387106418609619, -0.0022890567779541016, -0.002191007137298584, -0.0020929574966430664, -0.001994907855987549, -0.0018968582153320312, -0.0017988085746765137, -0.001700758934020996, -0.0016027092933654785, -0.001504659652709961, -0.0014066100120544434, -0.0013085603713989258, -0.0012105107307434082, -0.0011124610900878906, -0.001014411449432373, -0.0009163618087768555, -0.0008183121681213379, -0.0007202625274658203, -0.0006222128868103027, -0.0005241632461547852, -0.0004261136054992676, -0.00032806396484375, -0.00023001432418823242, -0.00013196468353271484, -3.3915042877197266e-05, 6.413459777832031e-05, 0.0001621842384338379, 0.00026023387908935547, 0.00035828351974487305, 0.0004563331604003906, 0.0005543828010559082, 0.0006524324417114258, 0.0007504820823669434, 0.0008485317230224609, 0.0009465813636779785, 0.001044631004333496, 0.0011426806449890137, 0.0012407302856445312, 0.0013387799263000488, 0.0014368295669555664, 0.001534879207611084, 0.0016329288482666016, 0.0017309784889221191, 0.0018290281295776367, 0.0019270777702331543, 0.002025127410888672, 0.0021231770515441895, 0.002221226692199707, 0.0023192763328552246, 0.002417325973510742, 0.0025153756141662598, 0.0026134252548217773, 0.002711474895477295, 0.0028095245361328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 5.0, 7.0, 8.0, 9.0, 24.0, 26.0, 42.0, 70.0, 117.0, 182.0, 340.0, 694.0, 1738.0, 5434.0, 28359.0, 575113.0, 403910.0, 24641.0, 4800.0, 1553.0, 676.0, 303.0, 189.0, 91.0, 54.0, 50.0, 34.0, 20.0, 18.0, 11.0, 12.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.15625, -17.60546875, -17.0546875, -16.50390625, -15.953125, -15.40234375, -14.8515625, -14.30078125, -13.75, -13.19921875, -12.6484375, -12.09765625, -11.546875, -10.99609375, -10.4453125, -9.89453125, -9.34375, -8.79296875, -8.2421875, -7.69140625, -7.140625, -6.58984375, -6.0390625, -5.48828125, -4.9375, -4.38671875, -3.8359375, -3.28515625, -2.734375, -2.18359375, -1.6328125, -1.08203125, -0.53125, 0.01953125, 0.5703125, 1.12109375, 1.671875, 2.22265625, 2.7734375, 3.32421875, 3.875, 4.42578125, 4.9765625, 5.52734375, 6.078125, 6.62890625, 7.1796875, 7.73046875, 8.28125, 8.83203125, 9.3828125, 9.93359375, 10.484375, 11.03515625, 11.5859375, 12.13671875, 12.6875, 13.23828125, 13.7890625, 14.33984375, 14.890625, 15.44140625, 15.9921875, 16.54296875, 17.09375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 5.0, 8.0, 18.0, 17.0, 16.0, 25.0, 22.0, 49.0, 72.0, 63.0, 122.0, 122.0, 112.0, 80.0, 81.0, 45.0, 36.0, 32.0, 14.0, 13.0, 4.0, 14.0, 9.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0703125, -11.6767578125, -11.283203125, -10.8896484375, -10.49609375, -10.1025390625, -9.708984375, -9.3154296875, -8.921875, -8.5283203125, -8.134765625, -7.7412109375, -7.34765625, -6.9541015625, -6.560546875, -6.1669921875, -5.7734375, -5.3798828125, -4.986328125, -4.5927734375, -4.19921875, -3.8056640625, -3.412109375, -3.0185546875, -2.625, -2.2314453125, -1.837890625, -1.4443359375, -1.05078125, -0.6572265625, -0.263671875, 0.1298828125, 0.5234375, 0.9169921875, 1.310546875, 1.7041015625, 2.09765625, 2.4912109375, 2.884765625, 3.2783203125, 3.671875, 4.0654296875, 4.458984375, 4.8525390625, 5.24609375, 5.6396484375, 6.033203125, 6.4267578125, 6.8203125, 7.2138671875, 7.607421875, 8.0009765625, 8.39453125, 8.7880859375, 9.181640625, 9.5751953125, 9.96875, 10.3623046875, 10.755859375, 11.1494140625, 11.54296875, 11.9365234375, 12.330078125, 12.7236328125, 13.1171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 9.0, 67.0, 203.0, 474.0, 185.0, 43.0, 13.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-606.1787109375, -592.8401489257812, -579.5016479492188, -566.1630859375, -552.8245849609375, -539.4860229492188, -526.1475219726562, -512.8089599609375, -499.4704284667969, -486.13189697265625, -472.7933654785156, -459.454833984375, -446.1163024902344, -432.77777099609375, -419.439208984375, -406.1006774902344, -392.76214599609375, -379.4236145019531, -366.0850830078125, -352.7465515136719, -339.40802001953125, -326.0694580078125, -312.73095703125, -299.39239501953125, -286.05389404296875, -272.7153625488281, -259.3768310546875, -246.03829956054688, -232.6997528076172, -219.36122131347656, -206.02268981933594, -192.68414306640625, -179.34559631347656, -166.00706481933594, -152.6685333251953, -139.32998657226562, -125.991455078125, -112.65292358398438, -99.31439208984375, -85.9758529663086, -72.63732147216797, -59.29878616333008, -45.96025085449219, -32.62171936035156, -19.283184051513672, -5.944648742675781, 7.393882751464844, 20.732421875, 34.070953369140625, 47.409488677978516, 60.748023986816406, 74.08655548095703, 87.42509460449219, 100.76362609863281, 114.10215759277344, 127.4406967163086, 140.77923583984375, 154.11776733398438, 167.456298828125, 180.79483032226562, 194.1333770751953, 207.47190856933594, 220.81044006347656, 234.14898681640625, 247.4875030517578]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 1.0, 9.0, 7.0, 10.0, 9.0, 10.0, 16.0, 15.0, 28.0, 30.0, 41.0, 39.0, 46.0, 43.0, 60.0, 51.0, 72.0, 54.0, 56.0, 64.0, 46.0, 56.0, 38.0, 39.0, 30.0, 36.0, 16.0, 17.0, 16.0, 13.0, 10.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-149.04537963867188, -145.2171173095703, -141.3888702392578, -137.56060791015625, -133.73236083984375, -129.9040985107422, -126.07583618164062, -122.2475814819336, -118.41932678222656, -114.59107208251953, -110.7628173828125, -106.93455505371094, -103.1063003540039, -99.27804565429688, -95.44978332519531, -91.62152862548828, -87.79327392578125, -83.96501922607422, -80.13676452636719, -76.30850219726562, -72.4802474975586, -68.65199279785156, -64.82373046875, -60.99547576904297, -57.16722106933594, -53.338966369628906, -49.51070785522461, -45.68244934082031, -41.85419464111328, -38.02593994140625, -34.19768142700195, -30.36942481994629, -26.541168212890625, -22.71291160583496, -18.884654998779297, -15.056398391723633, -11.228141784667969, -7.399885177612305, -3.5716285705566406, 0.25662803649902344, 4.0848846435546875, 7.913141250610352, 11.741397857666016, 15.56965446472168, 19.397911071777344, 23.226167678833008, 27.054424285888672, 30.882680892944336, 34.7109375, 38.53919219970703, 42.36745071411133, 46.195709228515625, 50.023963928222656, 53.85221862792969, 57.680477142333984, 61.50873565673828, 65.33699035644531, 69.16524505615234, 72.99349975585938, 76.82176208496094, 80.65001678466797, 84.478271484375, 88.30653381347656, 92.1347885131836, 95.96304321289062]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 5.0, 12.0, 19.0, 20.0, 34.0, 42.0, 69.0, 96.0, 160.0, 269.0, 933.0, 55139.0, 4132557.0, 3936.0, 406.0, 180.0, 118.0, 73.0, 57.0, 49.0, 22.0, 19.0, 13.0, 8.0, 7.0, 9.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-99.125, -96.462890625, -93.80078125, -91.138671875, -88.4765625, -85.814453125, -83.15234375, -80.490234375, -77.828125, -75.166015625, -72.50390625, -69.841796875, -67.1796875, -64.517578125, -61.85546875, -59.193359375, -56.53125, -53.869140625, -51.20703125, -48.544921875, -45.8828125, -43.220703125, -40.55859375, -37.896484375, -35.234375, -32.572265625, -29.91015625, -27.248046875, -24.5859375, -21.923828125, -19.26171875, -16.599609375, -13.9375, -11.275390625, -8.61328125, -5.951171875, -3.2890625, -0.626953125, 2.03515625, 4.697265625, 7.359375, 10.021484375, 12.68359375, 15.345703125, 18.0078125, 20.669921875, 23.33203125, 25.994140625, 28.65625, 31.318359375, 33.98046875, 36.642578125, 39.3046875, 41.966796875, 44.62890625, 47.291015625, 49.953125, 52.615234375, 55.27734375, 57.939453125, 60.6015625, 63.263671875, 65.92578125, 68.587890625, 71.25]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 8.0, 18.0, 11.0, 26.0, 36.0, 49.0, 53.0, 62.0, 67.0, 86.0, 96.0, 70.0, 77.0, 63.0, 72.0, 51.0, 31.0, 38.0, 24.0, 21.0, 17.0, 6.0, 10.0, 5.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.8125, -10.53607177734375, -10.2596435546875, -9.98321533203125, -9.706787109375, -9.43035888671875, -9.1539306640625, -8.87750244140625, -8.60107421875, -8.32464599609375, -8.0482177734375, -7.77178955078125, -7.495361328125, -7.21893310546875, -6.9425048828125, -6.66607666015625, -6.3896484375, -6.11322021484375, -5.8367919921875, -5.56036376953125, -5.283935546875, -5.00750732421875, -4.7310791015625, -4.45465087890625, -4.17822265625, -3.90179443359375, -3.6253662109375, -3.34893798828125, -3.072509765625, -2.79608154296875, -2.5196533203125, -2.24322509765625, -1.966796875, -1.69036865234375, -1.4139404296875, -1.13751220703125, -0.861083984375, -0.58465576171875, -0.3082275390625, -0.03179931640625, 0.24462890625, 0.52105712890625, 0.7974853515625, 1.07391357421875, 1.350341796875, 1.62677001953125, 1.9031982421875, 2.17962646484375, 2.4560546875, 2.73248291015625, 3.0089111328125, 3.28533935546875, 3.561767578125, 3.83819580078125, 4.1146240234375, 4.39105224609375, 4.66748046875, 4.94390869140625, 5.2203369140625, 5.49676513671875, 5.773193359375, 6.04962158203125, 6.3260498046875, 6.60247802734375, 6.87890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 11.0, 17.0, 19.0, 46.0, 61.0, 87.0, 135.0, 305.0, 533.0, 1097.0, 2654.0, 7076.0, 25620.0, 252955.0, 3653848.0, 216295.0, 23015.0, 6286.0, 2218.0, 926.0, 441.0, 205.0, 153.0, 85.0, 63.0, 38.0, 24.0, 15.0, 9.0, 11.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.8046875, -15.1590576171875, -14.513427734375, -13.8677978515625, -13.22216796875, -12.5765380859375, -11.930908203125, -11.2852783203125, -10.6396484375, -9.9940185546875, -9.348388671875, -8.7027587890625, -8.05712890625, -7.4114990234375, -6.765869140625, -6.1202392578125, -5.474609375, -4.8289794921875, -4.183349609375, -3.5377197265625, -2.89208984375, -2.2464599609375, -1.600830078125, -0.9552001953125, -0.3095703125, 0.3360595703125, 0.981689453125, 1.6273193359375, 2.27294921875, 2.9185791015625, 3.564208984375, 4.2098388671875, 4.85546875, 5.5010986328125, 6.146728515625, 6.7923583984375, 7.43798828125, 8.0836181640625, 8.729248046875, 9.3748779296875, 10.0205078125, 10.6661376953125, 11.311767578125, 11.9573974609375, 12.60302734375, 13.2486572265625, 13.894287109375, 14.5399169921875, 15.185546875, 15.8311767578125, 16.476806640625, 17.1224365234375, 17.76806640625, 18.4136962890625, 19.059326171875, 19.7049560546875, 20.3505859375, 20.9962158203125, 21.641845703125, 22.2874755859375, 22.93310546875, 23.5787353515625, 24.224365234375, 24.8699951171875, 25.515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 12.0, 16.0, 18.0, 43.0, 40.0, 96.0, 215.0, 472.0, 984.0, 1096.0, 592.0, 233.0, 105.0, 65.0, 22.0, 18.0, 5.0, 12.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.4375, -20.789794921875, -20.14208984375, -19.494384765625, -18.8466796875, -18.198974609375, -17.55126953125, -16.903564453125, -16.255859375, -15.608154296875, -14.96044921875, -14.312744140625, -13.6650390625, -13.017333984375, -12.36962890625, -11.721923828125, -11.07421875, -10.426513671875, -9.77880859375, -9.131103515625, -8.4833984375, -7.835693359375, -7.18798828125, -6.540283203125, -5.892578125, -5.244873046875, -4.59716796875, -3.949462890625, -3.3017578125, -2.654052734375, -2.00634765625, -1.358642578125, -0.7109375, -0.063232421875, 0.58447265625, 1.232177734375, 1.8798828125, 2.527587890625, 3.17529296875, 3.822998046875, 4.470703125, 5.118408203125, 5.76611328125, 6.413818359375, 7.0615234375, 7.709228515625, 8.35693359375, 9.004638671875, 9.65234375, 10.300048828125, 10.94775390625, 11.595458984375, 12.2431640625, 12.890869140625, 13.53857421875, 14.186279296875, 14.833984375, 15.481689453125, 16.12939453125, 16.777099609375, 17.4248046875, 18.072509765625, 18.72021484375, 19.367919921875, 20.015625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 12.0, 29.0, 85.0, 181.0, 249.0, 232.0, 116.0, 41.0, 23.0, 12.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.39412689208984, -113.67118835449219, -106.9482421875, -100.22530364990234, -93.50235748291016, -86.7794189453125, -80.05647277832031, -73.33353424072266, -66.610595703125, -59.88765335083008, -53.164710998535156, -46.4417724609375, -39.71882629394531, -32.995887756347656, -26.272945404052734, -19.550003051757812, -12.827056884765625, -6.104115009307861, 0.6188268661499023, 7.341768264770508, 14.06471061706543, 20.78765106201172, 27.51059341430664, 34.23353576660156, 40.956478118896484, 47.679420471191406, 54.40236282348633, 61.12530517578125, 67.8482437133789, 74.57118225097656, 81.29412841796875, 88.01707458496094, 94.74000549316406, 101.46294403076172, 108.1858901977539, 114.90882873535156, 121.63177490234375, 128.35470581054688, 135.07765197753906, 141.80059814453125, 148.52354431152344, 155.24649047851562, 161.96942138671875, 168.69236755371094, 175.41531372070312, 182.13824462890625, 188.86119079589844, 195.58413696289062, 202.30706787109375, 209.03001403808594, 215.75294494628906, 222.47589111328125, 229.19883728027344, 235.92178344726562, 242.64471435546875, 249.36766052246094, 256.0906066894531, 262.81353759765625, 269.5364990234375, 276.2594299316406, 282.98236083984375, 289.705322265625, 296.4282531738281, 303.15118408203125, 309.8741455078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 8.0, 9.0, 8.0, 12.0, 14.0, 15.0, 19.0, 23.0, 27.0, 32.0, 35.0, 49.0, 49.0, 48.0, 40.0, 51.0, 57.0, 44.0, 57.0, 49.0, 51.0, 33.0, 49.0, 38.0, 28.0, 26.0, 20.0, 21.0, 18.0, 6.0, 15.0, 13.0, 8.0, 6.0, 8.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-73.71693420410156, -71.59661102294922, -69.47628784179688, -67.35596466064453, -65.23564147949219, -63.115318298339844, -60.994991302490234, -58.87466812133789, -56.75434494018555, -54.6340217590332, -52.51369857788086, -50.393375396728516, -48.273048400878906, -46.15272521972656, -44.03240203857422, -41.912078857421875, -39.79175567626953, -37.67143249511719, -35.551109313964844, -33.4307861328125, -31.310461044311523, -29.19013786315918, -27.069812774658203, -24.94948959350586, -22.829166412353516, -20.708843231201172, -18.588520050048828, -16.46819496154785, -14.347871780395508, -12.227548599243164, -10.107224464416504, -7.986900329589844, -5.866569519042969, -3.746245861053467, -1.6259222030639648, 0.4944014549255371, 2.614725112915039, 4.735048294067383, 6.855372428894043, 8.975696563720703, 11.096019744873047, 13.21634292602539, 15.33666706085205, 17.45699119567871, 19.577314376831055, 21.6976375579834, 23.817962646484375, 25.93828582763672, 28.058609008789062, 30.178932189941406, 32.29925537109375, 34.419578552246094, 36.53990173339844, 38.66022491455078, 40.78055191040039, 42.900875091552734, 45.02119827270508, 47.14152145385742, 49.261844635009766, 51.38216781616211, 53.50249481201172, 55.62281799316406, 57.743141174316406, 59.86346435546875, 61.983787536621094]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 7.0, 9.0, 10.0, 26.0, 36.0, 64.0, 123.0, 204.0, 429.0, 863.0, 2072.0, 5443.0, 15316.0, 49287.0, 198369.0, 522963.0, 183569.0, 46229.0, 14687.0, 5151.0, 1898.0, 915.0, 400.0, 201.0, 119.0, 76.0, 30.0, 23.0, 18.0, 5.0, 9.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1796875, -13.6986083984375, -13.217529296875, -12.7364501953125, -12.25537109375, -11.7742919921875, -11.293212890625, -10.8121337890625, -10.3310546875, -9.8499755859375, -9.368896484375, -8.8878173828125, -8.40673828125, -7.9256591796875, -7.444580078125, -6.9635009765625, -6.482421875, -6.0013427734375, -5.520263671875, -5.0391845703125, -4.55810546875, -4.0770263671875, -3.595947265625, -3.1148681640625, -2.6337890625, -2.1527099609375, -1.671630859375, -1.1905517578125, -0.70947265625, -0.2283935546875, 0.252685546875, 0.7337646484375, 1.21484375, 1.6959228515625, 2.177001953125, 2.6580810546875, 3.13916015625, 3.6202392578125, 4.101318359375, 4.5823974609375, 5.0634765625, 5.5445556640625, 6.025634765625, 6.5067138671875, 6.98779296875, 7.4688720703125, 7.949951171875, 8.4310302734375, 8.912109375, 9.3931884765625, 9.874267578125, 10.3553466796875, 10.83642578125, 11.3175048828125, 11.798583984375, 12.2796630859375, 12.7607421875, 13.2418212890625, 13.722900390625, 14.2039794921875, 14.68505859375, 15.1661376953125, 15.647216796875, 16.1282958984375, 16.609375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 8.0, 5.0, 7.0, 6.0, 9.0, 15.0, 18.0, 23.0, 21.0, 17.0, 29.0, 35.0, 31.0, 41.0, 40.0, 46.0, 47.0, 48.0, 61.0, 43.0, 49.0, 46.0, 44.0, 40.0, 45.0, 45.0, 28.0, 28.0, 24.0, 16.0, 21.0, 16.0, 10.0, 6.0, 10.0, 5.0, 4.0, 9.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9140625, -5.72900390625, -5.5439453125, -5.35888671875, -5.173828125, -4.98876953125, -4.8037109375, -4.61865234375, -4.43359375, -4.24853515625, -4.0634765625, -3.87841796875, -3.693359375, -3.50830078125, -3.3232421875, -3.13818359375, -2.953125, -2.76806640625, -2.5830078125, -2.39794921875, -2.212890625, -2.02783203125, -1.8427734375, -1.65771484375, -1.47265625, -1.28759765625, -1.1025390625, -0.91748046875, -0.732421875, -0.54736328125, -0.3623046875, -0.17724609375, 0.0078125, 0.19287109375, 0.3779296875, 0.56298828125, 0.748046875, 0.93310546875, 1.1181640625, 1.30322265625, 1.48828125, 1.67333984375, 1.8583984375, 2.04345703125, 2.228515625, 2.41357421875, 2.5986328125, 2.78369140625, 2.96875, 3.15380859375, 3.3388671875, 3.52392578125, 3.708984375, 3.89404296875, 4.0791015625, 4.26416015625, 4.44921875, 4.63427734375, 4.8193359375, 5.00439453125, 5.189453125, 5.37451171875, 5.5595703125, 5.74462890625, 5.9296875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 5.0, 5.0, 15.0, 34.0, 49.0, 90.0, 145.0, 285.0, 713.0, 2082.0, 11139.0, 169772.0, 821350.0, 36270.0, 4475.0, 1240.0, 454.0, 186.0, 94.0, 65.0, 30.0, 18.0, 15.0, 9.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.53125, -33.26416015625, -31.9970703125, -30.72998046875, -29.462890625, -28.19580078125, -26.9287109375, -25.66162109375, -24.39453125, -23.12744140625, -21.8603515625, -20.59326171875, -19.326171875, -18.05908203125, -16.7919921875, -15.52490234375, -14.2578125, -12.99072265625, -11.7236328125, -10.45654296875, -9.189453125, -7.92236328125, -6.6552734375, -5.38818359375, -4.12109375, -2.85400390625, -1.5869140625, -0.31982421875, 0.947265625, 2.21435546875, 3.4814453125, 4.74853515625, 6.015625, 7.28271484375, 8.5498046875, 9.81689453125, 11.083984375, 12.35107421875, 13.6181640625, 14.88525390625, 16.15234375, 17.41943359375, 18.6865234375, 19.95361328125, 21.220703125, 22.48779296875, 23.7548828125, 25.02197265625, 26.2890625, 27.55615234375, 28.8232421875, 30.09033203125, 31.357421875, 32.62451171875, 33.8916015625, 35.15869140625, 36.42578125, 37.69287109375, 38.9599609375, 40.22705078125, 41.494140625, 42.76123046875, 44.0283203125, 45.29541015625, 46.5625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 5.0, 12.0, 13.0, 11.0, 26.0, 21.0, 22.0, 26.0, 35.0, 34.0, 46.0, 44.0, 50.0, 50.0, 53.0, 51.0, 49.0, 61.0, 48.0, 47.0, 37.0, 43.0, 25.0, 35.0, 30.0, 20.0, 15.0, 24.0, 16.0, 10.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-27.484375, -26.662841796875, -25.84130859375, -25.019775390625, -24.1982421875, -23.376708984375, -22.55517578125, -21.733642578125, -20.912109375, -20.090576171875, -19.26904296875, -18.447509765625, -17.6259765625, -16.804443359375, -15.98291015625, -15.161376953125, -14.33984375, -13.518310546875, -12.69677734375, -11.875244140625, -11.0537109375, -10.232177734375, -9.41064453125, -8.589111328125, -7.767578125, -6.946044921875, -6.12451171875, -5.302978515625, -4.4814453125, -3.659912109375, -2.83837890625, -2.016845703125, -1.1953125, -0.373779296875, 0.44775390625, 1.269287109375, 2.0908203125, 2.912353515625, 3.73388671875, 4.555419921875, 5.376953125, 6.198486328125, 7.02001953125, 7.841552734375, 8.6630859375, 9.484619140625, 10.30615234375, 11.127685546875, 11.94921875, 12.770751953125, 13.59228515625, 14.413818359375, 15.2353515625, 16.056884765625, 16.87841796875, 17.699951171875, 18.521484375, 19.343017578125, 20.16455078125, 20.986083984375, 21.8076171875, 22.629150390625, 23.45068359375, 24.272216796875, 25.09375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 9.0, 16.0, 22.0, 31.0, 40.0, 71.0, 133.0, 210.0, 623.0, 1929.0, 10416.0, 664264.0, 358883.0, 9002.0, 1756.0, 575.0, 242.0, 116.0, 69.0, 41.0, 27.0, 17.0, 13.0, 12.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.0625, -33.0595703125, -32.056640625, -31.0537109375, -30.05078125, -29.0478515625, -28.044921875, -27.0419921875, -26.0390625, -25.0361328125, -24.033203125, -23.0302734375, -22.02734375, -21.0244140625, -20.021484375, -19.0185546875, -18.015625, -17.0126953125, -16.009765625, -15.0068359375, -14.00390625, -13.0009765625, -11.998046875, -10.9951171875, -9.9921875, -8.9892578125, -7.986328125, -6.9833984375, -5.98046875, -4.9775390625, -3.974609375, -2.9716796875, -1.96875, -0.9658203125, 0.037109375, 1.0400390625, 2.04296875, 3.0458984375, 4.048828125, 5.0517578125, 6.0546875, 7.0576171875, 8.060546875, 9.0634765625, 10.06640625, 11.0693359375, 12.072265625, 13.0751953125, 14.078125, 15.0810546875, 16.083984375, 17.0869140625, 18.08984375, 19.0927734375, 20.095703125, 21.0986328125, 22.1015625, 23.1044921875, 24.107421875, 25.1103515625, 26.11328125, 27.1162109375, 28.119140625, 29.1220703125, 30.125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 7.0, 13.0, 19.0, 34.0, 55.0, 124.0, 323.0, 216.0, 104.0, 34.0, 23.0, 7.0, 14.0, 4.0, 3.0, 8.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0047760009765625, -0.004620969295501709, -0.004465937614440918, -0.004310905933380127, -0.004155874252319336, -0.004000842571258545, -0.003845810890197754, -0.003690779209136963, -0.003535747528076172, -0.003380715847015381, -0.00322568416595459, -0.003070652484893799, -0.002915620803833008, -0.002760589122772217, -0.0026055574417114258, -0.0024505257606506348, -0.0022954940795898438, -0.0021404623985290527, -0.0019854307174682617, -0.0018303990364074707, -0.0016753673553466797, -0.0015203356742858887, -0.0013653039932250977, -0.0012102723121643066, -0.0010552406311035156, -0.0009002089500427246, -0.0007451772689819336, -0.0005901455879211426, -0.00043511390686035156, -0.00028008222579956055, -0.00012505054473876953, 2.9981136322021484e-05, 0.0001850128173828125, 0.0003400444984436035, 0.0004950761795043945, 0.0006501078605651855, 0.0008051395416259766, 0.0009601712226867676, 0.0011152029037475586, 0.0012702345848083496, 0.0014252662658691406, 0.0015802979469299316, 0.0017353296279907227, 0.0018903613090515137, 0.0020453929901123047, 0.0022004246711730957, 0.0023554563522338867, 0.0025104880332946777, 0.0026655197143554688, 0.0028205513954162598, 0.0029755830764770508, 0.003130614757537842, 0.003285646438598633, 0.003440678119659424, 0.003595709800720215, 0.003750741481781006, 0.003905773162841797, 0.004060804843902588, 0.004215836524963379, 0.00437086820602417, 0.004525899887084961, 0.004680931568145752, 0.004835963249206543, 0.004990994930267334, 0.005146026611328125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 11.0, 8.0, 12.0, 18.0, 31.0, 36.0, 57.0, 120.0, 208.0, 514.0, 1557.0, 6959.0, 76768.0, 916889.0, 38425.0, 4785.0, 1238.0, 454.0, 199.0, 103.0, 54.0, 42.0, 24.0, 16.0, 9.0, 4.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.8125, -19.0322265625, -18.251953125, -17.4716796875, -16.69140625, -15.9111328125, -15.130859375, -14.3505859375, -13.5703125, -12.7900390625, -12.009765625, -11.2294921875, -10.44921875, -9.6689453125, -8.888671875, -8.1083984375, -7.328125, -6.5478515625, -5.767578125, -4.9873046875, -4.20703125, -3.4267578125, -2.646484375, -1.8662109375, -1.0859375, -0.3056640625, 0.474609375, 1.2548828125, 2.03515625, 2.8154296875, 3.595703125, 4.3759765625, 5.15625, 5.9365234375, 6.716796875, 7.4970703125, 8.27734375, 9.0576171875, 9.837890625, 10.6181640625, 11.3984375, 12.1787109375, 12.958984375, 13.7392578125, 14.51953125, 15.2998046875, 16.080078125, 16.8603515625, 17.640625, 18.4208984375, 19.201171875, 19.9814453125, 20.76171875, 21.5419921875, 22.322265625, 23.1025390625, 23.8828125, 24.6630859375, 25.443359375, 26.2236328125, 27.00390625, 27.7841796875, 28.564453125, 29.3447265625, 30.125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 7.0, 14.0, 17.0, 43.0, 64.0, 154.0, 262.0, 201.0, 96.0, 49.0, 32.0, 17.0, 18.0, 12.0, 4.0, 1.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.546875, -30.824462890625, -30.10205078125, -29.379638671875, -28.6572265625, -27.934814453125, -27.21240234375, -26.489990234375, -25.767578125, -25.045166015625, -24.32275390625, -23.600341796875, -22.8779296875, -22.155517578125, -21.43310546875, -20.710693359375, -19.98828125, -19.265869140625, -18.54345703125, -17.821044921875, -17.0986328125, -16.376220703125, -15.65380859375, -14.931396484375, -14.208984375, -13.486572265625, -12.76416015625, -12.041748046875, -11.3193359375, -10.596923828125, -9.87451171875, -9.152099609375, -8.4296875, -7.707275390625, -6.98486328125, -6.262451171875, -5.5400390625, -4.817626953125, -4.09521484375, -3.372802734375, -2.650390625, -1.927978515625, -1.20556640625, -0.483154296875, 0.2392578125, 0.961669921875, 1.68408203125, 2.406494140625, 3.12890625, 3.851318359375, 4.57373046875, 5.296142578125, 6.0185546875, 6.740966796875, 7.46337890625, 8.185791015625, 8.908203125, 9.630615234375, 10.35302734375, 11.075439453125, 11.7978515625, 12.520263671875, 13.24267578125, 13.965087890625, 14.6875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 13.0, 58.0, 364.0, 429.0, 95.0, 34.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-691.30908203125, -673.5811157226562, -655.8531494140625, -638.1251220703125, -620.3971557617188, -602.669189453125, -584.941162109375, -567.2131958007812, -549.4852294921875, -531.7572631835938, -514.029296875, -496.30126953125, -478.57330322265625, -460.8453369140625, -443.1173400878906, -425.38934326171875, -407.661376953125, -389.93341064453125, -372.2054138183594, -354.4774169921875, -336.74945068359375, -319.021484375, -301.2934875488281, -283.56549072265625, -265.8375244140625, -248.1095428466797, -230.38156127929688, -212.65357971191406, -194.92559814453125, -177.19761657714844, -159.46963500976562, -141.7416534423828, -124.01370239257812, -106.28572082519531, -88.5577392578125, -70.82975769042969, -53.101776123046875, -35.37379455566406, -17.64581298828125, 0.0821685791015625, 17.810150146484375, 35.53813171386719, 53.26611328125, 70.99409484863281, 88.72207641601562, 106.45005798339844, 124.17803955078125, 141.90602111816406, 159.63400268554688, 177.3619842529297, 195.0899658203125, 212.8179473876953, 230.54592895507812, 248.27391052246094, 266.00189208984375, 283.7298583984375, 301.4578552246094, 319.18585205078125, 336.913818359375, 354.64178466796875, 372.3697814941406, 390.0977783203125, 407.82574462890625, 425.5537109375, 443.2817077636719]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 6.0, 3.0, 7.0, 8.0, 11.0, 14.0, 20.0, 19.0, 20.0, 26.0, 34.0, 41.0, 46.0, 46.0, 53.0, 59.0, 89.0, 82.0, 70.0, 58.0, 53.0, 49.0, 48.0, 30.0, 17.0, 24.0, 16.0, 18.0, 13.0, 10.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-162.4191131591797, -157.65037536621094, -152.88165283203125, -148.1129150390625, -143.34417724609375, -138.575439453125, -133.8067169189453, -129.03797912597656, -124.26924896240234, -119.50051879882812, -114.73178100585938, -109.96305084228516, -105.19432067871094, -100.42558288574219, -95.65685272216797, -90.88812255859375, -86.119384765625, -81.35065460205078, -76.58191680908203, -71.81318664550781, -67.04444885253906, -62.275718688964844, -57.506988525390625, -52.73825454711914, -47.969520568847656, -43.20078659057617, -38.43205261230469, -33.66332244873047, -28.894588470458984, -24.1258544921875, -19.35712242126465, -14.588390350341797, -9.819671630859375, -5.050938606262207, -0.28220558166503906, 4.486527442932129, 9.255260467529297, 14.023994445800781, 18.792726516723633, 23.561458587646484, 28.33019256591797, 33.09892654418945, 37.86766052246094, 42.636390686035156, 47.40512466430664, 52.173858642578125, 56.942588806152344, 61.71132278442383, 66.48005676269531, 71.24878692626953, 76.01752471923828, 80.7862548828125, 85.55499267578125, 90.32372283935547, 95.09245300292969, 99.86119079589844, 104.62992095947266, 109.39865112304688, 114.16738891601562, 118.93611907958984, 123.70484924316406, 128.4735870361328, 133.24232482910156, 138.01104736328125, 142.77978515625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 2.0, 8.0, 6.0, 6.0, 11.0, 8.0, 14.0, 16.0, 29.0, 36.0, 50.0, 78.0, 104.0, 166.0, 257.0, 476.0, 951.0, 2016.0, 4909.0, 14659.0, 70174.0, 1424708.0, 2539906.0, 106425.0, 18575.0, 5924.0, 2452.0, 1032.0, 529.0, 266.0, 162.0, 98.0, 65.0, 42.0, 40.0, 13.0, 22.0, 7.0, 12.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-18.109375, -17.562255859375, -17.01513671875, -16.468017578125, -15.9208984375, -15.373779296875, -14.82666015625, -14.279541015625, -13.732421875, -13.185302734375, -12.63818359375, -12.091064453125, -11.5439453125, -10.996826171875, -10.44970703125, -9.902587890625, -9.35546875, -8.808349609375, -8.26123046875, -7.714111328125, -7.1669921875, -6.619873046875, -6.07275390625, -5.525634765625, -4.978515625, -4.431396484375, -3.88427734375, -3.337158203125, -2.7900390625, -2.242919921875, -1.69580078125, -1.148681640625, -0.6015625, -0.054443359375, 0.49267578125, 1.039794921875, 1.5869140625, 2.134033203125, 2.68115234375, 3.228271484375, 3.775390625, 4.322509765625, 4.86962890625, 5.416748046875, 5.9638671875, 6.510986328125, 7.05810546875, 7.605224609375, 8.15234375, 8.699462890625, 9.24658203125, 9.793701171875, 10.3408203125, 10.887939453125, 11.43505859375, 11.982177734375, 12.529296875, 13.076416015625, 13.62353515625, 14.170654296875, 14.7177734375, 15.264892578125, 15.81201171875, 16.359130859375, 16.90625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 2.0, 9.0, 14.0, 21.0, 26.0, 31.0, 36.0, 50.0, 63.0, 61.0, 89.0, 61.0, 58.0, 57.0, 71.0, 66.0, 50.0, 44.0, 44.0, 29.0, 25.0, 16.0, 20.0, 12.0, 15.0, 10.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28515625, -5.04229736328125, -4.7994384765625, -4.55657958984375, -4.313720703125, -4.07086181640625, -3.8280029296875, -3.58514404296875, -3.34228515625, -3.09942626953125, -2.8565673828125, -2.61370849609375, -2.370849609375, -2.12799072265625, -1.8851318359375, -1.64227294921875, -1.3994140625, -1.15655517578125, -0.9136962890625, -0.67083740234375, -0.427978515625, -0.18511962890625, 0.0577392578125, 0.30059814453125, 0.54345703125, 0.78631591796875, 1.0291748046875, 1.27203369140625, 1.514892578125, 1.75775146484375, 2.0006103515625, 2.24346923828125, 2.486328125, 2.72918701171875, 2.9720458984375, 3.21490478515625, 3.457763671875, 3.70062255859375, 3.9434814453125, 4.18634033203125, 4.42919921875, 4.67205810546875, 4.9149169921875, 5.15777587890625, 5.400634765625, 5.64349365234375, 5.8863525390625, 6.12921142578125, 6.3720703125, 6.61492919921875, 6.8577880859375, 7.10064697265625, 7.343505859375, 7.58636474609375, 7.8292236328125, 8.07208251953125, 8.31494140625, 8.55780029296875, 8.8006591796875, 9.04351806640625, 9.286376953125, 9.52923583984375, 9.7720947265625, 10.01495361328125, 10.2578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 16.0, 23.0, 30.0, 40.0, 72.0, 136.0, 256.0, 536.0, 1361.0, 4785.0, 26969.0, 475258.0, 3559770.0, 108897.0, 11974.0, 2616.0, 863.0, 350.0, 156.0, 68.0, 37.0, 22.0, 16.0, 11.0, 7.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.75, -28.906982421875, -28.06396484375, -27.220947265625, -26.3779296875, -25.534912109375, -24.69189453125, -23.848876953125, -23.005859375, -22.162841796875, -21.31982421875, -20.476806640625, -19.6337890625, -18.790771484375, -17.94775390625, -17.104736328125, -16.26171875, -15.418701171875, -14.57568359375, -13.732666015625, -12.8896484375, -12.046630859375, -11.20361328125, -10.360595703125, -9.517578125, -8.674560546875, -7.83154296875, -6.988525390625, -6.1455078125, -5.302490234375, -4.45947265625, -3.616455078125, -2.7734375, -1.930419921875, -1.08740234375, -0.244384765625, 0.5986328125, 1.441650390625, 2.28466796875, 3.127685546875, 3.970703125, 4.813720703125, 5.65673828125, 6.499755859375, 7.3427734375, 8.185791015625, 9.02880859375, 9.871826171875, 10.71484375, 11.557861328125, 12.40087890625, 13.243896484375, 14.0869140625, 14.929931640625, 15.77294921875, 16.615966796875, 17.458984375, 18.302001953125, 19.14501953125, 19.988037109375, 20.8310546875, 21.674072265625, 22.51708984375, 23.360107421875, 24.203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 7.0, 9.0, 10.0, 30.0, 32.0, 60.0, 102.0, 205.0, 372.0, 786.0, 1072.0, 658.0, 323.0, 169.0, 95.0, 50.0, 37.0, 17.0, 14.0, 7.0, 10.0, 2.0, 4.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.859375, -29.082763671875, -28.30615234375, -27.529541015625, -26.7529296875, -25.976318359375, -25.19970703125, -24.423095703125, -23.646484375, -22.869873046875, -22.09326171875, -21.316650390625, -20.5400390625, -19.763427734375, -18.98681640625, -18.210205078125, -17.43359375, -16.656982421875, -15.88037109375, -15.103759765625, -14.3271484375, -13.550537109375, -12.77392578125, -11.997314453125, -11.220703125, -10.444091796875, -9.66748046875, -8.890869140625, -8.1142578125, -7.337646484375, -6.56103515625, -5.784423828125, -5.0078125, -4.231201171875, -3.45458984375, -2.677978515625, -1.9013671875, -1.124755859375, -0.34814453125, 0.428466796875, 1.205078125, 1.981689453125, 2.75830078125, 3.534912109375, 4.3115234375, 5.088134765625, 5.86474609375, 6.641357421875, 7.41796875, 8.194580078125, 8.97119140625, 9.747802734375, 10.5244140625, 11.301025390625, 12.07763671875, 12.854248046875, 13.630859375, 14.407470703125, 15.18408203125, 15.960693359375, 16.7373046875, 17.513916015625, 18.29052734375, 19.067138671875, 19.84375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 17.0, 33.0, 115.0, 307.0, 314.0, 153.0, 30.0, 19.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-532.1575317382812, -520.6707763671875, -509.18402099609375, -497.697265625, -486.21051025390625, -474.7237548828125, -463.23699951171875, -451.7502136230469, -440.2634582519531, -428.7767028808594, -417.2899475097656, -405.8031921386719, -394.3164367675781, -382.82965087890625, -371.3428955078125, -359.85614013671875, -348.369384765625, -336.88262939453125, -325.3958740234375, -313.90911865234375, -302.42236328125, -290.93560791015625, -279.4488525390625, -267.9620666503906, -256.475341796875, -244.98858642578125, -233.5018310546875, -222.01507568359375, -210.52830505371094, -199.0415496826172, -187.55479431152344, -176.06802368164062, -164.58126831054688, -153.09451293945312, -141.60775756835938, -130.12100219726562, -118.63423156738281, -107.14747619628906, -95.66072082519531, -84.17395782470703, -72.68720245361328, -61.200443267822266, -49.71368408203125, -38.2269287109375, -26.740169525146484, -15.253410339355469, -3.7666549682617188, 7.7201080322265625, 19.206863403320312, 30.693622589111328, 42.180381774902344, 53.667137145996094, 65.15390014648438, 76.64065551757812, 88.12741088867188, 99.61417388916016, 111.1009292602539, 122.58768463134766, 134.07444763183594, 145.5612030029297, 157.04795837402344, 168.53472900390625, 180.021484375, 191.50823974609375, 202.9949951171875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 6.0, 6.0, 7.0, 10.0, 12.0, 6.0, 8.0, 15.0, 16.0, 24.0, 32.0, 38.0, 37.0, 31.0, 34.0, 40.0, 52.0, 48.0, 48.0, 55.0, 55.0, 36.0, 40.0, 57.0, 44.0, 41.0, 35.0, 34.0, 20.0, 20.0, 23.0, 14.0, 17.0, 15.0, 11.0, 9.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-94.20802307128906, -91.28093719482422, -88.35384368896484, -85.4267578125, -82.49967193603516, -79.57258605957031, -76.64549255371094, -73.7184066772461, -70.79132080078125, -67.8642349243164, -64.93714141845703, -62.01005554199219, -59.082969665527344, -56.155879974365234, -53.228790283203125, -50.30170440673828, -47.374610900878906, -44.4475212097168, -41.52043533325195, -38.593345642089844, -35.666259765625, -32.73917007446289, -29.81208038330078, -26.884992599487305, -23.957904815673828, -21.03081703186035, -18.103729248046875, -15.176639556884766, -12.249551773071289, -9.322463989257812, -6.395374298095703, -3.4682865142822266, -0.5412063598632812, 2.3858819007873535, 5.312970161437988, 8.240058898925781, 11.167146682739258, 14.094234466552734, 17.021324157714844, 19.94841194152832, 22.875499725341797, 25.802587509155273, 28.72967529296875, 31.65676498413086, 34.58385467529297, 37.51094055175781, 40.43803024291992, 43.36511993408203, 46.292205810546875, 49.219295501708984, 52.14638137817383, 55.07347106933594, 58.00055694580078, 60.92764663696289, 63.854736328125, 66.78182220458984, 69.70890808105469, 72.63599395751953, 75.5630874633789, 78.49017333984375, 81.4172592163086, 84.34434509277344, 87.27143859863281, 90.19852447509766, 93.12561798095703]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 7.0, 11.0, 13.0, 13.0, 22.0, 34.0, 46.0, 101.0, 141.0, 231.0, 441.0, 885.0, 1872.0, 4865.0, 13932.0, 45036.0, 162263.0, 461985.0, 255141.0, 68966.0, 20563.0, 6941.0, 2561.0, 1190.0, 549.0, 284.0, 189.0, 88.0, 54.0, 41.0, 28.0, 18.0, 15.0, 9.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.34375, -15.843505859375, -15.34326171875, -14.843017578125, -14.3427734375, -13.842529296875, -13.34228515625, -12.842041015625, -12.341796875, -11.841552734375, -11.34130859375, -10.841064453125, -10.3408203125, -9.840576171875, -9.34033203125, -8.840087890625, -8.33984375, -7.839599609375, -7.33935546875, -6.839111328125, -6.3388671875, -5.838623046875, -5.33837890625, -4.838134765625, -4.337890625, -3.837646484375, -3.33740234375, -2.837158203125, -2.3369140625, -1.836669921875, -1.33642578125, -0.836181640625, -0.3359375, 0.164306640625, 0.66455078125, 1.164794921875, 1.6650390625, 2.165283203125, 2.66552734375, 3.165771484375, 3.666015625, 4.166259765625, 4.66650390625, 5.166748046875, 5.6669921875, 6.167236328125, 6.66748046875, 7.167724609375, 7.66796875, 8.168212890625, 8.66845703125, 9.168701171875, 9.6689453125, 10.169189453125, 10.66943359375, 11.169677734375, 11.669921875, 12.170166015625, 12.67041015625, 13.170654296875, 13.6708984375, 14.171142578125, 14.67138671875, 15.171630859375, 15.671875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 11.0, 7.0, 13.0, 23.0, 32.0, 29.0, 44.0, 52.0, 40.0, 52.0, 58.0, 59.0, 63.0, 63.0, 56.0, 53.0, 52.0, 45.0, 46.0, 37.0, 35.0, 28.0, 25.0, 15.0, 19.0, 10.0, 8.0, 7.0, 9.0, 4.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4609375, -8.234619140625, -8.00830078125, -7.781982421875, -7.5556640625, -7.329345703125, -7.10302734375, -6.876708984375, -6.650390625, -6.424072265625, -6.19775390625, -5.971435546875, -5.7451171875, -5.518798828125, -5.29248046875, -5.066162109375, -4.83984375, -4.613525390625, -4.38720703125, -4.160888671875, -3.9345703125, -3.708251953125, -3.48193359375, -3.255615234375, -3.029296875, -2.802978515625, -2.57666015625, -2.350341796875, -2.1240234375, -1.897705078125, -1.67138671875, -1.445068359375, -1.21875, -0.992431640625, -0.76611328125, -0.539794921875, -0.3134765625, -0.087158203125, 0.13916015625, 0.365478515625, 0.591796875, 0.818115234375, 1.04443359375, 1.270751953125, 1.4970703125, 1.723388671875, 1.94970703125, 2.176025390625, 2.40234375, 2.628662109375, 2.85498046875, 3.081298828125, 3.3076171875, 3.533935546875, 3.76025390625, 3.986572265625, 4.212890625, 4.439208984375, 4.66552734375, 4.891845703125, 5.1181640625, 5.344482421875, 5.57080078125, 5.797119140625, 6.0234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 12.0, 10.0, 16.0, 22.0, 53.0, 71.0, 134.0, 210.0, 393.0, 833.0, 1793.0, 5301.0, 31580.0, 694975.0, 287569.0, 18762.0, 3863.0, 1383.0, 673.0, 370.0, 186.0, 139.0, 79.0, 42.0, 28.0, 16.0, 8.0, 10.0, 8.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.15625, -33.93896484375, -32.7216796875, -31.50439453125, -30.287109375, -29.06982421875, -27.8525390625, -26.63525390625, -25.41796875, -24.20068359375, -22.9833984375, -21.76611328125, -20.548828125, -19.33154296875, -18.1142578125, -16.89697265625, -15.6796875, -14.46240234375, -13.2451171875, -12.02783203125, -10.810546875, -9.59326171875, -8.3759765625, -7.15869140625, -5.94140625, -4.72412109375, -3.5068359375, -2.28955078125, -1.072265625, 0.14501953125, 1.3623046875, 2.57958984375, 3.796875, 5.01416015625, 6.2314453125, 7.44873046875, 8.666015625, 9.88330078125, 11.1005859375, 12.31787109375, 13.53515625, 14.75244140625, 15.9697265625, 17.18701171875, 18.404296875, 19.62158203125, 20.8388671875, 22.05615234375, 23.2734375, 24.49072265625, 25.7080078125, 26.92529296875, 28.142578125, 29.35986328125, 30.5771484375, 31.79443359375, 33.01171875, 34.22900390625, 35.4462890625, 36.66357421875, 37.880859375, 39.09814453125, 40.3154296875, 41.53271484375, 42.75]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 13.0, 11.0, 21.0, 12.0, 18.0, 15.0, 27.0, 23.0, 28.0, 33.0, 41.0, 39.0, 36.0, 34.0, 52.0, 44.0, 44.0, 43.0, 44.0, 38.0, 35.0, 36.0, 36.0, 37.0, 30.0, 31.0, 22.0, 20.0, 24.0, 13.0, 13.0, 12.0, 9.0, 9.0, 9.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-23.53125, -22.79931640625, -22.0673828125, -21.33544921875, -20.603515625, -19.87158203125, -19.1396484375, -18.40771484375, -17.67578125, -16.94384765625, -16.2119140625, -15.47998046875, -14.748046875, -14.01611328125, -13.2841796875, -12.55224609375, -11.8203125, -11.08837890625, -10.3564453125, -9.62451171875, -8.892578125, -8.16064453125, -7.4287109375, -6.69677734375, -5.96484375, -5.23291015625, -4.5009765625, -3.76904296875, -3.037109375, -2.30517578125, -1.5732421875, -0.84130859375, -0.109375, 0.62255859375, 1.3544921875, 2.08642578125, 2.818359375, 3.55029296875, 4.2822265625, 5.01416015625, 5.74609375, 6.47802734375, 7.2099609375, 7.94189453125, 8.673828125, 9.40576171875, 10.1376953125, 10.86962890625, 11.6015625, 12.33349609375, 13.0654296875, 13.79736328125, 14.529296875, 15.26123046875, 15.9931640625, 16.72509765625, 17.45703125, 18.18896484375, 18.9208984375, 19.65283203125, 20.384765625, 21.11669921875, 21.8486328125, 22.58056640625, 23.3125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 9.0, 8.0, 4.0, 11.0, 22.0, 22.0, 27.0, 44.0, 53.0, 76.0, 118.0, 156.0, 335.0, 585.0, 1223.0, 2908.0, 8520.0, 34861.0, 239735.0, 674432.0, 64407.0, 13316.0, 4242.0, 1644.0, 728.0, 417.0, 200.0, 133.0, 77.0, 64.0, 51.0, 30.0, 19.0, 20.0, 12.0, 10.0, 9.0, 6.0, 6.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.46875, -11.0467529296875, -10.624755859375, -10.2027587890625, -9.78076171875, -9.3587646484375, -8.936767578125, -8.5147705078125, -8.0927734375, -7.6707763671875, -7.248779296875, -6.8267822265625, -6.40478515625, -5.9827880859375, -5.560791015625, -5.1387939453125, -4.716796875, -4.2947998046875, -3.872802734375, -3.4508056640625, -3.02880859375, -2.6068115234375, -2.184814453125, -1.7628173828125, -1.3408203125, -0.9188232421875, -0.496826171875, -0.0748291015625, 0.34716796875, 0.7691650390625, 1.191162109375, 1.6131591796875, 2.03515625, 2.4571533203125, 2.879150390625, 3.3011474609375, 3.72314453125, 4.1451416015625, 4.567138671875, 4.9891357421875, 5.4111328125, 5.8331298828125, 6.255126953125, 6.6771240234375, 7.09912109375, 7.5211181640625, 7.943115234375, 8.3651123046875, 8.787109375, 9.2091064453125, 9.631103515625, 10.0531005859375, 10.47509765625, 10.8970947265625, 11.319091796875, 11.7410888671875, 12.1630859375, 12.5850830078125, 13.007080078125, 13.4290771484375, 13.85107421875, 14.2730712890625, 14.695068359375, 15.1170654296875, 15.5390625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 12.0, 19.0, 36.0, 41.0, 53.0, 88.0, 186.0, 260.0, 111.0, 56.0, 50.0, 30.0, 22.0, 4.0, 9.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 4.0], "bins": [-0.009490966796875, -0.009289741516113281, -0.009088516235351562, -0.008887290954589844, -0.008686065673828125, -0.008484840393066406, -0.008283615112304688, -0.008082389831542969, -0.00788116455078125, -0.007679939270019531, -0.0074787139892578125, -0.007277488708496094, -0.007076263427734375, -0.006875038146972656, -0.0066738128662109375, -0.006472587585449219, -0.0062713623046875, -0.006070137023925781, -0.0058689117431640625, -0.005667686462402344, -0.005466461181640625, -0.005265235900878906, -0.0050640106201171875, -0.004862785339355469, -0.00466156005859375, -0.004460334777832031, -0.0042591094970703125, -0.004057884216308594, -0.003856658935546875, -0.0036554336547851562, -0.0034542083740234375, -0.0032529830932617188, -0.0030517578125, -0.0028505325317382812, -0.0026493072509765625, -0.0024480819702148438, -0.002246856689453125, -0.0020456314086914062, -0.0018444061279296875, -0.0016431808471679688, -0.00144195556640625, -0.0012407302856445312, -0.0010395050048828125, -0.0008382797241210938, -0.000637054443359375, -0.00043582916259765625, -0.0002346038818359375, -3.337860107421875e-05, 0.0001678466796875, 0.00036907196044921875, 0.0005702972412109375, 0.0007715225219726562, 0.000972747802734375, 0.0011739730834960938, 0.0013751983642578125, 0.0015764236450195312, 0.00177764892578125, 0.0019788742065429688, 0.0021800994873046875, 0.0023813247680664062, 0.002582550048828125, 0.0027837753295898438, 0.0029850006103515625, 0.0031862258911132812, 0.003387451171875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 6.0, 6.0, 9.0, 7.0, 6.0, 18.0, 16.0, 23.0, 29.0, 52.0, 69.0, 91.0, 125.0, 260.0, 372.0, 588.0, 1055.0, 2113.0, 4801.0, 13305.0, 52475.0, 578033.0, 331602.0, 43284.0, 11354.0, 4323.0, 1907.0, 1033.0, 560.0, 358.0, 201.0, 139.0, 84.0, 56.0, 41.0, 36.0, 20.0, 19.0, 17.0, 8.0, 7.0, 11.0, 11.0, 4.0, 7.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.1640625, -12.724365234375, -12.28466796875, -11.844970703125, -11.4052734375, -10.965576171875, -10.52587890625, -10.086181640625, -9.646484375, -9.206787109375, -8.76708984375, -8.327392578125, -7.8876953125, -7.447998046875, -7.00830078125, -6.568603515625, -6.12890625, -5.689208984375, -5.24951171875, -4.809814453125, -4.3701171875, -3.930419921875, -3.49072265625, -3.051025390625, -2.611328125, -2.171630859375, -1.73193359375, -1.292236328125, -0.8525390625, -0.412841796875, 0.02685546875, 0.466552734375, 0.90625, 1.345947265625, 1.78564453125, 2.225341796875, 2.6650390625, 3.104736328125, 3.54443359375, 3.984130859375, 4.423828125, 4.863525390625, 5.30322265625, 5.742919921875, 6.1826171875, 6.622314453125, 7.06201171875, 7.501708984375, 7.94140625, 8.381103515625, 8.82080078125, 9.260498046875, 9.7001953125, 10.139892578125, 10.57958984375, 11.019287109375, 11.458984375, 11.898681640625, 12.33837890625, 12.778076171875, 13.2177734375, 13.657470703125, 14.09716796875, 14.536865234375, 14.9765625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 2.0, 3.0, 7.0, 6.0, 9.0, 6.0, 8.0, 10.0, 21.0, 24.0, 15.0, 33.0, 34.0, 39.0, 59.0, 72.0, 92.0, 127.0, 94.0, 55.0, 45.0, 54.0, 30.0, 38.0, 30.0, 23.0, 19.0, 8.0, 3.0, 6.0, 5.0, 7.0, 2.0, 2.0, 5.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-11.4609375, -11.119873046875, -10.77880859375, -10.437744140625, -10.0966796875, -9.755615234375, -9.41455078125, -9.073486328125, -8.732421875, -8.391357421875, -8.05029296875, -7.709228515625, -7.3681640625, -7.027099609375, -6.68603515625, -6.344970703125, -6.00390625, -5.662841796875, -5.32177734375, -4.980712890625, -4.6396484375, -4.298583984375, -3.95751953125, -3.616455078125, -3.275390625, -2.934326171875, -2.59326171875, -2.252197265625, -1.9111328125, -1.570068359375, -1.22900390625, -0.887939453125, -0.546875, -0.205810546875, 0.13525390625, 0.476318359375, 0.8173828125, 1.158447265625, 1.49951171875, 1.840576171875, 2.181640625, 2.522705078125, 2.86376953125, 3.204833984375, 3.5458984375, 3.886962890625, 4.22802734375, 4.569091796875, 4.91015625, 5.251220703125, 5.59228515625, 5.933349609375, 6.2744140625, 6.615478515625, 6.95654296875, 7.297607421875, 7.638671875, 7.979736328125, 8.32080078125, 8.661865234375, 9.0029296875, 9.343994140625, 9.68505859375, 10.026123046875, 10.3671875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 9.0, 20.0, 23.0, 77.0, 159.0, 309.0, 220.0, 90.0, 48.0, 11.0, 13.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-303.3929443359375, -293.54205322265625, -283.6911926269531, -273.84033203125, -263.98944091796875, -254.13856506347656, -244.28768920898438, -234.4368133544922, -224.5859375, -214.7350616455078, -204.88418579101562, -195.03330993652344, -185.18243408203125, -175.33155822753906, -165.48068237304688, -155.6298065185547, -145.7789306640625, -135.9280548095703, -126.07717895507812, -116.22630310058594, -106.37542724609375, -96.52455139160156, -86.67367553710938, -76.82279968261719, -66.971923828125, -57.12104797363281, -47.270172119140625, -37.41929626464844, -27.56842041015625, -17.717544555664062, -7.866668701171875, 1.9842071533203125, 11.8350830078125, 21.685958862304688, 31.536834716796875, 41.38771057128906, 51.23858642578125, 61.08946228027344, 70.94033813476562, 80.79121398925781, 90.64208984375, 100.49296569824219, 110.34384155273438, 120.19471740722656, 130.04559326171875, 139.89646911621094, 149.74734497070312, 159.5982208251953, 169.4490966796875, 179.2999725341797, 189.15084838867188, 199.00172424316406, 208.85260009765625, 218.70347595214844, 228.55435180664062, 238.4052276611328, 248.256103515625, 258.10699462890625, 267.9578552246094, 277.8087158203125, 287.65960693359375, 297.510498046875, 307.3613586425781, 317.21221923828125, 327.0631103515625]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 7.0, 10.0, 17.0, 11.0, 12.0, 20.0, 20.0, 18.0, 33.0, 30.0, 27.0, 33.0, 40.0, 57.0, 46.0, 58.0, 71.0, 64.0, 59.0, 41.0, 39.0, 31.0, 31.0, 30.0, 35.0, 25.0, 15.0, 21.0, 17.0, 9.0, 14.0, 10.0, 3.0, 7.0, 9.0, 3.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-129.80667114257812, -126.37604522705078, -122.94541931152344, -119.5147933959961, -116.08416748046875, -112.6535415649414, -109.22291564941406, -105.79228973388672, -102.36166381835938, -98.93103790283203, -95.50041198730469, -92.06978607177734, -88.63916015625, -85.20853424072266, -81.77790832519531, -78.34728240966797, -74.91665649414062, -71.48603057861328, -68.05540466308594, -64.6247787475586, -61.19415283203125, -57.763526916503906, -54.33290100097656, -50.90227508544922, -47.471649169921875, -44.04102325439453, -40.61039733886719, -37.179771423339844, -33.7491455078125, -30.318519592285156, -26.887893676757812, -23.45726776123047, -20.026634216308594, -16.59600830078125, -13.165382385253906, -9.734756469726562, -6.304130554199219, -2.873504638671875, 0.5571212768554688, 3.9877471923828125, 7.418373107910156, 10.8489990234375, 14.279624938964844, 17.710250854492188, 21.14087677001953, 24.571502685546875, 28.00212860107422, 31.432754516601562, 34.863380432128906, 38.29400634765625, 41.724632263183594, 45.15525817871094, 48.58588409423828, 52.016510009765625, 55.44713592529297, 58.87776184082031, 62.308387756347656, 65.739013671875, 69.16963958740234, 72.60026550292969, 76.03089141845703, 79.46151733398438, 82.89214324951172, 86.32276916503906, 89.7533950805664]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 7.0, 8.0, 9.0, 8.0, 14.0, 16.0, 24.0, 13.0, 39.0, 57.0, 96.0, 194.0, 303.0, 679.0, 1543.0, 4450.0, 20004.0, 348701.0, 3697065.0, 103666.0, 11885.0, 3112.0, 1148.0, 518.0, 282.0, 152.0, 86.0, 53.0, 38.0, 19.0, 21.0, 18.0, 6.0, 4.0, 3.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-26.703125, -25.90234375, -25.1015625, -24.30078125, -23.5, -22.69921875, -21.8984375, -21.09765625, -20.296875, -19.49609375, -18.6953125, -17.89453125, -17.09375, -16.29296875, -15.4921875, -14.69140625, -13.890625, -13.08984375, -12.2890625, -11.48828125, -10.6875, -9.88671875, -9.0859375, -8.28515625, -7.484375, -6.68359375, -5.8828125, -5.08203125, -4.28125, -3.48046875, -2.6796875, -1.87890625, -1.078125, -0.27734375, 0.5234375, 1.32421875, 2.125, 2.92578125, 3.7265625, 4.52734375, 5.328125, 6.12890625, 6.9296875, 7.73046875, 8.53125, 9.33203125, 10.1328125, 10.93359375, 11.734375, 12.53515625, 13.3359375, 14.13671875, 14.9375, 15.73828125, 16.5390625, 17.33984375, 18.140625, 18.94140625, 19.7421875, 20.54296875, 21.34375, 22.14453125, 22.9453125, 23.74609375, 24.546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 6.0, 5.0, 4.0, 13.0, 12.0, 20.0, 29.0, 35.0, 43.0, 51.0, 43.0, 50.0, 67.0, 74.0, 67.0, 69.0, 74.0, 49.0, 60.0, 36.0, 42.0, 36.0, 28.0, 25.0, 15.0, 19.0, 13.0, 5.0, 6.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.44140625, -6.18145751953125, -5.9215087890625, -5.66156005859375, -5.401611328125, -5.14166259765625, -4.8817138671875, -4.62176513671875, -4.36181640625, -4.10186767578125, -3.8419189453125, -3.58197021484375, -3.322021484375, -3.06207275390625, -2.8021240234375, -2.54217529296875, -2.2822265625, -2.02227783203125, -1.7623291015625, -1.50238037109375, -1.242431640625, -0.98248291015625, -0.7225341796875, -0.46258544921875, -0.20263671875, 0.05731201171875, 0.3172607421875, 0.57720947265625, 0.837158203125, 1.09710693359375, 1.3570556640625, 1.61700439453125, 1.876953125, 2.13690185546875, 2.3968505859375, 2.65679931640625, 2.916748046875, 3.17669677734375, 3.4366455078125, 3.69659423828125, 3.95654296875, 4.21649169921875, 4.4764404296875, 4.73638916015625, 4.996337890625, 5.25628662109375, 5.5162353515625, 5.77618408203125, 6.0361328125, 6.29608154296875, 6.5560302734375, 6.81597900390625, 7.075927734375, 7.33587646484375, 7.5958251953125, 7.85577392578125, 8.11572265625, 8.37567138671875, 8.6356201171875, 8.89556884765625, 9.155517578125, 9.41546630859375, 9.6754150390625, 9.93536376953125, 10.1953125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 13.0, 24.0, 42.0, 81.0, 161.0, 355.0, 1169.0, 21598.0, 4145510.0, 23758.0, 1137.0, 258.0, 99.0, 45.0, 23.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.5, -83.9189453125, -81.337890625, -78.7568359375, -76.17578125, -73.5947265625, -71.013671875, -68.4326171875, -65.8515625, -63.2705078125, -60.689453125, -58.1083984375, -55.52734375, -52.9462890625, -50.365234375, -47.7841796875, -45.203125, -42.6220703125, -40.041015625, -37.4599609375, -34.87890625, -32.2978515625, -29.716796875, -27.1357421875, -24.5546875, -21.9736328125, -19.392578125, -16.8115234375, -14.23046875, -11.6494140625, -9.068359375, -6.4873046875, -3.90625, -1.3251953125, 1.255859375, 3.8369140625, 6.41796875, 8.9990234375, 11.580078125, 14.1611328125, 16.7421875, 19.3232421875, 21.904296875, 24.4853515625, 27.06640625, 29.6474609375, 32.228515625, 34.8095703125, 37.390625, 39.9716796875, 42.552734375, 45.1337890625, 47.71484375, 50.2958984375, 52.876953125, 55.4580078125, 58.0390625, 60.6201171875, 63.201171875, 65.7822265625, 68.36328125, 70.9443359375, 73.525390625, 76.1064453125, 78.6875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 13.0, 12.0, 49.0, 97.0, 297.0, 1254.0, 1641.0, 505.0, 126.0, 52.0, 16.0, 8.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-72.6875, -71.14697265625, -69.6064453125, -68.06591796875, -66.525390625, -64.98486328125, -63.4443359375, -61.90380859375, -60.36328125, -58.82275390625, -57.2822265625, -55.74169921875, -54.201171875, -52.66064453125, -51.1201171875, -49.57958984375, -48.0390625, -46.49853515625, -44.9580078125, -43.41748046875, -41.876953125, -40.33642578125, -38.7958984375, -37.25537109375, -35.71484375, -34.17431640625, -32.6337890625, -31.09326171875, -29.552734375, -28.01220703125, -26.4716796875, -24.93115234375, -23.390625, -21.85009765625, -20.3095703125, -18.76904296875, -17.228515625, -15.68798828125, -14.1474609375, -12.60693359375, -11.06640625, -9.52587890625, -7.9853515625, -6.44482421875, -4.904296875, -3.36376953125, -1.8232421875, -0.28271484375, 1.2578125, 2.79833984375, 4.3388671875, 5.87939453125, 7.419921875, 8.96044921875, 10.5009765625, 12.04150390625, 13.58203125, 15.12255859375, 16.6630859375, 18.20361328125, 19.744140625, 21.28466796875, 22.8251953125, 24.36572265625, 25.90625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 14.0, 35.0, 92.0, 265.0, 358.0, 163.0, 54.0, 12.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-521.3150024414062, -508.3994445800781, -495.48388671875, -482.5683288574219, -469.65277099609375, -456.73724365234375, -443.8216552734375, -430.9061279296875, -417.9905700683594, -405.07501220703125, -392.1594543457031, -379.243896484375, -366.3283386230469, -353.41278076171875, -340.49725341796875, -327.5816955566406, -314.6661376953125, -301.7505798339844, -288.83502197265625, -275.9194641113281, -263.00390625, -250.08836364746094, -237.1728057861328, -224.25726318359375, -211.3416748046875, -198.42611694335938, -185.51055908203125, -172.59500122070312, -159.67945861816406, -146.76390075683594, -133.8483428955078, -120.93279266357422, -108.01724243164062, -95.1016845703125, -82.1861343383789, -69.27057647705078, -56.35502243041992, -43.43946838378906, -30.523910522460938, -17.608360290527344, -4.692802429199219, 8.222752571105957, 21.138307571411133, 34.053863525390625, 46.969417572021484, 59.884971618652344, 72.80052947998047, 85.71607971191406, 98.63163757324219, 111.54719543457031, 124.4627456665039, 137.3782958984375, 150.29385375976562, 163.20941162109375, 176.12496948242188, 189.04052734375, 201.95608520507812, 214.87164306640625, 227.78720092773438, 240.7027587890625, 253.61830139160156, 266.53387451171875, 279.44940185546875, 292.3649597167969, 305.280517578125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 12.0, 26.0, 22.0, 50.0, 65.0, 99.0, 94.0, 118.0, 117.0, 128.0, 95.0, 62.0, 54.0, 26.0, 20.0, 10.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-345.9951477050781, -338.9222717285156, -331.8493957519531, -324.7764892578125, -317.70361328125, -310.6307373046875, -303.557861328125, -296.4849853515625, -289.412109375, -282.3392333984375, -275.266357421875, -268.1934814453125, -261.1205749511719, -254.04769897460938, -246.97482299804688, -239.90194702148438, -232.8290557861328, -225.7561798095703, -218.68328857421875, -211.61041259765625, -204.53753662109375, -197.46466064453125, -190.3917694091797, -183.3188934326172, -176.24600219726562, -169.17312622070312, -162.10023498535156, -155.02735900878906, -147.95448303222656, -140.881591796875, -133.8087158203125, -126.73583984375, -119.66297912597656, -112.59009552001953, -105.51721954345703, -98.4443359375, -91.3714599609375, -84.29857635498047, -77.22569274902344, -70.15281677246094, -63.079933166503906, -56.00705337524414, -48.934173583984375, -41.861289978027344, -34.78841018676758, -27.715530395507812, -20.64264678955078, -13.569766998291016, -6.49688720703125, 0.575993537902832, 7.648874282836914, 14.721755981445312, 21.794635772705078, 28.867515563964844, 35.940399169921875, 43.01327896118164, 50.086158752441406, 57.15903854370117, 64.23191833496094, 71.30480194091797, 78.377685546875, 85.4505615234375, 92.52344512939453, 99.59632873535156, 106.66920471191406]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 7.0, 4.0, 10.0, 15.0, 17.0, 26.0, 46.0, 63.0, 141.0, 353.0, 866.0, 2538.0, 10654.0, 69176.0, 598419.0, 322348.0, 34504.0, 6511.0, 1667.0, 655.0, 258.0, 114.0, 54.0, 42.0, 29.0, 17.0, 11.0, 5.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.859375, -20.942138671875, -20.02490234375, -19.107666015625, -18.1904296875, -17.273193359375, -16.35595703125, -15.438720703125, -14.521484375, -13.604248046875, -12.68701171875, -11.769775390625, -10.8525390625, -9.935302734375, -9.01806640625, -8.100830078125, -7.18359375, -6.266357421875, -5.34912109375, -4.431884765625, -3.5146484375, -2.597412109375, -1.68017578125, -0.762939453125, 0.154296875, 1.071533203125, 1.98876953125, 2.906005859375, 3.8232421875, 4.740478515625, 5.65771484375, 6.574951171875, 7.4921875, 8.409423828125, 9.32666015625, 10.243896484375, 11.1611328125, 12.078369140625, 12.99560546875, 13.912841796875, 14.830078125, 15.747314453125, 16.66455078125, 17.581787109375, 18.4990234375, 19.416259765625, 20.33349609375, 21.250732421875, 22.16796875, 23.085205078125, 24.00244140625, 24.919677734375, 25.8369140625, 26.754150390625, 27.67138671875, 28.588623046875, 29.505859375, 30.423095703125, 31.34033203125, 32.257568359375, 33.1748046875, 34.092041015625, 35.00927734375, 35.926513671875, 36.84375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 12.0, 9.0, 17.0, 17.0, 17.0, 28.0, 41.0, 47.0, 41.0, 43.0, 37.0, 51.0, 57.0, 62.0, 61.0, 47.0, 49.0, 41.0, 50.0, 42.0, 41.0, 40.0, 30.0, 28.0, 14.0, 16.0, 13.0, 8.0, 11.0, 9.0, 2.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-8.859375, -8.628173828125, -8.39697265625, -8.165771484375, -7.9345703125, -7.703369140625, -7.47216796875, -7.240966796875, -7.009765625, -6.778564453125, -6.54736328125, -6.316162109375, -6.0849609375, -5.853759765625, -5.62255859375, -5.391357421875, -5.16015625, -4.928955078125, -4.69775390625, -4.466552734375, -4.2353515625, -4.004150390625, -3.77294921875, -3.541748046875, -3.310546875, -3.079345703125, -2.84814453125, -2.616943359375, -2.3857421875, -2.154541015625, -1.92333984375, -1.692138671875, -1.4609375, -1.229736328125, -0.99853515625, -0.767333984375, -0.5361328125, -0.304931640625, -0.07373046875, 0.157470703125, 0.388671875, 0.619873046875, 0.85107421875, 1.082275390625, 1.3134765625, 1.544677734375, 1.77587890625, 2.007080078125, 2.23828125, 2.469482421875, 2.70068359375, 2.931884765625, 3.1630859375, 3.394287109375, 3.62548828125, 3.856689453125, 4.087890625, 4.319091796875, 4.55029296875, 4.781494140625, 5.0126953125, 5.243896484375, 5.47509765625, 5.706298828125, 5.9375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 9.0, 9.0, 14.0, 27.0, 53.0, 104.0, 216.0, 599.0, 1774.0, 9168.0, 335459.0, 686068.0, 11844.0, 2061.0, 658.0, 255.0, 94.0, 62.0, 23.0, 20.0, 12.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.28125, -58.13232421875, -55.9833984375, -53.83447265625, -51.685546875, -49.53662109375, -47.3876953125, -45.23876953125, -43.08984375, -40.94091796875, -38.7919921875, -36.64306640625, -34.494140625, -32.34521484375, -30.1962890625, -28.04736328125, -25.8984375, -23.74951171875, -21.6005859375, -19.45166015625, -17.302734375, -15.15380859375, -13.0048828125, -10.85595703125, -8.70703125, -6.55810546875, -4.4091796875, -2.26025390625, -0.111328125, 2.03759765625, 4.1865234375, 6.33544921875, 8.484375, 10.63330078125, 12.7822265625, 14.93115234375, 17.080078125, 19.22900390625, 21.3779296875, 23.52685546875, 25.67578125, 27.82470703125, 29.9736328125, 32.12255859375, 34.271484375, 36.42041015625, 38.5693359375, 40.71826171875, 42.8671875, 45.01611328125, 47.1650390625, 49.31396484375, 51.462890625, 53.61181640625, 55.7607421875, 57.90966796875, 60.05859375, 62.20751953125, 64.3564453125, 66.50537109375, 68.654296875, 70.80322265625, 72.9521484375, 75.10107421875, 77.25]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 4.0, 4.0, 15.0, 17.0, 8.0, 27.0, 18.0, 23.0, 34.0, 46.0, 47.0, 51.0, 74.0, 70.0, 56.0, 50.0, 51.0, 53.0, 52.0, 50.0, 52.0, 36.0, 31.0, 27.0, 15.0, 25.0, 9.0, 4.0, 13.0, 8.0, 8.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.0, -35.849609375, -34.69921875, -33.548828125, -32.3984375, -31.248046875, -30.09765625, -28.947265625, -27.796875, -26.646484375, -25.49609375, -24.345703125, -23.1953125, -22.044921875, -20.89453125, -19.744140625, -18.59375, -17.443359375, -16.29296875, -15.142578125, -13.9921875, -12.841796875, -11.69140625, -10.541015625, -9.390625, -8.240234375, -7.08984375, -5.939453125, -4.7890625, -3.638671875, -2.48828125, -1.337890625, -0.1875, 0.962890625, 2.11328125, 3.263671875, 4.4140625, 5.564453125, 6.71484375, 7.865234375, 9.015625, 10.166015625, 11.31640625, 12.466796875, 13.6171875, 14.767578125, 15.91796875, 17.068359375, 18.21875, 19.369140625, 20.51953125, 21.669921875, 22.8203125, 23.970703125, 25.12109375, 26.271484375, 27.421875, 28.572265625, 29.72265625, 30.873046875, 32.0234375, 33.173828125, 34.32421875, 35.474609375, 36.625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 12.0, 26.0, 29.0, 95.0, 223.0, 707.0, 3091.0, 32344.0, 953712.0, 53148.0, 3889.0, 832.0, 249.0, 107.0, 38.0, 23.0, 16.0, 6.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.40625, -23.09228515625, -21.7783203125, -20.46435546875, -19.150390625, -17.83642578125, -16.5224609375, -15.20849609375, -13.89453125, -12.58056640625, -11.2666015625, -9.95263671875, -8.638671875, -7.32470703125, -6.0107421875, -4.69677734375, -3.3828125, -2.06884765625, -0.7548828125, 0.55908203125, 1.873046875, 3.18701171875, 4.5009765625, 5.81494140625, 7.12890625, 8.44287109375, 9.7568359375, 11.07080078125, 12.384765625, 13.69873046875, 15.0126953125, 16.32666015625, 17.640625, 18.95458984375, 20.2685546875, 21.58251953125, 22.896484375, 24.21044921875, 25.5244140625, 26.83837890625, 28.15234375, 29.46630859375, 30.7802734375, 32.09423828125, 33.408203125, 34.72216796875, 36.0361328125, 37.35009765625, 38.6640625, 39.97802734375, 41.2919921875, 42.60595703125, 43.919921875, 45.23388671875, 46.5478515625, 47.86181640625, 49.17578125, 50.48974609375, 51.8037109375, 53.11767578125, 54.431640625, 55.74560546875, 57.0595703125, 58.37353515625, 59.6875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 6.0, 16.0, 13.0, 20.0, 24.0, 29.0, 71.0, 171.0, 333.0, 138.0, 71.0, 33.0, 25.0, 16.0, 7.0, 10.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0099029541015625, -0.009638309478759766, -0.009373664855957031, -0.009109020233154297, -0.008844375610351562, -0.008579730987548828, -0.008315086364746094, -0.00805044174194336, -0.007785797119140625, -0.007521152496337891, -0.007256507873535156, -0.006991863250732422, -0.0067272186279296875, -0.006462574005126953, -0.006197929382324219, -0.005933284759521484, -0.00566864013671875, -0.005403995513916016, -0.005139350891113281, -0.004874706268310547, -0.0046100616455078125, -0.004345417022705078, -0.004080772399902344, -0.0038161277770996094, -0.003551483154296875, -0.0032868385314941406, -0.0030221939086914062, -0.002757549285888672, -0.0024929046630859375, -0.002228260040283203, -0.0019636154174804688, -0.0016989707946777344, -0.001434326171875, -0.0011696815490722656, -0.0009050369262695312, -0.0006403923034667969, -0.0003757476806640625, -0.00011110305786132812, 0.00015354156494140625, 0.0004181861877441406, 0.000682830810546875, 0.0009474754333496094, 0.0012121200561523438, 0.0014767646789550781, 0.0017414093017578125, 0.002006053924560547, 0.0022706985473632812, 0.0025353431701660156, 0.00279998779296875, 0.0030646324157714844, 0.0033292770385742188, 0.003593921661376953, 0.0038585662841796875, 0.004123210906982422, 0.004387855529785156, 0.004652500152587891, 0.004917144775390625, 0.005181789398193359, 0.005446434020996094, 0.005711078643798828, 0.0059757232666015625, 0.006240367889404297, 0.006505012512207031, 0.006769657135009766, 0.0070343017578125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 7.0, 9.0, 10.0, 15.0, 15.0, 42.0, 45.0, 53.0, 71.0, 111.0, 187.0, 327.0, 486.0, 983.0, 1818.0, 3749.0, 9543.0, 29381.0, 151285.0, 739439.0, 77973.0, 19751.0, 6872.0, 2990.0, 1418.0, 731.0, 431.0, 245.0, 186.0, 105.0, 65.0, 50.0, 43.0, 28.0, 29.0, 18.0, 17.0, 9.0, 7.0, 3.0, 2.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0], "bins": [-19.09375, -18.5682373046875, -18.042724609375, -17.5172119140625, -16.99169921875, -16.4661865234375, -15.940673828125, -15.4151611328125, -14.8896484375, -14.3641357421875, -13.838623046875, -13.3131103515625, -12.78759765625, -12.2620849609375, -11.736572265625, -11.2110595703125, -10.685546875, -10.1600341796875, -9.634521484375, -9.1090087890625, -8.58349609375, -8.0579833984375, -7.532470703125, -7.0069580078125, -6.4814453125, -5.9559326171875, -5.430419921875, -4.9049072265625, -4.37939453125, -3.8538818359375, -3.328369140625, -2.8028564453125, -2.27734375, -1.7518310546875, -1.226318359375, -0.7008056640625, -0.17529296875, 0.3502197265625, 0.875732421875, 1.4012451171875, 1.9267578125, 2.4522705078125, 2.977783203125, 3.5032958984375, 4.02880859375, 4.5543212890625, 5.079833984375, 5.6053466796875, 6.130859375, 6.6563720703125, 7.181884765625, 7.7073974609375, 8.23291015625, 8.7584228515625, 9.283935546875, 9.8094482421875, 10.3349609375, 10.8604736328125, 11.385986328125, 11.9114990234375, 12.43701171875, 12.9625244140625, 13.488037109375, 14.0135498046875, 14.5390625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 7.0, 6.0, 10.0, 12.0, 7.0, 10.0, 11.0, 18.0, 24.0, 34.0, 41.0, 86.0, 123.0, 174.0, 131.0, 83.0, 50.0, 35.0, 27.0, 24.0, 16.0, 11.0, 8.0, 12.0, 7.0, 2.0, 9.0, 4.0, 3.0, 2.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.5, -15.9923095703125, -15.484619140625, -14.9769287109375, -14.46923828125, -13.9615478515625, -13.453857421875, -12.9461669921875, -12.4384765625, -11.9307861328125, -11.423095703125, -10.9154052734375, -10.40771484375, -9.9000244140625, -9.392333984375, -8.8846435546875, -8.376953125, -7.8692626953125, -7.361572265625, -6.8538818359375, -6.34619140625, -5.8385009765625, -5.330810546875, -4.8231201171875, -4.3154296875, -3.8077392578125, -3.300048828125, -2.7923583984375, -2.28466796875, -1.7769775390625, -1.269287109375, -0.7615966796875, -0.25390625, 0.2537841796875, 0.761474609375, 1.2691650390625, 1.77685546875, 2.2845458984375, 2.792236328125, 3.2999267578125, 3.8076171875, 4.3153076171875, 4.822998046875, 5.3306884765625, 5.83837890625, 6.3460693359375, 6.853759765625, 7.3614501953125, 7.869140625, 8.3768310546875, 8.884521484375, 9.3922119140625, 9.89990234375, 10.4075927734375, 10.915283203125, 11.4229736328125, 11.9306640625, 12.4383544921875, 12.946044921875, 13.4537353515625, 13.96142578125, 14.4691162109375, 14.976806640625, 15.4844970703125, 15.9921875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 22.0, 67.0, 197.0, 448.0, 175.0, 47.0, 15.0, 8.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-558.3154296875, -543.3786010742188, -528.4417724609375, -513.5048828125, -498.5680847167969, -483.6312255859375, -468.69439697265625, -453.757568359375, -438.82073974609375, -423.8839111328125, -408.9470520019531, -394.0102233886719, -379.0733947753906, -364.13653564453125, -349.19970703125, -334.26287841796875, -319.3260192871094, -304.3891906738281, -289.45233154296875, -274.5155029296875, -259.57867431640625, -244.64183044433594, -229.70498657226562, -214.76815795898438, -199.83131408691406, -184.89447021484375, -169.9576416015625, -155.0207977294922, -140.08395385742188, -125.14712524414062, -110.21028137207031, -95.27344512939453, -80.33660888671875, -65.39977264404297, -50.46293258666992, -35.526092529296875, -20.589256286621094, -5.6524200439453125, 9.284423828125, 24.22126007080078, 39.15809631347656, 54.094932556152344, 69.03176879882812, 83.96861267089844, 98.90544891357422, 113.84228515625, 128.7791290283203, 143.71597290039062, 158.65280151367188, 173.5896453857422, 188.52647399902344, 203.46331787109375, 218.400146484375, 233.3369903564453, 248.27383422851562, 263.2106628417969, 278.14752197265625, 293.0843505859375, 308.0212097167969, 322.9580383300781, 337.8948669433594, 352.83172607421875, 367.7685546875, 382.70538330078125, 397.6422119140625]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 5.0, 4.0, 7.0, 5.0, 6.0, 6.0, 6.0, 14.0, 6.0, 12.0, 16.0, 17.0, 18.0, 20.0, 24.0, 28.0, 32.0, 40.0, 31.0, 53.0, 55.0, 59.0, 72.0, 67.0, 69.0, 48.0, 36.0, 29.0, 30.0, 37.0, 23.0, 26.0, 26.0, 17.0, 12.0, 13.0, 9.0, 6.0, 2.0, 9.0, 8.0, 6.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-107.08128356933594, -102.89578247070312, -98.71028137207031, -94.5247802734375, -90.33927917480469, -86.15377807617188, -81.9682846069336, -77.78278350830078, -73.59728240966797, -69.41178131103516, -65.22628021240234, -61.0407829284668, -56.855281829833984, -52.66978073120117, -48.484283447265625, -44.29878234863281, -40.11328125, -35.92778015136719, -31.742280960083008, -27.556781768798828, -23.371280670166016, -19.185779571533203, -15.000280380249023, -10.814781188964844, -6.629280090332031, -2.443779945373535, 1.741720199584961, 5.927220344543457, 10.112720489501953, 14.298221588134766, 18.483720779418945, 22.669219970703125, 26.854705810546875, 31.040206909179688, 35.2257080078125, 39.41120529174805, 43.59670639038086, 47.78220748901367, 51.96770477294922, 56.15320587158203, 60.338706970214844, 64.52420806884766, 68.70970916748047, 72.89521026611328, 77.08070373535156, 81.26620483398438, 85.45170593261719, 89.63720703125, 93.82270812988281, 98.00820922851562, 102.19371032714844, 106.37921142578125, 110.56471252441406, 114.75021362304688, 118.93570709228516, 123.12120819091797, 127.30670928955078, 131.49220275878906, 135.67770385742188, 139.8632049560547, 144.0487060546875, 148.2342071533203, 152.41970825195312, 156.60520935058594, 160.79071044921875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 8.0, 4.0, 4.0, 11.0, 17.0, 16.0, 25.0, 36.0, 56.0, 97.0, 156.0, 423.0, 1148.0, 5302.0, 66158.0, 4051580.0, 62832.0, 4627.0, 981.0, 329.0, 144.0, 77.0, 47.0, 49.0, 38.0, 17.0, 20.0, 13.0, 8.0, 9.0, 8.0, 5.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.5625, -39.03173828125, -37.5009765625, -35.97021484375, -34.439453125, -32.90869140625, -31.3779296875, -29.84716796875, -28.31640625, -26.78564453125, -25.2548828125, -23.72412109375, -22.193359375, -20.66259765625, -19.1318359375, -17.60107421875, -16.0703125, -14.53955078125, -13.0087890625, -11.47802734375, -9.947265625, -8.41650390625, -6.8857421875, -5.35498046875, -3.82421875, -2.29345703125, -0.7626953125, 0.76806640625, 2.298828125, 3.82958984375, 5.3603515625, 6.89111328125, 8.421875, 9.95263671875, 11.4833984375, 13.01416015625, 14.544921875, 16.07568359375, 17.6064453125, 19.13720703125, 20.66796875, 22.19873046875, 23.7294921875, 25.26025390625, 26.791015625, 28.32177734375, 29.8525390625, 31.38330078125, 32.9140625, 34.44482421875, 35.9755859375, 37.50634765625, 39.037109375, 40.56787109375, 42.0986328125, 43.62939453125, 45.16015625, 46.69091796875, 48.2216796875, 49.75244140625, 51.283203125, 52.81396484375, 54.3447265625, 55.87548828125, 57.40625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 4.0, 6.0, 13.0, 17.0, 17.0, 25.0, 21.0, 47.0, 46.0, 58.0, 56.0, 53.0, 79.0, 75.0, 67.0, 63.0, 66.0, 45.0, 63.0, 50.0, 29.0, 25.0, 22.0, 13.0, 10.0, 9.0, 8.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.55859375, -6.25897216796875, -5.9593505859375, -5.65972900390625, -5.360107421875, -5.06048583984375, -4.7608642578125, -4.46124267578125, -4.16162109375, -3.86199951171875, -3.5623779296875, -3.26275634765625, -2.963134765625, -2.66351318359375, -2.3638916015625, -2.06427001953125, -1.7646484375, -1.46502685546875, -1.1654052734375, -0.86578369140625, -0.566162109375, -0.26654052734375, 0.0330810546875, 0.33270263671875, 0.63232421875, 0.93194580078125, 1.2315673828125, 1.53118896484375, 1.830810546875, 2.13043212890625, 2.4300537109375, 2.72967529296875, 3.029296875, 3.32891845703125, 3.6285400390625, 3.92816162109375, 4.227783203125, 4.52740478515625, 4.8270263671875, 5.12664794921875, 5.42626953125, 5.72589111328125, 6.0255126953125, 6.32513427734375, 6.624755859375, 6.92437744140625, 7.2239990234375, 7.52362060546875, 7.8232421875, 8.12286376953125, 8.4224853515625, 8.72210693359375, 9.021728515625, 9.32135009765625, 9.6209716796875, 9.92059326171875, 10.22021484375, 10.51983642578125, 10.8194580078125, 11.11907958984375, 11.418701171875, 11.71832275390625, 12.0179443359375, 12.31756591796875, 12.6171875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 6.0, 11.0, 18.0, 30.0, 61.0, 102.0, 187.0, 354.0, 772.0, 2255.0, 20897.0, 4124745.0, 41066.0, 2530.0, 712.0, 277.0, 133.0, 65.0, 28.0, 16.0, 8.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.6875, -75.833984375, -72.98046875, -70.126953125, -67.2734375, -64.419921875, -61.56640625, -58.712890625, -55.859375, -53.005859375, -50.15234375, -47.298828125, -44.4453125, -41.591796875, -38.73828125, -35.884765625, -33.03125, -30.177734375, -27.32421875, -24.470703125, -21.6171875, -18.763671875, -15.91015625, -13.056640625, -10.203125, -7.349609375, -4.49609375, -1.642578125, 1.2109375, 4.064453125, 6.91796875, 9.771484375, 12.625, 15.478515625, 18.33203125, 21.185546875, 24.0390625, 26.892578125, 29.74609375, 32.599609375, 35.453125, 38.306640625, 41.16015625, 44.013671875, 46.8671875, 49.720703125, 52.57421875, 55.427734375, 58.28125, 61.134765625, 63.98828125, 66.841796875, 69.6953125, 72.548828125, 75.40234375, 78.255859375, 81.109375, 83.962890625, 86.81640625, 89.669921875, 92.5234375, 95.376953125, 98.23046875, 101.083984375, 103.9375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 16.0, 23.0, 64.0, 173.0, 641.0, 1790.0, 944.0, 231.0, 98.0, 46.0, 16.0, 11.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.875, -65.3076171875, -63.740234375, -62.1728515625, -60.60546875, -59.0380859375, -57.470703125, -55.9033203125, -54.3359375, -52.7685546875, -51.201171875, -49.6337890625, -48.06640625, -46.4990234375, -44.931640625, -43.3642578125, -41.796875, -40.2294921875, -38.662109375, -37.0947265625, -35.52734375, -33.9599609375, -32.392578125, -30.8251953125, -29.2578125, -27.6904296875, -26.123046875, -24.5556640625, -22.98828125, -21.4208984375, -19.853515625, -18.2861328125, -16.71875, -15.1513671875, -13.583984375, -12.0166015625, -10.44921875, -8.8818359375, -7.314453125, -5.7470703125, -4.1796875, -2.6123046875, -1.044921875, 0.5224609375, 2.08984375, 3.6572265625, 5.224609375, 6.7919921875, 8.359375, 9.9267578125, 11.494140625, 13.0615234375, 14.62890625, 16.1962890625, 17.763671875, 19.3310546875, 20.8984375, 22.4658203125, 24.033203125, 25.6005859375, 27.16796875, 28.7353515625, 30.302734375, 31.8701171875, 33.4375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 8.0, 17.0, 31.0, 78.0, 203.0, 304.0, 189.0, 83.0, 45.0, 12.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-494.77117919921875, -483.129638671875, -471.4880676269531, -459.8465270996094, -448.2049560546875, -436.56341552734375, -424.921875, -413.28033447265625, -401.6387634277344, -389.9972229003906, -378.35565185546875, -366.714111328125, -355.07257080078125, -343.4309997558594, -331.7894592285156, -320.14788818359375, -308.50634765625, -296.86480712890625, -285.2232360839844, -273.5816955566406, -261.94012451171875, -250.298583984375, -238.65704345703125, -227.01548767089844, -215.37393188476562, -203.7323760986328, -192.0908203125, -180.44927978515625, -168.80772399902344, -157.16616821289062, -145.52462768554688, -133.88307189941406, -122.24154663085938, -110.59999084472656, -98.95844268798828, -87.31689453125, -75.67533874511719, -64.03378295898438, -52.392234802246094, -40.75068664550781, -29.109130859375, -17.467578887939453, -5.826026916503906, 5.815525054931641, 17.457077026367188, 29.098628997802734, 40.74018096923828, 52.38172912597656, 64.02328491210938, 75.66484069824219, 87.30638885498047, 98.94793701171875, 110.58949279785156, 122.23104858398438, 133.87258911132812, 145.51414489746094, 157.15570068359375, 168.79725646972656, 180.43881225585938, 192.08035278320312, 203.72190856933594, 215.36346435546875, 227.0050048828125, 238.6465606689453, 250.28811645507812]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 7.0, 17.0, 26.0, 42.0, 65.0, 84.0, 118.0, 124.0, 134.0, 130.0, 96.0, 69.0, 40.0, 16.0, 18.0, 4.0, 8.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-223.9552459716797, -215.48777770996094, -207.0203094482422, -198.55282592773438, -190.08535766601562, -181.61788940429688, -173.15042114257812, -164.68295288085938, -156.21548461914062, -147.74801635742188, -139.28054809570312, -130.81307983398438, -122.34559631347656, -113.87812805175781, -105.41065979003906, -96.94319152832031, -88.4757080078125, -80.00823974609375, -71.54076385498047, -63.07329559326172, -54.6058235168457, -46.13835144042969, -37.67088317871094, -29.203411102294922, -20.735939025878906, -12.268467903137207, -3.800996780395508, 4.666473388671875, 13.13394546508789, 21.601417541503906, 30.068885803222656, 38.53635787963867, 47.003814697265625, 55.47128677368164, 63.938758850097656, 72.4062271118164, 80.87370300292969, 89.34117126464844, 97.80863952636719, 106.27610778808594, 114.74358367919922, 123.21105194091797, 131.67852783203125, 140.14599609375, 148.61346435546875, 157.0809326171875, 165.54840087890625, 174.01588439941406, 182.4833526611328, 190.95082092285156, 199.4182891845703, 207.88577270507812, 216.35324096679688, 224.82070922851562, 233.28817749023438, 241.75564575195312, 250.22311401367188, 258.6905822753906, 267.1580505371094, 275.6255187988281, 284.0929870605469, 292.56048583984375, 301.0279541015625, 309.49542236328125, 317.962890625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 3.0, 6.0, 7.0, 13.0, 20.0, 26.0, 28.0, 34.0, 59.0, 96.0, 125.0, 204.0, 384.0, 799.0, 2102.0, 6577.0, 27284.0, 202285.0, 652902.0, 127665.0, 19473.0, 5122.0, 1746.0, 704.0, 313.0, 164.0, 113.0, 77.0, 66.0, 40.0, 23.0, 27.0, 17.0, 5.0, 7.0, 10.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.421875, -23.591064453125, -22.76025390625, -21.929443359375, -21.0986328125, -20.267822265625, -19.43701171875, -18.606201171875, -17.775390625, -16.944580078125, -16.11376953125, -15.282958984375, -14.4521484375, -13.621337890625, -12.79052734375, -11.959716796875, -11.12890625, -10.298095703125, -9.46728515625, -8.636474609375, -7.8056640625, -6.974853515625, -6.14404296875, -5.313232421875, -4.482421875, -3.651611328125, -2.82080078125, -1.989990234375, -1.1591796875, -0.328369140625, 0.50244140625, 1.333251953125, 2.1640625, 2.994873046875, 3.82568359375, 4.656494140625, 5.4873046875, 6.318115234375, 7.14892578125, 7.979736328125, 8.810546875, 9.641357421875, 10.47216796875, 11.302978515625, 12.1337890625, 12.964599609375, 13.79541015625, 14.626220703125, 15.45703125, 16.287841796875, 17.11865234375, 17.949462890625, 18.7802734375, 19.611083984375, 20.44189453125, 21.272705078125, 22.103515625, 22.934326171875, 23.76513671875, 24.595947265625, 25.4267578125, 26.257568359375, 27.08837890625, 27.919189453125, 28.75]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 9.0, 19.0, 37.0, 50.0, 105.0, 115.0, 156.0, 152.0, 123.0, 117.0, 73.0, 31.0, 12.0, 9.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.78125, -25.971435546875, -25.16162109375, -24.351806640625, -23.5419921875, -22.732177734375, -21.92236328125, -21.112548828125, -20.302734375, -19.492919921875, -18.68310546875, -17.873291015625, -17.0634765625, -16.253662109375, -15.44384765625, -14.634033203125, -13.82421875, -13.014404296875, -12.20458984375, -11.394775390625, -10.5849609375, -9.775146484375, -8.96533203125, -8.155517578125, -7.345703125, -6.535888671875, -5.72607421875, -4.916259765625, -4.1064453125, -3.296630859375, -2.48681640625, -1.677001953125, -0.8671875, -0.057373046875, 0.75244140625, 1.562255859375, 2.3720703125, 3.181884765625, 3.99169921875, 4.801513671875, 5.611328125, 6.421142578125, 7.23095703125, 8.040771484375, 8.8505859375, 9.660400390625, 10.47021484375, 11.280029296875, 12.08984375, 12.899658203125, 13.70947265625, 14.519287109375, 15.3291015625, 16.138916015625, 16.94873046875, 17.758544921875, 18.568359375, 19.378173828125, 20.18798828125, 20.997802734375, 21.8076171875, 22.617431640625, 23.42724609375, 24.237060546875, 25.046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 14.0, 15.0, 24.0, 45.0, 74.0, 164.0, 400.0, 1082.0, 3882.0, 27091.0, 692707.0, 302041.0, 16615.0, 2823.0, 878.0, 340.0, 168.0, 85.0, 38.0, 22.0, 17.0, 10.0, 4.0, 4.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.59375, -51.16845703125, -49.7431640625, -48.31787109375, -46.892578125, -45.46728515625, -44.0419921875, -42.61669921875, -41.19140625, -39.76611328125, -38.3408203125, -36.91552734375, -35.490234375, -34.06494140625, -32.6396484375, -31.21435546875, -29.7890625, -28.36376953125, -26.9384765625, -25.51318359375, -24.087890625, -22.66259765625, -21.2373046875, -19.81201171875, -18.38671875, -16.96142578125, -15.5361328125, -14.11083984375, -12.685546875, -11.26025390625, -9.8349609375, -8.40966796875, -6.984375, -5.55908203125, -4.1337890625, -2.70849609375, -1.283203125, 0.14208984375, 1.5673828125, 2.99267578125, 4.41796875, 5.84326171875, 7.2685546875, 8.69384765625, 10.119140625, 11.54443359375, 12.9697265625, 14.39501953125, 15.8203125, 17.24560546875, 18.6708984375, 20.09619140625, 21.521484375, 22.94677734375, 24.3720703125, 25.79736328125, 27.22265625, 28.64794921875, 30.0732421875, 31.49853515625, 32.923828125, 34.34912109375, 35.7744140625, 37.19970703125, 38.625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 6.0, 15.0, 14.0, 24.0, 37.0, 49.0, 63.0, 64.0, 102.0, 96.0, 99.0, 102.0, 81.0, 54.0, 56.0, 40.0, 26.0, 26.0, 17.0, 14.0, 8.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.4375, -78.337890625, -76.23828125, -74.138671875, -72.0390625, -69.939453125, -67.83984375, -65.740234375, -63.640625, -61.541015625, -59.44140625, -57.341796875, -55.2421875, -53.142578125, -51.04296875, -48.943359375, -46.84375, -44.744140625, -42.64453125, -40.544921875, -38.4453125, -36.345703125, -34.24609375, -32.146484375, -30.046875, -27.947265625, -25.84765625, -23.748046875, -21.6484375, -19.548828125, -17.44921875, -15.349609375, -13.25, -11.150390625, -9.05078125, -6.951171875, -4.8515625, -2.751953125, -0.65234375, 1.447265625, 3.546875, 5.646484375, 7.74609375, 9.845703125, 11.9453125, 14.044921875, 16.14453125, 18.244140625, 20.34375, 22.443359375, 24.54296875, 26.642578125, 28.7421875, 30.841796875, 32.94140625, 35.041015625, 37.140625, 39.240234375, 41.33984375, 43.439453125, 45.5390625, 47.638671875, 49.73828125, 51.837890625, 53.9375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 9.0, 16.0, 30.0, 54.0, 117.0, 291.0, 880.0, 3140.0, 13796.0, 124351.0, 834116.0, 59559.0, 8958.0, 2159.0, 656.0, 224.0, 86.0, 40.0, 14.0, 19.0, 4.0, 6.0, 4.0, 2.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.596923828125, -17.05322265625, -16.509521484375, -15.9658203125, -15.422119140625, -14.87841796875, -14.334716796875, -13.791015625, -13.247314453125, -12.70361328125, -12.159912109375, -11.6162109375, -11.072509765625, -10.52880859375, -9.985107421875, -9.44140625, -8.897705078125, -8.35400390625, -7.810302734375, -7.2666015625, -6.722900390625, -6.17919921875, -5.635498046875, -5.091796875, -4.548095703125, -4.00439453125, -3.460693359375, -2.9169921875, -2.373291015625, -1.82958984375, -1.285888671875, -0.7421875, -0.198486328125, 0.34521484375, 0.888916015625, 1.4326171875, 1.976318359375, 2.52001953125, 3.063720703125, 3.607421875, 4.151123046875, 4.69482421875, 5.238525390625, 5.7822265625, 6.325927734375, 6.86962890625, 7.413330078125, 7.95703125, 8.500732421875, 9.04443359375, 9.588134765625, 10.1318359375, 10.675537109375, 11.21923828125, 11.762939453125, 12.306640625, 12.850341796875, 13.39404296875, 13.937744140625, 14.4814453125, 15.025146484375, 15.56884765625, 16.112548828125, 16.65625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 15.0, 11.0, 23.0, 30.0, 52.0, 59.0, 164.0, 192.0, 151.0, 83.0, 63.0, 41.0, 25.0, 16.0, 6.0, 15.0, 8.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028285980224609375, -0.0027085840702056885, -0.0025885701179504395, -0.0024685561656951904, -0.0023485422134399414, -0.0022285282611846924, -0.0021085143089294434, -0.0019885003566741943, -0.0018684864044189453, -0.0017484724521636963, -0.0016284584999084473, -0.0015084445476531982, -0.0013884305953979492, -0.0012684166431427002, -0.0011484026908874512, -0.0010283887386322021, -0.0009083747863769531, -0.0007883608341217041, -0.0006683468818664551, -0.0005483329296112061, -0.00042831897735595703, -0.000308305025100708, -0.00018829107284545898, -6.827712059020996e-05, 5.173683166503906e-05, 0.00017175078392028809, 0.0002917647361755371, 0.00041177868843078613, 0.0005317926406860352, 0.0006518065929412842, 0.0007718205451965332, 0.0008918344974517822, 0.0010118484497070312, 0.0011318624019622803, 0.0012518763542175293, 0.0013718903064727783, 0.0014919042587280273, 0.0016119182109832764, 0.0017319321632385254, 0.0018519461154937744, 0.0019719600677490234, 0.0020919740200042725, 0.0022119879722595215, 0.0023320019245147705, 0.0024520158767700195, 0.0025720298290252686, 0.0026920437812805176, 0.0028120577335357666, 0.0029320716857910156, 0.0030520856380462646, 0.0031720995903015137, 0.0032921135425567627, 0.0034121274948120117, 0.0035321414470672607, 0.0036521553993225098, 0.003772169351577759, 0.003892183303833008, 0.004012197256088257, 0.004132211208343506, 0.004252225160598755, 0.004372239112854004, 0.004492253065109253, 0.004612267017364502, 0.004732280969619751, 0.004852294921875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 10.0, 16.0, 19.0, 31.0, 43.0, 75.0, 130.0, 229.0, 374.0, 758.0, 1584.0, 3485.0, 7829.0, 21355.0, 74598.0, 532080.0, 311418.0, 62451.0, 18744.0, 7218.0, 3116.0, 1438.0, 683.0, 380.0, 198.0, 117.0, 61.0, 39.0, 24.0, 9.0, 9.0, 11.0, 2.0, 5.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.390625, -11.09039306640625, -10.7901611328125, -10.48992919921875, -10.189697265625, -9.88946533203125, -9.5892333984375, -9.28900146484375, -8.98876953125, -8.68853759765625, -8.3883056640625, -8.08807373046875, -7.787841796875, -7.48760986328125, -7.1873779296875, -6.88714599609375, -6.5869140625, -6.28668212890625, -5.9864501953125, -5.68621826171875, -5.385986328125, -5.08575439453125, -4.7855224609375, -4.48529052734375, -4.18505859375, -3.88482666015625, -3.5845947265625, -3.28436279296875, -2.984130859375, -2.68389892578125, -2.3836669921875, -2.08343505859375, -1.783203125, -1.48297119140625, -1.1827392578125, -0.88250732421875, -0.582275390625, -0.28204345703125, 0.0181884765625, 0.31842041015625, 0.61865234375, 0.91888427734375, 1.2191162109375, 1.51934814453125, 1.819580078125, 2.11981201171875, 2.4200439453125, 2.72027587890625, 3.0205078125, 3.32073974609375, 3.6209716796875, 3.92120361328125, 4.221435546875, 4.52166748046875, 4.8218994140625, 5.12213134765625, 5.42236328125, 5.72259521484375, 6.0228271484375, 6.32305908203125, 6.623291015625, 6.92352294921875, 7.2237548828125, 7.52398681640625, 7.82421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 6.0, 2.0, 1.0, 4.0, 3.0, 4.0, 10.0, 7.0, 7.0, 16.0, 22.0, 29.0, 43.0, 52.0, 62.0, 88.0, 113.0, 122.0, 109.0, 73.0, 58.0, 37.0, 32.0, 20.0, 20.0, 8.0, 14.0, 6.0, 10.0, 8.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.703125, -9.3612060546875, -9.019287109375, -8.6773681640625, -8.33544921875, -7.9935302734375, -7.651611328125, -7.3096923828125, -6.9677734375, -6.6258544921875, -6.283935546875, -5.9420166015625, -5.60009765625, -5.2581787109375, -4.916259765625, -4.5743408203125, -4.232421875, -3.8905029296875, -3.548583984375, -3.2066650390625, -2.86474609375, -2.5228271484375, -2.180908203125, -1.8389892578125, -1.4970703125, -1.1551513671875, -0.813232421875, -0.4713134765625, -0.12939453125, 0.2125244140625, 0.554443359375, 0.8963623046875, 1.23828125, 1.5802001953125, 1.922119140625, 2.2640380859375, 2.60595703125, 2.9478759765625, 3.289794921875, 3.6317138671875, 3.9736328125, 4.3155517578125, 4.657470703125, 4.9993896484375, 5.34130859375, 5.6832275390625, 6.025146484375, 6.3670654296875, 6.708984375, 7.0509033203125, 7.392822265625, 7.7347412109375, 8.07666015625, 8.4185791015625, 8.760498046875, 9.1024169921875, 9.4443359375, 9.7862548828125, 10.128173828125, 10.4700927734375, 10.81201171875, 11.1539306640625, 11.495849609375, 11.8377685546875, 12.1796875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 27.0, 119.0, 497.0, 267.0, 62.0, 8.0, 12.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-256.21905517578125, -237.69471740722656, -219.17037963867188, -200.6460418701172, -182.1217041015625, -163.5973663330078, -145.07302856445312, -126.54869079589844, -108.02435302734375, -89.50001525878906, -70.97567749023438, -52.45133972167969, -33.927001953125, -15.402664184570312, 3.121673583984375, 21.646011352539062, 40.17034912109375, 58.69468688964844, 77.21902465820312, 95.74336242675781, 114.2677001953125, 132.7920379638672, 151.31637573242188, 169.84071350097656, 188.36505126953125, 206.88938903808594, 225.41372680664062, 243.9380645751953, 262.46240234375, 280.98675537109375, 299.5110778808594, 318.035400390625, 336.559814453125, 355.08416748046875, 373.6084899902344, 392.1328125, 410.65716552734375, 429.1815185546875, 447.7058410644531, 466.23016357421875, 484.7545166015625, 503.27886962890625, 521.80322265625, 540.3275146484375, 558.8518676757812, 577.376220703125, 595.9005126953125, 614.4248657226562, 632.94921875, 651.4735717773438, 669.9979248046875, 688.522216796875, 707.0465698242188, 725.5709228515625, 744.09521484375, 762.6195678710938, 781.1439208984375, 799.6682739257812, 818.192626953125, 836.7169189453125, 855.2412719726562, 873.765625, 892.2899169921875, 910.8142700195312, 929.338623046875]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 10.0, 9.0, 14.0, 23.0, 23.0, 33.0, 42.0, 60.0, 68.0, 89.0, 145.0, 128.0, 96.0, 53.0, 58.0, 42.0, 30.0, 27.0, 21.0, 21.0, 10.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-303.801025390625, -294.5783996582031, -285.35577392578125, -276.1331787109375, -266.9105529785156, -257.68792724609375, -248.46530151367188, -239.24269104003906, -230.02008056640625, -220.79745483398438, -211.57484436035156, -202.3522186279297, -193.12960815429688, -183.906982421875, -174.68435668945312, -165.4617462158203, -156.23912048339844, -147.01649475097656, -137.79388427734375, -128.57125854492188, -119.34864807128906, -110.12602233886719, -100.90340423583984, -91.6807861328125, -82.45816802978516, -73.23554992675781, -64.01293182373047, -54.79030990600586, -45.567691802978516, -36.34507369995117, -27.122451782226562, -17.89983367919922, -8.677215576171875, 0.5454034805297852, 9.768022537231445, 18.990642547607422, 28.213260650634766, 37.43587875366211, 46.65850067138672, 55.88111877441406, 65.1037368774414, 74.32635498046875, 83.5489730834961, 92.77159118652344, 101.99421691894531, 111.21682739257812, 120.439453125, 129.66207885742188, 138.8846893310547, 148.10731506347656, 157.32992553710938, 166.55255126953125, 175.77516174316406, 184.99778747558594, 194.22039794921875, 203.44302368164062, 212.6656494140625, 221.88827514648438, 231.1108856201172, 240.33351135253906, 249.55612182617188, 258.77874755859375, 268.0013732910156, 277.2239990234375, 286.44659423828125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 9.0, 10.0, 7.0, 9.0, 18.0, 32.0, 57.0, 96.0, 191.0, 417.0, 1279.0, 4547.0, 31246.0, 2951255.0, 1181699.0, 19382.0, 2842.0, 661.0, 232.0, 81.0, 52.0, 36.0, 25.0, 20.0, 14.0, 14.0, 14.0, 6.0, 6.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.03125, -24.8427734375, -23.654296875, -22.4658203125, -21.27734375, -20.0888671875, -18.900390625, -17.7119140625, -16.5234375, -15.3349609375, -14.146484375, -12.9580078125, -11.76953125, -10.5810546875, -9.392578125, -8.2041015625, -7.015625, -5.8271484375, -4.638671875, -3.4501953125, -2.26171875, -1.0732421875, 0.115234375, 1.3037109375, 2.4921875, 3.6806640625, 4.869140625, 6.0576171875, 7.24609375, 8.4345703125, 9.623046875, 10.8115234375, 12.0, 13.1884765625, 14.376953125, 15.5654296875, 16.75390625, 17.9423828125, 19.130859375, 20.3193359375, 21.5078125, 22.6962890625, 23.884765625, 25.0732421875, 26.26171875, 27.4501953125, 28.638671875, 29.8271484375, 31.015625, 32.2041015625, 33.392578125, 34.5810546875, 35.76953125, 36.9580078125, 38.146484375, 39.3349609375, 40.5234375, 41.7119140625, 42.900390625, 44.0888671875, 45.27734375, 46.4658203125, 47.654296875, 48.8427734375, 50.03125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 4.0, 8.0, 15.0, 8.0, 32.0, 22.0, 33.0, 34.0, 49.0, 56.0, 57.0, 72.0, 68.0, 85.0, 73.0, 75.0, 54.0, 47.0, 46.0, 51.0, 26.0, 16.0, 17.0, 13.0, 7.0, 8.0, 4.0, 4.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1953125, -8.7979736328125, -8.400634765625, -8.0032958984375, -7.60595703125, -7.2086181640625, -6.811279296875, -6.4139404296875, -6.0166015625, -5.6192626953125, -5.221923828125, -4.8245849609375, -4.42724609375, -4.0299072265625, -3.632568359375, -3.2352294921875, -2.837890625, -2.4405517578125, -2.043212890625, -1.6458740234375, -1.24853515625, -0.8511962890625, -0.453857421875, -0.0565185546875, 0.3408203125, 0.7381591796875, 1.135498046875, 1.5328369140625, 1.93017578125, 2.3275146484375, 2.724853515625, 3.1221923828125, 3.51953125, 3.9168701171875, 4.314208984375, 4.7115478515625, 5.10888671875, 5.5062255859375, 5.903564453125, 6.3009033203125, 6.6982421875, 7.0955810546875, 7.492919921875, 7.8902587890625, 8.28759765625, 8.6849365234375, 9.082275390625, 9.4796142578125, 9.876953125, 10.2742919921875, 10.671630859375, 11.0689697265625, 11.46630859375, 11.8636474609375, 12.260986328125, 12.6583251953125, 13.0556640625, 13.4530029296875, 13.850341796875, 14.2476806640625, 14.64501953125, 15.0423583984375, 15.439697265625, 15.8370361328125, 16.234375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 13.0, 13.0, 15.0, 21.0, 29.0, 62.0, 101.0, 261.0, 728.0, 2362.0, 15313.0, 560408.0, 3569501.0, 39132.0, 4462.0, 1094.0, 400.0, 160.0, 84.0, 38.0, 35.0, 11.0, 9.0, 4.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.3125, -40.91064453125, -39.5087890625, -38.10693359375, -36.705078125, -35.30322265625, -33.9013671875, -32.49951171875, -31.09765625, -29.69580078125, -28.2939453125, -26.89208984375, -25.490234375, -24.08837890625, -22.6865234375, -21.28466796875, -19.8828125, -18.48095703125, -17.0791015625, -15.67724609375, -14.275390625, -12.87353515625, -11.4716796875, -10.06982421875, -8.66796875, -7.26611328125, -5.8642578125, -4.46240234375, -3.060546875, -1.65869140625, -0.2568359375, 1.14501953125, 2.546875, 3.94873046875, 5.3505859375, 6.75244140625, 8.154296875, 9.55615234375, 10.9580078125, 12.35986328125, 13.76171875, 15.16357421875, 16.5654296875, 17.96728515625, 19.369140625, 20.77099609375, 22.1728515625, 23.57470703125, 24.9765625, 26.37841796875, 27.7802734375, 29.18212890625, 30.583984375, 31.98583984375, 33.3876953125, 34.78955078125, 36.19140625, 37.59326171875, 38.9951171875, 40.39697265625, 41.798828125, 43.20068359375, 44.6025390625, 46.00439453125, 47.40625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 5.0, 11.0, 9.0, 23.0, 30.0, 43.0, 98.0, 150.0, 330.0, 637.0, 1069.0, 782.0, 406.0, 187.0, 105.0, 71.0, 33.0, 27.0, 18.0, 12.0, 6.0, 7.0, 5.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.546875, -29.640625, -28.734375, -27.828125, -26.921875, -26.015625, -25.109375, -24.203125, -23.296875, -22.390625, -21.484375, -20.578125, -19.671875, -18.765625, -17.859375, -16.953125, -16.046875, -15.140625, -14.234375, -13.328125, -12.421875, -11.515625, -10.609375, -9.703125, -8.796875, -7.890625, -6.984375, -6.078125, -5.171875, -4.265625, -3.359375, -2.453125, -1.546875, -0.640625, 0.265625, 1.171875, 2.078125, 2.984375, 3.890625, 4.796875, 5.703125, 6.609375, 7.515625, 8.421875, 9.328125, 10.234375, 11.140625, 12.046875, 12.953125, 13.859375, 14.765625, 15.671875, 16.578125, 17.484375, 18.390625, 19.296875, 20.203125, 21.109375, 22.015625, 22.921875, 23.828125, 24.734375, 25.640625, 26.546875, 27.453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 10.0, 14.0, 24.0, 50.0, 99.0, 135.0, 175.0, 171.0, 108.0, 100.0, 48.0, 31.0, 13.0, 13.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.69384002685547, -91.04043579101562, -84.38702392578125, -77.7336196899414, -71.08020782470703, -64.42680358886719, -57.77339553833008, -51.11998748779297, -44.46657943725586, -37.81317138671875, -31.15976333618164, -24.506357192993164, -17.852949142456055, -11.199542999267578, -4.546134948730469, 2.1072731018066406, 8.76068115234375, 15.41408920288086, 22.06749725341797, 28.720903396606445, 35.37431335449219, 42.02771759033203, 48.68112564086914, 55.33453369140625, 61.98794174194336, 68.64134979248047, 75.29475402832031, 81.94816589355469, 88.60157012939453, 95.25497436523438, 101.90838623046875, 108.56179809570312, 115.21519470214844, 121.86859893798828, 128.52200317382812, 135.1754150390625, 141.82882690429688, 148.48223876953125, 155.13563537597656, 161.78904724121094, 168.4424591064453, 175.0958709716797, 181.749267578125, 188.40267944335938, 195.05609130859375, 201.70950317382812, 208.36289978027344, 215.0163116455078, 221.66970825195312, 228.3231201171875, 234.9765167236328, 241.6299285888672, 248.28334045410156, 254.93673706054688, 261.59014892578125, 268.2435607910156, 274.89697265625, 281.5503845214844, 288.20379638671875, 294.8572082519531, 301.5105895996094, 308.16400146484375, 314.8174133300781, 321.4708251953125, 328.1242370605469]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 3.0, 5.0, 11.0, 7.0, 10.0, 12.0, 19.0, 11.0, 20.0, 27.0, 22.0, 26.0, 35.0, 30.0, 48.0, 53.0, 46.0, 51.0, 52.0, 51.0, 50.0, 54.0, 52.0, 47.0, 36.0, 30.0, 40.0, 33.0, 21.0, 18.0, 21.0, 11.0, 10.0, 10.0, 11.0, 3.0, 3.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-93.21646118164062, -90.42561340332031, -87.63475799560547, -84.84391021728516, -82.05305480957031, -79.26220703125, -76.47135162353516, -73.68050384521484, -70.8896484375, -68.09880065917969, -65.30794525146484, -62.517093658447266, -59.72624206542969, -56.93539047241211, -54.14453887939453, -51.35369110107422, -48.56283950805664, -45.77198791503906, -42.981136322021484, -40.190284729003906, -37.39943313598633, -34.60858154296875, -31.817731857299805, -29.026880264282227, -26.23602867126465, -23.44517707824707, -20.654325485229492, -17.863475799560547, -15.072623252868652, -12.281771659851074, -9.490921020507812, -6.700069427490234, -3.9092178344726562, -1.1183664798736572, 1.6724848747253418, 4.463335990905762, 7.25418758392334, 10.045039176940918, 12.83588981628418, 15.626741409301758, 18.417593002319336, 21.208444595336914, 23.999296188354492, 26.790145874023438, 29.580997467041016, 32.371849060058594, 35.16270065307617, 37.95355224609375, 40.74440383911133, 43.535255432128906, 46.326107025146484, 49.11695861816406, 51.90781021118164, 54.69866180419922, 57.48950958251953, 60.280364990234375, 63.07121276855469, 65.862060546875, 68.65291595458984, 71.44376373291016, 74.234619140625, 77.02546691894531, 79.81632232666016, 82.60717010498047, 85.39802551269531]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 10.0, 12.0, 18.0, 34.0, 40.0, 79.0, 121.0, 203.0, 396.0, 878.0, 2528.0, 9452.0, 55510.0, 521506.0, 403255.0, 43010.0, 7736.0, 2103.0, 817.0, 354.0, 200.0, 106.0, 75.0, 37.0, 23.0, 8.0, 8.0, 7.0, 8.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.765625, -25.927490234375, -25.08935546875, -24.251220703125, -23.4130859375, -22.574951171875, -21.73681640625, -20.898681640625, -20.060546875, -19.222412109375, -18.38427734375, -17.546142578125, -16.7080078125, -15.869873046875, -15.03173828125, -14.193603515625, -13.35546875, -12.517333984375, -11.67919921875, -10.841064453125, -10.0029296875, -9.164794921875, -8.32666015625, -7.488525390625, -6.650390625, -5.812255859375, -4.97412109375, -4.135986328125, -3.2978515625, -2.459716796875, -1.62158203125, -0.783447265625, 0.0546875, 0.892822265625, 1.73095703125, 2.569091796875, 3.4072265625, 4.245361328125, 5.08349609375, 5.921630859375, 6.759765625, 7.597900390625, 8.43603515625, 9.274169921875, 10.1123046875, 10.950439453125, 11.78857421875, 12.626708984375, 13.46484375, 14.302978515625, 15.14111328125, 15.979248046875, 16.8173828125, 17.655517578125, 18.49365234375, 19.331787109375, 20.169921875, 21.008056640625, 21.84619140625, 22.684326171875, 23.5224609375, 24.360595703125, 25.19873046875, 26.036865234375, 26.875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 9.0, 11.0, 16.0, 12.0, 20.0, 24.0, 32.0, 46.0, 55.0, 63.0, 80.0, 75.0, 79.0, 68.0, 67.0, 72.0, 53.0, 47.0, 44.0, 29.0, 22.0, 24.0, 18.0, 11.0, 5.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.0234375, -11.5731201171875, -11.122802734375, -10.6724853515625, -10.22216796875, -9.7718505859375, -9.321533203125, -8.8712158203125, -8.4208984375, -7.9705810546875, -7.520263671875, -7.0699462890625, -6.61962890625, -6.1693115234375, -5.718994140625, -5.2686767578125, -4.818359375, -4.3680419921875, -3.917724609375, -3.4674072265625, -3.01708984375, -2.5667724609375, -2.116455078125, -1.6661376953125, -1.2158203125, -0.7655029296875, -0.315185546875, 0.1351318359375, 0.58544921875, 1.0357666015625, 1.486083984375, 1.9364013671875, 2.38671875, 2.8370361328125, 3.287353515625, 3.7376708984375, 4.18798828125, 4.6383056640625, 5.088623046875, 5.5389404296875, 5.9892578125, 6.4395751953125, 6.889892578125, 7.3402099609375, 7.79052734375, 8.2408447265625, 8.691162109375, 9.1414794921875, 9.591796875, 10.0421142578125, 10.492431640625, 10.9427490234375, 11.39306640625, 11.8433837890625, 12.293701171875, 12.7440185546875, 13.1943359375, 13.6446533203125, 14.094970703125, 14.5452880859375, 14.99560546875, 15.4459228515625, 15.896240234375, 16.3465576171875, 16.796875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 9.0, 18.0, 19.0, 40.0, 58.0, 102.0, 158.0, 277.0, 549.0, 1251.0, 3647.0, 14277.0, 93157.0, 778296.0, 131268.0, 18332.0, 4263.0, 1387.0, 610.0, 314.0, 193.0, 122.0, 74.0, 36.0, 30.0, 13.0, 12.0, 8.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-32.21875, -31.286865234375, -30.35498046875, -29.423095703125, -28.4912109375, -27.559326171875, -26.62744140625, -25.695556640625, -24.763671875, -23.831787109375, -22.89990234375, -21.968017578125, -21.0361328125, -20.104248046875, -19.17236328125, -18.240478515625, -17.30859375, -16.376708984375, -15.44482421875, -14.512939453125, -13.5810546875, -12.649169921875, -11.71728515625, -10.785400390625, -9.853515625, -8.921630859375, -7.98974609375, -7.057861328125, -6.1259765625, -5.194091796875, -4.26220703125, -3.330322265625, -2.3984375, -1.466552734375, -0.53466796875, 0.397216796875, 1.3291015625, 2.260986328125, 3.19287109375, 4.124755859375, 5.056640625, 5.988525390625, 6.92041015625, 7.852294921875, 8.7841796875, 9.716064453125, 10.64794921875, 11.579833984375, 12.51171875, 13.443603515625, 14.37548828125, 15.307373046875, 16.2392578125, 17.171142578125, 18.10302734375, 19.034912109375, 19.966796875, 20.898681640625, 21.83056640625, 22.762451171875, 23.6943359375, 24.626220703125, 25.55810546875, 26.489990234375, 27.421875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 7.0, 8.0, 15.0, 11.0, 8.0, 8.0, 10.0, 9.0, 16.0, 32.0, 28.0, 30.0, 36.0, 45.0, 38.0, 47.0, 44.0, 40.0, 53.0, 55.0, 54.0, 52.0, 54.0, 43.0, 36.0, 36.0, 30.0, 24.0, 27.0, 24.0, 9.0, 15.0, 7.0, 13.0, 7.0, 4.0, 1.0, 6.0, 4.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.65625, -38.36181640625, -37.0673828125, -35.77294921875, -34.478515625, -33.18408203125, -31.8896484375, -30.59521484375, -29.30078125, -28.00634765625, -26.7119140625, -25.41748046875, -24.123046875, -22.82861328125, -21.5341796875, -20.23974609375, -18.9453125, -17.65087890625, -16.3564453125, -15.06201171875, -13.767578125, -12.47314453125, -11.1787109375, -9.88427734375, -8.58984375, -7.29541015625, -6.0009765625, -4.70654296875, -3.412109375, -2.11767578125, -0.8232421875, 0.47119140625, 1.765625, 3.06005859375, 4.3544921875, 5.64892578125, 6.943359375, 8.23779296875, 9.5322265625, 10.82666015625, 12.12109375, 13.41552734375, 14.7099609375, 16.00439453125, 17.298828125, 18.59326171875, 19.8876953125, 21.18212890625, 22.4765625, 23.77099609375, 25.0654296875, 26.35986328125, 27.654296875, 28.94873046875, 30.2431640625, 31.53759765625, 32.83203125, 34.12646484375, 35.4208984375, 36.71533203125, 38.009765625, 39.30419921875, 40.5986328125, 41.89306640625, 43.1875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 9.0, 12.0, 16.0, 22.0, 30.0, 33.0, 44.0, 68.0, 119.0, 207.0, 406.0, 759.0, 1730.0, 4103.0, 11456.0, 39091.0, 246939.0, 660375.0, 58147.0, 15368.0, 5313.0, 2155.0, 960.0, 532.0, 230.0, 141.0, 75.0, 51.0, 48.0, 19.0, 19.0, 19.0, 13.0, 7.0, 8.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.857177734375, -8.58154296875, -8.305908203125, -8.0302734375, -7.754638671875, -7.47900390625, -7.203369140625, -6.927734375, -6.652099609375, -6.37646484375, -6.100830078125, -5.8251953125, -5.549560546875, -5.27392578125, -4.998291015625, -4.72265625, -4.447021484375, -4.17138671875, -3.895751953125, -3.6201171875, -3.344482421875, -3.06884765625, -2.793212890625, -2.517578125, -2.241943359375, -1.96630859375, -1.690673828125, -1.4150390625, -1.139404296875, -0.86376953125, -0.588134765625, -0.3125, -0.036865234375, 0.23876953125, 0.514404296875, 0.7900390625, 1.065673828125, 1.34130859375, 1.616943359375, 1.892578125, 2.168212890625, 2.44384765625, 2.719482421875, 2.9951171875, 3.270751953125, 3.54638671875, 3.822021484375, 4.09765625, 4.373291015625, 4.64892578125, 4.924560546875, 5.2001953125, 5.475830078125, 5.75146484375, 6.027099609375, 6.302734375, 6.578369140625, 6.85400390625, 7.129638671875, 7.4052734375, 7.680908203125, 7.95654296875, 8.232177734375, 8.5078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 8.0, 5.0, 12.0, 15.0, 32.0, 25.0, 41.0, 51.0, 104.0, 148.0, 148.0, 106.0, 78.0, 50.0, 26.0, 32.0, 22.0, 21.0, 9.0, 8.0, 7.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0025348663330078125, -0.0024645626544952393, -0.002394258975982666, -0.0023239552974700928, -0.0022536516189575195, -0.0021833479404449463, -0.002113044261932373, -0.0020427405834198, -0.0019724369049072266, -0.0019021332263946533, -0.00183182954788208, -0.0017615258693695068, -0.0016912221908569336, -0.0016209185123443604, -0.0015506148338317871, -0.0014803111553192139, -0.0014100074768066406, -0.0013397037982940674, -0.0012694001197814941, -0.001199096441268921, -0.0011287927627563477, -0.0010584890842437744, -0.0009881854057312012, -0.0009178817272186279, -0.0008475780487060547, -0.0007772743701934814, -0.0007069706916809082, -0.000636667013168335, -0.0005663633346557617, -0.0004960596561431885, -0.00042575597763061523, -0.000355452299118042, -0.00028514862060546875, -0.0002148449420928955, -0.00014454126358032227, -7.423758506774902e-05, -3.933906555175781e-06, 6.636977195739746e-05, 0.0001366734504699707, 0.00020697712898254395, 0.0002772808074951172, 0.00034758448600769043, 0.00041788816452026367, 0.0004881918430328369, 0.0005584955215454102, 0.0006287992000579834, 0.0006991028785705566, 0.0007694065570831299, 0.0008397102355957031, 0.0009100139141082764, 0.0009803175926208496, 0.0010506212711334229, 0.001120924949645996, 0.0011912286281585693, 0.0012615323066711426, 0.0013318359851837158, 0.001402139663696289, 0.0014724433422088623, 0.0015427470207214355, 0.0016130506992340088, 0.001683354377746582, 0.0017536580562591553, 0.0018239617347717285, 0.0018942654132843018, 0.001964569091796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 2.0, 14.0, 19.0, 29.0, 51.0, 74.0, 117.0, 221.0, 350.0, 645.0, 1284.0, 2916.0, 7545.0, 25476.0, 134086.0, 757381.0, 88060.0, 19259.0, 6127.0, 2407.0, 1093.0, 556.0, 314.0, 192.0, 125.0, 75.0, 34.0, 34.0, 19.0, 12.0, 7.0, 3.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-9.765625, -9.4443359375, -9.123046875, -8.8017578125, -8.48046875, -8.1591796875, -7.837890625, -7.5166015625, -7.1953125, -6.8740234375, -6.552734375, -6.2314453125, -5.91015625, -5.5888671875, -5.267578125, -4.9462890625, -4.625, -4.3037109375, -3.982421875, -3.6611328125, -3.33984375, -3.0185546875, -2.697265625, -2.3759765625, -2.0546875, -1.7333984375, -1.412109375, -1.0908203125, -0.76953125, -0.4482421875, -0.126953125, 0.1943359375, 0.515625, 0.8369140625, 1.158203125, 1.4794921875, 1.80078125, 2.1220703125, 2.443359375, 2.7646484375, 3.0859375, 3.4072265625, 3.728515625, 4.0498046875, 4.37109375, 4.6923828125, 5.013671875, 5.3349609375, 5.65625, 5.9775390625, 6.298828125, 6.6201171875, 6.94140625, 7.2626953125, 7.583984375, 7.9052734375, 8.2265625, 8.5478515625, 8.869140625, 9.1904296875, 9.51171875, 9.8330078125, 10.154296875, 10.4755859375, 10.796875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 3.0, 6.0, 11.0, 27.0, 16.0, 25.0, 30.0, 50.0, 79.0, 151.0, 190.0, 167.0, 60.0, 50.0, 28.0, 31.0, 19.0, 11.0, 15.0, 12.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.90625, -15.50341796875, -15.1005859375, -14.69775390625, -14.294921875, -13.89208984375, -13.4892578125, -13.08642578125, -12.68359375, -12.28076171875, -11.8779296875, -11.47509765625, -11.072265625, -10.66943359375, -10.2666015625, -9.86376953125, -9.4609375, -9.05810546875, -8.6552734375, -8.25244140625, -7.849609375, -7.44677734375, -7.0439453125, -6.64111328125, -6.23828125, -5.83544921875, -5.4326171875, -5.02978515625, -4.626953125, -4.22412109375, -3.8212890625, -3.41845703125, -3.015625, -2.61279296875, -2.2099609375, -1.80712890625, -1.404296875, -1.00146484375, -0.5986328125, -0.19580078125, 0.20703125, 0.60986328125, 1.0126953125, 1.41552734375, 1.818359375, 2.22119140625, 2.6240234375, 3.02685546875, 3.4296875, 3.83251953125, 4.2353515625, 4.63818359375, 5.041015625, 5.44384765625, 5.8466796875, 6.24951171875, 6.65234375, 7.05517578125, 7.4580078125, 7.86083984375, 8.263671875, 8.66650390625, 9.0693359375, 9.47216796875, 9.875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 18.0, 53.0, 243.0, 498.0, 133.0, 24.0, 12.0, 11.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-339.7746276855469, -324.47076416015625, -309.1669006347656, -293.863037109375, -278.5591735839844, -263.25531005859375, -247.95144653320312, -232.6475830078125, -217.34371948242188, -202.03985595703125, -186.73599243164062, -171.43212890625, -156.12826538085938, -140.82440185546875, -125.52053833007812, -110.2166748046875, -94.91281127929688, -79.60894775390625, -64.30508422851562, -49.001220703125, -33.697357177734375, -18.39349365234375, -3.089630126953125, 12.2142333984375, 27.518096923828125, 42.82196044921875, 58.125823974609375, 73.4296875, 88.73355102539062, 104.03741455078125, 119.34127807617188, 134.6451416015625, 149.948974609375, 165.25283813476562, 180.55670166015625, 195.86056518554688, 211.1644287109375, 226.46829223632812, 241.77215576171875, 257.0760192871094, 272.3798828125, 287.6837463378906, 302.98760986328125, 318.2914733886719, 333.5953369140625, 348.8992004394531, 364.20306396484375, 379.5069274902344, 394.810791015625, 410.1146545410156, 425.41851806640625, 440.7223815917969, 456.0262451171875, 471.3301086425781, 486.63397216796875, 501.9378356933594, 517.24169921875, 532.5455322265625, 547.8494262695312, 563.1533203125, 578.4571533203125, 593.760986328125, 609.0648803710938, 624.3687744140625, 639.672607421875]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 3.0, 8.0, 4.0, 9.0, 12.0, 9.0, 8.0, 21.0, 13.0, 20.0, 10.0, 27.0, 29.0, 31.0, 37.0, 37.0, 56.0, 75.0, 92.0, 100.0, 72.0, 52.0, 38.0, 32.0, 25.0, 28.0, 29.0, 12.0, 18.0, 19.0, 12.0, 6.0, 11.0, 12.0, 8.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-178.70608520507812, -172.8904266357422, -167.07476806640625, -161.25912475585938, -155.44346618652344, -149.6278076171875, -143.81214904785156, -137.99649047851562, -132.18084716796875, -126.36518859863281, -120.5495376586914, -114.73387908935547, -108.91822814941406, -103.10256958007812, -97.28691101074219, -91.47125244140625, -85.65559387207031, -79.83993530273438, -74.02428436279297, -68.20862579345703, -62.39297103881836, -56.57731628417969, -50.76165771484375, -44.94600296020508, -39.130348205566406, -33.314693450927734, -27.49903678894043, -21.683380126953125, -15.867725372314453, -10.052070617675781, -4.236412048339844, 1.5792427062988281, 7.3948974609375, 13.210553169250488, 19.026208877563477, 24.84186553955078, 30.657520294189453, 36.473175048828125, 42.28883361816406, 48.104488372802734, 53.920143127441406, 59.73579788208008, 65.55145263671875, 71.36711120605469, 77.18276977539062, 82.99842071533203, 88.81407928466797, 94.62973022460938, 100.44538879394531, 106.26104736328125, 112.07669830322266, 117.8923568725586, 123.7080078125, 129.52366638183594, 135.33932495117188, 141.1549835205078, 146.97064208984375, 152.7863006591797, 158.60195922851562, 164.4176025390625, 170.23326110839844, 176.04891967773438, 181.8645782470703, 187.68023681640625, 193.49588012695312]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 8.0, 4.0, 8.0, 13.0, 21.0, 35.0, 33.0, 71.0, 179.0, 438.0, 1294.0, 4439.0, 24483.0, 838811.0, 3240212.0, 73649.0, 7989.0, 1750.0, 446.0, 161.0, 65.0, 40.0, 44.0, 22.0, 18.0, 14.0, 8.0, 7.0, 6.0, 2.0, 2.0, 2.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.421875, -23.524169921875, -22.62646484375, -21.728759765625, -20.8310546875, -19.933349609375, -19.03564453125, -18.137939453125, -17.240234375, -16.342529296875, -15.44482421875, -14.547119140625, -13.6494140625, -12.751708984375, -11.85400390625, -10.956298828125, -10.05859375, -9.160888671875, -8.26318359375, -7.365478515625, -6.4677734375, -5.570068359375, -4.67236328125, -3.774658203125, -2.876953125, -1.979248046875, -1.08154296875, -0.183837890625, 0.7138671875, 1.611572265625, 2.50927734375, 3.406982421875, 4.3046875, 5.202392578125, 6.10009765625, 6.997802734375, 7.8955078125, 8.793212890625, 9.69091796875, 10.588623046875, 11.486328125, 12.384033203125, 13.28173828125, 14.179443359375, 15.0771484375, 15.974853515625, 16.87255859375, 17.770263671875, 18.66796875, 19.565673828125, 20.46337890625, 21.361083984375, 22.2587890625, 23.156494140625, 24.05419921875, 24.951904296875, 25.849609375, 26.747314453125, 27.64501953125, 28.542724609375, 29.4404296875, 30.338134765625, 31.23583984375, 32.133544921875, 33.03125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 11.0, 16.0, 17.0, 17.0, 31.0, 34.0, 45.0, 51.0, 74.0, 83.0, 80.0, 71.0, 64.0, 74.0, 68.0, 56.0, 40.0, 38.0, 33.0, 26.0, 17.0, 20.0, 6.0, 8.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.75, -14.3111572265625, -13.872314453125, -13.4334716796875, -12.99462890625, -12.5557861328125, -12.116943359375, -11.6781005859375, -11.2392578125, -10.8004150390625, -10.361572265625, -9.9227294921875, -9.48388671875, -9.0450439453125, -8.606201171875, -8.1673583984375, -7.728515625, -7.2896728515625, -6.850830078125, -6.4119873046875, -5.97314453125, -5.5343017578125, -5.095458984375, -4.6566162109375, -4.2177734375, -3.7789306640625, -3.340087890625, -2.9012451171875, -2.46240234375, -2.0235595703125, -1.584716796875, -1.1458740234375, -0.70703125, -0.2681884765625, 0.170654296875, 0.6094970703125, 1.04833984375, 1.4871826171875, 1.926025390625, 2.3648681640625, 2.8037109375, 3.2425537109375, 3.681396484375, 4.1202392578125, 4.55908203125, 4.9979248046875, 5.436767578125, 5.8756103515625, 6.314453125, 6.7532958984375, 7.192138671875, 7.6309814453125, 8.06982421875, 8.5086669921875, 8.947509765625, 9.3863525390625, 9.8251953125, 10.2640380859375, 10.702880859375, 11.1417236328125, 11.58056640625, 12.0194091796875, 12.458251953125, 12.8970947265625, 13.3359375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 13.0, 13.0, 27.0, 33.0, 60.0, 153.0, 353.0, 1038.0, 5427.0, 114164.0, 3999357.0, 67859.0, 4263.0, 891.0, 294.0, 137.0, 86.0, 47.0, 19.0, 20.0, 10.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.90625, -45.365234375, -43.82421875, -42.283203125, -40.7421875, -39.201171875, -37.66015625, -36.119140625, -34.578125, -33.037109375, -31.49609375, -29.955078125, -28.4140625, -26.873046875, -25.33203125, -23.791015625, -22.25, -20.708984375, -19.16796875, -17.626953125, -16.0859375, -14.544921875, -13.00390625, -11.462890625, -9.921875, -8.380859375, -6.83984375, -5.298828125, -3.7578125, -2.216796875, -0.67578125, 0.865234375, 2.40625, 3.947265625, 5.48828125, 7.029296875, 8.5703125, 10.111328125, 11.65234375, 13.193359375, 14.734375, 16.275390625, 17.81640625, 19.357421875, 20.8984375, 22.439453125, 23.98046875, 25.521484375, 27.0625, 28.603515625, 30.14453125, 31.685546875, 33.2265625, 34.767578125, 36.30859375, 37.849609375, 39.390625, 40.931640625, 42.47265625, 44.013671875, 45.5546875, 47.095703125, 48.63671875, 50.177734375, 51.71875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 4.0, 13.0, 20.0, 26.0, 33.0, 44.0, 70.0, 127.0, 209.0, 420.0, 745.0, 883.0, 625.0, 361.0, 212.0, 101.0, 64.0, 30.0, 29.0, 15.0, 7.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.4375, -20.623291015625, -19.80908203125, -18.994873046875, -18.1806640625, -17.366455078125, -16.55224609375, -15.738037109375, -14.923828125, -14.109619140625, -13.29541015625, -12.481201171875, -11.6669921875, -10.852783203125, -10.03857421875, -9.224365234375, -8.41015625, -7.595947265625, -6.78173828125, -5.967529296875, -5.1533203125, -4.339111328125, -3.52490234375, -2.710693359375, -1.896484375, -1.082275390625, -0.26806640625, 0.546142578125, 1.3603515625, 2.174560546875, 2.98876953125, 3.802978515625, 4.6171875, 5.431396484375, 6.24560546875, 7.059814453125, 7.8740234375, 8.688232421875, 9.50244140625, 10.316650390625, 11.130859375, 11.945068359375, 12.75927734375, 13.573486328125, 14.3876953125, 15.201904296875, 16.01611328125, 16.830322265625, 17.64453125, 18.458740234375, 19.27294921875, 20.087158203125, 20.9013671875, 21.715576171875, 22.52978515625, 23.343994140625, 24.158203125, 24.972412109375, 25.78662109375, 26.600830078125, 27.4150390625, 28.229248046875, 29.04345703125, 29.857666015625, 30.671875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 8.0, 12.0, 16.0, 39.0, 67.0, 104.0, 141.0, 160.0, 161.0, 94.0, 91.0, 44.0, 23.0, 14.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-137.1199951171875, -131.57003784179688, -126.02008819580078, -120.47013854980469, -114.92018127441406, -109.37023162841797, -103.82028198242188, -98.27032470703125, -92.72036743164062, -87.17041778564453, -81.6204605102539, -76.07051086425781, -70.52055358886719, -64.9706039428711, -59.420650482177734, -53.870697021484375, -48.32074737548828, -42.77079391479492, -37.22084045410156, -31.670888900756836, -26.120935440063477, -20.570981979370117, -15.02103042602539, -9.471076965332031, -3.921123504638672, 1.6288294792175293, 7.1787824630737305, 12.728734970092773, 18.278688430786133, 23.828641891479492, 29.37859344482422, 34.92854690551758, 40.47850036621094, 46.0284538269043, 51.578407287597656, 57.12835693359375, 62.678314208984375, 68.22826385498047, 73.77821350097656, 79.32817077636719, 84.87812805175781, 90.4280776977539, 95.97803497314453, 101.52798461914062, 107.07794189453125, 112.62789154052734, 118.17784118652344, 123.72779846191406, 129.27774047851562, 134.82769775390625, 140.3776397705078, 145.92759704589844, 151.47755432128906, 157.0275115966797, 162.57745361328125, 168.12741088867188, 173.6773681640625, 179.22732543945312, 184.7772674560547, 190.3272247314453, 195.87718200683594, 201.42713928222656, 206.97708129882812, 212.52703857421875, 218.07699584960938]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 15.0, 12.0, 20.0, 20.0, 26.0, 24.0, 30.0, 39.0, 38.0, 65.0, 63.0, 48.0, 64.0, 53.0, 63.0, 53.0, 56.0, 44.0, 42.0, 43.0, 39.0, 23.0, 21.0, 14.0, 16.0, 10.0, 10.0, 15.0, 5.0, 8.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.61149597167969, -110.34532165527344, -107.07914733886719, -103.81297302246094, -100.54679870605469, -97.28062438964844, -94.01445007324219, -90.74827575683594, -87.48210144042969, -84.21592712402344, -80.94975280761719, -77.68357849121094, -74.41740417480469, -71.15122985839844, -67.88505554199219, -64.61888122558594, -61.352699279785156, -58.086524963378906, -54.820350646972656, -51.554176330566406, -48.288002014160156, -45.021827697753906, -41.75564956665039, -38.48947525024414, -35.22330093383789, -31.95712661743164, -28.69095230102539, -25.424776077270508, -22.158601760864258, -18.892427444458008, -15.626251220703125, -12.360076904296875, -9.093910217285156, -5.827735424041748, -2.56156063079834, 0.7046146392822266, 3.9707889556884766, 7.236963272094727, 10.50313949584961, 13.76931381225586, 17.03548812866211, 20.30166244506836, 23.56783676147461, 26.834012985229492, 30.100187301635742, 33.366363525390625, 36.632537841796875, 39.898712158203125, 43.164886474609375, 46.431060791015625, 49.697235107421875, 52.963409423828125, 56.229583740234375, 59.495758056640625, 62.76193618774414, 66.02810668945312, 69.29428100585938, 72.56045532226562, 75.82662963867188, 79.09280395507812, 82.35897827148438, 85.62515258789062, 88.89132690429688, 92.15750122070312, 95.4236831665039]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 8.0, 17.0, 14.0, 15.0, 40.0, 39.0, 69.0, 120.0, 179.0, 356.0, 804.0, 1836.0, 5163.0, 16270.0, 65178.0, 337753.0, 490173.0, 96204.0, 23137.0, 6836.0, 2291.0, 996.0, 435.0, 258.0, 134.0, 80.0, 39.0, 32.0, 22.0, 15.0, 10.0, 10.0, 5.0, 4.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.15625, -20.497802734375, -19.83935546875, -19.180908203125, -18.5224609375, -17.864013671875, -17.20556640625, -16.547119140625, -15.888671875, -15.230224609375, -14.57177734375, -13.913330078125, -13.2548828125, -12.596435546875, -11.93798828125, -11.279541015625, -10.62109375, -9.962646484375, -9.30419921875, -8.645751953125, -7.9873046875, -7.328857421875, -6.67041015625, -6.011962890625, -5.353515625, -4.695068359375, -4.03662109375, -3.378173828125, -2.7197265625, -2.061279296875, -1.40283203125, -0.744384765625, -0.0859375, 0.572509765625, 1.23095703125, 1.889404296875, 2.5478515625, 3.206298828125, 3.86474609375, 4.523193359375, 5.181640625, 5.840087890625, 6.49853515625, 7.156982421875, 7.8154296875, 8.473876953125, 9.13232421875, 9.790771484375, 10.44921875, 11.107666015625, 11.76611328125, 12.424560546875, 13.0830078125, 13.741455078125, 14.39990234375, 15.058349609375, 15.716796875, 16.375244140625, 17.03369140625, 17.692138671875, 18.3505859375, 19.009033203125, 19.66748046875, 20.325927734375, 20.984375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 9.0, 11.0, 24.0, 31.0, 25.0, 49.0, 54.0, 46.0, 55.0, 59.0, 79.0, 89.0, 73.0, 79.0, 66.0, 53.0, 49.0, 34.0, 36.0, 27.0, 17.0, 12.0, 9.0, 3.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.90625, -10.442138671875, -9.97802734375, -9.513916015625, -9.0498046875, -8.585693359375, -8.12158203125, -7.657470703125, -7.193359375, -6.729248046875, -6.26513671875, -5.801025390625, -5.3369140625, -4.872802734375, -4.40869140625, -3.944580078125, -3.48046875, -3.016357421875, -2.55224609375, -2.088134765625, -1.6240234375, -1.159912109375, -0.69580078125, -0.231689453125, 0.232421875, 0.696533203125, 1.16064453125, 1.624755859375, 2.0888671875, 2.552978515625, 3.01708984375, 3.481201171875, 3.9453125, 4.409423828125, 4.87353515625, 5.337646484375, 5.8017578125, 6.265869140625, 6.72998046875, 7.194091796875, 7.658203125, 8.122314453125, 8.58642578125, 9.050537109375, 9.5146484375, 9.978759765625, 10.44287109375, 10.906982421875, 11.37109375, 11.835205078125, 12.29931640625, 12.763427734375, 13.2275390625, 13.691650390625, 14.15576171875, 14.619873046875, 15.083984375, 15.548095703125, 16.01220703125, 16.476318359375, 16.9404296875, 17.404541015625, 17.86865234375, 18.332763671875, 18.796875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 7.0, 12.0, 18.0, 23.0, 33.0, 49.0, 88.0, 112.0, 200.0, 357.0, 739.0, 1593.0, 4715.0, 23590.0, 319944.0, 660047.0, 28420.0, 5208.0, 1681.0, 723.0, 410.0, 208.0, 113.0, 82.0, 57.0, 37.0, 19.0, 18.0, 8.0, 13.0, 8.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.46875, -40.349365234375, -39.22998046875, -38.110595703125, -36.9912109375, -35.871826171875, -34.75244140625, -33.633056640625, -32.513671875, -31.394287109375, -30.27490234375, -29.155517578125, -28.0361328125, -26.916748046875, -25.79736328125, -24.677978515625, -23.55859375, -22.439208984375, -21.31982421875, -20.200439453125, -19.0810546875, -17.961669921875, -16.84228515625, -15.722900390625, -14.603515625, -13.484130859375, -12.36474609375, -11.245361328125, -10.1259765625, -9.006591796875, -7.88720703125, -6.767822265625, -5.6484375, -4.529052734375, -3.40966796875, -2.290283203125, -1.1708984375, -0.051513671875, 1.06787109375, 2.187255859375, 3.306640625, 4.426025390625, 5.54541015625, 6.664794921875, 7.7841796875, 8.903564453125, 10.02294921875, 11.142333984375, 12.26171875, 13.381103515625, 14.50048828125, 15.619873046875, 16.7392578125, 17.858642578125, 18.97802734375, 20.097412109375, 21.216796875, 22.336181640625, 23.45556640625, 24.574951171875, 25.6943359375, 26.813720703125, 27.93310546875, 29.052490234375, 30.171875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 8.0, 17.0, 21.0, 21.0, 21.0, 55.0, 46.0, 73.0, 80.0, 99.0, 122.0, 90.0, 96.0, 65.0, 53.0, 42.0, 34.0, 22.0, 6.0, 8.0, 5.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.1875, -76.03369140625, -73.8798828125, -71.72607421875, -69.572265625, -67.41845703125, -65.2646484375, -63.11083984375, -60.95703125, -58.80322265625, -56.6494140625, -54.49560546875, -52.341796875, -50.18798828125, -48.0341796875, -45.88037109375, -43.7265625, -41.57275390625, -39.4189453125, -37.26513671875, -35.111328125, -32.95751953125, -30.8037109375, -28.64990234375, -26.49609375, -24.34228515625, -22.1884765625, -20.03466796875, -17.880859375, -15.72705078125, -13.5732421875, -11.41943359375, -9.265625, -7.11181640625, -4.9580078125, -2.80419921875, -0.650390625, 1.50341796875, 3.6572265625, 5.81103515625, 7.96484375, 10.11865234375, 12.2724609375, 14.42626953125, 16.580078125, 18.73388671875, 20.8876953125, 23.04150390625, 25.1953125, 27.34912109375, 29.5029296875, 31.65673828125, 33.810546875, 35.96435546875, 38.1181640625, 40.27197265625, 42.42578125, 44.57958984375, 46.7333984375, 48.88720703125, 51.041015625, 53.19482421875, 55.3486328125, 57.50244140625, 59.65625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 1.0, 5.0, 2.0, 7.0, 12.0, 12.0, 36.0, 43.0, 67.0, 133.0, 246.0, 548.0, 1609.0, 5696.0, 33119.0, 801009.0, 183635.0, 17015.0, 3532.0, 1045.0, 363.0, 195.0, 92.0, 60.0, 24.0, 14.0, 14.0, 7.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.78125, -18.191162109375, -17.60107421875, -17.010986328125, -16.4208984375, -15.830810546875, -15.24072265625, -14.650634765625, -14.060546875, -13.470458984375, -12.88037109375, -12.290283203125, -11.7001953125, -11.110107421875, -10.52001953125, -9.929931640625, -9.33984375, -8.749755859375, -8.15966796875, -7.569580078125, -6.9794921875, -6.389404296875, -5.79931640625, -5.209228515625, -4.619140625, -4.029052734375, -3.43896484375, -2.848876953125, -2.2587890625, -1.668701171875, -1.07861328125, -0.488525390625, 0.1015625, 0.691650390625, 1.28173828125, 1.871826171875, 2.4619140625, 3.052001953125, 3.64208984375, 4.232177734375, 4.822265625, 5.412353515625, 6.00244140625, 6.592529296875, 7.1826171875, 7.772705078125, 8.36279296875, 8.952880859375, 9.54296875, 10.133056640625, 10.72314453125, 11.313232421875, 11.9033203125, 12.493408203125, 13.08349609375, 13.673583984375, 14.263671875, 14.853759765625, 15.44384765625, 16.033935546875, 16.6240234375, 17.214111328125, 17.80419921875, 18.394287109375, 18.984375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 10.0, 9.0, 10.0, 21.0, 29.0, 45.0, 101.0, 175.0, 221.0, 138.0, 87.0, 37.0, 28.0, 20.0, 12.0, 10.0, 9.0, 7.0, 3.0, 6.0, 3.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004230499267578125, -0.004075527191162109, -0.003920555114746094, -0.003765583038330078, -0.0036106109619140625, -0.003455638885498047, -0.0033006668090820312, -0.0031456947326660156, -0.00299072265625, -0.0028357505798339844, -0.0026807785034179688, -0.002525806427001953, -0.0023708343505859375, -0.002215862274169922, -0.0020608901977539062, -0.0019059181213378906, -0.001750946044921875, -0.0015959739685058594, -0.0014410018920898438, -0.0012860298156738281, -0.0011310577392578125, -0.0009760856628417969, -0.0008211135864257812, -0.0006661415100097656, -0.00051116943359375, -0.0003561973571777344, -0.00020122528076171875, -4.6253204345703125e-05, 0.0001087188720703125, 0.0002636909484863281, 0.00041866302490234375, 0.0005736351013183594, 0.000728607177734375, 0.0008835792541503906, 0.0010385513305664062, 0.0011935234069824219, 0.0013484954833984375, 0.0015034675598144531, 0.0016584396362304688, 0.0018134117126464844, 0.0019683837890625, 0.0021233558654785156, 0.0022783279418945312, 0.002433300018310547, 0.0025882720947265625, 0.002743244171142578, 0.0028982162475585938, 0.0030531883239746094, 0.003208160400390625, 0.0033631324768066406, 0.0035181045532226562, 0.003673076629638672, 0.0038280487060546875, 0.003983020782470703, 0.004137992858886719, 0.004292964935302734, 0.00444793701171875, 0.004602909088134766, 0.004757881164550781, 0.004912853240966797, 0.0050678253173828125, 0.005222797393798828, 0.005377769470214844, 0.005532741546630859, 0.005687713623046875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 11.0, 9.0, 16.0, 28.0, 34.0, 69.0, 113.0, 224.0, 421.0, 990.0, 2774.0, 10157.0, 56963.0, 804121.0, 146354.0, 18847.0, 4607.0, 1543.0, 597.0, 278.0, 163.0, 82.0, 45.0, 29.0, 21.0, 12.0, 9.0, 4.0, 11.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5390625, -13.083251953125, -12.62744140625, -12.171630859375, -11.7158203125, -11.260009765625, -10.80419921875, -10.348388671875, -9.892578125, -9.436767578125, -8.98095703125, -8.525146484375, -8.0693359375, -7.613525390625, -7.15771484375, -6.701904296875, -6.24609375, -5.790283203125, -5.33447265625, -4.878662109375, -4.4228515625, -3.967041015625, -3.51123046875, -3.055419921875, -2.599609375, -2.143798828125, -1.68798828125, -1.232177734375, -0.7763671875, -0.320556640625, 0.13525390625, 0.591064453125, 1.046875, 1.502685546875, 1.95849609375, 2.414306640625, 2.8701171875, 3.325927734375, 3.78173828125, 4.237548828125, 4.693359375, 5.149169921875, 5.60498046875, 6.060791015625, 6.5166015625, 6.972412109375, 7.42822265625, 7.884033203125, 8.33984375, 8.795654296875, 9.25146484375, 9.707275390625, 10.1630859375, 10.618896484375, 11.07470703125, 11.530517578125, 11.986328125, 12.442138671875, 12.89794921875, 13.353759765625, 13.8095703125, 14.265380859375, 14.72119140625, 15.177001953125, 15.6328125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 1.0, 8.0, 10.0, 11.0, 17.0, 21.0, 23.0, 25.0, 32.0, 46.0, 57.0, 61.0, 79.0, 109.0, 109.0, 52.0, 57.0, 37.0, 45.0, 21.0, 22.0, 23.0, 20.0, 15.0, 12.0, 9.0, 6.0, 12.0, 12.0, 8.0, 10.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.57421875, -7.3431396484375, -7.112060546875, -6.8809814453125, -6.64990234375, -6.4188232421875, -6.187744140625, -5.9566650390625, -5.7255859375, -5.4945068359375, -5.263427734375, -5.0323486328125, -4.80126953125, -4.5701904296875, -4.339111328125, -4.1080322265625, -3.876953125, -3.6458740234375, -3.414794921875, -3.1837158203125, -2.95263671875, -2.7215576171875, -2.490478515625, -2.2593994140625, -2.0283203125, -1.7972412109375, -1.566162109375, -1.3350830078125, -1.10400390625, -0.8729248046875, -0.641845703125, -0.4107666015625, -0.1796875, 0.0513916015625, 0.282470703125, 0.5135498046875, 0.74462890625, 0.9757080078125, 1.206787109375, 1.4378662109375, 1.6689453125, 1.9000244140625, 2.131103515625, 2.3621826171875, 2.59326171875, 2.8243408203125, 3.055419921875, 3.2864990234375, 3.517578125, 3.7486572265625, 3.979736328125, 4.2108154296875, 4.44189453125, 4.6729736328125, 4.904052734375, 5.1351318359375, 5.3662109375, 5.5972900390625, 5.828369140625, 6.0594482421875, 6.29052734375, 6.5216064453125, 6.752685546875, 6.9837646484375, 7.21484375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 8.0, 7.0, 21.0, 51.0, 184.0, 544.0, 121.0, 39.0, 11.0, 9.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-736.0587768554688, -717.9351196289062, -699.8115234375, -681.6878662109375, -663.564208984375, -645.4405517578125, -627.3169555664062, -609.1932983398438, -591.0697021484375, -572.946044921875, -554.8224487304688, -536.6987915039062, -518.5751342773438, -500.4515075683594, -482.327880859375, -464.2042236328125, -446.08056640625, -427.9569396972656, -409.8332824707031, -391.70965576171875, -373.58599853515625, -355.4623718261719, -337.3387451171875, -319.215087890625, -301.0914611816406, -282.96783447265625, -264.84417724609375, -246.72055053710938, -228.59690856933594, -210.4732666015625, -192.34963989257812, -174.2259979248047, -156.102294921875, -137.97865295410156, -119.85501861572266, -101.73138427734375, -83.60774230957031, -65.48410034179688, -47.36046600341797, -29.236831665039062, -11.113189697265625, 7.010448455810547, 25.13408660888672, 43.25772476196289, 61.38136291503906, 79.5050048828125, 97.6286392211914, 115.75227355957031, 133.87591552734375, 151.9995574951172, 170.12319946289062, 188.246826171875, 206.37046813964844, 224.49411010742188, 242.61773681640625, 260.74139404296875, 278.8650207519531, 296.9886474609375, 315.1123046875, 333.2359313964844, 351.35955810546875, 369.48321533203125, 387.6068420410156, 405.73046875, 423.8541259765625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 5.0, 8.0, 10.0, 11.0, 13.0, 25.0, 30.0, 30.0, 25.0, 49.0, 36.0, 38.0, 102.0, 200.0, 97.0, 63.0, 55.0, 33.0, 30.0, 26.0, 22.0, 25.0, 18.0, 6.0, 15.0, 7.0, 4.0, 4.0, 8.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.8546142578125, -265.7618713378906, -258.6691589355469, -251.57643127441406, -244.48370361328125, -237.39096069335938, -230.29823303222656, -223.20550537109375, -216.11277770996094, -209.02005004882812, -201.9273223876953, -194.8345947265625, -187.74185180664062, -180.64913940429688, -173.556396484375, -166.4636688232422, -159.37094116210938, -152.27821350097656, -145.18548583984375, -138.09275817871094, -131.00003051757812, -123.90729522705078, -116.81455993652344, -109.72183227539062, -102.62910461425781, -95.536376953125, -88.44364929199219, -81.35091400146484, -74.25818634033203, -67.16545867919922, -60.07272720336914, -52.97999572753906, -45.88728332519531, -38.7945556640625, -31.701824188232422, -24.609094619750977, -17.51636505126953, -10.423637390136719, -3.3309059143066406, 3.7618255615234375, 10.85455322265625, 17.947282791137695, 25.04001235961914, 32.13274383544922, 39.22547149658203, 46.318199157714844, 53.41093063354492, 60.503662109375, 67.59638977050781, 74.68911743164062, 81.78184509277344, 88.87458038330078, 95.9673080444336, 103.0600357055664, 110.15277099609375, 117.24549865722656, 124.33822631835938, 131.4309539794922, 138.523681640625, 145.6164093017578, 152.70913696289062, 159.8018798828125, 166.8946075439453, 173.98733520507812, 181.08006286621094]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 13.0, 18.0, 36.0, 49.0, 74.0, 167.0, 368.0, 817.0, 2321.0, 9054.0, 73965.0, 2395832.0, 1648251.0, 51876.0, 7869.0, 2227.0, 724.0, 277.0, 146.0, 63.0, 47.0, 19.0, 7.0, 10.0, 9.0, 12.0, 9.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-50.53125, -49.2333984375, -47.935546875, -46.6376953125, -45.33984375, -44.0419921875, -42.744140625, -41.4462890625, -40.1484375, -38.8505859375, -37.552734375, -36.2548828125, -34.95703125, -33.6591796875, -32.361328125, -31.0634765625, -29.765625, -28.4677734375, -27.169921875, -25.8720703125, -24.57421875, -23.2763671875, -21.978515625, -20.6806640625, -19.3828125, -18.0849609375, -16.787109375, -15.4892578125, -14.19140625, -12.8935546875, -11.595703125, -10.2978515625, -9.0, -7.7021484375, -6.404296875, -5.1064453125, -3.80859375, -2.5107421875, -1.212890625, 0.0849609375, 1.3828125, 2.6806640625, 3.978515625, 5.2763671875, 6.57421875, 7.8720703125, 9.169921875, 10.4677734375, 11.765625, 13.0634765625, 14.361328125, 15.6591796875, 16.95703125, 18.2548828125, 19.552734375, 20.8505859375, 22.1484375, 23.4462890625, 24.744140625, 26.0419921875, 27.33984375, 28.6376953125, 29.935546875, 31.2333984375, 32.53125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 16.0, 18.0, 28.0, 37.0, 66.0, 89.0, 104.0, 91.0, 96.0, 83.0, 91.0, 67.0, 73.0, 40.0, 38.0, 27.0, 19.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-28.78125, -28.163330078125, -27.54541015625, -26.927490234375, -26.3095703125, -25.691650390625, -25.07373046875, -24.455810546875, -23.837890625, -23.219970703125, -22.60205078125, -21.984130859375, -21.3662109375, -20.748291015625, -20.13037109375, -19.512451171875, -18.89453125, -18.276611328125, -17.65869140625, -17.040771484375, -16.4228515625, -15.804931640625, -15.18701171875, -14.569091796875, -13.951171875, -13.333251953125, -12.71533203125, -12.097412109375, -11.4794921875, -10.861572265625, -10.24365234375, -9.625732421875, -9.0078125, -8.389892578125, -7.77197265625, -7.154052734375, -6.5361328125, -5.918212890625, -5.30029296875, -4.682373046875, -4.064453125, -3.446533203125, -2.82861328125, -2.210693359375, -1.5927734375, -0.974853515625, -0.35693359375, 0.260986328125, 0.87890625, 1.496826171875, 2.11474609375, 2.732666015625, 3.3505859375, 3.968505859375, 4.58642578125, 5.204345703125, 5.822265625, 6.440185546875, 7.05810546875, 7.676025390625, 8.2939453125, 8.911865234375, 9.52978515625, 10.147705078125, 10.765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 9.0, 10.0, 14.0, 33.0, 66.0, 175.0, 479.0, 2204.0, 815941.0, 3371952.0, 2639.0, 519.0, 139.0, 54.0, 16.0, 12.0, 11.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-209.5, -202.75, -196.0, -189.25, -182.5, -175.75, -169.0, -162.25, -155.5, -148.75, -142.0, -135.25, -128.5, -121.75, -115.0, -108.25, -101.5, -94.75, -88.0, -81.25, -74.5, -67.75, -61.0, -54.25, -47.5, -40.75, -34.0, -27.25, -20.5, -13.75, -7.0, -0.25, 6.5, 13.25, 20.0, 26.75, 33.5, 40.25, 47.0, 53.75, 60.5, 67.25, 74.0, 80.75, 87.5, 94.25, 101.0, 107.75, 114.5, 121.25, 128.0, 134.75, 141.5, 148.25, 155.0, 161.75, 168.5, 175.25, 182.0, 188.75, 195.5, 202.25, 209.0, 215.75, 222.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 9.0, 11.0, 40.0, 103.0, 286.0, 791.0, 1611.0, 820.0, 269.0, 88.0, 31.0, 8.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.625, -138.294921875, -134.96484375, -131.634765625, -128.3046875, -124.974609375, -121.64453125, -118.314453125, -114.984375, -111.654296875, -108.32421875, -104.994140625, -101.6640625, -98.333984375, -95.00390625, -91.673828125, -88.34375, -85.013671875, -81.68359375, -78.353515625, -75.0234375, -71.693359375, -68.36328125, -65.033203125, -61.703125, -58.373046875, -55.04296875, -51.712890625, -48.3828125, -45.052734375, -41.72265625, -38.392578125, -35.0625, -31.732421875, -28.40234375, -25.072265625, -21.7421875, -18.412109375, -15.08203125, -11.751953125, -8.421875, -5.091796875, -1.76171875, 1.568359375, 4.8984375, 8.228515625, 11.55859375, 14.888671875, 18.21875, 21.548828125, 24.87890625, 28.208984375, 31.5390625, 34.869140625, 38.19921875, 41.529296875, 44.859375, 48.189453125, 51.51953125, 54.849609375, 58.1796875, 61.509765625, 64.83984375, 68.169921875, 71.5]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 1.0, 10.0, 19.0, 48.0, 181.0, 409.0, 227.0, 62.0, 26.0, 10.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1769.67041015625, -1735.419189453125, -1701.16796875, -1666.916748046875, -1632.66552734375, -1598.414306640625, -1564.1630859375, -1529.911865234375, -1495.66064453125, -1461.409423828125, -1427.158203125, -1392.906982421875, -1358.65576171875, -1324.404541015625, -1290.1533203125, -1255.902099609375, -1221.65087890625, -1187.399658203125, -1153.1484375, -1118.897216796875, -1084.64599609375, -1050.394775390625, -1016.1435546875, -981.892333984375, -947.6412353515625, -913.3900146484375, -879.1387939453125, -844.8875732421875, -810.6363525390625, -776.3851318359375, -742.1339111328125, -707.8826904296875, -673.6314697265625, -639.3802490234375, -605.1290283203125, -570.8778076171875, -536.6265869140625, -502.3753662109375, -468.1241760253906, -433.8729553222656, -399.6217346191406, -365.3705139160156, -331.1192932128906, -296.86810302734375, -262.61688232421875, -228.3656463623047, -194.11444091796875, -159.86322021484375, -125.61199951171875, -91.36077880859375, -57.10956573486328, -22.858352661132812, 11.392868041992188, 45.64408874511719, 79.89529418945312, 114.14651489257812, 148.39773559570312, 182.64895629882812, 216.90017700195312, 251.15138244628906, 285.402587890625, 319.65380859375, 353.905029296875, 388.15625, 422.407470703125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 18.0, 17.0, 32.0, 38.0, 36.0, 58.0, 63.0, 73.0, 89.0, 90.0, 93.0, 70.0, 63.0, 45.0, 46.0, 32.0, 30.0, 12.0, 19.0, 8.0, 9.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-309.8646240234375, -297.5186767578125, -285.1727294921875, -272.8267822265625, -260.4808349609375, -248.1348876953125, -235.7889404296875, -223.4429931640625, -211.0970458984375, -198.7510986328125, -186.4051513671875, -174.0592041015625, -161.7132568359375, -149.3673095703125, -137.0213623046875, -124.67542266845703, -112.32948303222656, -99.98353576660156, -87.63758850097656, -75.29164123535156, -62.94569778442383, -50.59975051879883, -38.253807067871094, -25.907859802246094, -13.561912536621094, -1.2159662246704102, 11.129980087280273, 23.47592544555664, 35.82187271118164, 48.16781997680664, 60.513763427734375, 72.85971069335938, 85.20565795898438, 97.55160522460938, 109.89755249023438, 122.24349975585938, 134.58944702148438, 146.93539428710938, 159.28134155273438, 171.62728881835938, 183.97323608398438, 196.31918334960938, 208.66513061523438, 221.01107788085938, 233.35702514648438, 245.70297241210938, 258.0489196777344, 270.3948669433594, 282.74078369140625, 295.08673095703125, 307.43267822265625, 319.77862548828125, 332.12457275390625, 344.47052001953125, 356.81646728515625, 369.16241455078125, 381.50836181640625, 393.85430908203125, 406.20025634765625, 418.54620361328125, 430.89215087890625, 443.23809814453125, 455.58404541015625, 467.92999267578125, 480.27593994140625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 15.0, 20.0, 24.0, 33.0, 45.0, 99.0, 181.0, 351.0, 856.0, 2114.0, 6524.0, 32829.0, 509082.0, 455510.0, 30907.0, 6336.0, 1979.0, 817.0, 355.0, 194.0, 118.0, 64.0, 30.0, 23.0, 12.0, 11.0, 11.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.953125, -29.761962890625, -28.57080078125, -27.379638671875, -26.1884765625, -24.997314453125, -23.80615234375, -22.614990234375, -21.423828125, -20.232666015625, -19.04150390625, -17.850341796875, -16.6591796875, -15.468017578125, -14.27685546875, -13.085693359375, -11.89453125, -10.703369140625, -9.51220703125, -8.321044921875, -7.1298828125, -5.938720703125, -4.74755859375, -3.556396484375, -2.365234375, -1.174072265625, 0.01708984375, 1.208251953125, 2.3994140625, 3.590576171875, 4.78173828125, 5.972900390625, 7.1640625, 8.355224609375, 9.54638671875, 10.737548828125, 11.9287109375, 13.119873046875, 14.31103515625, 15.502197265625, 16.693359375, 17.884521484375, 19.07568359375, 20.266845703125, 21.4580078125, 22.649169921875, 23.84033203125, 25.031494140625, 26.22265625, 27.413818359375, 28.60498046875, 29.796142578125, 30.9873046875, 32.178466796875, 33.36962890625, 34.560791015625, 35.751953125, 36.943115234375, 38.13427734375, 39.325439453125, 40.5166015625, 41.707763671875, 42.89892578125, 44.090087890625, 45.28125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 7.0, 10.0, 18.0, 22.0, 39.0, 42.0, 55.0, 74.0, 75.0, 78.0, 78.0, 82.0, 75.0, 63.0, 57.0, 50.0, 38.0, 34.0, 28.0, 14.0, 21.0, 3.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -18.958984375, -18.19921875, -17.439453125, -16.6796875, -15.919921875, -15.16015625, -14.400390625, -13.640625, -12.880859375, -12.12109375, -11.361328125, -10.6015625, -9.841796875, -9.08203125, -8.322265625, -7.5625, -6.802734375, -6.04296875, -5.283203125, -4.5234375, -3.763671875, -3.00390625, -2.244140625, -1.484375, -0.724609375, 0.03515625, 0.794921875, 1.5546875, 2.314453125, 3.07421875, 3.833984375, 4.59375, 5.353515625, 6.11328125, 6.873046875, 7.6328125, 8.392578125, 9.15234375, 9.912109375, 10.671875, 11.431640625, 12.19140625, 12.951171875, 13.7109375, 14.470703125, 15.23046875, 15.990234375, 16.75, 17.509765625, 18.26953125, 19.029296875, 19.7890625, 20.548828125, 21.30859375, 22.068359375, 22.828125, 23.587890625, 24.34765625, 25.107421875, 25.8671875, 26.626953125, 27.38671875, 28.146484375, 28.90625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 7.0, 9.0, 8.0, 11.0, 11.0, 13.0, 13.0, 29.0, 38.0, 44.0, 70.0, 114.0, 173.0, 298.0, 576.0, 1208.0, 3192.0, 12858.0, 113010.0, 868179.0, 37852.0, 6566.0, 2027.0, 909.0, 456.0, 315.0, 154.0, 122.0, 78.0, 54.0, 39.0, 30.0, 17.0, 15.0, 11.0, 11.0, 5.0, 6.0, 5.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-29.578125, -28.531982421875, -27.48583984375, -26.439697265625, -25.3935546875, -24.347412109375, -23.30126953125, -22.255126953125, -21.208984375, -20.162841796875, -19.11669921875, -18.070556640625, -17.0244140625, -15.978271484375, -14.93212890625, -13.885986328125, -12.83984375, -11.793701171875, -10.74755859375, -9.701416015625, -8.6552734375, -7.609130859375, -6.56298828125, -5.516845703125, -4.470703125, -3.424560546875, -2.37841796875, -1.332275390625, -0.2861328125, 0.760009765625, 1.80615234375, 2.852294921875, 3.8984375, 4.944580078125, 5.99072265625, 7.036865234375, 8.0830078125, 9.129150390625, 10.17529296875, 11.221435546875, 12.267578125, 13.313720703125, 14.35986328125, 15.406005859375, 16.4521484375, 17.498291015625, 18.54443359375, 19.590576171875, 20.63671875, 21.682861328125, 22.72900390625, 23.775146484375, 24.8212890625, 25.867431640625, 26.91357421875, 27.959716796875, 29.005859375, 30.052001953125, 31.09814453125, 32.144287109375, 33.1904296875, 34.236572265625, 35.28271484375, 36.328857421875, 37.375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 5.0, 5.0, 8.0, 5.0, 9.0, 8.0, 13.0, 10.0, 14.0, 18.0, 14.0, 11.0, 17.0, 23.0, 32.0, 43.0, 43.0, 63.0, 73.0, 54.0, 75.0, 56.0, 59.0, 53.0, 35.0, 32.0, 22.0, 23.0, 33.0, 17.0, 18.0, 16.0, 11.0, 26.0, 15.0, 4.0, 6.0, 10.0, 8.0, 6.0, 2.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-61.03125, -59.18505859375, -57.3388671875, -55.49267578125, -53.646484375, -51.80029296875, -49.9541015625, -48.10791015625, -46.26171875, -44.41552734375, -42.5693359375, -40.72314453125, -38.876953125, -37.03076171875, -35.1845703125, -33.33837890625, -31.4921875, -29.64599609375, -27.7998046875, -25.95361328125, -24.107421875, -22.26123046875, -20.4150390625, -18.56884765625, -16.72265625, -14.87646484375, -13.0302734375, -11.18408203125, -9.337890625, -7.49169921875, -5.6455078125, -3.79931640625, -1.953125, -0.10693359375, 1.7392578125, 3.58544921875, 5.431640625, 7.27783203125, 9.1240234375, 10.97021484375, 12.81640625, 14.66259765625, 16.5087890625, 18.35498046875, 20.201171875, 22.04736328125, 23.8935546875, 25.73974609375, 27.5859375, 29.43212890625, 31.2783203125, 33.12451171875, 34.970703125, 36.81689453125, 38.6630859375, 40.50927734375, 42.35546875, 44.20166015625, 46.0478515625, 47.89404296875, 49.740234375, 51.58642578125, 53.4326171875, 55.27880859375, 57.125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 3.0, 15.0, 8.0, 11.0, 19.0, 23.0, 38.0, 65.0, 78.0, 137.0, 267.0, 507.0, 1189.0, 3266.0, 12841.0, 102156.0, 882610.0, 34875.0, 6561.0, 2096.0, 835.0, 401.0, 163.0, 127.0, 73.0, 50.0, 33.0, 21.0, 16.0, 15.0, 11.0, 3.0, 6.0, 8.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5625, -6.35919189453125, -6.1558837890625, -5.95257568359375, -5.749267578125, -5.54595947265625, -5.3426513671875, -5.13934326171875, -4.93603515625, -4.73272705078125, -4.5294189453125, -4.32611083984375, -4.122802734375, -3.91949462890625, -3.7161865234375, -3.51287841796875, -3.3095703125, -3.10626220703125, -2.9029541015625, -2.69964599609375, -2.496337890625, -2.29302978515625, -2.0897216796875, -1.88641357421875, -1.68310546875, -1.47979736328125, -1.2764892578125, -1.07318115234375, -0.869873046875, -0.66656494140625, -0.4632568359375, -0.25994873046875, -0.056640625, 0.14666748046875, 0.3499755859375, 0.55328369140625, 0.756591796875, 0.95989990234375, 1.1632080078125, 1.36651611328125, 1.56982421875, 1.77313232421875, 1.9764404296875, 2.17974853515625, 2.383056640625, 2.58636474609375, 2.7896728515625, 2.99298095703125, 3.1962890625, 3.39959716796875, 3.6029052734375, 3.80621337890625, 4.009521484375, 4.21282958984375, 4.4161376953125, 4.61944580078125, 4.82275390625, 5.02606201171875, 5.2293701171875, 5.43267822265625, 5.635986328125, 5.83929443359375, 6.0426025390625, 6.24591064453125, 6.44921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 6.0, 7.0, 7.0, 6.0, 12.0, 10.0, 12.0, 19.0, 32.0, 39.0, 66.0, 109.0, 158.0, 160.0, 113.0, 69.0, 41.0, 26.0, 17.0, 14.0, 15.0, 12.0, 6.0, 6.0, 4.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0017709732055664062, -0.001718863844871521, -0.0016667544841766357, -0.0016146451234817505, -0.0015625357627868652, -0.00151042640209198, -0.0014583170413970947, -0.0014062076807022095, -0.0013540983200073242, -0.001301988959312439, -0.0012498795986175537, -0.0011977702379226685, -0.0011456608772277832, -0.001093551516532898, -0.0010414421558380127, -0.0009893327951431274, -0.0009372234344482422, -0.0008851140737533569, -0.0008330047130584717, -0.0007808953523635864, -0.0007287859916687012, -0.0006766766309738159, -0.0006245672702789307, -0.0005724579095840454, -0.0005203485488891602, -0.0004682391881942749, -0.00041612982749938965, -0.0003640204668045044, -0.00031191110610961914, -0.0002598017454147339, -0.00020769238471984863, -0.00015558302402496338, -0.00010347366333007812, -5.136430263519287e-05, 7.450580596923828e-07, 5.285441875457764e-05, 0.00010496377944946289, 0.00015707314014434814, 0.0002091825008392334, 0.00026129186153411865, 0.0003134012222290039, 0.00036551058292388916, 0.0004176199436187744, 0.00046972930431365967, 0.0005218386650085449, 0.0005739480257034302, 0.0006260573863983154, 0.0006781667470932007, 0.0007302761077880859, 0.0007823854684829712, 0.0008344948291778564, 0.0008866041898727417, 0.000938713550567627, 0.0009908229112625122, 0.0010429322719573975, 0.0010950416326522827, 0.001147150993347168, 0.0011992603540420532, 0.0012513697147369385, 0.0013034790754318237, 0.001355588436126709, 0.0014076977968215942, 0.0014598071575164795, 0.0015119165182113647, 0.00156402587890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 5.0, 9.0, 17.0, 11.0, 24.0, 48.0, 89.0, 146.0, 288.0, 574.0, 1359.0, 3511.0, 12433.0, 62961.0, 865041.0, 80491.0, 14521.0, 4118.0, 1546.0, 642.0, 323.0, 157.0, 95.0, 56.0, 23.0, 29.0, 16.0, 8.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.7109375, -5.52996826171875, -5.3489990234375, -5.16802978515625, -4.987060546875, -4.80609130859375, -4.6251220703125, -4.44415283203125, -4.26318359375, -4.08221435546875, -3.9012451171875, -3.72027587890625, -3.539306640625, -3.35833740234375, -3.1773681640625, -2.99639892578125, -2.8154296875, -2.63446044921875, -2.4534912109375, -2.27252197265625, -2.091552734375, -1.91058349609375, -1.7296142578125, -1.54864501953125, -1.36767578125, -1.18670654296875, -1.0057373046875, -0.82476806640625, -0.643798828125, -0.46282958984375, -0.2818603515625, -0.10089111328125, 0.080078125, 0.26104736328125, 0.4420166015625, 0.62298583984375, 0.803955078125, 0.98492431640625, 1.1658935546875, 1.34686279296875, 1.52783203125, 1.70880126953125, 1.8897705078125, 2.07073974609375, 2.251708984375, 2.43267822265625, 2.6136474609375, 2.79461669921875, 2.9755859375, 3.15655517578125, 3.3375244140625, 3.51849365234375, 3.699462890625, 3.88043212890625, 4.0614013671875, 4.24237060546875, 4.42333984375, 4.60430908203125, 4.7852783203125, 4.96624755859375, 5.147216796875, 5.32818603515625, 5.5091552734375, 5.69012451171875, 5.87109375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 12.0, 4.0, 7.0, 15.0, 9.0, 18.0, 25.0, 33.0, 42.0, 74.0, 134.0, 172.0, 120.0, 93.0, 58.0, 48.0, 25.0, 28.0, 14.0, 17.0, 14.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-9.4140625, -9.19329833984375, -8.9725341796875, -8.75177001953125, -8.531005859375, -8.31024169921875, -8.0894775390625, -7.86871337890625, -7.64794921875, -7.42718505859375, -7.2064208984375, -6.98565673828125, -6.764892578125, -6.54412841796875, -6.3233642578125, -6.10260009765625, -5.8818359375, -5.66107177734375, -5.4403076171875, -5.21954345703125, -4.998779296875, -4.77801513671875, -4.5572509765625, -4.33648681640625, -4.11572265625, -3.89495849609375, -3.6741943359375, -3.45343017578125, -3.232666015625, -3.01190185546875, -2.7911376953125, -2.57037353515625, -2.349609375, -2.12884521484375, -1.9080810546875, -1.68731689453125, -1.466552734375, -1.24578857421875, -1.0250244140625, -0.80426025390625, -0.58349609375, -0.36273193359375, -0.1419677734375, 0.07879638671875, 0.299560546875, 0.52032470703125, 0.7410888671875, 0.96185302734375, 1.1826171875, 1.40338134765625, 1.6241455078125, 1.84490966796875, 2.065673828125, 2.28643798828125, 2.5072021484375, 2.72796630859375, 2.94873046875, 3.16949462890625, 3.3902587890625, 3.61102294921875, 3.831787109375, 4.05255126953125, 4.2733154296875, 4.49407958984375, 4.71484375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 12.0, 15.0, 15.0, 55.0, 113.0, 485.0, 165.0, 62.0, 31.0, 20.0, 13.0, 7.0, 3.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-348.80047607421875, -338.10931396484375, -327.4181213378906, -316.7269592285156, -306.0357666015625, -295.3446044921875, -284.6534423828125, -273.9622497558594, -263.2710876464844, -252.5799102783203, -241.88873291015625, -231.19757080078125, -220.5063934326172, -209.81521606445312, -199.12403869628906, -188.432861328125, -177.74168395996094, -167.05050659179688, -156.3593292236328, -145.66815185546875, -134.97698974609375, -124.28581237792969, -113.59463500976562, -102.9034652709961, -92.21228790283203, -81.52111053466797, -70.82994079589844, -60.138763427734375, -49.44758987426758, -38.75641632080078, -28.06523895263672, -17.374069213867188, -6.682891845703125, 4.008282661437988, 14.699457168579102, 25.39063262939453, 36.08180618286133, 46.772979736328125, 57.46415710449219, 68.15532684326172, 78.84650421142578, 89.53768157958984, 100.22885131835938, 110.92002868652344, 121.6112060546875, 132.3023681640625, 142.99356079101562, 153.68472290039062, 164.3759002685547, 175.06707763671875, 185.7582550048828, 196.44943237304688, 207.14059448242188, 217.83177185058594, 228.52294921875, 239.214111328125, 249.90530395507812, 260.5964660644531, 271.28765869140625, 281.97882080078125, 292.6700134277344, 303.3611755371094, 314.0523681640625, 324.7435302734375, 335.4346923828125]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 12.0, 9.0, 14.0, 16.0, 9.0, 33.0, 27.0, 28.0, 41.0, 144.0, 181.0, 222.0, 72.0, 32.0, 35.0, 35.0, 14.0, 18.0, 13.0, 15.0, 6.0, 9.0, 6.0, 1.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-447.53302001953125, -437.53424072265625, -427.53546142578125, -417.53668212890625, -407.53790283203125, -397.5391540527344, -387.5403747558594, -377.5415954589844, -367.5428161621094, -357.5440368652344, -347.5452575683594, -337.5464782714844, -327.5477294921875, -317.5489501953125, -307.5501708984375, -297.5513916015625, -287.5526123046875, -277.5538330078125, -267.5550537109375, -257.5562744140625, -247.55751037597656, -237.55873107910156, -227.55996704101562, -217.56118774414062, -207.56240844726562, -197.56362915039062, -187.56484985351562, -177.5660858154297, -167.5673065185547, -157.5685272216797, -147.56976318359375, -137.57098388671875, -127.57220458984375, -117.57342529296875, -107.57465362548828, -97.57588195800781, -87.57710266113281, -77.57832336425781, -67.57955169677734, -57.580780029296875, -47.582000732421875, -37.58322525024414, -27.584449768066406, -17.585674285888672, -7.5868988037109375, 2.411876678466797, 12.410652160644531, 22.409423828125, 32.408203125, 42.406978607177734, 52.40575408935547, 62.4045295715332, 72.40330505371094, 82.40208435058594, 92.4008560180664, 102.39962768554688, 112.39840698242188, 122.39718627929688, 132.39596557617188, 142.3947296142578, 152.3935089111328, 162.3922882080078, 172.39105224609375, 182.38983154296875, 192.38861083984375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 8.0, 2.0, 10.0, 12.0, 11.0, 9.0, 17.0, 18.0, 25.0, 24.0, 22.0, 45.0, 51.0, 51.0, 181.0, 155.0, 62.0, 38.0, 30.0, 28.0, 33.0, 21.0, 24.0, 11.0, 22.0, 12.0, 9.0, 10.0, 11.0, 7.0, 7.0, 8.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.890625, -15.3934326171875, -14.896240234375, -14.3990478515625, -13.90185546875, -13.4046630859375, -12.907470703125, -12.4102783203125, -11.9130859375, -11.4158935546875, -10.918701171875, -10.4215087890625, -9.92431640625, -9.4271240234375, -8.929931640625, -8.4327392578125, -7.935546875, -7.4383544921875, -6.941162109375, -6.4439697265625, -5.94677734375, -5.4495849609375, -4.952392578125, -4.4552001953125, -3.9580078125, -3.4608154296875, -2.963623046875, -2.4664306640625, -1.96923828125, -1.4720458984375, -0.974853515625, -0.4776611328125, 0.01953125, 0.5167236328125, 1.013916015625, 1.5111083984375, 2.00830078125, 2.5054931640625, 3.002685546875, 3.4998779296875, 3.9970703125, 4.4942626953125, 4.991455078125, 5.4886474609375, 5.98583984375, 6.4830322265625, 6.980224609375, 7.4774169921875, 7.974609375, 8.4718017578125, 8.968994140625, 9.4661865234375, 9.96337890625, 10.4605712890625, 10.957763671875, 11.4549560546875, 11.9521484375, 12.4493408203125, 12.946533203125, 13.4437255859375, 13.94091796875, 14.4381103515625, 14.935302734375, 15.4324951171875, 15.9296875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 1.0, 3.0, 6.0, 2.0, 8.0, 17.0, 16.0, 21.0, 32.0, 41.0, 61.0, 117.0, 227.0, 570.0, 2390.0, 32767.0, 8344527.0, 6082.0, 1013.0, 296.0, 139.0, 72.0, 42.0, 30.0, 31.0, 15.0, 4.0, 15.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-169.83935546875, -164.02932739257812, -158.21929931640625, -152.40927124023438, -146.5992431640625, -140.78921508789062, -134.97918701171875, -129.16915893554688, -123.35912322998047, -117.5490951538086, -111.73906707763672, -105.92903137207031, -100.11900329589844, -94.30897521972656, -88.49894714355469, -82.68891906738281, -76.87889099121094, -71.06886291503906, -65.25883483886719, -59.44880294799805, -53.63877487182617, -47.8287467956543, -42.018714904785156, -36.20868682861328, -30.398658752441406, -24.58863067626953, -18.778600692749023, -12.968570709228516, -7.158542633056641, -1.3485145568847656, 4.461517333984375, 10.27154541015625, 16.081573486328125, 21.8916015625, 27.701631546020508, 33.511661529541016, 39.32168960571289, 45.131717681884766, 50.941749572753906, 56.75177764892578, 62.561805725097656, 68.37183380126953, 74.1818618774414, 79.99189758300781, 85.80192565917969, 91.61195373535156, 97.42198181152344, 103.23200988769531, 109.04203796386719, 114.85206604003906, 120.66209411621094, 126.47212219238281, 132.2821502685547, 138.09217834472656, 143.9022216796875, 149.71224975585938, 155.52227783203125, 161.33230590820312, 167.142333984375, 172.95236206054688, 178.76239013671875, 184.57241821289062, 190.3824462890625, 196.19247436523438, 202.00250244140625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 3.0, 1.0, 4.0, 5.0, 3.0, 4.0, 3.0, 6.0, 6.0, 2.0, 8.0, 2.0, 5.0, 3.0, 6.0, 4.0, 1.0, 7.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-191.10089111328125, -184.21043395996094, -177.31996154785156, -170.42950439453125, -163.53903198242188, -156.64857482910156, -149.75811767578125, -142.86764526367188, -135.97718811035156, -129.08673095703125, -122.19625854492188, -115.30580139160156, -108.41533660888672, -101.52487182617188, -94.63441467285156, -87.74394989013672, -80.85348510742188, -73.96302032470703, -67.07255554199219, -60.182098388671875, -53.29163360595703, -46.40116882324219, -39.51070785522461, -32.62024688720703, -25.729782104492188, -18.839319229125977, -11.948856353759766, -5.058393478393555, 1.8320693969726562, 8.7225341796875, 15.612995147705078, 22.503456115722656, 29.393905639648438, 36.28437042236328, 43.17483139038086, 50.06529235839844, 56.95575714111328, 63.846221923828125, 70.73667907714844, 77.62714385986328, 84.51760864257812, 91.40807342529297, 98.29853820800781, 105.18899536132812, 112.07946014404297, 118.96992492675781, 125.86038208007812, 132.7508544921875, 139.6413116455078, 146.53176879882812, 153.4222412109375, 160.3126983642578, 167.20315551757812, 174.0936279296875, 180.9840850830078, 187.87454223632812, 194.7650146484375, 201.6554718017578, 208.5459442138672, 215.4364013671875, 222.32687377929688, 229.2173309326172, 236.1077880859375, 242.99826049804688, 249.8887176513672]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 0.0, 6.0, 5.0, 6.0, 14.0, 14.0, 22.0, 10.0, 33.0, 25.0, 33.0, 31.0, 39.0, 58.0, 55.0, 64.0, 73.0, 62.0, 58.0, 68.0, 51.0, 52.0, 42.0, 38.0, 20.0, 33.0, 16.0, 16.0, 16.0, 9.0, 9.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.8671875, -9.5693359375, -9.271484375, -8.9736328125, -8.67578125, -8.3779296875, -8.080078125, -7.7822265625, -7.484375, -7.1865234375, -6.888671875, -6.5908203125, -6.29296875, -5.9951171875, -5.697265625, -5.3994140625, -5.1015625, -4.8037109375, -4.505859375, -4.2080078125, -3.91015625, -3.6123046875, -3.314453125, -3.0166015625, -2.71875, -2.4208984375, -2.123046875, -1.8251953125, -1.52734375, -1.2294921875, -0.931640625, -0.6337890625, -0.3359375, -0.0380859375, 0.259765625, 0.5576171875, 0.85546875, 1.1533203125, 1.451171875, 1.7490234375, 2.046875, 2.3447265625, 2.642578125, 2.9404296875, 3.23828125, 3.5361328125, 3.833984375, 4.1318359375, 4.4296875, 4.7275390625, 5.025390625, 5.3232421875, 5.62109375, 5.9189453125, 6.216796875, 6.5146484375, 6.8125, 7.1103515625, 7.408203125, 7.7060546875, 8.00390625, 8.3017578125, 8.599609375, 8.8974609375, 9.1953125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 12.0, 9.0, 13.0, 10.0, 20.0, 34.0, 43.0, 62.0, 115.0, 196.0, 318.0, 590.0, 1187.0, 2520.0, 6541.0, 18652.0, 61304.0, 189941.0, 165410.0, 51164.0, 15762.0, 5700.0, 2269.0, 1073.0, 571.0, 275.0, 162.0, 115.0, 63.0, 50.0, 25.0, 23.0, 13.0, 8.0, 6.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-113.75, -110.4931640625, -107.236328125, -103.9794921875, -100.72265625, -97.4658203125, -94.208984375, -90.9521484375, -87.6953125, -84.4384765625, -81.181640625, -77.9248046875, -74.66796875, -71.4111328125, -68.154296875, -64.8974609375, -61.640625, -58.3837890625, -55.126953125, -51.8701171875, -48.61328125, -45.3564453125, -42.099609375, -38.8427734375, -35.5859375, -32.3291015625, -29.072265625, -25.8154296875, -22.55859375, -19.3017578125, -16.044921875, -12.7880859375, -9.53125, -6.2744140625, -3.017578125, 0.2392578125, 3.49609375, 6.7529296875, 10.009765625, 13.2666015625, 16.5234375, 19.7802734375, 23.037109375, 26.2939453125, 29.55078125, 32.8076171875, 36.064453125, 39.3212890625, 42.578125, 45.8349609375, 49.091796875, 52.3486328125, 55.60546875, 58.8623046875, 62.119140625, 65.3759765625, 68.6328125, 71.8896484375, 75.146484375, 78.4033203125, 81.66015625, 84.9169921875, 88.173828125, 91.4306640625, 94.6875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 4.0, 7.0, 8.0, 10.0, 15.0, 15.0, 15.0, 26.0, 24.0, 38.0, 43.0, 58.0, 55.0, 76.0, 66.0, 86.0, 73.0, 58.0, 45.0, 62.0, 31.0, 33.0, 22.0, 24.0, 19.0, 16.0, 8.0, 12.0, 10.0, 7.0, 5.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.515625, -13.98583984375, -13.4560546875, -12.92626953125, -12.396484375, -11.86669921875, -11.3369140625, -10.80712890625, -10.27734375, -9.74755859375, -9.2177734375, -8.68798828125, -8.158203125, -7.62841796875, -7.0986328125, -6.56884765625, -6.0390625, -5.50927734375, -4.9794921875, -4.44970703125, -3.919921875, -3.39013671875, -2.8603515625, -2.33056640625, -1.80078125, -1.27099609375, -0.7412109375, -0.21142578125, 0.318359375, 0.84814453125, 1.3779296875, 1.90771484375, 2.4375, 2.96728515625, 3.4970703125, 4.02685546875, 4.556640625, 5.08642578125, 5.6162109375, 6.14599609375, 6.67578125, 7.20556640625, 7.7353515625, 8.26513671875, 8.794921875, 9.32470703125, 9.8544921875, 10.38427734375, 10.9140625, 11.44384765625, 11.9736328125, 12.50341796875, 13.033203125, 13.56298828125, 14.0927734375, 14.62255859375, 15.15234375, 15.68212890625, 16.2119140625, 16.74169921875, 17.271484375, 17.80126953125, 18.3310546875, 18.86083984375, 19.390625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 9.0, 5.0, 13.0, 12.0, 15.0, 20.0, 40.0, 40.0, 64.0, 69.0, 54.0, 37.0, 24.0, 19.0, 11.0, 9.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-83.76661682128906, -81.0662612915039, -78.36590576171875, -75.6655502319336, -72.96519470214844, -70.26483917236328, -67.56448364257812, -64.8641357421875, -62.16377639770508, -59.46342086791992, -56.763065338134766, -54.062713623046875, -51.36235809326172, -48.66200256347656, -45.961647033691406, -43.26129150390625, -40.560935974121094, -37.86058044433594, -35.16022491455078, -32.459869384765625, -29.7595157623291, -27.059160232543945, -24.358806610107422, -21.658451080322266, -18.95809555053711, -16.257740020751953, -13.557385444641113, -10.857030868530273, -8.156675338745117, -5.456319808959961, -2.7559661865234375, -0.05561065673828125, 2.6447525024414062, 5.345107555389404, 8.045462608337402, 10.745817184448242, 13.446172714233398, 16.146528244018555, 18.846881866455078, 21.547237396240234, 24.24759292602539, 26.947948455810547, 29.648303985595703, 32.348655700683594, 35.04901123046875, 37.749366760253906, 40.44972229003906, 43.15007781982422, 45.850433349609375, 48.55078887939453, 51.25114440917969, 53.951499938964844, 56.65185546875, 59.352210998535156, 62.05256271362305, 64.75291442871094, 67.45327758789062, 70.15363311767578, 72.85398864746094, 75.5543441772461, 78.25469970703125, 80.9550552368164, 83.65541076660156, 86.35575866699219, 89.05611419677734]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 9.0, 9.0, 6.0, 15.0, 20.0, 35.0, 42.0, 63.0, 63.0, 49.0, 43.0, 29.0, 13.0, 15.0, 12.0, 9.0, 7.0, 3.0, 6.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-81.45079803466797, -78.36444091796875, -75.27808380126953, -72.19172668457031, -69.1053695678711, -66.01901245117188, -62.932655334472656, -59.84629821777344, -56.75994110107422, -53.673583984375, -50.58722686767578, -47.50086975097656, -44.414512634277344, -41.328155517578125, -38.241798400878906, -35.15544128417969, -32.06908416748047, -28.98272705078125, -25.89636993408203, -22.810012817382812, -19.723655700683594, -16.637298583984375, -13.550941467285156, -10.464584350585938, -7.378227233886719, -4.2918701171875, -1.2055130004882812, 1.8808441162109375, 4.967201232910156, 8.053558349609375, 11.139915466308594, 14.226272583007812, 17.31262969970703, 20.39898681640625, 23.48534393310547, 26.571701049804688, 29.658058166503906, 32.744415283203125, 35.830772399902344, 38.91712951660156, 42.00348663330078, 45.08984375, 48.17620086669922, 51.26255798339844, 54.348915100097656, 57.435272216796875, 60.521629333496094, 63.60798645019531, 66.69434356689453, 69.78070068359375, 72.86705780029297, 75.95341491699219, 79.0397720336914, 82.12612915039062, 85.21248626708984, 88.29884338378906, 91.38520050048828, 94.4715576171875, 97.55791473388672, 100.64427185058594, 103.73062896728516, 106.81698608398438, 109.9033432006836, 112.98970031738281, 116.07605743408203]}, "eval/loss": 5.471095085144043, "eval/wer": 1.5604323681078938, "eval/runtime": 668.0797, "eval/samples_per_second": 3.955, "eval/steps_per_second": 0.495} \ No newline at end of file +{"train/loss": 3.3434, "train/learning_rate": 2.5073239436619717e-05, "train/epoch": 5.04, "train/global_step": 4500, "_runtime": 26859, "_timestamp": 1648168203, "_step": 4502, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 3.0, 0.0, 2.0, 4.0, 5.0, 6.0, 6.0, 6.0, 8.0, 19.0, 11.0, 11.0, 18.0, 20.0, 23.0, 37.0, 21.0, 38.0, 48.0, 54.0, 42.0, 54.0, 50.0, 59.0, 50.0, 58.0, 46.0, 51.0, 35.0, 31.0, 40.0, 26.0, 30.0, 15.0, 23.0, 5.0, 10.0, 11.0, 8.0, 10.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.145931243896484, -46.14273452758789, -45.13954162597656, -44.13634490966797, -43.133148193359375, -42.12995147705078, -41.12675476074219, -40.12356185913086, -39.120365142822266, -38.11716842651367, -37.113975524902344, -36.11077880859375, -35.107582092285156, -34.10438537597656, -33.10118865966797, -32.09799575805664, -31.094799041748047, -30.091602325439453, -29.088407516479492, -28.08521270751953, -27.082015991210938, -26.078819274902344, -25.075624465942383, -24.072429656982422, -23.069232940673828, -22.066036224365234, -21.062841415405273, -20.059646606445312, -19.05644989013672, -18.053253173828125, -17.050058364868164, -16.046863555908203, -15.04366683959961, -14.040471076965332, -13.037275314331055, -12.034079551696777, -11.0308837890625, -10.027688026428223, -9.024492263793945, -8.021296501159668, -7.018100738525391, -6.014904975891113, -5.011709213256836, -4.008513450622559, -3.0053176879882812, -2.002121925354004, -0.9989261627197266, 0.004269599914550781, 1.0074653625488281, 2.0106611251831055, 3.013856887817383, 4.01705265045166, 5.0202484130859375, 6.023444175720215, 7.026639938354492, 8.02983570098877, 9.033031463623047, 10.036227226257324, 11.039422988891602, 12.042618751525879, 13.045814514160156, 14.049010276794434, 15.052206039428711, 16.055400848388672, 17.058597564697266]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 1.0, 7.0, 14.0, 6.0, 12.0, 9.0, 16.0, 18.0, 12.0, 17.0, 25.0, 20.0, 28.0, 28.0, 26.0, 31.0, 42.0, 32.0, 27.0, 45.0, 31.0, 34.0, 30.0, 38.0, 45.0, 43.0, 32.0, 27.0, 38.0, 26.0, 31.0, 23.0, 22.0, 18.0, 16.0, 19.0, 19.0, 10.0, 16.0, 17.0, 13.0, 11.0, 2.0, 2.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-24.34871482849121, -23.52866554260254, -22.708616256713867, -21.888566970825195, -21.068517684936523, -20.24846839904785, -19.42841911315918, -18.608369827270508, -17.788320541381836, -16.968271255493164, -16.148221969604492, -15.32817268371582, -14.508123397827148, -13.688074111938477, -12.868024826049805, -12.047975540161133, -11.227926254272461, -10.407876968383789, -9.587827682495117, -8.767778396606445, -7.947729110717773, -7.127679824829102, -6.30763053894043, -5.487581253051758, -4.667531967163086, -3.847482681274414, -3.027433395385742, -2.2073841094970703, -1.3873348236083984, -0.5672855377197266, 0.2527637481689453, 1.0728130340576172, 1.8928642272949219, 2.7129135131835938, 3.5329627990722656, 4.3530120849609375, 5.173061370849609, 5.993110656738281, 6.813159942626953, 7.633209228515625, 8.453258514404297, 9.273307800292969, 10.09335708618164, 10.913406372070312, 11.733455657958984, 12.553504943847656, 13.373554229736328, 14.193603515625, 15.013652801513672, 15.833702087402344, 16.653751373291016, 17.473800659179688, 18.29384994506836, 19.11389923095703, 19.933948516845703, 20.753997802734375, 21.574047088623047, 22.39409637451172, 23.21414566040039, 24.034194946289062, 24.854244232177734, 25.674293518066406, 26.494342803955078, 27.31439208984375, 28.134441375732422]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 6.0, 8.0, 22.0, 26.0, 52.0, 82.0, 142.0, 226.0, 408.0, 652.0, 1048.0, 1850.0, 3235.0, 5480.0, 9769.0, 16576.0, 29675.0, 51925.0, 90893.0, 156444.0, 256832.0, 401361.0, 560558.0, 658964.0, 629369.0, 491966.0, 333319.0, 206527.0, 121915.0, 70879.0, 40066.0, 22798.0, 13093.0, 7371.0, 4458.0, 2564.0, 1489.0, 864.0, 550.0, 307.0, 199.0, 117.0, 63.0, 46.0, 38.0, 22.0, 9.0, 8.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-25.21875, -24.425048828125, -23.63134765625, -22.837646484375, -22.0439453125, -21.250244140625, -20.45654296875, -19.662841796875, -18.869140625, -18.075439453125, -17.28173828125, -16.488037109375, -15.6943359375, -14.900634765625, -14.10693359375, -13.313232421875, -12.51953125, -11.725830078125, -10.93212890625, -10.138427734375, -9.3447265625, -8.551025390625, -7.75732421875, -6.963623046875, -6.169921875, -5.376220703125, -4.58251953125, -3.788818359375, -2.9951171875, -2.201416015625, -1.40771484375, -0.614013671875, 0.1796875, 0.973388671875, 1.76708984375, 2.560791015625, 3.3544921875, 4.148193359375, 4.94189453125, 5.735595703125, 6.529296875, 7.322998046875, 8.11669921875, 8.910400390625, 9.7041015625, 10.497802734375, 11.29150390625, 12.085205078125, 12.87890625, 13.672607421875, 14.46630859375, 15.260009765625, 16.0537109375, 16.847412109375, 17.64111328125, 18.434814453125, 19.228515625, 20.022216796875, 20.81591796875, 21.609619140625, 22.4033203125, 23.197021484375, 23.99072265625, 24.784423828125, 25.578125]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 10.0, 5.0, 8.0, 11.0, 11.0, 11.0, 19.0, 16.0, 21.0, 15.0, 30.0, 18.0, 31.0, 33.0, 28.0, 41.0, 31.0, 33.0, 49.0, 48.0, 45.0, 40.0, 36.0, 26.0, 35.0, 36.0, 29.0, 36.0, 29.0, 29.0, 27.0, 18.0, 13.0, 22.0, 11.0, 11.0, 15.0, 15.0, 9.0, 8.0, 7.0, 8.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-20.828125, -20.1787109375, -19.529296875, -18.8798828125, -18.23046875, -17.5810546875, -16.931640625, -16.2822265625, -15.6328125, -14.9833984375, -14.333984375, -13.6845703125, -13.03515625, -12.3857421875, -11.736328125, -11.0869140625, -10.4375, -9.7880859375, -9.138671875, -8.4892578125, -7.83984375, -7.1904296875, -6.541015625, -5.8916015625, -5.2421875, -4.5927734375, -3.943359375, -3.2939453125, -2.64453125, -1.9951171875, -1.345703125, -0.6962890625, -0.046875, 0.6025390625, 1.251953125, 1.9013671875, 2.55078125, 3.2001953125, 3.849609375, 4.4990234375, 5.1484375, 5.7978515625, 6.447265625, 7.0966796875, 7.74609375, 8.3955078125, 9.044921875, 9.6943359375, 10.34375, 10.9931640625, 11.642578125, 12.2919921875, 12.94140625, 13.5908203125, 14.240234375, 14.8896484375, 15.5390625, 16.1884765625, 16.837890625, 17.4873046875, 18.13671875, 18.7861328125, 19.435546875, 20.0849609375, 20.734375]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 9.0, 8.0, 14.0, 31.0, 34.0, 51.0, 90.0, 107.0, 213.0, 375.0, 683.0, 1197.0, 2065.0, 3555.0, 6384.0, 11185.0, 19083.0, 33172.0, 56416.0, 92094.0, 145956.0, 222635.0, 318146.0, 423327.0, 510879.0, 545873.0, 505098.0, 414425.0, 309257.0, 214775.0, 140354.0, 88363.0, 53664.0, 31565.0, 18397.0, 10652.0, 5984.0, 3472.0, 1881.0, 1200.0, 638.0, 397.0, 209.0, 151.0, 91.0, 41.0, 39.0, 15.0, 10.0, 15.0, 7.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-20.171875, -19.487060546875, -18.80224609375, -18.117431640625, -17.4326171875, -16.747802734375, -16.06298828125, -15.378173828125, -14.693359375, -14.008544921875, -13.32373046875, -12.638916015625, -11.9541015625, -11.269287109375, -10.58447265625, -9.899658203125, -9.21484375, -8.530029296875, -7.84521484375, -7.160400390625, -6.4755859375, -5.790771484375, -5.10595703125, -4.421142578125, -3.736328125, -3.051513671875, -2.36669921875, -1.681884765625, -0.9970703125, -0.312255859375, 0.37255859375, 1.057373046875, 1.7421875, 2.427001953125, 3.11181640625, 3.796630859375, 4.4814453125, 5.166259765625, 5.85107421875, 6.535888671875, 7.220703125, 7.905517578125, 8.59033203125, 9.275146484375, 9.9599609375, 10.644775390625, 11.32958984375, 12.014404296875, 12.69921875, 13.384033203125, 14.06884765625, 14.753662109375, 15.4384765625, 16.123291015625, 16.80810546875, 17.492919921875, 18.177734375, 18.862548828125, 19.54736328125, 20.232177734375, 20.9169921875, 21.601806640625, 22.28662109375, 22.971435546875, 23.65625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 10.0, 20.0, 20.0, 29.0, 34.0, 43.0, 66.0, 68.0, 82.0, 108.0, 137.0, 156.0, 203.0, 225.0, 240.0, 290.0, 240.0, 279.0, 276.0, 233.0, 213.0, 193.0, 171.0, 131.0, 134.0, 109.0, 88.0, 61.0, 54.0, 40.0, 29.0, 23.0, 18.0, 11.0, 6.0, 5.0, 9.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.9765625, -10.613037109375, -10.24951171875, -9.885986328125, -9.5224609375, -9.158935546875, -8.79541015625, -8.431884765625, -8.068359375, -7.704833984375, -7.34130859375, -6.977783203125, -6.6142578125, -6.250732421875, -5.88720703125, -5.523681640625, -5.16015625, -4.796630859375, -4.43310546875, -4.069580078125, -3.7060546875, -3.342529296875, -2.97900390625, -2.615478515625, -2.251953125, -1.888427734375, -1.52490234375, -1.161376953125, -0.7978515625, -0.434326171875, -0.07080078125, 0.292724609375, 0.65625, 1.019775390625, 1.38330078125, 1.746826171875, 2.1103515625, 2.473876953125, 2.83740234375, 3.200927734375, 3.564453125, 3.927978515625, 4.29150390625, 4.655029296875, 5.0185546875, 5.382080078125, 5.74560546875, 6.109130859375, 6.47265625, 6.836181640625, 7.19970703125, 7.563232421875, 7.9267578125, 8.290283203125, 8.65380859375, 9.017333984375, 9.380859375, 9.744384765625, 10.10791015625, 10.471435546875, 10.8349609375, 11.198486328125, 11.56201171875, 11.925537109375, 12.2890625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 6.0, 6.0, 14.0, 16.0, 21.0, 28.0, 26.0, 21.0, 30.0, 26.0, 38.0, 42.0, 56.0, 44.0, 39.0, 49.0, 48.0, 48.0, 43.0, 41.0, 48.0, 47.0, 33.0, 36.0, 31.0, 26.0, 17.0, 25.0, 10.0, 14.0, 9.0, 4.0, 4.0, 9.0, 7.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-26.54071617126465, -25.7466983795166, -24.952680587768555, -24.158662796020508, -23.364646911621094, -22.570629119873047, -21.776611328125, -20.982593536376953, -20.188575744628906, -19.39455795288086, -18.600540161132812, -17.806522369384766, -17.01250457763672, -16.218488693237305, -15.424470901489258, -14.630453109741211, -13.836435317993164, -13.042417526245117, -12.24839973449707, -11.45438289642334, -10.660365104675293, -9.866347312927246, -9.072330474853516, -8.278312683105469, -7.484294891357422, -6.690277099609375, -5.896259784698486, -5.102242469787598, -4.308224678039551, -3.514207124710083, -2.7201895713806152, -1.9261722564697266, -1.1321544647216797, -0.3381369113922119, 0.45588064193725586, 1.2498981952667236, 2.0439157485961914, 2.837933301925659, 3.631950855255127, 4.425968170166016, 5.2199859619140625, 6.014003753662109, 6.808021068572998, 7.602038383483887, 8.396056175231934, 9.19007396697998, 9.984090805053711, 10.778108596801758, 11.572126388549805, 12.366144180297852, 13.160161972045898, 13.954178810119629, 14.748196601867676, 15.542214393615723, 16.336231231689453, 17.1302490234375, 17.924266815185547, 18.718284606933594, 19.51230239868164, 20.306320190429688, 21.100337982177734, 21.89435386657715, 22.688371658325195, 23.482389450073242, 24.27640724182129]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 4.0, 5.0, 11.0, 8.0, 10.0, 11.0, 11.0, 15.0, 24.0, 25.0, 20.0, 23.0, 32.0, 25.0, 21.0, 30.0, 31.0, 38.0, 34.0, 37.0, 38.0, 44.0, 49.0, 42.0, 35.0, 38.0, 28.0, 37.0, 33.0, 32.0, 20.0, 21.0, 22.0, 18.0, 16.0, 13.0, 15.0, 10.0, 12.0, 8.0, 9.0, 14.0, 6.0, 6.0, 7.0, 6.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0], "bins": [-23.881210327148438, -23.164676666259766, -22.448143005371094, -21.731609344482422, -21.01507568359375, -20.29854393005371, -19.58201026916504, -18.865476608276367, -18.148942947387695, -17.432409286499023, -16.71587562561035, -15.999342918395996, -15.282809257507324, -14.566275596618652, -13.849742889404297, -13.133209228515625, -12.416675567626953, -11.700141906738281, -10.98360824584961, -10.267075538635254, -9.550541877746582, -8.83400821685791, -8.117475509643555, -7.400941848754883, -6.684408187866211, -5.967874526977539, -5.251341342926025, -4.534808158874512, -3.81827449798584, -3.101741075515747, -2.3852076530456543, -1.6686744689941406, -0.9521408081054688, -0.23560738563537598, 0.4809260368347168, 1.1974594593048096, 1.9139928817749023, 2.630526304244995, 3.347059726715088, 4.063592910766602, 4.780126571655273, 5.496660232543945, 6.213193416595459, 6.929726600646973, 7.6462602615356445, 8.362793922424316, 9.079326629638672, 9.795860290527344, 10.512393951416016, 11.228927612304688, 11.94546127319336, 12.661993980407715, 13.378527641296387, 14.095061302185059, 14.811594009399414, 15.528127670288086, 16.244661331176758, 16.96119499206543, 17.6777286529541, 18.394262313842773, 19.110794067382812, 19.827327728271484, 20.543861389160156, 21.260395050048828, 21.9769287109375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 10.0, 16.0, 21.0, 28.0, 49.0, 93.0, 142.0, 207.0, 312.0, 495.0, 690.0, 1197.0, 1905.0, 2997.0, 4486.0, 6909.0, 10652.0, 16423.0, 24872.0, 38160.0, 57801.0, 85411.0, 118619.0, 147336.0, 148610.0, 121910.0, 87269.0, 59070.0, 39046.0, 25456.0, 17078.0, 11167.0, 7179.0, 4603.0, 2957.0, 1954.0, 1271.0, 778.0, 516.0, 311.0, 196.0, 124.0, 87.0, 54.0, 33.0, 18.0, 25.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-24.203125, -23.447509765625, -22.69189453125, -21.936279296875, -21.1806640625, -20.425048828125, -19.66943359375, -18.913818359375, -18.158203125, -17.402587890625, -16.64697265625, -15.891357421875, -15.1357421875, -14.380126953125, -13.62451171875, -12.868896484375, -12.11328125, -11.357666015625, -10.60205078125, -9.846435546875, -9.0908203125, -8.335205078125, -7.57958984375, -6.823974609375, -6.068359375, -5.312744140625, -4.55712890625, -3.801513671875, -3.0458984375, -2.290283203125, -1.53466796875, -0.779052734375, -0.0234375, 0.732177734375, 1.48779296875, 2.243408203125, 2.9990234375, 3.754638671875, 4.51025390625, 5.265869140625, 6.021484375, 6.777099609375, 7.53271484375, 8.288330078125, 9.0439453125, 9.799560546875, 10.55517578125, 11.310791015625, 12.06640625, 12.822021484375, 13.57763671875, 14.333251953125, 15.0888671875, 15.844482421875, 16.60009765625, 17.355712890625, 18.111328125, 18.866943359375, 19.62255859375, 20.378173828125, 21.1337890625, 21.889404296875, 22.64501953125, 23.400634765625, 24.15625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 8.0, 9.0, 7.0, 14.0, 12.0, 15.0, 21.0, 25.0, 18.0, 22.0, 22.0, 26.0, 33.0, 41.0, 29.0, 33.0, 32.0, 28.0, 45.0, 42.0, 55.0, 27.0, 42.0, 43.0, 31.0, 28.0, 35.0, 30.0, 27.0, 21.0, 21.0, 22.0, 20.0, 16.0, 10.0, 8.0, 13.0, 17.0, 6.0, 7.0, 6.0, 5.0, 3.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-23.53125, -22.84326171875, -22.1552734375, -21.46728515625, -20.779296875, -20.09130859375, -19.4033203125, -18.71533203125, -18.02734375, -17.33935546875, -16.6513671875, -15.96337890625, -15.275390625, -14.58740234375, -13.8994140625, -13.21142578125, -12.5234375, -11.83544921875, -11.1474609375, -10.45947265625, -9.771484375, -9.08349609375, -8.3955078125, -7.70751953125, -7.01953125, -6.33154296875, -5.6435546875, -4.95556640625, -4.267578125, -3.57958984375, -2.8916015625, -2.20361328125, -1.515625, -0.82763671875, -0.1396484375, 0.54833984375, 1.236328125, 1.92431640625, 2.6123046875, 3.30029296875, 3.98828125, 4.67626953125, 5.3642578125, 6.05224609375, 6.740234375, 7.42822265625, 8.1162109375, 8.80419921875, 9.4921875, 10.18017578125, 10.8681640625, 11.55615234375, 12.244140625, 12.93212890625, 13.6201171875, 14.30810546875, 14.99609375, 15.68408203125, 16.3720703125, 17.06005859375, 17.748046875, 18.43603515625, 19.1240234375, 19.81201171875, 20.5]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 12.0, 18.0, 25.0, 51.0, 75.0, 121.0, 173.0, 223.0, 362.0, 591.0, 922.0, 1352.0, 2029.0, 3039.0, 4745.0, 7222.0, 11090.0, 17712.0, 27944.0, 44362.0, 71287.0, 110192.0, 154529.0, 173421.0, 144395.0, 99952.0, 63581.0, 39595.0, 25162.0, 15667.0, 10170.0, 6456.0, 4290.0, 2632.0, 1803.0, 1174.0, 820.0, 494.0, 298.0, 224.0, 125.0, 89.0, 47.0, 29.0, 20.0, 13.0, 7.0, 9.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.71875, -20.05859375, -19.3984375, -18.73828125, -18.078125, -17.41796875, -16.7578125, -16.09765625, -15.4375, -14.77734375, -14.1171875, -13.45703125, -12.796875, -12.13671875, -11.4765625, -10.81640625, -10.15625, -9.49609375, -8.8359375, -8.17578125, -7.515625, -6.85546875, -6.1953125, -5.53515625, -4.875, -4.21484375, -3.5546875, -2.89453125, -2.234375, -1.57421875, -0.9140625, -0.25390625, 0.40625, 1.06640625, 1.7265625, 2.38671875, 3.046875, 3.70703125, 4.3671875, 5.02734375, 5.6875, 6.34765625, 7.0078125, 7.66796875, 8.328125, 8.98828125, 9.6484375, 10.30859375, 10.96875, 11.62890625, 12.2890625, 12.94921875, 13.609375, 14.26953125, 14.9296875, 15.58984375, 16.25, 16.91015625, 17.5703125, 18.23046875, 18.890625, 19.55078125, 20.2109375, 20.87109375, 21.53125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 6.0, 3.0, 2.0, 8.0, 8.0, 8.0, 12.0, 13.0, 8.0, 14.0, 13.0, 12.0, 14.0, 24.0, 31.0, 25.0, 18.0, 29.0, 45.0, 40.0, 40.0, 34.0, 41.0, 46.0, 34.0, 43.0, 41.0, 35.0, 50.0, 31.0, 39.0, 28.0, 25.0, 25.0, 31.0, 20.0, 23.0, 16.0, 20.0, 9.0, 7.0, 5.0, 7.0, 5.0, 5.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.546875, -17.0335693359375, -16.520263671875, -16.0069580078125, -15.49365234375, -14.9803466796875, -14.467041015625, -13.9537353515625, -13.4404296875, -12.9271240234375, -12.413818359375, -11.9005126953125, -11.38720703125, -10.8739013671875, -10.360595703125, -9.8472900390625, -9.333984375, -8.8206787109375, -8.307373046875, -7.7940673828125, -7.28076171875, -6.7674560546875, -6.254150390625, -5.7408447265625, -5.2275390625, -4.7142333984375, -4.200927734375, -3.6876220703125, -3.17431640625, -2.6610107421875, -2.147705078125, -1.6343994140625, -1.12109375, -0.6077880859375, -0.094482421875, 0.4188232421875, 0.93212890625, 1.4454345703125, 1.958740234375, 2.4720458984375, 2.9853515625, 3.4986572265625, 4.011962890625, 4.5252685546875, 5.03857421875, 5.5518798828125, 6.065185546875, 6.5784912109375, 7.091796875, 7.6051025390625, 8.118408203125, 8.6317138671875, 9.14501953125, 9.6583251953125, 10.171630859375, 10.6849365234375, 11.1982421875, 11.7115478515625, 12.224853515625, 12.7381591796875, 13.25146484375, 13.7647705078125, 14.278076171875, 14.7913818359375, 15.3046875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 7.0, 10.0, 19.0, 16.0, 27.0, 48.0, 69.0, 105.0, 140.0, 258.0, 333.0, 535.0, 905.0, 1767.0, 3794.0, 10153.0, 32774.0, 142110.0, 609087.0, 186160.0, 39673.0, 11670.0, 4311.0, 1935.0, 1009.0, 597.0, 316.0, 224.0, 133.0, 115.0, 71.0, 49.0, 41.0, 27.0, 21.0, 14.0, 11.0, 9.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.75, -44.921875, -43.09375, -41.265625, -39.4375, -37.609375, -35.78125, -33.953125, -32.125, -30.296875, -28.46875, -26.640625, -24.8125, -22.984375, -21.15625, -19.328125, -17.5, -15.671875, -13.84375, -12.015625, -10.1875, -8.359375, -6.53125, -4.703125, -2.875, -1.046875, 0.78125, 2.609375, 4.4375, 6.265625, 8.09375, 9.921875, 11.75, 13.578125, 15.40625, 17.234375, 19.0625, 20.890625, 22.71875, 24.546875, 26.375, 28.203125, 30.03125, 31.859375, 33.6875, 35.515625, 37.34375, 39.171875, 41.0, 42.828125, 44.65625, 46.484375, 48.3125, 50.140625, 51.96875, 53.796875, 55.625, 57.453125, 59.28125, 61.109375, 62.9375, 64.765625, 66.59375, 68.421875, 70.25]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 7.0, 8.0, 8.0, 12.0, 19.0, 22.0, 46.0, 60.0, 98.0, 175.0, 213.0, 109.0, 70.0, 44.0, 23.0, 26.0, 12.0, 12.0, 11.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005031585693359375, -0.004888176918029785, -0.004744768142700195, -0.0046013593673706055, -0.004457950592041016, -0.004314541816711426, -0.004171133041381836, -0.004027724266052246, -0.0038843154907226562, -0.0037409067153930664, -0.0035974979400634766, -0.0034540891647338867, -0.003310680389404297, -0.003167271614074707, -0.003023862838745117, -0.0028804540634155273, -0.0027370452880859375, -0.0025936365127563477, -0.002450227737426758, -0.002306818962097168, -0.002163410186767578, -0.0020200014114379883, -0.0018765926361083984, -0.0017331838607788086, -0.0015897750854492188, -0.001446366310119629, -0.001302957534790039, -0.0011595487594604492, -0.0010161399841308594, -0.0008727312088012695, -0.0007293224334716797, -0.0005859136581420898, -0.0004425048828125, -0.00029909610748291016, -0.0001556873321533203, -1.2278556823730469e-05, 0.00013113021850585938, 0.0002745389938354492, 0.00041794776916503906, 0.0005613565444946289, 0.0007047653198242188, 0.0008481740951538086, 0.0009915828704833984, 0.0011349916458129883, 0.0012784004211425781, 0.001421809196472168, 0.0015652179718017578, 0.0017086267471313477, 0.0018520355224609375, 0.0019954442977905273, 0.002138853073120117, 0.002282261848449707, 0.002425670623779297, 0.0025690793991088867, 0.0027124881744384766, 0.0028558969497680664, 0.0029993057250976562, 0.003142714500427246, 0.003286123275756836, 0.0034295320510864258, 0.0035729408264160156, 0.0037163496017456055, 0.0038597583770751953, 0.004003167152404785, 0.004146575927734375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 6.0, 8.0, 21.0, 27.0, 29.0, 48.0, 86.0, 103.0, 143.0, 220.0, 294.0, 450.0, 758.0, 1118.0, 1728.0, 2706.0, 4493.0, 7627.0, 13558.0, 23554.0, 42528.0, 77795.0, 150765.0, 247447.0, 215850.0, 115990.0, 60766.0, 34094.0, 18980.0, 10807.0, 6231.0, 3798.0, 2279.0, 1462.0, 939.0, 630.0, 415.0, 239.0, 182.0, 120.0, 73.0, 49.0, 39.0, 31.0, 24.0, 13.0, 9.0, 3.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-25.125, -24.359130859375, -23.59326171875, -22.827392578125, -22.0615234375, -21.295654296875, -20.52978515625, -19.763916015625, -18.998046875, -18.232177734375, -17.46630859375, -16.700439453125, -15.9345703125, -15.168701171875, -14.40283203125, -13.636962890625, -12.87109375, -12.105224609375, -11.33935546875, -10.573486328125, -9.8076171875, -9.041748046875, -8.27587890625, -7.510009765625, -6.744140625, -5.978271484375, -5.21240234375, -4.446533203125, -3.6806640625, -2.914794921875, -2.14892578125, -1.383056640625, -0.6171875, 0.148681640625, 0.91455078125, 1.680419921875, 2.4462890625, 3.212158203125, 3.97802734375, 4.743896484375, 5.509765625, 6.275634765625, 7.04150390625, 7.807373046875, 8.5732421875, 9.339111328125, 10.10498046875, 10.870849609375, 11.63671875, 12.402587890625, 13.16845703125, 13.934326171875, 14.7001953125, 15.466064453125, 16.23193359375, 16.997802734375, 17.763671875, 18.529541015625, 19.29541015625, 20.061279296875, 20.8271484375, 21.593017578125, 22.35888671875, 23.124755859375, 23.890625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 3.0, 8.0, 6.0, 5.0, 11.0, 8.0, 20.0, 9.0, 14.0, 16.0, 26.0, 36.0, 28.0, 40.0, 58.0, 71.0, 78.0, 88.0, 88.0, 65.0, 61.0, 39.0, 43.0, 29.0, 30.0, 26.0, 21.0, 18.0, 12.0, 11.0, 9.0, 11.0, 2.0, 5.0, 8.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.8203125, -10.53411865234375, -10.2479248046875, -9.96173095703125, -9.675537109375, -9.38934326171875, -9.1031494140625, -8.81695556640625, -8.53076171875, -8.24456787109375, -7.9583740234375, -7.67218017578125, -7.385986328125, -7.09979248046875, -6.8135986328125, -6.52740478515625, -6.2412109375, -5.95501708984375, -5.6688232421875, -5.38262939453125, -5.096435546875, -4.81024169921875, -4.5240478515625, -4.23785400390625, -3.95166015625, -3.66546630859375, -3.3792724609375, -3.09307861328125, -2.806884765625, -2.52069091796875, -2.2344970703125, -1.94830322265625, -1.662109375, -1.37591552734375, -1.0897216796875, -0.80352783203125, -0.517333984375, -0.23114013671875, 0.0550537109375, 0.34124755859375, 0.62744140625, 0.91363525390625, 1.1998291015625, 1.48602294921875, 1.772216796875, 2.05841064453125, 2.3446044921875, 2.63079833984375, 2.9169921875, 3.20318603515625, 3.4893798828125, 3.77557373046875, 4.061767578125, 4.34796142578125, 4.6341552734375, 4.92034912109375, 5.20654296875, 5.49273681640625, 5.7789306640625, 6.06512451171875, 6.351318359375, 6.63751220703125, 6.9237060546875, 7.20989990234375, 7.49609375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 7.0, 6.0, 15.0, 8.0, 14.0, 23.0, 18.0, 16.0, 30.0, 23.0, 44.0, 31.0, 43.0, 44.0, 45.0, 41.0, 57.0, 46.0, 48.0, 47.0, 39.0, 39.0, 40.0, 45.0, 38.0, 42.0, 15.0, 27.0, 20.0, 20.0, 18.0, 7.0, 6.0, 6.0, 7.0, 6.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.890993118286133, -24.126096725463867, -23.3612003326416, -22.596303939819336, -21.83140754699707, -21.066511154174805, -20.30161476135254, -19.536718368530273, -18.771821975708008, -18.006925582885742, -17.242029190063477, -16.47713279724121, -15.712236404418945, -14.94734001159668, -14.182443618774414, -13.417547225952148, -12.652650833129883, -11.887754440307617, -11.122858047485352, -10.357961654663086, -9.59306526184082, -8.828168869018555, -8.063272476196289, -7.298376083374023, -6.533479690551758, -5.768583297729492, -5.003686904907227, -4.238790512084961, -3.4738941192626953, -2.7089977264404297, -1.944101333618164, -1.1792049407958984, -0.414306640625, 0.3505897521972656, 1.1154861450195312, 1.8803825378417969, 2.6452789306640625, 3.410175323486328, 4.175071716308594, 4.939968109130859, 5.704864501953125, 6.469760894775391, 7.234657287597656, 7.999553680419922, 8.764450073242188, 9.529346466064453, 10.294242858886719, 11.059139251708984, 11.82403564453125, 12.588932037353516, 13.353828430175781, 14.118724822998047, 14.883621215820312, 15.648517608642578, 16.413414001464844, 17.17831039428711, 17.943206787109375, 18.70810317993164, 19.472999572753906, 20.237895965576172, 21.002792358398438, 21.767688751220703, 22.53258514404297, 23.297481536865234, 24.0623779296875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 7.0, 3.0, 8.0, 9.0, 8.0, 12.0, 11.0, 17.0, 14.0, 17.0, 19.0, 20.0, 16.0, 15.0, 19.0, 32.0, 33.0, 36.0, 22.0, 39.0, 32.0, 32.0, 44.0, 34.0, 43.0, 39.0, 38.0, 37.0, 41.0, 33.0, 31.0, 22.0, 27.0, 29.0, 17.0, 13.0, 21.0, 13.0, 21.0, 14.0, 3.0, 11.0, 3.0, 14.0, 7.0, 5.0, 8.0, 3.0, 5.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.59387969970703, -19.931934356689453, -19.269987106323242, -18.608041763305664, -17.946096420288086, -17.284149169921875, -16.622203826904297, -15.960258483886719, -15.298312187194824, -14.63636589050293, -13.974420547485352, -13.312474250793457, -12.650527954101562, -11.988582611083984, -11.32663631439209, -10.664690017700195, -10.002744674682617, -9.340798377990723, -8.678853034973145, -8.01690673828125, -7.354960918426514, -6.693015098571777, -6.031068801879883, -5.3691229820251465, -4.70717716217041, -4.045231342315674, -3.3832852840423584, -2.721339225769043, -2.0593934059143066, -1.3974475860595703, -0.7355015277862549, -0.07355546951293945, 0.5883922576904297, 1.2503381967544556, 1.9122841358184814, 2.574230194091797, 3.236176013946533, 3.8981218338012695, 4.560068130493164, 5.2220139503479, 5.883959770202637, 6.545905590057373, 7.207851409912109, 7.869797706604004, 8.531744003295898, 9.193689346313477, 9.855635643005371, 10.517581939697266, 11.179527282714844, 11.841473579406738, 12.503418922424316, 13.165365219116211, 13.827310562133789, 14.489256858825684, 15.151203155517578, 15.813148498535156, 16.475093841552734, 17.137039184570312, 17.798986434936523, 18.4609317779541, 19.12287712097168, 19.78482437133789, 20.44676971435547, 21.108715057373047, 21.770662307739258]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 7.0, 11.0, 17.0, 27.0, 47.0, 75.0, 148.0, 226.0, 316.0, 538.0, 780.0, 1306.0, 2014.0, 3131.0, 4899.0, 7499.0, 11257.0, 16839.0, 24721.0, 35175.0, 48171.0, 62924.0, 77916.0, 91429.0, 100068.0, 102782.0, 97844.0, 87443.0, 72676.0, 57830.0, 43387.0, 31743.0, 21891.0, 14955.0, 10128.0, 6776.0, 4087.0, 2756.0, 1742.0, 1099.0, 700.0, 463.0, 272.0, 178.0, 98.0, 60.0, 35.0, 25.0, 18.0, 13.0, 7.0, 6.0, 2.0, 3.0, 0.0, 3.0], "bins": [-14.3046875, -13.8756103515625, -13.446533203125, -13.0174560546875, -12.58837890625, -12.1593017578125, -11.730224609375, -11.3011474609375, -10.8720703125, -10.4429931640625, -10.013916015625, -9.5848388671875, -9.15576171875, -8.7266845703125, -8.297607421875, -7.8685302734375, -7.439453125, -7.0103759765625, -6.581298828125, -6.1522216796875, -5.72314453125, -5.2940673828125, -4.864990234375, -4.4359130859375, -4.0068359375, -3.5777587890625, -3.148681640625, -2.7196044921875, -2.29052734375, -1.8614501953125, -1.432373046875, -1.0032958984375, -0.57421875, -0.1451416015625, 0.283935546875, 0.7130126953125, 1.14208984375, 1.5711669921875, 2.000244140625, 2.4293212890625, 2.8583984375, 3.2874755859375, 3.716552734375, 4.1456298828125, 4.57470703125, 5.0037841796875, 5.432861328125, 5.8619384765625, 6.291015625, 6.7200927734375, 7.149169921875, 7.5782470703125, 8.00732421875, 8.4364013671875, 8.865478515625, 9.2945556640625, 9.7236328125, 10.1527099609375, 10.581787109375, 11.0108642578125, 11.43994140625, 11.8690185546875, 12.298095703125, 12.7271728515625, 13.15625]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 6.0, 4.0, 9.0, 8.0, 9.0, 17.0, 11.0, 18.0, 21.0, 13.0, 22.0, 23.0, 23.0, 31.0, 26.0, 29.0, 32.0, 36.0, 42.0, 40.0, 41.0, 41.0, 40.0, 40.0, 38.0, 44.0, 36.0, 26.0, 35.0, 22.0, 30.0, 22.0, 26.0, 17.0, 17.0, 15.0, 15.0, 12.0, 10.0, 8.0, 10.0, 7.0, 2.0, 11.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-21.4375, -20.7265625, -20.015625, -19.3046875, -18.59375, -17.8828125, -17.171875, -16.4609375, -15.75, -15.0390625, -14.328125, -13.6171875, -12.90625, -12.1953125, -11.484375, -10.7734375, -10.0625, -9.3515625, -8.640625, -7.9296875, -7.21875, -6.5078125, -5.796875, -5.0859375, -4.375, -3.6640625, -2.953125, -2.2421875, -1.53125, -0.8203125, -0.109375, 0.6015625, 1.3125, 2.0234375, 2.734375, 3.4453125, 4.15625, 4.8671875, 5.578125, 6.2890625, 7.0, 7.7109375, 8.421875, 9.1328125, 9.84375, 10.5546875, 11.265625, 11.9765625, 12.6875, 13.3984375, 14.109375, 14.8203125, 15.53125, 16.2421875, 16.953125, 17.6640625, 18.375, 19.0859375, 19.796875, 20.5078125, 21.21875, 21.9296875, 22.640625, 23.3515625, 24.0625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 6.0, 7.0, 12.0, 16.0, 34.0, 42.0, 59.0, 82.0, 125.0, 168.0, 274.0, 338.0, 521.0, 763.0, 1137.0, 1768.0, 2511.0, 3889.0, 5761.0, 8976.0, 13598.0, 20132.0, 29535.0, 42356.0, 58540.0, 77329.0, 94106.0, 106920.0, 111695.0, 106994.0, 94139.0, 76747.0, 58671.0, 42215.0, 29657.0, 19826.0, 13317.0, 8758.0, 5844.0, 3873.0, 2468.0, 1733.0, 1167.0, 810.0, 516.0, 356.0, 272.0, 164.0, 106.0, 66.0, 44.0, 37.0, 36.0, 13.0, 15.0, 4.0, 9.0, 6.0, 3.0, 2.0], "bins": [-17.53125, -16.99169921875, -16.4521484375, -15.91259765625, -15.373046875, -14.83349609375, -14.2939453125, -13.75439453125, -13.21484375, -12.67529296875, -12.1357421875, -11.59619140625, -11.056640625, -10.51708984375, -9.9775390625, -9.43798828125, -8.8984375, -8.35888671875, -7.8193359375, -7.27978515625, -6.740234375, -6.20068359375, -5.6611328125, -5.12158203125, -4.58203125, -4.04248046875, -3.5029296875, -2.96337890625, -2.423828125, -1.88427734375, -1.3447265625, -0.80517578125, -0.265625, 0.27392578125, 0.8134765625, 1.35302734375, 1.892578125, 2.43212890625, 2.9716796875, 3.51123046875, 4.05078125, 4.59033203125, 5.1298828125, 5.66943359375, 6.208984375, 6.74853515625, 7.2880859375, 7.82763671875, 8.3671875, 8.90673828125, 9.4462890625, 9.98583984375, 10.525390625, 11.06494140625, 11.6044921875, 12.14404296875, 12.68359375, 13.22314453125, 13.7626953125, 14.30224609375, 14.841796875, 15.38134765625, 15.9208984375, 16.46044921875, 17.0]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 5.0, 4.0, 2.0, 7.0, 7.0, 9.0, 13.0, 16.0, 16.0, 12.0, 13.0, 16.0, 20.0, 24.0, 30.0, 31.0, 30.0, 33.0, 36.0, 35.0, 43.0, 31.0, 32.0, 40.0, 45.0, 47.0, 45.0, 42.0, 37.0, 20.0, 31.0, 36.0, 27.0, 19.0, 23.0, 26.0, 16.0, 10.0, 13.0, 15.0, 7.0, 10.0, 5.0, 3.0, 7.0, 5.0, 3.0, 3.0, 4.0, 0.0, 2.0], "bins": [-17.390625, -16.918701171875, -16.44677734375, -15.974853515625, -15.5029296875, -15.031005859375, -14.55908203125, -14.087158203125, -13.615234375, -13.143310546875, -12.67138671875, -12.199462890625, -11.7275390625, -11.255615234375, -10.78369140625, -10.311767578125, -9.83984375, -9.367919921875, -8.89599609375, -8.424072265625, -7.9521484375, -7.480224609375, -7.00830078125, -6.536376953125, -6.064453125, -5.592529296875, -5.12060546875, -4.648681640625, -4.1767578125, -3.704833984375, -3.23291015625, -2.760986328125, -2.2890625, -1.817138671875, -1.34521484375, -0.873291015625, -0.4013671875, 0.070556640625, 0.54248046875, 1.014404296875, 1.486328125, 1.958251953125, 2.43017578125, 2.902099609375, 3.3740234375, 3.845947265625, 4.31787109375, 4.789794921875, 5.26171875, 5.733642578125, 6.20556640625, 6.677490234375, 7.1494140625, 7.621337890625, 8.09326171875, 8.565185546875, 9.037109375, 9.509033203125, 9.98095703125, 10.452880859375, 10.9248046875, 11.396728515625, 11.86865234375, 12.340576171875, 12.8125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 9.0, 11.0, 15.0, 22.0, 30.0, 42.0, 70.0, 108.0, 169.0, 239.0, 378.0, 566.0, 861.0, 1303.0, 2199.0, 3270.0, 5310.0, 8401.0, 13352.0, 21065.0, 32951.0, 49412.0, 70497.0, 94624.0, 115502.0, 127354.0, 124511.0, 108335.0, 85650.0, 62720.0, 42704.0, 28263.0, 17917.0, 11496.0, 6967.0, 4415.0, 2839.0, 1727.0, 1139.0, 705.0, 446.0, 309.0, 210.0, 136.0, 102.0, 73.0, 56.0, 24.0, 22.0, 11.0, 11.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-6.2734375, -6.082275390625, -5.89111328125, -5.699951171875, -5.5087890625, -5.317626953125, -5.12646484375, -4.935302734375, -4.744140625, -4.552978515625, -4.36181640625, -4.170654296875, -3.9794921875, -3.788330078125, -3.59716796875, -3.406005859375, -3.21484375, -3.023681640625, -2.83251953125, -2.641357421875, -2.4501953125, -2.259033203125, -2.06787109375, -1.876708984375, -1.685546875, -1.494384765625, -1.30322265625, -1.112060546875, -0.9208984375, -0.729736328125, -0.53857421875, -0.347412109375, -0.15625, 0.034912109375, 0.22607421875, 0.417236328125, 0.6083984375, 0.799560546875, 0.99072265625, 1.181884765625, 1.373046875, 1.564208984375, 1.75537109375, 1.946533203125, 2.1376953125, 2.328857421875, 2.52001953125, 2.711181640625, 2.90234375, 3.093505859375, 3.28466796875, 3.475830078125, 3.6669921875, 3.858154296875, 4.04931640625, 4.240478515625, 4.431640625, 4.622802734375, 4.81396484375, 5.005126953125, 5.1962890625, 5.387451171875, 5.57861328125, 5.769775390625, 5.9609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 8.0, 7.0, 14.0, 19.0, 24.0, 26.0, 21.0, 23.0, 21.0, 38.0, 33.0, 53.0, 54.0, 55.0, 59.0, 46.0, 59.0, 52.0, 55.0, 55.0, 37.0, 28.0, 45.0, 31.0, 26.0, 26.0, 18.0, 10.0, 7.0, 9.0, 8.0, 5.0, 3.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007405281066894531, -0.0007174089550971985, -0.0006942898035049438, -0.0006711706519126892, -0.0006480515003204346, -0.0006249323487281799, -0.0006018131971359253, -0.0005786940455436707, -0.000555574893951416, -0.0005324557423591614, -0.0005093365907669067, -0.0004862174391746521, -0.00046309828758239746, -0.0004399791359901428, -0.0004168599843978882, -0.00039374083280563354, -0.0003706216812133789, -0.00034750252962112427, -0.00032438337802886963, -0.000301264226436615, -0.00027814507484436035, -0.0002550259232521057, -0.00023190677165985107, -0.00020878762006759644, -0.0001856684684753418, -0.00016254931688308716, -0.00013943016529083252, -0.00011631101369857788, -9.319186210632324e-05, -7.00727105140686e-05, -4.6953558921813965e-05, -2.3834407329559326e-05, -7.152557373046875e-07, 2.240389585494995e-05, 4.552304744720459e-05, 6.864219903945923e-05, 9.176135063171387e-05, 0.0001148805022239685, 0.00013799965381622314, 0.00016111880540847778, 0.00018423795700073242, 0.00020735710859298706, 0.0002304762601852417, 0.00025359541177749634, 0.000276714563369751, 0.0002998337149620056, 0.00032295286655426025, 0.0003460720181465149, 0.00036919116973876953, 0.00039231032133102417, 0.0004154294729232788, 0.00043854862451553345, 0.0004616677761077881, 0.0004847869277000427, 0.0005079060792922974, 0.000531025230884552, 0.0005541443824768066, 0.0005772635340690613, 0.0006003826856613159, 0.0006235018372535706, 0.0006466209888458252, 0.0006697401404380798, 0.0006928592920303345, 0.0007159784436225891, 0.0007390975952148438]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 13.0, 16.0, 20.0, 47.0, 53.0, 65.0, 116.0, 168.0, 227.0, 339.0, 552.0, 869.0, 1421.0, 2162.0, 3386.0, 5283.0, 8380.0, 12792.0, 19949.0, 30350.0, 43891.0, 61310.0, 81264.0, 100202.0, 114483.0, 116827.0, 110181.0, 93926.0, 73879.0, 54664.0, 38208.0, 26007.0, 16929.0, 10881.0, 7082.0, 4562.0, 2888.0, 1819.0, 1130.0, 768.0, 490.0, 316.0, 203.0, 144.0, 83.0, 63.0, 49.0, 31.0, 16.0, 22.0, 11.0, 8.0, 3.0, 2.0, 2.0, 1.0, 4.0], "bins": [-5.6171875, -5.443359375, -5.26953125, -5.095703125, -4.921875, -4.748046875, -4.57421875, -4.400390625, -4.2265625, -4.052734375, -3.87890625, -3.705078125, -3.53125, -3.357421875, -3.18359375, -3.009765625, -2.8359375, -2.662109375, -2.48828125, -2.314453125, -2.140625, -1.966796875, -1.79296875, -1.619140625, -1.4453125, -1.271484375, -1.09765625, -0.923828125, -0.75, -0.576171875, -0.40234375, -0.228515625, -0.0546875, 0.119140625, 0.29296875, 0.466796875, 0.640625, 0.814453125, 0.98828125, 1.162109375, 1.3359375, 1.509765625, 1.68359375, 1.857421875, 2.03125, 2.205078125, 2.37890625, 2.552734375, 2.7265625, 2.900390625, 3.07421875, 3.248046875, 3.421875, 3.595703125, 3.76953125, 3.943359375, 4.1171875, 4.291015625, 4.46484375, 4.638671875, 4.8125, 4.986328125, 5.16015625, 5.333984375, 5.5078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 3.0, 4.0, 7.0, 8.0, 12.0, 10.0, 13.0, 26.0, 30.0, 40.0, 32.0, 35.0, 45.0, 50.0, 54.0, 56.0, 48.0, 62.0, 57.0, 56.0, 41.0, 49.0, 45.0, 37.0, 43.0, 30.0, 31.0, 14.0, 15.0, 10.0, 6.0, 12.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.44940185546875, -2.3558349609375, -2.26226806640625, -2.168701171875, -2.07513427734375, -1.9815673828125, -1.88800048828125, -1.79443359375, -1.70086669921875, -1.6072998046875, -1.51373291015625, -1.420166015625, -1.32659912109375, -1.2330322265625, -1.13946533203125, -1.0458984375, -0.95233154296875, -0.8587646484375, -0.76519775390625, -0.671630859375, -0.57806396484375, -0.4844970703125, -0.39093017578125, -0.29736328125, -0.20379638671875, -0.1102294921875, -0.01666259765625, 0.076904296875, 0.17047119140625, 0.2640380859375, 0.35760498046875, 0.451171875, 0.54473876953125, 0.6383056640625, 0.73187255859375, 0.825439453125, 0.91900634765625, 1.0125732421875, 1.10614013671875, 1.19970703125, 1.29327392578125, 1.3868408203125, 1.48040771484375, 1.573974609375, 1.66754150390625, 1.7611083984375, 1.85467529296875, 1.9482421875, 2.04180908203125, 2.1353759765625, 2.22894287109375, 2.322509765625, 2.41607666015625, 2.5096435546875, 2.60321044921875, 2.69677734375, 2.79034423828125, 2.8839111328125, 2.97747802734375, 3.071044921875, 3.16461181640625, 3.2581787109375, 3.35174560546875, 3.4453125]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 4.0, 6.0, 11.0, 7.0, 21.0, 18.0, 14.0, 19.0, 21.0, 13.0, 24.0, 29.0, 30.0, 29.0, 51.0, 45.0, 44.0, 49.0, 51.0, 38.0, 42.0, 46.0, 48.0, 37.0, 32.0, 37.0, 37.0, 28.0, 23.0, 23.0, 25.0, 16.0, 9.0, 10.0, 14.0, 7.0, 11.0, 4.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-21.46728515625, -20.751571655273438, -20.035856246948242, -19.32014274597168, -18.604427337646484, -17.888713836669922, -17.172998428344727, -16.457284927368164, -15.741569519042969, -15.02585506439209, -14.310140609741211, -13.594426155090332, -12.878711700439453, -12.162997245788574, -11.447282791137695, -10.731569290161133, -10.015854835510254, -9.300140380859375, -8.584425926208496, -7.868711471557617, -7.152997016906738, -6.437282562255859, -5.721568584442139, -5.00585412979126, -4.290139675140381, -3.574425220489502, -2.858710765838623, -2.1429965496063232, -1.4272820949554443, -0.7115676403045654, 0.004146575927734375, 0.7198610305786133, 1.4355754852294922, 2.151289939880371, 2.86700439453125, 3.58271861076355, 4.298433303833008, 5.014147758483887, 5.729861736297607, 6.445576190948486, 7.161290645599365, 7.877005100250244, 8.592719078063965, 9.308433532714844, 10.024147987365723, 10.739862442016602, 11.45557689666748, 12.17129135131836, 12.887005805969238, 13.602720260620117, 14.318434715270996, 15.034149169921875, 15.749863624572754, 16.465578079223633, 17.181291580200195, 17.89700698852539, 18.612720489501953, 19.328433990478516, 20.04414939880371, 20.759862899780273, 21.47557830810547, 22.19129180908203, 22.907007217407227, 23.62272071838379, 24.338436126708984]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 4.0, 5.0, 6.0, 7.0, 13.0, 16.0, 14.0, 19.0, 22.0, 18.0, 17.0, 28.0, 27.0, 29.0, 24.0, 36.0, 24.0, 36.0, 41.0, 31.0, 44.0, 39.0, 46.0, 37.0, 50.0, 34.0, 23.0, 37.0, 33.0, 20.0, 20.0, 22.0, 19.0, 20.0, 17.0, 21.0, 18.0, 15.0, 7.0, 11.0, 10.0, 9.0, 6.0, 6.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-23.3586368560791, -22.635541915893555, -21.912445068359375, -21.189350128173828, -20.46625518798828, -19.7431583404541, -19.020063400268555, -18.296966552734375, -17.573871612548828, -16.85077667236328, -16.1276798248291, -15.404584884643555, -14.681488990783691, -13.958393096923828, -13.235298156738281, -12.512202262878418, -11.789106369018555, -11.066010475158691, -10.342914581298828, -9.619819641113281, -8.896723747253418, -8.173627853393555, -7.45053243637085, -6.7274370193481445, -6.004341125488281, -5.281245231628418, -4.558149814605713, -3.8350541591644287, -3.1119585037231445, -2.3888628482818604, -1.6657671928405762, -0.9426717758178711, -0.2195758819580078, 0.5035197734832764, 1.2266154289245605, 1.9497110843658447, 2.672806739807129, 3.395902395248413, 4.118998050689697, 4.842093467712402, 5.565189361572266, 6.288285255432129, 7.011380672454834, 7.734476089477539, 8.457571983337402, 9.180667877197266, 9.903762817382812, 10.626858711242676, 11.349954605102539, 12.073050498962402, 12.796146392822266, 13.519241333007812, 14.242337226867676, 14.965433120727539, 15.688528060913086, 16.411624908447266, 17.134719848632812, 17.85781478881836, 18.58091163635254, 19.304006576538086, 20.027103424072266, 20.750198364257812, 21.47329330444336, 22.196388244628906, 22.919485092163086]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 6.0, 7.0, 7.0, 18.0, 45.0, 83.0, 133.0, 212.0, 370.0, 603.0, 1036.0, 1806.0, 2940.0, 5054.0, 8331.0, 14356.0, 24829.0, 42801.0, 73086.0, 123074.0, 201944.0, 311443.0, 441128.0, 555609.0, 599334.0, 551253.0, 437214.0, 307542.0, 197430.0, 120616.0, 71636.0, 41414.0, 24259.0, 14248.0, 8160.0, 4844.0, 2905.0, 1733.0, 1031.0, 635.0, 405.0, 244.0, 169.0, 98.0, 68.0, 44.0, 27.0, 21.0, 18.0, 7.0, 8.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.0, -17.389404296875, -16.77880859375, -16.168212890625, -15.5576171875, -14.947021484375, -14.33642578125, -13.725830078125, -13.115234375, -12.504638671875, -11.89404296875, -11.283447265625, -10.6728515625, -10.062255859375, -9.45166015625, -8.841064453125, -8.23046875, -7.619873046875, -7.00927734375, -6.398681640625, -5.7880859375, -5.177490234375, -4.56689453125, -3.956298828125, -3.345703125, -2.735107421875, -2.12451171875, -1.513916015625, -0.9033203125, -0.292724609375, 0.31787109375, 0.928466796875, 1.5390625, 2.149658203125, 2.76025390625, 3.370849609375, 3.9814453125, 4.592041015625, 5.20263671875, 5.813232421875, 6.423828125, 7.034423828125, 7.64501953125, 8.255615234375, 8.8662109375, 9.476806640625, 10.08740234375, 10.697998046875, 11.30859375, 11.919189453125, 12.52978515625, 13.140380859375, 13.7509765625, 14.361572265625, 14.97216796875, 15.582763671875, 16.193359375, 16.803955078125, 17.41455078125, 18.025146484375, 18.6357421875, 19.246337890625, 19.85693359375, 20.467529296875, 21.078125]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 3.0, 3.0, 7.0, 6.0, 12.0, 7.0, 13.0, 15.0, 11.0, 22.0, 17.0, 20.0, 21.0, 20.0, 19.0, 28.0, 32.0, 34.0, 38.0, 38.0, 36.0, 42.0, 35.0, 47.0, 26.0, 37.0, 34.0, 40.0, 28.0, 29.0, 26.0, 22.0, 19.0, 23.0, 20.0, 20.0, 18.0, 15.0, 27.0, 11.0, 15.0, 8.0, 10.0, 9.0, 11.0, 5.0, 3.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-16.0, -15.460693359375, -14.92138671875, -14.382080078125, -13.8427734375, -13.303466796875, -12.76416015625, -12.224853515625, -11.685546875, -11.146240234375, -10.60693359375, -10.067626953125, -9.5283203125, -8.989013671875, -8.44970703125, -7.910400390625, -7.37109375, -6.831787109375, -6.29248046875, -5.753173828125, -5.2138671875, -4.674560546875, -4.13525390625, -3.595947265625, -3.056640625, -2.517333984375, -1.97802734375, -1.438720703125, -0.8994140625, -0.360107421875, 0.17919921875, 0.718505859375, 1.2578125, 1.797119140625, 2.33642578125, 2.875732421875, 3.4150390625, 3.954345703125, 4.49365234375, 5.032958984375, 5.572265625, 6.111572265625, 6.65087890625, 7.190185546875, 7.7294921875, 8.268798828125, 8.80810546875, 9.347412109375, 9.88671875, 10.426025390625, 10.96533203125, 11.504638671875, 12.0439453125, 12.583251953125, 13.12255859375, 13.661865234375, 14.201171875, 14.740478515625, 15.27978515625, 15.819091796875, 16.3583984375, 16.897705078125, 17.43701171875, 17.976318359375, 18.515625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 11.0, 20.0, 30.0, 51.0, 112.0, 177.0, 266.0, 468.0, 847.0, 1374.0, 2288.0, 3813.0, 6378.0, 10740.0, 17784.0, 29248.0, 47339.0, 74269.0, 114430.0, 169608.0, 240301.0, 319101.0, 398717.0, 454638.0, 474231.0, 449031.0, 388734.0, 308566.0, 229636.0, 160930.0, 108743.0, 69560.0, 43984.0, 27363.0, 16654.0, 10086.0, 5901.0, 3633.0, 2066.0, 1287.0, 693.0, 439.0, 291.0, 182.0, 109.0, 57.0, 29.0, 24.0, 20.0, 14.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.0625, -15.53466796875, -15.0068359375, -14.47900390625, -13.951171875, -13.42333984375, -12.8955078125, -12.36767578125, -11.83984375, -11.31201171875, -10.7841796875, -10.25634765625, -9.728515625, -9.20068359375, -8.6728515625, -8.14501953125, -7.6171875, -7.08935546875, -6.5615234375, -6.03369140625, -5.505859375, -4.97802734375, -4.4501953125, -3.92236328125, -3.39453125, -2.86669921875, -2.3388671875, -1.81103515625, -1.283203125, -0.75537109375, -0.2275390625, 0.30029296875, 0.828125, 1.35595703125, 1.8837890625, 2.41162109375, 2.939453125, 3.46728515625, 3.9951171875, 4.52294921875, 5.05078125, 5.57861328125, 6.1064453125, 6.63427734375, 7.162109375, 7.68994140625, 8.2177734375, 8.74560546875, 9.2734375, 9.80126953125, 10.3291015625, 10.85693359375, 11.384765625, 11.91259765625, 12.4404296875, 12.96826171875, 13.49609375, 14.02392578125, 14.5517578125, 15.07958984375, 15.607421875, 16.13525390625, 16.6630859375, 17.19091796875, 17.71875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 5.0, 10.0, 13.0, 26.0, 16.0, 25.0, 27.0, 41.0, 51.0, 55.0, 68.0, 78.0, 88.0, 116.0, 133.0, 157.0, 173.0, 202.0, 193.0, 192.0, 203.0, 216.0, 251.0, 190.0, 212.0, 180.0, 157.0, 143.0, 151.0, 122.0, 102.0, 84.0, 69.0, 63.0, 53.0, 47.0, 39.0, 34.0, 21.0, 12.0, 13.0, 5.0, 8.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.2578125, -7.990478515625, -7.72314453125, -7.455810546875, -7.1884765625, -6.921142578125, -6.65380859375, -6.386474609375, -6.119140625, -5.851806640625, -5.58447265625, -5.317138671875, -5.0498046875, -4.782470703125, -4.51513671875, -4.247802734375, -3.98046875, -3.713134765625, -3.44580078125, -3.178466796875, -2.9111328125, -2.643798828125, -2.37646484375, -2.109130859375, -1.841796875, -1.574462890625, -1.30712890625, -1.039794921875, -0.7724609375, -0.505126953125, -0.23779296875, 0.029541015625, 0.296875, 0.564208984375, 0.83154296875, 1.098876953125, 1.3662109375, 1.633544921875, 1.90087890625, 2.168212890625, 2.435546875, 2.702880859375, 2.97021484375, 3.237548828125, 3.5048828125, 3.772216796875, 4.03955078125, 4.306884765625, 4.57421875, 4.841552734375, 5.10888671875, 5.376220703125, 5.6435546875, 5.910888671875, 6.17822265625, 6.445556640625, 6.712890625, 6.980224609375, 7.24755859375, 7.514892578125, 7.7822265625, 8.049560546875, 8.31689453125, 8.584228515625, 8.8515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 5.0, 6.0, 8.0, 6.0, 15.0, 17.0, 8.0, 29.0, 32.0, 30.0, 39.0, 29.0, 33.0, 34.0, 48.0, 59.0, 41.0, 47.0, 55.0, 49.0, 44.0, 41.0, 42.0, 37.0, 47.0, 34.0, 26.0, 25.0, 19.0, 17.0, 17.0, 8.0, 13.0, 14.0, 13.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.689062118530273, -17.978342056274414, -17.267623901367188, -16.556903839111328, -15.846183776855469, -15.135464668273926, -14.424745559692383, -13.714025497436523, -13.00330638885498, -12.292587280273438, -11.581867218017578, -10.871148109436035, -10.160429000854492, -9.449708938598633, -8.73898983001709, -8.028270721435547, -7.3175506591796875, -6.606831073760986, -5.896111488342285, -5.185392379760742, -4.474672794342041, -3.76395320892334, -3.053234100341797, -2.3425145149230957, -1.6317949295043945, -0.9210754632949829, -0.2103559970855713, 0.5003633499145508, 1.211082935333252, 1.9218025207519531, 2.632521629333496, 3.3432412147521973, 4.053962707519531, 4.764682292938232, 5.475401878356934, 6.186120986938477, 6.896840572357178, 7.607560157775879, 8.318279266357422, 9.028999328613281, 9.739718437194824, 10.450437545776367, 11.161157608032227, 11.87187671661377, 12.582595825195312, 13.293315887451172, 14.004034996032715, 14.714754104614258, 15.425474166870117, 16.136194229125977, 16.846912384033203, 17.557632446289062, 18.268352508544922, 18.97907257080078, 19.689790725708008, 20.400510787963867, 21.111228942871094, 21.821949005126953, 22.53266716003418, 23.24338722229004, 23.9541072845459, 24.664825439453125, 25.375545501708984, 26.086265563964844, 26.796985626220703]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 9.0, 7.0, 6.0, 12.0, 13.0, 18.0, 15.0, 25.0, 17.0, 30.0, 30.0, 40.0, 27.0, 30.0, 28.0, 45.0, 40.0, 44.0, 45.0, 46.0, 44.0, 34.0, 36.0, 37.0, 27.0, 35.0, 32.0, 22.0, 29.0, 18.0, 18.0, 15.0, 17.0, 22.0, 13.0, 15.0, 15.0, 13.0, 5.0, 8.0, 2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-22.43413734436035, -21.75115394592285, -21.06817054748535, -20.38518714904785, -19.70220375061035, -19.01922035217285, -18.336238861083984, -17.653255462646484, -16.970272064208984, -16.287288665771484, -15.604305267333984, -14.921321868896484, -14.238338470458984, -13.555355072021484, -12.8723726272583, -12.1893892288208, -11.506404876708984, -10.823421478271484, -10.140438079833984, -9.457454681396484, -8.774471282958984, -8.091487884521484, -7.408505439758301, -6.725522041320801, -6.042538642883301, -5.359555244445801, -4.676571846008301, -3.993588924407959, -3.310605525970459, -2.627622127532959, -1.9446392059326172, -1.2616558074951172, -0.5786724090576172, 0.10431087017059326, 0.7872941493988037, 1.4702773094177246, 2.1532607078552246, 2.8362441062927246, 3.5192270278930664, 4.202210426330566, 4.885193824768066, 5.568177223205566, 6.251160621643066, 6.934143543243408, 7.617126941680908, 8.30010986328125, 8.98309326171875, 9.66607666015625, 10.34906005859375, 11.03204345703125, 11.71502685546875, 12.39801025390625, 13.08099365234375, 13.76397705078125, 14.446959495544434, 15.129942893981934, 15.812926292419434, 16.495908737182617, 17.178892135620117, 17.861875534057617, 18.544858932495117, 19.227842330932617, 19.910825729370117, 20.593809127807617, 21.276792526245117]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 10.0, 7.0, 14.0, 21.0, 36.0, 56.0, 103.0, 130.0, 225.0, 390.0, 539.0, 897.0, 1252.0, 1895.0, 3057.0, 4324.0, 6527.0, 9232.0, 13413.0, 19140.0, 26694.0, 36998.0, 51230.0, 67899.0, 88286.0, 107495.0, 118073.0, 113450.0, 97462.0, 76652.0, 57905.0, 42494.0, 30632.0, 22254.0, 15709.0, 10922.0, 7667.0, 5207.0, 3574.0, 2374.0, 1478.0, 1028.0, 630.0, 430.0, 255.0, 166.0, 135.0, 76.0, 40.0, 31.0, 23.0, 12.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.6591796875, -18.974609375, -18.2900390625, -17.60546875, -16.9208984375, -16.236328125, -15.5517578125, -14.8671875, -14.1826171875, -13.498046875, -12.8134765625, -12.12890625, -11.4443359375, -10.759765625, -10.0751953125, -9.390625, -8.7060546875, -8.021484375, -7.3369140625, -6.65234375, -5.9677734375, -5.283203125, -4.5986328125, -3.9140625, -3.2294921875, -2.544921875, -1.8603515625, -1.17578125, -0.4912109375, 0.193359375, 0.8779296875, 1.5625, 2.2470703125, 2.931640625, 3.6162109375, 4.30078125, 4.9853515625, 5.669921875, 6.3544921875, 7.0390625, 7.7236328125, 8.408203125, 9.0927734375, 9.77734375, 10.4619140625, 11.146484375, 11.8310546875, 12.515625, 13.2001953125, 13.884765625, 14.5693359375, 15.25390625, 15.9384765625, 16.623046875, 17.3076171875, 17.9921875, 18.6767578125, 19.361328125, 20.0458984375, 20.73046875, 21.4150390625, 22.099609375, 22.7841796875, 23.46875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 0.0, 5.0, 5.0, 7.0, 7.0, 10.0, 13.0, 17.0, 12.0, 28.0, 17.0, 29.0, 30.0, 23.0, 27.0, 39.0, 34.0, 41.0, 34.0, 46.0, 42.0, 38.0, 45.0, 45.0, 45.0, 36.0, 29.0, 31.0, 29.0, 30.0, 28.0, 26.0, 20.0, 20.0, 22.0, 18.0, 16.0, 10.0, 14.0, 9.0, 6.0, 3.0, 8.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-21.03125, -20.412841796875, -19.79443359375, -19.176025390625, -18.5576171875, -17.939208984375, -17.32080078125, -16.702392578125, -16.083984375, -15.465576171875, -14.84716796875, -14.228759765625, -13.6103515625, -12.991943359375, -12.37353515625, -11.755126953125, -11.13671875, -10.518310546875, -9.89990234375, -9.281494140625, -8.6630859375, -8.044677734375, -7.42626953125, -6.807861328125, -6.189453125, -5.571044921875, -4.95263671875, -4.334228515625, -3.7158203125, -3.097412109375, -2.47900390625, -1.860595703125, -1.2421875, -0.623779296875, -0.00537109375, 0.613037109375, 1.2314453125, 1.849853515625, 2.46826171875, 3.086669921875, 3.705078125, 4.323486328125, 4.94189453125, 5.560302734375, 6.1787109375, 6.797119140625, 7.41552734375, 8.033935546875, 8.65234375, 9.270751953125, 9.88916015625, 10.507568359375, 11.1259765625, 11.744384765625, 12.36279296875, 12.981201171875, 13.599609375, 14.218017578125, 14.83642578125, 15.454833984375, 16.0732421875, 16.691650390625, 17.31005859375, 17.928466796875, 18.546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 11.0, 11.0, 20.0, 29.0, 44.0, 71.0, 84.0, 175.0, 275.0, 428.0, 647.0, 1023.0, 1534.0, 2445.0, 3989.0, 6349.0, 9917.0, 15755.0, 25190.0, 39706.0, 62969.0, 98932.0, 145657.0, 176629.0, 156637.0, 109623.0, 70809.0, 44345.0, 27815.0, 17697.0, 10974.0, 7010.0, 4308.0, 2743.0, 1755.0, 1089.0, 702.0, 442.0, 261.0, 205.0, 108.0, 54.0, 37.0, 30.0, 14.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-29.015625, -28.152587890625, -27.28955078125, -26.426513671875, -25.5634765625, -24.700439453125, -23.83740234375, -22.974365234375, -22.111328125, -21.248291015625, -20.38525390625, -19.522216796875, -18.6591796875, -17.796142578125, -16.93310546875, -16.070068359375, -15.20703125, -14.343994140625, -13.48095703125, -12.617919921875, -11.7548828125, -10.891845703125, -10.02880859375, -9.165771484375, -8.302734375, -7.439697265625, -6.57666015625, -5.713623046875, -4.8505859375, -3.987548828125, -3.12451171875, -2.261474609375, -1.3984375, -0.535400390625, 0.32763671875, 1.190673828125, 2.0537109375, 2.916748046875, 3.77978515625, 4.642822265625, 5.505859375, 6.368896484375, 7.23193359375, 8.094970703125, 8.9580078125, 9.821044921875, 10.68408203125, 11.547119140625, 12.41015625, 13.273193359375, 14.13623046875, 14.999267578125, 15.8623046875, 16.725341796875, 17.58837890625, 18.451416015625, 19.314453125, 20.177490234375, 21.04052734375, 21.903564453125, 22.7666015625, 23.629638671875, 24.49267578125, 25.355712890625, 26.21875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 5.0, 6.0, 13.0, 11.0, 12.0, 10.0, 22.0, 19.0, 21.0, 26.0, 27.0, 20.0, 24.0, 40.0, 35.0, 35.0, 29.0, 34.0, 37.0, 38.0, 42.0, 35.0, 40.0, 43.0, 34.0, 39.0, 37.0, 31.0, 28.0, 31.0, 27.0, 24.0, 15.0, 18.0, 24.0, 5.0, 9.0, 8.0, 9.0, 8.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.1953125, -13.725830078125, -13.25634765625, -12.786865234375, -12.3173828125, -11.847900390625, -11.37841796875, -10.908935546875, -10.439453125, -9.969970703125, -9.50048828125, -9.031005859375, -8.5615234375, -8.092041015625, -7.62255859375, -7.153076171875, -6.68359375, -6.214111328125, -5.74462890625, -5.275146484375, -4.8056640625, -4.336181640625, -3.86669921875, -3.397216796875, -2.927734375, -2.458251953125, -1.98876953125, -1.519287109375, -1.0498046875, -0.580322265625, -0.11083984375, 0.358642578125, 0.828125, 1.297607421875, 1.76708984375, 2.236572265625, 2.7060546875, 3.175537109375, 3.64501953125, 4.114501953125, 4.583984375, 5.053466796875, 5.52294921875, 5.992431640625, 6.4619140625, 6.931396484375, 7.40087890625, 7.870361328125, 8.33984375, 8.809326171875, 9.27880859375, 9.748291015625, 10.2177734375, 10.687255859375, 11.15673828125, 11.626220703125, 12.095703125, 12.565185546875, 13.03466796875, 13.504150390625, 13.9736328125, 14.443115234375, 14.91259765625, 15.382080078125, 15.8515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 14.0, 7.0, 16.0, 21.0, 25.0, 24.0, 56.0, 74.0, 126.0, 163.0, 222.0, 314.0, 501.0, 798.0, 1127.0, 1890.0, 3131.0, 5146.0, 8695.0, 15690.0, 29482.0, 61524.0, 169305.0, 506826.0, 131857.0, 52704.0, 25372.0, 13562.0, 7837.0, 4530.0, 2700.0, 1686.0, 1070.0, 646.0, 467.0, 318.0, 197.0, 150.0, 88.0, 49.0, 44.0, 33.0, 25.0, 14.0, 15.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-66.75, -64.6240234375, -62.498046875, -60.3720703125, -58.24609375, -56.1201171875, -53.994140625, -51.8681640625, -49.7421875, -47.6162109375, -45.490234375, -43.3642578125, -41.23828125, -39.1123046875, -36.986328125, -34.8603515625, -32.734375, -30.6083984375, -28.482421875, -26.3564453125, -24.23046875, -22.1044921875, -19.978515625, -17.8525390625, -15.7265625, -13.6005859375, -11.474609375, -9.3486328125, -7.22265625, -5.0966796875, -2.970703125, -0.8447265625, 1.28125, 3.4072265625, 5.533203125, 7.6591796875, 9.78515625, 11.9111328125, 14.037109375, 16.1630859375, 18.2890625, 20.4150390625, 22.541015625, 24.6669921875, 26.79296875, 28.9189453125, 31.044921875, 33.1708984375, 35.296875, 37.4228515625, 39.548828125, 41.6748046875, 43.80078125, 45.9267578125, 48.052734375, 50.1787109375, 52.3046875, 54.4306640625, 56.556640625, 58.6826171875, 60.80859375, 62.9345703125, 65.060546875, 67.1865234375, 69.3125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 8.0, 2.0, 8.0, 8.0, 13.0, 10.0, 14.0, 8.0, 19.0, 25.0, 43.0, 38.0, 66.0, 127.0, 221.0, 121.0, 61.0, 57.0, 37.0, 22.0, 22.0, 18.0, 14.0, 8.0, 8.0, 7.0, 6.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00991058349609375, -0.009652256965637207, -0.009393930435180664, -0.009135603904724121, -0.008877277374267578, -0.008618950843811035, -0.008360624313354492, -0.00810229778289795, -0.007843971252441406, -0.007585644721984863, -0.00732731819152832, -0.007068991661071777, -0.006810665130615234, -0.006552338600158691, -0.0062940120697021484, -0.0060356855392456055, -0.0057773590087890625, -0.0055190324783325195, -0.0052607059478759766, -0.005002379417419434, -0.004744052886962891, -0.004485726356506348, -0.004227399826049805, -0.003969073295593262, -0.0037107467651367188, -0.0034524202346801758, -0.003194093704223633, -0.00293576717376709, -0.002677440643310547, -0.002419114112854004, -0.002160787582397461, -0.001902461051940918, -0.001644134521484375, -0.001385807991027832, -0.001127481460571289, -0.0008691549301147461, -0.0006108283996582031, -0.00035250186920166016, -9.417533874511719e-05, 0.00016415119171142578, 0.00042247772216796875, 0.0006808042526245117, 0.0009391307830810547, 0.0011974573135375977, 0.0014557838439941406, 0.0017141103744506836, 0.0019724369049072266, 0.0022307634353637695, 0.0024890899658203125, 0.0027474164962768555, 0.0030057430267333984, 0.0032640695571899414, 0.0035223960876464844, 0.0037807226181030273, 0.00403904914855957, 0.004297375679016113, 0.004555702209472656, 0.004814028739929199, 0.005072355270385742, 0.005330681800842285, 0.005589008331298828, 0.005847334861755371, 0.006105661392211914, 0.006363987922668457, 0.006622314453125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 6.0, 7.0, 4.0, 17.0, 24.0, 31.0, 42.0, 57.0, 59.0, 100.0, 139.0, 212.0, 305.0, 491.0, 707.0, 1166.0, 1750.0, 2793.0, 4159.0, 6594.0, 10062.0, 15599.0, 23878.0, 37810.0, 60880.0, 114595.0, 276048.0, 238086.0, 99373.0, 55859.0, 34483.0, 22403.0, 14225.0, 9568.0, 6083.0, 3879.0, 2424.0, 1573.0, 1029.0, 684.0, 411.0, 292.0, 191.0, 137.0, 98.0, 59.0, 45.0, 27.0, 27.0, 25.0, 10.0, 12.0, 9.0, 4.0, 7.0, 7.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-32.15625, -31.0810546875, -30.005859375, -28.9306640625, -27.85546875, -26.7802734375, -25.705078125, -24.6298828125, -23.5546875, -22.4794921875, -21.404296875, -20.3291015625, -19.25390625, -18.1787109375, -17.103515625, -16.0283203125, -14.953125, -13.8779296875, -12.802734375, -11.7275390625, -10.65234375, -9.5771484375, -8.501953125, -7.4267578125, -6.3515625, -5.2763671875, -4.201171875, -3.1259765625, -2.05078125, -0.9755859375, 0.099609375, 1.1748046875, 2.25, 3.3251953125, 4.400390625, 5.4755859375, 6.55078125, 7.6259765625, 8.701171875, 9.7763671875, 10.8515625, 11.9267578125, 13.001953125, 14.0771484375, 15.15234375, 16.2275390625, 17.302734375, 18.3779296875, 19.453125, 20.5283203125, 21.603515625, 22.6787109375, 23.75390625, 24.8291015625, 25.904296875, 26.9794921875, 28.0546875, 29.1298828125, 30.205078125, 31.2802734375, 32.35546875, 33.4306640625, 34.505859375, 35.5810546875, 36.65625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 4.0, 0.0, 6.0, 5.0, 3.0, 7.0, 10.0, 9.0, 7.0, 11.0, 14.0, 12.0, 14.0, 22.0, 25.0, 24.0, 38.0, 48.0, 77.0, 100.0, 145.0, 108.0, 55.0, 50.0, 47.0, 25.0, 31.0, 25.0, 18.0, 18.0, 7.0, 13.0, 8.0, 6.0, 5.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.534423828125, -15.99072265625, -15.447021484375, -14.9033203125, -14.359619140625, -13.81591796875, -13.272216796875, -12.728515625, -12.184814453125, -11.64111328125, -11.097412109375, -10.5537109375, -10.010009765625, -9.46630859375, -8.922607421875, -8.37890625, -7.835205078125, -7.29150390625, -6.747802734375, -6.2041015625, -5.660400390625, -5.11669921875, -4.572998046875, -4.029296875, -3.485595703125, -2.94189453125, -2.398193359375, -1.8544921875, -1.310791015625, -0.76708984375, -0.223388671875, 0.3203125, 0.864013671875, 1.40771484375, 1.951416015625, 2.4951171875, 3.038818359375, 3.58251953125, 4.126220703125, 4.669921875, 5.213623046875, 5.75732421875, 6.301025390625, 6.8447265625, 7.388427734375, 7.93212890625, 8.475830078125, 9.01953125, 9.563232421875, 10.10693359375, 10.650634765625, 11.1943359375, 11.738037109375, 12.28173828125, 12.825439453125, 13.369140625, 13.912841796875, 14.45654296875, 15.000244140625, 15.5439453125, 16.087646484375, 16.63134765625, 17.175048828125, 17.71875]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 15.0, 15.0, 16.0, 18.0, 30.0, 36.0, 29.0, 39.0, 36.0, 42.0, 51.0, 63.0, 65.0, 53.0, 52.0, 54.0, 53.0, 47.0, 59.0, 28.0, 39.0, 37.0, 35.0, 24.0, 15.0, 15.0, 8.0, 7.0, 8.0, 7.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.163423538208008, -24.25939178466797, -23.355361938476562, -22.451330184936523, -21.547300338745117, -20.643268585205078, -19.739238739013672, -18.835206985473633, -17.931175231933594, -17.027143478393555, -16.12311363220215, -15.21908187866211, -14.315052032470703, -13.411020278930664, -12.506989479064941, -11.602958679199219, -10.698928833007812, -9.79489803314209, -8.890867233276367, -7.986835956573486, -7.082805156707764, -6.178774356842041, -5.27474308013916, -4.3707122802734375, -3.466681480407715, -2.562650680541992, -1.6586196422576904, -0.7545886039733887, 0.14944219589233398, 1.0534729957580566, 1.9575042724609375, 2.86153507232666, 3.7655677795410156, 4.669598579406738, 5.573629379272461, 6.477660655975342, 7.3816914558410645, 8.285722732543945, 9.189753532409668, 10.09378433227539, 10.997815132141113, 11.901845932006836, 12.805876731872559, 13.709907531738281, 14.61393928527832, 15.517969131469727, 16.422000885009766, 17.326030731201172, 18.23006248474121, 19.13409423828125, 20.038124084472656, 20.942155838012695, 21.8461856842041, 22.75021743774414, 23.654247283935547, 24.558279037475586, 25.462310791015625, 26.366342544555664, 27.27037239074707, 28.17440414428711, 29.078433990478516, 29.982465744018555, 30.886497497558594, 31.79052734375, 32.694557189941406]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 6.0, 7.0, 9.0, 9.0, 9.0, 17.0, 22.0, 23.0, 17.0, 24.0, 26.0, 28.0, 27.0, 31.0, 37.0, 43.0, 38.0, 46.0, 36.0, 38.0, 39.0, 33.0, 36.0, 31.0, 34.0, 40.0, 22.0, 45.0, 30.0, 27.0, 20.0, 19.0, 19.0, 14.0, 16.0, 11.0, 11.0, 8.0, 13.0, 8.0, 5.0, 3.0, 4.0, 3.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.623764038085938, -22.84136199951172, -22.0589599609375, -21.27655792236328, -20.494157791137695, -19.711755752563477, -18.929353713989258, -18.14695167541504, -17.364551544189453, -16.582149505615234, -15.799748420715332, -15.017346382141113, -14.234945297241211, -13.452543258666992, -12.670141220092773, -11.887739181518555, -11.105337142944336, -10.322935104370117, -9.540534019470215, -8.758131980895996, -7.9757304191589355, -7.193328857421875, -6.410926818847656, -5.628525257110596, -4.846123695373535, -4.063722133636475, -3.281320333480835, -2.4989185333251953, -1.7165169715881348, -0.9341154098510742, -0.15171337127685547, 0.6306881904602051, 1.4130916595458984, 2.195493221282959, 2.9778950214385986, 3.7602968215942383, 4.542698383331299, 5.325099945068359, 6.107501983642578, 6.889903545379639, 7.672305107116699, 8.454707145690918, 9.23710823059082, 10.019510269165039, 10.801912307739258, 11.58431339263916, 12.366715431213379, 13.149116516113281, 13.9315185546875, 14.713920593261719, 15.496321678161621, 16.278724670410156, 17.061124801635742, 17.84352684020996, 18.62592887878418, 19.4083309173584, 20.190731048583984, 20.973133087158203, 21.755535125732422, 22.53793716430664, 23.320337295532227, 24.102739334106445, 24.885141372680664, 25.667543411254883, 26.4499454498291]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 2.0, 15.0, 13.0, 32.0, 38.0, 54.0, 96.0, 142.0, 192.0, 332.0, 504.0, 911.0, 1353.0, 2122.0, 3414.0, 5209.0, 8205.0, 12867.0, 19678.0, 29120.0, 42396.0, 59674.0, 78535.0, 96921.0, 110631.0, 115325.0, 109482.0, 95110.0, 76323.0, 57830.0, 41448.0, 28044.0, 18821.0, 12248.0, 7782.0, 5081.0, 3145.0, 1996.0, 1256.0, 775.0, 497.0, 354.0, 234.0, 124.0, 84.0, 56.0, 33.0, 20.0, 13.0, 9.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-16.515625, -16.006591796875, -15.49755859375, -14.988525390625, -14.4794921875, -13.970458984375, -13.46142578125, -12.952392578125, -12.443359375, -11.934326171875, -11.42529296875, -10.916259765625, -10.4072265625, -9.898193359375, -9.38916015625, -8.880126953125, -8.37109375, -7.862060546875, -7.35302734375, -6.843994140625, -6.3349609375, -5.825927734375, -5.31689453125, -4.807861328125, -4.298828125, -3.789794921875, -3.28076171875, -2.771728515625, -2.2626953125, -1.753662109375, -1.24462890625, -0.735595703125, -0.2265625, 0.282470703125, 0.79150390625, 1.300537109375, 1.8095703125, 2.318603515625, 2.82763671875, 3.336669921875, 3.845703125, 4.354736328125, 4.86376953125, 5.372802734375, 5.8818359375, 6.390869140625, 6.89990234375, 7.408935546875, 7.91796875, 8.427001953125, 8.93603515625, 9.445068359375, 9.9541015625, 10.463134765625, 10.97216796875, 11.481201171875, 11.990234375, 12.499267578125, 13.00830078125, 13.517333984375, 14.0263671875, 14.535400390625, 15.04443359375, 15.553466796875, 16.0625]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 6.0, 7.0, 4.0, 5.0, 3.0, 10.0, 14.0, 12.0, 17.0, 21.0, 15.0, 22.0, 24.0, 30.0, 30.0, 31.0, 41.0, 33.0, 36.0, 41.0, 35.0, 43.0, 40.0, 37.0, 26.0, 41.0, 37.0, 34.0, 48.0, 27.0, 25.0, 23.0, 18.0, 20.0, 21.0, 20.0, 15.0, 15.0, 13.0, 13.0, 8.0, 7.0, 5.0, 4.0, 7.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.1875, -21.440185546875, -20.69287109375, -19.945556640625, -19.1982421875, -18.450927734375, -17.70361328125, -16.956298828125, -16.208984375, -15.461669921875, -14.71435546875, -13.967041015625, -13.2197265625, -12.472412109375, -11.72509765625, -10.977783203125, -10.23046875, -9.483154296875, -8.73583984375, -7.988525390625, -7.2412109375, -6.493896484375, -5.74658203125, -4.999267578125, -4.251953125, -3.504638671875, -2.75732421875, -2.010009765625, -1.2626953125, -0.515380859375, 0.23193359375, 0.979248046875, 1.7265625, 2.473876953125, 3.22119140625, 3.968505859375, 4.7158203125, 5.463134765625, 6.21044921875, 6.957763671875, 7.705078125, 8.452392578125, 9.19970703125, 9.947021484375, 10.6943359375, 11.441650390625, 12.18896484375, 12.936279296875, 13.68359375, 14.430908203125, 15.17822265625, 15.925537109375, 16.6728515625, 17.420166015625, 18.16748046875, 18.914794921875, 19.662109375, 20.409423828125, 21.15673828125, 21.904052734375, 22.6513671875, 23.398681640625, 24.14599609375, 24.893310546875, 25.640625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 23.0, 34.0, 37.0, 65.0, 97.0, 171.0, 247.0, 421.0, 677.0, 1057.0, 1790.0, 2771.0, 4405.0, 7330.0, 11687.0, 19050.0, 30067.0, 46098.0, 69042.0, 94694.0, 119314.0, 135038.0, 131570.0, 113148.0, 87064.0, 61768.0, 40802.0, 26452.0, 16548.0, 10355.0, 6441.0, 3908.0, 2403.0, 1439.0, 944.0, 591.0, 332.0, 233.0, 162.0, 96.0, 70.0, 34.0, 29.0, 11.0, 11.0, 7.0, 9.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.4375, -18.763916015625, -18.09033203125, -17.416748046875, -16.7431640625, -16.069580078125, -15.39599609375, -14.722412109375, -14.048828125, -13.375244140625, -12.70166015625, -12.028076171875, -11.3544921875, -10.680908203125, -10.00732421875, -9.333740234375, -8.66015625, -7.986572265625, -7.31298828125, -6.639404296875, -5.9658203125, -5.292236328125, -4.61865234375, -3.945068359375, -3.271484375, -2.597900390625, -1.92431640625, -1.250732421875, -0.5771484375, 0.096435546875, 0.77001953125, 1.443603515625, 2.1171875, 2.790771484375, 3.46435546875, 4.137939453125, 4.8115234375, 5.485107421875, 6.15869140625, 6.832275390625, 7.505859375, 8.179443359375, 8.85302734375, 9.526611328125, 10.2001953125, 10.873779296875, 11.54736328125, 12.220947265625, 12.89453125, 13.568115234375, 14.24169921875, 14.915283203125, 15.5888671875, 16.262451171875, 16.93603515625, 17.609619140625, 18.283203125, 18.956787109375, 19.63037109375, 20.303955078125, 20.9775390625, 21.651123046875, 22.32470703125, 22.998291015625, 23.671875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 6.0, 8.0, 6.0, 20.0, 16.0, 11.0, 14.0, 25.0, 19.0, 35.0, 24.0, 28.0, 31.0, 33.0, 31.0, 36.0, 46.0, 48.0, 39.0, 37.0, 49.0, 38.0, 38.0, 39.0, 38.0, 38.0, 27.0, 27.0, 24.0, 22.0, 17.0, 30.0, 20.0, 11.0, 19.0, 17.0, 10.0, 3.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-20.984375, -20.398193359375, -19.81201171875, -19.225830078125, -18.6396484375, -18.053466796875, -17.46728515625, -16.881103515625, -16.294921875, -15.708740234375, -15.12255859375, -14.536376953125, -13.9501953125, -13.364013671875, -12.77783203125, -12.191650390625, -11.60546875, -11.019287109375, -10.43310546875, -9.846923828125, -9.2607421875, -8.674560546875, -8.08837890625, -7.502197265625, -6.916015625, -6.329833984375, -5.74365234375, -5.157470703125, -4.5712890625, -3.985107421875, -3.39892578125, -2.812744140625, -2.2265625, -1.640380859375, -1.05419921875, -0.468017578125, 0.1181640625, 0.704345703125, 1.29052734375, 1.876708984375, 2.462890625, 3.049072265625, 3.63525390625, 4.221435546875, 4.8076171875, 5.393798828125, 5.97998046875, 6.566162109375, 7.15234375, 7.738525390625, 8.32470703125, 8.910888671875, 9.4970703125, 10.083251953125, 10.66943359375, 11.255615234375, 11.841796875, 12.427978515625, 13.01416015625, 13.600341796875, 14.1865234375, 14.772705078125, 15.35888671875, 15.945068359375, 16.53125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 8.0, 8.0, 18.0, 31.0, 38.0, 63.0, 85.0, 137.0, 226.0, 391.0, 715.0, 1386.0, 3018.0, 6690.0, 16545.0, 45867.0, 141009.0, 335318.0, 310306.0, 121045.0, 39433.0, 14446.0, 6134.0, 2708.0, 1235.0, 681.0, 432.0, 218.0, 122.0, 84.0, 59.0, 35.0, 16.0, 18.0, 14.0, 6.0, 7.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.34375, -32.361083984375, -31.37841796875, -30.395751953125, -29.4130859375, -28.430419921875, -27.44775390625, -26.465087890625, -25.482421875, -24.499755859375, -23.51708984375, -22.534423828125, -21.5517578125, -20.569091796875, -19.58642578125, -18.603759765625, -17.62109375, -16.638427734375, -15.65576171875, -14.673095703125, -13.6904296875, -12.707763671875, -11.72509765625, -10.742431640625, -9.759765625, -8.777099609375, -7.79443359375, -6.811767578125, -5.8291015625, -4.846435546875, -3.86376953125, -2.881103515625, -1.8984375, -0.915771484375, 0.06689453125, 1.049560546875, 2.0322265625, 3.014892578125, 3.99755859375, 4.980224609375, 5.962890625, 6.945556640625, 7.92822265625, 8.910888671875, 9.8935546875, 10.876220703125, 11.85888671875, 12.841552734375, 13.82421875, 14.806884765625, 15.78955078125, 16.772216796875, 17.7548828125, 18.737548828125, 19.72021484375, 20.702880859375, 21.685546875, 22.668212890625, 23.65087890625, 24.633544921875, 25.6162109375, 26.598876953125, 27.58154296875, 28.564208984375, 29.546875]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 8.0, 12.0, 22.0, 27.0, 31.0, 45.0, 68.0, 75.0, 64.0, 86.0, 96.0, 107.0, 98.0, 60.0, 58.0, 44.0, 28.0, 21.0, 14.0, 9.0, 9.0, 1.0, 1.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00316619873046875, -0.003093242645263672, -0.0030202865600585938, -0.0029473304748535156, -0.0028743743896484375, -0.0028014183044433594, -0.0027284622192382812, -0.002655506134033203, -0.002582550048828125, -0.002509593963623047, -0.0024366378784179688, -0.0023636817932128906, -0.0022907257080078125, -0.0022177696228027344, -0.0021448135375976562, -0.002071857452392578, -0.0019989013671875, -0.0019259452819824219, -0.0018529891967773438, -0.0017800331115722656, -0.0017070770263671875, -0.0016341209411621094, -0.0015611648559570312, -0.0014882087707519531, -0.001415252685546875, -0.0013422966003417969, -0.0012693405151367188, -0.0011963844299316406, -0.0011234283447265625, -0.0010504722595214844, -0.0009775161743164062, -0.0009045600891113281, -0.00083160400390625, -0.0007586479187011719, -0.0006856918334960938, -0.0006127357482910156, -0.0005397796630859375, -0.0004668235778808594, -0.00039386749267578125, -0.0003209114074707031, -0.000247955322265625, -0.00017499923706054688, -0.00010204315185546875, -2.9087066650390625e-05, 4.38690185546875e-05, 0.00011682510375976562, 0.00018978118896484375, 0.0002627372741699219, 0.000335693359375, 0.0004086494445800781, 0.00048160552978515625, 0.0005545616149902344, 0.0006275177001953125, 0.0007004737854003906, 0.0007734298706054688, 0.0008463859558105469, 0.000919342041015625, 0.0009922981262207031, 0.0010652542114257812, 0.0011382102966308594, 0.0012111663818359375, 0.0012841224670410156, 0.0013570785522460938, 0.0014300346374511719, 0.00150299072265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 8.0, 13.0, 8.0, 16.0, 21.0, 34.0, 56.0, 76.0, 92.0, 135.0, 199.0, 293.0, 422.0, 592.0, 827.0, 1331.0, 1941.0, 3199.0, 5232.0, 8563.0, 15148.0, 27463.0, 49963.0, 88290.0, 140126.0, 183069.0, 182509.0, 138982.0, 86878.0, 49005.0, 26804.0, 14622.0, 8400.0, 5029.0, 3104.0, 1964.0, 1319.0, 912.0, 565.0, 392.0, 308.0, 177.0, 141.0, 115.0, 66.0, 50.0, 31.0, 22.0, 13.0, 15.0, 5.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-14.734375, -14.273681640625, -13.81298828125, -13.352294921875, -12.8916015625, -12.430908203125, -11.97021484375, -11.509521484375, -11.048828125, -10.588134765625, -10.12744140625, -9.666748046875, -9.2060546875, -8.745361328125, -8.28466796875, -7.823974609375, -7.36328125, -6.902587890625, -6.44189453125, -5.981201171875, -5.5205078125, -5.059814453125, -4.59912109375, -4.138427734375, -3.677734375, -3.217041015625, -2.75634765625, -2.295654296875, -1.8349609375, -1.374267578125, -0.91357421875, -0.452880859375, 0.0078125, 0.468505859375, 0.92919921875, 1.389892578125, 1.8505859375, 2.311279296875, 2.77197265625, 3.232666015625, 3.693359375, 4.154052734375, 4.61474609375, 5.075439453125, 5.5361328125, 5.996826171875, 6.45751953125, 6.918212890625, 7.37890625, 7.839599609375, 8.30029296875, 8.760986328125, 9.2216796875, 9.682373046875, 10.14306640625, 10.603759765625, 11.064453125, 11.525146484375, 11.98583984375, 12.446533203125, 12.9072265625, 13.367919921875, 13.82861328125, 14.289306640625, 14.75]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 4.0, 7.0, 5.0, 9.0, 10.0, 14.0, 19.0, 20.0, 43.0, 30.0, 45.0, 62.0, 50.0, 65.0, 74.0, 64.0, 69.0, 72.0, 71.0, 48.0, 48.0, 43.0, 14.0, 30.0, 9.0, 11.0, 18.0, 5.0, 10.0, 5.0, 6.0, 4.0, 0.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.30078125, -7.04510498046875, -6.7894287109375, -6.53375244140625, -6.278076171875, -6.02239990234375, -5.7667236328125, -5.51104736328125, -5.25537109375, -4.99969482421875, -4.7440185546875, -4.48834228515625, -4.232666015625, -3.97698974609375, -3.7213134765625, -3.46563720703125, -3.2099609375, -2.95428466796875, -2.6986083984375, -2.44293212890625, -2.187255859375, -1.93157958984375, -1.6759033203125, -1.42022705078125, -1.16455078125, -0.90887451171875, -0.6531982421875, -0.39752197265625, -0.141845703125, 0.11383056640625, 0.3695068359375, 0.62518310546875, 0.880859375, 1.13653564453125, 1.3922119140625, 1.64788818359375, 1.903564453125, 2.15924072265625, 2.4149169921875, 2.67059326171875, 2.92626953125, 3.18194580078125, 3.4376220703125, 3.69329833984375, 3.948974609375, 4.20465087890625, 4.4603271484375, 4.71600341796875, 4.9716796875, 5.22735595703125, 5.4830322265625, 5.73870849609375, 5.994384765625, 6.25006103515625, 6.5057373046875, 6.76141357421875, 7.01708984375, 7.27276611328125, 7.5284423828125, 7.78411865234375, 8.039794921875, 8.29547119140625, 8.5511474609375, 8.80682373046875, 9.0625]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 7.0, 7.0, 14.0, 18.0, 22.0, 29.0, 17.0, 30.0, 32.0, 35.0, 39.0, 36.0, 50.0, 52.0, 47.0, 65.0, 60.0, 50.0, 46.0, 47.0, 51.0, 33.0, 32.0, 29.0, 35.0, 29.0, 20.0, 14.0, 10.0, 13.0, 7.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.14018440246582, -21.32505989074707, -20.509937286376953, -19.694812774658203, -18.879688262939453, -18.064563751220703, -17.249441146850586, -16.434316635131836, -15.619193077087402, -14.804069519042969, -13.988945007324219, -13.173821449279785, -12.358697891235352, -11.543573379516602, -10.728449821472168, -9.913326263427734, -9.098201751708984, -8.28307819366455, -7.467953681945801, -6.652830123901367, -5.837706089019775, -5.022582054138184, -4.20745849609375, -3.392334461212158, -2.5772104263305664, -1.7620865106582642, -0.9469625949859619, -0.13183879852294922, 0.6832852363586426, 1.4984092712402344, 2.313532829284668, 3.1286568641662598, 3.9437789916992188, 4.7589030265808105, 5.574027061462402, 6.389150619506836, 7.204274654388428, 8.01939868927002, 8.834522247314453, 9.649646759033203, 10.464770317077637, 11.27989387512207, 12.09501838684082, 12.910141944885254, 13.725265502929688, 14.540390014648438, 15.355513572692871, 16.170637130737305, 16.985761642456055, 17.800886154174805, 18.616008758544922, 19.431133270263672, 20.246257781982422, 21.061382293701172, 21.87650489807129, 22.69162940979004, 23.506752014160156, 24.321876525878906, 25.136999130249023, 25.952123641967773, 26.767248153686523, 27.58237075805664, 28.39749526977539, 29.21261978149414, 30.02774429321289]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 5.0, 4.0, 6.0, 7.0, 11.0, 11.0, 16.0, 11.0, 14.0, 20.0, 22.0, 24.0, 33.0, 24.0, 29.0, 42.0, 49.0, 34.0, 40.0, 44.0, 49.0, 36.0, 50.0, 41.0, 33.0, 41.0, 38.0, 34.0, 28.0, 29.0, 16.0, 13.0, 26.0, 17.0, 14.0, 12.0, 13.0, 11.0, 9.0, 18.0, 11.0, 1.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.98694610595703, -24.161849975585938, -23.336753845214844, -22.51165771484375, -21.686561584472656, -20.861465454101562, -20.03636932373047, -19.211273193359375, -18.38617706298828, -17.561080932617188, -16.735984802246094, -15.910888671875, -15.085792541503906, -14.260696411132812, -13.435600280761719, -12.610504150390625, -11.785408973693848, -10.960312843322754, -10.13521671295166, -9.310120582580566, -8.485024452209473, -7.659928798675537, -6.834832668304443, -6.00973653793335, -5.184640407562256, -4.359544277191162, -3.5344481468200684, -2.7093522548675537, -1.88425612449646, -1.0591602325439453, -0.23406410217285156, 0.5910320281982422, 1.416128158569336, 2.2412242889404297, 3.0663204193115234, 3.891416311264038, 4.716512680053711, 5.5416083335876465, 6.36670446395874, 7.191800594329834, 8.016897201538086, 8.84199333190918, 9.667089462280273, 10.492185592651367, 11.317281723022461, 12.142377853393555, 12.967473983764648, 13.792570114135742, 14.61766529083252, 15.442761421203613, 16.26785659790039, 17.092952728271484, 17.918048858642578, 18.743144989013672, 19.568241119384766, 20.39333724975586, 21.218433380126953, 22.043529510498047, 22.86862564086914, 23.693721771240234, 24.518817901611328, 25.343914031982422, 26.169010162353516, 26.99410629272461, 27.819202423095703]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [6.0, 2.0, 3.0, 11.0, 10.0, 21.0, 25.0, 54.0, 63.0, 118.0, 181.0, 280.0, 398.0, 701.0, 1029.0, 1623.0, 2695.0, 4102.0, 6588.0, 10400.0, 16693.0, 26871.0, 43431.0, 69475.0, 109633.0, 168860.0, 249833.0, 345825.0, 441087.0, 506787.0, 517456.0, 469642.0, 380972.0, 283356.0, 194654.0, 127184.0, 81073.0, 50641.0, 31236.0, 19174.0, 11986.0, 7511.0, 4754.0, 2864.0, 1850.0, 1142.0, 689.0, 467.0, 304.0, 197.0, 121.0, 82.0, 52.0, 41.0, 21.0, 10.0, 5.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-14.28125, -13.807861328125, -13.33447265625, -12.861083984375, -12.3876953125, -11.914306640625, -11.44091796875, -10.967529296875, -10.494140625, -10.020751953125, -9.54736328125, -9.073974609375, -8.6005859375, -8.127197265625, -7.65380859375, -7.180419921875, -6.70703125, -6.233642578125, -5.76025390625, -5.286865234375, -4.8134765625, -4.340087890625, -3.86669921875, -3.393310546875, -2.919921875, -2.446533203125, -1.97314453125, -1.499755859375, -1.0263671875, -0.552978515625, -0.07958984375, 0.393798828125, 0.8671875, 1.340576171875, 1.81396484375, 2.287353515625, 2.7607421875, 3.234130859375, 3.70751953125, 4.180908203125, 4.654296875, 5.127685546875, 5.60107421875, 6.074462890625, 6.5478515625, 7.021240234375, 7.49462890625, 7.968017578125, 8.44140625, 8.914794921875, 9.38818359375, 9.861572265625, 10.3349609375, 10.808349609375, 11.28173828125, 11.755126953125, 12.228515625, 12.701904296875, 13.17529296875, 13.648681640625, 14.1220703125, 14.595458984375, 15.06884765625, 15.542236328125, 16.015625]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 2.0, 6.0, 9.0, 5.0, 8.0, 17.0, 15.0, 21.0, 12.0, 20.0, 26.0, 31.0, 37.0, 46.0, 33.0, 40.0, 39.0, 37.0, 60.0, 36.0, 36.0, 44.0, 43.0, 49.0, 36.0, 28.0, 36.0, 27.0, 27.0, 19.0, 28.0, 19.0, 13.0, 18.0, 15.0, 13.0, 9.0, 8.0, 8.0, 3.0, 3.0, 4.0, 5.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.140625, -19.448974609375, -18.75732421875, -18.065673828125, -17.3740234375, -16.682373046875, -15.99072265625, -15.299072265625, -14.607421875, -13.915771484375, -13.22412109375, -12.532470703125, -11.8408203125, -11.149169921875, -10.45751953125, -9.765869140625, -9.07421875, -8.382568359375, -7.69091796875, -6.999267578125, -6.3076171875, -5.615966796875, -4.92431640625, -4.232666015625, -3.541015625, -2.849365234375, -2.15771484375, -1.466064453125, -0.7744140625, -0.082763671875, 0.60888671875, 1.300537109375, 1.9921875, 2.683837890625, 3.37548828125, 4.067138671875, 4.7587890625, 5.450439453125, 6.14208984375, 6.833740234375, 7.525390625, 8.217041015625, 8.90869140625, 9.600341796875, 10.2919921875, 10.983642578125, 11.67529296875, 12.366943359375, 13.05859375, 13.750244140625, 14.44189453125, 15.133544921875, 15.8251953125, 16.516845703125, 17.20849609375, 17.900146484375, 18.591796875, 19.283447265625, 19.97509765625, 20.666748046875, 21.3583984375, 22.050048828125, 22.74169921875, 23.433349609375, 24.125]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 18.0, 15.0, 28.0, 42.0, 73.0, 121.0, 199.0, 341.0, 547.0, 807.0, 1406.0, 2348.0, 3903.0, 6599.0, 10908.0, 18151.0, 29493.0, 48699.0, 77264.0, 120593.0, 181727.0, 260787.0, 352846.0, 441256.0, 498357.0, 503226.0, 453310.0, 368168.0, 276057.0, 192767.0, 128462.0, 82593.0, 51800.0, 32033.0, 19494.0, 11785.0, 7079.0, 4422.0, 2581.0, 1542.0, 945.0, 546.0, 356.0, 243.0, 137.0, 84.0, 40.0, 34.0, 22.0, 7.0, 7.0, 7.0, 5.0, 1.0, 1.0, 3.0], "bins": [-17.5, -16.970947265625, -16.44189453125, -15.912841796875, -15.3837890625, -14.854736328125, -14.32568359375, -13.796630859375, -13.267578125, -12.738525390625, -12.20947265625, -11.680419921875, -11.1513671875, -10.622314453125, -10.09326171875, -9.564208984375, -9.03515625, -8.506103515625, -7.97705078125, -7.447998046875, -6.9189453125, -6.389892578125, -5.86083984375, -5.331787109375, -4.802734375, -4.273681640625, -3.74462890625, -3.215576171875, -2.6865234375, -2.157470703125, -1.62841796875, -1.099365234375, -0.5703125, -0.041259765625, 0.48779296875, 1.016845703125, 1.5458984375, 2.074951171875, 2.60400390625, 3.133056640625, 3.662109375, 4.191162109375, 4.72021484375, 5.249267578125, 5.7783203125, 6.307373046875, 6.83642578125, 7.365478515625, 7.89453125, 8.423583984375, 8.95263671875, 9.481689453125, 10.0107421875, 10.539794921875, 11.06884765625, 11.597900390625, 12.126953125, 12.656005859375, 13.18505859375, 13.714111328125, 14.2431640625, 14.772216796875, 15.30126953125, 15.830322265625, 16.359375]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 10.0, 5.0, 14.0, 7.0, 18.0, 27.0, 36.0, 35.0, 54.0, 49.0, 66.0, 96.0, 103.0, 117.0, 143.0, 123.0, 170.0, 188.0, 201.0, 186.0, 188.0, 221.0, 229.0, 233.0, 190.0, 185.0, 199.0, 152.0, 137.0, 115.0, 104.0, 103.0, 71.0, 62.0, 44.0, 39.0, 28.0, 28.0, 27.0, 15.0, 18.0, 5.0, 6.0, 9.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0], "bins": [-8.953125, -8.68115234375, -8.4091796875, -8.13720703125, -7.865234375, -7.59326171875, -7.3212890625, -7.04931640625, -6.77734375, -6.50537109375, -6.2333984375, -5.96142578125, -5.689453125, -5.41748046875, -5.1455078125, -4.87353515625, -4.6015625, -4.32958984375, -4.0576171875, -3.78564453125, -3.513671875, -3.24169921875, -2.9697265625, -2.69775390625, -2.42578125, -2.15380859375, -1.8818359375, -1.60986328125, -1.337890625, -1.06591796875, -0.7939453125, -0.52197265625, -0.25, 0.02197265625, 0.2939453125, 0.56591796875, 0.837890625, 1.10986328125, 1.3818359375, 1.65380859375, 1.92578125, 2.19775390625, 2.4697265625, 2.74169921875, 3.013671875, 3.28564453125, 3.5576171875, 3.82958984375, 4.1015625, 4.37353515625, 4.6455078125, 4.91748046875, 5.189453125, 5.46142578125, 5.7333984375, 6.00537109375, 6.27734375, 6.54931640625, 6.8212890625, 7.09326171875, 7.365234375, 7.63720703125, 7.9091796875, 8.18115234375, 8.453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 2.0, 9.0, 5.0, 7.0, 15.0, 4.0, 17.0, 34.0, 22.0, 25.0, 31.0, 28.0, 41.0, 38.0, 48.0, 51.0, 39.0, 45.0, 66.0, 51.0, 52.0, 54.0, 45.0, 34.0, 51.0, 34.0, 27.0, 16.0, 21.0, 22.0, 17.0, 15.0, 10.0, 9.0, 8.0, 10.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.552875518798828, -20.764923095703125, -19.976972579956055, -19.18902015686035, -18.40106964111328, -17.613117218017578, -16.825164794921875, -16.037212371826172, -15.249261856079102, -14.461310386657715, -13.673358917236328, -12.885406494140625, -12.097455024719238, -11.309503555297852, -10.521551132202148, -9.733599662780762, -8.945648193359375, -8.157696723937988, -7.369744777679443, -6.581792831420898, -5.793841361999512, -5.005889892578125, -4.21793794631958, -3.429986000061035, -2.6420345306396484, -1.8540828227996826, -1.0661311149597168, -0.278179407119751, 0.5097723007202148, 1.2977240085601807, 2.0856757164001465, 2.8736276626586914, 3.6615772247314453, 4.449528694152832, 5.237480640411377, 6.025432586669922, 6.813384056091309, 7.601335525512695, 8.389287948608398, 9.177239418029785, 9.965190887451172, 10.753142356872559, 11.541093826293945, 12.329046249389648, 13.116997718811035, 13.904949188232422, 14.692901611328125, 15.480853080749512, 16.2688045501709, 17.0567569732666, 17.844707489013672, 18.632659912109375, 19.420612335205078, 20.20856285095215, 20.99651527404785, 21.784465789794922, 22.572418212890625, 23.360370635986328, 24.1483211517334, 24.9362735748291, 25.724224090576172, 26.512176513671875, 27.300128936767578, 28.08808135986328, 28.87603187561035]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 6.0, 5.0, 7.0, 10.0, 12.0, 7.0, 17.0, 13.0, 19.0, 19.0, 27.0, 30.0, 28.0, 26.0, 49.0, 38.0, 45.0, 37.0, 25.0, 49.0, 44.0, 47.0, 54.0, 31.0, 28.0, 34.0, 29.0, 36.0, 19.0, 31.0, 30.0, 15.0, 15.0, 13.0, 15.0, 16.0, 12.0, 17.0, 7.0, 9.0, 3.0, 9.0, 8.0, 3.0, 0.0, 1.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-24.072805404663086, -23.315345764160156, -22.557886123657227, -21.80042839050293, -21.04296875, -20.28550910949707, -19.52804946899414, -18.770591735839844, -18.013132095336914, -17.255672454833984, -16.498212814331055, -15.740754127502441, -14.983295440673828, -14.225835800170898, -13.468376159667969, -12.710917472839355, -11.953457832336426, -11.195998191833496, -10.438539505004883, -9.681079864501953, -8.92362117767334, -8.16616153717041, -7.408702373504639, -6.651243209838867, -5.893784046173096, -5.136324882507324, -4.378865718841553, -3.621406316757202, -2.8639471530914307, -2.106487989425659, -1.3490285873413086, -0.5915694236755371, 0.16588973999023438, 0.9233489632606506, 1.680808186531067, 2.438267469406128, 3.1957266330718994, 3.953185796737671, 4.7106451988220215, 5.468104362487793, 6.2255635261535645, 6.983022689819336, 7.740481853485107, 8.497941017150879, 9.255400657653809, 10.012859344482422, 10.770318984985352, 11.527778625488281, 12.285237312316895, 13.042696952819824, 13.800155639648438, 14.557615280151367, 15.31507396697998, 16.072532653808594, 16.829992294311523, 17.587451934814453, 18.344911575317383, 19.102371215820312, 19.859830856323242, 20.61728858947754, 21.37474822998047, 22.1322078704834, 22.889667510986328, 23.647125244140625, 24.404584884643555]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 11.0, 10.0, 16.0, 34.0, 39.0, 63.0, 87.0, 134.0, 186.0, 246.0, 365.0, 530.0, 797.0, 1171.0, 1689.0, 2591.0, 3878.0, 5662.0, 8432.0, 12723.0, 18935.0, 29591.0, 45826.0, 74023.0, 121248.0, 174733.0, 183303.0, 133248.0, 82578.0, 51117.0, 32256.0, 20959.0, 13926.0, 9252.0, 6195.0, 4024.0, 2699.0, 1877.0, 1256.0, 890.0, 619.0, 410.0, 300.0, 190.0, 137.0, 101.0, 78.0, 44.0, 35.0, 16.0, 17.0, 10.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.265625, -23.459716796875, -22.65380859375, -21.847900390625, -21.0419921875, -20.236083984375, -19.43017578125, -18.624267578125, -17.818359375, -17.012451171875, -16.20654296875, -15.400634765625, -14.5947265625, -13.788818359375, -12.98291015625, -12.177001953125, -11.37109375, -10.565185546875, -9.75927734375, -8.953369140625, -8.1474609375, -7.341552734375, -6.53564453125, -5.729736328125, -4.923828125, -4.117919921875, -3.31201171875, -2.506103515625, -1.7001953125, -0.894287109375, -0.08837890625, 0.717529296875, 1.5234375, 2.329345703125, 3.13525390625, 3.941162109375, 4.7470703125, 5.552978515625, 6.35888671875, 7.164794921875, 7.970703125, 8.776611328125, 9.58251953125, 10.388427734375, 11.1943359375, 12.000244140625, 12.80615234375, 13.612060546875, 14.41796875, 15.223876953125, 16.02978515625, 16.835693359375, 17.6416015625, 18.447509765625, 19.25341796875, 20.059326171875, 20.865234375, 21.671142578125, 22.47705078125, 23.282958984375, 24.0888671875, 24.894775390625, 25.70068359375, 26.506591796875, 27.3125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 7.0, 2.0, 8.0, 14.0, 17.0, 17.0, 14.0, 15.0, 32.0, 25.0, 27.0, 32.0, 42.0, 32.0, 36.0, 50.0, 54.0, 34.0, 56.0, 38.0, 41.0, 39.0, 39.0, 44.0, 25.0, 34.0, 19.0, 27.0, 30.0, 22.0, 16.0, 18.0, 16.0, 15.0, 14.0, 11.0, 8.0, 9.0, 5.0, 2.0, 3.0, 3.0, 0.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.28125, -24.515869140625, -23.75048828125, -22.985107421875, -22.2197265625, -21.454345703125, -20.68896484375, -19.923583984375, -19.158203125, -18.392822265625, -17.62744140625, -16.862060546875, -16.0966796875, -15.331298828125, -14.56591796875, -13.800537109375, -13.03515625, -12.269775390625, -11.50439453125, -10.739013671875, -9.9736328125, -9.208251953125, -8.44287109375, -7.677490234375, -6.912109375, -6.146728515625, -5.38134765625, -4.615966796875, -3.8505859375, -3.085205078125, -2.31982421875, -1.554443359375, -0.7890625, -0.023681640625, 0.74169921875, 1.507080078125, 2.2724609375, 3.037841796875, 3.80322265625, 4.568603515625, 5.333984375, 6.099365234375, 6.86474609375, 7.630126953125, 8.3955078125, 9.160888671875, 9.92626953125, 10.691650390625, 11.45703125, 12.222412109375, 12.98779296875, 13.753173828125, 14.5185546875, 15.283935546875, 16.04931640625, 16.814697265625, 17.580078125, 18.345458984375, 19.11083984375, 19.876220703125, 20.6416015625, 21.406982421875, 22.17236328125, 22.937744140625, 23.703125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 5.0, 8.0, 10.0, 22.0, 39.0, 33.0, 53.0, 82.0, 114.0, 189.0, 255.0, 349.0, 524.0, 816.0, 1157.0, 1735.0, 2620.0, 4162.0, 6359.0, 10060.0, 15883.0, 25987.0, 44026.0, 77628.0, 145491.0, 234267.0, 204785.0, 114606.0, 61942.0, 35787.0, 21954.0, 13550.0, 8311.0, 5484.0, 3547.0, 2245.0, 1502.0, 971.0, 673.0, 406.0, 281.0, 190.0, 136.0, 106.0, 68.0, 57.0, 24.0, 21.0, 19.0, 11.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.65625, -25.73095703125, -24.8056640625, -23.88037109375, -22.955078125, -22.02978515625, -21.1044921875, -20.17919921875, -19.25390625, -18.32861328125, -17.4033203125, -16.47802734375, -15.552734375, -14.62744140625, -13.7021484375, -12.77685546875, -11.8515625, -10.92626953125, -10.0009765625, -9.07568359375, -8.150390625, -7.22509765625, -6.2998046875, -5.37451171875, -4.44921875, -3.52392578125, -2.5986328125, -1.67333984375, -0.748046875, 0.17724609375, 1.1025390625, 2.02783203125, 2.953125, 3.87841796875, 4.8037109375, 5.72900390625, 6.654296875, 7.57958984375, 8.5048828125, 9.43017578125, 10.35546875, 11.28076171875, 12.2060546875, 13.13134765625, 14.056640625, 14.98193359375, 15.9072265625, 16.83251953125, 17.7578125, 18.68310546875, 19.6083984375, 20.53369140625, 21.458984375, 22.38427734375, 23.3095703125, 24.23486328125, 25.16015625, 26.08544921875, 27.0107421875, 27.93603515625, 28.861328125, 29.78662109375, 30.7119140625, 31.63720703125, 32.5625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 7.0, 6.0, 9.0, 14.0, 22.0, 21.0, 22.0, 19.0, 20.0, 30.0, 38.0, 35.0, 43.0, 36.0, 42.0, 49.0, 38.0, 42.0, 46.0, 39.0, 48.0, 49.0, 44.0, 44.0, 40.0, 34.0, 23.0, 27.0, 14.0, 16.0, 17.0, 14.0, 13.0, 10.0, 9.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.34375, -21.69140625, -21.0390625, -20.38671875, -19.734375, -19.08203125, -18.4296875, -17.77734375, -17.125, -16.47265625, -15.8203125, -15.16796875, -14.515625, -13.86328125, -13.2109375, -12.55859375, -11.90625, -11.25390625, -10.6015625, -9.94921875, -9.296875, -8.64453125, -7.9921875, -7.33984375, -6.6875, -6.03515625, -5.3828125, -4.73046875, -4.078125, -3.42578125, -2.7734375, -2.12109375, -1.46875, -0.81640625, -0.1640625, 0.48828125, 1.140625, 1.79296875, 2.4453125, 3.09765625, 3.75, 4.40234375, 5.0546875, 5.70703125, 6.359375, 7.01171875, 7.6640625, 8.31640625, 8.96875, 9.62109375, 10.2734375, 10.92578125, 11.578125, 12.23046875, 12.8828125, 13.53515625, 14.1875, 14.83984375, 15.4921875, 16.14453125, 16.796875, 17.44921875, 18.1015625, 18.75390625, 19.40625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 9.0, 7.0, 10.0, 15.0, 30.0, 29.0, 41.0, 73.0, 95.0, 144.0, 209.0, 304.0, 444.0, 603.0, 914.0, 1437.0, 2210.0, 3426.0, 5587.0, 9454.0, 16982.0, 39296.0, 209795.0, 617677.0, 81711.0, 25370.0, 12774.0, 7364.0, 4412.0, 2721.0, 1793.0, 1183.0, 765.0, 557.0, 346.0, 211.0, 146.0, 126.0, 76.0, 49.0, 40.0, 35.0, 31.0, 17.0, 14.0, 10.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-57.6875, -55.89990234375, -54.1123046875, -52.32470703125, -50.537109375, -48.74951171875, -46.9619140625, -45.17431640625, -43.38671875, -41.59912109375, -39.8115234375, -38.02392578125, -36.236328125, -34.44873046875, -32.6611328125, -30.87353515625, -29.0859375, -27.29833984375, -25.5107421875, -23.72314453125, -21.935546875, -20.14794921875, -18.3603515625, -16.57275390625, -14.78515625, -12.99755859375, -11.2099609375, -9.42236328125, -7.634765625, -5.84716796875, -4.0595703125, -2.27197265625, -0.484375, 1.30322265625, 3.0908203125, 4.87841796875, 6.666015625, 8.45361328125, 10.2412109375, 12.02880859375, 13.81640625, 15.60400390625, 17.3916015625, 19.17919921875, 20.966796875, 22.75439453125, 24.5419921875, 26.32958984375, 28.1171875, 29.90478515625, 31.6923828125, 33.47998046875, 35.267578125, 37.05517578125, 38.8427734375, 40.63037109375, 42.41796875, 44.20556640625, 45.9931640625, 47.78076171875, 49.568359375, 51.35595703125, 53.1435546875, 54.93115234375, 56.71875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 6.0, 7.0, 14.0, 9.0, 9.0, 16.0, 41.0, 82.0, 267.0, 319.0, 100.0, 30.0, 19.0, 16.0, 10.0, 8.0, 9.0, 4.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00960540771484375, -0.009371817111968994, -0.009138226509094238, -0.008904635906219482, -0.008671045303344727, -0.00843745470046997, -0.008203864097595215, -0.007970273494720459, -0.007736682891845703, -0.007503092288970947, -0.007269501686096191, -0.0070359110832214355, -0.00680232048034668, -0.006568729877471924, -0.006335139274597168, -0.006101548671722412, -0.005867958068847656, -0.0056343674659729, -0.0054007768630981445, -0.005167186260223389, -0.004933595657348633, -0.004700005054473877, -0.004466414451599121, -0.004232823848724365, -0.003999233245849609, -0.0037656426429748535, -0.0035320520401000977, -0.003298461437225342, -0.003064870834350586, -0.00283128023147583, -0.0025976896286010742, -0.0023640990257263184, -0.0021305084228515625, -0.0018969178199768066, -0.0016633272171020508, -0.001429736614227295, -0.001196146011352539, -0.0009625554084777832, -0.0007289648056030273, -0.0004953742027282715, -0.0002617835998535156, -2.8192996978759766e-05, 0.0002053976058959961, 0.00043898820877075195, 0.0006725788116455078, 0.0009061694145202637, 0.0011397600173950195, 0.0013733506202697754, 0.0016069412231445312, 0.0018405318260192871, 0.002074122428894043, 0.002307713031768799, 0.0025413036346435547, 0.0027748942375183105, 0.0030084848403930664, 0.0032420754432678223, 0.003475666046142578, 0.003709256649017334, 0.00394284725189209, 0.004176437854766846, 0.0044100284576416016, 0.004643619060516357, 0.004877209663391113, 0.005110800266265869, 0.005344390869140625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 7.0, 11.0, 11.0, 11.0, 23.0, 24.0, 42.0, 66.0, 92.0, 127.0, 166.0, 259.0, 327.0, 464.0, 643.0, 864.0, 1164.0, 1665.0, 2335.0, 3480.0, 5309.0, 8466.0, 14392.0, 28080.0, 75952.0, 344927.0, 397750.0, 88498.0, 31052.0, 15410.0, 8983.0, 5697.0, 3637.0, 2458.0, 1783.0, 1176.0, 862.0, 659.0, 434.0, 336.0, 269.0, 187.0, 140.0, 101.0, 70.0, 54.0, 30.0, 22.0, 17.0, 15.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-35.65625, -34.42919921875, -33.2021484375, -31.97509765625, -30.748046875, -29.52099609375, -28.2939453125, -27.06689453125, -25.83984375, -24.61279296875, -23.3857421875, -22.15869140625, -20.931640625, -19.70458984375, -18.4775390625, -17.25048828125, -16.0234375, -14.79638671875, -13.5693359375, -12.34228515625, -11.115234375, -9.88818359375, -8.6611328125, -7.43408203125, -6.20703125, -4.97998046875, -3.7529296875, -2.52587890625, -1.298828125, -0.07177734375, 1.1552734375, 2.38232421875, 3.609375, 4.83642578125, 6.0634765625, 7.29052734375, 8.517578125, 9.74462890625, 10.9716796875, 12.19873046875, 13.42578125, 14.65283203125, 15.8798828125, 17.10693359375, 18.333984375, 19.56103515625, 20.7880859375, 22.01513671875, 23.2421875, 24.46923828125, 25.6962890625, 26.92333984375, 28.150390625, 29.37744140625, 30.6044921875, 31.83154296875, 33.05859375, 34.28564453125, 35.5126953125, 36.73974609375, 37.966796875, 39.19384765625, 40.4208984375, 41.64794921875, 42.875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 5.0, 2.0, 6.0, 5.0, 3.0, 7.0, 4.0, 11.0, 21.0, 27.0, 54.0, 69.0, 177.0, 222.0, 164.0, 81.0, 30.0, 28.0, 22.0, 9.0, 6.0, 9.0, 6.0, 9.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-20.109375, -19.490966796875, -18.87255859375, -18.254150390625, -17.6357421875, -17.017333984375, -16.39892578125, -15.780517578125, -15.162109375, -14.543701171875, -13.92529296875, -13.306884765625, -12.6884765625, -12.070068359375, -11.45166015625, -10.833251953125, -10.21484375, -9.596435546875, -8.97802734375, -8.359619140625, -7.7412109375, -7.122802734375, -6.50439453125, -5.885986328125, -5.267578125, -4.649169921875, -4.03076171875, -3.412353515625, -2.7939453125, -2.175537109375, -1.55712890625, -0.938720703125, -0.3203125, 0.298095703125, 0.91650390625, 1.534912109375, 2.1533203125, 2.771728515625, 3.39013671875, 4.008544921875, 4.626953125, 5.245361328125, 5.86376953125, 6.482177734375, 7.1005859375, 7.718994140625, 8.33740234375, 8.955810546875, 9.57421875, 10.192626953125, 10.81103515625, 11.429443359375, 12.0478515625, 12.666259765625, 13.28466796875, 13.903076171875, 14.521484375, 15.139892578125, 15.75830078125, 16.376708984375, 16.9951171875, 17.613525390625, 18.23193359375, 18.850341796875, 19.46875]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 10.0, 5.0, 16.0, 14.0, 15.0, 12.0, 33.0, 37.0, 36.0, 39.0, 50.0, 56.0, 54.0, 53.0, 51.0, 55.0, 54.0, 53.0, 57.0, 45.0, 55.0, 28.0, 42.0, 27.0, 18.0, 11.0, 12.0, 18.0, 12.0, 8.0, 11.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.906810760498047, -28.981761932373047, -28.05671501159668, -27.13166618347168, -26.20661735534668, -25.281570434570312, -24.356521606445312, -23.431472778320312, -22.506423950195312, -21.581375122070312, -20.656328201293945, -19.731279373168945, -18.806230545043945, -17.881183624267578, -16.956134796142578, -16.031085968017578, -15.106039047241211, -14.180991172790527, -13.255942344665527, -12.330894470214844, -11.405845642089844, -10.48079776763916, -9.555749893188477, -8.630701065063477, -7.705653190612793, -6.780604839324951, -5.855556488037109, -4.930508613586426, -4.005460262298584, -3.080411911010742, -2.1553640365600586, -1.2303156852722168, -0.3052692413330078, 0.6197789907455444, 1.5448272228240967, 2.4698753356933594, 3.394923686981201, 4.319972038269043, 5.245019912719727, 6.170068264007568, 7.09511661529541, 8.020164489746094, 8.945213317871094, 9.870261192321777, 10.795309066772461, 11.720357894897461, 12.645405769348145, 13.570453643798828, 14.495502471923828, 15.420550346374512, 16.345598220825195, 17.270647048950195, 18.195695877075195, 19.120742797851562, 20.045791625976562, 20.970840454101562, 21.895889282226562, 22.820938110351562, 23.74598503112793, 24.67103385925293, 25.59608268737793, 26.521129608154297, 27.446178436279297, 28.371227264404297, 29.296274185180664]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 7.0, 7.0, 9.0, 13.0, 8.0, 12.0, 22.0, 16.0, 17.0, 32.0, 33.0, 32.0, 32.0, 30.0, 28.0, 35.0, 41.0, 49.0, 48.0, 40.0, 39.0, 41.0, 33.0, 35.0, 38.0, 36.0, 32.0, 28.0, 25.0, 24.0, 27.0, 16.0, 16.0, 19.0, 17.0, 11.0, 8.0, 5.0, 11.0, 7.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.03859519958496, -27.12749671936035, -26.216400146484375, -25.305301666259766, -24.394203186035156, -23.483104705810547, -22.57200813293457, -21.66090965270996, -20.74981117248535, -19.838712692260742, -18.927616119384766, -18.016517639160156, -17.105419158935547, -16.194320678710938, -15.283224105834961, -14.372125625610352, -13.461028099060059, -12.549930572509766, -11.638832092285156, -10.727734565734863, -9.816636085510254, -8.905538558959961, -7.99444055557251, -7.083342552185059, -6.172244548797607, -5.261146545410156, -4.350048542022705, -3.438950777053833, -2.527852773666382, -1.6167550086975098, -0.7056570053100586, 0.20544099807739258, 1.1165390014648438, 2.027637004852295, 2.938735008239746, 3.849832773208618, 4.760931015014648, 5.672028541564941, 6.583126544952393, 7.494224548339844, 8.405323028564453, 9.316420555114746, 10.227519035339355, 11.138616561889648, 12.049715042114258, 12.96081256866455, 13.871910095214844, 14.783008575439453, 15.694106101989746, 16.60520362854004, 17.51630210876465, 18.427400588989258, 19.338497161865234, 20.249595642089844, 21.160694122314453, 22.071792602539062, 22.98288917541504, 23.89398765563965, 24.805084228515625, 25.716182708740234, 26.627281188964844, 27.538379669189453, 28.44947624206543, 29.36057472229004, 30.27167320251465]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 4.0, 13.0, 20.0, 25.0, 62.0, 82.0, 117.0, 188.0, 378.0, 668.0, 1090.0, 1892.0, 3111.0, 5125.0, 8646.0, 13874.0, 22580.0, 34533.0, 52325.0, 74060.0, 97966.0, 118796.0, 128630.0, 124204.0, 106852.0, 83298.0, 59956.0, 40780.0, 26470.0, 16970.0, 10322.0, 6260.0, 3667.0, 2317.0, 1360.0, 791.0, 473.0, 255.0, 154.0, 100.0, 65.0, 31.0, 16.0, 12.0, 10.0, 8.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.734375, -20.10009765625, -19.4658203125, -18.83154296875, -18.197265625, -17.56298828125, -16.9287109375, -16.29443359375, -15.66015625, -15.02587890625, -14.3916015625, -13.75732421875, -13.123046875, -12.48876953125, -11.8544921875, -11.22021484375, -10.5859375, -9.95166015625, -9.3173828125, -8.68310546875, -8.048828125, -7.41455078125, -6.7802734375, -6.14599609375, -5.51171875, -4.87744140625, -4.2431640625, -3.60888671875, -2.974609375, -2.34033203125, -1.7060546875, -1.07177734375, -0.4375, 0.19677734375, 0.8310546875, 1.46533203125, 2.099609375, 2.73388671875, 3.3681640625, 4.00244140625, 4.63671875, 5.27099609375, 5.9052734375, 6.53955078125, 7.173828125, 7.80810546875, 8.4423828125, 9.07666015625, 9.7109375, 10.34521484375, 10.9794921875, 11.61376953125, 12.248046875, 12.88232421875, 13.5166015625, 14.15087890625, 14.78515625, 15.41943359375, 16.0537109375, 16.68798828125, 17.322265625, 17.95654296875, 18.5908203125, 19.22509765625, 19.859375]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0, 8.0, 10.0, 9.0, 14.0, 11.0, 15.0, 13.0, 19.0, 21.0, 29.0, 25.0, 40.0, 28.0, 34.0, 31.0, 41.0, 40.0, 38.0, 43.0, 41.0, 41.0, 40.0, 26.0, 38.0, 36.0, 32.0, 33.0, 35.0, 31.0, 21.0, 19.0, 24.0, 15.0, 21.0, 14.0, 7.0, 6.0, 10.0, 6.0, 5.0, 5.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-27.453125, -26.61083984375, -25.7685546875, -24.92626953125, -24.083984375, -23.24169921875, -22.3994140625, -21.55712890625, -20.71484375, -19.87255859375, -19.0302734375, -18.18798828125, -17.345703125, -16.50341796875, -15.6611328125, -14.81884765625, -13.9765625, -13.13427734375, -12.2919921875, -11.44970703125, -10.607421875, -9.76513671875, -8.9228515625, -8.08056640625, -7.23828125, -6.39599609375, -5.5537109375, -4.71142578125, -3.869140625, -3.02685546875, -2.1845703125, -1.34228515625, -0.5, 0.34228515625, 1.1845703125, 2.02685546875, 2.869140625, 3.71142578125, 4.5537109375, 5.39599609375, 6.23828125, 7.08056640625, 7.9228515625, 8.76513671875, 9.607421875, 10.44970703125, 11.2919921875, 12.13427734375, 12.9765625, 13.81884765625, 14.6611328125, 15.50341796875, 16.345703125, 17.18798828125, 18.0302734375, 18.87255859375, 19.71484375, 20.55712890625, 21.3994140625, 22.24169921875, 23.083984375, 23.92626953125, 24.7685546875, 25.61083984375, 26.453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 8.0, 10.0, 9.0, 21.0, 31.0, 48.0, 78.0, 92.0, 188.0, 274.0, 419.0, 793.0, 1331.0, 2302.0, 4004.0, 7234.0, 12902.0, 22705.0, 39137.0, 65038.0, 100956.0, 139025.0, 162264.0, 155284.0, 123102.0, 85522.0, 53214.0, 31167.0, 17931.0, 10093.0, 5649.0, 3191.0, 1819.0, 1087.0, 643.0, 357.0, 211.0, 165.0, 84.0, 57.0, 32.0, 27.0, 13.0, 11.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0], "bins": [-28.484375, -27.61572265625, -26.7470703125, -25.87841796875, -25.009765625, -24.14111328125, -23.2724609375, -22.40380859375, -21.53515625, -20.66650390625, -19.7978515625, -18.92919921875, -18.060546875, -17.19189453125, -16.3232421875, -15.45458984375, -14.5859375, -13.71728515625, -12.8486328125, -11.97998046875, -11.111328125, -10.24267578125, -9.3740234375, -8.50537109375, -7.63671875, -6.76806640625, -5.8994140625, -5.03076171875, -4.162109375, -3.29345703125, -2.4248046875, -1.55615234375, -0.6875, 0.18115234375, 1.0498046875, 1.91845703125, 2.787109375, 3.65576171875, 4.5244140625, 5.39306640625, 6.26171875, 7.13037109375, 7.9990234375, 8.86767578125, 9.736328125, 10.60498046875, 11.4736328125, 12.34228515625, 13.2109375, 14.07958984375, 14.9482421875, 15.81689453125, 16.685546875, 17.55419921875, 18.4228515625, 19.29150390625, 20.16015625, 21.02880859375, 21.8974609375, 22.76611328125, 23.634765625, 24.50341796875, 25.3720703125, 26.24072265625, 27.109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 8.0, 8.0, 10.0, 13.0, 17.0, 14.0, 17.0, 17.0, 21.0, 44.0, 34.0, 24.0, 37.0, 37.0, 51.0, 45.0, 36.0, 50.0, 35.0, 36.0, 43.0, 40.0, 40.0, 39.0, 29.0, 30.0, 33.0, 35.0, 31.0, 16.0, 15.0, 8.0, 11.0, 16.0, 16.0, 7.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.515625, -15.890380859375, -15.26513671875, -14.639892578125, -14.0146484375, -13.389404296875, -12.76416015625, -12.138916015625, -11.513671875, -10.888427734375, -10.26318359375, -9.637939453125, -9.0126953125, -8.387451171875, -7.76220703125, -7.136962890625, -6.51171875, -5.886474609375, -5.26123046875, -4.635986328125, -4.0107421875, -3.385498046875, -2.76025390625, -2.135009765625, -1.509765625, -0.884521484375, -0.25927734375, 0.365966796875, 0.9912109375, 1.616455078125, 2.24169921875, 2.866943359375, 3.4921875, 4.117431640625, 4.74267578125, 5.367919921875, 5.9931640625, 6.618408203125, 7.24365234375, 7.868896484375, 8.494140625, 9.119384765625, 9.74462890625, 10.369873046875, 10.9951171875, 11.620361328125, 12.24560546875, 12.870849609375, 13.49609375, 14.121337890625, 14.74658203125, 15.371826171875, 15.9970703125, 16.622314453125, 17.24755859375, 17.872802734375, 18.498046875, 19.123291015625, 19.74853515625, 20.373779296875, 20.9990234375, 21.624267578125, 22.24951171875, 22.874755859375, 23.5]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 3.0, 11.0, 16.0, 22.0, 40.0, 53.0, 87.0, 135.0, 171.0, 327.0, 484.0, 740.0, 1233.0, 2210.0, 3984.0, 7684.0, 16381.0, 38401.0, 95587.0, 217484.0, 305971.0, 203671.0, 87510.0, 34990.0, 15263.0, 7131.0, 3623.0, 2087.0, 1235.0, 725.0, 460.0, 294.0, 163.0, 134.0, 82.0, 43.0, 37.0, 28.0, 14.0, 12.0, 4.0, 5.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.796875, -24.94970703125, -24.1025390625, -23.25537109375, -22.408203125, -21.56103515625, -20.7138671875, -19.86669921875, -19.01953125, -18.17236328125, -17.3251953125, -16.47802734375, -15.630859375, -14.78369140625, -13.9365234375, -13.08935546875, -12.2421875, -11.39501953125, -10.5478515625, -9.70068359375, -8.853515625, -8.00634765625, -7.1591796875, -6.31201171875, -5.46484375, -4.61767578125, -3.7705078125, -2.92333984375, -2.076171875, -1.22900390625, -0.3818359375, 0.46533203125, 1.3125, 2.15966796875, 3.0068359375, 3.85400390625, 4.701171875, 5.54833984375, 6.3955078125, 7.24267578125, 8.08984375, 8.93701171875, 9.7841796875, 10.63134765625, 11.478515625, 12.32568359375, 13.1728515625, 14.02001953125, 14.8671875, 15.71435546875, 16.5615234375, 17.40869140625, 18.255859375, 19.10302734375, 19.9501953125, 20.79736328125, 21.64453125, 22.49169921875, 23.3388671875, 24.18603515625, 25.033203125, 25.88037109375, 26.7275390625, 27.57470703125, 28.421875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 4.0, 2.0, 4.0, 13.0, 17.0, 20.0, 19.0, 21.0, 21.0, 33.0, 41.0, 45.0, 51.0, 50.0, 63.0, 72.0, 55.0, 58.0, 70.0, 53.0, 51.0, 38.0, 33.0, 27.0, 30.0, 18.0, 23.0, 7.0, 13.0, 11.0, 5.0, 6.0, 4.0, 4.0, 4.0, 2.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0015687942504882812, -0.0015223771333694458, -0.0014759600162506104, -0.001429542899131775, -0.0013831257820129395, -0.001336708664894104, -0.0012902915477752686, -0.001243874430656433, -0.0011974573135375977, -0.0011510401964187622, -0.0011046230792999268, -0.0010582059621810913, -0.0010117888450622559, -0.0009653717279434204, -0.000918954610824585, -0.0008725374937057495, -0.0008261203765869141, -0.0007797032594680786, -0.0007332861423492432, -0.0006868690252304077, -0.0006404519081115723, -0.0005940347909927368, -0.0005476176738739014, -0.0005012005567550659, -0.00045478343963623047, -0.000408366322517395, -0.00036194920539855957, -0.0003155320882797241, -0.00026911497116088867, -0.00022269785404205322, -0.00017628073692321777, -0.00012986361980438232, -8.344650268554688e-05, -3.7029385566711426e-05, 9.387731552124023e-06, 5.580484867095947e-05, 0.00010222196578979492, 0.00014863908290863037, 0.00019505620002746582, 0.00024147331714630127, 0.0002878904342651367, 0.00033430755138397217, 0.0003807246685028076, 0.00042714178562164307, 0.0004735589027404785, 0.000519976019859314, 0.0005663931369781494, 0.0006128102540969849, 0.0006592273712158203, 0.0007056444883346558, 0.0007520616054534912, 0.0007984787225723267, 0.0008448958396911621, 0.0008913129568099976, 0.000937730073928833, 0.0009841471910476685, 0.001030564308166504, 0.0010769814252853394, 0.0011233985424041748, 0.0011698156595230103, 0.0012162327766418457, 0.0012626498937606812, 0.0013090670108795166, 0.001355484127998352, 0.0014019012451171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 10.0, 16.0, 20.0, 29.0, 45.0, 61.0, 59.0, 129.0, 171.0, 269.0, 368.0, 539.0, 841.0, 1248.0, 2020.0, 3439.0, 5662.0, 10170.0, 18962.0, 36229.0, 68600.0, 120417.0, 178480.0, 201469.0, 165387.0, 106195.0, 58878.0, 30555.0, 16105.0, 8911.0, 4963.0, 2982.0, 1834.0, 1181.0, 715.0, 515.0, 324.0, 243.0, 166.0, 108.0, 79.0, 40.0, 38.0, 28.0, 20.0, 12.0, 8.0, 6.0, 4.0, 4.0, 5.0, 2.0], "bins": [-18.296875, -17.7796630859375, -17.262451171875, -16.7452392578125, -16.22802734375, -15.7108154296875, -15.193603515625, -14.6763916015625, -14.1591796875, -13.6419677734375, -13.124755859375, -12.6075439453125, -12.09033203125, -11.5731201171875, -11.055908203125, -10.5386962890625, -10.021484375, -9.5042724609375, -8.987060546875, -8.4698486328125, -7.95263671875, -7.4354248046875, -6.918212890625, -6.4010009765625, -5.8837890625, -5.3665771484375, -4.849365234375, -4.3321533203125, -3.81494140625, -3.2977294921875, -2.780517578125, -2.2633056640625, -1.74609375, -1.2288818359375, -0.711669921875, -0.1944580078125, 0.32275390625, 0.8399658203125, 1.357177734375, 1.8743896484375, 2.3916015625, 2.9088134765625, 3.426025390625, 3.9432373046875, 4.46044921875, 4.9776611328125, 5.494873046875, 6.0120849609375, 6.529296875, 7.0465087890625, 7.563720703125, 8.0809326171875, 8.59814453125, 9.1153564453125, 9.632568359375, 10.1497802734375, 10.6669921875, 11.1842041015625, 11.701416015625, 12.2186279296875, 12.73583984375, 13.2530517578125, 13.770263671875, 14.2874755859375, 14.8046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 9.0, 2.0, 3.0, 1.0, 11.0, 13.0, 12.0, 14.0, 23.0, 27.0, 46.0, 45.0, 63.0, 59.0, 73.0, 80.0, 99.0, 92.0, 58.0, 63.0, 47.0, 37.0, 26.0, 22.0, 22.0, 15.0, 11.0, 6.0, 4.0, 4.0, 4.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.6875, -10.3619384765625, -10.036376953125, -9.7108154296875, -9.38525390625, -9.0596923828125, -8.734130859375, -8.4085693359375, -8.0830078125, -7.7574462890625, -7.431884765625, -7.1063232421875, -6.78076171875, -6.4552001953125, -6.129638671875, -5.8040771484375, -5.478515625, -5.1529541015625, -4.827392578125, -4.5018310546875, -4.17626953125, -3.8507080078125, -3.525146484375, -3.1995849609375, -2.8740234375, -2.5484619140625, -2.222900390625, -1.8973388671875, -1.57177734375, -1.2462158203125, -0.920654296875, -0.5950927734375, -0.26953125, 0.0560302734375, 0.381591796875, 0.7071533203125, 1.03271484375, 1.3582763671875, 1.683837890625, 2.0093994140625, 2.3349609375, 2.6605224609375, 2.986083984375, 3.3116455078125, 3.63720703125, 3.9627685546875, 4.288330078125, 4.6138916015625, 4.939453125, 5.2650146484375, 5.590576171875, 5.9161376953125, 6.24169921875, 6.5672607421875, 6.892822265625, 7.2183837890625, 7.5439453125, 7.8695068359375, 8.195068359375, 8.5206298828125, 8.84619140625, 9.1717529296875, 9.497314453125, 9.8228759765625, 10.1484375]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 9.0, 6.0, 5.0, 5.0, 10.0, 25.0, 28.0, 38.0, 35.0, 37.0, 49.0, 40.0, 40.0, 54.0, 57.0, 57.0, 40.0, 91.0, 52.0, 51.0, 46.0, 47.0, 35.0, 29.0, 17.0, 15.0, 18.0, 18.0, 13.0, 12.0, 11.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-37.04381561279297, -36.105934143066406, -35.168052673339844, -34.230167388916016, -33.29228591918945, -32.35440444946289, -31.416521072387695, -30.478639602661133, -29.540756225585938, -28.602874755859375, -27.66499137878418, -26.727109909057617, -25.789226531982422, -24.85134506225586, -23.913461685180664, -22.9755802154541, -22.037696838378906, -21.099815368652344, -20.16193199157715, -19.224050521850586, -18.28616714477539, -17.348285675048828, -16.410402297973633, -15.47252082824707, -14.534639358520508, -13.596756935119629, -12.65887451171875, -11.720992088317871, -10.783109664916992, -9.84522819519043, -8.907344818115234, -7.969462871551514, -7.031579971313477, -6.093697547912598, -5.155815124511719, -4.21793270111084, -3.28005051612854, -2.3421683311462402, -1.4042859077453613, -0.4664034843444824, 0.4714789390563965, 1.4093613624572754, 2.3472437858581543, 3.285125970840454, 4.223008155822754, 5.160890579223633, 6.098773002624512, 7.036655426025391, 7.9745378494262695, 8.912420272827148, 9.850302696228027, 10.788185119628906, 11.726067543029785, 12.663949966430664, 13.601831436157227, 14.539714813232422, 15.477596282958984, 16.415477752685547, 17.353361129760742, 18.291242599487305, 19.2291259765625, 20.167007446289062, 21.104890823364258, 22.04277229309082, 22.980655670166016]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 14.0, 3.0, 6.0, 5.0, 11.0, 14.0, 15.0, 19.0, 24.0, 19.0, 26.0, 38.0, 45.0, 32.0, 40.0, 31.0, 46.0, 44.0, 38.0, 41.0, 36.0, 36.0, 31.0, 53.0, 30.0, 34.0, 25.0, 34.0, 29.0, 30.0, 17.0, 24.0, 18.0, 13.0, 9.0, 5.0, 9.0, 13.0, 13.0, 1.0, 2.0, 8.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-29.39780616760254, -28.473628997802734, -27.549453735351562, -26.62527847290039, -25.701101303100586, -24.77692413330078, -23.85274887084961, -22.928573608398438, -22.004396438598633, -21.080219268798828, -20.156044006347656, -19.231868743896484, -18.30769157409668, -17.383514404296875, -16.459339141845703, -15.535162925720215, -14.610986709594727, -13.686810493469238, -12.76263427734375, -11.838458061218262, -10.914281845092773, -9.990105628967285, -9.065929412841797, -8.141753196716309, -7.21757698059082, -6.293400764465332, -5.369224548339844, -4.4450483322143555, -3.520872116088867, -2.596695899963379, -1.6725196838378906, -0.7483434677124023, 0.17583084106445312, 1.1000070571899414, 2.0241832733154297, 2.948359489440918, 3.8725357055664062, 4.7967119216918945, 5.720888137817383, 6.645064353942871, 7.569240570068359, 8.493416786193848, 9.417593002319336, 10.341769218444824, 11.265945434570312, 12.1901216506958, 13.114297866821289, 14.038474082946777, 14.962650299072266, 15.886826515197754, 16.811002731323242, 17.735179901123047, 18.65935516357422, 19.58353042602539, 20.507707595825195, 21.431884765625, 22.356060028076172, 23.280235290527344, 24.20441246032715, 25.128589630126953, 26.052764892578125, 26.976940155029297, 27.9011173248291, 28.825294494628906, 29.749469757080078]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 9.0, 8.0, 14.0, 15.0, 35.0, 53.0, 86.0, 126.0, 212.0, 342.0, 486.0, 812.0, 1183.0, 2031.0, 3205.0, 5177.0, 8132.0, 13815.0, 22271.0, 37912.0, 63093.0, 107131.0, 178316.0, 284551.0, 418990.0, 548678.0, 612573.0, 578651.0, 462897.0, 324516.0, 206970.0, 125897.0, 74844.0, 44112.0, 26256.0, 15563.0, 9643.0, 5953.0, 3629.0, 2247.0, 1459.0, 894.0, 548.0, 371.0, 228.0, 130.0, 77.0, 66.0, 38.0, 26.0, 9.0, 8.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.502197265625, -15.92626953125, -15.350341796875, -14.7744140625, -14.198486328125, -13.62255859375, -13.046630859375, -12.470703125, -11.894775390625, -11.31884765625, -10.742919921875, -10.1669921875, -9.591064453125, -9.01513671875, -8.439208984375, -7.86328125, -7.287353515625, -6.71142578125, -6.135498046875, -5.5595703125, -4.983642578125, -4.40771484375, -3.831787109375, -3.255859375, -2.679931640625, -2.10400390625, -1.528076171875, -0.9521484375, -0.376220703125, 0.19970703125, 0.775634765625, 1.3515625, 1.927490234375, 2.50341796875, 3.079345703125, 3.6552734375, 4.231201171875, 4.80712890625, 5.383056640625, 5.958984375, 6.534912109375, 7.11083984375, 7.686767578125, 8.2626953125, 8.838623046875, 9.41455078125, 9.990478515625, 10.56640625, 11.142333984375, 11.71826171875, 12.294189453125, 12.8701171875, 13.446044921875, 14.02197265625, 14.597900390625, 15.173828125, 15.749755859375, 16.32568359375, 16.901611328125, 17.4775390625, 18.053466796875, 18.62939453125, 19.205322265625, 19.78125]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 9.0, 5.0, 9.0, 6.0, 19.0, 19.0, 24.0, 20.0, 28.0, 36.0, 31.0, 37.0, 35.0, 40.0, 46.0, 46.0, 44.0, 41.0, 38.0, 58.0, 39.0, 34.0, 49.0, 34.0, 33.0, 32.0, 20.0, 30.0, 16.0, 19.0, 15.0, 23.0, 12.0, 5.0, 5.0, 8.0, 8.0, 4.0, 10.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.015625, -23.216064453125, -22.41650390625, -21.616943359375, -20.8173828125, -20.017822265625, -19.21826171875, -18.418701171875, -17.619140625, -16.819580078125, -16.02001953125, -15.220458984375, -14.4208984375, -13.621337890625, -12.82177734375, -12.022216796875, -11.22265625, -10.423095703125, -9.62353515625, -8.823974609375, -8.0244140625, -7.224853515625, -6.42529296875, -5.625732421875, -4.826171875, -4.026611328125, -3.22705078125, -2.427490234375, -1.6279296875, -0.828369140625, -0.02880859375, 0.770751953125, 1.5703125, 2.369873046875, 3.16943359375, 3.968994140625, 4.7685546875, 5.568115234375, 6.36767578125, 7.167236328125, 7.966796875, 8.766357421875, 9.56591796875, 10.365478515625, 11.1650390625, 11.964599609375, 12.76416015625, 13.563720703125, 14.36328125, 15.162841796875, 15.96240234375, 16.761962890625, 17.5615234375, 18.361083984375, 19.16064453125, 19.960205078125, 20.759765625, 21.559326171875, 22.35888671875, 23.158447265625, 23.9580078125, 24.757568359375, 25.55712890625, 26.356689453125, 27.15625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 9.0, 7.0, 18.0, 41.0, 49.0, 80.0, 129.0, 219.0, 339.0, 590.0, 967.0, 1547.0, 2501.0, 3932.0, 6447.0, 10495.0, 17044.0, 28087.0, 45789.0, 74113.0, 117548.0, 180703.0, 266869.0, 370853.0, 470259.0, 532574.0, 529425.0, 460563.0, 356364.0, 254627.0, 171708.0, 110665.0, 68892.0, 42783.0, 26430.0, 15954.0, 9862.0, 6072.0, 3743.0, 2318.0, 1472.0, 850.0, 517.0, 309.0, 217.0, 134.0, 71.0, 52.0, 24.0, 11.0, 9.0, 4.0, 4.0, 2.0, 4.0], "bins": [-20.0, -19.427490234375, -18.85498046875, -18.282470703125, -17.7099609375, -17.137451171875, -16.56494140625, -15.992431640625, -15.419921875, -14.847412109375, -14.27490234375, -13.702392578125, -13.1298828125, -12.557373046875, -11.98486328125, -11.412353515625, -10.83984375, -10.267333984375, -9.69482421875, -9.122314453125, -8.5498046875, -7.977294921875, -7.40478515625, -6.832275390625, -6.259765625, -5.687255859375, -5.11474609375, -4.542236328125, -3.9697265625, -3.397216796875, -2.82470703125, -2.252197265625, -1.6796875, -1.107177734375, -0.53466796875, 0.037841796875, 0.6103515625, 1.182861328125, 1.75537109375, 2.327880859375, 2.900390625, 3.472900390625, 4.04541015625, 4.617919921875, 5.1904296875, 5.762939453125, 6.33544921875, 6.907958984375, 7.48046875, 8.052978515625, 8.62548828125, 9.197998046875, 9.7705078125, 10.343017578125, 10.91552734375, 11.488037109375, 12.060546875, 12.633056640625, 13.20556640625, 13.778076171875, 14.3505859375, 14.923095703125, 15.49560546875, 16.068115234375, 16.640625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 9.0, 9.0, 17.0, 17.0, 34.0, 22.0, 45.0, 52.0, 62.0, 70.0, 87.0, 103.0, 124.0, 133.0, 151.0, 179.0, 185.0, 196.0, 226.0, 234.0, 206.0, 222.0, 219.0, 206.0, 173.0, 187.0, 152.0, 119.0, 108.0, 93.0, 79.0, 65.0, 72.0, 46.0, 32.0, 28.0, 25.0, 16.0, 17.0, 13.0, 14.0, 5.0, 3.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.28125, -9.97265625, -9.6640625, -9.35546875, -9.046875, -8.73828125, -8.4296875, -8.12109375, -7.8125, -7.50390625, -7.1953125, -6.88671875, -6.578125, -6.26953125, -5.9609375, -5.65234375, -5.34375, -5.03515625, -4.7265625, -4.41796875, -4.109375, -3.80078125, -3.4921875, -3.18359375, -2.875, -2.56640625, -2.2578125, -1.94921875, -1.640625, -1.33203125, -1.0234375, -0.71484375, -0.40625, -0.09765625, 0.2109375, 0.51953125, 0.828125, 1.13671875, 1.4453125, 1.75390625, 2.0625, 2.37109375, 2.6796875, 2.98828125, 3.296875, 3.60546875, 3.9140625, 4.22265625, 4.53125, 4.83984375, 5.1484375, 5.45703125, 5.765625, 6.07421875, 6.3828125, 6.69140625, 7.0, 7.30859375, 7.6171875, 7.92578125, 8.234375, 8.54296875, 8.8515625, 9.16015625, 9.46875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 10.0, 14.0, 12.0, 12.0, 17.0, 26.0, 21.0, 39.0, 42.0, 41.0, 37.0, 41.0, 39.0, 44.0, 64.0, 49.0, 47.0, 50.0, 41.0, 45.0, 51.0, 38.0, 28.0, 29.0, 23.0, 18.0, 25.0, 10.0, 13.0, 12.0, 10.0, 7.0, 5.0, 9.0, 6.0, 11.0, 0.0, 2.0, 2.0, 2.0], "bins": [-30.46190643310547, -29.689592361450195, -28.917280197143555, -28.14496612548828, -27.372652053833008, -26.600337982177734, -25.828025817871094, -25.05571174621582, -24.283397674560547, -23.511083602905273, -22.738771438598633, -21.96645736694336, -21.194143295288086, -20.421829223632812, -19.649517059326172, -18.8772029876709, -18.104890823364258, -17.332576751708984, -16.560264587402344, -15.78795051574707, -15.015636444091797, -14.24332332611084, -13.471010208129883, -12.69869613647461, -11.926383018493652, -11.154069900512695, -10.381755828857422, -9.609442710876465, -8.837129592895508, -8.064815521240234, -7.292502403259277, -6.520188808441162, -5.747875213623047, -4.975561618804932, -4.203248023986816, -3.4309349060058594, -2.658621311187744, -1.886307716369629, -1.1139945983886719, -0.34168100357055664, 0.4306325912475586, 1.2029460668563843, 1.97525954246521, 2.747572898864746, 3.5198864936828613, 4.292200088500977, 5.064513206481934, 5.836826801300049, 6.609140396118164, 7.381453990936279, 8.153767585754395, 8.926080703735352, 9.698394775390625, 10.470707893371582, 11.243021011352539, 12.015335083007812, 12.78764820098877, 13.559961318969727, 14.332275390625, 15.104588508605957, 15.876901626586914, 16.649215698242188, 17.421527862548828, 18.1938419342041, 18.966156005859375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 8.0, 12.0, 5.0, 17.0, 19.0, 18.0, 14.0, 21.0, 16.0, 31.0, 28.0, 26.0, 42.0, 27.0, 32.0, 27.0, 27.0, 40.0, 43.0, 47.0, 50.0, 39.0, 39.0, 35.0, 34.0, 35.0, 32.0, 33.0, 22.0, 25.0, 27.0, 18.0, 16.0, 13.0, 18.0, 13.0, 12.0, 5.0, 3.0, 6.0, 8.0, 3.0, 0.0, 4.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-27.46792984008789, -26.59942054748535, -25.730911254882812, -24.862403869628906, -23.993894577026367, -23.125385284423828, -22.25687599182129, -21.38836669921875, -20.51985740661621, -19.651348114013672, -18.782838821411133, -17.914329528808594, -17.045822143554688, -16.17731285095215, -15.30880355834961, -14.44029426574707, -13.571785926818848, -12.703276634216309, -11.834768295288086, -10.966259002685547, -10.097749710083008, -9.229240417480469, -8.360732078552246, -7.492222785949707, -6.623713970184326, -5.755205154418945, -4.886695861816406, -4.018187046051025, -3.1496779918670654, -2.2811689376831055, -1.4126601219177246, -0.5441508293151855, 0.3243579864501953, 1.1928670406341553, 2.0613760948181152, 2.929884910583496, 3.798393964767456, 4.666903018951416, 5.535411834716797, 6.403921127319336, 7.272429943084717, 8.140938758850098, 9.009448051452637, 9.87795639038086, 10.746465682983398, 11.614974975585938, 12.483484268188477, 13.351993560791016, 14.220501899719238, 15.089011192321777, 15.95751953125, 16.82602882385254, 17.694538116455078, 18.563047409057617, 19.431556701660156, 20.300064086914062, 21.1685733795166, 22.03708267211914, 22.90559196472168, 23.77410125732422, 24.642608642578125, 25.511117935180664, 26.379627227783203, 27.248136520385742, 28.11664581298828]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 3.0, 5.0, 12.0, 16.0, 14.0, 36.0, 41.0, 62.0, 83.0, 147.0, 233.0, 357.0, 526.0, 822.0, 1231.0, 2091.0, 3234.0, 5211.0, 8612.0, 14099.0, 23630.0, 39871.0, 68061.0, 115028.0, 176568.0, 199777.0, 154617.0, 95531.0, 55358.0, 33178.0, 19696.0, 11610.0, 6913.0, 4353.0, 2756.0, 1662.0, 1126.0, 708.0, 451.0, 295.0, 187.0, 122.0, 75.0, 51.0, 30.0, 26.0, 16.0, 10.0, 12.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.484375, -20.7255859375, -19.966796875, -19.2080078125, -18.44921875, -17.6904296875, -16.931640625, -16.1728515625, -15.4140625, -14.6552734375, -13.896484375, -13.1376953125, -12.37890625, -11.6201171875, -10.861328125, -10.1025390625, -9.34375, -8.5849609375, -7.826171875, -7.0673828125, -6.30859375, -5.5498046875, -4.791015625, -4.0322265625, -3.2734375, -2.5146484375, -1.755859375, -0.9970703125, -0.23828125, 0.5205078125, 1.279296875, 2.0380859375, 2.796875, 3.5556640625, 4.314453125, 5.0732421875, 5.83203125, 6.5908203125, 7.349609375, 8.1083984375, 8.8671875, 9.6259765625, 10.384765625, 11.1435546875, 11.90234375, 12.6611328125, 13.419921875, 14.1787109375, 14.9375, 15.6962890625, 16.455078125, 17.2138671875, 17.97265625, 18.7314453125, 19.490234375, 20.2490234375, 21.0078125, 21.7666015625, 22.525390625, 23.2841796875, 24.04296875, 24.8017578125, 25.560546875, 26.3193359375, 27.078125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 7.0, 19.0, 9.0, 22.0, 11.0, 23.0, 18.0, 21.0, 24.0, 22.0, 32.0, 45.0, 37.0, 36.0, 38.0, 35.0, 45.0, 44.0, 42.0, 46.0, 39.0, 49.0, 35.0, 40.0, 26.0, 43.0, 22.0, 22.0, 27.0, 17.0, 19.0, 9.0, 15.0, 17.0, 9.0, 7.0, 6.0, 5.0, 5.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-30.421875, -29.4990234375, -28.576171875, -27.6533203125, -26.73046875, -25.8076171875, -24.884765625, -23.9619140625, -23.0390625, -22.1162109375, -21.193359375, -20.2705078125, -19.34765625, -18.4248046875, -17.501953125, -16.5791015625, -15.65625, -14.7333984375, -13.810546875, -12.8876953125, -11.96484375, -11.0419921875, -10.119140625, -9.1962890625, -8.2734375, -7.3505859375, -6.427734375, -5.5048828125, -4.58203125, -3.6591796875, -2.736328125, -1.8134765625, -0.890625, 0.0322265625, 0.955078125, 1.8779296875, 2.80078125, 3.7236328125, 4.646484375, 5.5693359375, 6.4921875, 7.4150390625, 8.337890625, 9.2607421875, 10.18359375, 11.1064453125, 12.029296875, 12.9521484375, 13.875, 14.7978515625, 15.720703125, 16.6435546875, 17.56640625, 18.4892578125, 19.412109375, 20.3349609375, 21.2578125, 22.1806640625, 23.103515625, 24.0263671875, 24.94921875, 25.8720703125, 26.794921875, 27.7177734375, 28.640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 12.0, 18.0, 11.0, 25.0, 38.0, 60.0, 89.0, 125.0, 224.0, 299.0, 502.0, 647.0, 1098.0, 1756.0, 2900.0, 4798.0, 7793.0, 12652.0, 21210.0, 36438.0, 64239.0, 112443.0, 184520.0, 218662.0, 157421.0, 92484.0, 52455.0, 30268.0, 17873.0, 10527.0, 6429.0, 3960.0, 2394.0, 1511.0, 990.0, 599.0, 377.0, 242.0, 154.0, 90.0, 77.0, 47.0, 33.0, 23.0, 12.0, 11.0, 6.0, 2.0, 4.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.984375, -23.193359375, -22.40234375, -21.611328125, -20.8203125, -20.029296875, -19.23828125, -18.447265625, -17.65625, -16.865234375, -16.07421875, -15.283203125, -14.4921875, -13.701171875, -12.91015625, -12.119140625, -11.328125, -10.537109375, -9.74609375, -8.955078125, -8.1640625, -7.373046875, -6.58203125, -5.791015625, -5.0, -4.208984375, -3.41796875, -2.626953125, -1.8359375, -1.044921875, -0.25390625, 0.537109375, 1.328125, 2.119140625, 2.91015625, 3.701171875, 4.4921875, 5.283203125, 6.07421875, 6.865234375, 7.65625, 8.447265625, 9.23828125, 10.029296875, 10.8203125, 11.611328125, 12.40234375, 13.193359375, 13.984375, 14.775390625, 15.56640625, 16.357421875, 17.1484375, 17.939453125, 18.73046875, 19.521484375, 20.3125, 21.103515625, 21.89453125, 22.685546875, 23.4765625, 24.267578125, 25.05859375, 25.849609375, 26.640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 7.0, 12.0, 3.0, 8.0, 10.0, 16.0, 13.0, 13.0, 16.0, 18.0, 24.0, 25.0, 28.0, 31.0, 27.0, 34.0, 50.0, 27.0, 32.0, 38.0, 33.0, 43.0, 42.0, 35.0, 37.0, 31.0, 27.0, 35.0, 28.0, 30.0, 29.0, 23.0, 15.0, 20.0, 25.0, 21.0, 13.0, 14.0, 9.0, 18.0, 11.0, 7.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-18.8125, -18.263671875, -17.71484375, -17.166015625, -16.6171875, -16.068359375, -15.51953125, -14.970703125, -14.421875, -13.873046875, -13.32421875, -12.775390625, -12.2265625, -11.677734375, -11.12890625, -10.580078125, -10.03125, -9.482421875, -8.93359375, -8.384765625, -7.8359375, -7.287109375, -6.73828125, -6.189453125, -5.640625, -5.091796875, -4.54296875, -3.994140625, -3.4453125, -2.896484375, -2.34765625, -1.798828125, -1.25, -0.701171875, -0.15234375, 0.396484375, 0.9453125, 1.494140625, 2.04296875, 2.591796875, 3.140625, 3.689453125, 4.23828125, 4.787109375, 5.3359375, 5.884765625, 6.43359375, 6.982421875, 7.53125, 8.080078125, 8.62890625, 9.177734375, 9.7265625, 10.275390625, 10.82421875, 11.373046875, 11.921875, 12.470703125, 13.01953125, 13.568359375, 14.1171875, 14.666015625, 15.21484375, 15.763671875, 16.3125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 8.0, 4.0, 10.0, 9.0, 19.0, 27.0, 40.0, 40.0, 99.0, 131.0, 180.0, 274.0, 406.0, 681.0, 1085.0, 1730.0, 2827.0, 4655.0, 7939.0, 14225.0, 26487.0, 53924.0, 127161.0, 300149.0, 282857.0, 115765.0, 50220.0, 24978.0, 13309.0, 7630.0, 4518.0, 2562.0, 1668.0, 1066.0, 668.0, 411.0, 263.0, 179.0, 118.0, 75.0, 57.0, 29.0, 27.0, 15.0, 9.0, 7.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.859375, -16.314697265625, -15.77001953125, -15.225341796875, -14.6806640625, -14.135986328125, -13.59130859375, -13.046630859375, -12.501953125, -11.957275390625, -11.41259765625, -10.867919921875, -10.3232421875, -9.778564453125, -9.23388671875, -8.689208984375, -8.14453125, -7.599853515625, -7.05517578125, -6.510498046875, -5.9658203125, -5.421142578125, -4.87646484375, -4.331787109375, -3.787109375, -3.242431640625, -2.69775390625, -2.153076171875, -1.6083984375, -1.063720703125, -0.51904296875, 0.025634765625, 0.5703125, 1.114990234375, 1.65966796875, 2.204345703125, 2.7490234375, 3.293701171875, 3.83837890625, 4.383056640625, 4.927734375, 5.472412109375, 6.01708984375, 6.561767578125, 7.1064453125, 7.651123046875, 8.19580078125, 8.740478515625, 9.28515625, 9.829833984375, 10.37451171875, 10.919189453125, 11.4638671875, 12.008544921875, 12.55322265625, 13.097900390625, 13.642578125, 14.187255859375, 14.73193359375, 15.276611328125, 15.8212890625, 16.365966796875, 16.91064453125, 17.455322265625, 18.0]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 0.0, 1.0, 5.0, 7.0, 2.0, 3.0, 4.0, 13.0, 4.0, 14.0, 8.0, 21.0, 22.0, 22.0, 35.0, 49.0, 53.0, 86.0, 102.0, 87.0, 102.0, 70.0, 68.0, 49.0, 35.0, 33.0, 24.0, 20.0, 10.0, 8.0, 7.0, 6.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001346588134765625, -0.0013026893138885498, -0.0012587904930114746, -0.0012148916721343994, -0.0011709928512573242, -0.001127094030380249, -0.0010831952095031738, -0.0010392963886260986, -0.0009953975677490234, -0.0009514987468719482, -0.000907599925994873, -0.0008637011051177979, -0.0008198022842407227, -0.0007759034633636475, -0.0007320046424865723, -0.0006881058216094971, -0.0006442070007324219, -0.0006003081798553467, -0.0005564093589782715, -0.0005125105381011963, -0.0004686117172241211, -0.0004247128963470459, -0.0003808140754699707, -0.0003369152545928955, -0.0002930164337158203, -0.0002491176128387451, -0.00020521879196166992, -0.00016131997108459473, -0.00011742115020751953, -7.352232933044434e-05, -2.962350845336914e-05, 1.4275312423706055e-05, 5.817413330078125e-05, 0.00010207295417785645, 0.00014597177505493164, 0.00018987059593200684, 0.00023376941680908203, 0.0002776682376861572, 0.0003215670585632324, 0.0003654658794403076, 0.0004093647003173828, 0.000453263521194458, 0.0004971623420715332, 0.0005410611629486084, 0.0005849599838256836, 0.0006288588047027588, 0.000672757625579834, 0.0007166564464569092, 0.0007605552673339844, 0.0008044540882110596, 0.0008483529090881348, 0.00089225172996521, 0.0009361505508422852, 0.0009800493717193604, 0.0010239481925964355, 0.0010678470134735107, 0.001111745834350586, 0.0011556446552276611, 0.0011995434761047363, 0.0012434422969818115, 0.0012873411178588867, 0.001331239938735962, 0.0013751387596130371, 0.0014190375804901123, 0.0014629364013671875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 4.0, 12.0, 14.0, 31.0, 35.0, 66.0, 105.0, 140.0, 198.0, 327.0, 433.0, 737.0, 1175.0, 1821.0, 3004.0, 4657.0, 7477.0, 12552.0, 20635.0, 36148.0, 67724.0, 129813.0, 215107.0, 226433.0, 144811.0, 76204.0, 40712.0, 22791.0, 13306.0, 8379.0, 4958.0, 3090.0, 2035.0, 1288.0, 834.0, 532.0, 341.0, 207.0, 141.0, 108.0, 64.0, 39.0, 28.0, 22.0, 11.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.828125, -14.3800048828125, -13.931884765625, -13.4837646484375, -13.03564453125, -12.5875244140625, -12.139404296875, -11.6912841796875, -11.2431640625, -10.7950439453125, -10.346923828125, -9.8988037109375, -9.45068359375, -9.0025634765625, -8.554443359375, -8.1063232421875, -7.658203125, -7.2100830078125, -6.761962890625, -6.3138427734375, -5.86572265625, -5.4176025390625, -4.969482421875, -4.5213623046875, -4.0732421875, -3.6251220703125, -3.177001953125, -2.7288818359375, -2.28076171875, -1.8326416015625, -1.384521484375, -0.9364013671875, -0.48828125, -0.0401611328125, 0.407958984375, 0.8560791015625, 1.30419921875, 1.7523193359375, 2.200439453125, 2.6485595703125, 3.0966796875, 3.5447998046875, 3.992919921875, 4.4410400390625, 4.88916015625, 5.3372802734375, 5.785400390625, 6.2335205078125, 6.681640625, 7.1297607421875, 7.577880859375, 8.0260009765625, 8.47412109375, 8.9222412109375, 9.370361328125, 9.8184814453125, 10.2666015625, 10.7147216796875, 11.162841796875, 11.6109619140625, 12.05908203125, 12.5072021484375, 12.955322265625, 13.4034423828125, 13.8515625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 3.0, 4.0, 5.0, 6.0, 6.0, 5.0, 9.0, 6.0, 13.0, 11.0, 11.0, 18.0, 24.0, 31.0, 26.0, 33.0, 30.0, 37.0, 50.0, 50.0, 56.0, 50.0, 51.0, 68.0, 56.0, 61.0, 43.0, 43.0, 31.0, 23.0, 21.0, 15.0, 9.0, 17.0, 15.0, 8.0, 13.0, 6.0, 6.0, 5.0, 8.0, 2.0, 2.0, 5.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.59814453125, -4.4541015625, -4.31005859375, -4.166015625, -4.02197265625, -3.8779296875, -3.73388671875, -3.58984375, -3.44580078125, -3.3017578125, -3.15771484375, -3.013671875, -2.86962890625, -2.7255859375, -2.58154296875, -2.4375, -2.29345703125, -2.1494140625, -2.00537109375, -1.861328125, -1.71728515625, -1.5732421875, -1.42919921875, -1.28515625, -1.14111328125, -0.9970703125, -0.85302734375, -0.708984375, -0.56494140625, -0.4208984375, -0.27685546875, -0.1328125, 0.01123046875, 0.1552734375, 0.29931640625, 0.443359375, 0.58740234375, 0.7314453125, 0.87548828125, 1.01953125, 1.16357421875, 1.3076171875, 1.45166015625, 1.595703125, 1.73974609375, 1.8837890625, 2.02783203125, 2.171875, 2.31591796875, 2.4599609375, 2.60400390625, 2.748046875, 2.89208984375, 3.0361328125, 3.18017578125, 3.32421875, 3.46826171875, 3.6123046875, 3.75634765625, 3.900390625, 4.04443359375, 4.1884765625, 4.33251953125, 4.4765625]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 5.0, 4.0, 5.0, 8.0, 6.0, 17.0, 20.0, 13.0, 24.0, 27.0, 35.0, 45.0, 34.0, 49.0, 47.0, 49.0, 45.0, 58.0, 49.0, 56.0, 54.0, 41.0, 45.0, 44.0, 26.0, 37.0, 33.0, 19.0, 16.0, 17.0, 13.0, 16.0, 12.0, 5.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-29.077295303344727, -28.300304412841797, -27.523313522338867, -26.746322631835938, -25.969331741333008, -25.192340850830078, -24.41535186767578, -23.63836097717285, -22.861370086669922, -22.084379196166992, -21.307388305664062, -20.530397415161133, -19.753406524658203, -18.976417541503906, -18.199424743652344, -17.422435760498047, -16.645442962646484, -15.868452072143555, -15.091461181640625, -14.314470291137695, -13.537480354309082, -12.760489463806152, -11.983498573303223, -11.20650863647461, -10.42951774597168, -9.65252685546875, -8.87553596496582, -8.09854507446289, -7.321555137634277, -6.544564247131348, -5.767573356628418, -4.9905829429626465, -4.213592529296875, -3.4366018772125244, -2.659611225128174, -1.8826203346252441, -1.1056296825408936, -0.32863903045654297, 0.4483518600463867, 1.2253422737121582, 2.002333164215088, 2.7793238162994385, 3.556314468383789, 4.333305358886719, 5.110296249389648, 5.88728666305542, 6.66427755355835, 7.441267967224121, 8.21825885772705, 8.99524974822998, 9.77224063873291, 10.549230575561523, 11.326221466064453, 12.103212356567383, 12.880203247070312, 13.657194137573242, 14.434185028076172, 15.211175918579102, 15.988166809082031, 16.76515769958496, 17.54214859008789, 18.319137573242188, 19.09613037109375, 19.873119354248047, 20.650110244750977]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 12.0, 8.0, 15.0, 17.0, 15.0, 21.0, 22.0, 13.0, 21.0, 26.0, 30.0, 40.0, 30.0, 33.0, 31.0, 40.0, 32.0, 47.0, 43.0, 35.0, 50.0, 43.0, 45.0, 31.0, 30.0, 32.0, 25.0, 33.0, 24.0, 33.0, 20.0, 18.0, 14.0, 13.0, 11.0, 12.0, 6.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0], "bins": [-29.650087356567383, -28.74713897705078, -27.844188690185547, -26.941240310668945, -26.038291931152344, -25.13534164428711, -24.232393264770508, -23.329444885253906, -22.426494598388672, -21.52354621887207, -20.620595932006836, -19.717647552490234, -18.814699172973633, -17.91175079345703, -17.008800506591797, -16.105852127075195, -15.202903747558594, -14.299954414367676, -13.397006034851074, -12.494056701660156, -11.591108322143555, -10.688158988952637, -9.785209655761719, -8.882261276245117, -7.979311943054199, -7.0763630867004395, -6.17341423034668, -5.270464897155762, -4.367516040802002, -3.464567184448242, -2.561617851257324, -1.6586689949035645, -0.7557220458984375, 0.14722692966461182, 1.0501759052276611, 1.953125, 2.8560738563537598, 3.7590227127075195, 4.6619720458984375, 5.564920902252197, 6.467869758605957, 7.370818614959717, 8.273767471313477, 9.176716804504395, 10.079666137695312, 10.982614517211914, 11.885563850402832, 12.78851318359375, 13.691461563110352, 14.59441089630127, 15.497359275817871, 16.40030860900879, 17.30325698852539, 18.206207275390625, 19.109155654907227, 20.012104034423828, 20.915054321289062, 21.818002700805664, 22.7209529876709, 23.6239013671875, 24.5268497467041, 25.429798126220703, 26.332748413085938, 27.23569679260254, 28.13864517211914]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 5.0, 4.0, 9.0, 20.0, 27.0, 52.0, 71.0, 116.0, 176.0, 261.0, 461.0, 719.0, 1175.0, 1820.0, 2860.0, 4497.0, 6986.0, 10645.0, 16204.0, 23990.0, 35134.0, 49318.0, 66577.0, 84676.0, 101040.0, 110917.0, 111948.0, 102304.0, 87356.0, 68859.0, 50960.0, 36099.0, 25222.0, 17078.0, 11144.0, 7207.0, 4627.0, 2906.0, 1916.0, 1169.0, 727.0, 498.0, 294.0, 169.0, 123.0, 67.0, 57.0, 27.0, 21.0, 14.0, 7.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.046875, -15.512939453125, -14.97900390625, -14.445068359375, -13.9111328125, -13.377197265625, -12.84326171875, -12.309326171875, -11.775390625, -11.241455078125, -10.70751953125, -10.173583984375, -9.6396484375, -9.105712890625, -8.57177734375, -8.037841796875, -7.50390625, -6.969970703125, -6.43603515625, -5.902099609375, -5.3681640625, -4.834228515625, -4.30029296875, -3.766357421875, -3.232421875, -2.698486328125, -2.16455078125, -1.630615234375, -1.0966796875, -0.562744140625, -0.02880859375, 0.505126953125, 1.0390625, 1.572998046875, 2.10693359375, 2.640869140625, 3.1748046875, 3.708740234375, 4.24267578125, 4.776611328125, 5.310546875, 5.844482421875, 6.37841796875, 6.912353515625, 7.4462890625, 7.980224609375, 8.51416015625, 9.048095703125, 9.58203125, 10.115966796875, 10.64990234375, 11.183837890625, 11.7177734375, 12.251708984375, 12.78564453125, 13.319580078125, 13.853515625, 14.387451171875, 14.92138671875, 15.455322265625, 15.9892578125, 16.523193359375, 17.05712890625, 17.591064453125, 18.125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 8.0, 9.0, 9.0, 16.0, 12.0, 13.0, 14.0, 30.0, 16.0, 29.0, 39.0, 26.0, 32.0, 34.0, 27.0, 40.0, 45.0, 41.0, 51.0, 45.0, 57.0, 49.0, 36.0, 38.0, 27.0, 40.0, 29.0, 31.0, 29.0, 20.0, 25.0, 14.0, 12.0, 10.0, 15.0, 6.0, 4.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-31.921875, -30.98388671875, -30.0458984375, -29.10791015625, -28.169921875, -27.23193359375, -26.2939453125, -25.35595703125, -24.41796875, -23.47998046875, -22.5419921875, -21.60400390625, -20.666015625, -19.72802734375, -18.7900390625, -17.85205078125, -16.9140625, -15.97607421875, -15.0380859375, -14.10009765625, -13.162109375, -12.22412109375, -11.2861328125, -10.34814453125, -9.41015625, -8.47216796875, -7.5341796875, -6.59619140625, -5.658203125, -4.72021484375, -3.7822265625, -2.84423828125, -1.90625, -0.96826171875, -0.0302734375, 0.90771484375, 1.845703125, 2.78369140625, 3.7216796875, 4.65966796875, 5.59765625, 6.53564453125, 7.4736328125, 8.41162109375, 9.349609375, 10.28759765625, 11.2255859375, 12.16357421875, 13.1015625, 14.03955078125, 14.9775390625, 15.91552734375, 16.853515625, 17.79150390625, 18.7294921875, 19.66748046875, 20.60546875, 21.54345703125, 22.4814453125, 23.41943359375, 24.357421875, 25.29541015625, 26.2333984375, 27.17138671875, 28.109375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 12.0, 12.0, 27.0, 32.0, 60.0, 87.0, 119.0, 179.0, 311.0, 481.0, 722.0, 1204.0, 1903.0, 2913.0, 4747.0, 7543.0, 11935.0, 18863.0, 28877.0, 44647.0, 65898.0, 91225.0, 116578.0, 132425.0, 132051.0, 114951.0, 88453.0, 62950.0, 42750.0, 27841.0, 17803.0, 11297.0, 7224.0, 4650.0, 2826.0, 1783.0, 1082.0, 729.0, 446.0, 302.0, 222.0, 130.0, 81.0, 59.0, 40.0, 28.0, 17.0, 14.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0], "bins": [-22.78125, -22.08984375, -21.3984375, -20.70703125, -20.015625, -19.32421875, -18.6328125, -17.94140625, -17.25, -16.55859375, -15.8671875, -15.17578125, -14.484375, -13.79296875, -13.1015625, -12.41015625, -11.71875, -11.02734375, -10.3359375, -9.64453125, -8.953125, -8.26171875, -7.5703125, -6.87890625, -6.1875, -5.49609375, -4.8046875, -4.11328125, -3.421875, -2.73046875, -2.0390625, -1.34765625, -0.65625, 0.03515625, 0.7265625, 1.41796875, 2.109375, 2.80078125, 3.4921875, 4.18359375, 4.875, 5.56640625, 6.2578125, 6.94921875, 7.640625, 8.33203125, 9.0234375, 9.71484375, 10.40625, 11.09765625, 11.7890625, 12.48046875, 13.171875, 13.86328125, 14.5546875, 15.24609375, 15.9375, 16.62890625, 17.3203125, 18.01171875, 18.703125, 19.39453125, 20.0859375, 20.77734375, 21.46875]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 9.0, 8.0, 6.0, 9.0, 15.0, 12.0, 23.0, 15.0, 21.0, 21.0, 21.0, 22.0, 23.0, 36.0, 30.0, 44.0, 35.0, 47.0, 50.0, 46.0, 44.0, 56.0, 42.0, 34.0, 41.0, 44.0, 35.0, 28.0, 25.0, 26.0, 27.0, 28.0, 20.0, 10.0, 13.0, 7.0, 5.0, 6.0, 10.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.015625, -20.3408203125, -19.666015625, -18.9912109375, -18.31640625, -17.6416015625, -16.966796875, -16.2919921875, -15.6171875, -14.9423828125, -14.267578125, -13.5927734375, -12.91796875, -12.2431640625, -11.568359375, -10.8935546875, -10.21875, -9.5439453125, -8.869140625, -8.1943359375, -7.51953125, -6.8447265625, -6.169921875, -5.4951171875, -4.8203125, -4.1455078125, -3.470703125, -2.7958984375, -2.12109375, -1.4462890625, -0.771484375, -0.0966796875, 0.578125, 1.2529296875, 1.927734375, 2.6025390625, 3.27734375, 3.9521484375, 4.626953125, 5.3017578125, 5.9765625, 6.6513671875, 7.326171875, 8.0009765625, 8.67578125, 9.3505859375, 10.025390625, 10.7001953125, 11.375, 12.0498046875, 12.724609375, 13.3994140625, 14.07421875, 14.7490234375, 15.423828125, 16.0986328125, 16.7734375, 17.4482421875, 18.123046875, 18.7978515625, 19.47265625, 20.1474609375, 20.822265625, 21.4970703125, 22.171875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 5.0, 15.0, 13.0, 15.0, 25.0, 23.0, 37.0, 56.0, 67.0, 93.0, 142.0, 203.0, 287.0, 398.0, 551.0, 904.0, 1423.0, 2437.0, 4274.0, 7844.0, 14821.0, 29334.0, 58372.0, 115865.0, 200701.0, 239413.0, 174626.0, 96168.0, 48052.0, 24173.0, 12247.0, 6557.0, 3614.0, 1996.0, 1298.0, 773.0, 521.0, 362.0, 251.0, 175.0, 104.0, 79.0, 60.0, 48.0, 41.0, 27.0, 19.0, 11.0, 16.0, 6.0, 6.0, 7.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.125, -19.439453125, -18.75390625, -18.068359375, -17.3828125, -16.697265625, -16.01171875, -15.326171875, -14.640625, -13.955078125, -13.26953125, -12.583984375, -11.8984375, -11.212890625, -10.52734375, -9.841796875, -9.15625, -8.470703125, -7.78515625, -7.099609375, -6.4140625, -5.728515625, -5.04296875, -4.357421875, -3.671875, -2.986328125, -2.30078125, -1.615234375, -0.9296875, -0.244140625, 0.44140625, 1.126953125, 1.8125, 2.498046875, 3.18359375, 3.869140625, 4.5546875, 5.240234375, 5.92578125, 6.611328125, 7.296875, 7.982421875, 8.66796875, 9.353515625, 10.0390625, 10.724609375, 11.41015625, 12.095703125, 12.78125, 13.466796875, 14.15234375, 14.837890625, 15.5234375, 16.208984375, 16.89453125, 17.580078125, 18.265625, 18.951171875, 19.63671875, 20.322265625, 21.0078125, 21.693359375, 22.37890625, 23.064453125, 23.75]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 3.0, 8.0, 4.0, 5.0, 10.0, 14.0, 23.0, 32.0, 33.0, 44.0, 57.0, 69.0, 74.0, 85.0, 96.0, 102.0, 74.0, 56.0, 53.0, 35.0, 39.0, 21.0, 20.0, 11.0, 13.0, 9.0, 6.0, 3.0, 3.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00250244140625, -0.002427995204925537, -0.0023535490036010742, -0.0022791028022766113, -0.0022046566009521484, -0.0021302103996276855, -0.0020557641983032227, -0.0019813179969787598, -0.0019068717956542969, -0.001832425594329834, -0.001757979393005371, -0.0016835331916809082, -0.0016090869903564453, -0.0015346407890319824, -0.0014601945877075195, -0.0013857483863830566, -0.0013113021850585938, -0.0012368559837341309, -0.001162409782409668, -0.001087963581085205, -0.0010135173797607422, -0.0009390711784362793, -0.0008646249771118164, -0.0007901787757873535, -0.0007157325744628906, -0.0006412863731384277, -0.0005668401718139648, -0.000492393970489502, -0.00041794776916503906, -0.00034350156784057617, -0.0002690553665161133, -0.0001946091651916504, -0.0001201629638671875, -4.571676254272461e-05, 2.872943878173828e-05, 0.00010317564010620117, 0.00017762184143066406, 0.00025206804275512695, 0.00032651424407958984, 0.00040096044540405273, 0.0004754066467285156, 0.0005498528480529785, 0.0006242990493774414, 0.0006987452507019043, 0.0007731914520263672, 0.0008476376533508301, 0.000922083854675293, 0.0009965300559997559, 0.0010709762573242188, 0.0011454224586486816, 0.0012198686599731445, 0.0012943148612976074, 0.0013687610626220703, 0.0014432072639465332, 0.001517653465270996, 0.001592099666595459, 0.0016665458679199219, 0.0017409920692443848, 0.0018154382705688477, 0.0018898844718933105, 0.0019643306732177734, 0.0020387768745422363, 0.0021132230758666992, 0.002187669277191162, 0.002262115478515625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 9.0, 14.0, 19.0, 28.0, 46.0, 65.0, 84.0, 113.0, 174.0, 287.0, 430.0, 605.0, 1073.0, 1685.0, 2829.0, 4808.0, 8253.0, 14270.0, 24852.0, 43785.0, 74731.0, 118791.0, 162882.0, 178708.0, 151719.0, 105307.0, 64421.0, 37140.0, 21447.0, 12185.0, 7008.0, 4104.0, 2490.0, 1458.0, 950.0, 602.0, 423.0, 242.0, 171.0, 120.0, 72.0, 53.0, 27.0, 21.0, 14.0, 9.0, 12.0, 3.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.546875, -15.06640625, -14.5859375, -14.10546875, -13.625, -13.14453125, -12.6640625, -12.18359375, -11.703125, -11.22265625, -10.7421875, -10.26171875, -9.78125, -9.30078125, -8.8203125, -8.33984375, -7.859375, -7.37890625, -6.8984375, -6.41796875, -5.9375, -5.45703125, -4.9765625, -4.49609375, -4.015625, -3.53515625, -3.0546875, -2.57421875, -2.09375, -1.61328125, -1.1328125, -0.65234375, -0.171875, 0.30859375, 0.7890625, 1.26953125, 1.75, 2.23046875, 2.7109375, 3.19140625, 3.671875, 4.15234375, 4.6328125, 5.11328125, 5.59375, 6.07421875, 6.5546875, 7.03515625, 7.515625, 7.99609375, 8.4765625, 8.95703125, 9.4375, 9.91796875, 10.3984375, 10.87890625, 11.359375, 11.83984375, 12.3203125, 12.80078125, 13.28125, 13.76171875, 14.2421875, 14.72265625, 15.203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 6.0, 11.0, 9.0, 20.0, 28.0, 38.0, 43.0, 55.0, 78.0, 61.0, 88.0, 85.0, 68.0, 83.0, 76.0, 61.0, 42.0, 30.0, 29.0, 22.0, 17.0, 9.0, 8.0, 2.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.280517578125, -8.94384765625, -8.607177734375, -8.2705078125, -7.933837890625, -7.59716796875, -7.260498046875, -6.923828125, -6.587158203125, -6.25048828125, -5.913818359375, -5.5771484375, -5.240478515625, -4.90380859375, -4.567138671875, -4.23046875, -3.893798828125, -3.55712890625, -3.220458984375, -2.8837890625, -2.547119140625, -2.21044921875, -1.873779296875, -1.537109375, -1.200439453125, -0.86376953125, -0.527099609375, -0.1904296875, 0.146240234375, 0.48291015625, 0.819580078125, 1.15625, 1.492919921875, 1.82958984375, 2.166259765625, 2.5029296875, 2.839599609375, 3.17626953125, 3.512939453125, 3.849609375, 4.186279296875, 4.52294921875, 4.859619140625, 5.1962890625, 5.532958984375, 5.86962890625, 6.206298828125, 6.54296875, 6.879638671875, 7.21630859375, 7.552978515625, 7.8896484375, 8.226318359375, 8.56298828125, 8.899658203125, 9.236328125, 9.572998046875, 9.90966796875, 10.246337890625, 10.5830078125, 10.919677734375, 11.25634765625, 11.593017578125, 11.9296875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 6.0, 4.0, 6.0, 2.0, 12.0, 14.0, 17.0, 18.0, 32.0, 20.0, 35.0, 37.0, 39.0, 42.0, 59.0, 50.0, 40.0, 53.0, 44.0, 48.0, 59.0, 39.0, 52.0, 46.0, 42.0, 29.0, 31.0, 26.0, 12.0, 19.0, 14.0, 11.0, 8.0, 6.0, 6.0, 7.0, 3.0, 5.0, 5.0, 1.0, 5.0], "bins": [-32.30500793457031, -31.516483306884766, -30.727956771850586, -29.93943214416504, -29.150907516479492, -28.362380981445312, -27.573856353759766, -26.78533172607422, -25.996807098388672, -25.208282470703125, -24.419755935668945, -23.6312313079834, -22.84270668029785, -22.054180145263672, -21.265655517578125, -20.477130889892578, -19.6886043548584, -18.90007972717285, -18.111553192138672, -17.323028564453125, -16.534503936767578, -15.745978355407715, -14.957452774047852, -14.168928146362305, -13.380402565002441, -12.591876983642578, -11.803352355957031, -11.014826774597168, -10.226301193237305, -9.437776565551758, -8.649250984191895, -7.8607258796691895, -7.072198867797852, -6.2836737632751465, -5.495148658752441, -4.706623077392578, -3.918097972869873, -3.129572868347168, -2.3410472869873047, -1.5525221824645996, -0.7639970779418945, 0.024528145790100098, 0.8130533695220947, 1.601578712463379, 2.390103816986084, 3.178628921508789, 3.9671545028686523, 4.755679607391357, 5.5442047119140625, 6.332729816436768, 7.121254920959473, 7.909780502319336, 8.698305130004883, 9.486830711364746, 10.27535629272461, 11.063880920410156, 11.85240650177002, 12.640932083129883, 13.42945671081543, 14.217982292175293, 15.006507873535156, 15.795032501220703, 16.58355712890625, 17.37208366394043, 18.160608291625977]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 9.0, 2.0, 7.0, 4.0, 5.0, 4.0, 12.0, 10.0, 7.0, 14.0, 24.0, 19.0, 20.0, 31.0, 36.0, 30.0, 33.0, 23.0, 29.0, 37.0, 33.0, 40.0, 34.0, 38.0, 33.0, 45.0, 38.0, 43.0, 28.0, 42.0, 34.0, 23.0, 40.0, 28.0, 27.0, 28.0, 18.0, 15.0, 7.0, 13.0, 9.0, 6.0, 7.0, 2.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.205394744873047, -24.30290985107422, -23.40042495727539, -22.49793815612793, -21.5954532623291, -20.692968368530273, -19.790481567382812, -18.887996673583984, -17.985511779785156, -17.083026885986328, -16.1805419921875, -15.278055191040039, -14.375570297241211, -13.473085403442383, -12.570599555969238, -11.668113708496094, -10.765628814697266, -9.863143920898438, -8.960658073425293, -8.058172225952148, -7.15568733215332, -6.253201961517334, -5.350716590881348, -4.448231220245361, -3.545745849609375, -2.6432604789733887, -1.7407751083374023, -0.838289737701416, 0.06419563293457031, 0.9666810035705566, 1.869166374206543, 2.7716517448425293, 3.6741371154785156, 4.576622486114502, 5.479107856750488, 6.381593227386475, 7.284078598022461, 8.186563491821289, 9.089049339294434, 9.991535186767578, 10.894020080566406, 11.796504974365234, 12.698990821838379, 13.601476669311523, 14.503961563110352, 15.40644645690918, 16.30893325805664, 17.21141815185547, 18.113903045654297, 19.016387939453125, 19.918872833251953, 20.821359634399414, 21.723844528198242, 22.62632942199707, 23.52881622314453, 24.43130111694336, 25.333786010742188, 26.236270904541016, 27.138755798339844, 28.041242599487305, 28.943727493286133, 29.84621238708496, 30.748699188232422, 31.65118408203125, 32.55366897583008]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 6.0, 14.0, 34.0, 47.0, 57.0, 103.0, 164.0, 238.0, 368.0, 601.0, 1012.0, 1526.0, 2387.0, 3973.0, 6604.0, 10788.0, 18430.0, 31089.0, 53124.0, 90123.0, 150711.0, 244683.0, 369966.0, 506163.0, 598654.0, 598541.0, 507836.0, 374785.0, 248451.0, 152631.0, 91274.0, 53119.0, 31002.0, 18114.0, 10943.0, 6392.0, 4002.0, 2356.0, 1415.0, 879.0, 618.0, 338.0, 243.0, 172.0, 106.0, 62.0, 51.0, 30.0, 17.0, 12.0, 14.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 3.0], "bins": [-17.6875, -17.1171875, -16.546875, -15.9765625, -15.40625, -14.8359375, -14.265625, -13.6953125, -13.125, -12.5546875, -11.984375, -11.4140625, -10.84375, -10.2734375, -9.703125, -9.1328125, -8.5625, -7.9921875, -7.421875, -6.8515625, -6.28125, -5.7109375, -5.140625, -4.5703125, -4.0, -3.4296875, -2.859375, -2.2890625, -1.71875, -1.1484375, -0.578125, -0.0078125, 0.5625, 1.1328125, 1.703125, 2.2734375, 2.84375, 3.4140625, 3.984375, 4.5546875, 5.125, 5.6953125, 6.265625, 6.8359375, 7.40625, 7.9765625, 8.546875, 9.1171875, 9.6875, 10.2578125, 10.828125, 11.3984375, 11.96875, 12.5390625, 13.109375, 13.6796875, 14.25, 14.8203125, 15.390625, 15.9609375, 16.53125, 17.1015625, 17.671875, 18.2421875, 18.8125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 5.0, 1.0, 3.0, 4.0, 9.0, 5.0, 6.0, 9.0, 12.0, 9.0, 12.0, 19.0, 23.0, 29.0, 21.0, 34.0, 32.0, 24.0, 24.0, 38.0, 28.0, 37.0, 34.0, 32.0, 39.0, 39.0, 34.0, 38.0, 38.0, 40.0, 42.0, 23.0, 28.0, 34.0, 33.0, 33.0, 26.0, 18.0, 18.0, 12.0, 7.0, 8.0, 4.0, 7.0, 10.0, 4.0, 8.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.46875, -18.78173828125, -18.0947265625, -17.40771484375, -16.720703125, -16.03369140625, -15.3466796875, -14.65966796875, -13.97265625, -13.28564453125, -12.5986328125, -11.91162109375, -11.224609375, -10.53759765625, -9.8505859375, -9.16357421875, -8.4765625, -7.78955078125, -7.1025390625, -6.41552734375, -5.728515625, -5.04150390625, -4.3544921875, -3.66748046875, -2.98046875, -2.29345703125, -1.6064453125, -0.91943359375, -0.232421875, 0.45458984375, 1.1416015625, 1.82861328125, 2.515625, 3.20263671875, 3.8896484375, 4.57666015625, 5.263671875, 5.95068359375, 6.6376953125, 7.32470703125, 8.01171875, 8.69873046875, 9.3857421875, 10.07275390625, 10.759765625, 11.44677734375, 12.1337890625, 12.82080078125, 13.5078125, 14.19482421875, 14.8818359375, 15.56884765625, 16.255859375, 16.94287109375, 17.6298828125, 18.31689453125, 19.00390625, 19.69091796875, 20.3779296875, 21.06494140625, 21.751953125, 22.43896484375, 23.1259765625, 23.81298828125, 24.5]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 5.0, 6.0, 14.0, 14.0, 37.0, 47.0, 61.0, 89.0, 159.0, 188.0, 324.0, 523.0, 852.0, 1225.0, 2020.0, 3090.0, 4594.0, 7431.0, 11670.0, 18027.0, 28873.0, 44529.0, 68998.0, 105704.0, 157994.0, 226122.0, 308528.0, 395126.0, 463484.0, 490183.0, 462684.0, 396481.0, 309245.0, 226935.0, 159234.0, 105779.0, 69526.0, 45354.0, 28496.0, 18504.0, 11735.0, 7391.0, 4671.0, 2971.0, 1887.0, 1248.0, 813.0, 510.0, 329.0, 195.0, 146.0, 83.0, 62.0, 38.0, 22.0, 10.0, 12.0, 5.0, 8.0, 1.0, 4.0], "bins": [-16.59375, -16.083251953125, -15.57275390625, -15.062255859375, -14.5517578125, -14.041259765625, -13.53076171875, -13.020263671875, -12.509765625, -11.999267578125, -11.48876953125, -10.978271484375, -10.4677734375, -9.957275390625, -9.44677734375, -8.936279296875, -8.42578125, -7.915283203125, -7.40478515625, -6.894287109375, -6.3837890625, -5.873291015625, -5.36279296875, -4.852294921875, -4.341796875, -3.831298828125, -3.32080078125, -2.810302734375, -2.2998046875, -1.789306640625, -1.27880859375, -0.768310546875, -0.2578125, 0.252685546875, 0.76318359375, 1.273681640625, 1.7841796875, 2.294677734375, 2.80517578125, 3.315673828125, 3.826171875, 4.336669921875, 4.84716796875, 5.357666015625, 5.8681640625, 6.378662109375, 6.88916015625, 7.399658203125, 7.91015625, 8.420654296875, 8.93115234375, 9.441650390625, 9.9521484375, 10.462646484375, 10.97314453125, 11.483642578125, 11.994140625, 12.504638671875, 13.01513671875, 13.525634765625, 14.0361328125, 14.546630859375, 15.05712890625, 15.567626953125, 16.078125]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 11.0, 14.0, 20.0, 19.0, 22.0, 35.0, 48.0, 28.0, 64.0, 89.0, 106.0, 123.0, 132.0, 135.0, 163.0, 197.0, 182.0, 227.0, 175.0, 217.0, 245.0, 237.0, 208.0, 207.0, 170.0, 146.0, 145.0, 127.0, 92.0, 85.0, 77.0, 64.0, 53.0, 45.0, 35.0, 31.0, 21.0, 23.0, 13.0, 15.0, 12.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.515625, -9.2093505859375, -8.903076171875, -8.5968017578125, -8.29052734375, -7.9842529296875, -7.677978515625, -7.3717041015625, -7.0654296875, -6.7591552734375, -6.452880859375, -6.1466064453125, -5.84033203125, -5.5340576171875, -5.227783203125, -4.9215087890625, -4.615234375, -4.3089599609375, -4.002685546875, -3.6964111328125, -3.39013671875, -3.0838623046875, -2.777587890625, -2.4713134765625, -2.1650390625, -1.8587646484375, -1.552490234375, -1.2462158203125, -0.93994140625, -0.6336669921875, -0.327392578125, -0.0211181640625, 0.28515625, 0.5914306640625, 0.897705078125, 1.2039794921875, 1.51025390625, 1.8165283203125, 2.122802734375, 2.4290771484375, 2.7353515625, 3.0416259765625, 3.347900390625, 3.6541748046875, 3.96044921875, 4.2667236328125, 4.572998046875, 4.8792724609375, 5.185546875, 5.4918212890625, 5.798095703125, 6.1043701171875, 6.41064453125, 6.7169189453125, 7.023193359375, 7.3294677734375, 7.6357421875, 7.9420166015625, 8.248291015625, 8.5545654296875, 8.86083984375, 9.1671142578125, 9.473388671875, 9.7796630859375, 10.0859375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 5.0, 12.0, 15.0, 9.0, 15.0, 19.0, 17.0, 27.0, 25.0, 35.0, 36.0, 31.0, 37.0, 43.0, 47.0, 39.0, 43.0, 54.0, 48.0, 48.0, 55.0, 51.0, 45.0, 34.0, 23.0, 29.0, 25.0, 20.0, 26.0, 10.0, 10.0, 12.0, 7.0, 9.0, 7.0, 8.0, 2.0, 3.0, 2.0, 0.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.60715103149414, -23.904407501220703, -23.201663970947266, -22.498920440673828, -21.79617691040039, -21.093433380126953, -20.390689849853516, -19.687946319580078, -18.98520278930664, -18.282459259033203, -17.579715728759766, -16.876972198486328, -16.17422866821289, -15.471485137939453, -14.768741607666016, -14.065998077392578, -13.36325454711914, -12.660511016845703, -11.957767486572266, -11.255023956298828, -10.55228042602539, -9.849536895751953, -9.146793365478516, -8.444049835205078, -7.741306304931641, -7.038562774658203, -6.335819244384766, -5.633075714111328, -4.930332183837891, -4.227588653564453, -3.5248451232910156, -2.822101593017578, -2.119356155395508, -1.4166126251220703, -0.7138690948486328, -0.011125564575195312, 0.6916179656982422, 1.3943614959716797, 2.097105026245117, 2.7998485565185547, 3.502592086791992, 4.20533561706543, 4.908079147338867, 5.610822677612305, 6.313566207885742, 7.01630973815918, 7.719053268432617, 8.421796798706055, 9.124540328979492, 9.82728385925293, 10.530027389526367, 11.232770919799805, 11.935514450073242, 12.63825798034668, 13.341001510620117, 14.043745040893555, 14.746488571166992, 15.44923210144043, 16.151975631713867, 16.854719161987305, 17.557462692260742, 18.26020622253418, 18.962949752807617, 19.665693283081055, 20.368436813354492]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 4.0, 4.0, 9.0, 10.0, 16.0, 10.0, 13.0, 15.0, 28.0, 23.0, 18.0, 27.0, 29.0, 29.0, 29.0, 34.0, 27.0, 37.0, 34.0, 31.0, 40.0, 51.0, 44.0, 48.0, 39.0, 39.0, 30.0, 38.0, 40.0, 31.0, 25.0, 11.0, 22.0, 19.0, 20.0, 17.0, 11.0, 8.0, 6.0, 5.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.19291114807129, -25.311534881591797, -24.430158615112305, -23.54878044128418, -22.667404174804688, -21.786027908325195, -20.904651641845703, -20.023273468017578, -19.141897201538086, -18.260520935058594, -17.3791446685791, -16.497766494750977, -15.616390228271484, -14.735013961791992, -13.8536376953125, -12.972260475158691, -12.0908842086792, -11.209507942199707, -10.328130722045898, -9.446754455566406, -8.565377235412598, -7.6840009689331055, -6.802624225616455, -5.921247482299805, -5.039870738983154, -4.158493995666504, -3.2771172523498535, -2.3957407474517822, -1.5143640041351318, -0.6329874992370605, 0.24838924407958984, 1.1297659873962402, 2.0111427307128906, 2.892519474029541, 3.7738962173461914, 4.655272483825684, 5.536649703979492, 6.418025970458984, 7.299402713775635, 8.180779457092285, 9.062156677246094, 9.943532943725586, 10.824910163879395, 11.706286430358887, 12.587663650512695, 13.469039916992188, 14.35041618347168, 15.231793403625488, 16.113170623779297, 16.99454689025879, 17.87592315673828, 18.757301330566406, 19.6386775970459, 20.52005386352539, 21.401430130004883, 22.282806396484375, 23.164182662963867, 24.04555892944336, 24.92693519592285, 25.808313369750977, 26.68968963623047, 27.57106590270996, 28.452442169189453, 29.333820343017578, 30.21519660949707]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 16.0, 25.0, 35.0, 60.0, 81.0, 114.0, 149.0, 222.0, 331.0, 513.0, 732.0, 1132.0, 1706.0, 2603.0, 4090.0, 6378.0, 10305.0, 16526.0, 26816.0, 42939.0, 70304.0, 108693.0, 153279.0, 174713.0, 148326.0, 103687.0, 65836.0, 40887.0, 25210.0, 15629.0, 9957.0, 6150.0, 3779.0, 2472.0, 1629.0, 1018.0, 692.0, 483.0, 328.0, 210.0, 154.0, 96.0, 76.0, 57.0, 28.0, 22.0, 19.0, 23.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 3.0], "bins": [-17.828125, -17.278564453125, -16.72900390625, -16.179443359375, -15.6298828125, -15.080322265625, -14.53076171875, -13.981201171875, -13.431640625, -12.882080078125, -12.33251953125, -11.782958984375, -11.2333984375, -10.683837890625, -10.13427734375, -9.584716796875, -9.03515625, -8.485595703125, -7.93603515625, -7.386474609375, -6.8369140625, -6.287353515625, -5.73779296875, -5.188232421875, -4.638671875, -4.089111328125, -3.53955078125, -2.989990234375, -2.4404296875, -1.890869140625, -1.34130859375, -0.791748046875, -0.2421875, 0.307373046875, 0.85693359375, 1.406494140625, 1.9560546875, 2.505615234375, 3.05517578125, 3.604736328125, 4.154296875, 4.703857421875, 5.25341796875, 5.802978515625, 6.3525390625, 6.902099609375, 7.45166015625, 8.001220703125, 8.55078125, 9.100341796875, 9.64990234375, 10.199462890625, 10.7490234375, 11.298583984375, 11.84814453125, 12.397705078125, 12.947265625, 13.496826171875, 14.04638671875, 14.595947265625, 15.1455078125, 15.695068359375, 16.24462890625, 16.794189453125, 17.34375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 5.0, 8.0, 10.0, 14.0, 6.0, 17.0, 13.0, 21.0, 25.0, 27.0, 32.0, 22.0, 29.0, 31.0, 36.0, 39.0, 33.0, 35.0, 46.0, 48.0, 50.0, 51.0, 34.0, 32.0, 41.0, 32.0, 36.0, 36.0, 31.0, 21.0, 20.0, 23.0, 14.0, 18.0, 9.0, 9.0, 11.0, 3.0, 6.0, 8.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-26.875, -25.9609375, -25.046875, -24.1328125, -23.21875, -22.3046875, -21.390625, -20.4765625, -19.5625, -18.6484375, -17.734375, -16.8203125, -15.90625, -14.9921875, -14.078125, -13.1640625, -12.25, -11.3359375, -10.421875, -9.5078125, -8.59375, -7.6796875, -6.765625, -5.8515625, -4.9375, -4.0234375, -3.109375, -2.1953125, -1.28125, -0.3671875, 0.546875, 1.4609375, 2.375, 3.2890625, 4.203125, 5.1171875, 6.03125, 6.9453125, 7.859375, 8.7734375, 9.6875, 10.6015625, 11.515625, 12.4296875, 13.34375, 14.2578125, 15.171875, 16.0859375, 17.0, 17.9140625, 18.828125, 19.7421875, 20.65625, 21.5703125, 22.484375, 23.3984375, 24.3125, 25.2265625, 26.140625, 27.0546875, 27.96875, 28.8828125, 29.796875, 30.7109375, 31.625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 6.0, 8.0, 19.0, 30.0, 47.0, 67.0, 93.0, 106.0, 194.0, 262.0, 387.0, 610.0, 946.0, 1503.0, 2228.0, 3578.0, 5673.0, 9014.0, 14482.0, 24076.0, 39938.0, 68235.0, 114405.0, 174177.0, 198581.0, 152698.0, 94766.0, 56307.0, 33066.0, 19813.0, 12109.0, 7640.0, 4704.0, 3082.0, 1951.0, 1293.0, 827.0, 534.0, 404.0, 242.0, 147.0, 106.0, 68.0, 38.0, 31.0, 17.0, 18.0, 7.0, 8.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0], "bins": [-20.25, -19.64208984375, -19.0341796875, -18.42626953125, -17.818359375, -17.21044921875, -16.6025390625, -15.99462890625, -15.38671875, -14.77880859375, -14.1708984375, -13.56298828125, -12.955078125, -12.34716796875, -11.7392578125, -11.13134765625, -10.5234375, -9.91552734375, -9.3076171875, -8.69970703125, -8.091796875, -7.48388671875, -6.8759765625, -6.26806640625, -5.66015625, -5.05224609375, -4.4443359375, -3.83642578125, -3.228515625, -2.62060546875, -2.0126953125, -1.40478515625, -0.796875, -0.18896484375, 0.4189453125, 1.02685546875, 1.634765625, 2.24267578125, 2.8505859375, 3.45849609375, 4.06640625, 4.67431640625, 5.2822265625, 5.89013671875, 6.498046875, 7.10595703125, 7.7138671875, 8.32177734375, 8.9296875, 9.53759765625, 10.1455078125, 10.75341796875, 11.361328125, 11.96923828125, 12.5771484375, 13.18505859375, 13.79296875, 14.40087890625, 15.0087890625, 15.61669921875, 16.224609375, 16.83251953125, 17.4404296875, 18.04833984375, 18.65625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 8.0, 3.0, 2.0, 5.0, 13.0, 15.0, 15.0, 19.0, 23.0, 22.0, 20.0, 22.0, 26.0, 22.0, 22.0, 39.0, 39.0, 27.0, 42.0, 44.0, 30.0, 50.0, 38.0, 36.0, 30.0, 30.0, 33.0, 31.0, 28.0, 19.0, 26.0, 24.0, 28.0, 27.0, 20.0, 18.0, 21.0, 12.0, 19.0, 10.0, 5.0, 9.0, 8.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-17.65625, -17.11669921875, -16.5771484375, -16.03759765625, -15.498046875, -14.95849609375, -14.4189453125, -13.87939453125, -13.33984375, -12.80029296875, -12.2607421875, -11.72119140625, -11.181640625, -10.64208984375, -10.1025390625, -9.56298828125, -9.0234375, -8.48388671875, -7.9443359375, -7.40478515625, -6.865234375, -6.32568359375, -5.7861328125, -5.24658203125, -4.70703125, -4.16748046875, -3.6279296875, -3.08837890625, -2.548828125, -2.00927734375, -1.4697265625, -0.93017578125, -0.390625, 0.14892578125, 0.6884765625, 1.22802734375, 1.767578125, 2.30712890625, 2.8466796875, 3.38623046875, 3.92578125, 4.46533203125, 5.0048828125, 5.54443359375, 6.083984375, 6.62353515625, 7.1630859375, 7.70263671875, 8.2421875, 8.78173828125, 9.3212890625, 9.86083984375, 10.400390625, 10.93994140625, 11.4794921875, 12.01904296875, 12.55859375, 13.09814453125, 13.6376953125, 14.17724609375, 14.716796875, 15.25634765625, 15.7958984375, 16.33544921875, 16.875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 5.0, 18.0, 13.0, 16.0, 37.0, 46.0, 70.0, 95.0, 118.0, 166.0, 246.0, 340.0, 485.0, 736.0, 1118.0, 1760.0, 2606.0, 4044.0, 6386.0, 10644.0, 17462.0, 30885.0, 56423.0, 108053.0, 199440.0, 248642.0, 163915.0, 85484.0, 45168.0, 25309.0, 14582.0, 8749.0, 5399.0, 3414.0, 2205.0, 1508.0, 920.0, 611.0, 444.0, 308.0, 189.0, 142.0, 101.0, 75.0, 54.0, 36.0, 22.0, 17.0, 19.0, 9.0, 8.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.5703125, -9.2647705078125, -8.959228515625, -8.6536865234375, -8.34814453125, -8.0426025390625, -7.737060546875, -7.4315185546875, -7.1259765625, -6.8204345703125, -6.514892578125, -6.2093505859375, -5.90380859375, -5.5982666015625, -5.292724609375, -4.9871826171875, -4.681640625, -4.3760986328125, -4.070556640625, -3.7650146484375, -3.45947265625, -3.1539306640625, -2.848388671875, -2.5428466796875, -2.2373046875, -1.9317626953125, -1.626220703125, -1.3206787109375, -1.01513671875, -0.7095947265625, -0.404052734375, -0.0985107421875, 0.20703125, 0.5125732421875, 0.818115234375, 1.1236572265625, 1.42919921875, 1.7347412109375, 2.040283203125, 2.3458251953125, 2.6513671875, 2.9569091796875, 3.262451171875, 3.5679931640625, 3.87353515625, 4.1790771484375, 4.484619140625, 4.7901611328125, 5.095703125, 5.4012451171875, 5.706787109375, 6.0123291015625, 6.31787109375, 6.6234130859375, 6.928955078125, 7.2344970703125, 7.5400390625, 7.8455810546875, 8.151123046875, 8.4566650390625, 8.76220703125, 9.0677490234375, 9.373291015625, 9.6788330078125, 9.984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 7.0, 7.0, 7.0, 21.0, 20.0, 24.0, 31.0, 72.0, 109.0, 135.0, 182.0, 131.0, 96.0, 58.0, 28.0, 19.0, 10.0, 11.0, 3.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014295578002929688, -0.0013772249221801758, -0.0013248920440673828, -0.0012725591659545898, -0.0012202262878417969, -0.001167893409729004, -0.001115560531616211, -0.001063227653503418, -0.001010894775390625, -0.000958561897277832, -0.0009062290191650391, -0.0008538961410522461, -0.0008015632629394531, -0.0007492303848266602, -0.0006968975067138672, -0.0006445646286010742, -0.0005922317504882812, -0.0005398988723754883, -0.0004875659942626953, -0.00043523311614990234, -0.0003829002380371094, -0.0003305673599243164, -0.00027823448181152344, -0.00022590160369873047, -0.0001735687255859375, -0.00012123584747314453, -6.890296936035156e-05, -1.6570091247558594e-05, 3.5762786865234375e-05, 8.809566497802734e-05, 0.0001404285430908203, 0.00019276142120361328, 0.00024509429931640625, 0.0002974271774291992, 0.0003497600555419922, 0.00040209293365478516, 0.0004544258117675781, 0.0005067586898803711, 0.0005590915679931641, 0.000611424446105957, 0.00066375732421875, 0.000716090202331543, 0.0007684230804443359, 0.0008207559585571289, 0.0008730888366699219, 0.0009254217147827148, 0.0009777545928955078, 0.0010300874710083008, 0.0010824203491210938, 0.0011347532272338867, 0.0011870861053466797, 0.0012394189834594727, 0.0012917518615722656, 0.0013440847396850586, 0.0013964176177978516, 0.0014487504959106445, 0.0015010833740234375, 0.0015534162521362305, 0.0016057491302490234, 0.0016580820083618164, 0.0017104148864746094, 0.0017627477645874023, 0.0018150806427001953, 0.0018674135208129883, 0.0019197463989257812]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 12.0, 9.0, 14.0, 32.0, 43.0, 60.0, 90.0, 205.0, 287.0, 436.0, 690.0, 996.0, 1615.0, 2496.0, 3930.0, 6003.0, 9401.0, 14683.0, 23275.0, 36741.0, 57589.0, 89971.0, 133555.0, 167673.0, 160394.0, 120435.0, 79594.0, 50605.0, 31585.0, 20230.0, 12859.0, 8162.0, 5274.0, 3448.0, 2172.0, 1419.0, 906.0, 649.0, 386.0, 238.0, 134.0, 99.0, 60.0, 39.0, 31.0, 11.0, 7.0, 9.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1796875, -7.91455078125, -7.6494140625, -7.38427734375, -7.119140625, -6.85400390625, -6.5888671875, -6.32373046875, -6.05859375, -5.79345703125, -5.5283203125, -5.26318359375, -4.998046875, -4.73291015625, -4.4677734375, -4.20263671875, -3.9375, -3.67236328125, -3.4072265625, -3.14208984375, -2.876953125, -2.61181640625, -2.3466796875, -2.08154296875, -1.81640625, -1.55126953125, -1.2861328125, -1.02099609375, -0.755859375, -0.49072265625, -0.2255859375, 0.03955078125, 0.3046875, 0.56982421875, 0.8349609375, 1.10009765625, 1.365234375, 1.63037109375, 1.8955078125, 2.16064453125, 2.42578125, 2.69091796875, 2.9560546875, 3.22119140625, 3.486328125, 3.75146484375, 4.0166015625, 4.28173828125, 4.546875, 4.81201171875, 5.0771484375, 5.34228515625, 5.607421875, 5.87255859375, 6.1376953125, 6.40283203125, 6.66796875, 6.93310546875, 7.1982421875, 7.46337890625, 7.728515625, 7.99365234375, 8.2587890625, 8.52392578125, 8.7890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 7.0, 3.0, 3.0, 5.0, 9.0, 5.0, 15.0, 12.0, 10.0, 16.0, 20.0, 25.0, 21.0, 33.0, 43.0, 59.0, 49.0, 59.0, 71.0, 54.0, 61.0, 65.0, 45.0, 62.0, 41.0, 35.0, 21.0, 29.0, 17.0, 21.0, 14.0, 7.0, 13.0, 10.0, 16.0, 8.0, 3.0, 5.0, 4.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.74609375, -3.628570556640625, -3.51104736328125, -3.393524169921875, -3.2760009765625, -3.158477783203125, -3.04095458984375, -2.923431396484375, -2.805908203125, -2.688385009765625, -2.57086181640625, -2.453338623046875, -2.3358154296875, -2.218292236328125, -2.10076904296875, -1.983245849609375, -1.86572265625, -1.748199462890625, -1.63067626953125, -1.513153076171875, -1.3956298828125, -1.278106689453125, -1.16058349609375, -1.043060302734375, -0.925537109375, -0.808013916015625, -0.69049072265625, -0.572967529296875, -0.4554443359375, -0.337921142578125, -0.22039794921875, -0.102874755859375, 0.0146484375, 0.132171630859375, 0.24969482421875, 0.367218017578125, 0.4847412109375, 0.602264404296875, 0.71978759765625, 0.837310791015625, 0.954833984375, 1.072357177734375, 1.18988037109375, 1.307403564453125, 1.4249267578125, 1.542449951171875, 1.65997314453125, 1.777496337890625, 1.89501953125, 2.012542724609375, 2.13006591796875, 2.247589111328125, 2.3651123046875, 2.482635498046875, 2.60015869140625, 2.717681884765625, 2.835205078125, 2.952728271484375, 3.07025146484375, 3.187774658203125, 3.3052978515625, 3.422821044921875, 3.54034423828125, 3.657867431640625, 3.775390625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 7.0, 5.0, 7.0, 8.0, 11.0, 14.0, 19.0, 22.0, 24.0, 17.0, 27.0, 31.0, 22.0, 30.0, 40.0, 47.0, 46.0, 58.0, 46.0, 34.0, 55.0, 55.0, 49.0, 47.0, 43.0, 31.0, 26.0, 41.0, 23.0, 27.0, 14.0, 8.0, 15.0, 5.0, 7.0, 9.0, 10.0, 10.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.748291015625, -23.056793212890625, -22.365293502807617, -21.67379379272461, -20.982295989990234, -20.29079818725586, -19.59929847717285, -18.907798767089844, -18.21630096435547, -17.524803161621094, -16.833303451538086, -16.141803741455078, -15.450305938720703, -14.758807182312012, -14.06730842590332, -13.375809669494629, -12.684310913085938, -11.992812156677246, -11.301313400268555, -10.609814643859863, -9.918315887451172, -9.22681713104248, -8.535318374633789, -7.843819618225098, -7.152320861816406, -6.460822105407715, -5.769323348999023, -5.077824592590332, -4.386325836181641, -3.694827079772949, -3.003328323364258, -2.3118295669555664, -1.620330810546875, -0.9288320541381836, -0.2373332977294922, 0.4541654586791992, 1.1456642150878906, 1.837162971496582, 2.5286617279052734, 3.220160484313965, 3.9116592407226562, 4.603157997131348, 5.294656753540039, 5.9861555099487305, 6.677654266357422, 7.369153022766113, 8.060651779174805, 8.752150535583496, 9.443649291992188, 10.135148048400879, 10.82664680480957, 11.518145561218262, 12.209644317626953, 12.901143074035645, 13.592641830444336, 14.284140586853027, 14.975639343261719, 15.66713809967041, 16.3586368560791, 17.05013656616211, 17.741634368896484, 18.43313217163086, 19.124631881713867, 19.816131591796875, 20.50762939453125]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 3.0, 6.0, 2.0, 4.0, 4.0, 5.0, 4.0, 9.0, 14.0, 17.0, 13.0, 18.0, 12.0, 32.0, 23.0, 26.0, 21.0, 31.0, 26.0, 29.0, 43.0, 28.0, 38.0, 27.0, 36.0, 62.0, 39.0, 47.0, 45.0, 34.0, 35.0, 33.0, 43.0, 30.0, 22.0, 25.0, 17.0, 20.0, 23.0, 10.0, 12.0, 9.0, 8.0, 8.0, 2.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.028541564941406, -25.133867263793945, -24.239192962646484, -23.34451675415039, -22.44984245300293, -21.55516815185547, -20.660493850708008, -19.765819549560547, -18.871143341064453, -17.976469039916992, -17.08179473876953, -16.187118530273438, -15.292444229125977, -14.397769927978516, -13.503095626831055, -12.608420372009277, -11.713746070861816, -10.819071769714355, -9.924396514892578, -9.029722213745117, -8.13504695892334, -7.240372657775879, -6.34569787979126, -5.451023101806641, -4.5563483238220215, -3.6616735458374023, -2.766998767852783, -1.8723242282867432, -0.977649450302124, -0.08297491073608398, 0.8116998672485352, 1.7063746452331543, 2.6010494232177734, 3.4957242012023926, 4.390398979187012, 5.285073280334473, 6.17974853515625, 7.074422836303711, 7.96909761428833, 8.86377239227295, 9.758447647094727, 10.653121948242188, 11.547797203063965, 12.442471504211426, 13.337146759033203, 14.231821060180664, 15.126495361328125, 16.02117156982422, 16.915843963623047, 17.810518264770508, 18.70519256591797, 19.599868774414062, 20.494543075561523, 21.389217376708984, 22.283891677856445, 23.178565979003906, 24.0732421875, 24.96791648864746, 25.862590789794922, 26.757266998291016, 27.651941299438477, 28.546615600585938, 29.4412899017334, 30.33596420288086, 31.230640411376953]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 8.0, 6.0, 9.0, 11.0, 25.0, 41.0, 52.0, 95.0, 132.0, 200.0, 316.0, 492.0, 756.0, 1158.0, 1733.0, 2616.0, 3991.0, 6040.0, 8907.0, 13242.0, 19252.0, 27370.0, 38099.0, 51118.0, 66181.0, 81243.0, 92243.0, 100360.0, 101183.0, 94545.0, 82923.0, 68301.0, 53250.0, 40316.0, 28949.0, 20423.0, 14267.0, 9785.0, 6430.0, 4270.0, 2787.0, 1905.0, 1199.0, 808.0, 497.0, 332.0, 251.0, 147.0, 101.0, 86.0, 49.0, 25.0, 11.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-13.78125, -13.337890625, -12.89453125, -12.451171875, -12.0078125, -11.564453125, -11.12109375, -10.677734375, -10.234375, -9.791015625, -9.34765625, -8.904296875, -8.4609375, -8.017578125, -7.57421875, -7.130859375, -6.6875, -6.244140625, -5.80078125, -5.357421875, -4.9140625, -4.470703125, -4.02734375, -3.583984375, -3.140625, -2.697265625, -2.25390625, -1.810546875, -1.3671875, -0.923828125, -0.48046875, -0.037109375, 0.40625, 0.849609375, 1.29296875, 1.736328125, 2.1796875, 2.623046875, 3.06640625, 3.509765625, 3.953125, 4.396484375, 4.83984375, 5.283203125, 5.7265625, 6.169921875, 6.61328125, 7.056640625, 7.5, 7.943359375, 8.38671875, 8.830078125, 9.2734375, 9.716796875, 10.16015625, 10.603515625, 11.046875, 11.490234375, 11.93359375, 12.376953125, 12.8203125, 13.263671875, 13.70703125, 14.150390625, 14.59375]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 5.0, 15.0, 23.0, 16.0, 23.0, 21.0, 18.0, 29.0, 32.0, 25.0, 27.0, 28.0, 31.0, 44.0, 34.0, 36.0, 38.0, 32.0, 46.0, 35.0, 51.0, 50.0, 35.0, 34.0, 33.0, 28.0, 27.0, 23.0, 23.0, 18.0, 15.0, 21.0, 16.0, 13.0, 2.0, 5.0, 2.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.125, -24.23681640625, -23.3486328125, -22.46044921875, -21.572265625, -20.68408203125, -19.7958984375, -18.90771484375, -18.01953125, -17.13134765625, -16.2431640625, -15.35498046875, -14.466796875, -13.57861328125, -12.6904296875, -11.80224609375, -10.9140625, -10.02587890625, -9.1376953125, -8.24951171875, -7.361328125, -6.47314453125, -5.5849609375, -4.69677734375, -3.80859375, -2.92041015625, -2.0322265625, -1.14404296875, -0.255859375, 0.63232421875, 1.5205078125, 2.40869140625, 3.296875, 4.18505859375, 5.0732421875, 5.96142578125, 6.849609375, 7.73779296875, 8.6259765625, 9.51416015625, 10.40234375, 11.29052734375, 12.1787109375, 13.06689453125, 13.955078125, 14.84326171875, 15.7314453125, 16.61962890625, 17.5078125, 18.39599609375, 19.2841796875, 20.17236328125, 21.060546875, 21.94873046875, 22.8369140625, 23.72509765625, 24.61328125, 25.50146484375, 26.3896484375, 27.27783203125, 28.166015625, 29.05419921875, 29.9423828125, 30.83056640625, 31.71875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 6.0, 7.0, 7.0, 10.0, 21.0, 23.0, 43.0, 64.0, 84.0, 135.0, 242.0, 337.0, 561.0, 843.0, 1372.0, 2183.0, 3543.0, 5776.0, 9352.0, 14953.0, 24029.0, 37038.0, 56241.0, 80864.0, 105945.0, 126433.0, 133264.0, 122356.0, 101699.0, 75787.0, 52377.0, 34616.0, 22066.0, 13883.0, 8425.0, 5257.0, 3183.0, 2055.0, 1303.0, 817.0, 459.0, 322.0, 182.0, 124.0, 98.0, 62.0, 38.0, 36.0, 12.0, 15.0, 10.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.046875, -17.41162109375, -16.7763671875, -16.14111328125, -15.505859375, -14.87060546875, -14.2353515625, -13.60009765625, -12.96484375, -12.32958984375, -11.6943359375, -11.05908203125, -10.423828125, -9.78857421875, -9.1533203125, -8.51806640625, -7.8828125, -7.24755859375, -6.6123046875, -5.97705078125, -5.341796875, -4.70654296875, -4.0712890625, -3.43603515625, -2.80078125, -2.16552734375, -1.5302734375, -0.89501953125, -0.259765625, 0.37548828125, 1.0107421875, 1.64599609375, 2.28125, 2.91650390625, 3.5517578125, 4.18701171875, 4.822265625, 5.45751953125, 6.0927734375, 6.72802734375, 7.36328125, 7.99853515625, 8.6337890625, 9.26904296875, 9.904296875, 10.53955078125, 11.1748046875, 11.81005859375, 12.4453125, 13.08056640625, 13.7158203125, 14.35107421875, 14.986328125, 15.62158203125, 16.2568359375, 16.89208984375, 17.52734375, 18.16259765625, 18.7978515625, 19.43310546875, 20.068359375, 20.70361328125, 21.3388671875, 21.97412109375, 22.609375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 1.0, 8.0, 9.0, 9.0, 5.0, 17.0, 21.0, 22.0, 25.0, 29.0, 28.0, 21.0, 29.0, 33.0, 29.0, 41.0, 39.0, 39.0, 36.0, 54.0, 41.0, 44.0, 49.0, 31.0, 31.0, 36.0, 32.0, 30.0, 41.0, 23.0, 19.0, 17.0, 18.0, 24.0, 14.0, 15.0, 9.0, 7.0, 5.0, 10.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.093994140625, -16.43798828125, -15.781982421875, -15.1259765625, -14.469970703125, -13.81396484375, -13.157958984375, -12.501953125, -11.845947265625, -11.18994140625, -10.533935546875, -9.8779296875, -9.221923828125, -8.56591796875, -7.909912109375, -7.25390625, -6.597900390625, -5.94189453125, -5.285888671875, -4.6298828125, -3.973876953125, -3.31787109375, -2.661865234375, -2.005859375, -1.349853515625, -0.69384765625, -0.037841796875, 0.6181640625, 1.274169921875, 1.93017578125, 2.586181640625, 3.2421875, 3.898193359375, 4.55419921875, 5.210205078125, 5.8662109375, 6.522216796875, 7.17822265625, 7.834228515625, 8.490234375, 9.146240234375, 9.80224609375, 10.458251953125, 11.1142578125, 11.770263671875, 12.42626953125, 13.082275390625, 13.73828125, 14.394287109375, 15.05029296875, 15.706298828125, 16.3623046875, 17.018310546875, 17.67431640625, 18.330322265625, 18.986328125, 19.642333984375, 20.29833984375, 20.954345703125, 21.6103515625, 22.266357421875, 22.92236328125, 23.578369140625, 24.234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 9.0, 6.0, 15.0, 13.0, 29.0, 36.0, 47.0, 69.0, 99.0, 159.0, 214.0, 349.0, 500.0, 779.0, 1380.0, 2047.0, 3404.0, 5782.0, 9679.0, 17402.0, 30250.0, 54933.0, 92629.0, 138973.0, 174858.0, 171150.0, 134679.0, 87971.0, 52099.0, 29230.0, 16318.0, 9385.0, 5471.0, 3169.0, 1934.0, 1232.0, 730.0, 530.0, 323.0, 212.0, 148.0, 90.0, 63.0, 42.0, 29.0, 33.0, 18.0, 12.0, 11.0, 4.0, 11.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-12.9375, -12.5325927734375, -12.127685546875, -11.7227783203125, -11.31787109375, -10.9129638671875, -10.508056640625, -10.1031494140625, -9.6982421875, -9.2933349609375, -8.888427734375, -8.4835205078125, -8.07861328125, -7.6737060546875, -7.268798828125, -6.8638916015625, -6.458984375, -6.0540771484375, -5.649169921875, -5.2442626953125, -4.83935546875, -4.4344482421875, -4.029541015625, -3.6246337890625, -3.2197265625, -2.8148193359375, -2.409912109375, -2.0050048828125, -1.60009765625, -1.1951904296875, -0.790283203125, -0.3853759765625, 0.01953125, 0.4244384765625, 0.829345703125, 1.2342529296875, 1.63916015625, 2.0440673828125, 2.448974609375, 2.8538818359375, 3.2587890625, 3.6636962890625, 4.068603515625, 4.4735107421875, 4.87841796875, 5.2833251953125, 5.688232421875, 6.0931396484375, 6.498046875, 6.9029541015625, 7.307861328125, 7.7127685546875, 8.11767578125, 8.5225830078125, 8.927490234375, 9.3323974609375, 9.7373046875, 10.1422119140625, 10.547119140625, 10.9520263671875, 11.35693359375, 11.7618408203125, 12.166748046875, 12.5716552734375, 12.9765625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 7.0, 5.0, 8.0, 10.0, 10.0, 14.0, 12.0, 16.0, 13.0, 23.0, 22.0, 25.0, 27.0, 25.0, 38.0, 39.0, 45.0, 45.0, 33.0, 43.0, 53.0, 50.0, 42.0, 42.0, 47.0, 41.0, 28.0, 24.0, 23.0, 28.0, 30.0, 18.0, 15.0, 17.0, 13.0, 11.0, 9.0, 10.0, 5.0, 9.0, 1.0, 4.0, 3.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0009455680847167969, -0.0009164810180664062, -0.0008873939514160156, -0.000858306884765625, -0.0008292198181152344, -0.0008001327514648438, -0.0007710456848144531, -0.0007419586181640625, -0.0007128715515136719, -0.0006837844848632812, -0.0006546974182128906, -0.0006256103515625, -0.0005965232849121094, -0.0005674362182617188, -0.0005383491516113281, -0.0005092620849609375, -0.0004801750183105469, -0.00045108795166015625, -0.0004220008850097656, -0.000392913818359375, -0.0003638267517089844, -0.00033473968505859375, -0.0003056526184082031, -0.0002765655517578125, -0.0002474784851074219, -0.00021839141845703125, -0.00018930435180664062, -0.00016021728515625, -0.00013113021850585938, -0.00010204315185546875, -7.295608520507812e-05, -4.38690185546875e-05, -1.4781951904296875e-05, 1.430511474609375e-05, 4.3392181396484375e-05, 7.2479248046875e-05, 0.00010156631469726562, 0.00013065338134765625, 0.00015974044799804688, 0.0001888275146484375, 0.00021791458129882812, 0.00024700164794921875, 0.0002760887145996094, 0.00030517578125, 0.0003342628479003906, 0.00036334991455078125, 0.0003924369812011719, 0.0004215240478515625, 0.0004506111145019531, 0.00047969818115234375, 0.0005087852478027344, 0.000537872314453125, 0.0005669593811035156, 0.0005960464477539062, 0.0006251335144042969, 0.0006542205810546875, 0.0006833076477050781, 0.0007123947143554688, 0.0007414817810058594, 0.00077056884765625, 0.0007996559143066406, 0.0008287429809570312, 0.0008578300476074219, 0.0008869171142578125, 0.0009160041809082031]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 9.0, 22.0, 25.0, 34.0, 44.0, 60.0, 98.0, 144.0, 187.0, 304.0, 491.0, 818.0, 1401.0, 2300.0, 4005.0, 7179.0, 12819.0, 23420.0, 41784.0, 70599.0, 110234.0, 149547.0, 169817.0, 155494.0, 117234.0, 76027.0, 45561.0, 25891.0, 14112.0, 7963.0, 4427.0, 2547.0, 1520.0, 895.0, 552.0, 346.0, 223.0, 131.0, 89.0, 59.0, 34.0, 27.0, 27.0, 14.0, 22.0, 7.0, 4.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.015625, -11.6468505859375, -11.278076171875, -10.9093017578125, -10.54052734375, -10.1717529296875, -9.802978515625, -9.4342041015625, -9.0654296875, -8.6966552734375, -8.327880859375, -7.9591064453125, -7.59033203125, -7.2215576171875, -6.852783203125, -6.4840087890625, -6.115234375, -5.7464599609375, -5.377685546875, -5.0089111328125, -4.64013671875, -4.2713623046875, -3.902587890625, -3.5338134765625, -3.1650390625, -2.7962646484375, -2.427490234375, -2.0587158203125, -1.68994140625, -1.3211669921875, -0.952392578125, -0.5836181640625, -0.21484375, 0.1539306640625, 0.522705078125, 0.8914794921875, 1.26025390625, 1.6290283203125, 1.997802734375, 2.3665771484375, 2.7353515625, 3.1041259765625, 3.472900390625, 3.8416748046875, 4.21044921875, 4.5792236328125, 4.947998046875, 5.3167724609375, 5.685546875, 6.0543212890625, 6.423095703125, 6.7918701171875, 7.16064453125, 7.5294189453125, 7.898193359375, 8.2669677734375, 8.6357421875, 9.0045166015625, 9.373291015625, 9.7420654296875, 10.11083984375, 10.4796142578125, 10.848388671875, 11.2171630859375, 11.5859375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 6.0, 10.0, 4.0, 14.0, 10.0, 20.0, 28.0, 35.0, 46.0, 35.0, 38.0, 81.0, 68.0, 66.0, 88.0, 79.0, 63.0, 56.0, 57.0, 34.0, 36.0, 28.0, 19.0, 16.0, 15.0, 10.0, 14.0, 8.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.21484375, -5.95672607421875, -5.6986083984375, -5.44049072265625, -5.182373046875, -4.92425537109375, -4.6661376953125, -4.40802001953125, -4.14990234375, -3.89178466796875, -3.6336669921875, -3.37554931640625, -3.117431640625, -2.85931396484375, -2.6011962890625, -2.34307861328125, -2.0849609375, -1.82684326171875, -1.5687255859375, -1.31060791015625, -1.052490234375, -0.79437255859375, -0.5362548828125, -0.27813720703125, -0.02001953125, 0.23809814453125, 0.4962158203125, 0.75433349609375, 1.012451171875, 1.27056884765625, 1.5286865234375, 1.78680419921875, 2.044921875, 2.30303955078125, 2.5611572265625, 2.81927490234375, 3.077392578125, 3.33551025390625, 3.5936279296875, 3.85174560546875, 4.10986328125, 4.36798095703125, 4.6260986328125, 4.88421630859375, 5.142333984375, 5.40045166015625, 5.6585693359375, 5.91668701171875, 6.1748046875, 6.43292236328125, 6.6910400390625, 6.94915771484375, 7.207275390625, 7.46539306640625, 7.7235107421875, 7.98162841796875, 8.23974609375, 8.49786376953125, 8.7559814453125, 9.01409912109375, 9.272216796875, 9.53033447265625, 9.7884521484375, 10.04656982421875, 10.3046875]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 5.0, 16.0, 7.0, 15.0, 18.0, 17.0, 14.0, 16.0, 28.0, 24.0, 29.0, 42.0, 23.0, 48.0, 55.0, 56.0, 36.0, 61.0, 40.0, 53.0, 58.0, 47.0, 47.0, 36.0, 28.0, 33.0, 26.0, 20.0, 14.0, 17.0, 14.0, 14.0, 11.0, 2.0, 10.0, 6.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.085845947265625, -21.354745864868164, -20.623647689819336, -19.892547607421875, -19.161447525024414, -18.430347442626953, -17.699249267578125, -16.968149185180664, -16.237049102783203, -15.505949974060059, -14.774849891662598, -14.043750762939453, -13.312650680541992, -12.581551551818848, -11.850452423095703, -11.119352340698242, -10.388254165649414, -9.65715503692627, -8.926054954528809, -8.194955825805664, -7.463856220245361, -6.732756614685059, -6.001657485961914, -5.270557880401611, -4.539458274841309, -3.808358669281006, -3.0772593021392822, -2.3461599349975586, -1.6150603294372559, -0.8839607238769531, -0.1528615951538086, 0.5782380104064941, 1.3093376159667969, 2.0404372215270996, 2.7715365886688232, 3.502635955810547, 4.23373556137085, 4.964835166931152, 5.695934295654297, 6.4270339012146, 7.158133506774902, 7.889233112335205, 8.620332717895508, 9.351431846618652, 10.082530975341797, 10.813631057739258, 11.544730186462402, 12.275829315185547, 13.006929397583008, 13.738028526306152, 14.469128608703613, 15.200227737426758, 15.931327819824219, 16.662425994873047, 17.393526077270508, 18.12462615966797, 18.855724334716797, 19.586824417114258, 20.317922592163086, 21.049022674560547, 21.780122756958008, 22.51122283935547, 23.242321014404297, 23.973421096801758, 24.70452117919922]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 8.0, 7.0, 3.0, 11.0, 15.0, 13.0, 18.0, 22.0, 15.0, 21.0, 23.0, 29.0, 35.0, 24.0, 32.0, 37.0, 23.0, 35.0, 40.0, 36.0, 44.0, 33.0, 43.0, 44.0, 36.0, 28.0, 30.0, 32.0, 39.0, 31.0, 29.0, 30.0, 15.0, 21.0, 15.0, 19.0, 12.0, 9.0, 7.0, 10.0, 8.0, 3.0, 3.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-28.8968505859375, -27.958961486816406, -27.021072387695312, -26.08318328857422, -25.145292282104492, -24.2074031829834, -23.269514083862305, -22.33162498474121, -21.393733978271484, -20.45584487915039, -19.517955780029297, -18.580066680908203, -17.642175674438477, -16.704286575317383, -15.766397476196289, -14.828508377075195, -13.890619277954102, -12.952730178833008, -12.014840126037598, -11.076951026916504, -10.139060974121094, -9.201171875, -8.263282775878906, -7.325393199920654, -6.387503623962402, -5.44961404800415, -4.511724472045898, -3.5738353729248047, -2.6359457969665527, -1.6980562210083008, -0.760167121887207, 0.17772245407104492, 1.115610122680664, 2.053499698638916, 2.991389036178589, 3.9292783737182617, 4.867167949676514, 5.805057525634766, 6.742946624755859, 7.680836200714111, 8.618725776672363, 9.556614875793457, 10.494504928588867, 11.432394027709961, 12.370283126831055, 13.308173179626465, 14.246062278747559, 15.183952331542969, 16.121841430664062, 17.059730529785156, 17.99761962890625, 18.935508728027344, 19.87339973449707, 20.811288833618164, 21.749177932739258, 22.68706703186035, 23.624958038330078, 24.562847137451172, 25.500736236572266, 26.43862533569336, 27.376516342163086, 28.31440544128418, 29.252294540405273, 30.190183639526367, 31.12807273864746]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 8.0, 13.0, 30.0, 45.0, 70.0, 132.0, 223.0, 342.0, 546.0, 915.0, 1531.0, 2601.0, 4367.0, 7348.0, 12868.0, 22292.0, 38971.0, 67808.0, 117602.0, 201687.0, 324878.0, 478329.0, 610866.0, 649698.0, 568915.0, 419756.0, 273884.0, 165495.0, 95840.0, 54649.0, 30515.0, 17409.0, 10023.0, 5873.0, 3388.0, 2081.0, 1192.0, 804.0, 480.0, 308.0, 170.0, 104.0, 87.0, 68.0, 28.0, 25.0, 10.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-19.46875, -18.865966796875, -18.26318359375, -17.660400390625, -17.0576171875, -16.454833984375, -15.85205078125, -15.249267578125, -14.646484375, -14.043701171875, -13.44091796875, -12.838134765625, -12.2353515625, -11.632568359375, -11.02978515625, -10.427001953125, -9.82421875, -9.221435546875, -8.61865234375, -8.015869140625, -7.4130859375, -6.810302734375, -6.20751953125, -5.604736328125, -5.001953125, -4.399169921875, -3.79638671875, -3.193603515625, -2.5908203125, -1.988037109375, -1.38525390625, -0.782470703125, -0.1796875, 0.423095703125, 1.02587890625, 1.628662109375, 2.2314453125, 2.834228515625, 3.43701171875, 4.039794921875, 4.642578125, 5.245361328125, 5.84814453125, 6.450927734375, 7.0537109375, 7.656494140625, 8.25927734375, 8.862060546875, 9.46484375, 10.067626953125, 10.67041015625, 11.273193359375, 11.8759765625, 12.478759765625, 13.08154296875, 13.684326171875, 14.287109375, 14.889892578125, 15.49267578125, 16.095458984375, 16.6982421875, 17.301025390625, 17.90380859375, 18.506591796875, 19.109375]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 10.0, 7.0, 9.0, 12.0, 17.0, 17.0, 16.0, 18.0, 19.0, 25.0, 28.0, 36.0, 31.0, 34.0, 32.0, 22.0, 36.0, 38.0, 55.0, 40.0, 37.0, 36.0, 38.0, 32.0, 33.0, 43.0, 33.0, 34.0, 36.0, 22.0, 29.0, 23.0, 24.0, 10.0, 9.0, 18.0, 12.0, 7.0, 4.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.203125, -20.44091796875, -19.6787109375, -18.91650390625, -18.154296875, -17.39208984375, -16.6298828125, -15.86767578125, -15.10546875, -14.34326171875, -13.5810546875, -12.81884765625, -12.056640625, -11.29443359375, -10.5322265625, -9.77001953125, -9.0078125, -8.24560546875, -7.4833984375, -6.72119140625, -5.958984375, -5.19677734375, -4.4345703125, -3.67236328125, -2.91015625, -2.14794921875, -1.3857421875, -0.62353515625, 0.138671875, 0.90087890625, 1.6630859375, 2.42529296875, 3.1875, 3.94970703125, 4.7119140625, 5.47412109375, 6.236328125, 6.99853515625, 7.7607421875, 8.52294921875, 9.28515625, 10.04736328125, 10.8095703125, 11.57177734375, 12.333984375, 13.09619140625, 13.8583984375, 14.62060546875, 15.3828125, 16.14501953125, 16.9072265625, 17.66943359375, 18.431640625, 19.19384765625, 19.9560546875, 20.71826171875, 21.48046875, 22.24267578125, 23.0048828125, 23.76708984375, 24.529296875, 25.29150390625, 26.0537109375, 26.81591796875, 27.578125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 10.0, 17.0, 37.0, 46.0, 93.0, 128.0, 215.0, 387.0, 639.0, 1052.0, 1916.0, 3113.0, 5409.0, 9453.0, 16877.0, 29537.0, 52510.0, 89866.0, 151007.0, 244282.0, 364686.0, 496457.0, 590157.0, 594229.0, 511619.0, 383884.0, 257991.0, 161654.0, 96707.0, 55908.0, 32303.0, 17876.0, 10228.0, 5812.0, 3404.0, 2011.0, 1138.0, 636.0, 381.0, 212.0, 161.0, 81.0, 55.0, 36.0, 27.0, 13.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-20.859375, -20.228515625, -19.59765625, -18.966796875, -18.3359375, -17.705078125, -17.07421875, -16.443359375, -15.8125, -15.181640625, -14.55078125, -13.919921875, -13.2890625, -12.658203125, -12.02734375, -11.396484375, -10.765625, -10.134765625, -9.50390625, -8.873046875, -8.2421875, -7.611328125, -6.98046875, -6.349609375, -5.71875, -5.087890625, -4.45703125, -3.826171875, -3.1953125, -2.564453125, -1.93359375, -1.302734375, -0.671875, -0.041015625, 0.58984375, 1.220703125, 1.8515625, 2.482421875, 3.11328125, 3.744140625, 4.375, 5.005859375, 5.63671875, 6.267578125, 6.8984375, 7.529296875, 8.16015625, 8.791015625, 9.421875, 10.052734375, 10.68359375, 11.314453125, 11.9453125, 12.576171875, 13.20703125, 13.837890625, 14.46875, 15.099609375, 15.73046875, 16.361328125, 16.9921875, 17.623046875, 18.25390625, 18.884765625, 19.515625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 2.0, 6.0, 8.0, 6.0, 13.0, 16.0, 28.0, 30.0, 33.0, 44.0, 54.0, 74.0, 101.0, 102.0, 116.0, 165.0, 170.0, 192.0, 201.0, 220.0, 229.0, 238.0, 242.0, 234.0, 217.0, 225.0, 208.0, 167.0, 137.0, 108.0, 119.0, 95.0, 71.0, 44.0, 33.0, 31.0, 14.0, 20.0, 12.0, 17.0, 13.0, 7.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.25, -10.8980712890625, -10.546142578125, -10.1942138671875, -9.84228515625, -9.4903564453125, -9.138427734375, -8.7864990234375, -8.4345703125, -8.0826416015625, -7.730712890625, -7.3787841796875, -7.02685546875, -6.6749267578125, -6.322998046875, -5.9710693359375, -5.619140625, -5.2672119140625, -4.915283203125, -4.5633544921875, -4.21142578125, -3.8594970703125, -3.507568359375, -3.1556396484375, -2.8037109375, -2.4517822265625, -2.099853515625, -1.7479248046875, -1.39599609375, -1.0440673828125, -0.692138671875, -0.3402099609375, 0.01171875, 0.3636474609375, 0.715576171875, 1.0675048828125, 1.41943359375, 1.7713623046875, 2.123291015625, 2.4752197265625, 2.8271484375, 3.1790771484375, 3.531005859375, 3.8829345703125, 4.23486328125, 4.5867919921875, 4.938720703125, 5.2906494140625, 5.642578125, 5.9945068359375, 6.346435546875, 6.6983642578125, 7.05029296875, 7.4022216796875, 7.754150390625, 8.1060791015625, 8.4580078125, 8.8099365234375, 9.161865234375, 9.5137939453125, 9.86572265625, 10.2176513671875, 10.569580078125, 10.9215087890625, 11.2734375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 6.0, 4.0, 4.0, 5.0, 4.0, 7.0, 10.0, 5.0, 5.0, 12.0, 19.0, 17.0, 22.0, 25.0, 24.0, 33.0, 37.0, 42.0, 39.0, 61.0, 47.0, 50.0, 36.0, 45.0, 39.0, 50.0, 43.0, 34.0, 38.0, 39.0, 35.0, 28.0, 19.0, 18.0, 21.0, 17.0, 21.0, 13.0, 6.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.41901206970215, -19.735322952270508, -19.051633834838867, -18.367944717407227, -17.684255599975586, -17.000566482543945, -16.316879272460938, -15.63318920135498, -14.94950008392334, -14.2658109664917, -13.582121849060059, -12.898433685302734, -12.214744567871094, -11.531055450439453, -10.847366333007812, -10.163677215576172, -9.479988098144531, -8.79629898071289, -8.11260986328125, -7.428921222686768, -6.745232105255127, -6.061542987823486, -5.377854347229004, -4.694165229797363, -4.010476112365723, -3.326786994934082, -2.6430981159210205, -1.959409236907959, -1.2757201194763184, -0.5920310020446777, 0.09165763854980469, 0.7753467559814453, 1.4590339660644531, 2.1427230834960938, 2.8264119625091553, 3.510100841522217, 4.193789958953857, 4.877479076385498, 5.5611677169799805, 6.244856834411621, 6.928545951843262, 7.612235069274902, 8.295924186706543, 8.979612350463867, 9.663301467895508, 10.346990585327148, 11.030679702758789, 11.71436882019043, 12.39805793762207, 13.081747055053711, 13.765436172485352, 14.449125289916992, 15.132814407348633, 15.816503524780273, 16.50019073486328, 17.183879852294922, 17.867568969726562, 18.551258087158203, 19.234947204589844, 19.918636322021484, 20.602325439453125, 21.286014556884766, 21.969703674316406, 22.653392791748047, 23.337081909179688]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 6.0, 4.0, 7.0, 5.0, 4.0, 13.0, 10.0, 11.0, 12.0, 12.0, 14.0, 17.0, 16.0, 22.0, 28.0, 33.0, 35.0, 19.0, 29.0, 27.0, 37.0, 44.0, 29.0, 34.0, 41.0, 41.0, 44.0, 44.0, 32.0, 22.0, 35.0, 38.0, 29.0, 21.0, 30.0, 33.0, 18.0, 15.0, 18.0, 10.0, 15.0, 6.0, 13.0, 8.0, 8.0, 7.0, 5.0, 3.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.08544158935547, -24.21485710144043, -23.344270706176758, -22.47368621826172, -21.60310173034668, -20.73251724243164, -19.86193084716797, -18.99134635925293, -18.12076187133789, -17.25017738342285, -16.37959098815918, -15.50900650024414, -14.638422012329102, -13.767836570739746, -12.89725112915039, -12.026666641235352, -11.15608024597168, -10.285494804382324, -9.414910316467285, -8.54432487487793, -7.673739910125732, -6.803154945373535, -5.93256950378418, -5.061984539031982, -4.191399574279785, -3.320814609527588, -2.4502294063568115, -1.5796442031860352, -0.7090592384338379, 0.16152572631835938, 1.0321111679077148, 1.902696132659912, 2.7732791900634766, 3.643864154815674, 4.514449119567871, 5.385034561157227, 6.255619525909424, 7.126204490661621, 7.996789932250977, 8.867374420166016, 9.737959861755371, 10.608545303344727, 11.479129791259766, 12.349715232849121, 13.220300674438477, 14.090885162353516, 14.961470603942871, 15.832056045532227, 16.702640533447266, 17.573225021362305, 18.443811416625977, 19.314395904541016, 20.184980392456055, 21.055564880371094, 21.926151275634766, 22.796735763549805, 23.667320251464844, 24.537904739379883, 25.408491134643555, 26.279075622558594, 27.149660110473633, 28.020244598388672, 28.890830993652344, 29.761415481567383, 30.632001876831055]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 8.0, 9.0, 13.0, 20.0, 40.0, 42.0, 65.0, 105.0, 152.0, 231.0, 342.0, 573.0, 891.0, 1498.0, 2663.0, 4792.0, 8801.0, 16295.0, 30236.0, 55988.0, 98297.0, 155512.0, 198151.0, 181405.0, 127048.0, 74736.0, 41039.0, 22240.0, 12140.0, 6608.0, 3510.0, 2024.0, 1190.0, 664.0, 425.0, 271.0, 148.0, 134.0, 70.0, 53.0, 38.0, 25.0, 20.0, 8.0, 5.0, 8.0, 7.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.390625, -14.9058837890625, -14.421142578125, -13.9364013671875, -13.45166015625, -12.9669189453125, -12.482177734375, -11.9974365234375, -11.5126953125, -11.0279541015625, -10.543212890625, -10.0584716796875, -9.57373046875, -9.0889892578125, -8.604248046875, -8.1195068359375, -7.634765625, -7.1500244140625, -6.665283203125, -6.1805419921875, -5.69580078125, -5.2110595703125, -4.726318359375, -4.2415771484375, -3.7568359375, -3.2720947265625, -2.787353515625, -2.3026123046875, -1.81787109375, -1.3331298828125, -0.848388671875, -0.3636474609375, 0.12109375, 0.6058349609375, 1.090576171875, 1.5753173828125, 2.06005859375, 2.5447998046875, 3.029541015625, 3.5142822265625, 3.9990234375, 4.4837646484375, 4.968505859375, 5.4532470703125, 5.93798828125, 6.4227294921875, 6.907470703125, 7.3922119140625, 7.876953125, 8.3616943359375, 8.846435546875, 9.3311767578125, 9.81591796875, 10.3006591796875, 10.785400390625, 11.2701416015625, 11.7548828125, 12.2396240234375, 12.724365234375, 13.2091064453125, 13.69384765625, 14.1785888671875, 14.663330078125, 15.1480712890625, 15.6328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 6.0, 5.0, 3.0, 10.0, 12.0, 14.0, 16.0, 19.0, 8.0, 18.0, 24.0, 34.0, 30.0, 25.0, 21.0, 27.0, 34.0, 38.0, 39.0, 46.0, 38.0, 33.0, 40.0, 49.0, 42.0, 32.0, 29.0, 34.0, 29.0, 31.0, 37.0, 33.0, 17.0, 14.0, 12.0, 24.0, 12.0, 14.0, 10.0, 7.0, 9.0, 8.0, 3.0, 5.0, 3.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.1875, -24.27783203125, -23.3681640625, -22.45849609375, -21.548828125, -20.63916015625, -19.7294921875, -18.81982421875, -17.91015625, -17.00048828125, -16.0908203125, -15.18115234375, -14.271484375, -13.36181640625, -12.4521484375, -11.54248046875, -10.6328125, -9.72314453125, -8.8134765625, -7.90380859375, -6.994140625, -6.08447265625, -5.1748046875, -4.26513671875, -3.35546875, -2.44580078125, -1.5361328125, -0.62646484375, 0.283203125, 1.19287109375, 2.1025390625, 3.01220703125, 3.921875, 4.83154296875, 5.7412109375, 6.65087890625, 7.560546875, 8.47021484375, 9.3798828125, 10.28955078125, 11.19921875, 12.10888671875, 13.0185546875, 13.92822265625, 14.837890625, 15.74755859375, 16.6572265625, 17.56689453125, 18.4765625, 19.38623046875, 20.2958984375, 21.20556640625, 22.115234375, 23.02490234375, 23.9345703125, 24.84423828125, 25.75390625, 26.66357421875, 27.5732421875, 28.48291015625, 29.392578125, 30.30224609375, 31.2119140625, 32.12158203125, 33.03125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 17.0, 22.0, 24.0, 59.0, 65.0, 104.0, 177.0, 281.0, 457.0, 718.0, 1243.0, 2073.0, 3562.0, 6700.0, 12326.0, 23997.0, 47400.0, 93701.0, 170788.0, 237589.0, 202225.0, 118432.0, 61075.0, 30727.0, 15773.0, 8257.0, 4417.0, 2591.0, 1460.0, 813.0, 557.0, 312.0, 215.0, 127.0, 95.0, 52.0, 40.0, 27.0, 24.0, 13.0, 6.0, 6.0, 6.0, 3.0, 0.0, 0.0, 2.0], "bins": [-20.78125, -20.2147216796875, -19.648193359375, -19.0816650390625, -18.51513671875, -17.9486083984375, -17.382080078125, -16.8155517578125, -16.2490234375, -15.6824951171875, -15.115966796875, -14.5494384765625, -13.98291015625, -13.4163818359375, -12.849853515625, -12.2833251953125, -11.716796875, -11.1502685546875, -10.583740234375, -10.0172119140625, -9.45068359375, -8.8841552734375, -8.317626953125, -7.7510986328125, -7.1845703125, -6.6180419921875, -6.051513671875, -5.4849853515625, -4.91845703125, -4.3519287109375, -3.785400390625, -3.2188720703125, -2.65234375, -2.0858154296875, -1.519287109375, -0.9527587890625, -0.38623046875, 0.1802978515625, 0.746826171875, 1.3133544921875, 1.8798828125, 2.4464111328125, 3.012939453125, 3.5794677734375, 4.14599609375, 4.7125244140625, 5.279052734375, 5.8455810546875, 6.412109375, 6.9786376953125, 7.545166015625, 8.1116943359375, 8.67822265625, 9.2447509765625, 9.811279296875, 10.3778076171875, 10.9443359375, 11.5108642578125, 12.077392578125, 12.6439208984375, 13.21044921875, 13.7769775390625, 14.343505859375, 14.9100341796875, 15.4765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 6.0, 4.0, 6.0, 13.0, 12.0, 12.0, 13.0, 16.0, 20.0, 25.0, 38.0, 25.0, 29.0, 26.0, 36.0, 23.0, 30.0, 25.0, 39.0, 43.0, 44.0, 38.0, 38.0, 46.0, 36.0, 30.0, 26.0, 20.0, 30.0, 23.0, 35.0, 30.0, 23.0, 16.0, 18.0, 16.0, 20.0, 14.0, 9.0, 11.0, 6.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-17.609375, -17.038818359375, -16.46826171875, -15.897705078125, -15.3271484375, -14.756591796875, -14.18603515625, -13.615478515625, -13.044921875, -12.474365234375, -11.90380859375, -11.333251953125, -10.7626953125, -10.192138671875, -9.62158203125, -9.051025390625, -8.48046875, -7.909912109375, -7.33935546875, -6.768798828125, -6.1982421875, -5.627685546875, -5.05712890625, -4.486572265625, -3.916015625, -3.345458984375, -2.77490234375, -2.204345703125, -1.6337890625, -1.063232421875, -0.49267578125, 0.077880859375, 0.6484375, 1.218994140625, 1.78955078125, 2.360107421875, 2.9306640625, 3.501220703125, 4.07177734375, 4.642333984375, 5.212890625, 5.783447265625, 6.35400390625, 6.924560546875, 7.4951171875, 8.065673828125, 8.63623046875, 9.206787109375, 9.77734375, 10.347900390625, 10.91845703125, 11.489013671875, 12.0595703125, 12.630126953125, 13.20068359375, 13.771240234375, 14.341796875, 14.912353515625, 15.48291015625, 16.053466796875, 16.6240234375, 17.194580078125, 17.76513671875, 18.335693359375, 18.90625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 17.0, 22.0, 27.0, 24.0, 35.0, 54.0, 71.0, 95.0, 129.0, 200.0, 323.0, 472.0, 710.0, 1241.0, 2101.0, 3974.0, 7976.0, 19279.0, 57207.0, 204214.0, 443411.0, 210458.0, 58911.0, 19775.0, 8249.0, 3956.0, 2095.0, 1223.0, 759.0, 488.0, 305.0, 215.0, 146.0, 113.0, 94.0, 50.0, 42.0, 19.0, 18.0, 11.0, 6.0, 10.0, 5.0, 5.0, 7.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.34375, -13.8885498046875, -13.433349609375, -12.9781494140625, -12.52294921875, -12.0677490234375, -11.612548828125, -11.1573486328125, -10.7021484375, -10.2469482421875, -9.791748046875, -9.3365478515625, -8.88134765625, -8.4261474609375, -7.970947265625, -7.5157470703125, -7.060546875, -6.6053466796875, -6.150146484375, -5.6949462890625, -5.23974609375, -4.7845458984375, -4.329345703125, -3.8741455078125, -3.4189453125, -2.9637451171875, -2.508544921875, -2.0533447265625, -1.59814453125, -1.1429443359375, -0.687744140625, -0.2325439453125, 0.22265625, 0.6778564453125, 1.133056640625, 1.5882568359375, 2.04345703125, 2.4986572265625, 2.953857421875, 3.4090576171875, 3.8642578125, 4.3194580078125, 4.774658203125, 5.2298583984375, 5.68505859375, 6.1402587890625, 6.595458984375, 7.0506591796875, 7.505859375, 7.9610595703125, 8.416259765625, 8.8714599609375, 9.32666015625, 9.7818603515625, 10.237060546875, 10.6922607421875, 11.1474609375, 11.6026611328125, 12.057861328125, 12.5130615234375, 12.96826171875, 13.4234619140625, 13.878662109375, 14.3338623046875, 14.7890625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 8.0, 13.0, 16.0, 30.0, 26.0, 57.0, 68.0, 98.0, 133.0, 149.0, 114.0, 87.0, 67.0, 49.0, 24.0, 15.0, 11.0, 7.0, 4.0, 4.0, 3.0, 7.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008373260498046875, -0.0008054673671722412, -0.0007736086845397949, -0.0007417500019073486, -0.0007098913192749023, -0.0006780326366424561, -0.0006461739540100098, -0.0006143152713775635, -0.0005824565887451172, -0.0005505979061126709, -0.0005187392234802246, -0.0004868805408477783, -0.00045502185821533203, -0.00042316317558288574, -0.00039130449295043945, -0.00035944581031799316, -0.0003275871276855469, -0.0002957284450531006, -0.0002638697624206543, -0.000232011079788208, -0.00020015239715576172, -0.00016829371452331543, -0.00013643503189086914, -0.00010457634925842285, -7.271766662597656e-05, -4.0858983993530273e-05, -9.000301361083984e-06, 2.2858381271362305e-05, 5.4717063903808594e-05, 8.657574653625488e-05, 0.00011843442916870117, 0.00015029311180114746, 0.00018215179443359375, 0.00021401047706604004, 0.00024586915969848633, 0.0002777278423309326, 0.0003095865249633789, 0.0003414452075958252, 0.0003733038902282715, 0.0004051625728607178, 0.00043702125549316406, 0.00046887993812561035, 0.0005007386207580566, 0.0005325973033905029, 0.0005644559860229492, 0.0005963146686553955, 0.0006281733512878418, 0.0006600320339202881, 0.0006918907165527344, 0.0007237493991851807, 0.000755608081817627, 0.0007874667644500732, 0.0008193254470825195, 0.0008511841297149658, 0.0008830428123474121, 0.0009149014949798584, 0.0009467601776123047, 0.000978618860244751, 0.0010104775428771973, 0.0010423362255096436, 0.0010741949081420898, 0.0011060535907745361, 0.0011379122734069824, 0.0011697709560394287, 0.001201629638671875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 9.0, 2.0, 8.0, 5.0, 11.0, 10.0, 27.0, 21.0, 29.0, 48.0, 70.0, 110.0, 147.0, 218.0, 320.0, 452.0, 724.0, 1110.0, 1728.0, 2769.0, 5178.0, 10748.0, 25532.0, 67579.0, 180000.0, 325048.0, 252202.0, 104374.0, 38303.0, 15316.0, 6892.0, 3529.0, 2055.0, 1291.0, 839.0, 527.0, 388.0, 271.0, 179.0, 146.0, 107.0, 72.0, 44.0, 37.0, 25.0, 19.0, 17.0, 6.0, 5.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.1875, -11.77734375, -11.3671875, -10.95703125, -10.546875, -10.13671875, -9.7265625, -9.31640625, -8.90625, -8.49609375, -8.0859375, -7.67578125, -7.265625, -6.85546875, -6.4453125, -6.03515625, -5.625, -5.21484375, -4.8046875, -4.39453125, -3.984375, -3.57421875, -3.1640625, -2.75390625, -2.34375, -1.93359375, -1.5234375, -1.11328125, -0.703125, -0.29296875, 0.1171875, 0.52734375, 0.9375, 1.34765625, 1.7578125, 2.16796875, 2.578125, 2.98828125, 3.3984375, 3.80859375, 4.21875, 4.62890625, 5.0390625, 5.44921875, 5.859375, 6.26953125, 6.6796875, 7.08984375, 7.5, 7.91015625, 8.3203125, 8.73046875, 9.140625, 9.55078125, 9.9609375, 10.37109375, 10.78125, 11.19140625, 11.6015625, 12.01171875, 12.421875, 12.83203125, 13.2421875, 13.65234375, 14.0625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 10.0, 19.0, 16.0, 20.0, 24.0, 40.0, 47.0, 58.0, 86.0, 98.0, 77.0, 101.0, 100.0, 79.0, 49.0, 40.0, 33.0, 24.0, 18.0, 9.0, 9.0, 7.0, 8.0, 6.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.64453125, -5.45361328125, -5.2626953125, -5.07177734375, -4.880859375, -4.68994140625, -4.4990234375, -4.30810546875, -4.1171875, -3.92626953125, -3.7353515625, -3.54443359375, -3.353515625, -3.16259765625, -2.9716796875, -2.78076171875, -2.58984375, -2.39892578125, -2.2080078125, -2.01708984375, -1.826171875, -1.63525390625, -1.4443359375, -1.25341796875, -1.0625, -0.87158203125, -0.6806640625, -0.48974609375, -0.298828125, -0.10791015625, 0.0830078125, 0.27392578125, 0.46484375, 0.65576171875, 0.8466796875, 1.03759765625, 1.228515625, 1.41943359375, 1.6103515625, 1.80126953125, 1.9921875, 2.18310546875, 2.3740234375, 2.56494140625, 2.755859375, 2.94677734375, 3.1376953125, 3.32861328125, 3.51953125, 3.71044921875, 3.9013671875, 4.09228515625, 4.283203125, 4.47412109375, 4.6650390625, 4.85595703125, 5.046875, 5.23779296875, 5.4287109375, 5.61962890625, 5.810546875, 6.00146484375, 6.1923828125, 6.38330078125, 6.57421875]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 5.0, 4.0, 4.0, 5.0, 9.0, 8.0, 11.0, 7.0, 8.0, 18.0, 15.0, 23.0, 26.0, 25.0, 29.0, 37.0, 43.0, 44.0, 61.0, 39.0, 53.0, 45.0, 45.0, 51.0, 42.0, 45.0, 36.0, 31.0, 46.0, 28.0, 22.0, 17.0, 24.0, 26.0, 20.0, 13.0, 9.0, 8.0, 3.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.514890670776367, -19.821317672729492, -19.127744674682617, -18.434171676635742, -17.740598678588867, -17.047025680541992, -16.35345458984375, -15.659880638122559, -14.966307640075684, -14.272734642028809, -13.579161643981934, -12.885589599609375, -12.1920166015625, -11.498443603515625, -10.80487060546875, -10.111297607421875, -9.417724609375, -8.724151611328125, -8.03057861328125, -7.337006092071533, -6.643433094024658, -5.949860095977783, -5.256287574768066, -4.562714576721191, -3.8691415786743164, -3.1755685806274414, -2.4819958209991455, -1.7884230613708496, -1.0948500633239746, -0.4012770652770996, 0.2922954559326172, 0.9858684539794922, 1.6794414520263672, 2.373014450073242, 3.066587209701538, 3.760159969329834, 4.453732967376709, 5.147305965423584, 5.840878486633301, 6.534451484680176, 7.228024482727051, 7.921597480773926, 8.6151704788208, 9.30874252319336, 10.002315521240234, 10.69588851928711, 11.389461517333984, 12.08303451538086, 12.776607513427734, 13.47018051147461, 14.163753509521484, 14.85732650756836, 15.550899505615234, 16.24447250366211, 16.938045501708984, 17.63161849975586, 18.325191497802734, 19.01876449584961, 19.712337493896484, 20.40591049194336, 21.099483489990234, 21.79305648803711, 22.486629486083984, 23.18020248413086, 23.8737735748291]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 2.0, 9.0, 7.0, 9.0, 4.0, 10.0, 8.0, 14.0, 14.0, 15.0, 16.0, 21.0, 25.0, 26.0, 22.0, 28.0, 30.0, 35.0, 32.0, 39.0, 24.0, 35.0, 43.0, 35.0, 38.0, 51.0, 36.0, 38.0, 25.0, 29.0, 25.0, 37.0, 27.0, 26.0, 37.0, 23.0, 12.0, 16.0, 16.0, 8.0, 11.0, 8.0, 8.0, 11.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.788162231445312, -22.935501098632812, -22.08283805847168, -21.23017692565918, -20.377513885498047, -19.524852752685547, -18.672191619873047, -17.819528579711914, -16.96686553955078, -16.11420440673828, -15.261541366577148, -14.408880233764648, -13.556217193603516, -12.703556060791016, -11.8508939743042, -10.998231887817383, -10.145570755004883, -9.292908668518066, -8.44024658203125, -7.587584972381592, -6.734922885894775, -5.882260799407959, -5.029599189758301, -4.176937103271484, -3.324275016784668, -2.4716129302978516, -1.6189510822296143, -0.766289234161377, 0.08637285232543945, 0.9390349388122559, 1.791696548461914, 2.6443586349487305, 3.497018814086914, 4.3496809005737305, 5.202342987060547, 6.055004596710205, 6.9076666831970215, 7.760328769683838, 8.612990379333496, 9.465652465820312, 10.318314552307129, 11.170976638793945, 12.023638725280762, 12.876300811767578, 13.728961944580078, 14.581624984741211, 15.434286117553711, 16.286949157714844, 17.139610290527344, 17.992271423339844, 18.844934463500977, 19.697595596313477, 20.55025863647461, 21.40291976928711, 22.25558090209961, 23.108243942260742, 23.960906982421875, 24.813568115234375, 25.666231155395508, 26.518892288208008, 27.37155532836914, 28.22421646118164, 29.07687759399414, 29.929540634155273, 30.782201766967773]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 11.0, 17.0, 26.0, 38.0, 61.0, 94.0, 165.0, 213.0, 343.0, 486.0, 709.0, 1130.0, 1800.0, 2560.0, 3778.0, 5619.0, 8248.0, 12354.0, 18316.0, 25882.0, 35867.0, 48735.0, 62570.0, 77795.0, 90969.0, 100383.0, 101916.0, 96898.0, 84785.0, 70993.0, 55524.0, 41841.0, 30540.0, 21524.0, 15077.0, 10355.0, 7023.0, 4672.0, 3000.0, 2116.0, 1351.0, 920.0, 594.0, 425.0, 287.0, 177.0, 121.0, 94.0, 53.0, 34.0, 21.0, 14.0, 12.0, 2.0, 4.0, 3.0, 4.0, 2.0], "bins": [-13.34375, -12.9300537109375, -12.516357421875, -12.1026611328125, -11.68896484375, -11.2752685546875, -10.861572265625, -10.4478759765625, -10.0341796875, -9.6204833984375, -9.206787109375, -8.7930908203125, -8.37939453125, -7.9656982421875, -7.552001953125, -7.1383056640625, -6.724609375, -6.3109130859375, -5.897216796875, -5.4835205078125, -5.06982421875, -4.6561279296875, -4.242431640625, -3.8287353515625, -3.4150390625, -3.0013427734375, -2.587646484375, -2.1739501953125, -1.76025390625, -1.3465576171875, -0.932861328125, -0.5191650390625, -0.10546875, 0.3082275390625, 0.721923828125, 1.1356201171875, 1.54931640625, 1.9630126953125, 2.376708984375, 2.7904052734375, 3.2041015625, 3.6177978515625, 4.031494140625, 4.4451904296875, 4.85888671875, 5.2725830078125, 5.686279296875, 6.0999755859375, 6.513671875, 6.9273681640625, 7.341064453125, 7.7547607421875, 8.16845703125, 8.5821533203125, 8.995849609375, 9.4095458984375, 9.8232421875, 10.2369384765625, 10.650634765625, 11.0643310546875, 11.47802734375, 11.8917236328125, 12.305419921875, 12.7191162109375, 13.1328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 9.0, 9.0, 14.0, 11.0, 14.0, 13.0, 22.0, 14.0, 17.0, 31.0, 22.0, 39.0, 36.0, 33.0, 51.0, 25.0, 34.0, 43.0, 41.0, 42.0, 42.0, 41.0, 39.0, 29.0, 32.0, 34.0, 37.0, 29.0, 26.0, 22.0, 20.0, 21.0, 17.0, 17.0, 13.0, 13.0, 7.0, 3.0, 11.0, 4.0, 6.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.25, -23.35498046875, -22.4599609375, -21.56494140625, -20.669921875, -19.77490234375, -18.8798828125, -17.98486328125, -17.08984375, -16.19482421875, -15.2998046875, -14.40478515625, -13.509765625, -12.61474609375, -11.7197265625, -10.82470703125, -9.9296875, -9.03466796875, -8.1396484375, -7.24462890625, -6.349609375, -5.45458984375, -4.5595703125, -3.66455078125, -2.76953125, -1.87451171875, -0.9794921875, -0.08447265625, 0.810546875, 1.70556640625, 2.6005859375, 3.49560546875, 4.390625, 5.28564453125, 6.1806640625, 7.07568359375, 7.970703125, 8.86572265625, 9.7607421875, 10.65576171875, 11.55078125, 12.44580078125, 13.3408203125, 14.23583984375, 15.130859375, 16.02587890625, 16.9208984375, 17.81591796875, 18.7109375, 19.60595703125, 20.5009765625, 21.39599609375, 22.291015625, 23.18603515625, 24.0810546875, 24.97607421875, 25.87109375, 26.76611328125, 27.6611328125, 28.55615234375, 29.451171875, 30.34619140625, 31.2412109375, 32.13623046875, 33.03125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 16.0, 12.0, 14.0, 39.0, 64.0, 61.0, 129.0, 168.0, 255.0, 404.0, 649.0, 1000.0, 1608.0, 2315.0, 3792.0, 5891.0, 9508.0, 14962.0, 23894.0, 37023.0, 56072.0, 79311.0, 104538.0, 124001.0, 131275.0, 122341.0, 101451.0, 76123.0, 53740.0, 35692.0, 22972.0, 14313.0, 9213.0, 5635.0, 3698.0, 2346.0, 1495.0, 885.0, 573.0, 393.0, 232.0, 165.0, 102.0, 61.0, 46.0, 31.0, 20.0, 11.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.109375, -17.55126953125, -16.9931640625, -16.43505859375, -15.876953125, -15.31884765625, -14.7607421875, -14.20263671875, -13.64453125, -13.08642578125, -12.5283203125, -11.97021484375, -11.412109375, -10.85400390625, -10.2958984375, -9.73779296875, -9.1796875, -8.62158203125, -8.0634765625, -7.50537109375, -6.947265625, -6.38916015625, -5.8310546875, -5.27294921875, -4.71484375, -4.15673828125, -3.5986328125, -3.04052734375, -2.482421875, -1.92431640625, -1.3662109375, -0.80810546875, -0.25, 0.30810546875, 0.8662109375, 1.42431640625, 1.982421875, 2.54052734375, 3.0986328125, 3.65673828125, 4.21484375, 4.77294921875, 5.3310546875, 5.88916015625, 6.447265625, 7.00537109375, 7.5634765625, 8.12158203125, 8.6796875, 9.23779296875, 9.7958984375, 10.35400390625, 10.912109375, 11.47021484375, 12.0283203125, 12.58642578125, 13.14453125, 13.70263671875, 14.2607421875, 14.81884765625, 15.376953125, 15.93505859375, 16.4931640625, 17.05126953125, 17.609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 3.0, 7.0, 7.0, 5.0, 13.0, 9.0, 14.0, 18.0, 15.0, 22.0, 23.0, 20.0, 26.0, 33.0, 25.0, 40.0, 46.0, 46.0, 45.0, 41.0, 52.0, 37.0, 30.0, 46.0, 52.0, 35.0, 32.0, 44.0, 35.0, 22.0, 30.0, 19.0, 21.0, 15.0, 16.0, 16.0, 13.0, 9.0, 5.0, 3.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.890625, -20.190673828125, -19.49072265625, -18.790771484375, -18.0908203125, -17.390869140625, -16.69091796875, -15.990966796875, -15.291015625, -14.591064453125, -13.89111328125, -13.191162109375, -12.4912109375, -11.791259765625, -11.09130859375, -10.391357421875, -9.69140625, -8.991455078125, -8.29150390625, -7.591552734375, -6.8916015625, -6.191650390625, -5.49169921875, -4.791748046875, -4.091796875, -3.391845703125, -2.69189453125, -1.991943359375, -1.2919921875, -0.592041015625, 0.10791015625, 0.807861328125, 1.5078125, 2.207763671875, 2.90771484375, 3.607666015625, 4.3076171875, 5.007568359375, 5.70751953125, 6.407470703125, 7.107421875, 7.807373046875, 8.50732421875, 9.207275390625, 9.9072265625, 10.607177734375, 11.30712890625, 12.007080078125, 12.70703125, 13.406982421875, 14.10693359375, 14.806884765625, 15.5068359375, 16.206787109375, 16.90673828125, 17.606689453125, 18.306640625, 19.006591796875, 19.70654296875, 20.406494140625, 21.1064453125, 21.806396484375, 22.50634765625, 23.206298828125, 23.90625]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 10.0, 7.0, 18.0, 37.0, 41.0, 65.0, 86.0, 131.0, 185.0, 258.0, 365.0, 534.0, 765.0, 1167.0, 1828.0, 2735.0, 4373.0, 7157.0, 11825.0, 20262.0, 36076.0, 64387.0, 111295.0, 168394.0, 197070.0, 165200.0, 107450.0, 61794.0, 34710.0, 19657.0, 11558.0, 6774.0, 4297.0, 2668.0, 1770.0, 1117.0, 789.0, 542.0, 349.0, 257.0, 152.0, 110.0, 88.0, 62.0, 42.0, 29.0, 21.0, 15.0, 13.0, 10.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-14.921875, -14.4622802734375, -14.002685546875, -13.5430908203125, -13.08349609375, -12.6239013671875, -12.164306640625, -11.7047119140625, -11.2451171875, -10.7855224609375, -10.325927734375, -9.8663330078125, -9.40673828125, -8.9471435546875, -8.487548828125, -8.0279541015625, -7.568359375, -7.1087646484375, -6.649169921875, -6.1895751953125, -5.72998046875, -5.2703857421875, -4.810791015625, -4.3511962890625, -3.8916015625, -3.4320068359375, -2.972412109375, -2.5128173828125, -2.05322265625, -1.5936279296875, -1.134033203125, -0.6744384765625, -0.21484375, 0.2447509765625, 0.704345703125, 1.1639404296875, 1.62353515625, 2.0831298828125, 2.542724609375, 3.0023193359375, 3.4619140625, 3.9215087890625, 4.381103515625, 4.8406982421875, 5.30029296875, 5.7598876953125, 6.219482421875, 6.6790771484375, 7.138671875, 7.5982666015625, 8.057861328125, 8.5174560546875, 8.97705078125, 9.4366455078125, 9.896240234375, 10.3558349609375, 10.8154296875, 11.2750244140625, 11.734619140625, 12.1942138671875, 12.65380859375, 13.1134033203125, 13.572998046875, 14.0325927734375, 14.4921875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 7.0, 12.0, 11.0, 14.0, 11.0, 14.0, 29.0, 30.0, 26.0, 48.0, 36.0, 51.0, 46.0, 57.0, 72.0, 64.0, 65.0, 67.0, 66.0, 45.0, 45.0, 34.0, 28.0, 26.0, 22.0, 20.0, 16.0, 12.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013151168823242188, -0.0012736916542053223, -0.0012322664260864258, -0.0011908411979675293, -0.0011494159698486328, -0.0011079907417297363, -0.0010665655136108398, -0.0010251402854919434, -0.0009837150573730469, -0.0009422898292541504, -0.0009008646011352539, -0.0008594393730163574, -0.0008180141448974609, -0.0007765889167785645, -0.000735163688659668, -0.0006937384605407715, -0.000652313232421875, -0.0006108880043029785, -0.000569462776184082, -0.0005280375480651855, -0.00048661231994628906, -0.0004451870918273926, -0.0004037618637084961, -0.0003623366355895996, -0.0003209114074707031, -0.00027948617935180664, -0.00023806095123291016, -0.00019663572311401367, -0.0001552104949951172, -0.0001137852668762207, -7.236003875732422e-05, -3.0934810638427734e-05, 1.049041748046875e-05, 5.1915645599365234e-05, 9.334087371826172e-05, 0.0001347661018371582, 0.0001761913299560547, 0.00021761655807495117, 0.00025904178619384766, 0.00030046701431274414, 0.0003418922424316406, 0.0003833174705505371, 0.0004247426986694336, 0.0004661679267883301, 0.0005075931549072266, 0.000549018383026123, 0.0005904436111450195, 0.000631868839263916, 0.0006732940673828125, 0.000714719295501709, 0.0007561445236206055, 0.000797569751739502, 0.0008389949798583984, 0.0008804202079772949, 0.0009218454360961914, 0.0009632706642150879, 0.0010046958923339844, 0.0010461211204528809, 0.0010875463485717773, 0.0011289715766906738, 0.0011703968048095703, 0.0012118220329284668, 0.0012532472610473633, 0.0012946724891662598, 0.0013360977172851562]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 8.0, 7.0, 15.0, 16.0, 33.0, 41.0, 56.0, 92.0, 102.0, 159.0, 196.0, 325.0, 429.0, 638.0, 895.0, 1312.0, 1910.0, 2837.0, 4295.0, 6555.0, 10085.0, 15931.0, 24733.0, 38872.0, 60328.0, 88548.0, 118603.0, 139950.0, 141830.0, 121807.0, 90883.0, 62703.0, 40676.0, 25714.0, 16529.0, 10623.0, 6929.0, 4388.0, 3064.0, 2007.0, 1415.0, 894.0, 644.0, 419.0, 341.0, 212.0, 170.0, 97.0, 87.0, 48.0, 30.0, 25.0, 25.0, 13.0, 12.0, 5.0, 3.0, 2.0, 2.0, 2.0], "bins": [-10.578125, -10.248046875, -9.91796875, -9.587890625, -9.2578125, -8.927734375, -8.59765625, -8.267578125, -7.9375, -7.607421875, -7.27734375, -6.947265625, -6.6171875, -6.287109375, -5.95703125, -5.626953125, -5.296875, -4.966796875, -4.63671875, -4.306640625, -3.9765625, -3.646484375, -3.31640625, -2.986328125, -2.65625, -2.326171875, -1.99609375, -1.666015625, -1.3359375, -1.005859375, -0.67578125, -0.345703125, -0.015625, 0.314453125, 0.64453125, 0.974609375, 1.3046875, 1.634765625, 1.96484375, 2.294921875, 2.625, 2.955078125, 3.28515625, 3.615234375, 3.9453125, 4.275390625, 4.60546875, 4.935546875, 5.265625, 5.595703125, 5.92578125, 6.255859375, 6.5859375, 6.916015625, 7.24609375, 7.576171875, 7.90625, 8.236328125, 8.56640625, 8.896484375, 9.2265625, 9.556640625, 9.88671875, 10.216796875, 10.546875]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 9.0, 4.0, 7.0, 7.0, 21.0, 15.0, 24.0, 18.0, 23.0, 30.0, 28.0, 34.0, 43.0, 57.0, 68.0, 61.0, 58.0, 64.0, 52.0, 56.0, 40.0, 47.0, 23.0, 32.0, 19.0, 24.0, 19.0, 16.0, 11.0, 14.0, 10.0, 9.0, 6.0, 6.0, 13.0, 6.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.7109375, -8.426025390625, -8.14111328125, -7.856201171875, -7.5712890625, -7.286376953125, -7.00146484375, -6.716552734375, -6.431640625, -6.146728515625, -5.86181640625, -5.576904296875, -5.2919921875, -5.007080078125, -4.72216796875, -4.437255859375, -4.15234375, -3.867431640625, -3.58251953125, -3.297607421875, -3.0126953125, -2.727783203125, -2.44287109375, -2.157958984375, -1.873046875, -1.588134765625, -1.30322265625, -1.018310546875, -0.7333984375, -0.448486328125, -0.16357421875, 0.121337890625, 0.40625, 0.691162109375, 0.97607421875, 1.260986328125, 1.5458984375, 1.830810546875, 2.11572265625, 2.400634765625, 2.685546875, 2.970458984375, 3.25537109375, 3.540283203125, 3.8251953125, 4.110107421875, 4.39501953125, 4.679931640625, 4.96484375, 5.249755859375, 5.53466796875, 5.819580078125, 6.1044921875, 6.389404296875, 6.67431640625, 6.959228515625, 7.244140625, 7.529052734375, 7.81396484375, 8.098876953125, 8.3837890625, 8.668701171875, 8.95361328125, 9.238525390625, 9.5234375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 6.0, 2.0, 8.0, 5.0, 11.0, 15.0, 12.0, 13.0, 15.0, 20.0, 26.0, 34.0, 20.0, 34.0, 45.0, 52.0, 42.0, 57.0, 58.0, 38.0, 44.0, 58.0, 48.0, 43.0, 46.0, 37.0, 29.0, 40.0, 25.0, 28.0, 21.0, 13.0, 14.0, 9.0, 10.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.716594696044922, -20.99232292175293, -20.26805305480957, -19.543781280517578, -18.819509506225586, -18.095237731933594, -17.370967864990234, -16.646696090698242, -15.92242431640625, -15.198153495788574, -14.473881721496582, -13.749610900878906, -13.025339126586914, -12.301068305969238, -11.576797485351562, -10.85252571105957, -10.128254890441895, -9.403984069824219, -8.679712295532227, -7.955441474914551, -7.231169700622559, -6.506898880004883, -5.782627582550049, -5.058356285095215, -4.334084987640381, -3.609813690185547, -2.885542392730713, -2.161271333694458, -1.437000036239624, -0.71272873878479, 0.011542320251464844, 0.7358136177062988, 1.4600849151611328, 2.184356212615967, 2.908627510070801, 3.6328985691070557, 4.357170104980469, 5.0814409255981445, 5.8057122230529785, 6.5299835205078125, 7.2542548179626465, 7.9785261154174805, 8.702796936035156, 9.427068710327148, 10.151339530944824, 10.875611305236816, 11.599882125854492, 12.324153900146484, 13.04842472076416, 13.772695541381836, 14.496967315673828, 15.221238136291504, 15.945509910583496, 16.669780731201172, 17.394052505493164, 18.118324279785156, 18.842594146728516, 19.566865921020508, 20.291135787963867, 21.01540756225586, 21.73967933654785, 22.463951110839844, 23.188220977783203, 23.912492752075195, 24.636764526367188]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 2.0, 7.0, 5.0, 0.0, 2.0, 6.0, 11.0, 9.0, 8.0, 12.0, 13.0, 10.0, 20.0, 10.0, 18.0, 27.0, 32.0, 21.0, 24.0, 27.0, 34.0, 31.0, 36.0, 38.0, 34.0, 47.0, 31.0, 45.0, 46.0, 40.0, 33.0, 34.0, 37.0, 25.0, 29.0, 28.0, 24.0, 19.0, 23.0, 15.0, 14.0, 12.0, 22.0, 10.0, 12.0, 9.0, 8.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.908458709716797, -25.028287887573242, -24.148115158081055, -23.2679443359375, -22.387773513793945, -21.50760269165039, -20.627429962158203, -19.74725914001465, -18.867088317871094, -17.98691749572754, -17.10674476623535, -16.226573944091797, -15.346403121948242, -14.466231346130371, -13.5860595703125, -12.705888748168945, -11.825716018676758, -10.945544242858887, -10.065373420715332, -9.185201644897461, -8.305030822753906, -7.424859046936035, -6.544687271118164, -5.664515972137451, -4.784344673156738, -3.9041733741760254, -3.0240018367767334, -2.1438302993774414, -1.2636590003967285, -0.3834877014160156, 0.49668407440185547, 1.3768553733825684, 2.257028579711914, 3.137199878692627, 4.01737117767334, 4.897542953491211, 5.777714252471924, 6.657885551452637, 7.538057327270508, 8.418228149414062, 9.298399925231934, 10.178571701049805, 11.05874252319336, 11.93891429901123, 12.819086074829102, 13.699256896972656, 14.579428672790527, 15.459600448608398, 16.339771270751953, 17.219942092895508, 18.100114822387695, 18.98028564453125, 19.860456466674805, 20.74062728881836, 21.620800018310547, 22.5009708404541, 23.381141662597656, 24.26131248474121, 25.1414852142334, 26.021656036376953, 26.901826858520508, 27.781997680664062, 28.66217041015625, 29.542341232299805, 30.422513961791992]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 8.0, 14.0, 9.0, 13.0, 32.0, 68.0, 106.0, 133.0, 256.0, 397.0, 606.0, 1002.0, 1590.0, 2689.0, 4293.0, 7156.0, 11924.0, 19874.0, 33091.0, 55862.0, 93614.0, 153926.0, 245272.0, 367213.0, 493260.0, 585574.0, 587684.0, 501184.0, 374239.0, 251873.0, 158468.0, 96087.0, 57850.0, 35116.0, 20906.0, 12635.0, 7747.0, 4693.0, 2878.0, 1844.0, 1108.0, 732.0, 441.0, 288.0, 219.0, 114.0, 68.0, 51.0, 32.0, 14.0, 15.0, 6.0, 6.0, 3.0, 6.0, 1.0, 1.0], "bins": [-18.1875, -17.636962890625, -17.08642578125, -16.535888671875, -15.9853515625, -15.434814453125, -14.88427734375, -14.333740234375, -13.783203125, -13.232666015625, -12.68212890625, -12.131591796875, -11.5810546875, -11.030517578125, -10.47998046875, -9.929443359375, -9.37890625, -8.828369140625, -8.27783203125, -7.727294921875, -7.1767578125, -6.626220703125, -6.07568359375, -5.525146484375, -4.974609375, -4.424072265625, -3.87353515625, -3.322998046875, -2.7724609375, -2.221923828125, -1.67138671875, -1.120849609375, -0.5703125, -0.019775390625, 0.53076171875, 1.081298828125, 1.6318359375, 2.182373046875, 2.73291015625, 3.283447265625, 3.833984375, 4.384521484375, 4.93505859375, 5.485595703125, 6.0361328125, 6.586669921875, 7.13720703125, 7.687744140625, 8.23828125, 8.788818359375, 9.33935546875, 9.889892578125, 10.4404296875, 10.990966796875, 11.54150390625, 12.092041015625, 12.642578125, 13.193115234375, 13.74365234375, 14.294189453125, 14.8447265625, 15.395263671875, 15.94580078125, 16.496337890625, 17.046875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 6.0, 0.0, 3.0, 4.0, 6.0, 4.0, 1.0, 9.0, 10.0, 15.0, 10.0, 12.0, 15.0, 12.0, 12.0, 21.0, 27.0, 24.0, 28.0, 24.0, 41.0, 30.0, 27.0, 44.0, 34.0, 35.0, 41.0, 40.0, 37.0, 33.0, 39.0, 46.0, 35.0, 40.0, 28.0, 25.0, 20.0, 27.0, 23.0, 24.0, 18.0, 12.0, 9.0, 18.0, 11.0, 11.0, 6.0, 4.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-21.765625, -21.066650390625, -20.36767578125, -19.668701171875, -18.9697265625, -18.270751953125, -17.57177734375, -16.872802734375, -16.173828125, -15.474853515625, -14.77587890625, -14.076904296875, -13.3779296875, -12.678955078125, -11.97998046875, -11.281005859375, -10.58203125, -9.883056640625, -9.18408203125, -8.485107421875, -7.7861328125, -7.087158203125, -6.38818359375, -5.689208984375, -4.990234375, -4.291259765625, -3.59228515625, -2.893310546875, -2.1943359375, -1.495361328125, -0.79638671875, -0.097412109375, 0.6015625, 1.300537109375, 1.99951171875, 2.698486328125, 3.3974609375, 4.096435546875, 4.79541015625, 5.494384765625, 6.193359375, 6.892333984375, 7.59130859375, 8.290283203125, 8.9892578125, 9.688232421875, 10.38720703125, 11.086181640625, 11.78515625, 12.484130859375, 13.18310546875, 13.882080078125, 14.5810546875, 15.280029296875, 15.97900390625, 16.677978515625, 17.376953125, 18.075927734375, 18.77490234375, 19.473876953125, 20.1728515625, 20.871826171875, 21.57080078125, 22.269775390625, 22.96875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 15.0, 32.0, 54.0, 83.0, 134.0, 205.0, 330.0, 563.0, 883.0, 1509.0, 2640.0, 4270.0, 7450.0, 12624.0, 21815.0, 37343.0, 63004.0, 105131.0, 168205.0, 258851.0, 370394.0, 484327.0, 556448.0, 558196.0, 482242.0, 371631.0, 259091.0, 168812.0, 104830.0, 62965.0, 37506.0, 21710.0, 12858.0, 7402.0, 4326.0, 2583.0, 1455.0, 879.0, 567.0, 334.0, 204.0, 126.0, 77.0, 59.0, 35.0, 27.0, 24.0, 7.0, 5.0, 7.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-18.75, -18.1640625, -17.578125, -16.9921875, -16.40625, -15.8203125, -15.234375, -14.6484375, -14.0625, -13.4765625, -12.890625, -12.3046875, -11.71875, -11.1328125, -10.546875, -9.9609375, -9.375, -8.7890625, -8.203125, -7.6171875, -7.03125, -6.4453125, -5.859375, -5.2734375, -4.6875, -4.1015625, -3.515625, -2.9296875, -2.34375, -1.7578125, -1.171875, -0.5859375, 0.0, 0.5859375, 1.171875, 1.7578125, 2.34375, 2.9296875, 3.515625, 4.1015625, 4.6875, 5.2734375, 5.859375, 6.4453125, 7.03125, 7.6171875, 8.203125, 8.7890625, 9.375, 9.9609375, 10.546875, 11.1328125, 11.71875, 12.3046875, 12.890625, 13.4765625, 14.0625, 14.6484375, 15.234375, 15.8203125, 16.40625, 16.9921875, 17.578125, 18.1640625, 18.75]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 12.0, 10.0, 27.0, 20.0, 36.0, 33.0, 48.0, 68.0, 87.0, 88.0, 110.0, 156.0, 172.0, 191.0, 208.0, 235.0, 283.0, 231.0, 242.0, 267.0, 230.0, 222.0, 208.0, 182.0, 149.0, 136.0, 91.0, 73.0, 61.0, 54.0, 45.0, 21.0, 26.0, 19.0, 11.0, 12.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.46875, -10.1014404296875, -9.734130859375, -9.3668212890625, -8.99951171875, -8.6322021484375, -8.264892578125, -7.8975830078125, -7.5302734375, -7.1629638671875, -6.795654296875, -6.4283447265625, -6.06103515625, -5.6937255859375, -5.326416015625, -4.9591064453125, -4.591796875, -4.2244873046875, -3.857177734375, -3.4898681640625, -3.12255859375, -2.7552490234375, -2.387939453125, -2.0206298828125, -1.6533203125, -1.2860107421875, -0.918701171875, -0.5513916015625, -0.18408203125, 0.1832275390625, 0.550537109375, 0.9178466796875, 1.28515625, 1.6524658203125, 2.019775390625, 2.3870849609375, 2.75439453125, 3.1217041015625, 3.489013671875, 3.8563232421875, 4.2236328125, 4.5909423828125, 4.958251953125, 5.3255615234375, 5.69287109375, 6.0601806640625, 6.427490234375, 6.7947998046875, 7.162109375, 7.5294189453125, 7.896728515625, 8.2640380859375, 8.63134765625, 8.9986572265625, 9.365966796875, 9.7332763671875, 10.1005859375, 10.4678955078125, 10.835205078125, 11.2025146484375, 11.56982421875, 11.9371337890625, 12.304443359375, 12.6717529296875, 13.0390625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 1.0, 7.0, 3.0, 2.0, 5.0, 7.0, 6.0, 10.0, 13.0, 17.0, 21.0, 16.0, 22.0, 21.0, 28.0, 35.0, 41.0, 40.0, 29.0, 39.0, 60.0, 33.0, 42.0, 48.0, 41.0, 38.0, 40.0, 55.0, 48.0, 38.0, 30.0, 26.0, 25.0, 16.0, 15.0, 18.0, 14.0, 11.0, 9.0, 10.0, 3.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.928218841552734, -20.271717071533203, -19.615217208862305, -18.958715438842773, -18.302215576171875, -17.645713806152344, -16.989213943481445, -16.332712173461914, -15.676212310791016, -15.0197114944458, -14.363210678100586, -13.706709861755371, -13.050209045410156, -12.393708229064941, -11.737207412719727, -11.080705642700195, -10.42420482635498, -9.767704010009766, -9.11120319366455, -8.454702377319336, -7.798201560974121, -7.141700744628906, -6.485199451446533, -5.828698635101318, -5.1721978187561035, -4.515697002410889, -3.859196186065674, -3.20269513130188, -2.546194314956665, -1.8896934986114502, -1.2331924438476562, -0.5766916275024414, 0.07980918884277344, 0.7363100647926331, 1.3928109407424927, 2.049311876296997, 2.705812692642212, 3.3623135089874268, 4.018814563751221, 4.6753153800964355, 5.33181619644165, 5.988317012786865, 6.64481782913208, 7.301319122314453, 7.957819938659668, 8.614320755004883, 9.270821571350098, 9.927322387695312, 10.583823204040527, 11.240324020385742, 11.896824836730957, 12.553325653076172, 13.209826469421387, 13.866327285766602, 14.522829055786133, 15.179328918457031, 15.835830688476562, 16.492332458496094, 17.148832321166992, 17.805334091186523, 18.461833953857422, 19.118335723876953, 19.77483558654785, 20.431337356567383, 21.08783721923828]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 10.0, 9.0, 7.0, 12.0, 11.0, 12.0, 17.0, 16.0, 20.0, 38.0, 20.0, 20.0, 46.0, 30.0, 23.0, 38.0, 43.0, 34.0, 44.0, 45.0, 47.0, 38.0, 46.0, 45.0, 44.0, 33.0, 30.0, 23.0, 21.0, 31.0, 21.0, 17.0, 14.0, 23.0, 13.0, 13.0, 11.0, 7.0, 5.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-28.027969360351562, -27.137474060058594, -26.246976852416992, -25.356481552124023, -24.465984344482422, -23.575489044189453, -22.684993743896484, -21.794496536254883, -20.90399932861328, -20.013504028320312, -19.12300682067871, -18.232511520385742, -17.34201431274414, -16.451519012451172, -15.561022758483887, -14.670526504516602, -13.780031204223633, -12.889534950256348, -11.999038696289062, -11.108543395996094, -10.218046188354492, -9.327550888061523, -8.437054634094238, -7.546558380126953, -6.656062126159668, -5.765565872192383, -4.875069618225098, -3.9845738410949707, -3.0940775871276855, -2.2035813331604004, -1.3130855560302734, -0.4225893020629883, 0.4679069519042969, 1.3584030866622925, 2.248899221420288, 3.139395236968994, 4.029891490936279, 4.9203877449035645, 5.810883522033691, 6.701379776000977, 7.591876029968262, 8.482372283935547, 9.372868537902832, 10.263364791870117, 11.153860092163086, 12.044357299804688, 12.934852600097656, 13.825348854064941, 14.715845108032227, 15.606341361999512, 16.496837615966797, 17.387332916259766, 18.277830123901367, 19.168325424194336, 20.058822631835938, 20.949317932128906, 21.839813232421875, 22.730308532714844, 23.620805740356445, 24.511301040649414, 25.401798248291016, 26.292293548583984, 27.182788848876953, 28.073286056518555, 28.963783264160156]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 5.0, 14.0, 13.0, 19.0, 33.0, 36.0, 54.0, 87.0, 131.0, 195.0, 345.0, 543.0, 910.0, 1550.0, 2620.0, 4623.0, 8368.0, 15604.0, 29452.0, 54777.0, 98866.0, 157047.0, 198076.0, 183305.0, 128012.0, 74735.0, 40940.0, 21668.0, 11630.0, 6371.0, 3523.0, 2039.0, 1162.0, 646.0, 411.0, 261.0, 156.0, 107.0, 73.0, 59.0, 35.0, 20.0, 15.0, 9.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-14.7890625, -14.38671875, -13.984375, -13.58203125, -13.1796875, -12.77734375, -12.375, -11.97265625, -11.5703125, -11.16796875, -10.765625, -10.36328125, -9.9609375, -9.55859375, -9.15625, -8.75390625, -8.3515625, -7.94921875, -7.546875, -7.14453125, -6.7421875, -6.33984375, -5.9375, -5.53515625, -5.1328125, -4.73046875, -4.328125, -3.92578125, -3.5234375, -3.12109375, -2.71875, -2.31640625, -1.9140625, -1.51171875, -1.109375, -0.70703125, -0.3046875, 0.09765625, 0.5, 0.90234375, 1.3046875, 1.70703125, 2.109375, 2.51171875, 2.9140625, 3.31640625, 3.71875, 4.12109375, 4.5234375, 4.92578125, 5.328125, 5.73046875, 6.1328125, 6.53515625, 6.9375, 7.33984375, 7.7421875, 8.14453125, 8.546875, 8.94921875, 9.3515625, 9.75390625, 10.15625, 10.55859375, 10.9609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 5.0, 7.0, 10.0, 12.0, 15.0, 14.0, 15.0, 21.0, 17.0, 27.0, 27.0, 33.0, 34.0, 24.0, 35.0, 29.0, 39.0, 51.0, 43.0, 47.0, 48.0, 43.0, 50.0, 32.0, 48.0, 40.0, 28.0, 18.0, 22.0, 23.0, 18.0, 20.0, 20.0, 15.0, 20.0, 5.0, 13.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-29.609375, -28.697998046875, -27.78662109375, -26.875244140625, -25.9638671875, -25.052490234375, -24.14111328125, -23.229736328125, -22.318359375, -21.406982421875, -20.49560546875, -19.584228515625, -18.6728515625, -17.761474609375, -16.85009765625, -15.938720703125, -15.02734375, -14.115966796875, -13.20458984375, -12.293212890625, -11.3818359375, -10.470458984375, -9.55908203125, -8.647705078125, -7.736328125, -6.824951171875, -5.91357421875, -5.002197265625, -4.0908203125, -3.179443359375, -2.26806640625, -1.356689453125, -0.4453125, 0.466064453125, 1.37744140625, 2.288818359375, 3.2001953125, 4.111572265625, 5.02294921875, 5.934326171875, 6.845703125, 7.757080078125, 8.66845703125, 9.579833984375, 10.4912109375, 11.402587890625, 12.31396484375, 13.225341796875, 14.13671875, 15.048095703125, 15.95947265625, 16.870849609375, 17.7822265625, 18.693603515625, 19.60498046875, 20.516357421875, 21.427734375, 22.339111328125, 23.25048828125, 24.161865234375, 25.0732421875, 25.984619140625, 26.89599609375, 27.807373046875, 28.71875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 3.0, 3.0, 4.0, 9.0, 20.0, 23.0, 20.0, 44.0, 46.0, 74.0, 89.0, 137.0, 192.0, 305.0, 490.0, 789.0, 1316.0, 2218.0, 3967.0, 7546.0, 15483.0, 32233.0, 70520.0, 147388.0, 244725.0, 241860.0, 145581.0, 69412.0, 31929.0, 15017.0, 7399.0, 3964.0, 2231.0, 1274.0, 781.0, 488.0, 307.0, 190.0, 139.0, 98.0, 69.0, 43.0, 37.0, 21.0, 18.0, 15.0, 10.0, 8.0, 6.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-16.640625, -16.13623046875, -15.6318359375, -15.12744140625, -14.623046875, -14.11865234375, -13.6142578125, -13.10986328125, -12.60546875, -12.10107421875, -11.5966796875, -11.09228515625, -10.587890625, -10.08349609375, -9.5791015625, -9.07470703125, -8.5703125, -8.06591796875, -7.5615234375, -7.05712890625, -6.552734375, -6.04833984375, -5.5439453125, -5.03955078125, -4.53515625, -4.03076171875, -3.5263671875, -3.02197265625, -2.517578125, -2.01318359375, -1.5087890625, -1.00439453125, -0.5, 0.00439453125, 0.5087890625, 1.01318359375, 1.517578125, 2.02197265625, 2.5263671875, 3.03076171875, 3.53515625, 4.03955078125, 4.5439453125, 5.04833984375, 5.552734375, 6.05712890625, 6.5615234375, 7.06591796875, 7.5703125, 8.07470703125, 8.5791015625, 9.08349609375, 9.587890625, 10.09228515625, 10.5966796875, 11.10107421875, 11.60546875, 12.10986328125, 12.6142578125, 13.11865234375, 13.623046875, 14.12744140625, 14.6318359375, 15.13623046875, 15.640625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 3.0, 9.0, 8.0, 7.0, 14.0, 14.0, 14.0, 20.0, 18.0, 22.0, 37.0, 28.0, 32.0, 36.0, 39.0, 51.0, 49.0, 61.0, 29.0, 41.0, 45.0, 39.0, 52.0, 44.0, 45.0, 26.0, 37.0, 27.0, 27.0, 27.0, 16.0, 16.0, 15.0, 7.0, 13.0, 5.0, 8.0, 9.0, 7.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.0625, -20.44580078125, -19.8291015625, -19.21240234375, -18.595703125, -17.97900390625, -17.3623046875, -16.74560546875, -16.12890625, -15.51220703125, -14.8955078125, -14.27880859375, -13.662109375, -13.04541015625, -12.4287109375, -11.81201171875, -11.1953125, -10.57861328125, -9.9619140625, -9.34521484375, -8.728515625, -8.11181640625, -7.4951171875, -6.87841796875, -6.26171875, -5.64501953125, -5.0283203125, -4.41162109375, -3.794921875, -3.17822265625, -2.5615234375, -1.94482421875, -1.328125, -0.71142578125, -0.0947265625, 0.52197265625, 1.138671875, 1.75537109375, 2.3720703125, 2.98876953125, 3.60546875, 4.22216796875, 4.8388671875, 5.45556640625, 6.072265625, 6.68896484375, 7.3056640625, 7.92236328125, 8.5390625, 9.15576171875, 9.7724609375, 10.38916015625, 11.005859375, 11.62255859375, 12.2392578125, 12.85595703125, 13.47265625, 14.08935546875, 14.7060546875, 15.32275390625, 15.939453125, 16.55615234375, 17.1728515625, 17.78955078125, 18.40625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 3.0, 8.0, 14.0, 15.0, 18.0, 27.0, 43.0, 41.0, 67.0, 83.0, 124.0, 167.0, 205.0, 289.0, 389.0, 544.0, 785.0, 1302.0, 1985.0, 3493.0, 6739.0, 14613.0, 39866.0, 125817.0, 346296.0, 326816.0, 113359.0, 36112.0, 13690.0, 6307.0, 3370.0, 1955.0, 1275.0, 755.0, 576.0, 369.0, 291.0, 207.0, 129.0, 126.0, 80.0, 46.0, 35.0, 36.0, 25.0, 23.0, 14.0, 10.0, 2.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-11.8828125, -11.510986328125, -11.13916015625, -10.767333984375, -10.3955078125, -10.023681640625, -9.65185546875, -9.280029296875, -8.908203125, -8.536376953125, -8.16455078125, -7.792724609375, -7.4208984375, -7.049072265625, -6.67724609375, -6.305419921875, -5.93359375, -5.561767578125, -5.18994140625, -4.818115234375, -4.4462890625, -4.074462890625, -3.70263671875, -3.330810546875, -2.958984375, -2.587158203125, -2.21533203125, -1.843505859375, -1.4716796875, -1.099853515625, -0.72802734375, -0.356201171875, 0.015625, 0.387451171875, 0.75927734375, 1.131103515625, 1.5029296875, 1.874755859375, 2.24658203125, 2.618408203125, 2.990234375, 3.362060546875, 3.73388671875, 4.105712890625, 4.4775390625, 4.849365234375, 5.22119140625, 5.593017578125, 5.96484375, 6.336669921875, 6.70849609375, 7.080322265625, 7.4521484375, 7.823974609375, 8.19580078125, 8.567626953125, 8.939453125, 9.311279296875, 9.68310546875, 10.054931640625, 10.4267578125, 10.798583984375, 11.17041015625, 11.542236328125, 11.9140625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 10.0, 15.0, 13.0, 42.0, 65.0, 102.0, 142.0, 143.0, 126.0, 115.0, 73.0, 47.0, 30.0, 26.0, 8.0, 9.0, 2.0, 5.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0010738372802734375, -0.0010475069284439087, -0.0010211765766143799, -0.000994846224784851, -0.0009685158729553223, -0.0009421855211257935, -0.0009158551692962646, -0.0008895248174667358, -0.000863194465637207, -0.0008368641138076782, -0.0008105337619781494, -0.0007842034101486206, -0.0007578730583190918, -0.000731542706489563, -0.0007052123546600342, -0.0006788820028305054, -0.0006525516510009766, -0.0006262212991714478, -0.0005998909473419189, -0.0005735605955123901, -0.0005472302436828613, -0.0005208998918533325, -0.0004945695400238037, -0.0004682391881942749, -0.0004419088363647461, -0.0004155784845352173, -0.0003892481327056885, -0.00036291778087615967, -0.00033658742904663086, -0.00031025707721710205, -0.00028392672538757324, -0.00025759637355804443, -0.00023126602172851562, -0.00020493566989898682, -0.000178605318069458, -0.0001522749662399292, -0.0001259446144104004, -9.961426258087158e-05, -7.328391075134277e-05, -4.6953558921813965e-05, -2.0623207092285156e-05, 5.707144737243652e-06, 3.203749656677246e-05, 5.836784839630127e-05, 8.469820022583008e-05, 0.00011102855205535889, 0.0001373589038848877, 0.0001636892557144165, 0.0001900196075439453, 0.00021634995937347412, 0.00024268031120300293, 0.00026901066303253174, 0.00029534101486206055, 0.00032167136669158936, 0.00034800171852111816, 0.00037433207035064697, 0.0004006624221801758, 0.0004269927740097046, 0.0004533231258392334, 0.0004796534776687622, 0.000505983829498291, 0.0005323141813278198, 0.0005586445331573486, 0.0005849748849868774, 0.0006113052368164062]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 6.0, 4.0, 9.0, 15.0, 17.0, 22.0, 26.0, 46.0, 52.0, 76.0, 96.0, 122.0, 182.0, 228.0, 314.0, 450.0, 673.0, 889.0, 1623.0, 2655.0, 4725.0, 8830.0, 18347.0, 40157.0, 91352.0, 190694.0, 273334.0, 213520.0, 107824.0, 47309.0, 21172.0, 10131.0, 5203.0, 3052.0, 1763.0, 1087.0, 721.0, 503.0, 338.0, 270.0, 165.0, 135.0, 119.0, 75.0, 68.0, 45.0, 25.0, 28.0, 20.0, 13.0, 8.0, 8.0, 8.0, 0.0, 1.0, 5.0, 2.0, 1.0], "bins": [-9.953125, -9.6478271484375, -9.342529296875, -9.0372314453125, -8.73193359375, -8.4266357421875, -8.121337890625, -7.8160400390625, -7.5107421875, -7.2054443359375, -6.900146484375, -6.5948486328125, -6.28955078125, -5.9842529296875, -5.678955078125, -5.3736572265625, -5.068359375, -4.7630615234375, -4.457763671875, -4.1524658203125, -3.84716796875, -3.5418701171875, -3.236572265625, -2.9312744140625, -2.6259765625, -2.3206787109375, -2.015380859375, -1.7100830078125, -1.40478515625, -1.0994873046875, -0.794189453125, -0.4888916015625, -0.18359375, 0.1217041015625, 0.427001953125, 0.7322998046875, 1.03759765625, 1.3428955078125, 1.648193359375, 1.9534912109375, 2.2587890625, 2.5640869140625, 2.869384765625, 3.1746826171875, 3.47998046875, 3.7852783203125, 4.090576171875, 4.3958740234375, 4.701171875, 5.0064697265625, 5.311767578125, 5.6170654296875, 5.92236328125, 6.2276611328125, 6.532958984375, 6.8382568359375, 7.1435546875, 7.4488525390625, 7.754150390625, 8.0594482421875, 8.36474609375, 8.6700439453125, 8.975341796875, 9.2806396484375, 9.5859375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 6.0, 8.0, 15.0, 18.0, 27.0, 28.0, 44.0, 54.0, 63.0, 80.0, 94.0, 81.0, 77.0, 66.0, 80.0, 57.0, 34.0, 33.0, 28.0, 23.0, 15.0, 10.0, 8.0, 8.0, 4.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.689453125, -3.564910888671875, -3.44036865234375, -3.315826416015625, -3.1912841796875, -3.066741943359375, -2.94219970703125, -2.817657470703125, -2.693115234375, -2.568572998046875, -2.44403076171875, -2.319488525390625, -2.1949462890625, -2.070404052734375, -1.94586181640625, -1.821319580078125, -1.69677734375, -1.572235107421875, -1.44769287109375, -1.323150634765625, -1.1986083984375, -1.074066162109375, -0.94952392578125, -0.824981689453125, -0.700439453125, -0.575897216796875, -0.45135498046875, -0.326812744140625, -0.2022705078125, -0.077728271484375, 0.04681396484375, 0.171356201171875, 0.2958984375, 0.420440673828125, 0.54498291015625, 0.669525146484375, 0.7940673828125, 0.918609619140625, 1.04315185546875, 1.167694091796875, 1.292236328125, 1.416778564453125, 1.54132080078125, 1.665863037109375, 1.7904052734375, 1.914947509765625, 2.03948974609375, 2.164031982421875, 2.28857421875, 2.413116455078125, 2.53765869140625, 2.662200927734375, 2.7867431640625, 2.911285400390625, 3.03582763671875, 3.160369873046875, 3.284912109375, 3.409454345703125, 3.53399658203125, 3.658538818359375, 3.7830810546875, 3.907623291015625, 4.03216552734375, 4.156707763671875, 4.28125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 3.0, 5.0, 8.0, 4.0, 6.0, 6.0, 9.0, 17.0, 20.0, 17.0, 19.0, 24.0, 29.0, 38.0, 36.0, 32.0, 36.0, 48.0, 47.0, 44.0, 40.0, 40.0, 46.0, 35.0, 41.0, 52.0, 47.0, 37.0, 42.0, 28.0, 23.0, 20.0, 18.0, 12.0, 14.0, 9.0, 13.0, 5.0, 7.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.23821258544922, -20.594074249267578, -19.949934005737305, -19.305795669555664, -18.66165542602539, -18.01751708984375, -17.373376846313477, -16.729238510131836, -16.085098266601562, -15.440958976745605, -14.796819686889648, -14.152680397033691, -13.508541107177734, -12.864402770996094, -12.220263481140137, -11.57612419128418, -10.931985855102539, -10.287846565246582, -9.643707275390625, -8.999567985534668, -8.355428695678711, -7.711289882659912, -7.067151069641113, -6.423011779785156, -5.778872489929199, -5.134733200073242, -4.490593910217285, -3.8464550971984863, -3.2023158073425293, -2.5581765174865723, -1.9140374660491943, -1.2698984146118164, -0.6257610321044922, 0.018378138542175293, 0.6625173091888428, 1.3066564798355103, 1.9507956504821777, 2.5949349403381348, 3.2390739917755127, 3.8832130432128906, 4.527352333068848, 5.171491622924805, 5.815630912780762, 6.4597697257995605, 7.103909015655518, 7.748048305511475, 8.392187118530273, 9.03632640838623, 9.680465698242188, 10.324604988098145, 10.968744277954102, 11.612883567810059, 12.257022857666016, 12.901161193847656, 13.545300483703613, 14.18943977355957, 14.833579063415527, 15.477718353271484, 16.121856689453125, 16.7659969329834, 17.41013526916504, 18.054275512695312, 18.698413848876953, 19.342552185058594, 19.986692428588867]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 8.0, 8.0, 7.0, 8.0, 10.0, 10.0, 11.0, 12.0, 21.0, 18.0, 24.0, 31.0, 23.0, 20.0, 34.0, 34.0, 39.0, 37.0, 35.0, 34.0, 39.0, 52.0, 38.0, 50.0, 37.0, 46.0, 44.0, 32.0, 30.0, 20.0, 23.0, 34.0, 15.0, 19.0, 17.0, 18.0, 18.0, 10.0, 8.0, 7.0, 6.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-27.404603958129883, -26.529218673706055, -25.65383529663086, -24.77845001220703, -23.903064727783203, -23.027681350708008, -22.15229606628418, -21.276912689208984, -20.401527404785156, -19.526142120361328, -18.650758743286133, -17.775373458862305, -16.89999008178711, -16.02460479736328, -15.149219512939453, -14.273835182189941, -13.39845085144043, -12.523066520690918, -11.647682189941406, -10.772296905517578, -9.896912574768066, -9.021528244018555, -8.146142959594727, -7.270758628845215, -6.395374298095703, -5.519989967346191, -4.6446051597595215, -3.7692205905914307, -2.89383602142334, -2.018451690673828, -1.1430668830871582, -0.2676820755004883, 0.6077003479003906, 1.4830849170684814, 2.3584694862365723, 3.233854055404663, 4.109238624572754, 4.984622955322266, 5.8600077629089355, 6.7353925704956055, 7.610776901245117, 8.486161231994629, 9.36154556274414, 10.236930847167969, 11.11231517791748, 11.987699508666992, 12.86308479309082, 13.738469123840332, 14.613853454589844, 15.489237785339355, 16.364622116088867, 17.240007400512695, 18.11539077758789, 18.99077606201172, 19.866161346435547, 20.741546630859375, 21.61693000793457, 22.4923152923584, 23.367698669433594, 24.243083953857422, 25.11846923828125, 25.993852615356445, 26.869237899780273, 27.74462127685547, 28.620006561279297]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 18.0, 19.0, 19.0, 34.0, 58.0, 85.0, 109.0, 206.0, 282.0, 461.0, 722.0, 1118.0, 1880.0, 2878.0, 4797.0, 7349.0, 11760.0, 18167.0, 27663.0, 40532.0, 57383.0, 76599.0, 96650.0, 111412.0, 117517.0, 112854.0, 98105.0, 78388.0, 58858.0, 42275.0, 28251.0, 18853.0, 12102.0, 7895.0, 4886.0, 3088.0, 1957.0, 1233.0, 745.0, 492.0, 306.0, 214.0, 123.0, 75.0, 45.0, 32.0, 17.0, 15.0, 9.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-14.0703125, -13.624267578125, -13.17822265625, -12.732177734375, -12.2861328125, -11.840087890625, -11.39404296875, -10.947998046875, -10.501953125, -10.055908203125, -9.60986328125, -9.163818359375, -8.7177734375, -8.271728515625, -7.82568359375, -7.379638671875, -6.93359375, -6.487548828125, -6.04150390625, -5.595458984375, -5.1494140625, -4.703369140625, -4.25732421875, -3.811279296875, -3.365234375, -2.919189453125, -2.47314453125, -2.027099609375, -1.5810546875, -1.135009765625, -0.68896484375, -0.242919921875, 0.203125, 0.649169921875, 1.09521484375, 1.541259765625, 1.9873046875, 2.433349609375, 2.87939453125, 3.325439453125, 3.771484375, 4.217529296875, 4.66357421875, 5.109619140625, 5.5556640625, 6.001708984375, 6.44775390625, 6.893798828125, 7.33984375, 7.785888671875, 8.23193359375, 8.677978515625, 9.1240234375, 9.570068359375, 10.01611328125, 10.462158203125, 10.908203125, 11.354248046875, 11.80029296875, 12.246337890625, 12.6923828125, 13.138427734375, 13.58447265625, 14.030517578125, 14.4765625]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 7.0, 3.0, 7.0, 15.0, 17.0, 17.0, 20.0, 15.0, 24.0, 19.0, 29.0, 34.0, 34.0, 45.0, 41.0, 35.0, 38.0, 46.0, 47.0, 55.0, 46.0, 43.0, 39.0, 41.0, 35.0, 25.0, 36.0, 32.0, 19.0, 21.0, 21.0, 14.0, 18.0, 9.0, 14.0, 8.0, 7.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.703125, -28.762939453125, -27.82275390625, -26.882568359375, -25.9423828125, -25.002197265625, -24.06201171875, -23.121826171875, -22.181640625, -21.241455078125, -20.30126953125, -19.361083984375, -18.4208984375, -17.480712890625, -16.54052734375, -15.600341796875, -14.66015625, -13.719970703125, -12.77978515625, -11.839599609375, -10.8994140625, -9.959228515625, -9.01904296875, -8.078857421875, -7.138671875, -6.198486328125, -5.25830078125, -4.318115234375, -3.3779296875, -2.437744140625, -1.49755859375, -0.557373046875, 0.3828125, 1.322998046875, 2.26318359375, 3.203369140625, 4.1435546875, 5.083740234375, 6.02392578125, 6.964111328125, 7.904296875, 8.844482421875, 9.78466796875, 10.724853515625, 11.6650390625, 12.605224609375, 13.54541015625, 14.485595703125, 15.42578125, 16.365966796875, 17.30615234375, 18.246337890625, 19.1865234375, 20.126708984375, 21.06689453125, 22.007080078125, 22.947265625, 23.887451171875, 24.82763671875, 25.767822265625, 26.7080078125, 27.648193359375, 28.58837890625, 29.528564453125, 30.46875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 9.0, 13.0, 23.0, 42.0, 50.0, 91.0, 149.0, 195.0, 328.0, 489.0, 789.0, 1137.0, 1891.0, 2830.0, 4401.0, 6748.0, 10666.0, 15783.0, 24648.0, 35923.0, 50947.0, 69355.0, 88619.0, 104791.0, 114673.0, 113436.0, 102240.0, 85558.0, 65564.0, 48116.0, 33788.0, 22530.0, 14995.0, 9838.0, 6307.0, 4122.0, 2649.0, 1738.0, 1031.0, 737.0, 461.0, 303.0, 209.0, 122.0, 84.0, 56.0, 26.0, 17.0, 14.0, 9.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.984375, -13.531982421875, -13.07958984375, -12.627197265625, -12.1748046875, -11.722412109375, -11.27001953125, -10.817626953125, -10.365234375, -9.912841796875, -9.46044921875, -9.008056640625, -8.5556640625, -8.103271484375, -7.65087890625, -7.198486328125, -6.74609375, -6.293701171875, -5.84130859375, -5.388916015625, -4.9365234375, -4.484130859375, -4.03173828125, -3.579345703125, -3.126953125, -2.674560546875, -2.22216796875, -1.769775390625, -1.3173828125, -0.864990234375, -0.41259765625, 0.039794921875, 0.4921875, 0.944580078125, 1.39697265625, 1.849365234375, 2.3017578125, 2.754150390625, 3.20654296875, 3.658935546875, 4.111328125, 4.563720703125, 5.01611328125, 5.468505859375, 5.9208984375, 6.373291015625, 6.82568359375, 7.278076171875, 7.73046875, 8.182861328125, 8.63525390625, 9.087646484375, 9.5400390625, 9.992431640625, 10.44482421875, 10.897216796875, 11.349609375, 11.802001953125, 12.25439453125, 12.706787109375, 13.1591796875, 13.611572265625, 14.06396484375, 14.516357421875, 14.96875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 9.0, 7.0, 4.0, 2.0, 13.0, 15.0, 23.0, 19.0, 17.0, 12.0, 25.0, 21.0, 29.0, 28.0, 33.0, 32.0, 51.0, 42.0, 37.0, 46.0, 51.0, 46.0, 39.0, 40.0, 36.0, 36.0, 37.0, 38.0, 39.0, 23.0, 27.0, 24.0, 18.0, 14.0, 9.0, 9.0, 8.0, 11.0, 9.0, 10.0, 5.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.0, -19.392822265625, -18.78564453125, -18.178466796875, -17.5712890625, -16.964111328125, -16.35693359375, -15.749755859375, -15.142578125, -14.535400390625, -13.92822265625, -13.321044921875, -12.7138671875, -12.106689453125, -11.49951171875, -10.892333984375, -10.28515625, -9.677978515625, -9.07080078125, -8.463623046875, -7.8564453125, -7.249267578125, -6.64208984375, -6.034912109375, -5.427734375, -4.820556640625, -4.21337890625, -3.606201171875, -2.9990234375, -2.391845703125, -1.78466796875, -1.177490234375, -0.5703125, 0.036865234375, 0.64404296875, 1.251220703125, 1.8583984375, 2.465576171875, 3.07275390625, 3.679931640625, 4.287109375, 4.894287109375, 5.50146484375, 6.108642578125, 6.7158203125, 7.322998046875, 7.93017578125, 8.537353515625, 9.14453125, 9.751708984375, 10.35888671875, 10.966064453125, 11.5732421875, 12.180419921875, 12.78759765625, 13.394775390625, 14.001953125, 14.609130859375, 15.21630859375, 15.823486328125, 16.4306640625, 17.037841796875, 17.64501953125, 18.252197265625, 18.859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 8.0, 12.0, 14.0, 18.0, 23.0, 41.0, 43.0, 71.0, 114.0, 141.0, 256.0, 414.0, 540.0, 839.0, 1228.0, 2045.0, 3113.0, 5008.0, 8136.0, 13416.0, 22039.0, 36236.0, 57430.0, 87597.0, 120727.0, 144884.0, 148262.0, 128859.0, 95936.0, 65112.0, 40674.0, 25328.0, 15135.0, 9169.0, 5749.0, 3551.0, 2197.0, 1444.0, 926.0, 571.0, 396.0, 298.0, 168.0, 122.0, 68.0, 77.0, 36.0, 30.0, 17.0, 14.0, 11.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0], "bins": [-8.8203125, -8.5540771484375, -8.287841796875, -8.0216064453125, -7.75537109375, -7.4891357421875, -7.222900390625, -6.9566650390625, -6.6904296875, -6.4241943359375, -6.157958984375, -5.8917236328125, -5.62548828125, -5.3592529296875, -5.093017578125, -4.8267822265625, -4.560546875, -4.2943115234375, -4.028076171875, -3.7618408203125, -3.49560546875, -3.2293701171875, -2.963134765625, -2.6968994140625, -2.4306640625, -2.1644287109375, -1.898193359375, -1.6319580078125, -1.36572265625, -1.0994873046875, -0.833251953125, -0.5670166015625, -0.30078125, -0.0345458984375, 0.231689453125, 0.4979248046875, 0.76416015625, 1.0303955078125, 1.296630859375, 1.5628662109375, 1.8291015625, 2.0953369140625, 2.361572265625, 2.6278076171875, 2.89404296875, 3.1602783203125, 3.426513671875, 3.6927490234375, 3.958984375, 4.2252197265625, 4.491455078125, 4.7576904296875, 5.02392578125, 5.2901611328125, 5.556396484375, 5.8226318359375, 6.0888671875, 6.3551025390625, 6.621337890625, 6.8875732421875, 7.15380859375, 7.4200439453125, 7.686279296875, 7.9525146484375, 8.21875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 5.0, 6.0, 12.0, 10.0, 12.0, 16.0, 20.0, 36.0, 33.0, 40.0, 59.0, 60.0, 54.0, 53.0, 56.0, 45.0, 47.0, 48.0, 60.0, 50.0, 44.0, 36.0, 30.0, 26.0, 23.0, 17.0, 25.0, 16.0, 11.0, 7.0, 12.0, 6.0, 3.0, 10.0, 3.0, 1.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007410049438476562, -0.0007145777344703674, -0.0006881505250930786, -0.0006617233157157898, -0.000635296106338501, -0.0006088688969612122, -0.0005824416875839233, -0.0005560144782066345, -0.0005295872688293457, -0.0005031600594520569, -0.00047673285007476807, -0.00045030564069747925, -0.00042387843132019043, -0.0003974512219429016, -0.0003710240125656128, -0.000344596803188324, -0.00031816959381103516, -0.00029174238443374634, -0.0002653151750564575, -0.0002388879656791687, -0.00021246075630187988, -0.00018603354692459106, -0.00015960633754730225, -0.00013317912817001343, -0.00010675191879272461, -8.032470941543579e-05, -5.389750003814697e-05, -2.7470290660858154e-05, -1.043081283569336e-06, 2.5384128093719482e-05, 5.18113374710083e-05, 7.823854684829712e-05, 0.00010466575622558594, 0.00013109296560287476, 0.00015752017498016357, 0.0001839473843574524, 0.0002103745937347412, 0.00023680180311203003, 0.00026322901248931885, 0.00028965622186660767, 0.0003160834312438965, 0.0003425106406211853, 0.0003689378499984741, 0.00039536505937576294, 0.00042179226875305176, 0.0004482194781303406, 0.0004746466875076294, 0.0005010738968849182, 0.000527501106262207, 0.0005539283156394958, 0.0005803555250167847, 0.0006067827343940735, 0.0006332099437713623, 0.0006596371531486511, 0.0006860643625259399, 0.0007124915719032288, 0.0007389187812805176, 0.0007653459906578064, 0.0007917732000350952, 0.000818200409412384, 0.0008446276187896729, 0.0008710548281669617, 0.0008974820375442505, 0.0009239092469215393, 0.0009503364562988281]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 7.0, 16.0, 18.0, 41.0, 37.0, 60.0, 87.0, 148.0, 210.0, 281.0, 474.0, 794.0, 1342.0, 2312.0, 3756.0, 6462.0, 10975.0, 18740.0, 31723.0, 52731.0, 81288.0, 114916.0, 143562.0, 152299.0, 137047.0, 105337.0, 71854.0, 45022.0, 27652.0, 16344.0, 9437.0, 5376.0, 3127.0, 1937.0, 1221.0, 697.0, 428.0, 281.0, 180.0, 113.0, 59.0, 46.0, 37.0, 20.0, 18.0, 11.0, 9.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.953125, -8.6763916015625, -8.399658203125, -8.1229248046875, -7.84619140625, -7.5694580078125, -7.292724609375, -7.0159912109375, -6.7392578125, -6.4625244140625, -6.185791015625, -5.9090576171875, -5.63232421875, -5.3555908203125, -5.078857421875, -4.8021240234375, -4.525390625, -4.2486572265625, -3.971923828125, -3.6951904296875, -3.41845703125, -3.1417236328125, -2.864990234375, -2.5882568359375, -2.3115234375, -2.0347900390625, -1.758056640625, -1.4813232421875, -1.20458984375, -0.9278564453125, -0.651123046875, -0.3743896484375, -0.09765625, 0.1790771484375, 0.455810546875, 0.7325439453125, 1.00927734375, 1.2860107421875, 1.562744140625, 1.8394775390625, 2.1162109375, 2.3929443359375, 2.669677734375, 2.9464111328125, 3.22314453125, 3.4998779296875, 3.776611328125, 4.0533447265625, 4.330078125, 4.6068115234375, 4.883544921875, 5.1602783203125, 5.43701171875, 5.7137451171875, 5.990478515625, 6.2672119140625, 6.5439453125, 6.8206787109375, 7.097412109375, 7.3741455078125, 7.65087890625, 7.9276123046875, 8.204345703125, 8.4810791015625, 8.7578125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 1.0, 6.0, 7.0, 9.0, 16.0, 21.0, 10.0, 16.0, 33.0, 23.0, 30.0, 42.0, 37.0, 49.0, 55.0, 52.0, 69.0, 58.0, 54.0, 59.0, 59.0, 46.0, 43.0, 38.0, 44.0, 24.0, 17.0, 15.0, 13.0, 8.0, 8.0, 8.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0], "bins": [-8.1796875, -7.96417236328125, -7.7486572265625, -7.53314208984375, -7.317626953125, -7.10211181640625, -6.8865966796875, -6.67108154296875, -6.45556640625, -6.24005126953125, -6.0245361328125, -5.80902099609375, -5.593505859375, -5.37799072265625, -5.1624755859375, -4.94696044921875, -4.7314453125, -4.51593017578125, -4.3004150390625, -4.08489990234375, -3.869384765625, -3.65386962890625, -3.4383544921875, -3.22283935546875, -3.00732421875, -2.79180908203125, -2.5762939453125, -2.36077880859375, -2.145263671875, -1.92974853515625, -1.7142333984375, -1.49871826171875, -1.283203125, -1.06768798828125, -0.8521728515625, -0.63665771484375, -0.421142578125, -0.20562744140625, 0.0098876953125, 0.22540283203125, 0.44091796875, 0.65643310546875, 0.8719482421875, 1.08746337890625, 1.302978515625, 1.51849365234375, 1.7340087890625, 1.94952392578125, 2.1650390625, 2.38055419921875, 2.5960693359375, 2.81158447265625, 3.027099609375, 3.24261474609375, 3.4581298828125, 3.67364501953125, 3.88916015625, 4.10467529296875, 4.3201904296875, 4.53570556640625, 4.751220703125, 4.96673583984375, 5.1822509765625, 5.39776611328125, 5.61328125]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 5.0, 2.0, 6.0, 2.0, 6.0, 15.0, 22.0, 10.0, 13.0, 18.0, 21.0, 29.0, 42.0, 35.0, 36.0, 46.0, 36.0, 32.0, 45.0, 61.0, 72.0, 51.0, 44.0, 43.0, 48.0, 43.0, 47.0, 26.0, 28.0, 18.0, 25.0, 20.0, 11.0, 12.0, 10.0, 7.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.688817977905273, -21.973594665527344, -21.25836944580078, -20.54314613342285, -19.82792091369629, -19.11269760131836, -18.397472381591797, -17.682249069213867, -16.967023849487305, -16.251800537109375, -15.536575317382812, -14.821351051330566, -14.10612678527832, -13.390902519226074, -12.675678253173828, -11.960454940795898, -11.245230674743652, -10.530006408691406, -9.81478214263916, -9.099557876586914, -8.384333610534668, -7.669109344482422, -6.953885555267334, -6.238661289215088, -5.523437023162842, -4.808212757110596, -4.09298849105835, -3.3777644634246826, -2.6625401973724365, -1.9473159313201904, -1.2320919036865234, -0.5168676376342773, 0.19835662841796875, 0.9135808348655701, 1.6288050413131714, 2.344029188156128, 3.059253454208374, 3.77447772026062, 4.489701747894287, 5.204926013946533, 5.920150279998779, 6.635374546051025, 7.3505988121032715, 8.06582260131836, 8.781046867370605, 9.496271133422852, 10.211495399475098, 10.926719665527344, 11.64194393157959, 12.357168197631836, 13.072392463684082, 13.787616729736328, 14.502840995788574, 15.21806526184082, 15.93328857421875, 16.648513793945312, 17.363737106323242, 18.078960418701172, 18.794185638427734, 19.509408950805664, 20.224634170532227, 20.939857482910156, 21.65508270263672, 22.37030601501465, 23.08553123474121]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 6.0, 10.0, 6.0, 11.0, 8.0, 12.0, 13.0, 14.0, 13.0, 31.0, 23.0, 33.0, 22.0, 29.0, 40.0, 49.0, 23.0, 40.0, 46.0, 52.0, 45.0, 35.0, 40.0, 42.0, 28.0, 30.0, 37.0, 38.0, 30.0, 34.0, 24.0, 20.0, 23.0, 19.0, 16.0, 8.0, 9.0, 12.0, 9.0, 6.0, 3.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.70754051208496, -24.83597755432129, -23.964412689208984, -23.092849731445312, -22.22128677368164, -21.34972381591797, -20.478158950805664, -19.606595993041992, -18.735031127929688, -17.863468170166016, -16.99190330505371, -16.12034034729004, -15.248777389526367, -14.377213478088379, -13.50564956665039, -12.634086608886719, -11.762523651123047, -10.890959739685059, -10.019396781921387, -9.147832870483398, -8.276269912719727, -7.404706001281738, -6.53314208984375, -5.66157865524292, -4.79001522064209, -3.9184517860412598, -3.0468881130218506, -2.1753244400024414, -1.3037610054016113, -0.43219757080078125, 0.43936634063720703, 1.310929775238037, 2.182493209838867, 3.0540566444396973, 3.9256203174591064, 4.797183990478516, 5.668747425079346, 6.540310859680176, 7.411874771118164, 8.283437728881836, 9.155001640319824, 10.026565551757812, 10.898128509521484, 11.769692420959473, 12.641256332397461, 13.512819290161133, 14.384383201599121, 15.25594711303711, 16.12751007080078, 16.999073028564453, 17.870637893676758, 18.74220085144043, 19.6137638092041, 20.485328674316406, 21.356891632080078, 22.22845458984375, 23.100017547607422, 23.971580505371094, 24.8431453704834, 25.71470832824707, 26.586271286010742, 27.457836151123047, 28.32939910888672, 29.20096206665039, 30.072526931762695]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 5.0, 9.0, 15.0, 18.0, 28.0, 37.0, 71.0, 95.0, 165.0, 217.0, 344.0, 524.0, 733.0, 1157.0, 1699.0, 2614.0, 3939.0, 5976.0, 9204.0, 14587.0, 22455.0, 34937.0, 54133.0, 84059.0, 128716.0, 192566.0, 276622.0, 371909.0, 459375.0, 509053.0, 499611.0, 438015.0, 341931.0, 249285.0, 169977.0, 113674.0, 73487.0, 47401.0, 30724.0, 19276.0, 12560.0, 8177.0, 5100.0, 3315.0, 2196.0, 1448.0, 987.0, 668.0, 407.0, 273.0, 181.0, 109.0, 76.0, 57.0, 42.0, 29.0, 15.0, 8.0, 3.0, 1.0, 1.0], "bins": [-15.8203125, -15.338623046875, -14.85693359375, -14.375244140625, -13.8935546875, -13.411865234375, -12.93017578125, -12.448486328125, -11.966796875, -11.485107421875, -11.00341796875, -10.521728515625, -10.0400390625, -9.558349609375, -9.07666015625, -8.594970703125, -8.11328125, -7.631591796875, -7.14990234375, -6.668212890625, -6.1865234375, -5.704833984375, -5.22314453125, -4.741455078125, -4.259765625, -3.778076171875, -3.29638671875, -2.814697265625, -2.3330078125, -1.851318359375, -1.36962890625, -0.887939453125, -0.40625, 0.075439453125, 0.55712890625, 1.038818359375, 1.5205078125, 2.002197265625, 2.48388671875, 2.965576171875, 3.447265625, 3.928955078125, 4.41064453125, 4.892333984375, 5.3740234375, 5.855712890625, 6.33740234375, 6.819091796875, 7.30078125, 7.782470703125, 8.26416015625, 8.745849609375, 9.2275390625, 9.709228515625, 10.19091796875, 10.672607421875, 11.154296875, 11.635986328125, 12.11767578125, 12.599365234375, 13.0810546875, 13.562744140625, 14.04443359375, 14.526123046875, 15.0078125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 8.0, 8.0, 6.0, 8.0, 16.0, 17.0, 14.0, 24.0, 17.0, 18.0, 30.0, 29.0, 24.0, 46.0, 44.0, 39.0, 38.0, 44.0, 28.0, 44.0, 44.0, 40.0, 35.0, 41.0, 27.0, 37.0, 33.0, 39.0, 22.0, 34.0, 26.0, 18.0, 21.0, 11.0, 13.0, 10.0, 7.0, 11.0, 4.0, 3.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.046875, -20.3583984375, -19.669921875, -18.9814453125, -18.29296875, -17.6044921875, -16.916015625, -16.2275390625, -15.5390625, -14.8505859375, -14.162109375, -13.4736328125, -12.78515625, -12.0966796875, -11.408203125, -10.7197265625, -10.03125, -9.3427734375, -8.654296875, -7.9658203125, -7.27734375, -6.5888671875, -5.900390625, -5.2119140625, -4.5234375, -3.8349609375, -3.146484375, -2.4580078125, -1.76953125, -1.0810546875, -0.392578125, 0.2958984375, 0.984375, 1.6728515625, 2.361328125, 3.0498046875, 3.73828125, 4.4267578125, 5.115234375, 5.8037109375, 6.4921875, 7.1806640625, 7.869140625, 8.5576171875, 9.24609375, 9.9345703125, 10.623046875, 11.3115234375, 12.0, 12.6884765625, 13.376953125, 14.0654296875, 14.75390625, 15.4423828125, 16.130859375, 16.8193359375, 17.5078125, 18.1962890625, 18.884765625, 19.5732421875, 20.26171875, 20.9501953125, 21.638671875, 22.3271484375, 23.015625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 10.0, 18.0, 24.0, 44.0, 61.0, 99.0, 169.0, 265.0, 425.0, 703.0, 1219.0, 2021.0, 3275.0, 5557.0, 9196.0, 15272.0, 25905.0, 42696.0, 68875.0, 110974.0, 171648.0, 254881.0, 352463.0, 453136.0, 518332.0, 524795.0, 470715.0, 376972.0, 275848.0, 189614.0, 123356.0, 76990.0, 47241.0, 28371.0, 17201.0, 10370.0, 6153.0, 3697.0, 2249.0, 1338.0, 852.0, 445.0, 322.0, 204.0, 102.0, 78.0, 41.0, 30.0, 14.0, 11.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.078125, -16.510986328125, -15.94384765625, -15.376708984375, -14.8095703125, -14.242431640625, -13.67529296875, -13.108154296875, -12.541015625, -11.973876953125, -11.40673828125, -10.839599609375, -10.2724609375, -9.705322265625, -9.13818359375, -8.571044921875, -8.00390625, -7.436767578125, -6.86962890625, -6.302490234375, -5.7353515625, -5.168212890625, -4.60107421875, -4.033935546875, -3.466796875, -2.899658203125, -2.33251953125, -1.765380859375, -1.1982421875, -0.631103515625, -0.06396484375, 0.503173828125, 1.0703125, 1.637451171875, 2.20458984375, 2.771728515625, 3.3388671875, 3.906005859375, 4.47314453125, 5.040283203125, 5.607421875, 6.174560546875, 6.74169921875, 7.308837890625, 7.8759765625, 8.443115234375, 9.01025390625, 9.577392578125, 10.14453125, 10.711669921875, 11.27880859375, 11.845947265625, 12.4130859375, 12.980224609375, 13.54736328125, 14.114501953125, 14.681640625, 15.248779296875, 15.81591796875, 16.383056640625, 16.9501953125, 17.517333984375, 18.08447265625, 18.651611328125, 19.21875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 8.0, 8.0, 11.0, 15.0, 12.0, 25.0, 31.0, 38.0, 41.0, 47.0, 70.0, 82.0, 122.0, 116.0, 131.0, 168.0, 171.0, 180.0, 206.0, 230.0, 222.0, 228.0, 232.0, 202.0, 221.0, 212.0, 160.0, 136.0, 141.0, 123.0, 96.0, 86.0, 61.0, 56.0, 36.0, 44.0, 24.0, 16.0, 21.0, 12.0, 10.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.265625, -10.949462890625, -10.63330078125, -10.317138671875, -10.0009765625, -9.684814453125, -9.36865234375, -9.052490234375, -8.736328125, -8.420166015625, -8.10400390625, -7.787841796875, -7.4716796875, -7.155517578125, -6.83935546875, -6.523193359375, -6.20703125, -5.890869140625, -5.57470703125, -5.258544921875, -4.9423828125, -4.626220703125, -4.31005859375, -3.993896484375, -3.677734375, -3.361572265625, -3.04541015625, -2.729248046875, -2.4130859375, -2.096923828125, -1.78076171875, -1.464599609375, -1.1484375, -0.832275390625, -0.51611328125, -0.199951171875, 0.1162109375, 0.432373046875, 0.74853515625, 1.064697265625, 1.380859375, 1.697021484375, 2.01318359375, 2.329345703125, 2.6455078125, 2.961669921875, 3.27783203125, 3.593994140625, 3.91015625, 4.226318359375, 4.54248046875, 4.858642578125, 5.1748046875, 5.490966796875, 5.80712890625, 6.123291015625, 6.439453125, 6.755615234375, 7.07177734375, 7.387939453125, 7.7041015625, 8.020263671875, 8.33642578125, 8.652587890625, 8.96875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 8.0, 6.0, 8.0, 9.0, 20.0, 18.0, 19.0, 25.0, 29.0, 42.0, 33.0, 44.0, 48.0, 57.0, 63.0, 44.0, 57.0, 75.0, 59.0, 38.0, 51.0, 48.0, 42.0, 36.0, 23.0, 26.0, 22.0, 12.0, 18.0, 6.0, 7.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.37006950378418, -26.518503189086914, -25.66693687438965, -24.815372467041016, -23.96380615234375, -23.112239837646484, -22.26067352294922, -21.409107208251953, -20.557540893554688, -19.705974578857422, -18.854408264160156, -18.00284194946289, -17.151277542114258, -16.299711227416992, -15.448144912719727, -14.596578598022461, -13.745014190673828, -12.893447875976562, -12.041882514953613, -11.190316200256348, -10.338750839233398, -9.487184524536133, -8.635618209838867, -7.78405237197876, -6.932486534118652, -6.080920696258545, -5.2293548583984375, -4.377788543701172, -3.5262227058410645, -2.674656867980957, -1.8230905532836914, -0.971524715423584, -0.11995697021484375, 0.7316089868545532, 1.5831749439239502, 2.4347410202026367, 3.286306858062744, 4.137872695922852, 4.989439010620117, 5.841004848480225, 6.692570686340332, 7.5441365242004395, 8.395702362060547, 9.247268676757812, 10.098834991455078, 10.950400352478027, 11.801966667175293, 12.653532028198242, 13.505098342895508, 14.356664657592773, 15.208230018615723, 16.059795379638672, 16.911361694335938, 17.762928009033203, 18.61449432373047, 19.466060638427734, 20.317626953125, 21.169193267822266, 22.02075958251953, 22.872325897216797, 23.72389030456543, 24.575456619262695, 25.42702293395996, 26.278589248657227, 27.13015365600586]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 2.0, 10.0, 7.0, 10.0, 15.0, 12.0, 20.0, 24.0, 17.0, 23.0, 24.0, 35.0, 44.0, 39.0, 36.0, 49.0, 39.0, 49.0, 36.0, 51.0, 37.0, 45.0, 31.0, 33.0, 46.0, 30.0, 35.0, 35.0, 30.0, 17.0, 26.0, 21.0, 13.0, 9.0, 9.0, 7.0, 6.0, 6.0, 9.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.633066177368164, -26.737417221069336, -25.841766357421875, -24.946117401123047, -24.050466537475586, -23.154817581176758, -22.259166717529297, -21.36351776123047, -20.46786880493164, -19.572219848632812, -18.67656898498535, -17.780920028686523, -16.885269165039062, -15.989620208740234, -15.09397029876709, -14.198320388793945, -13.302669525146484, -12.40701961517334, -11.511369705200195, -10.615720748901367, -9.720069885253906, -8.824420928955078, -7.928771018981934, -7.033121109008789, -6.1374711990356445, -5.2418212890625, -4.3461713790893555, -3.450521945953369, -2.5548720359802246, -1.65922212600708, -0.7635726928710938, 0.13207721710205078, 1.0277271270751953, 1.9233769178390503, 2.8190267086029053, 3.7146763801574707, 4.610326290130615, 5.50597620010376, 6.401625633239746, 7.297275543212891, 8.192925453186035, 9.08857536315918, 9.984225273132324, 10.879875183105469, 11.775524139404297, 12.671175003051758, 13.566823959350586, 14.46247386932373, 15.358123779296875, 16.253772735595703, 17.149423599243164, 18.045072555541992, 18.940723419189453, 19.83637237548828, 20.73202133178711, 21.62767219543457, 22.52332305908203, 23.41897201538086, 24.31462287902832, 25.21027183532715, 26.10592269897461, 27.001571655273438, 27.897220611572266, 28.792871475219727, 29.688520431518555]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 7.0, 7.0, 10.0, 16.0, 25.0, 38.0, 54.0, 91.0, 134.0, 222.0, 311.0, 523.0, 893.0, 1448.0, 2490.0, 4140.0, 7341.0, 13552.0, 24793.0, 45578.0, 81096.0, 129538.0, 175944.0, 185125.0, 149756.0, 98136.0, 57032.0, 31259.0, 16916.0, 9204.0, 5197.0, 3033.0, 1754.0, 1122.0, 635.0, 407.0, 295.0, 141.0, 89.0, 61.0, 53.0, 36.0, 23.0, 15.0, 11.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.1669921875, -8.841796875, -8.5166015625, -8.19140625, -7.8662109375, -7.541015625, -7.2158203125, -6.890625, -6.5654296875, -6.240234375, -5.9150390625, -5.58984375, -5.2646484375, -4.939453125, -4.6142578125, -4.2890625, -3.9638671875, -3.638671875, -3.3134765625, -2.98828125, -2.6630859375, -2.337890625, -2.0126953125, -1.6875, -1.3623046875, -1.037109375, -0.7119140625, -0.38671875, -0.0615234375, 0.263671875, 0.5888671875, 0.9140625, 1.2392578125, 1.564453125, 1.8896484375, 2.21484375, 2.5400390625, 2.865234375, 3.1904296875, 3.515625, 3.8408203125, 4.166015625, 4.4912109375, 4.81640625, 5.1416015625, 5.466796875, 5.7919921875, 6.1171875, 6.4423828125, 6.767578125, 7.0927734375, 7.41796875, 7.7431640625, 8.068359375, 8.3935546875, 8.71875, 9.0439453125, 9.369140625, 9.6943359375, 10.01953125, 10.3447265625, 10.669921875, 10.9951171875, 11.3203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 5.0, 2.0, 7.0, 9.0, 9.0, 9.0, 12.0, 13.0, 14.0, 21.0, 23.0, 28.0, 33.0, 35.0, 40.0, 40.0, 45.0, 40.0, 36.0, 50.0, 47.0, 43.0, 46.0, 41.0, 43.0, 54.0, 37.0, 31.0, 38.0, 25.0, 18.0, 24.0, 22.0, 17.0, 9.0, 5.0, 9.0, 8.0, 5.0, 4.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.203125, -29.242919921875, -28.28271484375, -27.322509765625, -26.3623046875, -25.402099609375, -24.44189453125, -23.481689453125, -22.521484375, -21.561279296875, -20.60107421875, -19.640869140625, -18.6806640625, -17.720458984375, -16.76025390625, -15.800048828125, -14.83984375, -13.879638671875, -12.91943359375, -11.959228515625, -10.9990234375, -10.038818359375, -9.07861328125, -8.118408203125, -7.158203125, -6.197998046875, -5.23779296875, -4.277587890625, -3.3173828125, -2.357177734375, -1.39697265625, -0.436767578125, 0.5234375, 1.483642578125, 2.44384765625, 3.404052734375, 4.3642578125, 5.324462890625, 6.28466796875, 7.244873046875, 8.205078125, 9.165283203125, 10.12548828125, 11.085693359375, 12.0458984375, 13.006103515625, 13.96630859375, 14.926513671875, 15.88671875, 16.846923828125, 17.80712890625, 18.767333984375, 19.7275390625, 20.687744140625, 21.64794921875, 22.608154296875, 23.568359375, 24.528564453125, 25.48876953125, 26.448974609375, 27.4091796875, 28.369384765625, 29.32958984375, 30.289794921875, 31.25]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 9.0, 9.0, 11.0, 20.0, 14.0, 21.0, 44.0, 59.0, 97.0, 120.0, 187.0, 266.0, 464.0, 782.0, 1297.0, 2332.0, 4314.0, 8182.0, 16938.0, 34467.0, 70952.0, 134677.0, 211436.0, 227438.0, 160098.0, 86996.0, 43723.0, 20868.0, 10523.0, 5397.0, 2874.0, 1541.0, 919.0, 498.0, 370.0, 204.0, 129.0, 90.0, 66.0, 40.0, 34.0, 27.0, 10.0, 6.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3828125, -11.9581298828125, -11.533447265625, -11.1087646484375, -10.68408203125, -10.2593994140625, -9.834716796875, -9.4100341796875, -8.9853515625, -8.5606689453125, -8.135986328125, -7.7113037109375, -7.28662109375, -6.8619384765625, -6.437255859375, -6.0125732421875, -5.587890625, -5.1632080078125, -4.738525390625, -4.3138427734375, -3.88916015625, -3.4644775390625, -3.039794921875, -2.6151123046875, -2.1904296875, -1.7657470703125, -1.341064453125, -0.9163818359375, -0.49169921875, -0.0670166015625, 0.357666015625, 0.7823486328125, 1.20703125, 1.6317138671875, 2.056396484375, 2.4810791015625, 2.90576171875, 3.3304443359375, 3.755126953125, 4.1798095703125, 4.6044921875, 5.0291748046875, 5.453857421875, 5.8785400390625, 6.30322265625, 6.7279052734375, 7.152587890625, 7.5772705078125, 8.001953125, 8.4266357421875, 8.851318359375, 9.2760009765625, 9.70068359375, 10.1253662109375, 10.550048828125, 10.9747314453125, 11.3994140625, 11.8240966796875, 12.248779296875, 12.6734619140625, 13.09814453125, 13.5228271484375, 13.947509765625, 14.3721923828125, 14.796875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 2.0, 10.0, 7.0, 12.0, 11.0, 6.0, 12.0, 20.0, 14.0, 14.0, 26.0, 22.0, 24.0, 32.0, 37.0, 27.0, 35.0, 29.0, 38.0, 30.0, 32.0, 38.0, 35.0, 49.0, 29.0, 38.0, 27.0, 34.0, 28.0, 32.0, 23.0, 17.0, 17.0, 22.0, 23.0, 19.0, 22.0, 16.0, 13.0, 10.0, 8.0, 11.0, 13.0, 9.0, 7.0, 4.0, 2.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-14.4453125, -13.98779296875, -13.5302734375, -13.07275390625, -12.615234375, -12.15771484375, -11.7001953125, -11.24267578125, -10.78515625, -10.32763671875, -9.8701171875, -9.41259765625, -8.955078125, -8.49755859375, -8.0400390625, -7.58251953125, -7.125, -6.66748046875, -6.2099609375, -5.75244140625, -5.294921875, -4.83740234375, -4.3798828125, -3.92236328125, -3.46484375, -3.00732421875, -2.5498046875, -2.09228515625, -1.634765625, -1.17724609375, -0.7197265625, -0.26220703125, 0.1953125, 0.65283203125, 1.1103515625, 1.56787109375, 2.025390625, 2.48291015625, 2.9404296875, 3.39794921875, 3.85546875, 4.31298828125, 4.7705078125, 5.22802734375, 5.685546875, 6.14306640625, 6.6005859375, 7.05810546875, 7.515625, 7.97314453125, 8.4306640625, 8.88818359375, 9.345703125, 9.80322265625, 10.2607421875, 10.71826171875, 11.17578125, 11.63330078125, 12.0908203125, 12.54833984375, 13.005859375, 13.46337890625, 13.9208984375, 14.37841796875, 14.8359375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 11.0, 6.0, 12.0, 12.0, 39.0, 41.0, 75.0, 114.0, 160.0, 248.0, 414.0, 610.0, 1119.0, 2096.0, 4241.0, 9490.0, 23514.0, 65261.0, 180533.0, 345773.0, 255161.0, 98798.0, 35099.0, 13480.0, 5876.0, 2738.0, 1431.0, 813.0, 475.0, 302.0, 196.0, 139.0, 83.0, 47.0, 47.0, 38.0, 18.0, 13.0, 11.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.36328125, -7.09747314453125, -6.8316650390625, -6.56585693359375, -6.300048828125, -6.03424072265625, -5.7684326171875, -5.50262451171875, -5.23681640625, -4.97100830078125, -4.7052001953125, -4.43939208984375, -4.173583984375, -3.90777587890625, -3.6419677734375, -3.37615966796875, -3.1103515625, -2.84454345703125, -2.5787353515625, -2.31292724609375, -2.047119140625, -1.78131103515625, -1.5155029296875, -1.24969482421875, -0.98388671875, -0.71807861328125, -0.4522705078125, -0.18646240234375, 0.079345703125, 0.34515380859375, 0.6109619140625, 0.87677001953125, 1.142578125, 1.40838623046875, 1.6741943359375, 1.94000244140625, 2.205810546875, 2.47161865234375, 2.7374267578125, 3.00323486328125, 3.26904296875, 3.53485107421875, 3.8006591796875, 4.06646728515625, 4.332275390625, 4.59808349609375, 4.8638916015625, 5.12969970703125, 5.3955078125, 5.66131591796875, 5.9271240234375, 6.19293212890625, 6.458740234375, 6.72454833984375, 6.9903564453125, 7.25616455078125, 7.52197265625, 7.78778076171875, 8.0535888671875, 8.31939697265625, 8.585205078125, 8.85101318359375, 9.1168212890625, 9.38262939453125, 9.6484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 6.0, 5.0, 23.0, 27.0, 56.0, 51.0, 79.0, 97.0, 133.0, 117.0, 110.0, 86.0, 68.0, 48.0, 35.0, 25.0, 12.0, 9.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005540847778320312, -0.0005336850881576538, -0.0005132853984832764, -0.0004928857088088989, -0.0004724860191345215, -0.00045208632946014404, -0.0004316866397857666, -0.00041128695011138916, -0.0003908872604370117, -0.0003704875707626343, -0.00035008788108825684, -0.0003296881914138794, -0.00030928850173950195, -0.0002888888120651245, -0.00026848912239074707, -0.00024808943271636963, -0.0002276897430419922, -0.00020729005336761475, -0.0001868903636932373, -0.00016649067401885986, -0.00014609098434448242, -0.00012569129467010498, -0.00010529160499572754, -8.48919153213501e-05, -6.449222564697266e-05, -4.4092535972595215e-05, -2.3692846298217773e-05, -3.293156623840332e-06, 1.710653305053711e-05, 3.750622272491455e-05, 5.790591239929199e-05, 7.830560207366943e-05, 9.870529174804688e-05, 0.00011910498142242432, 0.00013950467109680176, 0.0001599043607711792, 0.00018030405044555664, 0.00020070374011993408, 0.00022110342979431152, 0.00024150311946868896, 0.0002619028091430664, 0.00028230249881744385, 0.0003027021884918213, 0.00032310187816619873, 0.00034350156784057617, 0.0003639012575149536, 0.00038430094718933105, 0.0004047006368637085, 0.00042510032653808594, 0.0004455000162124634, 0.0004658997058868408, 0.00048629939556121826, 0.0005066990852355957, 0.0005270987749099731, 0.0005474984645843506, 0.000567898154258728, 0.0005882978439331055, 0.0006086975336074829, 0.0006290972232818604, 0.0006494969129562378, 0.0006698966026306152, 0.0006902962923049927, 0.0007106959819793701, 0.0007310956716537476, 0.000751495361328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 5.0, 2.0, 6.0, 9.0, 13.0, 17.0, 27.0, 24.0, 56.0, 79.0, 102.0, 152.0, 236.0, 341.0, 502.0, 712.0, 1120.0, 1767.0, 2736.0, 4410.0, 7496.0, 13014.0, 22576.0, 40265.0, 68789.0, 110885.0, 155887.0, 177900.0, 157872.0, 113513.0, 70501.0, 40869.0, 23352.0, 13168.0, 7556.0, 4597.0, 2887.0, 1656.0, 1143.0, 734.0, 479.0, 328.0, 214.0, 187.0, 127.0, 81.0, 60.0, 34.0, 30.0, 18.0, 11.0, 9.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.14453125, -4.9813232421875, -4.818115234375, -4.6549072265625, -4.49169921875, -4.3284912109375, -4.165283203125, -4.0020751953125, -3.8388671875, -3.6756591796875, -3.512451171875, -3.3492431640625, -3.18603515625, -3.0228271484375, -2.859619140625, -2.6964111328125, -2.533203125, -2.3699951171875, -2.206787109375, -2.0435791015625, -1.88037109375, -1.7171630859375, -1.553955078125, -1.3907470703125, -1.2275390625, -1.0643310546875, -0.901123046875, -0.7379150390625, -0.57470703125, -0.4114990234375, -0.248291015625, -0.0850830078125, 0.078125, 0.2413330078125, 0.404541015625, 0.5677490234375, 0.73095703125, 0.8941650390625, 1.057373046875, 1.2205810546875, 1.3837890625, 1.5469970703125, 1.710205078125, 1.8734130859375, 2.03662109375, 2.1998291015625, 2.363037109375, 2.5262451171875, 2.689453125, 2.8526611328125, 3.015869140625, 3.1790771484375, 3.34228515625, 3.5054931640625, 3.668701171875, 3.8319091796875, 3.9951171875, 4.1583251953125, 4.321533203125, 4.4847412109375, 4.64794921875, 4.8111572265625, 4.974365234375, 5.1375732421875, 5.30078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 2.0, 8.0, 10.0, 10.0, 22.0, 30.0, 40.0, 55.0, 51.0, 51.0, 50.0, 57.0, 82.0, 58.0, 76.0, 87.0, 44.0, 59.0, 39.0, 42.0, 26.0, 27.0, 20.0, 11.0, 9.0, 8.0, 4.0, 7.0, 3.0, 1.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.958984375, -2.874847412109375, -2.79071044921875, -2.706573486328125, -2.6224365234375, -2.538299560546875, -2.45416259765625, -2.370025634765625, -2.285888671875, -2.201751708984375, -2.11761474609375, -2.033477783203125, -1.9493408203125, -1.865203857421875, -1.78106689453125, -1.696929931640625, -1.61279296875, -1.528656005859375, -1.44451904296875, -1.360382080078125, -1.2762451171875, -1.192108154296875, -1.10797119140625, -1.023834228515625, -0.939697265625, -0.855560302734375, -0.77142333984375, -0.687286376953125, -0.6031494140625, -0.519012451171875, -0.43487548828125, -0.350738525390625, -0.2666015625, -0.182464599609375, -0.09832763671875, -0.014190673828125, 0.0699462890625, 0.154083251953125, 0.23822021484375, 0.322357177734375, 0.406494140625, 0.490631103515625, 0.57476806640625, 0.658905029296875, 0.7430419921875, 0.827178955078125, 0.91131591796875, 0.995452880859375, 1.07958984375, 1.163726806640625, 1.24786376953125, 1.332000732421875, 1.4161376953125, 1.500274658203125, 1.58441162109375, 1.668548583984375, 1.752685546875, 1.836822509765625, 1.92095947265625, 2.005096435546875, 2.0892333984375, 2.173370361328125, 2.25750732421875, 2.341644287109375, 2.42578125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 4.0, 12.0, 12.0, 13.0, 18.0, 20.0, 22.0, 24.0, 40.0, 41.0, 40.0, 43.0, 48.0, 66.0, 51.0, 60.0, 60.0, 66.0, 48.0, 45.0, 44.0, 50.0, 31.0, 24.0, 24.0, 23.0, 16.0, 15.0, 12.0, 6.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.589956283569336, -26.762981414794922, -25.936006546020508, -25.109031677246094, -24.28205680847168, -23.455081939697266, -22.62810707092285, -21.801132202148438, -20.974157333374023, -20.14718246459961, -19.320207595825195, -18.49323272705078, -17.666257858276367, -16.839282989501953, -16.01230812072754, -15.185333251953125, -14.358358383178711, -13.531383514404297, -12.704408645629883, -11.877433776855469, -11.050458908081055, -10.22348403930664, -9.396509170532227, -8.569534301757812, -7.742559432983398, -6.915584564208984, -6.08860969543457, -5.261634826660156, -4.434659957885742, -3.607685089111328, -2.780710220336914, -1.9537353515625, -1.1267585754394531, -0.29978370666503906, 0.527191162109375, 1.354166030883789, 2.181140899658203, 3.008115768432617, 3.8350906372070312, 4.662065505981445, 5.489040374755859, 6.316015243530273, 7.1429901123046875, 7.969964981079102, 8.796939849853516, 9.62391471862793, 10.450889587402344, 11.277864456176758, 12.104839324951172, 12.931814193725586, 13.7587890625, 14.585763931274414, 15.412738800048828, 16.239713668823242, 17.066688537597656, 17.89366340637207, 18.720638275146484, 19.5476131439209, 20.374588012695312, 21.201562881469727, 22.02853775024414, 22.855512619018555, 23.68248748779297, 24.509462356567383, 25.336437225341797]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 6.0, 6.0, 10.0, 8.0, 14.0, 16.0, 21.0, 21.0, 22.0, 19.0, 34.0, 28.0, 43.0, 42.0, 45.0, 43.0, 43.0, 40.0, 47.0, 35.0, 47.0, 45.0, 32.0, 31.0, 42.0, 30.0, 39.0, 30.0, 24.0, 29.0, 19.0, 22.0, 8.0, 11.0, 9.0, 7.0, 6.0, 4.0, 10.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.389484405517578, -26.497068405151367, -25.604652404785156, -24.712234497070312, -23.8198184967041, -22.92740249633789, -22.03498649597168, -21.14257049560547, -20.250152587890625, -19.357736587524414, -18.465320587158203, -17.57290267944336, -16.68048667907715, -15.788070678710938, -14.895654678344727, -14.003238677978516, -13.110822677612305, -12.218406677246094, -11.325989723205566, -10.433573722839355, -9.541156768798828, -8.648740768432617, -7.756324768066406, -6.863908290863037, -5.971491813659668, -5.079075336456299, -4.18665885925293, -3.2942428588867188, -2.4018263816833496, -1.5094099044799805, -0.6169939041137695, 0.2754225730895996, 1.167837142944336, 2.060253620147705, 2.952669858932495, 3.845086097717285, 4.737502574920654, 5.629919052124023, 6.522335052490234, 7.4147515296936035, 8.307168006896973, 9.199584007263184, 10.092000961303711, 10.984416961669922, 11.876832962036133, 12.76924991607666, 13.661665916442871, 14.554082870483398, 15.44649887084961, 16.33891487121582, 17.23133087158203, 18.123748779296875, 19.016164779663086, 19.908580780029297, 20.800996780395508, 21.69341278076172, 22.585830688476562, 23.478246688842773, 24.370662689208984, 25.263080596923828, 26.15549659729004, 27.04791259765625, 27.94032859802246, 28.832744598388672, 29.725160598754883]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 18.0, 15.0, 35.0, 50.0, 91.0, 145.0, 211.0, 298.0, 467.0, 754.0, 1206.0, 1795.0, 2944.0, 4648.0, 7411.0, 11607.0, 18106.0, 27342.0, 39803.0, 56225.0, 75072.0, 93928.0, 108251.0, 114222.0, 110976.0, 98767.0, 80435.0, 62008.0, 44558.0, 30204.0, 20233.0, 13252.0, 8549.0, 5500.0, 3399.0, 2204.0, 1389.0, 904.0, 555.0, 367.0, 209.0, 149.0, 106.0, 44.0, 43.0, 19.0, 19.0, 6.0, 7.0, 6.0, 2.0, 2.0, 0.0, 2.0], "bins": [-14.171875, -13.750732421875, -13.32958984375, -12.908447265625, -12.4873046875, -12.066162109375, -11.64501953125, -11.223876953125, -10.802734375, -10.381591796875, -9.96044921875, -9.539306640625, -9.1181640625, -8.697021484375, -8.27587890625, -7.854736328125, -7.43359375, -7.012451171875, -6.59130859375, -6.170166015625, -5.7490234375, -5.327880859375, -4.90673828125, -4.485595703125, -4.064453125, -3.643310546875, -3.22216796875, -2.801025390625, -2.3798828125, -1.958740234375, -1.53759765625, -1.116455078125, -0.6953125, -0.274169921875, 0.14697265625, 0.568115234375, 0.9892578125, 1.410400390625, 1.83154296875, 2.252685546875, 2.673828125, 3.094970703125, 3.51611328125, 3.937255859375, 4.3583984375, 4.779541015625, 5.20068359375, 5.621826171875, 6.04296875, 6.464111328125, 6.88525390625, 7.306396484375, 7.7275390625, 8.148681640625, 8.56982421875, 8.990966796875, 9.412109375, 9.833251953125, 10.25439453125, 10.675537109375, 11.0966796875, 11.517822265625, 11.93896484375, 12.360107421875, 12.78125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 7.0, 8.0, 10.0, 12.0, 9.0, 23.0, 20.0, 19.0, 14.0, 25.0, 29.0, 38.0, 43.0, 43.0, 41.0, 32.0, 42.0, 40.0, 45.0, 34.0, 32.0, 38.0, 29.0, 39.0, 37.0, 29.0, 41.0, 25.0, 37.0, 23.0, 22.0, 18.0, 16.0, 16.0, 7.0, 8.0, 10.0, 7.0, 5.0, 4.0, 7.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-28.46875, -27.6279296875, -26.787109375, -25.9462890625, -25.10546875, -24.2646484375, -23.423828125, -22.5830078125, -21.7421875, -20.9013671875, -20.060546875, -19.2197265625, -18.37890625, -17.5380859375, -16.697265625, -15.8564453125, -15.015625, -14.1748046875, -13.333984375, -12.4931640625, -11.65234375, -10.8115234375, -9.970703125, -9.1298828125, -8.2890625, -7.4482421875, -6.607421875, -5.7666015625, -4.92578125, -4.0849609375, -3.244140625, -2.4033203125, -1.5625, -0.7216796875, 0.119140625, 0.9599609375, 1.80078125, 2.6416015625, 3.482421875, 4.3232421875, 5.1640625, 6.0048828125, 6.845703125, 7.6865234375, 8.52734375, 9.3681640625, 10.208984375, 11.0498046875, 11.890625, 12.7314453125, 13.572265625, 14.4130859375, 15.25390625, 16.0947265625, 16.935546875, 17.7763671875, 18.6171875, 19.4580078125, 20.298828125, 21.1396484375, 21.98046875, 22.8212890625, 23.662109375, 24.5029296875, 25.34375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 8.0, 12.0, 15.0, 30.0, 41.0, 87.0, 148.0, 248.0, 398.0, 666.0, 1114.0, 1877.0, 3122.0, 5228.0, 8603.0, 14106.0, 22449.0, 35812.0, 52911.0, 75404.0, 98076.0, 118563.0, 127004.0, 122036.0, 106114.0, 83835.0, 60379.0, 41133.0, 26722.0, 16744.0, 10234.0, 6217.0, 3681.0, 2201.0, 1385.0, 790.0, 452.0, 289.0, 158.0, 90.0, 79.0, 44.0, 23.0, 15.0, 6.0, 6.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.4140625, -13.9283447265625, -13.442626953125, -12.9569091796875, -12.47119140625, -11.9854736328125, -11.499755859375, -11.0140380859375, -10.5283203125, -10.0426025390625, -9.556884765625, -9.0711669921875, -8.58544921875, -8.0997314453125, -7.614013671875, -7.1282958984375, -6.642578125, -6.1568603515625, -5.671142578125, -5.1854248046875, -4.69970703125, -4.2139892578125, -3.728271484375, -3.2425537109375, -2.7568359375, -2.2711181640625, -1.785400390625, -1.2996826171875, -0.81396484375, -0.3282470703125, 0.157470703125, 0.6431884765625, 1.12890625, 1.6146240234375, 2.100341796875, 2.5860595703125, 3.07177734375, 3.5574951171875, 4.043212890625, 4.5289306640625, 5.0146484375, 5.5003662109375, 5.986083984375, 6.4718017578125, 6.95751953125, 7.4432373046875, 7.928955078125, 8.4146728515625, 8.900390625, 9.3861083984375, 9.871826171875, 10.3575439453125, 10.84326171875, 11.3289794921875, 11.814697265625, 12.3004150390625, 12.7861328125, 13.2718505859375, 13.757568359375, 14.2432861328125, 14.72900390625, 15.2147216796875, 15.700439453125, 16.1861572265625, 16.671875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 8.0, 8.0, 5.0, 9.0, 11.0, 17.0, 14.0, 18.0, 22.0, 28.0, 21.0, 35.0, 43.0, 32.0, 31.0, 37.0, 28.0, 42.0, 48.0, 40.0, 31.0, 47.0, 37.0, 41.0, 38.0, 41.0, 33.0, 23.0, 28.0, 20.0, 34.0, 25.0, 18.0, 15.0, 17.0, 8.0, 12.0, 10.0, 3.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-17.90625, -17.364501953125, -16.82275390625, -16.281005859375, -15.7392578125, -15.197509765625, -14.65576171875, -14.114013671875, -13.572265625, -13.030517578125, -12.48876953125, -11.947021484375, -11.4052734375, -10.863525390625, -10.32177734375, -9.780029296875, -9.23828125, -8.696533203125, -8.15478515625, -7.613037109375, -7.0712890625, -6.529541015625, -5.98779296875, -5.446044921875, -4.904296875, -4.362548828125, -3.82080078125, -3.279052734375, -2.7373046875, -2.195556640625, -1.65380859375, -1.112060546875, -0.5703125, -0.028564453125, 0.51318359375, 1.054931640625, 1.5966796875, 2.138427734375, 2.68017578125, 3.221923828125, 3.763671875, 4.305419921875, 4.84716796875, 5.388916015625, 5.9306640625, 6.472412109375, 7.01416015625, 7.555908203125, 8.09765625, 8.639404296875, 9.18115234375, 9.722900390625, 10.2646484375, 10.806396484375, 11.34814453125, 11.889892578125, 12.431640625, 12.973388671875, 13.51513671875, 14.056884765625, 14.5986328125, 15.140380859375, 15.68212890625, 16.223876953125, 16.765625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 8.0, 11.0, 19.0, 31.0, 50.0, 72.0, 122.0, 193.0, 297.0, 459.0, 765.0, 1280.0, 2060.0, 3409.0, 6001.0, 10317.0, 16993.0, 29336.0, 48318.0, 75482.0, 109108.0, 138282.0, 150624.0, 140251.0, 111744.0, 78081.0, 50517.0, 30600.0, 18101.0, 10592.0, 6255.0, 3685.0, 2152.0, 1284.0, 751.0, 485.0, 299.0, 197.0, 123.0, 71.0, 48.0, 22.0, 18.0, 18.0, 12.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-7.94921875, -7.69720458984375, -7.4451904296875, -7.19317626953125, -6.941162109375, -6.68914794921875, -6.4371337890625, -6.18511962890625, -5.93310546875, -5.68109130859375, -5.4290771484375, -5.17706298828125, -4.925048828125, -4.67303466796875, -4.4210205078125, -4.16900634765625, -3.9169921875, -3.66497802734375, -3.4129638671875, -3.16094970703125, -2.908935546875, -2.65692138671875, -2.4049072265625, -2.15289306640625, -1.90087890625, -1.64886474609375, -1.3968505859375, -1.14483642578125, -0.892822265625, -0.64080810546875, -0.3887939453125, -0.13677978515625, 0.115234375, 0.36724853515625, 0.6192626953125, 0.87127685546875, 1.123291015625, 1.37530517578125, 1.6273193359375, 1.87933349609375, 2.13134765625, 2.38336181640625, 2.6353759765625, 2.88739013671875, 3.139404296875, 3.39141845703125, 3.6434326171875, 3.89544677734375, 4.1474609375, 4.39947509765625, 4.6514892578125, 4.90350341796875, 5.155517578125, 5.40753173828125, 5.6595458984375, 5.91156005859375, 6.16357421875, 6.41558837890625, 6.6676025390625, 6.91961669921875, 7.171630859375, 7.42364501953125, 7.6756591796875, 7.92767333984375, 8.1796875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 4.0, 4.0, 7.0, 7.0, 8.0, 10.0, 9.0, 17.0, 17.0, 22.0, 30.0, 44.0, 37.0, 33.0, 41.0, 38.0, 54.0, 54.0, 54.0, 60.0, 51.0, 50.0, 43.0, 36.0, 38.0, 29.0, 42.0, 36.0, 21.0, 25.0, 17.0, 15.0, 11.0, 8.0, 7.0, 7.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006213188171386719, -0.0005975440144538879, -0.000573769211769104, -0.0005499944090843201, -0.0005262196063995361, -0.0005024448037147522, -0.00047867000102996826, -0.0004548951983451843, -0.0004311203956604004, -0.00040734559297561646, -0.0003835707902908325, -0.0003597959876060486, -0.00033602118492126465, -0.0003122463822364807, -0.0002884715795516968, -0.00026469677686691284, -0.0002409219741821289, -0.00021714717149734497, -0.00019337236881256104, -0.0001695975661277771, -0.00014582276344299316, -0.00012204796075820923, -9.827315807342529e-05, -7.449835538864136e-05, -5.072355270385742e-05, -2.6948750019073486e-05, -3.1739473342895508e-06, 2.0600855350494385e-05, 4.437565803527832e-05, 6.815046072006226e-05, 9.192526340484619e-05, 0.00011570006608963013, 0.00013947486877441406, 0.000163249671459198, 0.00018702447414398193, 0.00021079927682876587, 0.0002345740795135498, 0.00025834888219833374, 0.0002821236848831177, 0.0003058984875679016, 0.00032967329025268555, 0.0003534480929374695, 0.0003772228956222534, 0.00040099769830703735, 0.0004247725009918213, 0.0004485473036766052, 0.00047232210636138916, 0.0004960969090461731, 0.000519871711730957, 0.000543646514415741, 0.0005674213171005249, 0.0005911961197853088, 0.0006149709224700928, 0.0006387457251548767, 0.0006625205278396606, 0.0006862953305244446, 0.0007100701332092285, 0.0007338449358940125, 0.0007576197385787964, 0.0007813945412635803, 0.0008051693439483643, 0.0008289441466331482, 0.0008527189493179321, 0.0008764937520027161, 0.0009002685546875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 6.0, 7.0, 7.0, 20.0, 27.0, 32.0, 77.0, 92.0, 174.0, 312.0, 481.0, 873.0, 1470.0, 2512.0, 4097.0, 7118.0, 12032.0, 20158.0, 32855.0, 52319.0, 77329.0, 106317.0, 130790.0, 140676.0, 132279.0, 108470.0, 79052.0, 53330.0, 34188.0, 21103.0, 12685.0, 7328.0, 4177.0, 2526.0, 1499.0, 841.0, 493.0, 315.0, 196.0, 102.0, 77.0, 49.0, 31.0, 17.0, 3.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.860107421875, -7.61083984375, -7.361572265625, -7.1123046875, -6.863037109375, -6.61376953125, -6.364501953125, -6.115234375, -5.865966796875, -5.61669921875, -5.367431640625, -5.1181640625, -4.868896484375, -4.61962890625, -4.370361328125, -4.12109375, -3.871826171875, -3.62255859375, -3.373291015625, -3.1240234375, -2.874755859375, -2.62548828125, -2.376220703125, -2.126953125, -1.877685546875, -1.62841796875, -1.379150390625, -1.1298828125, -0.880615234375, -0.63134765625, -0.382080078125, -0.1328125, 0.116455078125, 0.36572265625, 0.614990234375, 0.8642578125, 1.113525390625, 1.36279296875, 1.612060546875, 1.861328125, 2.110595703125, 2.35986328125, 2.609130859375, 2.8583984375, 3.107666015625, 3.35693359375, 3.606201171875, 3.85546875, 4.104736328125, 4.35400390625, 4.603271484375, 4.8525390625, 5.101806640625, 5.35107421875, 5.600341796875, 5.849609375, 6.098876953125, 6.34814453125, 6.597412109375, 6.8466796875, 7.095947265625, 7.34521484375, 7.594482421875, 7.84375]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 8.0, 6.0, 4.0, 5.0, 10.0, 14.0, 12.0, 20.0, 24.0, 28.0, 38.0, 38.0, 50.0, 34.0, 63.0, 56.0, 62.0, 65.0, 55.0, 59.0, 53.0, 59.0, 44.0, 41.0, 33.0, 23.0, 25.0, 15.0, 10.0, 9.0, 8.0, 7.0, 5.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.78515625, -6.59808349609375, -6.4110107421875, -6.22393798828125, -6.036865234375, -5.84979248046875, -5.6627197265625, -5.47564697265625, -5.28857421875, -5.10150146484375, -4.9144287109375, -4.72735595703125, -4.540283203125, -4.35321044921875, -4.1661376953125, -3.97906494140625, -3.7919921875, -3.60491943359375, -3.4178466796875, -3.23077392578125, -3.043701171875, -2.85662841796875, -2.6695556640625, -2.48248291015625, -2.29541015625, -2.10833740234375, -1.9212646484375, -1.73419189453125, -1.547119140625, -1.36004638671875, -1.1729736328125, -0.98590087890625, -0.798828125, -0.61175537109375, -0.4246826171875, -0.23760986328125, -0.050537109375, 0.13653564453125, 0.3236083984375, 0.51068115234375, 0.69775390625, 0.88482666015625, 1.0718994140625, 1.25897216796875, 1.446044921875, 1.63311767578125, 1.8201904296875, 2.00726318359375, 2.1943359375, 2.38140869140625, 2.5684814453125, 2.75555419921875, 2.942626953125, 3.12969970703125, 3.3167724609375, 3.50384521484375, 3.69091796875, 3.87799072265625, 4.0650634765625, 4.25213623046875, 4.439208984375, 4.62628173828125, 4.8133544921875, 5.00042724609375, 5.1875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 6.0, 3.0, 5.0, 6.0, 8.0, 17.0, 15.0, 16.0, 25.0, 22.0, 33.0, 26.0, 39.0, 39.0, 36.0, 43.0, 47.0, 48.0, 47.0, 58.0, 50.0, 44.0, 45.0, 41.0, 51.0, 45.0, 38.0, 27.0, 30.0, 25.0, 15.0, 7.0, 14.0, 8.0, 9.0, 4.0, 2.0, 4.0, 7.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-25.082735061645508, -24.34210777282715, -23.601478576660156, -22.860851287841797, -22.120223999023438, -21.379596710205078, -20.638967514038086, -19.898340225219727, -19.157711029052734, -18.417083740234375, -17.676454544067383, -16.935827255249023, -16.195199966430664, -15.454571723937988, -14.713943481445312, -13.973316192626953, -13.232688903808594, -12.492060661315918, -11.751433372497559, -11.010805130004883, -10.270177841186523, -9.529549598693848, -8.788921356201172, -8.048294067382812, -7.307665824890137, -6.567038059234619, -5.826410293579102, -5.085782051086426, -4.345154285430908, -3.6045265197753906, -2.863898277282715, -2.1232705116271973, -1.3826427459716797, -0.6420148611068726, 0.09861302375793457, 0.8392410278320312, 1.5798687934875488, 2.3204965591430664, 3.061124801635742, 3.8017525672912598, 4.542380332946777, 5.283008098602295, 6.0236358642578125, 6.764264106750488, 7.504891872406006, 8.245519638061523, 8.9861478805542, 9.726776123046875, 10.467403411865234, 11.20803165435791, 11.94865894317627, 12.689287185668945, 13.429914474487305, 14.17054271697998, 14.911170959472656, 15.651798248291016, 16.392425537109375, 17.133052825927734, 17.873682022094727, 18.614309310913086, 19.354936599731445, 20.095565795898438, 20.836193084716797, 21.576820373535156, 22.31744956970215]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 5.0, 9.0, 14.0, 10.0, 10.0, 10.0, 22.0, 28.0, 28.0, 34.0, 29.0, 47.0, 40.0, 52.0, 49.0, 50.0, 49.0, 62.0, 43.0, 55.0, 52.0, 29.0, 39.0, 25.0, 34.0, 34.0, 34.0, 23.0, 17.0, 12.0, 11.0, 8.0, 12.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.29084587097168, -30.28542137145996, -29.279996871948242, -28.274572372436523, -27.269145965576172, -26.263721466064453, -25.258296966552734, -24.252872467041016, -23.247447967529297, -22.242023468017578, -21.23659896850586, -20.23117446899414, -19.225749969482422, -18.220325469970703, -17.21489906311035, -16.209474563598633, -15.204050064086914, -14.198625564575195, -13.193201065063477, -12.187775611877441, -11.182351112365723, -10.176926612854004, -9.171501159667969, -8.16607666015625, -7.160652160644531, -6.1552276611328125, -5.1498026847839355, -4.144377708435059, -3.13895320892334, -2.133528709411621, -1.1281037330627441, -0.12267875671386719, 0.8827438354492188, 1.8881685733795166, 2.8935933113098145, 3.8990180492401123, 4.90444278717041, 5.909867286682129, 6.915292263031006, 7.920717239379883, 8.926141738891602, 9.93156623840332, 10.936990737915039, 11.942416191101074, 12.947840690612793, 13.953265190124512, 14.958690643310547, 15.964115142822266, 16.969539642333984, 17.974964141845703, 18.980388641357422, 19.98581314086914, 20.99123764038086, 21.996662139892578, 23.00208854675293, 24.00751304626465, 25.012937545776367, 26.018362045288086, 27.023786544799805, 28.029211044311523, 29.034637451171875, 30.040061950683594, 31.045486450195312, 32.05091094970703, 33.05633544921875]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 15.0, 14.0, 13.0, 25.0, 58.0, 91.0, 147.0, 202.0, 351.0, 551.0, 937.0, 1466.0, 2518.0, 3955.0, 6564.0, 10963.0, 18473.0, 31939.0, 54351.0, 91820.0, 153668.0, 244579.0, 368679.0, 501541.0, 592878.0, 594663.0, 503892.0, 373500.0, 249029.0, 155709.0, 94419.0, 56068.0, 32989.0, 19146.0, 11726.0, 6949.0, 4114.0, 2356.0, 1480.0, 936.0, 553.0, 377.0, 227.0, 133.0, 78.0, 53.0, 28.0, 19.0, 19.0, 16.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.453125, -17.8583984375, -17.263671875, -16.6689453125, -16.07421875, -15.4794921875, -14.884765625, -14.2900390625, -13.6953125, -13.1005859375, -12.505859375, -11.9111328125, -11.31640625, -10.7216796875, -10.126953125, -9.5322265625, -8.9375, -8.3427734375, -7.748046875, -7.1533203125, -6.55859375, -5.9638671875, -5.369140625, -4.7744140625, -4.1796875, -3.5849609375, -2.990234375, -2.3955078125, -1.80078125, -1.2060546875, -0.611328125, -0.0166015625, 0.578125, 1.1728515625, 1.767578125, 2.3623046875, 2.95703125, 3.5517578125, 4.146484375, 4.7412109375, 5.3359375, 5.9306640625, 6.525390625, 7.1201171875, 7.71484375, 8.3095703125, 8.904296875, 9.4990234375, 10.09375, 10.6884765625, 11.283203125, 11.8779296875, 12.47265625, 13.0673828125, 13.662109375, 14.2568359375, 14.8515625, 15.4462890625, 16.041015625, 16.6357421875, 17.23046875, 17.8251953125, 18.419921875, 19.0146484375, 19.609375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 7.0, 6.0, 11.0, 11.0, 12.0, 15.0, 19.0, 23.0, 36.0, 29.0, 36.0, 23.0, 24.0, 49.0, 46.0, 41.0, 37.0, 54.0, 38.0, 50.0, 44.0, 43.0, 41.0, 41.0, 23.0, 41.0, 27.0, 20.0, 30.0, 30.0, 15.0, 19.0, 11.0, 9.0, 4.0, 10.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.015625, -22.27978515625, -21.5439453125, -20.80810546875, -20.072265625, -19.33642578125, -18.6005859375, -17.86474609375, -17.12890625, -16.39306640625, -15.6572265625, -14.92138671875, -14.185546875, -13.44970703125, -12.7138671875, -11.97802734375, -11.2421875, -10.50634765625, -9.7705078125, -9.03466796875, -8.298828125, -7.56298828125, -6.8271484375, -6.09130859375, -5.35546875, -4.61962890625, -3.8837890625, -3.14794921875, -2.412109375, -1.67626953125, -0.9404296875, -0.20458984375, 0.53125, 1.26708984375, 2.0029296875, 2.73876953125, 3.474609375, 4.21044921875, 4.9462890625, 5.68212890625, 6.41796875, 7.15380859375, 7.8896484375, 8.62548828125, 9.361328125, 10.09716796875, 10.8330078125, 11.56884765625, 12.3046875, 13.04052734375, 13.7763671875, 14.51220703125, 15.248046875, 15.98388671875, 16.7197265625, 17.45556640625, 18.19140625, 18.92724609375, 19.6630859375, 20.39892578125, 21.134765625, 21.87060546875, 22.6064453125, 23.34228515625, 24.078125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [3.0, 2.0, 7.0, 5.0, 7.0, 12.0, 22.0, 45.0, 80.0, 124.0, 195.0, 353.0, 557.0, 985.0, 1743.0, 3055.0, 5370.0, 9488.0, 17128.0, 30564.0, 53513.0, 92709.0, 156123.0, 247826.0, 367750.0, 489325.0, 572564.0, 583194.0, 506518.0, 386383.0, 264951.0, 168008.0, 101211.0, 58450.0, 32954.0, 18550.0, 10577.0, 5920.0, 3315.0, 1951.0, 1112.0, 664.0, 393.0, 236.0, 141.0, 96.0, 47.0, 27.0, 18.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.09375, -17.425537109375, -16.75732421875, -16.089111328125, -15.4208984375, -14.752685546875, -14.08447265625, -13.416259765625, -12.748046875, -12.079833984375, -11.41162109375, -10.743408203125, -10.0751953125, -9.406982421875, -8.73876953125, -8.070556640625, -7.40234375, -6.734130859375, -6.06591796875, -5.397705078125, -4.7294921875, -4.061279296875, -3.39306640625, -2.724853515625, -2.056640625, -1.388427734375, -0.72021484375, -0.052001953125, 0.6162109375, 1.284423828125, 1.95263671875, 2.620849609375, 3.2890625, 3.957275390625, 4.62548828125, 5.293701171875, 5.9619140625, 6.630126953125, 7.29833984375, 7.966552734375, 8.634765625, 9.302978515625, 9.97119140625, 10.639404296875, 11.3076171875, 11.975830078125, 12.64404296875, 13.312255859375, 13.98046875, 14.648681640625, 15.31689453125, 15.985107421875, 16.6533203125, 17.321533203125, 17.98974609375, 18.657958984375, 19.326171875, 19.994384765625, 20.66259765625, 21.330810546875, 21.9990234375, 22.667236328125, 23.33544921875, 24.003662109375, 24.671875]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 5.0, 5.0, 3.0, 5.0, 12.0, 11.0, 9.0, 17.0, 17.0, 31.0, 35.0, 41.0, 43.0, 86.0, 73.0, 81.0, 72.0, 117.0, 129.0, 145.0, 153.0, 155.0, 189.0, 211.0, 200.0, 214.0, 190.0, 223.0, 185.0, 218.0, 181.0, 135.0, 135.0, 122.0, 106.0, 92.0, 71.0, 63.0, 72.0, 51.0, 33.0, 33.0, 28.0, 26.0, 13.0, 16.0, 8.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.875, -9.5758056640625, -9.276611328125, -8.9774169921875, -8.67822265625, -8.3790283203125, -8.079833984375, -7.7806396484375, -7.4814453125, -7.1822509765625, -6.883056640625, -6.5838623046875, -6.28466796875, -5.9854736328125, -5.686279296875, -5.3870849609375, -5.087890625, -4.7886962890625, -4.489501953125, -4.1903076171875, -3.89111328125, -3.5919189453125, -3.292724609375, -2.9935302734375, -2.6943359375, -2.3951416015625, -2.095947265625, -1.7967529296875, -1.49755859375, -1.1983642578125, -0.899169921875, -0.5999755859375, -0.30078125, -0.0015869140625, 0.297607421875, 0.5968017578125, 0.89599609375, 1.1951904296875, 1.494384765625, 1.7935791015625, 2.0927734375, 2.3919677734375, 2.691162109375, 2.9903564453125, 3.28955078125, 3.5887451171875, 3.887939453125, 4.1871337890625, 4.486328125, 4.7855224609375, 5.084716796875, 5.3839111328125, 5.68310546875, 5.9822998046875, 6.281494140625, 6.5806884765625, 6.8798828125, 7.1790771484375, 7.478271484375, 7.7774658203125, 8.07666015625, 8.3758544921875, 8.675048828125, 8.9742431640625, 9.2734375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 5.0, 3.0, 2.0, 19.0, 10.0, 4.0, 19.0, 12.0, 13.0, 24.0, 25.0, 19.0, 23.0, 25.0, 42.0, 37.0, 47.0, 34.0, 53.0, 39.0, 53.0, 41.0, 50.0, 45.0, 37.0, 39.0, 39.0, 34.0, 29.0, 37.0, 27.0, 19.0, 20.0, 12.0, 18.0, 6.0, 8.0, 4.0, 6.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-23.151472091674805, -22.441726684570312, -21.731979370117188, -21.022233963012695, -20.312488555908203, -19.602741241455078, -18.892995834350586, -18.183250427246094, -17.47350311279297, -16.763757705688477, -16.05401039123535, -15.34426498413086, -14.63451862335205, -13.924772262573242, -13.21502685546875, -12.505280494689941, -11.795534133911133, -11.085787773132324, -10.376041412353516, -9.666296005249023, -8.956549644470215, -8.246803283691406, -7.537057399749756, -6.8273115158081055, -6.117565155029297, -5.407818794250488, -4.698072910308838, -3.9883267879486084, -3.278580665588379, -2.5688345432281494, -1.85908842086792, -1.1493425369262695, -0.43959617614746094, 0.27014994621276855, 0.979896068572998, 1.6896421909332275, 2.399388313293457, 3.1091344356536865, 3.818880558013916, 4.528626441955566, 5.238372802734375, 5.948119163513184, 6.657865047454834, 7.367610931396484, 8.077357292175293, 8.787103652954102, 9.496849060058594, 10.206595420837402, 10.916341781616211, 11.62608814239502, 12.335834503173828, 13.04557991027832, 13.755326271057129, 14.465072631835938, 15.17481803894043, 15.884564399719238, 16.594310760498047, 17.30405616760254, 18.013803482055664, 18.723548889160156, 19.43329620361328, 20.143041610717773, 20.852787017822266, 21.56253433227539, 22.272279739379883]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 7.0, 3.0, 11.0, 12.0, 16.0, 27.0, 18.0, 21.0, 27.0, 30.0, 41.0, 43.0, 42.0, 59.0, 42.0, 45.0, 48.0, 42.0, 44.0, 44.0, 52.0, 45.0, 41.0, 32.0, 38.0, 29.0, 29.0, 9.0, 23.0, 15.0, 16.0, 10.0, 9.0, 10.0, 1.0, 5.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.966981887817383, -26.00594711303711, -25.044912338256836, -24.083877563476562, -23.122844696044922, -22.16180992126465, -21.200775146484375, -20.2397403717041, -19.278705596923828, -18.317670822143555, -17.35663604736328, -16.39560317993164, -15.434568405151367, -14.473533630371094, -13.51249885559082, -12.551464080810547, -11.590431213378906, -10.629396438598633, -9.668362617492676, -8.707327842712402, -7.746293544769287, -6.785259246826172, -5.824224472045898, -4.863190174102783, -3.902155876159668, -2.9411215782165527, -1.9800870418548584, -1.019052505493164, -0.05801820755004883, 0.9030160903930664, 1.8640508651733398, 2.825085163116455, 3.7861175537109375, 4.747151851654053, 5.708186149597168, 6.669220924377441, 7.630255222320557, 8.591289520263672, 9.552324295043945, 10.513359069824219, 11.474392890930176, 12.43542766571045, 13.396461486816406, 14.35749626159668, 15.318531036376953, 16.279563903808594, 17.2406005859375, 18.20163345336914, 19.162668228149414, 20.123703002929688, 21.08473777770996, 22.045772552490234, 23.006805419921875, 23.96784019470215, 24.928874969482422, 25.889909744262695, 26.85094451904297, 27.811979293823242, 28.773014068603516, 29.734046936035156, 30.69508171081543, 31.656116485595703, 32.617149353027344, 33.57818603515625, 34.53921890258789]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 12.0, 16.0, 33.0, 29.0, 68.0, 97.0, 163.0, 283.0, 571.0, 957.0, 1495.0, 2560.0, 4450.0, 7462.0, 12392.0, 20088.0, 32623.0, 50866.0, 73886.0, 101904.0, 126931.0, 137394.0, 131140.0, 109072.0, 82383.0, 56784.0, 36888.0, 23118.0, 14190.0, 8470.0, 5061.0, 2948.0, 1738.0, 977.0, 605.0, 358.0, 216.0, 122.0, 76.0, 52.0, 34.0, 16.0, 13.0, 9.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-7.640625, -7.4200439453125, -7.199462890625, -6.9788818359375, -6.75830078125, -6.5377197265625, -6.317138671875, -6.0965576171875, -5.8759765625, -5.6553955078125, -5.434814453125, -5.2142333984375, -4.99365234375, -4.7730712890625, -4.552490234375, -4.3319091796875, -4.111328125, -3.8907470703125, -3.670166015625, -3.4495849609375, -3.22900390625, -3.0084228515625, -2.787841796875, -2.5672607421875, -2.3466796875, -2.1260986328125, -1.905517578125, -1.6849365234375, -1.46435546875, -1.2437744140625, -1.023193359375, -0.8026123046875, -0.58203125, -0.3614501953125, -0.140869140625, 0.0797119140625, 0.30029296875, 0.5208740234375, 0.741455078125, 0.9620361328125, 1.1826171875, 1.4031982421875, 1.623779296875, 1.8443603515625, 2.06494140625, 2.2855224609375, 2.506103515625, 2.7266845703125, 2.947265625, 3.1678466796875, 3.388427734375, 3.6090087890625, 3.82958984375, 4.0501708984375, 4.270751953125, 4.4913330078125, 4.7119140625, 4.9324951171875, 5.153076171875, 5.3736572265625, 5.59423828125, 5.8148193359375, 6.035400390625, 6.2559814453125, 6.4765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 8.0, 11.0, 8.0, 6.0, 8.0, 22.0, 17.0, 26.0, 31.0, 45.0, 29.0, 37.0, 49.0, 49.0, 36.0, 45.0, 41.0, 43.0, 50.0, 54.0, 50.0, 50.0, 35.0, 45.0, 31.0, 24.0, 27.0, 21.0, 13.0, 25.0, 10.0, 10.0, 10.0, 6.0, 10.0, 8.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.71875, -25.7451171875, -24.771484375, -23.7978515625, -22.82421875, -21.8505859375, -20.876953125, -19.9033203125, -18.9296875, -17.9560546875, -16.982421875, -16.0087890625, -15.03515625, -14.0615234375, -13.087890625, -12.1142578125, -11.140625, -10.1669921875, -9.193359375, -8.2197265625, -7.24609375, -6.2724609375, -5.298828125, -4.3251953125, -3.3515625, -2.3779296875, -1.404296875, -0.4306640625, 0.54296875, 1.5166015625, 2.490234375, 3.4638671875, 4.4375, 5.4111328125, 6.384765625, 7.3583984375, 8.33203125, 9.3056640625, 10.279296875, 11.2529296875, 12.2265625, 13.2001953125, 14.173828125, 15.1474609375, 16.12109375, 17.0947265625, 18.068359375, 19.0419921875, 20.015625, 20.9892578125, 21.962890625, 22.9365234375, 23.91015625, 24.8837890625, 25.857421875, 26.8310546875, 27.8046875, 28.7783203125, 29.751953125, 30.7255859375, 31.69921875, 32.6728515625, 33.646484375, 34.6201171875, 35.59375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 11.0, 8.0, 11.0, 22.0, 38.0, 65.0, 108.0, 136.0, 265.0, 387.0, 573.0, 965.0, 1521.0, 2711.0, 4231.0, 7183.0, 12311.0, 20577.0, 33977.0, 55466.0, 86708.0, 124093.0, 156150.0, 159181.0, 132382.0, 94374.0, 61289.0, 37458.0, 22752.0, 13335.0, 8051.0, 4667.0, 2887.0, 1784.0, 1065.0, 666.0, 393.0, 282.0, 172.0, 105.0, 78.0, 44.0, 25.0, 16.0, 7.0, 11.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.79296875, -7.52520751953125, -7.2574462890625, -6.98968505859375, -6.721923828125, -6.45416259765625, -6.1864013671875, -5.91864013671875, -5.65087890625, -5.38311767578125, -5.1153564453125, -4.84759521484375, -4.579833984375, -4.31207275390625, -4.0443115234375, -3.77655029296875, -3.5087890625, -3.24102783203125, -2.9732666015625, -2.70550537109375, -2.437744140625, -2.16998291015625, -1.9022216796875, -1.63446044921875, -1.36669921875, -1.09893798828125, -0.8311767578125, -0.56341552734375, -0.295654296875, -0.02789306640625, 0.2398681640625, 0.50762939453125, 0.775390625, 1.04315185546875, 1.3109130859375, 1.57867431640625, 1.846435546875, 2.11419677734375, 2.3819580078125, 2.64971923828125, 2.91748046875, 3.18524169921875, 3.4530029296875, 3.72076416015625, 3.988525390625, 4.25628662109375, 4.5240478515625, 4.79180908203125, 5.0595703125, 5.32733154296875, 5.5950927734375, 5.86285400390625, 6.130615234375, 6.39837646484375, 6.6661376953125, 6.93389892578125, 7.20166015625, 7.46942138671875, 7.7371826171875, 8.00494384765625, 8.272705078125, 8.54046630859375, 8.8082275390625, 9.07598876953125, 9.34375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 3.0, 7.0, 7.0, 9.0, 6.0, 10.0, 8.0, 18.0, 17.0, 18.0, 19.0, 27.0, 27.0, 27.0, 27.0, 27.0, 39.0, 37.0, 42.0, 36.0, 47.0, 43.0, 33.0, 41.0, 34.0, 38.0, 35.0, 37.0, 31.0, 40.0, 27.0, 25.0, 17.0, 22.0, 24.0, 19.0, 14.0, 12.0, 8.0, 10.0, 5.0, 6.0, 7.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.78125, -13.29833984375, -12.8154296875, -12.33251953125, -11.849609375, -11.36669921875, -10.8837890625, -10.40087890625, -9.91796875, -9.43505859375, -8.9521484375, -8.46923828125, -7.986328125, -7.50341796875, -7.0205078125, -6.53759765625, -6.0546875, -5.57177734375, -5.0888671875, -4.60595703125, -4.123046875, -3.64013671875, -3.1572265625, -2.67431640625, -2.19140625, -1.70849609375, -1.2255859375, -0.74267578125, -0.259765625, 0.22314453125, 0.7060546875, 1.18896484375, 1.671875, 2.15478515625, 2.6376953125, 3.12060546875, 3.603515625, 4.08642578125, 4.5693359375, 5.05224609375, 5.53515625, 6.01806640625, 6.5009765625, 6.98388671875, 7.466796875, 7.94970703125, 8.4326171875, 8.91552734375, 9.3984375, 9.88134765625, 10.3642578125, 10.84716796875, 11.330078125, 11.81298828125, 12.2958984375, 12.77880859375, 13.26171875, 13.74462890625, 14.2275390625, 14.71044921875, 15.193359375, 15.67626953125, 16.1591796875, 16.64208984375, 17.125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 7.0, 14.0, 14.0, 22.0, 30.0, 45.0, 76.0, 128.0, 200.0, 334.0, 545.0, 1071.0, 1894.0, 3431.0, 6557.0, 12711.0, 24846.0, 46924.0, 86830.0, 147134.0, 201806.0, 197692.0, 140575.0, 82643.0, 44066.0, 23063.0, 12046.0, 6270.0, 3365.0, 1714.0, 1022.0, 572.0, 350.0, 213.0, 131.0, 62.0, 52.0, 32.0, 18.0, 19.0, 8.0, 10.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1484375, -4.014404296875, -3.88037109375, -3.746337890625, -3.6123046875, -3.478271484375, -3.34423828125, -3.210205078125, -3.076171875, -2.942138671875, -2.80810546875, -2.674072265625, -2.5400390625, -2.406005859375, -2.27197265625, -2.137939453125, -2.00390625, -1.869873046875, -1.73583984375, -1.601806640625, -1.4677734375, -1.333740234375, -1.19970703125, -1.065673828125, -0.931640625, -0.797607421875, -0.66357421875, -0.529541015625, -0.3955078125, -0.261474609375, -0.12744140625, 0.006591796875, 0.140625, 0.274658203125, 0.40869140625, 0.542724609375, 0.6767578125, 0.810791015625, 0.94482421875, 1.078857421875, 1.212890625, 1.346923828125, 1.48095703125, 1.614990234375, 1.7490234375, 1.883056640625, 2.01708984375, 2.151123046875, 2.28515625, 2.419189453125, 2.55322265625, 2.687255859375, 2.8212890625, 2.955322265625, 3.08935546875, 3.223388671875, 3.357421875, 3.491455078125, 3.62548828125, 3.759521484375, 3.8935546875, 4.027587890625, 4.16162109375, 4.295654296875, 4.4296875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 5.0, 4.0, 10.0, 9.0, 17.0, 19.0, 18.0, 30.0, 29.0, 37.0, 28.0, 39.0, 51.0, 51.0, 52.0, 40.0, 53.0, 54.0, 46.0, 44.0, 50.0, 55.0, 27.0, 39.0, 25.0, 30.0, 34.0, 19.0, 19.0, 19.0, 15.0, 7.0, 10.0, 7.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002307891845703125, -0.00022307410836219788, -0.00021535903215408325, -0.00020764395594596863, -0.000199928879737854, -0.00019221380352973938, -0.00018449872732162476, -0.00017678365111351013, -0.0001690685749053955, -0.00016135349869728088, -0.00015363842248916626, -0.00014592334628105164, -0.000138208270072937, -0.0001304931938648224, -0.00012277811765670776, -0.00011506304144859314, -0.00010734796524047852, -9.963288903236389e-05, -9.191781282424927e-05, -8.420273661613464e-05, -7.648766040802002e-05, -6.87725841999054e-05, -6.105750799179077e-05, -5.334243178367615e-05, -4.5627355575561523e-05, -3.79122793674469e-05, -3.0197203159332275e-05, -2.248212695121765e-05, -1.4767050743103027e-05, -7.051974534988403e-06, 6.631016731262207e-07, 8.378177881240845e-06, 1.609325408935547e-05, 2.3808330297470093e-05, 3.152340650558472e-05, 3.923848271369934e-05, 4.6953558921813965e-05, 5.466863512992859e-05, 6.238371133804321e-05, 7.009878754615784e-05, 7.781386375427246e-05, 8.552893996238708e-05, 9.324401617050171e-05, 0.00010095909237861633, 0.00010867416858673096, 0.00011638924479484558, 0.0001241043210029602, 0.00013181939721107483, 0.00013953447341918945, 0.00014724954962730408, 0.0001549646258354187, 0.00016267970204353333, 0.00017039477825164795, 0.00017810985445976257, 0.0001858249306678772, 0.00019354000687599182, 0.00020125508308410645, 0.00020897015929222107, 0.0002166852355003357, 0.00022440031170845032, 0.00023211538791656494, 0.00023983046412467957, 0.0002475455403327942, 0.0002552606165409088, 0.00026297569274902344]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 11.0, 6.0, 11.0, 25.0, 50.0, 70.0, 106.0, 154.0, 238.0, 374.0, 565.0, 873.0, 1396.0, 2268.0, 3654.0, 5886.0, 9103.0, 14484.0, 22537.0, 33938.0, 49313.0, 69154.0, 91677.0, 111717.0, 122613.0, 121597.0, 107181.0, 86031.0, 63819.0, 44615.0, 30382.0, 20017.0, 12760.0, 8167.0, 5096.0, 3240.0, 2031.0, 1238.0, 774.0, 509.0, 322.0, 207.0, 131.0, 85.0, 47.0, 33.0, 22.0, 14.0, 8.0, 5.0, 0.0, 3.0, 3.0], "bins": [-3.642578125, -3.541015625, -3.439453125, -3.337890625, -3.236328125, -3.134765625, -3.033203125, -2.931640625, -2.830078125, -2.728515625, -2.626953125, -2.525390625, -2.423828125, -2.322265625, -2.220703125, -2.119140625, -2.017578125, -1.916015625, -1.814453125, -1.712890625, -1.611328125, -1.509765625, -1.408203125, -1.306640625, -1.205078125, -1.103515625, -1.001953125, -0.900390625, -0.798828125, -0.697265625, -0.595703125, -0.494140625, -0.392578125, -0.291015625, -0.189453125, -0.087890625, 0.013671875, 0.115234375, 0.216796875, 0.318359375, 0.419921875, 0.521484375, 0.623046875, 0.724609375, 0.826171875, 0.927734375, 1.029296875, 1.130859375, 1.232421875, 1.333984375, 1.435546875, 1.537109375, 1.638671875, 1.740234375, 1.841796875, 1.943359375, 2.044921875, 2.146484375, 2.248046875, 2.349609375, 2.451171875, 2.552734375, 2.654296875, 2.755859375, 2.857421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 2.0, 3.0, 4.0, 11.0, 5.0, 7.0, 20.0, 9.0, 12.0, 19.0, 15.0, 18.0, 24.0, 22.0, 39.0, 35.0, 34.0, 43.0, 46.0, 46.0, 58.0, 45.0, 48.0, 48.0, 45.0, 52.0, 37.0, 45.0, 30.0, 31.0, 25.0, 23.0, 13.0, 15.0, 13.0, 8.0, 12.0, 10.0, 11.0, 5.0, 8.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.64453125, -1.5956573486328125, -1.546783447265625, -1.4979095458984375, -1.44903564453125, -1.4001617431640625, -1.351287841796875, -1.3024139404296875, -1.2535400390625, -1.2046661376953125, -1.155792236328125, -1.1069183349609375, -1.05804443359375, -1.0091705322265625, -0.960296630859375, -0.9114227294921875, -0.862548828125, -0.8136749267578125, -0.764801025390625, -0.7159271240234375, -0.66705322265625, -0.6181793212890625, -0.569305419921875, -0.5204315185546875, -0.4715576171875, -0.4226837158203125, -0.373809814453125, -0.3249359130859375, -0.27606201171875, -0.2271881103515625, -0.178314208984375, -0.1294403076171875, -0.08056640625, -0.0316925048828125, 0.017181396484375, 0.0660552978515625, 0.11492919921875, 0.1638031005859375, 0.212677001953125, 0.2615509033203125, 0.3104248046875, 0.3592987060546875, 0.408172607421875, 0.4570465087890625, 0.50592041015625, 0.5547943115234375, 0.603668212890625, 0.6525421142578125, 0.701416015625, 0.7502899169921875, 0.799163818359375, 0.8480377197265625, 0.89691162109375, 0.9457855224609375, 0.994659423828125, 1.0435333251953125, 1.0924072265625, 1.1412811279296875, 1.190155029296875, 1.2390289306640625, 1.28790283203125, 1.3367767333984375, 1.385650634765625, 1.4345245361328125, 1.4833984375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 0.0, 5.0, 7.0, 4.0, 10.0, 10.0, 12.0, 12.0, 15.0, 20.0, 16.0, 24.0, 26.0, 21.0, 28.0, 39.0, 41.0, 44.0, 37.0, 47.0, 49.0, 54.0, 46.0, 47.0, 38.0, 37.0, 43.0, 37.0, 44.0, 26.0, 32.0, 28.0, 21.0, 19.0, 9.0, 14.0, 5.0, 9.0, 5.0, 6.0, 2.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.872983932495117, -22.14501190185547, -21.417041778564453, -20.689069747924805, -19.961097717285156, -19.23312759399414, -18.505155563354492, -17.777183532714844, -17.049213409423828, -16.32124137878418, -15.593271255493164, -14.865299224853516, -14.137328147888184, -13.409357070922852, -12.681385040283203, -11.953413963317871, -11.225442886352539, -10.497471809387207, -9.769500732421875, -9.041528701782227, -8.313557624816895, -7.5855865478515625, -6.857614994049072, -6.129643440246582, -5.40167236328125, -4.673701286315918, -3.9457297325134277, -3.2177584171295166, -2.4897871017456055, -1.7618157863616943, -1.0338444709777832, -0.30587291717529297, 0.42209815979003906, 1.1500694751739502, 1.8780407905578613, 2.6060121059417725, 3.3339834213256836, 4.061954498291016, 4.789926052093506, 5.517897605895996, 6.245868682861328, 6.97383975982666, 7.70181131362915, 8.42978286743164, 9.157753944396973, 9.885725021362305, 10.613697052001953, 11.341668128967285, 12.069639205932617, 12.79761028289795, 13.525581359863281, 14.25355339050293, 14.981524467468262, 15.709495544433594, 16.437467575073242, 17.16543960571289, 17.893409729003906, 18.621381759643555, 19.34935188293457, 20.07732391357422, 20.805294036865234, 21.533266067504883, 22.26123809814453, 22.989208221435547, 23.717180252075195]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 6.0, 11.0, 10.0, 15.0, 29.0, 23.0, 15.0, 25.0, 32.0, 43.0, 46.0, 39.0, 54.0, 44.0, 42.0, 45.0, 46.0, 42.0, 48.0, 54.0, 44.0, 40.0, 29.0, 38.0, 29.0, 31.0, 12.0, 20.0, 17.0, 18.0, 6.0, 9.0, 8.0, 5.0, 2.0, 9.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.685579299926758, -25.737878799438477, -24.790176391601562, -23.84247589111328, -22.894775390625, -21.94707489013672, -20.999372482299805, -20.051671981811523, -19.10396957397461, -18.156269073486328, -17.208566665649414, -16.260866165161133, -15.313165664672852, -14.365464210510254, -13.417762756347656, -12.470062255859375, -11.522361755371094, -10.574660301208496, -9.626959800720215, -8.679258346557617, -7.731557369232178, -6.783856391906738, -5.836154937744141, -4.888453960418701, -3.9407529830932617, -2.9930520057678223, -2.0453507900238037, -1.0976495742797852, -0.1499485969543457, 0.7977523803710938, 1.7454538345336914, 2.693154811859131, 3.6408538818359375, 4.588554859161377, 5.536255836486816, 6.483957290649414, 7.4316582679748535, 8.379359245300293, 9.32706069946289, 10.274761199951172, 11.22246265411377, 12.170164108276367, 13.117864608764648, 14.065566062927246, 15.013267517089844, 15.960968017578125, 16.908668518066406, 17.85637092590332, 18.8040714263916, 19.751771926879883, 20.699474334716797, 21.647174835205078, 22.59487533569336, 23.54257583618164, 24.490278244018555, 25.437978744506836, 26.38568115234375, 27.33338165283203, 28.281084060668945, 29.228784561157227, 30.176485061645508, 31.124187469482422, 32.0718879699707, 33.019588470458984, 33.967288970947266]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 10.0, 12.0, 17.0, 25.0, 34.0, 73.0, 101.0, 167.0, 306.0, 423.0, 700.0, 1196.0, 1996.0, 3206.0, 5312.0, 8491.0, 13106.0, 20585.0, 31275.0, 45661.0, 64154.0, 83577.0, 101952.0, 113541.0, 116144.0, 108388.0, 93170.0, 73441.0, 54149.0, 37720.0, 25530.0, 16605.0, 10516.0, 6542.0, 4092.0, 2529.0, 1508.0, 859.0, 541.0, 340.0, 203.0, 149.0, 76.0, 54.0, 29.0, 19.0, 21.0, 5.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-14.203125, -13.788330078125, -13.37353515625, -12.958740234375, -12.5439453125, -12.129150390625, -11.71435546875, -11.299560546875, -10.884765625, -10.469970703125, -10.05517578125, -9.640380859375, -9.2255859375, -8.810791015625, -8.39599609375, -7.981201171875, -7.56640625, -7.151611328125, -6.73681640625, -6.322021484375, -5.9072265625, -5.492431640625, -5.07763671875, -4.662841796875, -4.248046875, -3.833251953125, -3.41845703125, -3.003662109375, -2.5888671875, -2.174072265625, -1.75927734375, -1.344482421875, -0.9296875, -0.514892578125, -0.10009765625, 0.314697265625, 0.7294921875, 1.144287109375, 1.55908203125, 1.973876953125, 2.388671875, 2.803466796875, 3.21826171875, 3.633056640625, 4.0478515625, 4.462646484375, 4.87744140625, 5.292236328125, 5.70703125, 6.121826171875, 6.53662109375, 6.951416015625, 7.3662109375, 7.781005859375, 8.19580078125, 8.610595703125, 9.025390625, 9.440185546875, 9.85498046875, 10.269775390625, 10.6845703125, 11.099365234375, 11.51416015625, 11.928955078125, 12.34375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 6.0, 6.0, 15.0, 15.0, 12.0, 25.0, 21.0, 24.0, 29.0, 31.0, 40.0, 33.0, 35.0, 47.0, 59.0, 55.0, 48.0, 45.0, 43.0, 38.0, 42.0, 35.0, 39.0, 40.0, 24.0, 29.0, 25.0, 18.0, 24.0, 21.0, 15.0, 14.0, 9.0, 5.0, 8.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.4375, -24.49853515625, -23.5595703125, -22.62060546875, -21.681640625, -20.74267578125, -19.8037109375, -18.86474609375, -17.92578125, -16.98681640625, -16.0478515625, -15.10888671875, -14.169921875, -13.23095703125, -12.2919921875, -11.35302734375, -10.4140625, -9.47509765625, -8.5361328125, -7.59716796875, -6.658203125, -5.71923828125, -4.7802734375, -3.84130859375, -2.90234375, -1.96337890625, -1.0244140625, -0.08544921875, 0.853515625, 1.79248046875, 2.7314453125, 3.67041015625, 4.609375, 5.54833984375, 6.4873046875, 7.42626953125, 8.365234375, 9.30419921875, 10.2431640625, 11.18212890625, 12.12109375, 13.06005859375, 13.9990234375, 14.93798828125, 15.876953125, 16.81591796875, 17.7548828125, 18.69384765625, 19.6328125, 20.57177734375, 21.5107421875, 22.44970703125, 23.388671875, 24.32763671875, 25.2666015625, 26.20556640625, 27.14453125, 28.08349609375, 29.0224609375, 29.96142578125, 30.900390625, 31.83935546875, 32.7783203125, 33.71728515625, 34.65625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 14.0, 20.0, 24.0, 54.0, 88.0, 129.0, 237.0, 389.0, 628.0, 1041.0, 1640.0, 2748.0, 4458.0, 7211.0, 11252.0, 17899.0, 27174.0, 40687.0, 58428.0, 78284.0, 98578.0, 113732.0, 119428.0, 113699.0, 98946.0, 78077.0, 58165.0, 40329.0, 27351.0, 17833.0, 11345.0, 7074.0, 4429.0, 2732.0, 1758.0, 1021.0, 646.0, 369.0, 282.0, 140.0, 96.0, 59.0, 28.0, 13.0, 10.0, 6.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8046875, -13.35205078125, -12.8994140625, -12.44677734375, -11.994140625, -11.54150390625, -11.0888671875, -10.63623046875, -10.18359375, -9.73095703125, -9.2783203125, -8.82568359375, -8.373046875, -7.92041015625, -7.4677734375, -7.01513671875, -6.5625, -6.10986328125, -5.6572265625, -5.20458984375, -4.751953125, -4.29931640625, -3.8466796875, -3.39404296875, -2.94140625, -2.48876953125, -2.0361328125, -1.58349609375, -1.130859375, -0.67822265625, -0.2255859375, 0.22705078125, 0.6796875, 1.13232421875, 1.5849609375, 2.03759765625, 2.490234375, 2.94287109375, 3.3955078125, 3.84814453125, 4.30078125, 4.75341796875, 5.2060546875, 5.65869140625, 6.111328125, 6.56396484375, 7.0166015625, 7.46923828125, 7.921875, 8.37451171875, 8.8271484375, 9.27978515625, 9.732421875, 10.18505859375, 10.6376953125, 11.09033203125, 11.54296875, 11.99560546875, 12.4482421875, 12.90087890625, 13.353515625, 13.80615234375, 14.2587890625, 14.71142578125, 15.1640625]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 4.0, 4.0, 1.0, 1.0, 6.0, 8.0, 10.0, 10.0, 14.0, 14.0, 29.0, 24.0, 24.0, 24.0, 33.0, 37.0, 25.0, 33.0, 48.0, 47.0, 37.0, 38.0, 63.0, 43.0, 54.0, 38.0, 46.0, 38.0, 37.0, 34.0, 30.0, 23.0, 19.0, 19.0, 16.0, 14.0, 12.0, 11.0, 10.0, 8.0, 4.0, 6.0, 7.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.8125, -20.226806640625, -19.64111328125, -19.055419921875, -18.4697265625, -17.884033203125, -17.29833984375, -16.712646484375, -16.126953125, -15.541259765625, -14.95556640625, -14.369873046875, -13.7841796875, -13.198486328125, -12.61279296875, -12.027099609375, -11.44140625, -10.855712890625, -10.27001953125, -9.684326171875, -9.0986328125, -8.512939453125, -7.92724609375, -7.341552734375, -6.755859375, -6.170166015625, -5.58447265625, -4.998779296875, -4.4130859375, -3.827392578125, -3.24169921875, -2.656005859375, -2.0703125, -1.484619140625, -0.89892578125, -0.313232421875, 0.2724609375, 0.858154296875, 1.44384765625, 2.029541015625, 2.615234375, 3.200927734375, 3.78662109375, 4.372314453125, 4.9580078125, 5.543701171875, 6.12939453125, 6.715087890625, 7.30078125, 7.886474609375, 8.47216796875, 9.057861328125, 9.6435546875, 10.229248046875, 10.81494140625, 11.400634765625, 11.986328125, 12.572021484375, 13.15771484375, 13.743408203125, 14.3291015625, 14.914794921875, 15.50048828125, 16.086181640625, 16.671875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 14.0, 20.0, 40.0, 60.0, 65.0, 111.0, 199.0, 284.0, 495.0, 785.0, 1211.0, 2048.0, 3259.0, 5473.0, 9106.0, 14647.0, 23569.0, 36873.0, 55731.0, 78292.0, 102348.0, 120377.0, 128137.0, 122007.0, 103921.0, 80405.0, 57138.0, 38045.0, 24498.0, 15347.0, 9426.0, 5675.0, 3506.0, 2065.0, 1268.0, 759.0, 475.0, 293.0, 222.0, 129.0, 75.0, 51.0, 32.0, 21.0, 17.0, 13.0, 12.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.015625, -5.82489013671875, -5.6341552734375, -5.44342041015625, -5.252685546875, -5.06195068359375, -4.8712158203125, -4.68048095703125, -4.48974609375, -4.29901123046875, -4.1082763671875, -3.91754150390625, -3.726806640625, -3.53607177734375, -3.3453369140625, -3.15460205078125, -2.9638671875, -2.77313232421875, -2.5823974609375, -2.39166259765625, -2.200927734375, -2.01019287109375, -1.8194580078125, -1.62872314453125, -1.43798828125, -1.24725341796875, -1.0565185546875, -0.86578369140625, -0.675048828125, -0.48431396484375, -0.2935791015625, -0.10284423828125, 0.087890625, 0.27862548828125, 0.4693603515625, 0.66009521484375, 0.850830078125, 1.04156494140625, 1.2322998046875, 1.42303466796875, 1.61376953125, 1.80450439453125, 1.9952392578125, 2.18597412109375, 2.376708984375, 2.56744384765625, 2.7581787109375, 2.94891357421875, 3.1396484375, 3.33038330078125, 3.5211181640625, 3.71185302734375, 3.902587890625, 4.09332275390625, 4.2840576171875, 4.47479248046875, 4.66552734375, 4.85626220703125, 5.0469970703125, 5.23773193359375, 5.428466796875, 5.61920166015625, 5.8099365234375, 6.00067138671875, 6.19140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 11.0, 3.0, 13.0, 14.0, 14.0, 20.0, 15.0, 21.0, 28.0, 26.0, 44.0, 35.0, 37.0, 38.0, 43.0, 56.0, 46.0, 47.0, 56.0, 46.0, 45.0, 51.0, 38.0, 37.0, 42.0, 24.0, 24.0, 24.0, 27.0, 13.0, 15.0, 10.0, 13.0, 7.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005846023559570312, -0.0005632787942886353, -0.0005419552326202393, -0.0005206316709518433, -0.0004993081092834473, -0.00047798454761505127, -0.0004566609859466553, -0.0004353374242782593, -0.0004140138626098633, -0.0003926903009414673, -0.0003713667392730713, -0.0003500431776046753, -0.0003287196159362793, -0.0003073960542678833, -0.0002860724925994873, -0.0002647489309310913, -0.0002434253692626953, -0.00022210180759429932, -0.00020077824592590332, -0.00017945468425750732, -0.00015813112258911133, -0.00013680756092071533, -0.00011548399925231934, -9.416043758392334e-05, -7.283687591552734e-05, -5.151331424713135e-05, -3.018975257873535e-05, -8.866190910339355e-06, 1.245737075805664e-05, 3.378093242645264e-05, 5.510449409484863e-05, 7.642805576324463e-05, 9.775161743164062e-05, 0.00011907517910003662, 0.00014039874076843262, 0.0001617223024368286, 0.0001830458641052246, 0.0002043694257736206, 0.0002256929874420166, 0.0002470165491104126, 0.0002683401107788086, 0.0002896636724472046, 0.0003109872341156006, 0.0003323107957839966, 0.0003536343574523926, 0.0003749579191207886, 0.00039628148078918457, 0.00041760504245758057, 0.00043892860412597656, 0.00046025216579437256, 0.00048157572746276855, 0.0005028992891311646, 0.0005242228507995605, 0.0005455464124679565, 0.0005668699741363525, 0.0005881935358047485, 0.0006095170974731445, 0.0006308406591415405, 0.0006521642208099365, 0.0006734877824783325, 0.0006948113441467285, 0.0007161349058151245, 0.0007374584674835205, 0.0007587820291519165, 0.0007801055908203125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 13.0, 17.0, 25.0, 35.0, 55.0, 96.0, 192.0, 321.0, 529.0, 911.0, 1629.0, 2899.0, 5312.0, 9341.0, 16789.0, 29576.0, 50279.0, 79843.0, 114661.0, 144631.0, 155530.0, 142119.0, 109460.0, 74734.0, 46749.0, 27477.0, 15770.0, 8523.0, 4843.0, 2636.0, 1435.0, 895.0, 522.0, 287.0, 165.0, 89.0, 50.0, 40.0, 21.0, 20.0, 9.0, 13.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.8984375, -8.64727783203125, -8.3961181640625, -8.14495849609375, -7.893798828125, -7.64263916015625, -7.3914794921875, -7.14031982421875, -6.88916015625, -6.63800048828125, -6.3868408203125, -6.13568115234375, -5.884521484375, -5.63336181640625, -5.3822021484375, -5.13104248046875, -4.8798828125, -4.62872314453125, -4.3775634765625, -4.12640380859375, -3.875244140625, -3.62408447265625, -3.3729248046875, -3.12176513671875, -2.87060546875, -2.61944580078125, -2.3682861328125, -2.11712646484375, -1.865966796875, -1.61480712890625, -1.3636474609375, -1.11248779296875, -0.861328125, -0.61016845703125, -0.3590087890625, -0.10784912109375, 0.143310546875, 0.39447021484375, 0.6456298828125, 0.89678955078125, 1.14794921875, 1.39910888671875, 1.6502685546875, 1.90142822265625, 2.152587890625, 2.40374755859375, 2.6549072265625, 2.90606689453125, 3.1572265625, 3.40838623046875, 3.6595458984375, 3.91070556640625, 4.161865234375, 4.41302490234375, 4.6641845703125, 4.91534423828125, 5.16650390625, 5.41766357421875, 5.6688232421875, 5.91998291015625, 6.171142578125, 6.42230224609375, 6.6734619140625, 6.92462158203125, 7.17578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 5.0, 8.0, 11.0, 15.0, 30.0, 25.0, 34.0, 54.0, 48.0, 48.0, 67.0, 72.0, 65.0, 66.0, 71.0, 65.0, 52.0, 53.0, 39.0, 29.0, 29.0, 35.0, 21.0, 12.0, 12.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.759765625, -3.611114501953125, -3.46246337890625, -3.313812255859375, -3.1651611328125, -3.016510009765625, -2.86785888671875, -2.719207763671875, -2.570556640625, -2.421905517578125, -2.27325439453125, -2.124603271484375, -1.9759521484375, -1.827301025390625, -1.67864990234375, -1.529998779296875, -1.38134765625, -1.232696533203125, -1.08404541015625, -0.935394287109375, -0.7867431640625, -0.638092041015625, -0.48944091796875, -0.340789794921875, -0.192138671875, -0.043487548828125, 0.10516357421875, 0.253814697265625, 0.4024658203125, 0.551116943359375, 0.69976806640625, 0.848419189453125, 0.9970703125, 1.145721435546875, 1.29437255859375, 1.443023681640625, 1.5916748046875, 1.740325927734375, 1.88897705078125, 2.037628173828125, 2.186279296875, 2.334930419921875, 2.48358154296875, 2.632232666015625, 2.7808837890625, 2.929534912109375, 3.07818603515625, 3.226837158203125, 3.37548828125, 3.524139404296875, 3.67279052734375, 3.821441650390625, 3.9700927734375, 4.118743896484375, 4.26739501953125, 4.416046142578125, 4.564697265625, 4.713348388671875, 4.86199951171875, 5.010650634765625, 5.1593017578125, 5.307952880859375, 5.45660400390625, 5.605255126953125, 5.75390625]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 2.0, 8.0, 9.0, 6.0, 13.0, 18.0, 10.0, 12.0, 27.0, 28.0, 24.0, 31.0, 24.0, 35.0, 42.0, 36.0, 44.0, 47.0, 61.0, 42.0, 55.0, 53.0, 32.0, 31.0, 27.0, 36.0, 45.0, 36.0, 30.0, 25.0, 25.0, 16.0, 4.0, 10.0, 12.0, 6.0, 4.0, 11.0, 4.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.660484313964844, -20.9451904296875, -20.229896545410156, -19.514602661132812, -18.79930877685547, -18.084012985229492, -17.36871910095215, -16.653425216674805, -15.938131332397461, -15.222837448120117, -14.507543563842773, -13.792248725891113, -13.07695484161377, -12.361660957336426, -11.646366119384766, -10.931072235107422, -10.215778350830078, -9.500484466552734, -8.78519058227539, -8.06989574432373, -7.354601860046387, -6.639307975769043, -5.924013614654541, -5.208719253540039, -4.493425369262695, -3.7781312465667725, -3.0628371238708496, -2.3475430011749268, -1.632248878479004, -0.916954755783081, -0.2016606330871582, 0.5136337280273438, 1.2289276123046875, 1.9442217350006104, 2.659515857696533, 3.374809980392456, 4.090104103088379, 4.805397987365723, 5.520692348480225, 6.235986709594727, 6.95128059387207, 7.666574478149414, 8.381868362426758, 9.097163200378418, 9.812457084655762, 10.527750968933105, 11.243045806884766, 11.95833969116211, 12.673633575439453, 13.388927459716797, 14.10422134399414, 14.8195161819458, 15.534810066223145, 16.250104904174805, 16.96539878845215, 17.680692672729492, 18.395986557006836, 19.11128044128418, 19.826574325561523, 20.541868209838867, 21.257164001464844, 21.972457885742188, 22.68775177001953, 23.403045654296875, 24.11833953857422]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 5.0, 0.0, 2.0, 2.0, 8.0, 7.0, 9.0, 20.0, 15.0, 13.0, 23.0, 26.0, 18.0, 35.0, 41.0, 36.0, 41.0, 31.0, 39.0, 49.0, 44.0, 47.0, 42.0, 36.0, 48.0, 43.0, 43.0, 38.0, 36.0, 40.0, 32.0, 20.0, 29.0, 16.0, 7.0, 8.0, 10.0, 9.0, 14.0, 9.0, 3.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.38828468322754, -25.47492218017578, -24.561559677124023, -23.648197174072266, -22.734834671020508, -21.82147216796875, -20.90810775756836, -19.994747161865234, -19.081382751464844, -18.168020248413086, -17.254657745361328, -16.34129524230957, -15.427932739257812, -14.514570236206055, -13.60120677947998, -12.687844276428223, -11.774482727050781, -10.861120223999023, -9.947757720947266, -9.034395217895508, -8.12103271484375, -7.207669734954834, -6.294306755065918, -5.38094425201416, -4.467581748962402, -3.5542192459106445, -2.6408565044403076, -1.7274937629699707, -0.8141312599182129, 0.09923124313354492, 1.012594223022461, 1.9259567260742188, 2.8393211364746094, 3.752683639526367, 4.666046142578125, 5.579409122467041, 6.492771625518799, 7.406134128570557, 8.319497108459473, 9.23285961151123, 10.146222114562988, 11.059584617614746, 11.972947120666504, 12.886310577392578, 13.799673080444336, 14.713035583496094, 15.626398086547852, 16.53976058959961, 17.453123092651367, 18.366485595703125, 19.279848098754883, 20.19321060180664, 21.1065731048584, 22.019935607910156, 22.933300018310547, 23.846660614013672, 24.760025024414062, 25.67338752746582, 26.586750030517578, 27.500112533569336, 28.413475036621094, 29.32683753967285, 30.24020004272461, 31.153564453125, 32.066925048828125]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 9.0, 13.0, 20.0, 37.0, 55.0, 75.0, 138.0, 221.0, 327.0, 504.0, 739.0, 1208.0, 1901.0, 3185.0, 4977.0, 7956.0, 12512.0, 20084.0, 32295.0, 50975.0, 80436.0, 125071.0, 187987.0, 270363.0, 364289.0, 453687.0, 506530.0, 502247.0, 444551.0, 353818.0, 260263.0, 178946.0, 118859.0, 76602.0, 48968.0, 30746.0, 19460.0, 12565.0, 7685.0, 5007.0, 3202.0, 2023.0, 1318.0, 843.0, 527.0, 357.0, 228.0, 161.0, 118.0, 68.0, 51.0, 34.0, 21.0, 10.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0], "bins": [-16.78125, -16.22119140625, -15.6611328125, -15.10107421875, -14.541015625, -13.98095703125, -13.4208984375, -12.86083984375, -12.30078125, -11.74072265625, -11.1806640625, -10.62060546875, -10.060546875, -9.50048828125, -8.9404296875, -8.38037109375, -7.8203125, -7.26025390625, -6.7001953125, -6.14013671875, -5.580078125, -5.02001953125, -4.4599609375, -3.89990234375, -3.33984375, -2.77978515625, -2.2197265625, -1.65966796875, -1.099609375, -0.53955078125, 0.0205078125, 0.58056640625, 1.140625, 1.70068359375, 2.2607421875, 2.82080078125, 3.380859375, 3.94091796875, 4.5009765625, 5.06103515625, 5.62109375, 6.18115234375, 6.7412109375, 7.30126953125, 7.861328125, 8.42138671875, 8.9814453125, 9.54150390625, 10.1015625, 10.66162109375, 11.2216796875, 11.78173828125, 12.341796875, 12.90185546875, 13.4619140625, 14.02197265625, 14.58203125, 15.14208984375, 15.7021484375, 16.26220703125, 16.822265625, 17.38232421875, 17.9423828125, 18.50244140625, 19.0625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 4.0, 10.0, 5.0, 13.0, 13.0, 16.0, 19.0, 23.0, 18.0, 27.0, 32.0, 42.0, 29.0, 46.0, 39.0, 36.0, 49.0, 44.0, 41.0, 41.0, 41.0, 46.0, 54.0, 40.0, 45.0, 46.0, 28.0, 22.0, 24.0, 18.0, 11.0, 13.0, 12.0, 8.0, 9.0, 14.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.1875, -22.40625, -21.625, -20.84375, -20.0625, -19.28125, -18.5, -17.71875, -16.9375, -16.15625, -15.375, -14.59375, -13.8125, -13.03125, -12.25, -11.46875, -10.6875, -9.90625, -9.125, -8.34375, -7.5625, -6.78125, -6.0, -5.21875, -4.4375, -3.65625, -2.875, -2.09375, -1.3125, -0.53125, 0.25, 1.03125, 1.8125, 2.59375, 3.375, 4.15625, 4.9375, 5.71875, 6.5, 7.28125, 8.0625, 8.84375, 9.625, 10.40625, 11.1875, 11.96875, 12.75, 13.53125, 14.3125, 15.09375, 15.875, 16.65625, 17.4375, 18.21875, 19.0, 19.78125, 20.5625, 21.34375, 22.125, 22.90625, 23.6875, 24.46875, 25.25, 26.03125, 26.8125]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 8.0, 11.0, 10.0, 20.0, 27.0, 66.0, 153.0, 249.0, 530.0, 1002.0, 2075.0, 3899.0, 8097.0, 15554.0, 31349.0, 60761.0, 112074.0, 201254.0, 332023.0, 486460.0, 617962.0, 658885.0, 582438.0, 435032.0, 283770.0, 168319.0, 92230.0, 49027.0, 25244.0, 12747.0, 6360.0, 3286.0, 1605.0, 840.0, 436.0, 241.0, 118.0, 60.0, 28.0, 17.0, 11.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.65625, -26.82666015625, -25.9970703125, -25.16748046875, -24.337890625, -23.50830078125, -22.6787109375, -21.84912109375, -21.01953125, -20.18994140625, -19.3603515625, -18.53076171875, -17.701171875, -16.87158203125, -16.0419921875, -15.21240234375, -14.3828125, -13.55322265625, -12.7236328125, -11.89404296875, -11.064453125, -10.23486328125, -9.4052734375, -8.57568359375, -7.74609375, -6.91650390625, -6.0869140625, -5.25732421875, -4.427734375, -3.59814453125, -2.7685546875, -1.93896484375, -1.109375, -0.27978515625, 0.5498046875, 1.37939453125, 2.208984375, 3.03857421875, 3.8681640625, 4.69775390625, 5.52734375, 6.35693359375, 7.1865234375, 8.01611328125, 8.845703125, 9.67529296875, 10.5048828125, 11.33447265625, 12.1640625, 12.99365234375, 13.8232421875, 14.65283203125, 15.482421875, 16.31201171875, 17.1416015625, 17.97119140625, 18.80078125, 19.63037109375, 20.4599609375, 21.28955078125, 22.119140625, 22.94873046875, 23.7783203125, 24.60791015625, 25.4375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 13.0, 5.0, 18.0, 16.0, 25.0, 34.0, 43.0, 55.0, 50.0, 78.0, 81.0, 107.0, 103.0, 132.0, 149.0, 177.0, 190.0, 197.0, 219.0, 203.0, 199.0, 224.0, 202.0, 197.0, 179.0, 171.0, 175.0, 153.0, 139.0, 115.0, 88.0, 72.0, 63.0, 42.0, 43.0, 39.0, 28.0, 16.0, 12.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.515625, -10.1741943359375, -9.832763671875, -9.4913330078125, -9.14990234375, -8.8084716796875, -8.467041015625, -8.1256103515625, -7.7841796875, -7.4427490234375, -7.101318359375, -6.7598876953125, -6.41845703125, -6.0770263671875, -5.735595703125, -5.3941650390625, -5.052734375, -4.7113037109375, -4.369873046875, -4.0284423828125, -3.68701171875, -3.3455810546875, -3.004150390625, -2.6627197265625, -2.3212890625, -1.9798583984375, -1.638427734375, -1.2969970703125, -0.95556640625, -0.6141357421875, -0.272705078125, 0.0687255859375, 0.41015625, 0.7515869140625, 1.093017578125, 1.4344482421875, 1.77587890625, 2.1173095703125, 2.458740234375, 2.8001708984375, 3.1416015625, 3.4830322265625, 3.824462890625, 4.1658935546875, 4.50732421875, 4.8487548828125, 5.190185546875, 5.5316162109375, 5.873046875, 6.2144775390625, 6.555908203125, 6.8973388671875, 7.23876953125, 7.5802001953125, 7.921630859375, 8.2630615234375, 8.6044921875, 8.9459228515625, 9.287353515625, 9.6287841796875, 9.97021484375, 10.3116455078125, 10.653076171875, 10.9945068359375, 11.3359375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 5.0, 5.0, 14.0, 10.0, 9.0, 12.0, 15.0, 16.0, 20.0, 24.0, 25.0, 32.0, 41.0, 41.0, 39.0, 40.0, 39.0, 39.0, 44.0, 50.0, 45.0, 57.0, 38.0, 38.0, 27.0, 45.0, 38.0, 29.0, 27.0, 27.0, 22.0, 11.0, 15.0, 11.0, 13.0, 12.0, 7.0, 4.0, 1.0, 3.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.768598556518555, -22.987808227539062, -22.20701789855957, -21.426227569580078, -20.645435333251953, -19.86464500427246, -19.08385467529297, -18.303064346313477, -17.522274017333984, -16.741483688354492, -15.960693359375, -15.179902076721191, -14.3991117477417, -13.618321418762207, -12.837530136108398, -12.056739807128906, -11.275949478149414, -10.495159149169922, -9.71436882019043, -8.933577537536621, -8.152787208557129, -7.371996879577637, -6.591206073760986, -5.810415267944336, -5.029624938964844, -4.248834609985352, -3.468043804168701, -2.68725323677063, -1.9064626693725586, -1.1256721019744873, -0.344881534576416, 0.4359092712402344, 1.2166996002197266, 1.9974901676177979, 2.778280735015869, 3.5590713024139404, 4.339861869812012, 5.120652198791504, 5.901443004608154, 6.682233810424805, 7.463024139404297, 8.243814468383789, 9.024604797363281, 9.80539608001709, 10.586186408996582, 11.366976737976074, 12.147768020629883, 12.928558349609375, 13.709348678588867, 14.49013900756836, 15.270929336547852, 16.051719665527344, 16.83251190185547, 17.61330223083496, 18.394092559814453, 19.174882888793945, 19.955673217773438, 20.73646354675293, 21.517253875732422, 22.298044204711914, 23.078834533691406, 23.85962677001953, 24.640417098999023, 25.421207427978516, 26.201997756958008]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 7.0, 2.0, 4.0, 5.0, 4.0, 12.0, 13.0, 8.0, 19.0, 21.0, 21.0, 28.0, 29.0, 34.0, 28.0, 34.0, 39.0, 31.0, 53.0, 38.0, 42.0, 46.0, 48.0, 39.0, 42.0, 35.0, 27.0, 33.0, 42.0, 22.0, 22.0, 24.0, 26.0, 20.0, 14.0, 18.0, 15.0, 12.0, 8.0, 7.0, 5.0, 5.0, 4.0, 5.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.339447021484375, -26.476778030395508, -25.61410903930664, -24.751441955566406, -23.88877296447754, -23.026103973388672, -22.163434982299805, -21.300765991210938, -20.438098907470703, -19.575429916381836, -18.71276092529297, -17.850093841552734, -16.987424850463867, -16.124755859375, -15.262086868286133, -14.399417877197266, -13.536748886108398, -12.674079895019531, -11.81141185760498, -10.948742866516113, -10.086074829101562, -9.223405838012695, -8.360736846923828, -7.498068332672119, -6.63539981842041, -5.772731304168701, -4.910062789916992, -4.047393798828125, -3.184725284576416, -2.322056770324707, -1.4593877792358398, -0.5967192649841309, 0.2659473419189453, 1.1286159753799438, 1.9912846088409424, 2.8539533615112305, 3.7166218757629395, 4.579290390014648, 5.441959381103516, 6.304627895355225, 7.167296409606934, 8.0299654006958, 8.892633438110352, 9.755302429199219, 10.617971420288086, 11.480639457702637, 12.343308448791504, 13.205976486206055, 14.068645477294922, 14.931314468383789, 15.79398250579834, 16.65665054321289, 17.519319534301758, 18.381988525390625, 19.244657516479492, 20.10732650756836, 20.969993591308594, 21.83266258239746, 22.695331573486328, 23.557998657226562, 24.42066764831543, 25.283336639404297, 26.146005630493164, 27.00867462158203, 27.8713436126709]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 9.0, 9.0, 13.0, 23.0, 38.0, 52.0, 107.0, 120.0, 199.0, 353.0, 457.0, 757.0, 1188.0, 1831.0, 2973.0, 4617.0, 7242.0, 10834.0, 16851.0, 25317.0, 37536.0, 54430.0, 73634.0, 94972.0, 111130.0, 119327.0, 115411.0, 100828.0, 80612.0, 60443.0, 42453.0, 29389.0, 19350.0, 12775.0, 8290.0, 5364.0, 3431.0, 2163.0, 1458.0, 891.0, 591.0, 414.0, 251.0, 155.0, 93.0, 72.0, 42.0, 25.0, 15.0, 9.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.49609375, -6.30316162109375, -6.1102294921875, -5.91729736328125, -5.724365234375, -5.53143310546875, -5.3385009765625, -5.14556884765625, -4.95263671875, -4.75970458984375, -4.5667724609375, -4.37384033203125, -4.180908203125, -3.98797607421875, -3.7950439453125, -3.60211181640625, -3.4091796875, -3.21624755859375, -3.0233154296875, -2.83038330078125, -2.637451171875, -2.44451904296875, -2.2515869140625, -2.05865478515625, -1.86572265625, -1.67279052734375, -1.4798583984375, -1.28692626953125, -1.093994140625, -0.90106201171875, -0.7081298828125, -0.51519775390625, -0.322265625, -0.12933349609375, 0.0635986328125, 0.25653076171875, 0.449462890625, 0.64239501953125, 0.8353271484375, 1.02825927734375, 1.22119140625, 1.41412353515625, 1.6070556640625, 1.79998779296875, 1.992919921875, 2.18585205078125, 2.3787841796875, 2.57171630859375, 2.7646484375, 2.95758056640625, 3.1505126953125, 3.34344482421875, 3.536376953125, 3.72930908203125, 3.9222412109375, 4.11517333984375, 4.30810546875, 4.50103759765625, 4.6939697265625, 4.88690185546875, 5.079833984375, 5.27276611328125, 5.4656982421875, 5.65863037109375, 5.8515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 4.0, 6.0, 3.0, 5.0, 3.0, 10.0, 10.0, 6.0, 23.0, 17.0, 20.0, 19.0, 30.0, 25.0, 35.0, 45.0, 27.0, 45.0, 37.0, 35.0, 42.0, 50.0, 47.0, 41.0, 31.0, 41.0, 31.0, 39.0, 35.0, 21.0, 32.0, 20.0, 27.0, 25.0, 13.0, 22.0, 11.0, 16.0, 11.0, 10.0, 7.0, 5.0, 5.0, 3.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.546875, -27.660888671875, -26.77490234375, -25.888916015625, -25.0029296875, -24.116943359375, -23.23095703125, -22.344970703125, -21.458984375, -20.572998046875, -19.68701171875, -18.801025390625, -17.9150390625, -17.029052734375, -16.14306640625, -15.257080078125, -14.37109375, -13.485107421875, -12.59912109375, -11.713134765625, -10.8271484375, -9.941162109375, -9.05517578125, -8.169189453125, -7.283203125, -6.397216796875, -5.51123046875, -4.625244140625, -3.7392578125, -2.853271484375, -1.96728515625, -1.081298828125, -0.1953125, 0.690673828125, 1.57666015625, 2.462646484375, 3.3486328125, 4.234619140625, 5.12060546875, 6.006591796875, 6.892578125, 7.778564453125, 8.66455078125, 9.550537109375, 10.4365234375, 11.322509765625, 12.20849609375, 13.094482421875, 13.98046875, 14.866455078125, 15.75244140625, 16.638427734375, 17.5244140625, 18.410400390625, 19.29638671875, 20.182373046875, 21.068359375, 21.954345703125, 22.84033203125, 23.726318359375, 24.6123046875, 25.498291015625, 26.38427734375, 27.270263671875, 28.15625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 13.0, 13.0, 18.0, 36.0, 37.0, 59.0, 99.0, 161.0, 230.0, 341.0, 523.0, 883.0, 1398.0, 2152.0, 3448.0, 5679.0, 9046.0, 14517.0, 22993.0, 35972.0, 54971.0, 79985.0, 109308.0, 134091.0, 141628.0, 127690.0, 99628.0, 71374.0, 48002.0, 31244.0, 19742.0, 12434.0, 7759.0, 4869.0, 3019.0, 1915.0, 1200.0, 737.0, 485.0, 311.0, 184.0, 132.0, 69.0, 51.0, 36.0, 23.0, 13.0, 10.0, 8.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0], "bins": [-8.046875, -7.80548095703125, -7.5640869140625, -7.32269287109375, -7.081298828125, -6.83990478515625, -6.5985107421875, -6.35711669921875, -6.11572265625, -5.87432861328125, -5.6329345703125, -5.39154052734375, -5.150146484375, -4.90875244140625, -4.6673583984375, -4.42596435546875, -4.1845703125, -3.94317626953125, -3.7017822265625, -3.46038818359375, -3.218994140625, -2.97760009765625, -2.7362060546875, -2.49481201171875, -2.25341796875, -2.01202392578125, -1.7706298828125, -1.52923583984375, -1.287841796875, -1.04644775390625, -0.8050537109375, -0.56365966796875, -0.322265625, -0.08087158203125, 0.1605224609375, 0.40191650390625, 0.643310546875, 0.88470458984375, 1.1260986328125, 1.36749267578125, 1.60888671875, 1.85028076171875, 2.0916748046875, 2.33306884765625, 2.574462890625, 2.81585693359375, 3.0572509765625, 3.29864501953125, 3.5400390625, 3.78143310546875, 4.0228271484375, 4.26422119140625, 4.505615234375, 4.74700927734375, 4.9884033203125, 5.22979736328125, 5.47119140625, 5.71258544921875, 5.9539794921875, 6.19537353515625, 6.436767578125, 6.67816162109375, 6.9195556640625, 7.16094970703125, 7.40234375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 1.0, 10.0, 4.0, 7.0, 9.0, 10.0, 15.0, 12.0, 18.0, 19.0, 26.0, 29.0, 35.0, 33.0, 33.0, 38.0, 37.0, 28.0, 47.0, 40.0, 28.0, 35.0, 32.0, 24.0, 28.0, 28.0, 38.0, 26.0, 37.0, 31.0, 29.0, 29.0, 23.0, 18.0, 23.0, 25.0, 23.0, 18.0, 9.0, 14.0, 6.0, 3.0, 9.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-14.7734375, -14.3060302734375, -13.838623046875, -13.3712158203125, -12.90380859375, -12.4364013671875, -11.968994140625, -11.5015869140625, -11.0341796875, -10.5667724609375, -10.099365234375, -9.6319580078125, -9.16455078125, -8.6971435546875, -8.229736328125, -7.7623291015625, -7.294921875, -6.8275146484375, -6.360107421875, -5.8927001953125, -5.42529296875, -4.9578857421875, -4.490478515625, -4.0230712890625, -3.5556640625, -3.0882568359375, -2.620849609375, -2.1534423828125, -1.68603515625, -1.2186279296875, -0.751220703125, -0.2838134765625, 0.18359375, 0.6510009765625, 1.118408203125, 1.5858154296875, 2.05322265625, 2.5206298828125, 2.988037109375, 3.4554443359375, 3.9228515625, 4.3902587890625, 4.857666015625, 5.3250732421875, 5.79248046875, 6.2598876953125, 6.727294921875, 7.1947021484375, 7.662109375, 8.1295166015625, 8.596923828125, 9.0643310546875, 9.53173828125, 9.9991455078125, 10.466552734375, 10.9339599609375, 11.4013671875, 11.8687744140625, 12.336181640625, 12.8035888671875, 13.27099609375, 13.7384033203125, 14.205810546875, 14.6732177734375, 15.140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 13.0, 10.0, 11.0, 26.0, 56.0, 83.0, 110.0, 180.0, 289.0, 494.0, 712.0, 1250.0, 1971.0, 3293.0, 5689.0, 9912.0, 16694.0, 28237.0, 47612.0, 77638.0, 117963.0, 158467.0, 171625.0, 143955.0, 101730.0, 64297.0, 39233.0, 23429.0, 13796.0, 8090.0, 4699.0, 2778.0, 1651.0, 978.0, 596.0, 366.0, 211.0, 128.0, 98.0, 70.0, 41.0, 27.0, 10.0, 8.0, 8.0, 9.0, 5.0, 7.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.109375, -3.989593505859375, -3.86981201171875, -3.750030517578125, -3.6302490234375, -3.510467529296875, -3.39068603515625, -3.270904541015625, -3.151123046875, -3.031341552734375, -2.91156005859375, -2.791778564453125, -2.6719970703125, -2.552215576171875, -2.43243408203125, -2.312652587890625, -2.19287109375, -2.073089599609375, -1.95330810546875, -1.833526611328125, -1.7137451171875, -1.593963623046875, -1.47418212890625, -1.354400634765625, -1.234619140625, -1.114837646484375, -0.99505615234375, -0.875274658203125, -0.7554931640625, -0.635711669921875, -0.51593017578125, -0.396148681640625, -0.2763671875, -0.156585693359375, -0.03680419921875, 0.082977294921875, 0.2027587890625, 0.322540283203125, 0.44232177734375, 0.562103271484375, 0.681884765625, 0.801666259765625, 0.92144775390625, 1.041229248046875, 1.1610107421875, 1.280792236328125, 1.40057373046875, 1.520355224609375, 1.64013671875, 1.759918212890625, 1.87969970703125, 1.999481201171875, 2.1192626953125, 2.239044189453125, 2.35882568359375, 2.478607177734375, 2.598388671875, 2.718170166015625, 2.83795166015625, 2.957733154296875, 3.0775146484375, 3.197296142578125, 3.31707763671875, 3.436859130859375, 3.556640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 6.0, 4.0, 8.0, 3.0, 7.0, 10.0, 9.0, 16.0, 25.0, 20.0, 25.0, 34.0, 30.0, 35.0, 56.0, 37.0, 51.0, 69.0, 66.0, 56.0, 41.0, 48.0, 50.0, 45.0, 41.0, 36.0, 37.0, 22.0, 27.0, 23.0, 12.0, 14.0, 13.0, 6.0, 3.0, 1.0, 4.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002262592315673828, -0.00021835044026374817, -0.00021044164896011353, -0.00020253285765647888, -0.00019462406635284424, -0.0001867152750492096, -0.00017880648374557495, -0.0001708976924419403, -0.00016298890113830566, -0.00015508010983467102, -0.00014717131853103638, -0.00013926252722740173, -0.0001313537359237671, -0.00012344494462013245, -0.0001155361533164978, -0.00010762736201286316, -9.971857070922852e-05, -9.180977940559387e-05, -8.390098810195923e-05, -7.599219679832458e-05, -6.808340549468994e-05, -6.01746141910553e-05, -5.2265822887420654e-05, -4.435703158378601e-05, -3.644824028015137e-05, -2.8539448976516724e-05, -2.063065767288208e-05, -1.2721866369247437e-05, -4.813075065612793e-06, 3.0957162380218506e-06, 1.1004507541656494e-05, 1.8913298845291138e-05, 2.682209014892578e-05, 3.4730881452560425e-05, 4.263967275619507e-05, 5.054846405982971e-05, 5.8457255363464355e-05, 6.6366046667099e-05, 7.427483797073364e-05, 8.218362927436829e-05, 9.009242057800293e-05, 9.800121188163757e-05, 0.00010591000318527222, 0.00011381879448890686, 0.0001217275857925415, 0.00012963637709617615, 0.0001375451683998108, 0.00014545395970344543, 0.00015336275100708008, 0.00016127154231071472, 0.00016918033361434937, 0.000177089124917984, 0.00018499791622161865, 0.0001929067075252533, 0.00020081549882888794, 0.00020872429013252258, 0.00021663308143615723, 0.00022454187273979187, 0.00023245066404342651, 0.00024035945534706116, 0.0002482682466506958, 0.00025617703795433044, 0.0002640858292579651, 0.00027199462056159973, 0.0002799034118652344]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 7.0, 13.0, 8.0, 7.0, 22.0, 41.0, 52.0, 97.0, 131.0, 190.0, 246.0, 390.0, 599.0, 912.0, 1341.0, 2129.0, 2989.0, 4683.0, 6872.0, 10370.0, 15507.0, 22303.0, 32284.0, 45226.0, 61291.0, 79274.0, 96217.0, 107887.0, 111222.0, 104138.0, 89454.0, 72116.0, 54069.0, 39663.0, 27924.0, 19410.0, 12998.0, 8858.0, 5929.0, 3912.0, 2511.0, 1774.0, 1146.0, 783.0, 509.0, 330.0, 256.0, 164.0, 99.0, 66.0, 58.0, 41.0, 25.0, 9.0, 8.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.970703125, -2.872650146484375, -2.77459716796875, -2.676544189453125, -2.5784912109375, -2.480438232421875, -2.38238525390625, -2.284332275390625, -2.186279296875, -2.088226318359375, -1.99017333984375, -1.892120361328125, -1.7940673828125, -1.696014404296875, -1.59796142578125, -1.499908447265625, -1.40185546875, -1.303802490234375, -1.20574951171875, -1.107696533203125, -1.0096435546875, -0.911590576171875, -0.81353759765625, -0.715484619140625, -0.617431640625, -0.519378662109375, -0.42132568359375, -0.323272705078125, -0.2252197265625, -0.127166748046875, -0.02911376953125, 0.068939208984375, 0.1669921875, 0.265045166015625, 0.36309814453125, 0.461151123046875, 0.5592041015625, 0.657257080078125, 0.75531005859375, 0.853363037109375, 0.951416015625, 1.049468994140625, 1.14752197265625, 1.245574951171875, 1.3436279296875, 1.441680908203125, 1.53973388671875, 1.637786865234375, 1.73583984375, 1.833892822265625, 1.93194580078125, 2.029998779296875, 2.1280517578125, 2.226104736328125, 2.32415771484375, 2.422210693359375, 2.520263671875, 2.618316650390625, 2.71636962890625, 2.814422607421875, 2.9124755859375, 3.010528564453125, 3.10858154296875, 3.206634521484375, 3.3046875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 12.0, 5.0, 13.0, 12.0, 14.0, 15.0, 22.0, 35.0, 25.0, 23.0, 38.0, 46.0, 41.0, 40.0, 47.0, 58.0, 57.0, 53.0, 44.0, 50.0, 45.0, 34.0, 44.0, 25.0, 35.0, 28.0, 20.0, 26.0, 14.0, 14.0, 10.0, 9.0, 13.0, 8.0, 1.0, 4.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.482421875, -1.4344482421875, -1.386474609375, -1.3385009765625, -1.29052734375, -1.2425537109375, -1.194580078125, -1.1466064453125, -1.0986328125, -1.0506591796875, -1.002685546875, -0.9547119140625, -0.90673828125, -0.8587646484375, -0.810791015625, -0.7628173828125, -0.71484375, -0.6668701171875, -0.618896484375, -0.5709228515625, -0.52294921875, -0.4749755859375, -0.427001953125, -0.3790283203125, -0.3310546875, -0.2830810546875, -0.235107421875, -0.1871337890625, -0.13916015625, -0.0911865234375, -0.043212890625, 0.0047607421875, 0.052734375, 0.1007080078125, 0.148681640625, 0.1966552734375, 0.24462890625, 0.2926025390625, 0.340576171875, 0.3885498046875, 0.4365234375, 0.4844970703125, 0.532470703125, 0.5804443359375, 0.62841796875, 0.6763916015625, 0.724365234375, 0.7723388671875, 0.8203125, 0.8682861328125, 0.916259765625, 0.9642333984375, 1.01220703125, 1.0601806640625, 1.108154296875, 1.1561279296875, 1.2041015625, 1.2520751953125, 1.300048828125, 1.3480224609375, 1.39599609375, 1.4439697265625, 1.491943359375, 1.5399169921875, 1.587890625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 7.0, 6.0, 8.0, 11.0, 13.0, 17.0, 10.0, 21.0, 17.0, 20.0, 28.0, 38.0, 37.0, 41.0, 43.0, 44.0, 39.0, 39.0, 52.0, 42.0, 54.0, 46.0, 38.0, 42.0, 34.0, 40.0, 34.0, 29.0, 31.0, 17.0, 25.0, 11.0, 8.0, 15.0, 13.0, 11.0, 6.0, 1.0, 3.0, 3.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.4010066986084, -23.616025924682617, -22.83104705810547, -22.046066284179688, -21.261085510253906, -20.476104736328125, -19.691125869750977, -18.906145095825195, -18.121166229248047, -17.336185455322266, -16.551206588745117, -15.766225814819336, -14.981245040893555, -14.19626522064209, -13.411285400390625, -12.626304626464844, -11.841323852539062, -11.056344032287598, -10.271363258361816, -9.486383438110352, -8.70140266418457, -7.9164228439331055, -7.131443023681641, -6.346462726593018, -5.5614824295043945, -4.7765021324157715, -3.9915220737457275, -3.2065420150756836, -2.4215617179870605, -1.6365814208984375, -0.8516016006469727, -0.06662130355834961, 0.7183609008789062, 1.5033410787582397, 2.2883212566375732, 3.073301315307617, 3.8582816123962402, 4.643261909484863, 5.428241729736328, 6.213222026824951, 6.998202323913574, 7.783182621002197, 8.56816291809082, 9.353142738342285, 10.13812255859375, 10.923103332519531, 11.708083152770996, 12.493062973022461, 13.278043746948242, 14.063023567199707, 14.848004341125488, 15.632984161376953, 16.417964935302734, 17.202945709228516, 17.987924575805664, 18.772905349731445, 19.557884216308594, 20.342864990234375, 21.127843856811523, 21.912824630737305, 22.697805404663086, 23.482784271240234, 24.267765045166016, 25.052745819091797, 25.837726593017578]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 6.0, 6.0, 1.0, 7.0, 3.0, 13.0, 7.0, 13.0, 13.0, 23.0, 20.0, 26.0, 26.0, 34.0, 30.0, 32.0, 32.0, 42.0, 51.0, 36.0, 44.0, 41.0, 43.0, 46.0, 46.0, 41.0, 25.0, 25.0, 46.0, 27.0, 19.0, 29.0, 22.0, 21.0, 16.0, 20.0, 14.0, 11.0, 9.0, 8.0, 7.0, 3.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.532257080078125, -26.670007705688477, -25.807758331298828, -24.945510864257812, -24.083261489868164, -23.221012115478516, -22.358762741088867, -21.49651336669922, -20.63426399230957, -19.772014617919922, -18.909765243530273, -18.047515869140625, -17.18526840209961, -16.32301902770996, -15.460769653320312, -14.598520278930664, -13.736271858215332, -12.874022483825684, -12.011774063110352, -11.149524688720703, -10.287275314331055, -9.425025939941406, -8.562777519226074, -7.700528144836426, -6.8382792472839355, -5.976030349731445, -5.113780975341797, -4.251532077789307, -3.3892829418182373, -2.527033805847168, -1.6647849082946777, -0.8025355339050293, 0.05971336364746094, 0.9219624400138855, 1.78421151638031, 2.64646053314209, 3.508709669113159, 4.3709588050842285, 5.233207702636719, 6.095457077026367, 6.957705974578857, 7.819954872131348, 8.682204246520996, 9.544452667236328, 10.406702041625977, 11.268951416015625, 12.131200790405273, 12.993450164794922, 13.855698585510254, 14.717947959899902, 15.580196380615234, 16.442445755004883, 17.30469512939453, 18.16694450378418, 19.029193878173828, 19.891441345214844, 20.753690719604492, 21.61594009399414, 22.47818946838379, 23.340438842773438, 24.202686309814453, 25.0649356842041, 25.92718505859375, 26.7894344329834, 27.651683807373047]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 2.0, 10.0, 12.0, 14.0, 29.0, 46.0, 57.0, 96.0, 188.0, 266.0, 400.0, 730.0, 1154.0, 1775.0, 2920.0, 4478.0, 7081.0, 11092.0, 16888.0, 24953.0, 36283.0, 49771.0, 66355.0, 82756.0, 96606.0, 105579.0, 107513.0, 100503.0, 86836.0, 71121.0, 54122.0, 38891.0, 27570.0, 18525.0, 12246.0, 7941.0, 5113.0, 3253.0, 1951.0, 1297.0, 822.0, 514.0, 281.0, 176.0, 122.0, 78.0, 47.0, 38.0, 15.0, 14.0, 10.0, 7.0, 3.0, 5.0, 0.0, 1.0, 1.0, 3.0], "bins": [-12.671875, -12.2774658203125, -11.883056640625, -11.4886474609375, -11.09423828125, -10.6998291015625, -10.305419921875, -9.9110107421875, -9.5166015625, -9.1221923828125, -8.727783203125, -8.3333740234375, -7.93896484375, -7.5445556640625, -7.150146484375, -6.7557373046875, -6.361328125, -5.9669189453125, -5.572509765625, -5.1781005859375, -4.78369140625, -4.3892822265625, -3.994873046875, -3.6004638671875, -3.2060546875, -2.8116455078125, -2.417236328125, -2.0228271484375, -1.62841796875, -1.2340087890625, -0.839599609375, -0.4451904296875, -0.05078125, 0.3436279296875, 0.738037109375, 1.1324462890625, 1.52685546875, 1.9212646484375, 2.315673828125, 2.7100830078125, 3.1044921875, 3.4989013671875, 3.893310546875, 4.2877197265625, 4.68212890625, 5.0765380859375, 5.470947265625, 5.8653564453125, 6.259765625, 6.6541748046875, 7.048583984375, 7.4429931640625, 7.83740234375, 8.2318115234375, 8.626220703125, 9.0206298828125, 9.4150390625, 9.8094482421875, 10.203857421875, 10.5982666015625, 10.99267578125, 11.3870849609375, 11.781494140625, 12.1759033203125, 12.5703125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 2.0, 3.0, 9.0, 5.0, 11.0, 8.0, 12.0, 20.0, 17.0, 29.0, 22.0, 17.0, 22.0, 39.0, 29.0, 40.0, 37.0, 42.0, 40.0, 28.0, 47.0, 51.0, 44.0, 42.0, 48.0, 37.0, 33.0, 28.0, 29.0, 25.0, 19.0, 23.0, 18.0, 22.0, 15.0, 20.0, 15.0, 8.0, 7.0, 5.0, 7.0, 5.0, 8.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-26.5, -25.6240234375, -24.748046875, -23.8720703125, -22.99609375, -22.1201171875, -21.244140625, -20.3681640625, -19.4921875, -18.6162109375, -17.740234375, -16.8642578125, -15.98828125, -15.1123046875, -14.236328125, -13.3603515625, -12.484375, -11.6083984375, -10.732421875, -9.8564453125, -8.98046875, -8.1044921875, -7.228515625, -6.3525390625, -5.4765625, -4.6005859375, -3.724609375, -2.8486328125, -1.97265625, -1.0966796875, -0.220703125, 0.6552734375, 1.53125, 2.4072265625, 3.283203125, 4.1591796875, 5.03515625, 5.9111328125, 6.787109375, 7.6630859375, 8.5390625, 9.4150390625, 10.291015625, 11.1669921875, 12.04296875, 12.9189453125, 13.794921875, 14.6708984375, 15.546875, 16.4228515625, 17.298828125, 18.1748046875, 19.05078125, 19.9267578125, 20.802734375, 21.6787109375, 22.5546875, 23.4306640625, 24.306640625, 25.1826171875, 26.05859375, 26.9345703125, 27.810546875, 28.6865234375, 29.5625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 10.0, 16.0, 15.0, 42.0, 31.0, 70.0, 139.0, 211.0, 337.0, 529.0, 780.0, 1152.0, 1713.0, 2755.0, 4023.0, 5995.0, 8935.0, 13314.0, 19242.0, 27810.0, 39028.0, 52383.0, 67010.0, 81468.0, 93777.0, 100553.0, 100761.0, 94135.0, 82591.0, 67765.0, 52871.0, 39525.0, 28443.0, 19889.0, 13728.0, 9359.0, 6208.0, 4075.0, 2782.0, 1765.0, 1143.0, 734.0, 520.0, 345.0, 203.0, 143.0, 85.0, 53.0, 40.0, 32.0, 12.0, 10.0, 9.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.734375, -11.3436279296875, -10.952880859375, -10.5621337890625, -10.17138671875, -9.7806396484375, -9.389892578125, -8.9991455078125, -8.6083984375, -8.2176513671875, -7.826904296875, -7.4361572265625, -7.04541015625, -6.6546630859375, -6.263916015625, -5.8731689453125, -5.482421875, -5.0916748046875, -4.700927734375, -4.3101806640625, -3.91943359375, -3.5286865234375, -3.137939453125, -2.7471923828125, -2.3564453125, -1.9656982421875, -1.574951171875, -1.1842041015625, -0.79345703125, -0.4027099609375, -0.011962890625, 0.3787841796875, 0.76953125, 1.1602783203125, 1.551025390625, 1.9417724609375, 2.33251953125, 2.7232666015625, 3.114013671875, 3.5047607421875, 3.8955078125, 4.2862548828125, 4.677001953125, 5.0677490234375, 5.45849609375, 5.8492431640625, 6.239990234375, 6.6307373046875, 7.021484375, 7.4122314453125, 7.802978515625, 8.1937255859375, 8.58447265625, 8.9752197265625, 9.365966796875, 9.7567138671875, 10.1474609375, 10.5382080078125, 10.928955078125, 11.3197021484375, 11.71044921875, 12.1011962890625, 12.491943359375, 12.8826904296875, 13.2734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 5.0, 6.0, 4.0, 5.0, 8.0, 15.0, 11.0, 12.0, 13.0, 22.0, 18.0, 24.0, 19.0, 22.0, 31.0, 22.0, 35.0, 38.0, 41.0, 31.0, 29.0, 36.0, 42.0, 32.0, 41.0, 44.0, 33.0, 43.0, 25.0, 40.0, 23.0, 34.0, 24.0, 21.0, 22.0, 16.0, 20.0, 13.0, 15.0, 13.0, 11.0, 8.0, 6.0, 6.0, 8.0, 7.0, 3.0, 2.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5625, -13.066162109375, -12.56982421875, -12.073486328125, -11.5771484375, -11.080810546875, -10.58447265625, -10.088134765625, -9.591796875, -9.095458984375, -8.59912109375, -8.102783203125, -7.6064453125, -7.110107421875, -6.61376953125, -6.117431640625, -5.62109375, -5.124755859375, -4.62841796875, -4.132080078125, -3.6357421875, -3.139404296875, -2.64306640625, -2.146728515625, -1.650390625, -1.154052734375, -0.65771484375, -0.161376953125, 0.3349609375, 0.831298828125, 1.32763671875, 1.823974609375, 2.3203125, 2.816650390625, 3.31298828125, 3.809326171875, 4.3056640625, 4.802001953125, 5.29833984375, 5.794677734375, 6.291015625, 6.787353515625, 7.28369140625, 7.780029296875, 8.2763671875, 8.772705078125, 9.26904296875, 9.765380859375, 10.26171875, 10.758056640625, 11.25439453125, 11.750732421875, 12.2470703125, 12.743408203125, 13.23974609375, 13.736083984375, 14.232421875, 14.728759765625, 15.22509765625, 15.721435546875, 16.2177734375, 16.714111328125, 17.21044921875, 17.706787109375, 18.203125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 8.0, 9.0, 8.0, 15.0, 27.0, 42.0, 74.0, 96.0, 144.0, 247.0, 328.0, 486.0, 851.0, 1190.0, 1766.0, 2719.0, 4174.0, 6138.0, 9119.0, 13227.0, 19049.0, 26978.0, 37099.0, 48331.0, 61940.0, 75041.0, 87133.0, 94485.0, 96041.0, 92990.0, 83942.0, 71359.0, 57904.0, 44974.0, 33436.0, 24088.0, 17176.0, 11685.0, 7989.0, 5400.0, 3776.0, 2358.0, 1628.0, 1043.0, 710.0, 465.0, 278.0, 228.0, 125.0, 90.0, 52.0, 38.0, 26.0, 14.0, 7.0, 12.0, 2.0, 3.0, 4.0, 2.0], "bins": [-4.74609375, -4.599365234375, -4.45263671875, -4.305908203125, -4.1591796875, -4.012451171875, -3.86572265625, -3.718994140625, -3.572265625, -3.425537109375, -3.27880859375, -3.132080078125, -2.9853515625, -2.838623046875, -2.69189453125, -2.545166015625, -2.3984375, -2.251708984375, -2.10498046875, -1.958251953125, -1.8115234375, -1.664794921875, -1.51806640625, -1.371337890625, -1.224609375, -1.077880859375, -0.93115234375, -0.784423828125, -0.6376953125, -0.490966796875, -0.34423828125, -0.197509765625, -0.05078125, 0.095947265625, 0.24267578125, 0.389404296875, 0.5361328125, 0.682861328125, 0.82958984375, 0.976318359375, 1.123046875, 1.269775390625, 1.41650390625, 1.563232421875, 1.7099609375, 1.856689453125, 2.00341796875, 2.150146484375, 2.296875, 2.443603515625, 2.59033203125, 2.737060546875, 2.8837890625, 3.030517578125, 3.17724609375, 3.323974609375, 3.470703125, 3.617431640625, 3.76416015625, 3.910888671875, 4.0576171875, 4.204345703125, 4.35107421875, 4.497802734375, 4.64453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 2.0, 5.0, 8.0, 9.0, 14.0, 7.0, 14.0, 20.0, 26.0, 26.0, 38.0, 36.0, 46.0, 42.0, 46.0, 54.0, 52.0, 62.0, 53.0, 52.0, 41.0, 61.0, 47.0, 45.0, 27.0, 26.0, 30.0, 28.0, 17.0, 14.0, 10.0, 8.0, 13.0, 7.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008568763732910156, -0.0008325502276420593, -0.000808224081993103, -0.0007838979363441467, -0.0007595717906951904, -0.0007352456450462341, -0.0007109194993972778, -0.0006865933537483215, -0.0006622672080993652, -0.0006379410624504089, -0.0006136149168014526, -0.0005892887711524963, -0.00056496262550354, -0.0005406364798545837, -0.0005163103342056274, -0.0004919841885566711, -0.00046765804290771484, -0.00044333189725875854, -0.00041900575160980225, -0.00039467960596084595, -0.00037035346031188965, -0.00034602731466293335, -0.00032170116901397705, -0.00029737502336502075, -0.00027304887771606445, -0.00024872273206710815, -0.00022439658641815186, -0.00020007044076919556, -0.00017574429512023926, -0.00015141814947128296, -0.00012709200382232666, -0.00010276585817337036, -7.843971252441406e-05, -5.4113566875457764e-05, -2.9787421226501465e-05, -5.461275577545166e-06, 1.8864870071411133e-05, 4.319101572036743e-05, 6.751716136932373e-05, 9.184330701828003e-05, 0.00011616945266723633, 0.00014049559831619263, 0.00016482174396514893, 0.00018914788961410522, 0.00021347403526306152, 0.00023780018091201782, 0.0002621263265609741, 0.0002864524722099304, 0.0003107786178588867, 0.000335104763507843, 0.0003594309091567993, 0.0003837570548057556, 0.0004080832004547119, 0.0004324093461036682, 0.0004567354917526245, 0.0004810616374015808, 0.0005053877830505371, 0.0005297139286994934, 0.0005540400743484497, 0.000578366219997406, 0.0006026923656463623, 0.0006270185112953186, 0.0006513446569442749, 0.0006756708025932312, 0.0006999969482421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 5.0, 5.0, 8.0, 18.0, 14.0, 22.0, 45.0, 55.0, 80.0, 146.0, 196.0, 259.0, 405.0, 663.0, 961.0, 1494.0, 2276.0, 3593.0, 5282.0, 7793.0, 11674.0, 17082.0, 24875.0, 34828.0, 47599.0, 62167.0, 77511.0, 91029.0, 99671.0, 102343.0, 97613.0, 86560.0, 72687.0, 57106.0, 43278.0, 31297.0, 22184.0, 15198.0, 10332.0, 6904.0, 4500.0, 3021.0, 2005.0, 1311.0, 837.0, 528.0, 367.0, 253.0, 153.0, 98.0, 70.0, 55.0, 32.0, 27.0, 22.0, 10.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0], "bins": [-5.15625, -4.99169921875, -4.8271484375, -4.66259765625, -4.498046875, -4.33349609375, -4.1689453125, -4.00439453125, -3.83984375, -3.67529296875, -3.5107421875, -3.34619140625, -3.181640625, -3.01708984375, -2.8525390625, -2.68798828125, -2.5234375, -2.35888671875, -2.1943359375, -2.02978515625, -1.865234375, -1.70068359375, -1.5361328125, -1.37158203125, -1.20703125, -1.04248046875, -0.8779296875, -0.71337890625, -0.548828125, -0.38427734375, -0.2197265625, -0.05517578125, 0.109375, 0.27392578125, 0.4384765625, 0.60302734375, 0.767578125, 0.93212890625, 1.0966796875, 1.26123046875, 1.42578125, 1.59033203125, 1.7548828125, 1.91943359375, 2.083984375, 2.24853515625, 2.4130859375, 2.57763671875, 2.7421875, 2.90673828125, 3.0712890625, 3.23583984375, 3.400390625, 3.56494140625, 3.7294921875, 3.89404296875, 4.05859375, 4.22314453125, 4.3876953125, 4.55224609375, 4.716796875, 4.88134765625, 5.0458984375, 5.21044921875, 5.375]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 9.0, 7.0, 7.0, 14.0, 15.0, 16.0, 22.0, 23.0, 27.0, 31.0, 28.0, 38.0, 41.0, 39.0, 38.0, 67.0, 54.0, 69.0, 43.0, 50.0, 33.0, 48.0, 32.0, 47.0, 22.0, 25.0, 35.0, 15.0, 13.0, 12.0, 13.0, 12.0, 6.0, 6.0, 8.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.080078125, -2.9876708984375, -2.895263671875, -2.8028564453125, -2.71044921875, -2.6180419921875, -2.525634765625, -2.4332275390625, -2.3408203125, -2.2484130859375, -2.156005859375, -2.0635986328125, -1.97119140625, -1.8787841796875, -1.786376953125, -1.6939697265625, -1.6015625, -1.5091552734375, -1.416748046875, -1.3243408203125, -1.23193359375, -1.1395263671875, -1.047119140625, -0.9547119140625, -0.8623046875, -0.7698974609375, -0.677490234375, -0.5850830078125, -0.49267578125, -0.4002685546875, -0.307861328125, -0.2154541015625, -0.123046875, -0.0306396484375, 0.061767578125, 0.1541748046875, 0.24658203125, 0.3389892578125, 0.431396484375, 0.5238037109375, 0.6162109375, 0.7086181640625, 0.801025390625, 0.8934326171875, 0.98583984375, 1.0782470703125, 1.170654296875, 1.2630615234375, 1.35546875, 1.4478759765625, 1.540283203125, 1.6326904296875, 1.72509765625, 1.8175048828125, 1.909912109375, 2.0023193359375, 2.0947265625, 2.1871337890625, 2.279541015625, 2.3719482421875, 2.46435546875, 2.5567626953125, 2.649169921875, 2.7415771484375, 2.833984375]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 3.0, 8.0, 13.0, 11.0, 14.0, 21.0, 18.0, 22.0, 25.0, 28.0, 39.0, 42.0, 36.0, 47.0, 45.0, 55.0, 46.0, 44.0, 55.0, 44.0, 47.0, 51.0, 39.0, 33.0, 35.0, 34.0, 23.0, 17.0, 26.0, 12.0, 19.0, 10.0, 7.0, 5.0, 7.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.06755828857422, -25.234371185302734, -24.401185989379883, -23.5679988861084, -22.734811782836914, -21.901626586914062, -21.068439483642578, -20.235252380371094, -19.40206527709961, -18.568878173828125, -17.735692977905273, -16.90250587463379, -16.069318771362305, -15.236132621765137, -14.402946472167969, -13.569759368896484, -12.736574172973633, -11.903388023376465, -11.07020092010498, -10.237014770507812, -9.403827667236328, -8.57064151763916, -7.737455368041992, -6.904268741607666, -6.07108211517334, -5.237895488739014, -4.4047088623046875, -3.5715227127075195, -2.7383360862731934, -1.9051494598388672, -1.0719633102416992, -0.23877668380737305, 0.5944080352783203, 1.427594542503357, 2.2607810497283936, 3.0939674377441406, 3.927154064178467, 4.760340690612793, 5.593526840209961, 6.426713466644287, 7.259900093078613, 8.093086242675781, 8.926273345947266, 9.759459495544434, 10.592645645141602, 11.425832748413086, 12.259018898010254, 13.092205047607422, 13.925392150878906, 14.758578300476074, 15.591765403747559, 16.424951553344727, 17.25813865661621, 18.091323852539062, 18.924510955810547, 19.75769805908203, 20.590885162353516, 21.424072265625, 22.25725746154785, 23.090444564819336, 23.92363166809082, 24.756816864013672, 25.590003967285156, 26.42319107055664, 27.256376266479492]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 6.0, 3.0, 10.0, 13.0, 21.0, 17.0, 19.0, 22.0, 18.0, 38.0, 42.0, 31.0, 36.0, 36.0, 46.0, 48.0, 42.0, 46.0, 46.0, 33.0, 51.0, 47.0, 45.0, 28.0, 32.0, 39.0, 27.0, 30.0, 13.0, 21.0, 16.0, 15.0, 16.0, 13.0, 10.0, 3.0, 4.0, 2.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.075557708740234, -31.07522201538086, -30.074886322021484, -29.07455062866211, -28.074214935302734, -27.07387924194336, -26.073545455932617, -25.073209762573242, -24.072874069213867, -23.072538375854492, -22.072202682495117, -21.071866989135742, -20.071533203125, -19.071197509765625, -18.07086181640625, -17.070526123046875, -16.0701904296875, -15.069854736328125, -14.06951904296875, -13.069184303283691, -12.068848609924316, -11.068512916564941, -10.068178176879883, -9.067842483520508, -8.067506790161133, -7.067171096801758, -6.066835880279541, -5.066500663757324, -4.066164970397949, -3.065829277038574, -2.0654940605163574, -1.0651588439941406, -0.06482124328613281, 0.9355142116546631, 1.935849666595459, 2.936185121536255, 3.936520576477051, 4.936856269836426, 5.937191486358643, 6.937526702880859, 7.937862396240234, 8.93819808959961, 9.938533782958984, 10.938868522644043, 11.939204216003418, 12.939539909362793, 13.939874649047852, 14.940210342407227, 15.940546035766602, 16.940881729125977, 17.94121742248535, 18.941553115844727, 19.94188690185547, 20.942222595214844, 21.94255828857422, 22.942893981933594, 23.94322967529297, 24.943565368652344, 25.94390106201172, 26.944236755371094, 27.94457244873047, 28.944908142089844, 29.945241928100586, 30.94557762145996, 31.945913314819336]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 16.0, 24.0, 38.0, 41.0, 76.0, 131.0, 208.0, 284.0, 472.0, 720.0, 1187.0, 1884.0, 3099.0, 4823.0, 8032.0, 13397.0, 21877.0, 36263.0, 58998.0, 95589.0, 150510.0, 230285.0, 331372.0, 438991.0, 521952.0, 544422.0, 496578.0, 401689.0, 293403.0, 198392.0, 128964.0, 80839.0, 50005.0, 30536.0, 18804.0, 11480.0, 7141.0, 4320.0, 2718.0, 1685.0, 1024.0, 701.0, 457.0, 301.0, 208.0, 131.0, 72.0, 60.0, 34.0, 16.0, 12.0, 8.0, 7.0, 0.0, 3.0, 2.0, 2.0, 2.0], "bins": [-21.5625, -20.874267578125, -20.18603515625, -19.497802734375, -18.8095703125, -18.121337890625, -17.43310546875, -16.744873046875, -16.056640625, -15.368408203125, -14.68017578125, -13.991943359375, -13.3037109375, -12.615478515625, -11.92724609375, -11.239013671875, -10.55078125, -9.862548828125, -9.17431640625, -8.486083984375, -7.7978515625, -7.109619140625, -6.42138671875, -5.733154296875, -5.044921875, -4.356689453125, -3.66845703125, -2.980224609375, -2.2919921875, -1.603759765625, -0.91552734375, -0.227294921875, 0.4609375, 1.149169921875, 1.83740234375, 2.525634765625, 3.2138671875, 3.902099609375, 4.59033203125, 5.278564453125, 5.966796875, 6.655029296875, 7.34326171875, 8.031494140625, 8.7197265625, 9.407958984375, 10.09619140625, 10.784423828125, 11.47265625, 12.160888671875, 12.84912109375, 13.537353515625, 14.2255859375, 14.913818359375, 15.60205078125, 16.290283203125, 16.978515625, 17.666748046875, 18.35498046875, 19.043212890625, 19.7314453125, 20.419677734375, 21.10791015625, 21.796142578125, 22.484375]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 3.0, 8.0, 6.0, 10.0, 8.0, 12.0, 22.0, 16.0, 22.0, 21.0, 22.0, 26.0, 25.0, 22.0, 40.0, 37.0, 38.0, 44.0, 27.0, 29.0, 45.0, 36.0, 38.0, 34.0, 39.0, 40.0, 37.0, 34.0, 30.0, 31.0, 24.0, 19.0, 17.0, 22.0, 17.0, 11.0, 18.0, 9.0, 13.0, 8.0, 6.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-22.640625, -21.90966796875, -21.1787109375, -20.44775390625, -19.716796875, -18.98583984375, -18.2548828125, -17.52392578125, -16.79296875, -16.06201171875, -15.3310546875, -14.60009765625, -13.869140625, -13.13818359375, -12.4072265625, -11.67626953125, -10.9453125, -10.21435546875, -9.4833984375, -8.75244140625, -8.021484375, -7.29052734375, -6.5595703125, -5.82861328125, -5.09765625, -4.36669921875, -3.6357421875, -2.90478515625, -2.173828125, -1.44287109375, -0.7119140625, 0.01904296875, 0.75, 1.48095703125, 2.2119140625, 2.94287109375, 3.673828125, 4.40478515625, 5.1357421875, 5.86669921875, 6.59765625, 7.32861328125, 8.0595703125, 8.79052734375, 9.521484375, 10.25244140625, 10.9833984375, 11.71435546875, 12.4453125, 13.17626953125, 13.9072265625, 14.63818359375, 15.369140625, 16.10009765625, 16.8310546875, 17.56201171875, 18.29296875, 19.02392578125, 19.7548828125, 20.48583984375, 21.216796875, 21.94775390625, 22.6787109375, 23.40966796875, 24.140625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 9.0, 10.0, 16.0, 13.0, 27.0, 50.0, 97.0, 117.0, 190.0, 348.0, 561.0, 860.0, 1431.0, 2614.0, 4233.0, 7167.0, 12161.0, 20381.0, 33601.0, 56078.0, 90238.0, 140936.0, 213376.0, 302174.0, 397807.0, 476931.0, 514797.0, 493017.0, 425719.0, 332778.0, 238705.0, 161573.0, 103016.0, 65076.0, 39695.0, 23625.0, 14126.0, 8343.0, 5000.0, 2908.0, 1792.0, 1096.0, 639.0, 389.0, 212.0, 146.0, 81.0, 48.0, 32.0, 28.0, 15.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.296875, -22.536865234375, -21.77685546875, -21.016845703125, -20.2568359375, -19.496826171875, -18.73681640625, -17.976806640625, -17.216796875, -16.456787109375, -15.69677734375, -14.936767578125, -14.1767578125, -13.416748046875, -12.65673828125, -11.896728515625, -11.13671875, -10.376708984375, -9.61669921875, -8.856689453125, -8.0966796875, -7.336669921875, -6.57666015625, -5.816650390625, -5.056640625, -4.296630859375, -3.53662109375, -2.776611328125, -2.0166015625, -1.256591796875, -0.49658203125, 0.263427734375, 1.0234375, 1.783447265625, 2.54345703125, 3.303466796875, 4.0634765625, 4.823486328125, 5.58349609375, 6.343505859375, 7.103515625, 7.863525390625, 8.62353515625, 9.383544921875, 10.1435546875, 10.903564453125, 11.66357421875, 12.423583984375, 13.18359375, 13.943603515625, 14.70361328125, 15.463623046875, 16.2236328125, 16.983642578125, 17.74365234375, 18.503662109375, 19.263671875, 20.023681640625, 20.78369140625, 21.543701171875, 22.3037109375, 23.063720703125, 23.82373046875, 24.583740234375, 25.34375]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 4.0, 8.0, 15.0, 15.0, 23.0, 23.0, 29.0, 40.0, 42.0, 73.0, 88.0, 108.0, 124.0, 131.0, 158.0, 181.0, 200.0, 211.0, 229.0, 242.0, 249.0, 221.0, 217.0, 231.0, 209.0, 162.0, 143.0, 121.0, 115.0, 97.0, 64.0, 72.0, 62.0, 39.0, 26.0, 30.0, 20.0, 19.0, 8.0, 12.0, 2.0, 4.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3046875, -11.8741455078125, -11.443603515625, -11.0130615234375, -10.58251953125, -10.1519775390625, -9.721435546875, -9.2908935546875, -8.8603515625, -8.4298095703125, -7.999267578125, -7.5687255859375, -7.13818359375, -6.7076416015625, -6.277099609375, -5.8465576171875, -5.416015625, -4.9854736328125, -4.554931640625, -4.1243896484375, -3.69384765625, -3.2633056640625, -2.832763671875, -2.4022216796875, -1.9716796875, -1.5411376953125, -1.110595703125, -0.6800537109375, -0.24951171875, 0.1810302734375, 0.611572265625, 1.0421142578125, 1.47265625, 1.9031982421875, 2.333740234375, 2.7642822265625, 3.19482421875, 3.6253662109375, 4.055908203125, 4.4864501953125, 4.9169921875, 5.3475341796875, 5.778076171875, 6.2086181640625, 6.63916015625, 7.0697021484375, 7.500244140625, 7.9307861328125, 8.361328125, 8.7918701171875, 9.222412109375, 9.6529541015625, 10.08349609375, 10.5140380859375, 10.944580078125, 11.3751220703125, 11.8056640625, 12.2362060546875, 12.666748046875, 13.0972900390625, 13.52783203125, 13.9583740234375, 14.388916015625, 14.8194580078125, 15.25]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 7.0, 9.0, 8.0, 15.0, 22.0, 15.0, 31.0, 45.0, 42.0, 45.0, 46.0, 59.0, 53.0, 60.0, 46.0, 65.0, 63.0, 47.0, 43.0, 36.0, 38.0, 37.0, 29.0, 31.0, 23.0, 21.0, 15.0, 11.0, 9.0, 7.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.91691589355469, -33.7827033996582, -32.64848709106445, -31.514272689819336, -30.38005828857422, -29.2458438873291, -28.111629486083984, -26.9774169921875, -25.84320068359375, -24.708986282348633, -23.574771881103516, -22.4405574798584, -21.30634307861328, -20.172128677368164, -19.037914276123047, -17.903701782226562, -16.769487380981445, -15.635272979736328, -14.501058578491211, -13.366844177246094, -12.232629776000977, -11.09841537475586, -9.964201927185059, -8.829987525939941, -7.695773124694824, -6.561558723449707, -5.42734432220459, -4.293130397796631, -3.1589159965515137, -2.0247015953063965, -0.8904876708984375, 0.2437267303466797, 1.3779411315917969, 2.512155532836914, 3.646369695663452, 4.78058385848999, 5.914798259735107, 7.049012660980225, 8.183226585388184, 9.3174409866333, 10.451655387878418, 11.585869789123535, 12.720084190368652, 13.854297637939453, 14.98851203918457, 16.122726440429688, 17.256940841674805, 18.391155242919922, 19.52536964416504, 20.659584045410156, 21.793798446655273, 22.92801284790039, 24.062227249145508, 25.196441650390625, 26.33065414428711, 27.46487045288086, 28.599082946777344, 29.73329734802246, 30.867511749267578, 32.00172424316406, 33.13594055175781, 34.2701530456543, 35.40436935424805, 36.53858184814453, 37.67279815673828]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 7.0, 11.0, 8.0, 10.0, 6.0, 15.0, 18.0, 18.0, 24.0, 33.0, 36.0, 31.0, 53.0, 45.0, 49.0, 56.0, 43.0, 69.0, 52.0, 36.0, 47.0, 36.0, 38.0, 36.0, 34.0, 31.0, 27.0, 22.0, 28.0, 16.0, 20.0, 12.0, 14.0, 7.0, 2.0, 9.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.79008865356445, -33.54605484008789, -32.30202102661133, -31.057987213134766, -29.813953399658203, -28.56991958618164, -27.325883865356445, -26.081850051879883, -24.83781623840332, -23.593782424926758, -22.349748611450195, -21.105714797973633, -19.861679077148438, -18.617645263671875, -17.373611450195312, -16.12957763671875, -14.885543823242188, -13.641510009765625, -12.397476196289062, -11.153441429138184, -9.909407615661621, -8.665373802185059, -7.421339511871338, -6.177305221557617, -4.933271408081055, -3.689237356185913, -2.4452033042907715, -1.2011692523956299, 0.04286479949951172, 1.2868986129760742, 2.530932903289795, 3.7749671936035156, 5.019004821777344, 6.263038635253906, 7.507072925567627, 8.751107215881348, 9.99514102935791, 11.239174842834473, 12.483209609985352, 13.727243423461914, 14.971277236938477, 16.21531105041504, 17.4593448638916, 18.703378677368164, 19.94741439819336, 21.191448211669922, 22.435482025146484, 23.679515838623047, 24.92354965209961, 26.167583465576172, 27.411617279052734, 28.655651092529297, 29.89968490600586, 31.143718719482422, 32.387752532958984, 33.63179016113281, 34.875823974609375, 36.11985778808594, 37.3638916015625, 38.60792541503906, 39.851959228515625, 41.09599304199219, 42.34002685546875, 43.58406066894531, 44.828094482421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 13.0, 12.0, 25.0, 41.0, 100.0, 143.0, 223.0, 330.0, 599.0, 1104.0, 1888.0, 3131.0, 5522.0, 10008.0, 17834.0, 30884.0, 51831.0, 82168.0, 117576.0, 148072.0, 157064.0, 139132.0, 106039.0, 71185.0, 43904.0, 25919.0, 14518.0, 8364.0, 4597.0, 2797.0, 1430.0, 834.0, 505.0, 287.0, 190.0, 114.0, 66.0, 38.0, 23.0, 14.0, 8.0, 9.0, 3.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0, -8.7127685546875, -8.425537109375, -8.1383056640625, -7.85107421875, -7.5638427734375, -7.276611328125, -6.9893798828125, -6.7021484375, -6.4149169921875, -6.127685546875, -5.8404541015625, -5.55322265625, -5.2659912109375, -4.978759765625, -4.6915283203125, -4.404296875, -4.1170654296875, -3.829833984375, -3.5426025390625, -3.25537109375, -2.9681396484375, -2.680908203125, -2.3936767578125, -2.1064453125, -1.8192138671875, -1.531982421875, -1.2447509765625, -0.95751953125, -0.6702880859375, -0.383056640625, -0.0958251953125, 0.19140625, 0.4786376953125, 0.765869140625, 1.0531005859375, 1.34033203125, 1.6275634765625, 1.914794921875, 2.2020263671875, 2.4892578125, 2.7764892578125, 3.063720703125, 3.3509521484375, 3.63818359375, 3.9254150390625, 4.212646484375, 4.4998779296875, 4.787109375, 5.0743408203125, 5.361572265625, 5.6488037109375, 5.93603515625, 6.2232666015625, 6.510498046875, 6.7977294921875, 7.0849609375, 7.3721923828125, 7.659423828125, 7.9466552734375, 8.23388671875, 8.5211181640625, 8.808349609375, 9.0955810546875, 9.3828125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 3.0, 4.0, 5.0, 13.0, 9.0, 13.0, 19.0, 17.0, 20.0, 29.0, 35.0, 49.0, 51.0, 45.0, 46.0, 51.0, 48.0, 60.0, 54.0, 47.0, 41.0, 39.0, 33.0, 40.0, 36.0, 32.0, 30.0, 20.0, 19.0, 21.0, 22.0, 9.0, 15.0, 5.0, 5.0, 8.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.34375, -36.0517578125, -34.759765625, -33.4677734375, -32.17578125, -30.8837890625, -29.591796875, -28.2998046875, -27.0078125, -25.7158203125, -24.423828125, -23.1318359375, -21.83984375, -20.5478515625, -19.255859375, -17.9638671875, -16.671875, -15.3798828125, -14.087890625, -12.7958984375, -11.50390625, -10.2119140625, -8.919921875, -7.6279296875, -6.3359375, -5.0439453125, -3.751953125, -2.4599609375, -1.16796875, 0.1240234375, 1.416015625, 2.7080078125, 4.0, 5.2919921875, 6.583984375, 7.8759765625, 9.16796875, 10.4599609375, 11.751953125, 13.0439453125, 14.3359375, 15.6279296875, 16.919921875, 18.2119140625, 19.50390625, 20.7958984375, 22.087890625, 23.3798828125, 24.671875, 25.9638671875, 27.255859375, 28.5478515625, 29.83984375, 31.1318359375, 32.423828125, 33.7158203125, 35.0078125, 36.2998046875, 37.591796875, 38.8837890625, 40.17578125, 41.4677734375, 42.759765625, 44.0517578125, 45.34375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 7.0, 14.0, 10.0, 16.0, 32.0, 46.0, 73.0, 77.0, 141.0, 227.0, 337.0, 548.0, 831.0, 1311.0, 2099.0, 3420.0, 5489.0, 9195.0, 14906.0, 24105.0, 38481.0, 60985.0, 90174.0, 124276.0, 149165.0, 148183.0, 124056.0, 89444.0, 60079.0, 38597.0, 23927.0, 14810.0, 9113.0, 5388.0, 3385.0, 2023.0, 1247.0, 845.0, 501.0, 336.0, 190.0, 147.0, 103.0, 65.0, 43.0, 32.0, 17.0, 14.0, 14.0, 18.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-9.765625, -9.4696044921875, -9.173583984375, -8.8775634765625, -8.58154296875, -8.2855224609375, -7.989501953125, -7.6934814453125, -7.3974609375, -7.1014404296875, -6.805419921875, -6.5093994140625, -6.21337890625, -5.9173583984375, -5.621337890625, -5.3253173828125, -5.029296875, -4.7332763671875, -4.437255859375, -4.1412353515625, -3.84521484375, -3.5491943359375, -3.253173828125, -2.9571533203125, -2.6611328125, -2.3651123046875, -2.069091796875, -1.7730712890625, -1.47705078125, -1.1810302734375, -0.885009765625, -0.5889892578125, -0.29296875, 0.0030517578125, 0.299072265625, 0.5950927734375, 0.89111328125, 1.1871337890625, 1.483154296875, 1.7791748046875, 2.0751953125, 2.3712158203125, 2.667236328125, 2.9632568359375, 3.25927734375, 3.5552978515625, 3.851318359375, 4.1473388671875, 4.443359375, 4.7393798828125, 5.035400390625, 5.3314208984375, 5.62744140625, 5.9234619140625, 6.219482421875, 6.5155029296875, 6.8115234375, 7.1075439453125, 7.403564453125, 7.6995849609375, 7.99560546875, 8.2916259765625, 8.587646484375, 8.8836669921875, 9.1796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 7.0, 5.0, 4.0, 10.0, 11.0, 6.0, 13.0, 19.0, 13.0, 18.0, 13.0, 24.0, 27.0, 32.0, 42.0, 39.0, 37.0, 48.0, 41.0, 49.0, 39.0, 42.0, 33.0, 39.0, 43.0, 41.0, 35.0, 30.0, 24.0, 39.0, 36.0, 24.0, 12.0, 17.0, 15.0, 18.0, 16.0, 3.0, 4.0, 13.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.46875, -18.85986328125, -18.2509765625, -17.64208984375, -17.033203125, -16.42431640625, -15.8154296875, -15.20654296875, -14.59765625, -13.98876953125, -13.3798828125, -12.77099609375, -12.162109375, -11.55322265625, -10.9443359375, -10.33544921875, -9.7265625, -9.11767578125, -8.5087890625, -7.89990234375, -7.291015625, -6.68212890625, -6.0732421875, -5.46435546875, -4.85546875, -4.24658203125, -3.6376953125, -3.02880859375, -2.419921875, -1.81103515625, -1.2021484375, -0.59326171875, 0.015625, 0.62451171875, 1.2333984375, 1.84228515625, 2.451171875, 3.06005859375, 3.6689453125, 4.27783203125, 4.88671875, 5.49560546875, 6.1044921875, 6.71337890625, 7.322265625, 7.93115234375, 8.5400390625, 9.14892578125, 9.7578125, 10.36669921875, 10.9755859375, 11.58447265625, 12.193359375, 12.80224609375, 13.4111328125, 14.02001953125, 14.62890625, 15.23779296875, 15.8466796875, 16.45556640625, 17.064453125, 17.67333984375, 18.2822265625, 18.89111328125, 19.5]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 10.0, 12.0, 25.0, 34.0, 54.0, 80.0, 100.0, 185.0, 288.0, 504.0, 838.0, 1297.0, 2203.0, 3787.0, 6606.0, 11617.0, 19980.0, 34755.0, 57603.0, 93602.0, 139546.0, 174101.0, 168569.0, 126701.0, 83616.0, 50908.0, 29839.0, 17303.0, 9978.0, 5982.0, 3332.0, 2015.0, 1187.0, 719.0, 446.0, 245.0, 165.0, 107.0, 74.0, 49.0, 40.0, 20.0, 11.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4296875, -4.29071044921875, -4.1517333984375, -4.01275634765625, -3.873779296875, -3.73480224609375, -3.5958251953125, -3.45684814453125, -3.31787109375, -3.17889404296875, -3.0399169921875, -2.90093994140625, -2.761962890625, -2.62298583984375, -2.4840087890625, -2.34503173828125, -2.2060546875, -2.06707763671875, -1.9281005859375, -1.78912353515625, -1.650146484375, -1.51116943359375, -1.3721923828125, -1.23321533203125, -1.09423828125, -0.95526123046875, -0.8162841796875, -0.67730712890625, -0.538330078125, -0.39935302734375, -0.2603759765625, -0.12139892578125, 0.017578125, 0.15655517578125, 0.2955322265625, 0.43450927734375, 0.573486328125, 0.71246337890625, 0.8514404296875, 0.99041748046875, 1.12939453125, 1.26837158203125, 1.4073486328125, 1.54632568359375, 1.685302734375, 1.82427978515625, 1.9632568359375, 2.10223388671875, 2.2412109375, 2.38018798828125, 2.5191650390625, 2.65814208984375, 2.797119140625, 2.93609619140625, 3.0750732421875, 3.21405029296875, 3.35302734375, 3.49200439453125, 3.6309814453125, 3.76995849609375, 3.908935546875, 4.04791259765625, 4.1868896484375, 4.32586669921875, 4.46484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 7.0, 6.0, 14.0, 12.0, 15.0, 19.0, 15.0, 19.0, 16.0, 25.0, 32.0, 29.0, 42.0, 41.0, 50.0, 47.0, 58.0, 50.0, 45.0, 44.0, 45.0, 47.0, 45.0, 39.0, 38.0, 38.0, 25.0, 19.0, 17.0, 23.0, 18.0, 12.0, 10.0, 7.0, 9.0, 5.0, 5.0, 6.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.00028514862060546875, -0.0002774149179458618, -0.0002696812152862549, -0.00026194751262664795, -0.000254213809967041, -0.0002464801073074341, -0.00023874640464782715, -0.00023101270198822021, -0.00022327899932861328, -0.00021554529666900635, -0.00020781159400939941, -0.00020007789134979248, -0.00019234418869018555, -0.0001846104860305786, -0.00017687678337097168, -0.00016914308071136475, -0.0001614093780517578, -0.00015367567539215088, -0.00014594197273254395, -0.000138208270072937, -0.00013047456741333008, -0.00012274086475372314, -0.00011500716209411621, -0.00010727345943450928, -9.953975677490234e-05, -9.180605411529541e-05, -8.407235145568848e-05, -7.633864879608154e-05, -6.860494613647461e-05, -6.0871243476867676e-05, -5.313754081726074e-05, -4.540383815765381e-05, -3.7670135498046875e-05, -2.993643283843994e-05, -2.2202730178833008e-05, -1.4469027519226074e-05, -6.735324859619141e-06, 9.98377799987793e-07, 8.732080459594727e-06, 1.646578311920166e-05, 2.4199485778808594e-05, 3.193318843841553e-05, 3.966689109802246e-05, 4.7400593757629395e-05, 5.513429641723633e-05, 6.286799907684326e-05, 7.06017017364502e-05, 7.833540439605713e-05, 8.606910705566406e-05, 9.3802809715271e-05, 0.00010153651237487793, 0.00010927021503448486, 0.0001170039176940918, 0.00012473762035369873, 0.00013247132301330566, 0.0001402050256729126, 0.00014793872833251953, 0.00015567243099212646, 0.0001634061336517334, 0.00017113983631134033, 0.00017887353897094727, 0.0001866072416305542, 0.00019434094429016113, 0.00020207464694976807, 0.000209808349609375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 2.0, 4.0, 7.0, 8.0, 15.0, 20.0, 42.0, 44.0, 67.0, 89.0, 157.0, 219.0, 357.0, 564.0, 756.0, 1299.0, 1931.0, 2881.0, 4486.0, 6820.0, 9907.0, 14869.0, 21441.0, 30608.0, 43147.0, 58303.0, 74589.0, 92083.0, 104036.0, 109370.0, 104684.0, 91804.0, 75513.0, 58169.0, 43214.0, 30981.0, 21474.0, 14814.0, 10074.0, 6729.0, 4371.0, 2972.0, 1981.0, 1264.0, 790.0, 567.0, 364.0, 220.0, 156.0, 115.0, 66.0, 56.0, 27.0, 19.0, 7.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0], "bins": [-3.703125, -3.589202880859375, -3.47528076171875, -3.361358642578125, -3.2474365234375, -3.133514404296875, -3.01959228515625, -2.905670166015625, -2.791748046875, -2.677825927734375, -2.56390380859375, -2.449981689453125, -2.3360595703125, -2.222137451171875, -2.10821533203125, -1.994293212890625, -1.88037109375, -1.766448974609375, -1.65252685546875, -1.538604736328125, -1.4246826171875, -1.310760498046875, -1.19683837890625, -1.082916259765625, -0.968994140625, -0.855072021484375, -0.74114990234375, -0.627227783203125, -0.5133056640625, -0.399383544921875, -0.28546142578125, -0.171539306640625, -0.0576171875, 0.056304931640625, 0.17022705078125, 0.284149169921875, 0.3980712890625, 0.511993408203125, 0.62591552734375, 0.739837646484375, 0.853759765625, 0.967681884765625, 1.08160400390625, 1.195526123046875, 1.3094482421875, 1.423370361328125, 1.53729248046875, 1.651214599609375, 1.76513671875, 1.879058837890625, 1.99298095703125, 2.106903076171875, 2.2208251953125, 2.334747314453125, 2.44866943359375, 2.562591552734375, 2.676513671875, 2.790435791015625, 2.90435791015625, 3.018280029296875, 3.1322021484375, 3.246124267578125, 3.36004638671875, 3.473968505859375, 3.587890625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 5.0, 4.0, 7.0, 13.0, 8.0, 9.0, 10.0, 11.0, 20.0, 26.0, 24.0, 33.0, 29.0, 37.0, 40.0, 42.0, 44.0, 49.0, 57.0, 49.0, 40.0, 54.0, 47.0, 35.0, 50.0, 39.0, 41.0, 33.0, 20.0, 35.0, 16.0, 12.0, 14.0, 6.0, 7.0, 12.0, 4.0, 8.0, 4.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.78125, -1.720489501953125, -1.65972900390625, -1.598968505859375, -1.5382080078125, -1.477447509765625, -1.41668701171875, -1.355926513671875, -1.295166015625, -1.234405517578125, -1.17364501953125, -1.112884521484375, -1.0521240234375, -0.991363525390625, -0.93060302734375, -0.869842529296875, -0.80908203125, -0.748321533203125, -0.68756103515625, -0.626800537109375, -0.5660400390625, -0.505279541015625, -0.44451904296875, -0.383758544921875, -0.322998046875, -0.262237548828125, -0.20147705078125, -0.140716552734375, -0.0799560546875, -0.019195556640625, 0.04156494140625, 0.102325439453125, 0.1630859375, 0.223846435546875, 0.28460693359375, 0.345367431640625, 0.4061279296875, 0.466888427734375, 0.52764892578125, 0.588409423828125, 0.649169921875, 0.709930419921875, 0.77069091796875, 0.831451416015625, 0.8922119140625, 0.952972412109375, 1.01373291015625, 1.074493408203125, 1.13525390625, 1.196014404296875, 1.25677490234375, 1.317535400390625, 1.3782958984375, 1.439056396484375, 1.49981689453125, 1.560577392578125, 1.621337890625, 1.682098388671875, 1.74285888671875, 1.803619384765625, 1.8643798828125, 1.925140380859375, 1.98590087890625, 2.046661376953125, 2.107421875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 7.0, 10.0, 16.0, 7.0, 19.0, 22.0, 38.0, 44.0, 43.0, 36.0, 64.0, 48.0, 59.0, 50.0, 55.0, 64.0, 56.0, 53.0, 40.0, 34.0, 39.0, 36.0, 39.0, 18.0, 26.0, 20.0, 11.0, 7.0, 9.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.52968978881836, -33.39360809326172, -32.257530212402344, -31.121450424194336, -29.985370635986328, -28.84929084777832, -27.713211059570312, -26.577131271362305, -25.441051483154297, -24.30497169494629, -23.16889190673828, -22.032812118530273, -20.896732330322266, -19.760652542114258, -18.62457275390625, -17.488492965698242, -16.352413177490234, -15.216333389282227, -14.080253601074219, -12.944173812866211, -11.808094024658203, -10.672014236450195, -9.535934448242188, -8.39985466003418, -7.263774871826172, -6.127695083618164, -4.991615295410156, -3.8555355072021484, -2.7194557189941406, -1.5833759307861328, -0.447296142578125, 0.6887836456298828, 1.8248634338378906, 2.9609432220458984, 4.097023010253906, 5.233102798461914, 6.369182586669922, 7.50526237487793, 8.641342163085938, 9.777421951293945, 10.913501739501953, 12.049581527709961, 13.185661315917969, 14.321741104125977, 15.457820892333984, 16.593900680541992, 17.72998046875, 18.866060256958008, 20.002140045166016, 21.138219833374023, 22.27429962158203, 23.41037940979004, 24.546459197998047, 25.682538986206055, 26.818618774414062, 27.95469856262207, 29.090778350830078, 30.226858139038086, 31.362937927246094, 32.49901580810547, 33.63509750366211, 34.77117919921875, 35.907257080078125, 37.0433349609375, 38.17941665649414]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 6.0, 12.0, 8.0, 11.0, 10.0, 13.0, 18.0, 18.0, 27.0, 33.0, 35.0, 40.0, 50.0, 41.0, 55.0, 54.0, 55.0, 58.0, 43.0, 37.0, 52.0, 33.0, 43.0, 32.0, 32.0, 35.0, 21.0, 26.0, 23.0, 24.0, 15.0, 12.0, 13.0, 3.0, 3.0, 8.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.3465576171875, -33.103755950927734, -31.86095428466797, -30.618152618408203, -29.375350952148438, -28.132549285888672, -26.88974952697754, -25.646947860717773, -24.404146194458008, -23.161344528198242, -21.918542861938477, -20.67574119567871, -19.432941436767578, -18.190139770507812, -16.947338104248047, -15.704536437988281, -14.461734771728516, -13.21893310546875, -11.976131439208984, -10.733330726623535, -9.49052906036377, -8.247727394104004, -7.0049262046813965, -5.762125015258789, -4.519323348999023, -3.276521921157837, -2.0337204933166504, -0.7909190654754639, 0.45188236236572266, 1.6946840286254883, 2.9374852180480957, 4.180286407470703, 5.423091888427734, 6.6658935546875, 7.908694744110107, 9.151495933532715, 10.39429759979248, 11.637099266052246, 12.879899978637695, 14.122701644897461, 15.365503311157227, 16.608304977416992, 17.851106643676758, 19.093908309936523, 20.336708068847656, 21.579509735107422, 22.822311401367188, 24.065113067626953, 25.30791473388672, 26.550716400146484, 27.79351806640625, 29.036319732666016, 30.27912139892578, 31.521923065185547, 32.76472473144531, 34.00752258300781, 35.250328063964844, 36.49312973022461, 37.735931396484375, 38.97873306274414, 40.221534729003906, 41.46433639526367, 42.70713806152344, 43.94993591308594, 45.1927375793457]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 10.0, 12.0, 18.0, 30.0, 48.0, 66.0, 90.0, 135.0, 252.0, 406.0, 654.0, 1018.0, 1665.0, 2831.0, 4456.0, 7146.0, 11734.0, 18496.0, 28629.0, 42315.0, 59616.0, 79857.0, 98414.0, 112014.0, 117248.0, 111166.0, 97452.0, 77805.0, 58322.0, 41169.0, 27771.0, 17977.0, 11252.0, 7151.0, 4398.0, 2626.0, 1608.0, 1008.0, 645.0, 370.0, 238.0, 156.0, 99.0, 63.0, 31.0, 33.0, 20.0, 12.0, 15.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-15.03125, -14.537841796875, -14.04443359375, -13.551025390625, -13.0576171875, -12.564208984375, -12.07080078125, -11.577392578125, -11.083984375, -10.590576171875, -10.09716796875, -9.603759765625, -9.1103515625, -8.616943359375, -8.12353515625, -7.630126953125, -7.13671875, -6.643310546875, -6.14990234375, -5.656494140625, -5.1630859375, -4.669677734375, -4.17626953125, -3.682861328125, -3.189453125, -2.696044921875, -2.20263671875, -1.709228515625, -1.2158203125, -0.722412109375, -0.22900390625, 0.264404296875, 0.7578125, 1.251220703125, 1.74462890625, 2.238037109375, 2.7314453125, 3.224853515625, 3.71826171875, 4.211669921875, 4.705078125, 5.198486328125, 5.69189453125, 6.185302734375, 6.6787109375, 7.172119140625, 7.66552734375, 8.158935546875, 8.65234375, 9.145751953125, 9.63916015625, 10.132568359375, 10.6259765625, 11.119384765625, 11.61279296875, 12.106201171875, 12.599609375, 13.093017578125, 13.58642578125, 14.079833984375, 14.5732421875, 15.066650390625, 15.56005859375, 16.053466796875, 16.546875]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 8.0, 8.0, 10.0, 11.0, 15.0, 15.0, 11.0, 20.0, 22.0, 28.0, 48.0, 43.0, 43.0, 49.0, 50.0, 38.0, 49.0, 36.0, 38.0, 45.0, 37.0, 44.0, 36.0, 35.0, 32.0, 30.0, 36.0, 15.0, 21.0, 27.0, 21.0, 10.0, 15.0, 10.0, 7.0, 4.0, 10.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.6875, -33.5302734375, -32.373046875, -31.2158203125, -30.05859375, -28.9013671875, -27.744140625, -26.5869140625, -25.4296875, -24.2724609375, -23.115234375, -21.9580078125, -20.80078125, -19.6435546875, -18.486328125, -17.3291015625, -16.171875, -15.0146484375, -13.857421875, -12.7001953125, -11.54296875, -10.3857421875, -9.228515625, -8.0712890625, -6.9140625, -5.7568359375, -4.599609375, -3.4423828125, -2.28515625, -1.1279296875, 0.029296875, 1.1865234375, 2.34375, 3.5009765625, 4.658203125, 5.8154296875, 6.97265625, 8.1298828125, 9.287109375, 10.4443359375, 11.6015625, 12.7587890625, 13.916015625, 15.0732421875, 16.23046875, 17.3876953125, 18.544921875, 19.7021484375, 20.859375, 22.0166015625, 23.173828125, 24.3310546875, 25.48828125, 26.6455078125, 27.802734375, 28.9599609375, 30.1171875, 31.2744140625, 32.431640625, 33.5888671875, 34.74609375, 35.9033203125, 37.060546875, 38.2177734375, 39.375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 7.0, 14.0, 17.0, 15.0, 29.0, 43.0, 63.0, 124.0, 199.0, 256.0, 447.0, 707.0, 1073.0, 1656.0, 2542.0, 4102.0, 6134.0, 9546.0, 14955.0, 22631.0, 33951.0, 48538.0, 66161.0, 85109.0, 102529.0, 112968.0, 114024.0, 104854.0, 88678.0, 69493.0, 51400.0, 36281.0, 24284.0, 16187.0, 10597.0, 6784.0, 4243.0, 2862.0, 1788.0, 1125.0, 739.0, 459.0, 320.0, 223.0, 147.0, 87.0, 63.0, 39.0, 25.0, 19.0, 6.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.546875, -16.03125, -15.515625, -15.0, -14.484375, -13.96875, -13.453125, -12.9375, -12.421875, -11.90625, -11.390625, -10.875, -10.359375, -9.84375, -9.328125, -8.8125, -8.296875, -7.78125, -7.265625, -6.75, -6.234375, -5.71875, -5.203125, -4.6875, -4.171875, -3.65625, -3.140625, -2.625, -2.109375, -1.59375, -1.078125, -0.5625, -0.046875, 0.46875, 0.984375, 1.5, 2.015625, 2.53125, 3.046875, 3.5625, 4.078125, 4.59375, 5.109375, 5.625, 6.140625, 6.65625, 7.171875, 7.6875, 8.203125, 8.71875, 9.234375, 9.75, 10.265625, 10.78125, 11.296875, 11.8125, 12.328125, 12.84375, 13.359375, 13.875, 14.390625, 14.90625, 15.421875, 15.9375, 16.453125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 8.0, 6.0, 11.0, 11.0, 10.0, 15.0, 22.0, 20.0, 18.0, 21.0, 31.0, 31.0, 30.0, 31.0, 22.0, 50.0, 43.0, 38.0, 37.0, 39.0, 40.0, 43.0, 40.0, 34.0, 36.0, 36.0, 31.0, 34.0, 28.0, 33.0, 18.0, 13.0, 16.0, 15.0, 15.0, 10.0, 9.0, 10.0, 7.0, 7.0, 7.0, 4.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.140625, -20.4658203125, -19.791015625, -19.1162109375, -18.44140625, -17.7666015625, -17.091796875, -16.4169921875, -15.7421875, -15.0673828125, -14.392578125, -13.7177734375, -13.04296875, -12.3681640625, -11.693359375, -11.0185546875, -10.34375, -9.6689453125, -8.994140625, -8.3193359375, -7.64453125, -6.9697265625, -6.294921875, -5.6201171875, -4.9453125, -4.2705078125, -3.595703125, -2.9208984375, -2.24609375, -1.5712890625, -0.896484375, -0.2216796875, 0.453125, 1.1279296875, 1.802734375, 2.4775390625, 3.15234375, 3.8271484375, 4.501953125, 5.1767578125, 5.8515625, 6.5263671875, 7.201171875, 7.8759765625, 8.55078125, 9.2255859375, 9.900390625, 10.5751953125, 11.25, 11.9248046875, 12.599609375, 13.2744140625, 13.94921875, 14.6240234375, 15.298828125, 15.9736328125, 16.6484375, 17.3232421875, 17.998046875, 18.6728515625, 19.34765625, 20.0224609375, 20.697265625, 21.3720703125, 22.046875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 10.0, 2.0, 11.0, 13.0, 23.0, 32.0, 46.0, 87.0, 141.0, 195.0, 365.0, 666.0, 1079.0, 1972.0, 3456.0, 6194.0, 11210.0, 19711.0, 34952.0, 57210.0, 88300.0, 122387.0, 147706.0, 152725.0, 133437.0, 101158.0, 68218.0, 41749.0, 24152.0, 13847.0, 7666.0, 4269.0, 2410.0, 1308.0, 747.0, 416.0, 272.0, 162.0, 93.0, 73.0, 38.0, 24.0, 14.0, 7.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.21875, -8.90283203125, -8.5869140625, -8.27099609375, -7.955078125, -7.63916015625, -7.3232421875, -7.00732421875, -6.69140625, -6.37548828125, -6.0595703125, -5.74365234375, -5.427734375, -5.11181640625, -4.7958984375, -4.47998046875, -4.1640625, -3.84814453125, -3.5322265625, -3.21630859375, -2.900390625, -2.58447265625, -2.2685546875, -1.95263671875, -1.63671875, -1.32080078125, -1.0048828125, -0.68896484375, -0.373046875, -0.05712890625, 0.2587890625, 0.57470703125, 0.890625, 1.20654296875, 1.5224609375, 1.83837890625, 2.154296875, 2.47021484375, 2.7861328125, 3.10205078125, 3.41796875, 3.73388671875, 4.0498046875, 4.36572265625, 4.681640625, 4.99755859375, 5.3134765625, 5.62939453125, 5.9453125, 6.26123046875, 6.5771484375, 6.89306640625, 7.208984375, 7.52490234375, 7.8408203125, 8.15673828125, 8.47265625, 8.78857421875, 9.1044921875, 9.42041015625, 9.736328125, 10.05224609375, 10.3681640625, 10.68408203125, 11.0]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 5.0, 2.0, 3.0, 6.0, 10.0, 13.0, 14.0, 17.0, 21.0, 21.0, 27.0, 27.0, 37.0, 37.0, 50.0, 46.0, 60.0, 59.0, 53.0, 65.0, 63.0, 55.0, 51.0, 43.0, 40.0, 40.0, 27.0, 26.0, 19.0, 11.0, 10.0, 17.0, 6.0, 6.0, 3.0, 0.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.000888824462890625, -0.000855565071105957, -0.0008223056793212891, -0.0007890462875366211, -0.0007557868957519531, -0.0007225275039672852, -0.0006892681121826172, -0.0006560087203979492, -0.0006227493286132812, -0.0005894899368286133, -0.0005562305450439453, -0.0005229711532592773, -0.0004897117614746094, -0.0004564523696899414, -0.00042319297790527344, -0.00038993358612060547, -0.0003566741943359375, -0.00032341480255126953, -0.00029015541076660156, -0.0002568960189819336, -0.00022363662719726562, -0.00019037723541259766, -0.0001571178436279297, -0.00012385845184326172, -9.059906005859375e-05, -5.733966827392578e-05, -2.4080276489257812e-05, 9.179115295410156e-06, 4.2438507080078125e-05, 7.56978988647461e-05, 0.00010895729064941406, 0.00014221668243408203, 0.00017547607421875, 0.00020873546600341797, 0.00024199485778808594, 0.0002752542495727539, 0.0003085136413574219, 0.00034177303314208984, 0.0003750324249267578, 0.0004082918167114258, 0.00044155120849609375, 0.0004748106002807617, 0.0005080699920654297, 0.0005413293838500977, 0.0005745887756347656, 0.0006078481674194336, 0.0006411075592041016, 0.0006743669509887695, 0.0007076263427734375, 0.0007408857345581055, 0.0007741451263427734, 0.0008074045181274414, 0.0008406639099121094, 0.0008739233016967773, 0.0009071826934814453, 0.0009404420852661133, 0.0009737014770507812, 0.0010069608688354492, 0.0010402202606201172, 0.0010734796524047852, 0.0011067390441894531, 0.001139998435974121, 0.001173257827758789, 0.001206517219543457, 0.001239776611328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 5.0, 5.0, 4.0, 16.0, 11.0, 23.0, 36.0, 39.0, 85.0, 116.0, 201.0, 310.0, 424.0, 688.0, 1049.0, 1735.0, 2674.0, 4234.0, 6888.0, 11120.0, 18093.0, 28202.0, 43413.0, 64689.0, 89271.0, 113665.0, 128876.0, 130095.0, 115574.0, 92367.0, 67716.0, 45991.0, 29863.0, 19203.0, 12039.0, 7413.0, 4436.0, 2806.0, 1844.0, 1158.0, 740.0, 493.0, 298.0, 228.0, 149.0, 89.0, 72.0, 35.0, 28.0, 15.0, 9.0, 12.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0], "bins": [-9.5625, -9.2733154296875, -8.984130859375, -8.6949462890625, -8.40576171875, -8.1165771484375, -7.827392578125, -7.5382080078125, -7.2490234375, -6.9598388671875, -6.670654296875, -6.3814697265625, -6.09228515625, -5.8031005859375, -5.513916015625, -5.2247314453125, -4.935546875, -4.6463623046875, -4.357177734375, -4.0679931640625, -3.77880859375, -3.4896240234375, -3.200439453125, -2.9112548828125, -2.6220703125, -2.3328857421875, -2.043701171875, -1.7545166015625, -1.46533203125, -1.1761474609375, -0.886962890625, -0.5977783203125, -0.30859375, -0.0194091796875, 0.269775390625, 0.5589599609375, 0.84814453125, 1.1373291015625, 1.426513671875, 1.7156982421875, 2.0048828125, 2.2940673828125, 2.583251953125, 2.8724365234375, 3.16162109375, 3.4508056640625, 3.739990234375, 4.0291748046875, 4.318359375, 4.6075439453125, 4.896728515625, 5.1859130859375, 5.47509765625, 5.7642822265625, 6.053466796875, 6.3426513671875, 6.6318359375, 6.9210205078125, 7.210205078125, 7.4993896484375, 7.78857421875, 8.0777587890625, 8.366943359375, 8.6561279296875, 8.9453125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 10.0, 7.0, 14.0, 11.0, 13.0, 15.0, 28.0, 39.0, 42.0, 38.0, 51.0, 60.0, 53.0, 65.0, 62.0, 70.0, 64.0, 45.0, 58.0, 47.0, 47.0, 34.0, 22.0, 18.0, 21.0, 22.0, 10.0, 5.0, 9.0, 7.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0], "bins": [-6.64453125, -6.48004150390625, -6.3155517578125, -6.15106201171875, -5.986572265625, -5.82208251953125, -5.6575927734375, -5.49310302734375, -5.32861328125, -5.16412353515625, -4.9996337890625, -4.83514404296875, -4.670654296875, -4.50616455078125, -4.3416748046875, -4.17718505859375, -4.0126953125, -3.84820556640625, -3.6837158203125, -3.51922607421875, -3.354736328125, -3.19024658203125, -3.0257568359375, -2.86126708984375, -2.69677734375, -2.53228759765625, -2.3677978515625, -2.20330810546875, -2.038818359375, -1.87432861328125, -1.7098388671875, -1.54534912109375, -1.380859375, -1.21636962890625, -1.0518798828125, -0.88739013671875, -0.722900390625, -0.55841064453125, -0.3939208984375, -0.22943115234375, -0.06494140625, 0.09954833984375, 0.2640380859375, 0.42852783203125, 0.593017578125, 0.75750732421875, 0.9219970703125, 1.08648681640625, 1.2509765625, 1.41546630859375, 1.5799560546875, 1.74444580078125, 1.908935546875, 2.07342529296875, 2.2379150390625, 2.40240478515625, 2.56689453125, 2.73138427734375, 2.8958740234375, 3.06036376953125, 3.224853515625, 3.38934326171875, 3.5538330078125, 3.71832275390625, 3.8828125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 7.0, 4.0, 3.0, 4.0, 5.0, 11.0, 11.0, 11.0, 15.0, 20.0, 15.0, 49.0, 37.0, 47.0, 57.0, 54.0, 58.0, 46.0, 61.0, 57.0, 52.0, 62.0, 44.0, 42.0, 38.0, 43.0, 31.0, 29.0, 31.0, 10.0, 13.0, 10.0, 9.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.94009017944336, -31.797508239746094, -30.654924392700195, -29.51234245300293, -28.36975860595703, -27.227176666259766, -26.0845947265625, -24.9420108795166, -23.799427032470703, -22.656845092773438, -21.51426124572754, -20.371679306030273, -19.229095458984375, -18.08651351928711, -16.943931579589844, -15.801347732543945, -14.65876579284668, -13.516182899475098, -12.373600006103516, -11.23101806640625, -10.088434219360352, -8.945852279663086, -7.803269386291504, -6.660686492919922, -5.51810359954834, -4.375520706176758, -3.232938051223755, -2.090355396270752, -0.9477725028991699, 0.1948103904724121, 1.337392807006836, 2.479975700378418, 3.62255859375, 4.765141487121582, 5.907724380493164, 7.050306797027588, 8.192890167236328, 9.335472106933594, 10.478055000305176, 11.620637893676758, 12.76322078704834, 13.905803680419922, 15.048386573791504, 16.190969467163086, 17.33355140686035, 18.47613525390625, 19.618717193603516, 20.76129913330078, 21.90388298034668, 23.046464920043945, 24.189048767089844, 25.33163070678711, 26.474214553833008, 27.616796493530273, 28.759380340576172, 29.901962280273438, 31.044544219970703, 32.18712615966797, 33.329708099365234, 34.472293853759766, 35.61487579345703, 36.7574577331543, 37.90003967285156, 39.042625427246094, 40.18520736694336]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 4.0, 6.0, 12.0, 13.0, 15.0, 21.0, 21.0, 28.0, 34.0, 37.0, 44.0, 42.0, 56.0, 59.0, 60.0, 47.0, 73.0, 49.0, 52.0, 50.0, 35.0, 41.0, 27.0, 16.0, 37.0, 26.0, 25.0, 15.0, 15.0, 9.0, 7.0, 6.0, 7.0, 1.0, 10.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.05831527709961, -48.4994010925293, -46.94048309326172, -45.381568908691406, -43.82265090942383, -42.263736724853516, -40.70481872558594, -39.145904541015625, -37.58699035644531, -36.028076171875, -34.46915817260742, -32.91024398803711, -31.35132598876953, -29.79241180419922, -28.233495712280273, -26.674579620361328, -25.11566162109375, -23.556745529174805, -21.99782943725586, -20.438915252685547, -18.87999725341797, -17.321083068847656, -15.762166976928711, -14.203250885009766, -12.64433479309082, -11.085418701171875, -9.52650260925293, -7.967587471008301, -6.4086713790893555, -4.84975528717041, -3.2908401489257812, -1.731924057006836, -0.173004150390625, 1.3859117031097412, 2.9448275566101074, 4.5037431716918945, 6.06265926361084, 7.621575355529785, 9.180490493774414, 10.73940658569336, 12.298322677612305, 13.85723876953125, 15.416154861450195, 16.97507095336914, 18.533985137939453, 20.09290313720703, 21.651817321777344, 23.21073341369629, 24.769649505615234, 26.32856559753418, 27.887481689453125, 29.446395874023438, 31.005313873291016, 32.56422805786133, 34.123146057128906, 35.68206024169922, 37.24097442626953, 38.799888610839844, 40.35880661010742, 41.917720794677734, 43.47663879394531, 45.035552978515625, 46.59446716308594, 48.153385162353516, 49.712303161621094]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 11.0, 18.0, 17.0, 30.0, 46.0, 72.0, 121.0, 227.0, 341.0, 547.0, 922.0, 1571.0, 2795.0, 4870.0, 8688.0, 15593.0, 27452.0, 49519.0, 88699.0, 155416.0, 258335.0, 400011.0, 549270.0, 641133.0, 620428.0, 501551.0, 350854.0, 220338.0, 129351.0, 73118.0, 40687.0, 22643.0, 12751.0, 7219.0, 4053.0, 2312.0, 1310.0, 806.0, 464.0, 278.0, 167.0, 103.0, 57.0, 36.0, 30.0, 9.0, 7.0, 12.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.875, -33.81298828125, -32.7509765625, -31.68896484375, -30.626953125, -29.56494140625, -28.5029296875, -27.44091796875, -26.37890625, -25.31689453125, -24.2548828125, -23.19287109375, -22.130859375, -21.06884765625, -20.0068359375, -18.94482421875, -17.8828125, -16.82080078125, -15.7587890625, -14.69677734375, -13.634765625, -12.57275390625, -11.5107421875, -10.44873046875, -9.38671875, -8.32470703125, -7.2626953125, -6.20068359375, -5.138671875, -4.07666015625, -3.0146484375, -1.95263671875, -0.890625, 0.17138671875, 1.2333984375, 2.29541015625, 3.357421875, 4.41943359375, 5.4814453125, 6.54345703125, 7.60546875, 8.66748046875, 9.7294921875, 10.79150390625, 11.853515625, 12.91552734375, 13.9775390625, 15.03955078125, 16.1015625, 17.16357421875, 18.2255859375, 19.28759765625, 20.349609375, 21.41162109375, 22.4736328125, 23.53564453125, 24.59765625, 25.65966796875, 26.7216796875, 27.78369140625, 28.845703125, 29.90771484375, 30.9697265625, 32.03173828125, 33.09375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 7.0, 6.0, 5.0, 10.0, 6.0, 21.0, 20.0, 17.0, 25.0, 31.0, 45.0, 29.0, 48.0, 64.0, 44.0, 55.0, 62.0, 55.0, 56.0, 52.0, 63.0, 36.0, 42.0, 28.0, 32.0, 28.0, 23.0, 23.0, 12.0, 8.0, 14.0, 15.0, 6.0, 4.0, 4.0, 3.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.03125, -45.57470703125, -44.1181640625, -42.66162109375, -41.205078125, -39.74853515625, -38.2919921875, -36.83544921875, -35.37890625, -33.92236328125, -32.4658203125, -31.00927734375, -29.552734375, -28.09619140625, -26.6396484375, -25.18310546875, -23.7265625, -22.27001953125, -20.8134765625, -19.35693359375, -17.900390625, -16.44384765625, -14.9873046875, -13.53076171875, -12.07421875, -10.61767578125, -9.1611328125, -7.70458984375, -6.248046875, -4.79150390625, -3.3349609375, -1.87841796875, -0.421875, 1.03466796875, 2.4912109375, 3.94775390625, 5.404296875, 6.86083984375, 8.3173828125, 9.77392578125, 11.23046875, 12.68701171875, 14.1435546875, 15.60009765625, 17.056640625, 18.51318359375, 19.9697265625, 21.42626953125, 22.8828125, 24.33935546875, 25.7958984375, 27.25244140625, 28.708984375, 30.16552734375, 31.6220703125, 33.07861328125, 34.53515625, 35.99169921875, 37.4482421875, 38.90478515625, 40.361328125, 41.81787109375, 43.2744140625, 44.73095703125, 46.1875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 12.0, 19.0, 35.0, 58.0, 79.0, 136.0, 243.0, 407.0, 795.0, 1330.0, 2466.0, 4420.0, 8003.0, 15068.0, 27536.0, 51110.0, 92518.0, 161927.0, 268590.0, 409556.0, 550052.0, 631987.0, 610142.0, 496639.0, 349306.0, 221494.0, 130474.0, 73004.0, 39752.0, 21510.0, 11801.0, 6180.0, 3328.0, 1804.0, 1062.0, 578.0, 328.0, 233.0, 107.0, 70.0, 43.0, 19.0, 26.0, 12.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-43.53125, -42.2802734375, -41.029296875, -39.7783203125, -38.52734375, -37.2763671875, -36.025390625, -34.7744140625, -33.5234375, -32.2724609375, -31.021484375, -29.7705078125, -28.51953125, -27.2685546875, -26.017578125, -24.7666015625, -23.515625, -22.2646484375, -21.013671875, -19.7626953125, -18.51171875, -17.2607421875, -16.009765625, -14.7587890625, -13.5078125, -12.2568359375, -11.005859375, -9.7548828125, -8.50390625, -7.2529296875, -6.001953125, -4.7509765625, -3.5, -2.2490234375, -0.998046875, 0.2529296875, 1.50390625, 2.7548828125, 4.005859375, 5.2568359375, 6.5078125, 7.7587890625, 9.009765625, 10.2607421875, 11.51171875, 12.7626953125, 14.013671875, 15.2646484375, 16.515625, 17.7666015625, 19.017578125, 20.2685546875, 21.51953125, 22.7705078125, 24.021484375, 25.2724609375, 26.5234375, 27.7744140625, 29.025390625, 30.2763671875, 31.52734375, 32.7783203125, 34.029296875, 35.2802734375, 36.53125]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 11.0, 5.0, 9.0, 8.0, 14.0, 6.0, 15.0, 13.0, 21.0, 33.0, 32.0, 41.0, 50.0, 52.0, 88.0, 91.0, 97.0, 111.0, 130.0, 167.0, 173.0, 156.0, 184.0, 192.0, 208.0, 216.0, 203.0, 203.0, 187.0, 185.0, 165.0, 154.0, 147.0, 123.0, 113.0, 89.0, 73.0, 58.0, 53.0, 51.0, 33.0, 34.0, 27.0, 17.0, 11.0, 7.0, 7.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.140625, -15.60546875, -15.0703125, -14.53515625, -14.0, -13.46484375, -12.9296875, -12.39453125, -11.859375, -11.32421875, -10.7890625, -10.25390625, -9.71875, -9.18359375, -8.6484375, -8.11328125, -7.578125, -7.04296875, -6.5078125, -5.97265625, -5.4375, -4.90234375, -4.3671875, -3.83203125, -3.296875, -2.76171875, -2.2265625, -1.69140625, -1.15625, -0.62109375, -0.0859375, 0.44921875, 0.984375, 1.51953125, 2.0546875, 2.58984375, 3.125, 3.66015625, 4.1953125, 4.73046875, 5.265625, 5.80078125, 6.3359375, 6.87109375, 7.40625, 7.94140625, 8.4765625, 9.01171875, 9.546875, 10.08203125, 10.6171875, 11.15234375, 11.6875, 12.22265625, 12.7578125, 13.29296875, 13.828125, 14.36328125, 14.8984375, 15.43359375, 15.96875, 16.50390625, 17.0390625, 17.57421875, 18.109375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 4.0, 3.0, 6.0, 9.0, 10.0, 10.0, 14.0, 15.0, 22.0, 19.0, 31.0, 35.0, 44.0, 38.0, 47.0, 46.0, 53.0, 63.0, 62.0, 69.0, 59.0, 55.0, 49.0, 34.0, 28.0, 37.0, 27.0, 23.0, 20.0, 17.0, 10.0, 14.0, 10.0, 9.0, 4.0, 8.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.68342971801758, -50.09819412231445, -48.51295471191406, -46.92771911621094, -45.34248352050781, -43.75724411010742, -42.1720085144043, -40.586769104003906, -39.00153350830078, -37.416297912597656, -35.831058502197266, -34.24582290649414, -32.66058349609375, -31.075347900390625, -29.4901123046875, -27.904874801635742, -26.319637298583984, -24.734399795532227, -23.14916229248047, -21.563926696777344, -19.978689193725586, -18.393451690673828, -16.808216094970703, -15.222978591918945, -13.637741088867188, -12.05250358581543, -10.467267036437988, -8.882030487060547, -7.296792984008789, -5.7115559577941895, -4.12631893157959, -2.5410823822021484, -0.955841064453125, 0.6293959617614746, 2.214632987976074, 3.799870014190674, 5.385107040405273, 6.970344066619873, 8.555581092834473, 10.140817642211914, 11.726055145263672, 13.31129264831543, 14.896529197692871, 16.481765747070312, 18.06700325012207, 19.652240753173828, 21.237476348876953, 22.82271385192871, 24.40795135498047, 25.993188858032227, 27.578426361083984, 29.16366195678711, 30.748899459838867, 32.334136962890625, 33.91937255859375, 35.504608154296875, 37.089847564697266, 38.67508316040039, 40.26032257080078, 41.845558166503906, 43.43079376220703, 45.01603317260742, 46.60126876831055, 48.18650817871094, 49.77174377441406]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 6.0, 3.0, 9.0, 6.0, 3.0, 13.0, 16.0, 21.0, 19.0, 16.0, 32.0, 30.0, 27.0, 21.0, 31.0, 42.0, 45.0, 42.0, 47.0, 43.0, 38.0, 38.0, 38.0, 43.0, 30.0, 22.0, 35.0, 40.0, 30.0, 32.0, 23.0, 27.0, 34.0, 8.0, 13.0, 19.0, 14.0, 10.0, 7.0, 8.0, 3.0, 6.0, 3.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-55.67958450317383, -53.94290542602539, -52.20622253417969, -50.46954345703125, -48.73286437988281, -46.996185302734375, -45.25950241088867, -43.522823333740234, -41.78614044189453, -40.049461364746094, -38.31277847290039, -36.57609939575195, -34.839420318603516, -33.10273742675781, -31.366058349609375, -29.629379272460938, -27.8927001953125, -26.15601921081543, -24.419340133666992, -22.682659149169922, -20.945980072021484, -19.209299087524414, -17.472618103027344, -15.73593807220459, -13.999258041381836, -12.262578010559082, -10.525897979736328, -8.789216995239258, -7.052536964416504, -5.31585693359375, -3.5791759490966797, -1.8424959182739258, -0.10581207275390625, 1.6308681964874268, 3.3675484657287598, 5.104228973388672, 6.840909004211426, 8.57758903503418, 10.31427001953125, 12.050950050354004, 13.787630081176758, 15.524310111999512, 17.260990142822266, 18.997671127319336, 20.734352111816406, 22.471031188964844, 24.207712173461914, 25.944393157958984, 27.681072235107422, 29.417753219604492, 31.15443229675293, 32.89111328125, 34.62779235839844, 36.364471435546875, 38.10115432739258, 39.837833404541016, 41.57451629638672, 43.311195373535156, 45.04787826538086, 46.7845573425293, 48.521236419677734, 50.25791931152344, 51.994598388671875, 53.73127746582031, 55.46795654296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 6.0, 2.0, 13.0, 14.0, 12.0, 28.0, 46.0, 46.0, 61.0, 107.0, 141.0, 206.0, 349.0, 500.0, 833.0, 1283.0, 2045.0, 3273.0, 5157.0, 8415.0, 13729.0, 21914.0, 34654.0, 54487.0, 79892.0, 109445.0, 133399.0, 142959.0, 129049.0, 101980.0, 72945.0, 48525.0, 30994.0, 19613.0, 12053.0, 7657.0, 4649.0, 2923.0, 1829.0, 1165.0, 769.0, 486.0, 329.0, 186.0, 122.0, 89.0, 59.0, 32.0, 29.0, 25.0, 13.0, 10.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-12.71875, -12.300048828125, -11.88134765625, -11.462646484375, -11.0439453125, -10.625244140625, -10.20654296875, -9.787841796875, -9.369140625, -8.950439453125, -8.53173828125, -8.113037109375, -7.6943359375, -7.275634765625, -6.85693359375, -6.438232421875, -6.01953125, -5.600830078125, -5.18212890625, -4.763427734375, -4.3447265625, -3.926025390625, -3.50732421875, -3.088623046875, -2.669921875, -2.251220703125, -1.83251953125, -1.413818359375, -0.9951171875, -0.576416015625, -0.15771484375, 0.260986328125, 0.6796875, 1.098388671875, 1.51708984375, 1.935791015625, 2.3544921875, 2.773193359375, 3.19189453125, 3.610595703125, 4.029296875, 4.447998046875, 4.86669921875, 5.285400390625, 5.7041015625, 6.122802734375, 6.54150390625, 6.960205078125, 7.37890625, 7.797607421875, 8.21630859375, 8.635009765625, 9.0537109375, 9.472412109375, 9.89111328125, 10.309814453125, 10.728515625, 11.147216796875, 11.56591796875, 11.984619140625, 12.4033203125, 12.822021484375, 13.24072265625, 13.659423828125, 14.078125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 5.0, 4.0, 5.0, 5.0, 8.0, 9.0, 10.0, 12.0, 12.0, 13.0, 14.0, 31.0, 31.0, 29.0, 29.0, 30.0, 47.0, 37.0, 39.0, 37.0, 46.0, 38.0, 53.0, 38.0, 42.0, 30.0, 33.0, 31.0, 33.0, 26.0, 26.0, 28.0, 33.0, 29.0, 21.0, 17.0, 15.0, 9.0, 12.0, 6.0, 6.0, 6.0, 4.0, 2.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-57.0625, -55.30322265625, -53.5439453125, -51.78466796875, -50.025390625, -48.26611328125, -46.5068359375, -44.74755859375, -42.98828125, -41.22900390625, -39.4697265625, -37.71044921875, -35.951171875, -34.19189453125, -32.4326171875, -30.67333984375, -28.9140625, -27.15478515625, -25.3955078125, -23.63623046875, -21.876953125, -20.11767578125, -18.3583984375, -16.59912109375, -14.83984375, -13.08056640625, -11.3212890625, -9.56201171875, -7.802734375, -6.04345703125, -4.2841796875, -2.52490234375, -0.765625, 0.99365234375, 2.7529296875, 4.51220703125, 6.271484375, 8.03076171875, 9.7900390625, 11.54931640625, 13.30859375, 15.06787109375, 16.8271484375, 18.58642578125, 20.345703125, 22.10498046875, 23.8642578125, 25.62353515625, 27.3828125, 29.14208984375, 30.9013671875, 32.66064453125, 34.419921875, 36.17919921875, 37.9384765625, 39.69775390625, 41.45703125, 43.21630859375, 44.9755859375, 46.73486328125, 48.494140625, 50.25341796875, 52.0126953125, 53.77197265625, 55.53125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 11.0, 8.0, 10.0, 19.0, 25.0, 30.0, 41.0, 60.0, 106.0, 143.0, 209.0, 362.0, 539.0, 760.0, 1230.0, 1975.0, 2883.0, 4648.0, 7382.0, 11724.0, 19272.0, 30639.0, 49092.0, 76731.0, 112030.0, 146614.0, 158208.0, 138167.0, 102087.0, 68465.0, 42989.0, 26723.0, 16784.0, 10536.0, 6498.0, 3982.0, 2712.0, 1665.0, 1114.0, 701.0, 453.0, 310.0, 210.0, 123.0, 101.0, 60.0, 44.0, 27.0, 16.0, 9.0, 7.0, 9.0, 6.0, 0.0, 4.0, 5.0, 0.0, 4.0], "bins": [-15.3984375, -14.9227294921875, -14.447021484375, -13.9713134765625, -13.49560546875, -13.0198974609375, -12.544189453125, -12.0684814453125, -11.5927734375, -11.1170654296875, -10.641357421875, -10.1656494140625, -9.68994140625, -9.2142333984375, -8.738525390625, -8.2628173828125, -7.787109375, -7.3114013671875, -6.835693359375, -6.3599853515625, -5.88427734375, -5.4085693359375, -4.932861328125, -4.4571533203125, -3.9814453125, -3.5057373046875, -3.030029296875, -2.5543212890625, -2.07861328125, -1.6029052734375, -1.127197265625, -0.6514892578125, -0.17578125, 0.2999267578125, 0.775634765625, 1.2513427734375, 1.72705078125, 2.2027587890625, 2.678466796875, 3.1541748046875, 3.6298828125, 4.1055908203125, 4.581298828125, 5.0570068359375, 5.53271484375, 6.0084228515625, 6.484130859375, 6.9598388671875, 7.435546875, 7.9112548828125, 8.386962890625, 8.8626708984375, 9.33837890625, 9.8140869140625, 10.289794921875, 10.7655029296875, 11.2412109375, 11.7169189453125, 12.192626953125, 12.6683349609375, 13.14404296875, 13.6197509765625, 14.095458984375, 14.5711669921875, 15.046875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 10.0, 9.0, 6.0, 17.0, 9.0, 19.0, 35.0, 18.0, 21.0, 38.0, 28.0, 29.0, 51.0, 42.0, 47.0, 63.0, 46.0, 47.0, 37.0, 46.0, 47.0, 46.0, 33.0, 41.0, 38.0, 32.0, 24.0, 17.0, 18.0, 16.0, 9.0, 17.0, 15.0, 8.0, 9.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.8125, -28.76220703125, -27.7119140625, -26.66162109375, -25.611328125, -24.56103515625, -23.5107421875, -22.46044921875, -21.41015625, -20.35986328125, -19.3095703125, -18.25927734375, -17.208984375, -16.15869140625, -15.1083984375, -14.05810546875, -13.0078125, -11.95751953125, -10.9072265625, -9.85693359375, -8.806640625, -7.75634765625, -6.7060546875, -5.65576171875, -4.60546875, -3.55517578125, -2.5048828125, -1.45458984375, -0.404296875, 0.64599609375, 1.6962890625, 2.74658203125, 3.796875, 4.84716796875, 5.8974609375, 6.94775390625, 7.998046875, 9.04833984375, 10.0986328125, 11.14892578125, 12.19921875, 13.24951171875, 14.2998046875, 15.35009765625, 16.400390625, 17.45068359375, 18.5009765625, 19.55126953125, 20.6015625, 21.65185546875, 22.7021484375, 23.75244140625, 24.802734375, 25.85302734375, 26.9033203125, 27.95361328125, 29.00390625, 30.05419921875, 31.1044921875, 32.15478515625, 33.205078125, 34.25537109375, 35.3056640625, 36.35595703125, 37.40625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 3.0, 2.0, 4.0, 6.0, 15.0, 13.0, 17.0, 34.0, 51.0, 80.0, 90.0, 157.0, 211.0, 359.0, 543.0, 831.0, 1296.0, 2078.0, 3180.0, 5166.0, 8168.0, 13035.0, 21084.0, 32819.0, 51255.0, 77714.0, 111632.0, 143928.0, 153151.0, 133768.0, 99796.0, 67922.0, 44230.0, 28325.0, 17635.0, 11025.0, 6778.0, 4383.0, 2821.0, 1711.0, 1090.0, 749.0, 493.0, 311.0, 181.0, 145.0, 97.0, 55.0, 38.0, 30.0, 20.0, 12.0, 7.0, 10.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0], "bins": [-5.6484375, -5.4681396484375, -5.287841796875, -5.1075439453125, -4.92724609375, -4.7469482421875, -4.566650390625, -4.3863525390625, -4.2060546875, -4.0257568359375, -3.845458984375, -3.6651611328125, -3.48486328125, -3.3045654296875, -3.124267578125, -2.9439697265625, -2.763671875, -2.5833740234375, -2.403076171875, -2.2227783203125, -2.04248046875, -1.8621826171875, -1.681884765625, -1.5015869140625, -1.3212890625, -1.1409912109375, -0.960693359375, -0.7803955078125, -0.60009765625, -0.4197998046875, -0.239501953125, -0.0592041015625, 0.12109375, 0.3013916015625, 0.481689453125, 0.6619873046875, 0.84228515625, 1.0225830078125, 1.202880859375, 1.3831787109375, 1.5634765625, 1.7437744140625, 1.924072265625, 2.1043701171875, 2.28466796875, 2.4649658203125, 2.645263671875, 2.8255615234375, 3.005859375, 3.1861572265625, 3.366455078125, 3.5467529296875, 3.72705078125, 3.9073486328125, 4.087646484375, 4.2679443359375, 4.4482421875, 4.6285400390625, 4.808837890625, 4.9891357421875, 5.16943359375, 5.3497314453125, 5.530029296875, 5.7103271484375, 5.890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 5.0, 5.0, 4.0, 7.0, 14.0, 15.0, 22.0, 26.0, 28.0, 22.0, 21.0, 42.0, 51.0, 36.0, 59.0, 57.0, 43.0, 57.0, 46.0, 46.0, 49.0, 40.0, 37.0, 39.0, 33.0, 41.0, 35.0, 29.0, 23.0, 16.0, 10.0, 10.0, 7.0, 11.0, 4.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036144256591796875, -0.0003485381603240967, -0.0003356337547302246, -0.00032272934913635254, -0.00030982494354248047, -0.0002969205379486084, -0.00028401613235473633, -0.00027111172676086426, -0.0002582073211669922, -0.0002453029155731201, -0.00023239850997924805, -0.00021949410438537598, -0.0002065896987915039, -0.00019368529319763184, -0.00018078088760375977, -0.0001678764820098877, -0.00015497207641601562, -0.00014206767082214355, -0.00012916326522827148, -0.00011625885963439941, -0.00010335445404052734, -9.045004844665527e-05, -7.75456428527832e-05, -6.464123725891113e-05, -5.173683166503906e-05, -3.883242607116699e-05, -2.5928020477294922e-05, -1.3023614883422852e-05, -1.1920928955078125e-07, 1.2785196304321289e-05, 2.568960189819336e-05, 3.859400749206543e-05, 5.14984130859375e-05, 6.440281867980957e-05, 7.730722427368164e-05, 9.021162986755371e-05, 0.00010311603546142578, 0.00011602044105529785, 0.00012892484664916992, 0.000141829252243042, 0.00015473365783691406, 0.00016763806343078613, 0.0001805424690246582, 0.00019344687461853027, 0.00020635128021240234, 0.00021925568580627441, 0.00023216009140014648, 0.00024506449699401855, 0.0002579689025878906, 0.0002708733081817627, 0.00028377771377563477, 0.00029668211936950684, 0.0003095865249633789, 0.000322490930557251, 0.00033539533615112305, 0.0003482997417449951, 0.0003612041473388672, 0.00037410855293273926, 0.00038701295852661133, 0.0003999173641204834, 0.00041282176971435547, 0.00042572617530822754, 0.0004386305809020996, 0.0004515349864959717, 0.00046443939208984375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 3.0, 3.0, 6.0, 10.0, 15.0, 27.0, 29.0, 55.0, 51.0, 95.0, 123.0, 166.0, 268.0, 387.0, 606.0, 865.0, 1329.0, 1890.0, 2902.0, 4400.0, 6715.0, 10033.0, 15325.0, 23453.0, 34838.0, 51409.0, 73350.0, 97299.0, 118036.0, 128454.0, 123092.0, 103452.0, 79164.0, 56327.0, 38417.0, 25763.0, 16997.0, 11130.0, 7435.0, 4876.0, 3224.0, 2094.0, 1441.0, 994.0, 625.0, 440.0, 318.0, 189.0, 148.0, 102.0, 59.0, 43.0, 24.0, 26.0, 13.0, 13.0, 8.0, 6.0, 2.0, 1.0, 1.0, 3.0], "bins": [-6.40625, -6.20367431640625, -6.0010986328125, -5.79852294921875, -5.595947265625, -5.39337158203125, -5.1907958984375, -4.98822021484375, -4.78564453125, -4.58306884765625, -4.3804931640625, -4.17791748046875, -3.975341796875, -3.77276611328125, -3.5701904296875, -3.36761474609375, -3.1650390625, -2.96246337890625, -2.7598876953125, -2.55731201171875, -2.354736328125, -2.15216064453125, -1.9495849609375, -1.74700927734375, -1.54443359375, -1.34185791015625, -1.1392822265625, -0.93670654296875, -0.734130859375, -0.53155517578125, -0.3289794921875, -0.12640380859375, 0.076171875, 0.27874755859375, 0.4813232421875, 0.68389892578125, 0.886474609375, 1.08905029296875, 1.2916259765625, 1.49420166015625, 1.69677734375, 1.89935302734375, 2.1019287109375, 2.30450439453125, 2.507080078125, 2.70965576171875, 2.9122314453125, 3.11480712890625, 3.3173828125, 3.51995849609375, 3.7225341796875, 3.92510986328125, 4.127685546875, 4.33026123046875, 4.5328369140625, 4.73541259765625, 4.93798828125, 5.14056396484375, 5.3431396484375, 5.54571533203125, 5.748291015625, 5.95086669921875, 6.1534423828125, 6.35601806640625, 6.55859375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 4.0, 11.0, 9.0, 9.0, 14.0, 10.0, 19.0, 16.0, 27.0, 23.0, 39.0, 34.0, 44.0, 57.0, 46.0, 57.0, 62.0, 52.0, 49.0, 66.0, 42.0, 63.0, 38.0, 35.0, 25.0, 25.0, 28.0, 22.0, 22.0, 7.0, 12.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.97265625, -3.84490966796875, -3.7171630859375, -3.58941650390625, -3.461669921875, -3.33392333984375, -3.2061767578125, -3.07843017578125, -2.95068359375, -2.82293701171875, -2.6951904296875, -2.56744384765625, -2.439697265625, -2.31195068359375, -2.1842041015625, -2.05645751953125, -1.9287109375, -1.80096435546875, -1.6732177734375, -1.54547119140625, -1.417724609375, -1.28997802734375, -1.1622314453125, -1.03448486328125, -0.90673828125, -0.77899169921875, -0.6512451171875, -0.52349853515625, -0.395751953125, -0.26800537109375, -0.1402587890625, -0.01251220703125, 0.115234375, 0.24298095703125, 0.3707275390625, 0.49847412109375, 0.626220703125, 0.75396728515625, 0.8817138671875, 1.00946044921875, 1.13720703125, 1.26495361328125, 1.3927001953125, 1.52044677734375, 1.648193359375, 1.77593994140625, 1.9036865234375, 2.03143310546875, 2.1591796875, 2.28692626953125, 2.4146728515625, 2.54241943359375, 2.670166015625, 2.79791259765625, 2.9256591796875, 3.05340576171875, 3.18115234375, 3.30889892578125, 3.4366455078125, 3.56439208984375, 3.692138671875, 3.81988525390625, 3.9476318359375, 4.07537841796875, 4.203125]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 11.0, 4.0, 12.0, 15.0, 11.0, 17.0, 22.0, 18.0, 34.0, 37.0, 37.0, 41.0, 50.0, 65.0, 45.0, 61.0, 70.0, 63.0, 51.0, 55.0, 56.0, 28.0, 34.0, 29.0, 26.0, 22.0, 24.0, 12.0, 16.0, 9.0, 7.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.71332550048828, -49.083213806152344, -47.453102111816406, -45.82299041748047, -44.19287872314453, -42.562767028808594, -40.932655334472656, -39.30253982543945, -37.672428131103516, -36.04231643676758, -34.41220474243164, -32.7820930480957, -31.151979446411133, -29.521867752075195, -27.891756057739258, -26.261642456054688, -24.631532669067383, -23.001420974731445, -21.371309280395508, -19.741195678710938, -18.111083984375, -16.480972290039062, -14.850860595703125, -13.220747947692871, -11.590636253356934, -9.960524559020996, -8.330411911010742, -6.700300216674805, -5.070188045501709, -3.4400758743286133, -1.8099641799926758, -0.17985153198242188, 1.4502601623535156, 3.0803723335266113, 4.710484504699707, 6.3405961990356445, 7.97070837020874, 9.600820541381836, 11.230932235717773, 12.861044883728027, 14.491156578063965, 16.12126922607422, 17.751380920410156, 19.381492614746094, 21.01160430908203, 22.64171600341797, 24.271827697753906, 25.901941299438477, 27.532052993774414, 29.16216468811035, 30.79227638244629, 32.42238998413086, 34.0525016784668, 35.682613372802734, 37.31272506713867, 38.94283676147461, 40.57294845581055, 42.203060150146484, 43.83317184448242, 45.46328353881836, 47.0933952331543, 48.7235107421875, 50.35362243652344, 51.983734130859375, 53.61384582519531]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 8.0, 3.0, 4.0, 11.0, 2.0, 5.0, 13.0, 16.0, 21.0, 20.0, 19.0, 32.0, 23.0, 24.0, 22.0, 30.0, 46.0, 47.0, 39.0, 45.0, 37.0, 43.0, 36.0, 34.0, 39.0, 38.0, 23.0, 27.0, 37.0, 36.0, 34.0, 19.0, 31.0, 27.0, 15.0, 15.0, 16.0, 16.0, 10.0, 10.0, 11.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-53.97252655029297, -52.24657440185547, -50.52062225341797, -48.79467010498047, -47.068721771240234, -45.342769622802734, -43.616817474365234, -41.890865325927734, -40.1649169921875, -38.43896484375, -36.7130126953125, -34.987060546875, -33.261112213134766, -31.535160064697266, -29.809207916259766, -28.083255767822266, -26.357303619384766, -24.631351470947266, -22.9054012298584, -21.1794490814209, -19.45349884033203, -17.72754669189453, -16.00159454345703, -14.275643348693848, -12.549692153930664, -10.82374095916748, -9.097789764404297, -7.371837615966797, -5.645886421203613, -3.9199352264404297, -2.1939830780029297, -0.4680318832397461, 1.2579154968261719, 2.9838669300079346, 4.709818363189697, 6.435770034790039, 8.161721229553223, 9.887672424316406, 11.613624572753906, 13.33957576751709, 15.065526962280273, 16.791479110717773, 18.51742935180664, 20.24338150024414, 21.96933364868164, 23.695283889770508, 25.421236038208008, 27.147186279296875, 28.873138427734375, 30.599090576171875, 32.325042724609375, 34.050994873046875, 35.77694320678711, 37.50289535522461, 39.22884750366211, 40.95479965209961, 42.680747985839844, 44.406700134277344, 46.132652282714844, 47.858604431152344, 49.58455276489258, 51.31050491333008, 53.03645706176758, 54.76240921020508, 56.48836135864258]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 9.0, 17.0, 25.0, 23.0, 55.0, 69.0, 104.0, 157.0, 207.0, 363.0, 579.0, 789.0, 1169.0, 1941.0, 3070.0, 4589.0, 7265.0, 11283.0, 17494.0, 27459.0, 41583.0, 59980.0, 82030.0, 105450.0, 120806.0, 125331.0, 115902.0, 96177.0, 73314.0, 51982.0, 35156.0, 23039.0, 14859.0, 9357.0, 5803.0, 3905.0, 2483.0, 1641.0, 1060.0, 688.0, 455.0, 298.0, 206.0, 139.0, 86.0, 50.0, 42.0, 22.0, 14.0, 13.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-25.328125, -24.5439453125, -23.759765625, -22.9755859375, -22.19140625, -21.4072265625, -20.623046875, -19.8388671875, -19.0546875, -18.2705078125, -17.486328125, -16.7021484375, -15.91796875, -15.1337890625, -14.349609375, -13.5654296875, -12.78125, -11.9970703125, -11.212890625, -10.4287109375, -9.64453125, -8.8603515625, -8.076171875, -7.2919921875, -6.5078125, -5.7236328125, -4.939453125, -4.1552734375, -3.37109375, -2.5869140625, -1.802734375, -1.0185546875, -0.234375, 0.5498046875, 1.333984375, 2.1181640625, 2.90234375, 3.6865234375, 4.470703125, 5.2548828125, 6.0390625, 6.8232421875, 7.607421875, 8.3916015625, 9.17578125, 9.9599609375, 10.744140625, 11.5283203125, 12.3125, 13.0966796875, 13.880859375, 14.6650390625, 15.44921875, 16.2333984375, 17.017578125, 17.8017578125, 18.5859375, 19.3701171875, 20.154296875, 20.9384765625, 21.72265625, 22.5068359375, 23.291015625, 24.0751953125, 24.859375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 7.0, 7.0, 11.0, 15.0, 16.0, 26.0, 22.0, 25.0, 21.0, 30.0, 34.0, 32.0, 41.0, 45.0, 53.0, 42.0, 40.0, 50.0, 48.0, 39.0, 35.0, 29.0, 36.0, 44.0, 42.0, 25.0, 29.0, 24.0, 16.0, 24.0, 13.0, 14.0, 15.0, 9.0, 13.0, 4.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-56.40625, -54.56591796875, -52.7255859375, -50.88525390625, -49.044921875, -47.20458984375, -45.3642578125, -43.52392578125, -41.68359375, -39.84326171875, -38.0029296875, -36.16259765625, -34.322265625, -32.48193359375, -30.6416015625, -28.80126953125, -26.9609375, -25.12060546875, -23.2802734375, -21.43994140625, -19.599609375, -17.75927734375, -15.9189453125, -14.07861328125, -12.23828125, -10.39794921875, -8.5576171875, -6.71728515625, -4.876953125, -3.03662109375, -1.1962890625, 0.64404296875, 2.484375, 4.32470703125, 6.1650390625, 8.00537109375, 9.845703125, 11.68603515625, 13.5263671875, 15.36669921875, 17.20703125, 19.04736328125, 20.8876953125, 22.72802734375, 24.568359375, 26.40869140625, 28.2490234375, 30.08935546875, 31.9296875, 33.77001953125, 35.6103515625, 37.45068359375, 39.291015625, 41.13134765625, 42.9716796875, 44.81201171875, 46.65234375, 48.49267578125, 50.3330078125, 52.17333984375, 54.013671875, 55.85400390625, 57.6943359375, 59.53466796875, 61.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 7.0, 8.0, 18.0, 22.0, 43.0, 68.0, 81.0, 157.0, 202.0, 315.0, 478.0, 753.0, 1189.0, 1700.0, 2714.0, 4131.0, 6692.0, 10587.0, 17266.0, 27814.0, 45550.0, 71667.0, 105218.0, 138583.0, 153942.0, 143022.0, 111162.0, 76184.0, 48605.0, 30063.0, 18661.0, 11599.0, 7167.0, 4547.0, 2881.0, 1908.0, 1238.0, 817.0, 512.0, 314.0, 228.0, 152.0, 72.0, 65.0, 50.0, 39.0, 25.0, 14.0, 4.0, 10.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-38.75, -37.52294921875, -36.2958984375, -35.06884765625, -33.841796875, -32.61474609375, -31.3876953125, -30.16064453125, -28.93359375, -27.70654296875, -26.4794921875, -25.25244140625, -24.025390625, -22.79833984375, -21.5712890625, -20.34423828125, -19.1171875, -17.89013671875, -16.6630859375, -15.43603515625, -14.208984375, -12.98193359375, -11.7548828125, -10.52783203125, -9.30078125, -8.07373046875, -6.8466796875, -5.61962890625, -4.392578125, -3.16552734375, -1.9384765625, -0.71142578125, 0.515625, 1.74267578125, 2.9697265625, 4.19677734375, 5.423828125, 6.65087890625, 7.8779296875, 9.10498046875, 10.33203125, 11.55908203125, 12.7861328125, 14.01318359375, 15.240234375, 16.46728515625, 17.6943359375, 18.92138671875, 20.1484375, 21.37548828125, 22.6025390625, 23.82958984375, 25.056640625, 26.28369140625, 27.5107421875, 28.73779296875, 29.96484375, 31.19189453125, 32.4189453125, 33.64599609375, 34.873046875, 36.10009765625, 37.3271484375, 38.55419921875, 39.78125]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 5.0, 9.0, 5.0, 10.0, 14.0, 20.0, 30.0, 26.0, 39.0, 27.0, 34.0, 46.0, 38.0, 47.0, 50.0, 51.0, 37.0, 42.0, 42.0, 54.0, 61.0, 44.0, 35.0, 38.0, 37.0, 17.0, 22.0, 22.0, 21.0, 13.0, 11.0, 11.0, 10.0, 7.0, 8.0, 5.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.125, -34.6796875, -33.234375, -31.7890625, -30.34375, -28.8984375, -27.453125, -26.0078125, -24.5625, -23.1171875, -21.671875, -20.2265625, -18.78125, -17.3359375, -15.890625, -14.4453125, -13.0, -11.5546875, -10.109375, -8.6640625, -7.21875, -5.7734375, -4.328125, -2.8828125, -1.4375, 0.0078125, 1.453125, 2.8984375, 4.34375, 5.7890625, 7.234375, 8.6796875, 10.125, 11.5703125, 13.015625, 14.4609375, 15.90625, 17.3515625, 18.796875, 20.2421875, 21.6875, 23.1328125, 24.578125, 26.0234375, 27.46875, 28.9140625, 30.359375, 31.8046875, 33.25, 34.6953125, 36.140625, 37.5859375, 39.03125, 40.4765625, 41.921875, 43.3671875, 44.8125, 46.2578125, 47.703125, 49.1484375, 50.59375, 52.0390625, 53.484375, 54.9296875, 56.375]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 5.0, 10.0, 9.0, 10.0, 6.0, 13.0, 27.0, 41.0, 71.0, 85.0, 161.0, 219.0, 294.0, 487.0, 809.0, 1238.0, 2098.0, 3443.0, 5772.0, 10127.0, 17813.0, 31120.0, 55235.0, 92221.0, 137407.0, 173065.0, 170995.0, 134411.0, 88052.0, 52596.0, 29971.0, 16854.0, 9777.0, 5605.0, 3285.0, 1904.0, 1172.0, 762.0, 488.0, 321.0, 188.0, 125.0, 87.0, 68.0, 35.0, 33.0, 19.0, 9.0, 13.0, 7.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-22.0625, -21.431396484375, -20.80029296875, -20.169189453125, -19.5380859375, -18.906982421875, -18.27587890625, -17.644775390625, -17.013671875, -16.382568359375, -15.75146484375, -15.120361328125, -14.4892578125, -13.858154296875, -13.22705078125, -12.595947265625, -11.96484375, -11.333740234375, -10.70263671875, -10.071533203125, -9.4404296875, -8.809326171875, -8.17822265625, -7.547119140625, -6.916015625, -6.284912109375, -5.65380859375, -5.022705078125, -4.3916015625, -3.760498046875, -3.12939453125, -2.498291015625, -1.8671875, -1.236083984375, -0.60498046875, 0.026123046875, 0.6572265625, 1.288330078125, 1.91943359375, 2.550537109375, 3.181640625, 3.812744140625, 4.44384765625, 5.074951171875, 5.7060546875, 6.337158203125, 6.96826171875, 7.599365234375, 8.23046875, 8.861572265625, 9.49267578125, 10.123779296875, 10.7548828125, 11.385986328125, 12.01708984375, 12.648193359375, 13.279296875, 13.910400390625, 14.54150390625, 15.172607421875, 15.8037109375, 16.434814453125, 17.06591796875, 17.697021484375, 18.328125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 5.0, 3.0, 9.0, 8.0, 12.0, 21.0, 15.0, 24.0, 29.0, 31.0, 33.0, 50.0, 53.0, 54.0, 58.0, 59.0, 62.0, 56.0, 73.0, 65.0, 45.0, 39.0, 47.0, 27.0, 23.0, 20.0, 20.0, 13.0, 9.0, 8.0, 7.0, 10.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022411346435546875, -0.0021737217903137207, -0.002106308937072754, -0.002038896083831787, -0.0019714832305908203, -0.0019040703773498535, -0.0018366575241088867, -0.00176924467086792, -0.0017018318176269531, -0.0016344189643859863, -0.0015670061111450195, -0.0014995932579040527, -0.001432180404663086, -0.0013647675514221191, -0.0012973546981811523, -0.0012299418449401855, -0.0011625289916992188, -0.001095116138458252, -0.0010277032852172852, -0.0009602904319763184, -0.0008928775787353516, -0.0008254647254943848, -0.000758051872253418, -0.0006906390190124512, -0.0006232261657714844, -0.0005558133125305176, -0.0004884004592895508, -0.000420987606048584, -0.0003535747528076172, -0.0002861618995666504, -0.0002187490463256836, -0.0001513361930847168, -8.392333984375e-05, -1.6510486602783203e-05, 5.0902366638183594e-05, 0.00011831521987915039, 0.0001857280731201172, 0.000253140926361084, 0.0003205537796020508, 0.0003879666328430176, 0.0004553794860839844, 0.0005227923393249512, 0.000590205192565918, 0.0006576180458068848, 0.0007250308990478516, 0.0007924437522888184, 0.0008598566055297852, 0.000927269458770752, 0.0009946823120117188, 0.0010620951652526855, 0.0011295080184936523, 0.0011969208717346191, 0.001264333724975586, 0.0013317465782165527, 0.0013991594314575195, 0.0014665722846984863, 0.0015339851379394531, 0.00160139799118042, 0.0016688108444213867, 0.0017362236976623535, 0.0018036365509033203, 0.0018710494041442871, 0.001938462257385254, 0.0020058751106262207, 0.0020732879638671875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 16.0, 17.0, 20.0, 37.0, 54.0, 76.0, 108.0, 174.0, 234.0, 392.0, 564.0, 844.0, 1254.0, 2235.0, 3543.0, 5808.0, 9516.0, 16474.0, 28041.0, 47888.0, 77234.0, 117933.0, 153671.0, 165824.0, 144616.0, 105422.0, 66957.0, 40417.0, 23882.0, 13807.0, 8329.0, 4949.0, 2985.0, 1838.0, 1127.0, 767.0, 502.0, 321.0, 214.0, 143.0, 91.0, 75.0, 52.0, 42.0, 22.0, 20.0, 9.0, 9.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.21875, -17.618408203125, -17.01806640625, -16.417724609375, -15.8173828125, -15.217041015625, -14.61669921875, -14.016357421875, -13.416015625, -12.815673828125, -12.21533203125, -11.614990234375, -11.0146484375, -10.414306640625, -9.81396484375, -9.213623046875, -8.61328125, -8.012939453125, -7.41259765625, -6.812255859375, -6.2119140625, -5.611572265625, -5.01123046875, -4.410888671875, -3.810546875, -3.210205078125, -2.60986328125, -2.009521484375, -1.4091796875, -0.808837890625, -0.20849609375, 0.391845703125, 0.9921875, 1.592529296875, 2.19287109375, 2.793212890625, 3.3935546875, 3.993896484375, 4.59423828125, 5.194580078125, 5.794921875, 6.395263671875, 6.99560546875, 7.595947265625, 8.1962890625, 8.796630859375, 9.39697265625, 9.997314453125, 10.59765625, 11.197998046875, 11.79833984375, 12.398681640625, 12.9990234375, 13.599365234375, 14.19970703125, 14.800048828125, 15.400390625, 16.000732421875, 16.60107421875, 17.201416015625, 17.8017578125, 18.402099609375, 19.00244140625, 19.602783203125, 20.203125]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 9.0, 11.0, 13.0, 15.0, 21.0, 24.0, 21.0, 38.0, 44.0, 35.0, 45.0, 46.0, 49.0, 51.0, 66.0, 74.0, 68.0, 59.0, 43.0, 42.0, 33.0, 32.0, 33.0, 27.0, 15.0, 13.0, 10.0, 8.0, 8.0, 6.0, 5.0, 4.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.62109375, -7.3890380859375, -7.156982421875, -6.9249267578125, -6.69287109375, -6.4608154296875, -6.228759765625, -5.9967041015625, -5.7646484375, -5.5325927734375, -5.300537109375, -5.0684814453125, -4.83642578125, -4.6043701171875, -4.372314453125, -4.1402587890625, -3.908203125, -3.6761474609375, -3.444091796875, -3.2120361328125, -2.97998046875, -2.7479248046875, -2.515869140625, -2.2838134765625, -2.0517578125, -1.8197021484375, -1.587646484375, -1.3555908203125, -1.12353515625, -0.8914794921875, -0.659423828125, -0.4273681640625, -0.1953125, 0.0367431640625, 0.268798828125, 0.5008544921875, 0.73291015625, 0.9649658203125, 1.197021484375, 1.4290771484375, 1.6611328125, 1.8931884765625, 2.125244140625, 2.3572998046875, 2.58935546875, 2.8214111328125, 3.053466796875, 3.2855224609375, 3.517578125, 3.7496337890625, 3.981689453125, 4.2137451171875, 4.44580078125, 4.6778564453125, 4.909912109375, 5.1419677734375, 5.3740234375, 5.6060791015625, 5.838134765625, 6.0701904296875, 6.30224609375, 6.5343017578125, 6.766357421875, 6.9984130859375, 7.23046875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 10.0, 6.0, 8.0, 9.0, 7.0, 15.0, 20.0, 17.0, 17.0, 33.0, 26.0, 32.0, 39.0, 35.0, 46.0, 57.0, 45.0, 57.0, 63.0, 40.0, 51.0, 34.0, 36.0, 45.0, 47.0, 28.0, 31.0, 23.0, 20.0, 21.0, 11.0, 11.0, 7.0, 10.0, 8.0, 8.0, 8.0, 7.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.3460807800293, -46.90038299560547, -45.454689025878906, -44.00899124145508, -42.56329345703125, -41.11759948730469, -39.67190170288086, -38.22620391845703, -36.78050994873047, -35.33481216430664, -33.88911819458008, -32.44342041015625, -30.997724533081055, -29.55202865600586, -28.10633087158203, -26.660634994506836, -25.21493911743164, -23.769243240356445, -22.32354736328125, -20.877849578857422, -19.432153701782227, -17.98645782470703, -16.540760040283203, -15.095064163208008, -13.649368286132812, -12.203672409057617, -10.757975578308105, -9.312278747558594, -7.866582870483398, -6.420886516571045, -4.975190162658691, -3.5294933319091797, -2.0837974548339844, -0.6381011009216309, 0.8075952529907227, 2.253291606903076, 3.6989879608154297, 5.144684314727783, 6.590380668640137, 8.036077499389648, 9.481773376464844, 10.927469253540039, 12.37316608428955, 13.818862915039062, 15.264558792114258, 16.710254669189453, 18.15595245361328, 19.601648330688477, 21.047344207763672, 22.493040084838867, 23.938735961914062, 25.38443374633789, 26.830129623413086, 28.27582550048828, 29.72152328491211, 31.167219161987305, 32.6129150390625, 34.05861282348633, 35.50430679321289, 36.95000457763672, 38.39569854736328, 39.84139633178711, 41.28709411621094, 42.7327880859375, 44.17848587036133]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 7.0, 4.0, 3.0, 3.0, 12.0, 16.0, 19.0, 5.0, 21.0, 17.0, 21.0, 22.0, 19.0, 28.0, 30.0, 24.0, 33.0, 29.0, 28.0, 33.0, 43.0, 42.0, 45.0, 30.0, 44.0, 32.0, 35.0, 54.0, 28.0, 40.0, 31.0, 25.0, 22.0, 31.0, 13.0, 25.0, 10.0, 22.0, 11.0, 7.0, 10.0, 9.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0], "bins": [-75.282470703125, -72.97908020019531, -70.6756820678711, -68.3722915649414, -66.06889343261719, -63.7655029296875, -61.46210861206055, -59.158714294433594, -56.855323791503906, -54.55192947387695, -52.24853515625, -49.94514465332031, -47.64175033569336, -45.338356018066406, -43.03496170043945, -40.7315673828125, -38.42817306518555, -36.124778747558594, -33.82138442993164, -31.51799201965332, -29.214599609375, -26.911205291748047, -24.607810974121094, -22.304418563842773, -20.00102424621582, -17.697629928588867, -15.394237518310547, -13.090843200683594, -10.787449836730957, -8.48405647277832, -6.180662155151367, -3.877269744873047, -1.5738754272460938, 0.7295181751251221, 3.032911777496338, 5.336305618286133, 7.6396989822387695, 9.943092346191406, 12.24648666381836, 14.54987907409668, 16.853273391723633, 19.156667709350586, 21.460060119628906, 23.76345443725586, 26.066848754882812, 28.370241165161133, 30.673635482788086, 32.977027893066406, 35.28042221069336, 37.58381652832031, 39.887210845947266, 42.19060516357422, 44.493995666503906, 46.79738998413086, 49.10078430175781, 51.4041748046875, 53.70757293701172, 56.01096725463867, 58.314361572265625, 60.61775207519531, 62.921146392822266, 65.22454071044922, 67.52793884277344, 69.83132934570312, 72.13471984863281]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 10.0, 13.0, 16.0, 20.0, 23.0, 46.0, 41.0, 65.0, 68.0, 113.0, 145.0, 222.0, 285.0, 440.0, 666.0, 1031.0, 1796.0, 2905.0, 4238.0, 6475.0, 1017905.0, 4935.0, 3345.0, 2044.0, 1293.0, 805.0, 467.0, 322.0, 230.0, 171.0, 128.0, 79.0, 68.0, 56.0, 37.0, 25.0, 23.0, 9.0, 9.0, 10.0, 10.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-663.8341064453125, -641.8236083984375, -619.8131713867188, -597.8026733398438, -575.792236328125, -553.78173828125, -531.771240234375, -509.76080322265625, -487.75030517578125, -465.7398376464844, -443.7293701171875, -421.7188720703125, -399.7084045410156, -377.69793701171875, -355.6874694824219, -333.677001953125, -311.6665344238281, -289.65606689453125, -267.6455993652344, -245.63511657714844, -223.6246337890625, -201.61416625976562, -179.60369873046875, -157.5932159423828, -135.58274841308594, -113.57227325439453, -91.56179809570312, -69.55133056640625, -47.540855407714844, -25.530380249023438, -3.5199127197265625, 18.490570068359375, 40.50103759765625, 62.511512756347656, 84.52198791503906, 106.53245544433594, 128.54293823242188, 150.55340576171875, 172.56387329101562, 194.57435607910156, 216.58482360839844, 238.5952911376953, 260.60577392578125, 282.6162414550781, 304.626708984375, 326.63720703125, 348.64764404296875, 370.65814208984375, 392.6686096191406, 414.6790771484375, 436.6895446777344, 458.70001220703125, 480.71051025390625, 502.7209777832031, 524.7314453125, 546.741943359375, 568.7523803710938, 590.7628784179688, 612.7733154296875, 634.7838134765625, 656.7942504882812, 678.8047485351562, 700.815185546875, 722.82568359375, 744.836181640625]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 7.0, 7.0, 8.0, 12.0, 24.0, 25.0, 31.0, 49.0, 42.0, 65.0, 100.0, 147.0, 208.0, 288.0, 403.0, 555.0, 813.0, 1402.0, 2355.0, 4689.0, 9104.0, 16414.0, 32120.0, 51279416.0, 70747.0, 23923.0, 12841.0, 6687.0, 3520.0, 1867.0, 1132.0, 680.0, 418.0, 361.0, 200.0, 186.0, 131.0, 95.0, 70.0, 43.0, 48.0, 31.0, 19.0, 12.0, 11.0, 6.0, 9.0, 3.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-520.4613037109375, -504.0864562988281, -487.71160888671875, -471.3367614746094, -454.9619140625, -438.5870361328125, -422.2121887207031, -405.83734130859375, -389.4624938964844, -373.087646484375, -356.7127990722656, -340.33795166015625, -323.96307373046875, -307.5882568359375, -291.21337890625, -274.8385314941406, -258.46368408203125, -242.08883666992188, -225.7139892578125, -209.33912658691406, -192.9642791748047, -176.5894317626953, -160.21456909179688, -143.8397216796875, -127.46487426757812, -111.09002685546875, -94.71517181396484, -78.34031677246094, -61.96546936035156, -45.59062194824219, -29.21576690673828, -12.840911865234375, 3.533935546875, 19.90878677368164, 36.28363800048828, 52.65848922729492, 69.03334045410156, 85.40818786621094, 101.78304290771484, 118.15789794921875, 134.53274536132812, 150.9075927734375, 167.28244018554688, 183.6573028564453, 200.0321502685547, 216.40699768066406, 232.7818603515625, 249.15670776367188, 265.53155517578125, 281.9064025878906, 298.28125, 314.6560974121094, 331.03094482421875, 347.40582275390625, 363.7806701660156, 380.155517578125, 396.5303649902344, 412.90521240234375, 429.2800598144531, 445.6549072265625, 462.02978515625, 478.40460205078125, 494.77947998046875, 511.1543273925781, 527.5291748046875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 11.0, 18.0, 23.0, 23.0, 44.0, 73.0, 90.0, 205.0, 276.0, 481.0, 729.0, 1192.0, 2091.0, 3673.0, 6792.0, 12649.0, 24810.0, 50468.0, 105060.0, 229071.0, 525489.0, 1329326.0, 2191610.0, 1029271.0, 418198.0, 186790.0, 86637.0, 41471.0, 20717.0, 10733.0, 5672.0, 3225.0, 1790.0, 1067.0, 614.0, 378.0, 219.0, 151.0, 105.0, 66.0, 46.0, 34.0, 21.0, 13.0, 5.0, 1.0, 6.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-59.9375, -58.1416015625, -56.345703125, -54.5498046875, -52.75390625, -50.9580078125, -49.162109375, -47.3662109375, -45.5703125, -43.7744140625, -41.978515625, -40.1826171875, -38.38671875, -36.5908203125, -34.794921875, -32.9990234375, -31.203125, -29.4072265625, -27.611328125, -25.8154296875, -24.01953125, -22.2236328125, -20.427734375, -18.6318359375, -16.8359375, -15.0400390625, -13.244140625, -11.4482421875, -9.65234375, -7.8564453125, -6.060546875, -4.2646484375, -2.46875, -0.6728515625, 1.123046875, 2.9189453125, 4.71484375, 6.5107421875, 8.306640625, 10.1025390625, 11.8984375, 13.6943359375, 15.490234375, 17.2861328125, 19.08203125, 20.8779296875, 22.673828125, 24.4697265625, 26.265625, 28.0615234375, 29.857421875, 31.6533203125, 33.44921875, 35.2451171875, 37.041015625, 38.8369140625, 40.6328125, 42.4287109375, 44.224609375, 46.0205078125, 47.81640625, 49.6123046875, 51.408203125, 53.2041015625, 55.0]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 7.0, 4.0, 2.0, 6.0, 6.0, 8.0, 9.0, 10.0, 21.0, 25.0, 19.0, 25.0, 21.0, 34.0, 46.0, 48.0, 67.0, 77.0, 102.0, 142.0, 194.0, 217.0, 226.0, 150.0, 124.0, 87.0, 67.0, 62.0, 39.0, 33.0, 33.0, 17.0, 20.0, 11.0, 20.0, 12.0, 12.0, 9.0, 6.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.375, -39.0439453125, -37.712890625, -36.3818359375, -35.05078125, -33.7197265625, -32.388671875, -31.0576171875, -29.7265625, -28.3955078125, -27.064453125, -25.7333984375, -24.40234375, -23.0712890625, -21.740234375, -20.4091796875, -19.078125, -17.7470703125, -16.416015625, -15.0849609375, -13.75390625, -12.4228515625, -11.091796875, -9.7607421875, -8.4296875, -7.0986328125, -5.767578125, -4.4365234375, -3.10546875, -1.7744140625, -0.443359375, 0.8876953125, 2.21875, 3.5498046875, 4.880859375, 6.2119140625, 7.54296875, 8.8740234375, 10.205078125, 11.5361328125, 12.8671875, 14.1982421875, 15.529296875, 16.8603515625, 18.19140625, 19.5224609375, 20.853515625, 22.1845703125, 23.515625, 24.8466796875, 26.177734375, 27.5087890625, 28.83984375, 30.1708984375, 31.501953125, 32.8330078125, 34.1640625, 35.4951171875, 36.826171875, 38.1572265625, 39.48828125, 40.8193359375, 42.150390625, 43.4814453125, 44.8125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 8.0, 7.0, 12.0, 19.0, 40.0, 36.0, 62.0, 66.0, 87.0, 147.0, 244.0, 371.0, 564.0, 1048.0, 1634.0, 2856.0, 4437.0, 7804.0, 13213.0, 22393.0, 36600.0, 60408.0, 96115.0, 152450.0, 237408.0, 383416.0, 815431.0, 1952018.0, 1241952.0, 494450.0, 283598.0, 182168.0, 116852.0, 71807.0, 44470.0, 26613.0, 16433.0, 9698.0, 5741.0, 3478.0, 2041.0, 1218.0, 753.0, 442.0, 284.0, 195.0, 115.0, 82.0, 45.0, 35.0, 21.0, 19.0, 12.0, 7.0, 11.0, 5.0, 1.0, 4.0, 1.0, 1.0], "bins": [-24.84375, -24.06005859375, -23.2763671875, -22.49267578125, -21.708984375, -20.92529296875, -20.1416015625, -19.35791015625, -18.57421875, -17.79052734375, -17.0068359375, -16.22314453125, -15.439453125, -14.65576171875, -13.8720703125, -13.08837890625, -12.3046875, -11.52099609375, -10.7373046875, -9.95361328125, -9.169921875, -8.38623046875, -7.6025390625, -6.81884765625, -6.03515625, -5.25146484375, -4.4677734375, -3.68408203125, -2.900390625, -2.11669921875, -1.3330078125, -0.54931640625, 0.234375, 1.01806640625, 1.8017578125, 2.58544921875, 3.369140625, 4.15283203125, 4.9365234375, 5.72021484375, 6.50390625, 7.28759765625, 8.0712890625, 8.85498046875, 9.638671875, 10.42236328125, 11.2060546875, 11.98974609375, 12.7734375, 13.55712890625, 14.3408203125, 15.12451171875, 15.908203125, 16.69189453125, 17.4755859375, 18.25927734375, 19.04296875, 19.82666015625, 20.6103515625, 21.39404296875, 22.177734375, 22.96142578125, 23.7451171875, 24.52880859375, 25.3125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 8.0, 6.0, 4.0, 5.0, 10.0, 15.0, 13.0, 14.0, 22.0, 24.0, 22.0, 39.0, 40.0, 55.0, 51.0, 69.0, 125.0, 253.0, 375.0, 267.0, 169.0, 111.0, 68.0, 49.0, 49.0, 30.0, 30.0, 26.0, 16.0, 16.0, 16.0, 11.0, 13.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.9375, -46.7568359375, -44.576171875, -42.3955078125, -40.21484375, -38.0341796875, -35.853515625, -33.6728515625, -31.4921875, -29.3115234375, -27.130859375, -24.9501953125, -22.76953125, -20.5888671875, -18.408203125, -16.2275390625, -14.046875, -11.8662109375, -9.685546875, -7.5048828125, -5.32421875, -3.1435546875, -0.962890625, 1.2177734375, 3.3984375, 5.5791015625, 7.759765625, 9.9404296875, 12.12109375, 14.3017578125, 16.482421875, 18.6630859375, 20.84375, 23.0244140625, 25.205078125, 27.3857421875, 29.56640625, 31.7470703125, 33.927734375, 36.1083984375, 38.2890625, 40.4697265625, 42.650390625, 44.8310546875, 47.01171875, 49.1923828125, 51.373046875, 53.5537109375, 55.734375, 57.9150390625, 60.095703125, 62.2763671875, 64.45703125, 66.6376953125, 68.818359375, 70.9990234375, 73.1796875, 75.3603515625, 77.541015625, 79.7216796875, 81.90234375, 84.0830078125, 86.263671875, 88.4443359375, 90.625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 6.0, 5.0, 0.0, 4.0, 6.0, 7.0, 13.0, 25.0, 21.0, 30.0, 36.0, 53.0, 69.0, 133.0, 172.0, 241.0, 335.0, 540.0, 824.0, 1173.0, 1979.0, 3606.0, 6422.0, 11941.0, 23327.0, 47449.0, 104083.0, 3984642.0, 1903583.0, 102592.0, 46949.0, 23351.0, 11828.0, 6459.0, 3595.0, 2064.0, 1297.0, 811.0, 529.0, 324.0, 266.0, 168.0, 134.0, 96.0, 74.0, 41.0, 30.0, 34.0, 25.0, 21.0, 11.0, 11.0, 3.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-85.625, -82.671875, -79.71875, -76.765625, -73.8125, -70.859375, -67.90625, -64.953125, -62.0, -59.046875, -56.09375, -53.140625, -50.1875, -47.234375, -44.28125, -41.328125, -38.375, -35.421875, -32.46875, -29.515625, -26.5625, -23.609375, -20.65625, -17.703125, -14.75, -11.796875, -8.84375, -5.890625, -2.9375, 0.015625, 2.96875, 5.921875, 8.875, 11.828125, 14.78125, 17.734375, 20.6875, 23.640625, 26.59375, 29.546875, 32.5, 35.453125, 38.40625, 41.359375, 44.3125, 47.265625, 50.21875, 53.171875, 56.125, 59.078125, 62.03125, 64.984375, 67.9375, 70.890625, 73.84375, 76.796875, 79.75, 82.703125, 85.65625, 88.609375, 91.5625, 94.515625, 97.46875, 100.421875, 103.375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 10.0, 9.0, 11.0, 16.0, 21.0, 21.0, 22.0, 23.0, 33.0, 36.0, 47.0, 45.0, 43.0, 55.0, 115.0, 388.0, 442.0, 210.0, 94.0, 70.0, 47.0, 41.0, 33.0, 30.0, 35.0, 22.0, 18.0, 16.0, 15.0, 11.0, 12.0, 5.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-113.875, -110.5380859375, -107.201171875, -103.8642578125, -100.52734375, -97.1904296875, -93.853515625, -90.5166015625, -87.1796875, -83.8427734375, -80.505859375, -77.1689453125, -73.83203125, -70.4951171875, -67.158203125, -63.8212890625, -60.484375, -57.1474609375, -53.810546875, -50.4736328125, -47.13671875, -43.7998046875, -40.462890625, -37.1259765625, -33.7890625, -30.4521484375, -27.115234375, -23.7783203125, -20.44140625, -17.1044921875, -13.767578125, -10.4306640625, -7.09375, -3.7568359375, -0.419921875, 2.9169921875, 6.25390625, 9.5908203125, 12.927734375, 16.2646484375, 19.6015625, 22.9384765625, 26.275390625, 29.6123046875, 32.94921875, 36.2861328125, 39.623046875, 42.9599609375, 46.296875, 49.6337890625, 52.970703125, 56.3076171875, 59.64453125, 62.9814453125, 66.318359375, 69.6552734375, 72.9921875, 76.3291015625, 79.666015625, 83.0029296875, 86.33984375, 89.6767578125, 93.013671875, 96.3505859375, 99.6875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 2.0, 4.0, 7.0, 3.0, 18.0, 25.0, 38.0, 63.0, 99.0, 171.0, 243.0, 101.0, 76.0, 48.0, 39.0, 14.0, 11.0, 12.0, 7.0, 4.0, 6.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2903.458740234375, -2837.835693359375, -2772.212890625, -2706.58984375, -2640.967041015625, -2575.343994140625, -2509.72119140625, -2444.09814453125, -2378.47509765625, -2312.85205078125, -2247.229248046875, -2181.606201171875, -2115.9833984375, -2050.3603515625, -1984.7374267578125, -1919.114501953125, -1853.4915771484375, -1787.86865234375, -1722.2457275390625, -1656.622802734375, -1590.999755859375, -1525.3768310546875, -1459.75390625, -1394.1309814453125, -1328.508056640625, -1262.8851318359375, -1197.26220703125, -1131.63916015625, -1066.0162353515625, -1000.393310546875, -934.7703857421875, -869.1474609375, -803.5244140625, -737.9014892578125, -672.2785034179688, -606.6555786132812, -541.0325927734375, -475.40966796875, -409.7867431640625, -344.1637878417969, -278.54083251953125, -212.91787719726562, -147.29493713378906, -81.6719970703125, -16.049041748046875, 49.57391357421875, 115.19683837890625, 180.81979370117188, 246.4427490234375, 312.0657043457031, 377.68865966796875, 443.31158447265625, 508.9345397949219, 574.5574951171875, 640.180419921875, 705.8033447265625, 771.4263305664062, 837.0492553710938, 902.6722412109375, 968.295166015625, 1033.9180908203125, 1099.541015625, 1165.1640625, 1230.7869873046875, 1296.409912109375]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 8.0, 7.0, 7.0, 7.0, 16.0, 10.0, 22.0, 12.0, 16.0, 10.0, 20.0, 12.0, 28.0, 28.0, 33.0, 40.0, 52.0, 81.0, 101.0, 92.0, 69.0, 51.0, 50.0, 30.0, 27.0, 18.0, 24.0, 23.0, 13.0, 18.0, 15.0, 15.0, 5.0, 8.0, 9.0, 2.0, 7.0, 2.0, 4.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1565.72216796875, -1518.025146484375, -1470.328125, -1422.631103515625, -1374.93408203125, -1327.237060546875, -1279.5400390625, -1231.8428955078125, -1184.1458740234375, -1136.4488525390625, -1088.7518310546875, -1041.0548095703125, -993.3577270507812, -945.6607055664062, -897.9636840820312, -850.2666015625, -802.5696411132812, -754.8726196289062, -707.1755981445312, -659.478515625, -611.781494140625, -564.08447265625, -516.387451171875, -468.6903991699219, -420.9933776855469, -373.2963562011719, -325.59930419921875, -277.90228271484375, -230.2052459716797, -182.50820922851562, -134.81118774414062, -87.1141357421875, -39.4171142578125, 8.279918670654297, 55.976951599121094, 103.67398071289062, 151.3710174560547, 199.06805419921875, 246.76507568359375, 294.4621276855469, 342.1591491699219, 389.8561706542969, 437.55322265625, 485.250244140625, 532.947265625, 580.644287109375, 628.34130859375, 676.0383911132812, 723.7354125976562, 771.4324340820312, 819.1294555664062, 866.8265380859375, 914.5235595703125, 962.2205810546875, 1009.9176025390625, 1057.6146240234375, 1105.3116455078125, 1153.0086669921875, 1200.7056884765625, 1248.4027099609375, 1296.0997314453125, 1343.796875, 1391.493896484375, 1439.19091796875, 1486.887939453125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 5.0, 5.0, 5.0, 10.0, 14.0, 17.0, 22.0, 27.0, 38.0, 51.0, 88.0, 103.0, 175.0, 220.0, 290.0, 464.0, 657.0, 961.0, 1489.0, 2420.0, 3903.0, 6620.0, 11605.0, 22780.0, 51125.0, 175954.0, 3290695.0, 481977.0, 80014.0, 30502.0, 14254.0, 7553.0, 4074.0, 2331.0, 1413.0, 830.0, 546.0, 351.0, 264.0, 133.0, 98.0, 77.0, 41.0, 32.0, 23.0, 14.0, 9.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.40625, -13.0198974609375, -12.633544921875, -12.2471923828125, -11.86083984375, -11.4744873046875, -11.088134765625, -10.7017822265625, -10.3154296875, -9.9290771484375, -9.542724609375, -9.1563720703125, -8.77001953125, -8.3836669921875, -7.997314453125, -7.6109619140625, -7.224609375, -6.8382568359375, -6.451904296875, -6.0655517578125, -5.67919921875, -5.2928466796875, -4.906494140625, -4.5201416015625, -4.1337890625, -3.7474365234375, -3.361083984375, -2.9747314453125, -2.58837890625, -2.2020263671875, -1.815673828125, -1.4293212890625, -1.04296875, -0.6566162109375, -0.270263671875, 0.1160888671875, 0.50244140625, 0.8887939453125, 1.275146484375, 1.6614990234375, 2.0478515625, 2.4342041015625, 2.820556640625, 3.2069091796875, 3.59326171875, 3.9796142578125, 4.365966796875, 4.7523193359375, 5.138671875, 5.5250244140625, 5.911376953125, 6.2977294921875, 6.68408203125, 7.0704345703125, 7.456787109375, 7.8431396484375, 8.2294921875, 8.6158447265625, 9.002197265625, 9.3885498046875, 9.77490234375, 10.1612548828125, 10.547607421875, 10.9339599609375, 11.3203125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 7.0, 4.0, 11.0, 6.0, 8.0, 10.0, 11.0, 26.0, 59.0, 137.0, 264.0, 200.0, 98.0, 42.0, 20.0, 17.0, 18.0, 11.0, 7.0, 7.0, 4.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5625, -2.488616943359375, -2.41473388671875, -2.340850830078125, -2.2669677734375, -2.193084716796875, -2.11920166015625, -2.045318603515625, -1.971435546875, -1.897552490234375, -1.82366943359375, -1.749786376953125, -1.6759033203125, -1.602020263671875, -1.52813720703125, -1.454254150390625, -1.38037109375, -1.306488037109375, -1.23260498046875, -1.158721923828125, -1.0848388671875, -1.010955810546875, -0.93707275390625, -0.863189697265625, -0.789306640625, -0.715423583984375, -0.64154052734375, -0.567657470703125, -0.4937744140625, -0.419891357421875, -0.34600830078125, -0.272125244140625, -0.1982421875, -0.124359130859375, -0.05047607421875, 0.023406982421875, 0.0972900390625, 0.171173095703125, 0.24505615234375, 0.318939208984375, 0.392822265625, 0.466705322265625, 0.54058837890625, 0.614471435546875, 0.6883544921875, 0.762237548828125, 0.83612060546875, 0.910003662109375, 0.98388671875, 1.057769775390625, 1.13165283203125, 1.205535888671875, 1.2794189453125, 1.353302001953125, 1.42718505859375, 1.501068115234375, 1.574951171875, 1.648834228515625, 1.72271728515625, 1.796600341796875, 1.8704833984375, 1.944366455078125, 2.01824951171875, 2.092132568359375, 2.166015625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 9.0, 12.0, 14.0, 29.0, 32.0, 41.0, 81.0, 88.0, 188.0, 312.0, 525.0, 940.0, 1708.0, 3596.0, 8327.0, 21471.0, 65492.0, 245330.0, 1159490.0, 2072843.0, 447925.0, 109711.0, 33391.0, 12359.0, 5161.0, 2366.0, 1143.0, 651.0, 353.0, 208.0, 146.0, 93.0, 73.0, 45.0, 35.0, 20.0, 19.0, 10.0, 4.0, 16.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.4375, -9.135009765625, -8.83251953125, -8.530029296875, -8.2275390625, -7.925048828125, -7.62255859375, -7.320068359375, -7.017578125, -6.715087890625, -6.41259765625, -6.110107421875, -5.8076171875, -5.505126953125, -5.20263671875, -4.900146484375, -4.59765625, -4.295166015625, -3.99267578125, -3.690185546875, -3.3876953125, -3.085205078125, -2.78271484375, -2.480224609375, -2.177734375, -1.875244140625, -1.57275390625, -1.270263671875, -0.9677734375, -0.665283203125, -0.36279296875, -0.060302734375, 0.2421875, 0.544677734375, 0.84716796875, 1.149658203125, 1.4521484375, 1.754638671875, 2.05712890625, 2.359619140625, 2.662109375, 2.964599609375, 3.26708984375, 3.569580078125, 3.8720703125, 4.174560546875, 4.47705078125, 4.779541015625, 5.08203125, 5.384521484375, 5.68701171875, 5.989501953125, 6.2919921875, 6.594482421875, 6.89697265625, 7.199462890625, 7.501953125, 7.804443359375, 8.10693359375, 8.409423828125, 8.7119140625, 9.014404296875, 9.31689453125, 9.619384765625, 9.921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 7.0, 8.0, 9.0, 15.0, 20.0, 21.0, 43.0, 53.0, 58.0, 98.0, 125.0, 167.0, 219.0, 294.0, 408.0, 583.0, 487.0, 376.0, 273.0, 207.0, 146.0, 113.0, 96.0, 68.0, 42.0, 37.0, 19.0, 16.0, 14.0, 15.0, 9.0, 7.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.68359375, -3.56744384765625, -3.4512939453125, -3.33514404296875, -3.218994140625, -3.10284423828125, -2.9866943359375, -2.87054443359375, -2.75439453125, -2.63824462890625, -2.5220947265625, -2.40594482421875, -2.289794921875, -2.17364501953125, -2.0574951171875, -1.94134521484375, -1.8251953125, -1.70904541015625, -1.5928955078125, -1.47674560546875, -1.360595703125, -1.24444580078125, -1.1282958984375, -1.01214599609375, -0.89599609375, -0.77984619140625, -0.6636962890625, -0.54754638671875, -0.431396484375, -0.31524658203125, -0.1990966796875, -0.08294677734375, 0.033203125, 0.14935302734375, 0.2655029296875, 0.38165283203125, 0.497802734375, 0.61395263671875, 0.7301025390625, 0.84625244140625, 0.96240234375, 1.07855224609375, 1.1947021484375, 1.31085205078125, 1.427001953125, 1.54315185546875, 1.6593017578125, 1.77545166015625, 1.8916015625, 2.00775146484375, 2.1239013671875, 2.24005126953125, 2.356201171875, 2.47235107421875, 2.5885009765625, 2.70465087890625, 2.82080078125, 2.93695068359375, 3.0531005859375, 3.16925048828125, 3.285400390625, 3.40155029296875, 3.5177001953125, 3.63385009765625, 3.75]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 9.0, 14.0, 44.0, 79.0, 140.0, 217.0, 245.0, 123.0, 66.0, 35.0, 16.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.758819580078125, -45.90781021118164, -44.056800842285156, -42.205787658691406, -40.35477828979492, -38.50376892089844, -36.65275955200195, -34.80175018310547, -32.95073699951172, -31.099727630615234, -29.248716354370117, -27.397706985473633, -25.546695709228516, -23.69568634033203, -21.844676971435547, -19.993667602539062, -18.142658233642578, -16.291648864746094, -14.440637588500977, -12.589628219604492, -10.738617897033691, -8.88760757446289, -7.036598205566406, -5.1855878829956055, -3.3345775604248047, -1.483567476272583, 0.36744260787963867, 2.2184524536132812, 4.069462776184082, 5.920473098754883, 7.771482467651367, 9.622492790222168, 11.473503112792969, 13.32451343536377, 15.17552375793457, 17.026533126831055, 18.877544403076172, 20.728553771972656, 22.57956314086914, 24.430572509765625, 26.281583786010742, 28.132593154907227, 29.983604431152344, 31.834613800048828, 33.68562316894531, 35.53663635253906, 37.38764190673828, 39.23865509033203, 41.089664459228516, 42.940673828125, 44.791683197021484, 46.64269256591797, 48.49370574951172, 50.3447151184082, 52.19572448730469, 54.04673385620117, 55.897743225097656, 57.74875259399414, 59.599761962890625, 61.450775146484375, 63.30178451538086, 65.15279388427734, 67.00379943847656, 68.85481262207031, 70.70582580566406]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 5.0, 7.0, 20.0, 15.0, 10.0, 18.0, 36.0, 30.0, 33.0, 42.0, 50.0, 54.0, 73.0, 55.0, 64.0, 62.0, 58.0, 62.0, 47.0, 43.0, 37.0, 33.0, 29.0, 24.0, 17.0, 14.0, 13.0, 14.0, 13.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.553367614746094, -23.76286506652832, -22.972362518310547, -22.181861877441406, -21.391359329223633, -20.60085678100586, -19.81035614013672, -19.019853591918945, -18.229351043701172, -17.4388484954834, -16.648345947265625, -15.857845306396484, -15.067342758178711, -14.276840209960938, -13.48633861541748, -12.695837020874023, -11.90533447265625, -11.114831924438477, -10.32433032989502, -9.533828735351562, -8.743326187133789, -7.952824115753174, -7.162322044372559, -6.371819972991943, -5.581317901611328, -4.790815830230713, -4.000313758850098, -3.2098116874694824, -2.419309616088867, -1.628807544708252, -0.8383054733276367, -0.047803401947021484, 0.7426986694335938, 1.533200740814209, 2.323702812194824, 3.1142048835754395, 3.9047069549560547, 4.69520902633667, 5.485711097717285, 6.2762131690979, 7.066715240478516, 7.857217311859131, 8.647719383239746, 9.438220977783203, 10.228723526000977, 11.01922607421875, 11.809727668762207, 12.600229263305664, 13.390731811523438, 14.181234359741211, 14.971735954284668, 15.762237548828125, 16.5527400970459, 17.343242645263672, 18.133743286132812, 18.924245834350586, 19.71474838256836, 20.505250930786133, 21.295753479003906, 22.086254119873047, 22.87675666809082, 23.667259216308594, 24.457759857177734, 25.248262405395508, 26.03876495361328]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 9.0, 16.0, 17.0, 20.0, 28.0, 43.0, 52.0, 74.0, 80.0, 115.0, 176.0, 223.0, 296.0, 397.0, 578.0, 831.0, 1318.0, 2031.0, 3015.0, 4913.0, 8477.0, 17031.0, 44282.0, 210940.0, 588909.0, 103831.0, 29265.0, 12650.0, 7018.0, 3999.0, 2609.0, 1619.0, 1074.0, 737.0, 516.0, 386.0, 239.0, 166.0, 132.0, 103.0, 96.0, 61.0, 51.0, 37.0, 25.0, 22.0, 18.0, 9.0, 6.0, 5.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-6.14453125, -5.954345703125, -5.76416015625, -5.573974609375, -5.3837890625, -5.193603515625, -5.00341796875, -4.813232421875, -4.623046875, -4.432861328125, -4.24267578125, -4.052490234375, -3.8623046875, -3.672119140625, -3.48193359375, -3.291748046875, -3.1015625, -2.911376953125, -2.72119140625, -2.531005859375, -2.3408203125, -2.150634765625, -1.96044921875, -1.770263671875, -1.580078125, -1.389892578125, -1.19970703125, -1.009521484375, -0.8193359375, -0.629150390625, -0.43896484375, -0.248779296875, -0.05859375, 0.131591796875, 0.32177734375, 0.511962890625, 0.7021484375, 0.892333984375, 1.08251953125, 1.272705078125, 1.462890625, 1.653076171875, 1.84326171875, 2.033447265625, 2.2236328125, 2.413818359375, 2.60400390625, 2.794189453125, 2.984375, 3.174560546875, 3.36474609375, 3.554931640625, 3.7451171875, 3.935302734375, 4.12548828125, 4.315673828125, 4.505859375, 4.696044921875, 4.88623046875, 5.076416015625, 5.2666015625, 5.456787109375, 5.64697265625, 5.837158203125, 6.02734375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 4.0, 5.0, 2.0, 4.0, 12.0, 6.0, 8.0, 5.0, 8.0, 18.0, 37.0, 56.0, 93.0, 140.0, 171.0, 152.0, 105.0, 58.0, 30.0, 20.0, 17.0, 11.0, 7.0, 4.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.748046875, -2.67462158203125, -2.6011962890625, -2.52777099609375, -2.454345703125, -2.38092041015625, -2.3074951171875, -2.23406982421875, -2.16064453125, -2.08721923828125, -2.0137939453125, -1.94036865234375, -1.866943359375, -1.79351806640625, -1.7200927734375, -1.64666748046875, -1.5732421875, -1.49981689453125, -1.4263916015625, -1.35296630859375, -1.279541015625, -1.20611572265625, -1.1326904296875, -1.05926513671875, -0.98583984375, -0.91241455078125, -0.8389892578125, -0.76556396484375, -0.692138671875, -0.61871337890625, -0.5452880859375, -0.47186279296875, -0.3984375, -0.32501220703125, -0.2515869140625, -0.17816162109375, -0.104736328125, -0.03131103515625, 0.0421142578125, 0.11553955078125, 0.18896484375, 0.26239013671875, 0.3358154296875, 0.40924072265625, 0.482666015625, 0.55609130859375, 0.6295166015625, 0.70294189453125, 0.7763671875, 0.84979248046875, 0.9232177734375, 0.99664306640625, 1.070068359375, 1.14349365234375, 1.2169189453125, 1.29034423828125, 1.36376953125, 1.43719482421875, 1.5106201171875, 1.58404541015625, 1.657470703125, 1.73089599609375, 1.8043212890625, 1.87774658203125, 1.951171875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 10.0, 8.0, 8.0, 14.0, 18.0, 22.0, 27.0, 46.0, 63.0, 116.0, 158.0, 269.0, 456.0, 773.0, 1532.0, 2802.0, 5273.0, 10787.0, 22862.0, 53739.0, 148931.0, 422857.0, 238597.0, 78224.0, 31718.0, 14232.0, 6901.0, 3607.0, 1947.0, 1044.0, 582.0, 354.0, 185.0, 134.0, 66.0, 59.0, 43.0, 28.0, 18.0, 15.0, 12.0, 8.0, 4.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.95703125, -5.77484130859375, -5.5926513671875, -5.41046142578125, -5.228271484375, -5.04608154296875, -4.8638916015625, -4.68170166015625, -4.49951171875, -4.31732177734375, -4.1351318359375, -3.95294189453125, -3.770751953125, -3.58856201171875, -3.4063720703125, -3.22418212890625, -3.0419921875, -2.85980224609375, -2.6776123046875, -2.49542236328125, -2.313232421875, -2.13104248046875, -1.9488525390625, -1.76666259765625, -1.58447265625, -1.40228271484375, -1.2200927734375, -1.03790283203125, -0.855712890625, -0.67352294921875, -0.4913330078125, -0.30914306640625, -0.126953125, 0.05523681640625, 0.2374267578125, 0.41961669921875, 0.601806640625, 0.78399658203125, 0.9661865234375, 1.14837646484375, 1.33056640625, 1.51275634765625, 1.6949462890625, 1.87713623046875, 2.059326171875, 2.24151611328125, 2.4237060546875, 2.60589599609375, 2.7880859375, 2.97027587890625, 3.1524658203125, 3.33465576171875, 3.516845703125, 3.69903564453125, 3.8812255859375, 4.06341552734375, 4.24560546875, 4.42779541015625, 4.6099853515625, 4.79217529296875, 4.974365234375, 5.15655517578125, 5.3387451171875, 5.52093505859375, 5.703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 4.0, 4.0, 9.0, 10.0, 9.0, 7.0, 11.0, 25.0, 19.0, 15.0, 18.0, 27.0, 37.0, 29.0, 34.0, 36.0, 45.0, 38.0, 47.0, 55.0, 58.0, 40.0, 39.0, 53.0, 32.0, 30.0, 31.0, 43.0, 23.0, 36.0, 31.0, 20.0, 19.0, 17.0, 11.0, 9.0, 9.0, 7.0, 7.0, 6.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4375, -8.1761474609375, -7.914794921875, -7.6534423828125, -7.39208984375, -7.1307373046875, -6.869384765625, -6.6080322265625, -6.3466796875, -6.0853271484375, -5.823974609375, -5.5626220703125, -5.30126953125, -5.0399169921875, -4.778564453125, -4.5172119140625, -4.255859375, -3.9945068359375, -3.733154296875, -3.4718017578125, -3.21044921875, -2.9490966796875, -2.687744140625, -2.4263916015625, -2.1650390625, -1.9036865234375, -1.642333984375, -1.3809814453125, -1.11962890625, -0.8582763671875, -0.596923828125, -0.3355712890625, -0.07421875, 0.1871337890625, 0.448486328125, 0.7098388671875, 0.97119140625, 1.2325439453125, 1.493896484375, 1.7552490234375, 2.0166015625, 2.2779541015625, 2.539306640625, 2.8006591796875, 3.06201171875, 3.3233642578125, 3.584716796875, 3.8460693359375, 4.107421875, 4.3687744140625, 4.630126953125, 4.8914794921875, 5.15283203125, 5.4141845703125, 5.675537109375, 5.9368896484375, 6.1982421875, 6.4595947265625, 6.720947265625, 6.9822998046875, 7.24365234375, 7.5050048828125, 7.766357421875, 8.0277099609375, 8.2890625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 2.0, 5.0, 6.0, 11.0, 6.0, 13.0, 19.0, 22.0, 31.0, 74.0, 126.0, 290.0, 841.0, 2939.0, 16283.0, 310297.0, 683451.0, 27826.0, 4428.0, 1116.0, 370.0, 173.0, 72.0, 59.0, 25.0, 20.0, 9.0, 10.0, 9.0, 6.0, 3.0, 4.0, 5.0, 7.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0], "bins": [-17.765625, -17.3228759765625, -16.880126953125, -16.4373779296875, -15.99462890625, -15.5518798828125, -15.109130859375, -14.6663818359375, -14.2236328125, -13.7808837890625, -13.338134765625, -12.8953857421875, -12.45263671875, -12.0098876953125, -11.567138671875, -11.1243896484375, -10.681640625, -10.2388916015625, -9.796142578125, -9.3533935546875, -8.91064453125, -8.4678955078125, -8.025146484375, -7.5823974609375, -7.1396484375, -6.6968994140625, -6.254150390625, -5.8114013671875, -5.36865234375, -4.9259033203125, -4.483154296875, -4.0404052734375, -3.59765625, -3.1549072265625, -2.712158203125, -2.2694091796875, -1.82666015625, -1.3839111328125, -0.941162109375, -0.4984130859375, -0.0556640625, 0.3870849609375, 0.829833984375, 1.2725830078125, 1.71533203125, 2.1580810546875, 2.600830078125, 3.0435791015625, 3.486328125, 3.9290771484375, 4.371826171875, 4.8145751953125, 5.25732421875, 5.7000732421875, 6.142822265625, 6.5855712890625, 7.0283203125, 7.4710693359375, 7.913818359375, 8.3565673828125, 8.79931640625, 9.2420654296875, 9.684814453125, 10.1275634765625, 10.5703125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 11.0, 15.0, 14.0, 12.0, 22.0, 37.0, 38.0, 41.0, 53.0, 48.0, 73.0, 78.0, 74.0, 54.0, 68.0, 58.0, 57.0, 34.0, 40.0, 35.0, 23.0, 25.0, 11.0, 16.0, 12.0, 6.0, 6.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0002601146697998047, -0.0002533774822950363, -0.00024664029479026794, -0.00023990310728549957, -0.0002331659197807312, -0.00022642873227596283, -0.00021969154477119446, -0.00021295435726642609, -0.00020621716976165771, -0.00019947998225688934, -0.00019274279475212097, -0.0001860056072473526, -0.00017926841974258423, -0.00017253123223781586, -0.00016579404473304749, -0.00015905685722827911, -0.00015231966972351074, -0.00014558248221874237, -0.000138845294713974, -0.00013210810720920563, -0.00012537091970443726, -0.00011863373219966888, -0.00011189654469490051, -0.00010515935719013214, -9.842216968536377e-05, -9.16849821805954e-05, -8.494779467582703e-05, -7.821060717105865e-05, -7.147341966629028e-05, -6.473623216152191e-05, -5.799904465675354e-05, -5.126185715198517e-05, -4.45246696472168e-05, -3.7787482142448425e-05, -3.1050294637680054e-05, -2.4313107132911682e-05, -1.757591962814331e-05, -1.0838732123374939e-05, -4.101544618606567e-06, 2.635642886161804e-06, 9.372830390930176e-06, 1.6110017895698547e-05, 2.284720540046692e-05, 2.958439290523529e-05, 3.632158041000366e-05, 4.3058767914772034e-05, 4.9795955419540405e-05, 5.653314292430878e-05, 6.327033042907715e-05, 7.000751793384552e-05, 7.674470543861389e-05, 8.348189294338226e-05, 9.021908044815063e-05, 9.6956267952919e-05, 0.00010369345545768738, 0.00011043064296245575, 0.00011716783046722412, 0.0001239050179719925, 0.00013064220547676086, 0.00013737939298152924, 0.0001441165804862976, 0.00015085376799106598, 0.00015759095549583435, 0.00016432814300060272, 0.0001710653305053711]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 7.0, 6.0, 9.0, 16.0, 18.0, 42.0, 57.0, 135.0, 208.0, 425.0, 954.0, 2160.0, 6407.0, 24009.0, 155704.0, 688232.0, 138121.0, 22180.0, 6036.0, 2037.0, 886.0, 418.0, 181.0, 119.0, 68.0, 32.0, 27.0, 23.0, 17.0, 10.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.0859375, -10.79779052734375, -10.5096435546875, -10.22149658203125, -9.933349609375, -9.64520263671875, -9.3570556640625, -9.06890869140625, -8.78076171875, -8.49261474609375, -8.2044677734375, -7.91632080078125, -7.628173828125, -7.34002685546875, -7.0518798828125, -6.76373291015625, -6.4755859375, -6.18743896484375, -5.8992919921875, -5.61114501953125, -5.322998046875, -5.03485107421875, -4.7467041015625, -4.45855712890625, -4.17041015625, -3.88226318359375, -3.5941162109375, -3.30596923828125, -3.017822265625, -2.72967529296875, -2.4415283203125, -2.15338134765625, -1.865234375, -1.57708740234375, -1.2889404296875, -1.00079345703125, -0.712646484375, -0.42449951171875, -0.1363525390625, 0.15179443359375, 0.43994140625, 0.72808837890625, 1.0162353515625, 1.30438232421875, 1.592529296875, 1.88067626953125, 2.1688232421875, 2.45697021484375, 2.7451171875, 3.03326416015625, 3.3214111328125, 3.60955810546875, 3.897705078125, 4.18585205078125, 4.4739990234375, 4.76214599609375, 5.05029296875, 5.33843994140625, 5.6265869140625, 5.91473388671875, 6.202880859375, 6.49102783203125, 6.7791748046875, 7.06732177734375, 7.35546875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 6.0, 2.0, 7.0, 11.0, 2.0, 6.0, 15.0, 20.0, 16.0, 35.0, 41.0, 47.0, 54.0, 65.0, 72.0, 83.0, 82.0, 71.0, 88.0, 64.0, 37.0, 38.0, 32.0, 32.0, 18.0, 18.0, 12.0, 9.0, 5.0, 4.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.22918701171875, -4.0638427734375, -3.89849853515625, -3.733154296875, -3.56781005859375, -3.4024658203125, -3.23712158203125, -3.07177734375, -2.90643310546875, -2.7410888671875, -2.57574462890625, -2.410400390625, -2.24505615234375, -2.0797119140625, -1.91436767578125, -1.7490234375, -1.58367919921875, -1.4183349609375, -1.25299072265625, -1.087646484375, -0.92230224609375, -0.7569580078125, -0.59161376953125, -0.42626953125, -0.26092529296875, -0.0955810546875, 0.06976318359375, 0.235107421875, 0.40045166015625, 0.5657958984375, 0.73114013671875, 0.896484375, 1.06182861328125, 1.2271728515625, 1.39251708984375, 1.557861328125, 1.72320556640625, 1.8885498046875, 2.05389404296875, 2.21923828125, 2.38458251953125, 2.5499267578125, 2.71527099609375, 2.880615234375, 3.04595947265625, 3.2113037109375, 3.37664794921875, 3.5419921875, 3.70733642578125, 3.8726806640625, 4.03802490234375, 4.203369140625, 4.36871337890625, 4.5340576171875, 4.69940185546875, 4.86474609375, 5.03009033203125, 5.1954345703125, 5.36077880859375, 5.526123046875, 5.69146728515625, 5.8568115234375, 6.02215576171875, 6.1875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 10.0, 20.0, 84.0, 518.0, 298.0, 49.0, 11.0, 10.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-295.17803955078125, -286.9461364746094, -278.7142028808594, -270.4822998046875, -262.2503662109375, -254.01844787597656, -245.78652954101562, -237.55462646484375, -229.32269287109375, -221.0907745361328, -212.85885620117188, -204.62693786621094, -196.39501953125, -188.16310119628906, -179.93118286132812, -171.69927978515625, -163.4673614501953, -155.23544311523438, -147.00352478027344, -138.7716064453125, -130.53968811035156, -122.30776977539062, -114.07585906982422, -105.84394073486328, -97.61202239990234, -89.3801040649414, -81.14818572998047, -72.91627502441406, -64.68435668945312, -56.45243453979492, -48.22052001953125, -39.98860168457031, -31.756698608398438, -23.5247802734375, -15.292863845825195, -7.060947418212891, 1.1709709167480469, 9.402889251708984, 17.634803771972656, 25.866722106933594, 34.09864044189453, 42.33055877685547, 50.562477111816406, 58.79439163208008, 67.02630615234375, 75.25822448730469, 83.49014282226562, 91.72206115722656, 99.9539794921875, 108.18589782714844, 116.41781616210938, 124.64973449707031, 132.88165283203125, 141.1135711669922, 149.34548950195312, 157.577392578125, 165.809326171875, 174.04124450683594, 182.27316284179688, 190.5050811767578, 198.73699951171875, 206.9689178466797, 215.20083618164062, 223.4327392578125, 231.66465759277344]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 6.0, 3.0, 4.0, 4.0, 5.0, 2.0, 5.0, 9.0, 13.0, 9.0, 22.0, 27.0, 55.0, 66.0, 85.0, 129.0, 133.0, 111.0, 98.0, 62.0, 47.0, 25.0, 22.0, 7.0, 12.0, 6.0, 6.0, 5.0, 4.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-128.66307067871094, -124.70231628417969, -120.74156188964844, -116.78080749511719, -112.82006072998047, -108.85930633544922, -104.89855194091797, -100.93779754638672, -96.97705078125, -93.01629638671875, -89.0555419921875, -85.09478759765625, -81.13404083251953, -77.17328643798828, -73.21253204345703, -69.25177764892578, -65.29102325439453, -61.33026885986328, -57.3695182800293, -53.40876388549805, -49.44801330566406, -45.48725891113281, -41.52650451660156, -37.56575012207031, -33.60499954223633, -29.64424705505371, -25.683494567871094, -21.722740173339844, -17.761987686157227, -13.80123519897461, -9.84048080444336, -5.879728317260742, -1.918975830078125, 2.0417771339416504, 6.002530097961426, 9.96328353881836, 13.924036026000977, 17.884788513183594, 21.845542907714844, 25.80629539489746, 29.767047882080078, 33.72780227661133, 37.68855285644531, 41.64930725097656, 45.61006164550781, 49.5708122253418, 53.53156661987305, 57.49231719970703, 61.45307159423828, 65.41382598876953, 69.37458038330078, 73.3353271484375, 77.29608154296875, 81.2568359375, 85.21759033203125, 89.1783447265625, 93.13909912109375, 97.099853515625, 101.06060791015625, 105.0213623046875, 108.98210906982422, 112.94286346435547, 116.90361785888672, 120.86437225341797, 124.82511901855469]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 8.0, 7.0, 15.0, 17.0, 27.0, 40.0, 52.0, 99.0, 247.0, 551.0, 1181.0, 3166.0, 10961.0, 78101.0, 3971843.0, 111784.0, 11549.0, 2906.0, 993.0, 354.0, 184.0, 83.0, 45.0, 15.0, 12.0, 13.0, 6.0, 3.0, 5.0, 0.0, 2.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.15625, -53.6875, -52.21875, -50.75, -49.28125, -47.8125, -46.34375, -44.875, -43.40625, -41.9375, -40.46875, -39.0, -37.53125, -36.0625, -34.59375, -33.125, -31.65625, -30.1875, -28.71875, -27.25, -25.78125, -24.3125, -22.84375, -21.375, -19.90625, -18.4375, -16.96875, -15.5, -14.03125, -12.5625, -11.09375, -9.625, -8.15625, -6.6875, -5.21875, -3.75, -2.28125, -0.8125, 0.65625, 2.125, 3.59375, 5.0625, 6.53125, 8.0, 9.46875, 10.9375, 12.40625, 13.875, 15.34375, 16.8125, 18.28125, 19.75, 21.21875, 22.6875, 24.15625, 25.625, 27.09375, 28.5625, 30.03125, 31.5, 32.96875, 34.4375, 35.90625, 37.375, 38.84375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 5.0, 3.0, 4.0, 3.0, 7.0, 7.0, 9.0, 7.0, 8.0, 15.0, 32.0, 48.0, 54.0, 83.0, 123.0, 135.0, 114.0, 103.0, 67.0, 59.0, 27.0, 15.0, 17.0, 10.0, 7.0, 7.0, 10.0, 4.0, 6.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.412109375, -2.347686767578125, -2.28326416015625, -2.218841552734375, -2.1544189453125, -2.089996337890625, -2.02557373046875, -1.961151123046875, -1.896728515625, -1.832305908203125, -1.76788330078125, -1.703460693359375, -1.6390380859375, -1.574615478515625, -1.51019287109375, -1.445770263671875, -1.38134765625, -1.316925048828125, -1.25250244140625, -1.188079833984375, -1.1236572265625, -1.059234619140625, -0.99481201171875, -0.930389404296875, -0.865966796875, -0.801544189453125, -0.73712158203125, -0.672698974609375, -0.6082763671875, -0.543853759765625, -0.47943115234375, -0.415008544921875, -0.3505859375, -0.286163330078125, -0.22174072265625, -0.157318115234375, -0.0928955078125, -0.028472900390625, 0.03594970703125, 0.100372314453125, 0.164794921875, 0.229217529296875, 0.29364013671875, 0.358062744140625, 0.4224853515625, 0.486907958984375, 0.55133056640625, 0.615753173828125, 0.68017578125, 0.744598388671875, 0.80902099609375, 0.873443603515625, 0.9378662109375, 1.002288818359375, 1.06671142578125, 1.131134033203125, 1.195556640625, 1.259979248046875, 1.32440185546875, 1.388824462890625, 1.4532470703125, 1.517669677734375, 1.58209228515625, 1.646514892578125, 1.7109375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 10.0, 5.0, 7.0, 14.0, 21.0, 39.0, 46.0, 92.0, 147.0, 299.0, 560.0, 1151.0, 2689.0, 7132.0, 25024.0, 130501.0, 2371462.0, 1508711.0, 112021.0, 22554.0, 6824.0, 2618.0, 1126.0, 535.0, 298.0, 164.0, 84.0, 48.0, 33.0, 11.0, 21.0, 6.0, 8.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.53125, -17.868408203125, -17.20556640625, -16.542724609375, -15.8798828125, -15.217041015625, -14.55419921875, -13.891357421875, -13.228515625, -12.565673828125, -11.90283203125, -11.239990234375, -10.5771484375, -9.914306640625, -9.25146484375, -8.588623046875, -7.92578125, -7.262939453125, -6.60009765625, -5.937255859375, -5.2744140625, -4.611572265625, -3.94873046875, -3.285888671875, -2.623046875, -1.960205078125, -1.29736328125, -0.634521484375, 0.0283203125, 0.691162109375, 1.35400390625, 2.016845703125, 2.6796875, 3.342529296875, 4.00537109375, 4.668212890625, 5.3310546875, 5.993896484375, 6.65673828125, 7.319580078125, 7.982421875, 8.645263671875, 9.30810546875, 9.970947265625, 10.6337890625, 11.296630859375, 11.95947265625, 12.622314453125, 13.28515625, 13.947998046875, 14.61083984375, 15.273681640625, 15.9365234375, 16.599365234375, 17.26220703125, 17.925048828125, 18.587890625, 19.250732421875, 19.91357421875, 20.576416015625, 21.2392578125, 21.902099609375, 22.56494140625, 23.227783203125, 23.890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 10.0, 18.0, 16.0, 26.0, 43.0, 63.0, 112.0, 159.0, 310.0, 539.0, 1380.0, 594.0, 274.0, 180.0, 94.0, 70.0, 51.0, 30.0, 20.0, 15.0, 20.0, 7.0, 8.0, 6.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.126953125, -3.0208740234375, -2.914794921875, -2.8087158203125, -2.70263671875, -2.5965576171875, -2.490478515625, -2.3843994140625, -2.2783203125, -2.1722412109375, -2.066162109375, -1.9600830078125, -1.85400390625, -1.7479248046875, -1.641845703125, -1.5357666015625, -1.4296875, -1.3236083984375, -1.217529296875, -1.1114501953125, -1.00537109375, -0.8992919921875, -0.793212890625, -0.6871337890625, -0.5810546875, -0.4749755859375, -0.368896484375, -0.2628173828125, -0.15673828125, -0.0506591796875, 0.055419921875, 0.1614990234375, 0.267578125, 0.3736572265625, 0.479736328125, 0.5858154296875, 0.69189453125, 0.7979736328125, 0.904052734375, 1.0101318359375, 1.1162109375, 1.2222900390625, 1.328369140625, 1.4344482421875, 1.54052734375, 1.6466064453125, 1.752685546875, 1.8587646484375, 1.96484375, 2.0709228515625, 2.177001953125, 2.2830810546875, 2.38916015625, 2.4952392578125, 2.601318359375, 2.7073974609375, 2.8134765625, 2.9195556640625, 3.025634765625, 3.1317138671875, 3.23779296875, 3.3438720703125, 3.449951171875, 3.5560302734375, 3.662109375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 9.0, 11.0, 28.0, 70.0, 164.0, 259.0, 257.0, 122.0, 46.0, 18.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.38623046875, -34.19475173950195, -33.00327682495117, -31.811798095703125, -30.62032127380371, -29.428844451904297, -28.23736572265625, -27.045888900756836, -25.854412078857422, -24.662935256958008, -23.471458435058594, -22.279979705810547, -21.088502883911133, -19.89702606201172, -18.705547332763672, -17.514070510864258, -16.322593688964844, -15.13111686706543, -13.9396390914917, -12.748161315917969, -11.556684494018555, -10.36520767211914, -9.17372989654541, -7.98225212097168, -6.790775299072266, -5.599298000335693, -4.407820701599121, -3.216343402862549, -2.0248661041259766, -0.8333888053894043, 0.35808849334716797, 1.5495662689208984, 2.741039276123047, 3.932516574859619, 5.123993873596191, 6.315471172332764, 7.506948471069336, 8.69842529296875, 9.88990306854248, 11.081380844116211, 12.272857666015625, 13.464334487915039, 14.65581226348877, 15.8472900390625, 17.038766860961914, 18.230243682861328, 19.421722412109375, 20.61319923400879, 21.804676055908203, 22.996152877807617, 24.18762969970703, 25.379108428955078, 26.570585250854492, 27.762062072753906, 28.953540802001953, 30.145017623901367, 31.33649444580078, 32.52797317504883, 33.71944808959961, 34.910926818847656, 36.10240173339844, 37.293880462646484, 38.48535919189453, 39.67683410644531, 40.86831283569336]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 6.0, 4.0, 11.0, 22.0, 22.0, 35.0, 64.0, 43.0, 70.0, 70.0, 92.0, 69.0, 89.0, 88.0, 58.0, 56.0, 45.0, 40.0, 31.0, 24.0, 15.0, 7.0, 5.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-21.577701568603516, -20.988906860351562, -20.400110244750977, -19.81131362915039, -19.222518920898438, -18.633724212646484, -18.0449275970459, -17.456130981445312, -16.86733627319336, -16.278541564941406, -15.68974494934082, -15.10094928741455, -14.512153625488281, -13.923357963562012, -13.334562301635742, -12.745766639709473, -12.156970977783203, -11.568175315856934, -10.979379653930664, -10.390583992004395, -9.801788330078125, -9.212992668151855, -8.624197006225586, -8.035401344299316, -7.446605682373047, -6.857810020446777, -6.269014358520508, -5.680218696594238, -5.091423034667969, -4.502627372741699, -3.9138317108154297, -3.32503604888916, -2.736238479614258, -2.1474428176879883, -1.5586471557617188, -0.9698514938354492, -0.3810558319091797, 0.20773983001708984, 0.7965354919433594, 1.385331153869629, 1.9741268157958984, 2.562922477722168, 3.1517181396484375, 3.740513801574707, 4.329309463500977, 4.918105125427246, 5.506900787353516, 6.095696449279785, 6.684492111206055, 7.273287773132324, 7.862083435058594, 8.450879096984863, 9.039674758911133, 9.628470420837402, 10.217266082763672, 10.806061744689941, 11.394857406616211, 11.98365306854248, 12.57244873046875, 13.16124439239502, 13.750040054321289, 14.338835716247559, 14.927631378173828, 15.516427040100098, 16.105222702026367]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 9.0, 9.0, 5.0, 11.0, 16.0, 29.0, 44.0, 81.0, 146.0, 194.0, 387.0, 659.0, 1400.0, 3454.0, 9922.0, 40703.0, 393430.0, 528203.0, 51022.0, 11532.0, 3912.0, 1495.0, 753.0, 408.0, 221.0, 175.0, 106.0, 73.0, 55.0, 29.0, 19.0, 18.0, 10.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-21.578125, -20.925537109375, -20.27294921875, -19.620361328125, -18.9677734375, -18.315185546875, -17.66259765625, -17.010009765625, -16.357421875, -15.704833984375, -15.05224609375, -14.399658203125, -13.7470703125, -13.094482421875, -12.44189453125, -11.789306640625, -11.13671875, -10.484130859375, -9.83154296875, -9.178955078125, -8.5263671875, -7.873779296875, -7.22119140625, -6.568603515625, -5.916015625, -5.263427734375, -4.61083984375, -3.958251953125, -3.3056640625, -2.653076171875, -2.00048828125, -1.347900390625, -0.6953125, -0.042724609375, 0.60986328125, 1.262451171875, 1.9150390625, 2.567626953125, 3.22021484375, 3.872802734375, 4.525390625, 5.177978515625, 5.83056640625, 6.483154296875, 7.1357421875, 7.788330078125, 8.44091796875, 9.093505859375, 9.74609375, 10.398681640625, 11.05126953125, 11.703857421875, 12.3564453125, 13.009033203125, 13.66162109375, 14.314208984375, 14.966796875, 15.619384765625, 16.27197265625, 16.924560546875, 17.5771484375, 18.229736328125, 18.88232421875, 19.534912109375, 20.1875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 8.0, 5.0, 6.0, 6.0, 1.0, 11.0, 20.0, 25.0, 31.0, 42.0, 78.0, 96.0, 109.0, 149.0, 105.0, 89.0, 65.0, 46.0, 29.0, 15.0, 16.0, 11.0, 9.0, 7.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.86328125, -2.79840087890625, -2.7335205078125, -2.66864013671875, -2.603759765625, -2.53887939453125, -2.4739990234375, -2.40911865234375, -2.34423828125, -2.27935791015625, -2.2144775390625, -2.14959716796875, -2.084716796875, -2.01983642578125, -1.9549560546875, -1.89007568359375, -1.8251953125, -1.76031494140625, -1.6954345703125, -1.63055419921875, -1.565673828125, -1.50079345703125, -1.4359130859375, -1.37103271484375, -1.30615234375, -1.24127197265625, -1.1763916015625, -1.11151123046875, -1.046630859375, -0.98175048828125, -0.9168701171875, -0.85198974609375, -0.787109375, -0.72222900390625, -0.6573486328125, -0.59246826171875, -0.527587890625, -0.46270751953125, -0.3978271484375, -0.33294677734375, -0.26806640625, -0.20318603515625, -0.1383056640625, -0.07342529296875, -0.008544921875, 0.05633544921875, 0.1212158203125, 0.18609619140625, 0.2509765625, 0.31585693359375, 0.3807373046875, 0.44561767578125, 0.510498046875, 0.57537841796875, 0.6402587890625, 0.70513916015625, 0.77001953125, 0.83489990234375, 0.8997802734375, 0.96466064453125, 1.029541015625, 1.09442138671875, 1.1593017578125, 1.22418212890625, 1.2890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 4.0, 8.0, 11.0, 10.0, 17.0, 29.0, 36.0, 74.0, 88.0, 145.0, 242.0, 403.0, 691.0, 1445.0, 2993.0, 6926.0, 17842.0, 54122.0, 208733.0, 504358.0, 174221.0, 47506.0, 16354.0, 6302.0, 2787.0, 1408.0, 752.0, 383.0, 245.0, 134.0, 84.0, 65.0, 28.0, 23.0, 19.0, 25.0, 11.0, 6.0, 8.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.40625, -9.09716796875, -8.7880859375, -8.47900390625, -8.169921875, -7.86083984375, -7.5517578125, -7.24267578125, -6.93359375, -6.62451171875, -6.3154296875, -6.00634765625, -5.697265625, -5.38818359375, -5.0791015625, -4.77001953125, -4.4609375, -4.15185546875, -3.8427734375, -3.53369140625, -3.224609375, -2.91552734375, -2.6064453125, -2.29736328125, -1.98828125, -1.67919921875, -1.3701171875, -1.06103515625, -0.751953125, -0.44287109375, -0.1337890625, 0.17529296875, 0.484375, 0.79345703125, 1.1025390625, 1.41162109375, 1.720703125, 2.02978515625, 2.3388671875, 2.64794921875, 2.95703125, 3.26611328125, 3.5751953125, 3.88427734375, 4.193359375, 4.50244140625, 4.8115234375, 5.12060546875, 5.4296875, 5.73876953125, 6.0478515625, 6.35693359375, 6.666015625, 6.97509765625, 7.2841796875, 7.59326171875, 7.90234375, 8.21142578125, 8.5205078125, 8.82958984375, 9.138671875, 9.44775390625, 9.7568359375, 10.06591796875, 10.375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 9.0, 12.0, 14.0, 20.0, 16.0, 42.0, 26.0, 47.0, 60.0, 67.0, 59.0, 57.0, 59.0, 64.0, 69.0, 47.0, 56.0, 63.0, 52.0, 41.0, 17.0, 31.0, 23.0, 5.0, 9.0, 10.0, 5.0, 4.0, 7.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.78125, -8.486083984375, -8.19091796875, -7.895751953125, -7.6005859375, -7.305419921875, -7.01025390625, -6.715087890625, -6.419921875, -6.124755859375, -5.82958984375, -5.534423828125, -5.2392578125, -4.944091796875, -4.64892578125, -4.353759765625, -4.05859375, -3.763427734375, -3.46826171875, -3.173095703125, -2.8779296875, -2.582763671875, -2.28759765625, -1.992431640625, -1.697265625, -1.402099609375, -1.10693359375, -0.811767578125, -0.5166015625, -0.221435546875, 0.07373046875, 0.368896484375, 0.6640625, 0.959228515625, 1.25439453125, 1.549560546875, 1.8447265625, 2.139892578125, 2.43505859375, 2.730224609375, 3.025390625, 3.320556640625, 3.61572265625, 3.910888671875, 4.2060546875, 4.501220703125, 4.79638671875, 5.091552734375, 5.38671875, 5.681884765625, 5.97705078125, 6.272216796875, 6.5673828125, 6.862548828125, 7.15771484375, 7.452880859375, 7.748046875, 8.043212890625, 8.33837890625, 8.633544921875, 8.9287109375, 9.223876953125, 9.51904296875, 9.814208984375, 10.109375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 10.0, 16.0, 13.0, 23.0, 65.0, 107.0, 267.0, 942.0, 5141.0, 91816.0, 910216.0, 35800.0, 3027.0, 696.0, 236.0, 78.0, 44.0, 26.0, 13.0, 12.0, 4.0, 7.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.09375, -48.75341796875, -47.4130859375, -46.07275390625, -44.732421875, -43.39208984375, -42.0517578125, -40.71142578125, -39.37109375, -38.03076171875, -36.6904296875, -35.35009765625, -34.009765625, -32.66943359375, -31.3291015625, -29.98876953125, -28.6484375, -27.30810546875, -25.9677734375, -24.62744140625, -23.287109375, -21.94677734375, -20.6064453125, -19.26611328125, -17.92578125, -16.58544921875, -15.2451171875, -13.90478515625, -12.564453125, -11.22412109375, -9.8837890625, -8.54345703125, -7.203125, -5.86279296875, -4.5224609375, -3.18212890625, -1.841796875, -0.50146484375, 0.8388671875, 2.17919921875, 3.51953125, 4.85986328125, 6.2001953125, 7.54052734375, 8.880859375, 10.22119140625, 11.5615234375, 12.90185546875, 14.2421875, 15.58251953125, 16.9228515625, 18.26318359375, 19.603515625, 20.94384765625, 22.2841796875, 23.62451171875, 24.96484375, 26.30517578125, 27.6455078125, 28.98583984375, 30.326171875, 31.66650390625, 33.0068359375, 34.34716796875, 35.6875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 10.0, 7.0, 23.0, 45.0, 85.0, 104.0, 143.0, 162.0, 144.0, 81.0, 58.0, 35.0, 27.0, 11.0, 14.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0013637542724609375, -0.001328207552433014, -0.0012926608324050903, -0.0012571141123771667, -0.0012215673923492432, -0.0011860206723213196, -0.001150473952293396, -0.0011149272322654724, -0.0010793805122375488, -0.0010438337922096252, -0.0010082870721817017, -0.0009727403521537781, -0.0009371936321258545, -0.0009016469120979309, -0.0008661001920700073, -0.0008305534720420837, -0.0007950067520141602, -0.0007594600319862366, -0.000723913311958313, -0.0006883665919303894, -0.0006528198719024658, -0.0006172731518745422, -0.0005817264318466187, -0.0005461797118186951, -0.0005106329917907715, -0.0004750862717628479, -0.0004395395517349243, -0.00040399283170700073, -0.00036844611167907715, -0.00033289939165115356, -0.00029735267162323, -0.0002618059515953064, -0.0002262592315673828, -0.00019071251153945923, -0.00015516579151153564, -0.00011961907148361206, -8.407235145568848e-05, -4.852563142776489e-05, -1.2978911399841309e-05, 2.2567808628082275e-05, 5.811452865600586e-05, 9.366124868392944e-05, 0.00012920796871185303, 0.0001647546887397766, 0.0002003014087677002, 0.00023584812879562378, 0.00027139484882354736, 0.00030694156885147095, 0.00034248828887939453, 0.0003780350089073181, 0.0004135817289352417, 0.0004491284489631653, 0.00048467516899108887, 0.0005202218890190125, 0.000555768609046936, 0.0005913153290748596, 0.0006268620491027832, 0.0006624087691307068, 0.0006979554891586304, 0.000733502209186554, 0.0007690489292144775, 0.0008045956492424011, 0.0008401423692703247, 0.0008756890892982483, 0.0009112358093261719]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 7.0, 4.0, 8.0, 16.0, 24.0, 30.0, 63.0, 104.0, 166.0, 335.0, 885.0, 2468.0, 9451.0, 54211.0, 511893.0, 414725.0, 42821.0, 7759.0, 2204.0, 741.0, 294.0, 150.0, 83.0, 44.0, 31.0, 11.0, 9.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.796875, -20.078369140625, -19.35986328125, -18.641357421875, -17.9228515625, -17.204345703125, -16.48583984375, -15.767333984375, -15.048828125, -14.330322265625, -13.61181640625, -12.893310546875, -12.1748046875, -11.456298828125, -10.73779296875, -10.019287109375, -9.30078125, -8.582275390625, -7.86376953125, -7.145263671875, -6.4267578125, -5.708251953125, -4.98974609375, -4.271240234375, -3.552734375, -2.834228515625, -2.11572265625, -1.397216796875, -0.6787109375, 0.039794921875, 0.75830078125, 1.476806640625, 2.1953125, 2.913818359375, 3.63232421875, 4.350830078125, 5.0693359375, 5.787841796875, 6.50634765625, 7.224853515625, 7.943359375, 8.661865234375, 9.38037109375, 10.098876953125, 10.8173828125, 11.535888671875, 12.25439453125, 12.972900390625, 13.69140625, 14.409912109375, 15.12841796875, 15.846923828125, 16.5654296875, 17.283935546875, 18.00244140625, 18.720947265625, 19.439453125, 20.157958984375, 20.87646484375, 21.594970703125, 22.3134765625, 23.031982421875, 23.75048828125, 24.468994140625, 25.1875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 8.0, 17.0, 32.0, 28.0, 47.0, 63.0, 70.0, 109.0, 151.0, 126.0, 107.0, 71.0, 46.0, 37.0, 24.0, 15.0, 14.0, 7.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.7166748046875, -17.292724609375, -16.8687744140625, -16.44482421875, -16.0208740234375, -15.596923828125, -15.1729736328125, -14.7490234375, -14.3250732421875, -13.901123046875, -13.4771728515625, -13.05322265625, -12.6292724609375, -12.205322265625, -11.7813720703125, -11.357421875, -10.9334716796875, -10.509521484375, -10.0855712890625, -9.66162109375, -9.2376708984375, -8.813720703125, -8.3897705078125, -7.9658203125, -7.5418701171875, -7.117919921875, -6.6939697265625, -6.27001953125, -5.8460693359375, -5.422119140625, -4.9981689453125, -4.57421875, -4.1502685546875, -3.726318359375, -3.3023681640625, -2.87841796875, -2.4544677734375, -2.030517578125, -1.6065673828125, -1.1826171875, -0.7586669921875, -0.334716796875, 0.0892333984375, 0.51318359375, 0.9371337890625, 1.361083984375, 1.7850341796875, 2.208984375, 2.6329345703125, 3.056884765625, 3.4808349609375, 3.90478515625, 4.3287353515625, 4.752685546875, 5.1766357421875, 5.6005859375, 6.0245361328125, 6.448486328125, 6.8724365234375, 7.29638671875, 7.7203369140625, 8.144287109375, 8.5682373046875, 8.9921875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 15.0, 35.0, 100.0, 225.0, 281.0, 179.0, 85.0, 39.0, 13.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-131.6260528564453, -127.67518615722656, -123.72432708740234, -119.7734603881836, -115.82260131835938, -111.87173461914062, -107.92086791992188, -103.97000885009766, -100.0191421508789, -96.06827545166016, -92.11741638183594, -88.16654968261719, -84.21569061279297, -80.26482391357422, -76.31396484375, -72.36309814453125, -68.4122314453125, -64.46136474609375, -60.51050567626953, -56.55963897705078, -52.6087760925293, -48.65791320800781, -44.70705032348633, -40.756187438964844, -36.805328369140625, -32.85446548461914, -28.903600692749023, -24.95273780822754, -21.001873016357422, -17.051010131835938, -13.100147247314453, -9.149282455444336, -5.198417663574219, -1.247554063796997, 2.7033095359802246, 6.654172897338867, 10.605036735534668, 14.555900573730469, 18.506763458251953, 22.45762825012207, 26.408491134643555, 30.35935401916504, 34.310218811035156, 38.26108169555664, 42.211944580078125, 46.162811279296875, 50.113670349121094, 54.064537048339844, 58.01539993286133, 61.96626281738281, 65.91712951660156, 69.86798858642578, 73.81885528564453, 77.76971435546875, 81.7205810546875, 85.67144775390625, 89.62230682373047, 93.57317352294922, 97.52403259277344, 101.47489929199219, 105.4257583618164, 109.37662506103516, 113.32748413085938, 117.27835083007812, 121.22921752929688]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 6.0, 4.0, 2.0, 5.0, 7.0, 7.0, 13.0, 20.0, 19.0, 31.0, 36.0, 62.0, 56.0, 60.0, 76.0, 78.0, 78.0, 86.0, 86.0, 80.0, 42.0, 36.0, 19.0, 22.0, 21.0, 13.0, 14.0, 5.0, 5.0, 4.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-76.03410339355469, -73.37730407714844, -70.72050476074219, -68.0636978149414, -65.40689849853516, -62.750099182128906, -60.093299865722656, -57.43649673461914, -54.779693603515625, -52.122894287109375, -49.46609115600586, -46.80929183959961, -44.152488708496094, -41.495689392089844, -38.838890075683594, -36.18208694458008, -33.52528762817383, -30.868486404418945, -28.211685180664062, -25.554885864257812, -22.898082733154297, -20.241283416748047, -17.584482192993164, -14.927680969238281, -12.270879745483398, -9.614078521728516, -6.957277774810791, -4.300477027893066, -1.6436758041381836, 1.0131254196166992, 3.6699256896972656, 6.326726913452148, 8.983528137207031, 11.640329360961914, 14.297130584716797, 16.953929901123047, 19.610733032226562, 22.267532348632812, 24.924333572387695, 27.581134796142578, 30.23793601989746, 32.894737243652344, 35.551536560058594, 38.20833969116211, 40.86513900756836, 43.521942138671875, 46.178741455078125, 48.835540771484375, 51.49234390258789, 54.14914321899414, 56.805946350097656, 59.462745666503906, 62.11954879760742, 64.77635192871094, 67.43315124511719, 70.08995056152344, 72.74674987792969, 75.40354919433594, 78.06034851074219, 80.71715545654297, 83.37395477294922, 86.03075408935547, 88.68755340576172, 91.3443603515625, 94.00115966796875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 8.0, 12.0, 14.0, 15.0, 9.0, 17.0, 19.0, 24.0, 29.0, 34.0, 58.0, 50.0, 65.0, 81.0, 108.0, 148.0, 198.0, 268.0, 402.0, 622.0, 1022.0, 1667.0, 3230.0, 6808.0, 17930.0, 68856.0, 824590.0, 3109400.0, 119175.0, 24694.0, 7918.0, 3383.0, 1620.0, 794.0, 414.0, 232.0, 138.0, 87.0, 53.0, 35.0, 19.0, 9.0, 3.0, 6.0, 3.0, 2.0, 1.0], "bins": [-41.34375, -40.406982421875, -39.47021484375, -38.533447265625, -37.5966796875, -36.659912109375, -35.72314453125, -34.786376953125, -33.849609375, -32.912841796875, -31.97607421875, -31.039306640625, -30.1025390625, -29.165771484375, -28.22900390625, -27.292236328125, -26.35546875, -25.418701171875, -24.48193359375, -23.545166015625, -22.6083984375, -21.671630859375, -20.73486328125, -19.798095703125, -18.861328125, -17.924560546875, -16.98779296875, -16.051025390625, -15.1142578125, -14.177490234375, -13.24072265625, -12.303955078125, -11.3671875, -10.430419921875, -9.49365234375, -8.556884765625, -7.6201171875, -6.683349609375, -5.74658203125, -4.809814453125, -3.873046875, -2.936279296875, -1.99951171875, -1.062744140625, -0.1259765625, 0.810791015625, 1.74755859375, 2.684326171875, 3.62109375, 4.557861328125, 5.49462890625, 6.431396484375, 7.3681640625, 8.304931640625, 9.24169921875, 10.178466796875, 11.115234375, 12.052001953125, 12.98876953125, 13.925537109375, 14.8623046875, 15.799072265625, 16.73583984375, 17.672607421875, 18.609375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 9.0, 7.0, 14.0, 18.0, 9.0, 39.0, 40.0, 53.0, 74.0, 96.0, 116.0, 97.0, 91.0, 72.0, 80.0, 51.0, 28.0, 33.0, 13.0, 23.0, 9.0, 8.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.76953125, -2.7081451416015625, -2.646759033203125, -2.5853729248046875, -2.52398681640625, -2.4626007080078125, -2.401214599609375, -2.3398284912109375, -2.2784423828125, -2.2170562744140625, -2.155670166015625, -2.0942840576171875, -2.03289794921875, -1.9715118408203125, -1.910125732421875, -1.8487396240234375, -1.787353515625, -1.7259674072265625, -1.664581298828125, -1.6031951904296875, -1.54180908203125, -1.4804229736328125, -1.419036865234375, -1.3576507568359375, -1.2962646484375, -1.2348785400390625, -1.173492431640625, -1.1121063232421875, -1.05072021484375, -0.9893341064453125, -0.927947998046875, -0.8665618896484375, -0.80517578125, -0.7437896728515625, -0.682403564453125, -0.6210174560546875, -0.55963134765625, -0.4982452392578125, -0.436859130859375, -0.3754730224609375, -0.3140869140625, -0.2527008056640625, -0.191314697265625, -0.1299285888671875, -0.06854248046875, -0.0071563720703125, 0.054229736328125, 0.1156158447265625, 0.177001953125, 0.2383880615234375, 0.299774169921875, 0.3611602783203125, 0.42254638671875, 0.4839324951171875, 0.545318603515625, 0.6067047119140625, 0.6680908203125, 0.7294769287109375, 0.790863037109375, 0.8522491455078125, 0.91363525390625, 0.9750213623046875, 1.036407470703125, 1.0977935791015625, 1.1591796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 0.0, 2.0, 7.0, 6.0, 6.0, 6.0, 8.0, 19.0, 11.0, 30.0, 37.0, 55.0, 62.0, 103.0, 193.0, 493.0, 1899.0, 11675.0, 348297.0, 3767097.0, 57874.0, 4699.0, 936.0, 301.0, 143.0, 80.0, 61.0, 44.0, 41.0, 27.0, 11.0, 15.0, 15.0, 6.0, 9.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.0, -47.267578125, -45.53515625, -43.802734375, -42.0703125, -40.337890625, -38.60546875, -36.873046875, -35.140625, -33.408203125, -31.67578125, -29.943359375, -28.2109375, -26.478515625, -24.74609375, -23.013671875, -21.28125, -19.548828125, -17.81640625, -16.083984375, -14.3515625, -12.619140625, -10.88671875, -9.154296875, -7.421875, -5.689453125, -3.95703125, -2.224609375, -0.4921875, 1.240234375, 2.97265625, 4.705078125, 6.4375, 8.169921875, 9.90234375, 11.634765625, 13.3671875, 15.099609375, 16.83203125, 18.564453125, 20.296875, 22.029296875, 23.76171875, 25.494140625, 27.2265625, 28.958984375, 30.69140625, 32.423828125, 34.15625, 35.888671875, 37.62109375, 39.353515625, 41.0859375, 42.818359375, 44.55078125, 46.283203125, 48.015625, 49.748046875, 51.48046875, 53.212890625, 54.9453125, 56.677734375, 58.41015625, 60.142578125, 61.875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 0.0, 5.0, 3.0, 6.0, 8.0, 10.0, 3.0, 12.0, 23.0, 30.0, 42.0, 42.0, 62.0, 81.0, 116.0, 169.0, 236.0, 382.0, 775.0, 806.0, 391.0, 262.0, 180.0, 140.0, 75.0, 59.0, 33.0, 29.0, 27.0, 18.0, 13.0, 6.0, 9.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.23828125, -3.13714599609375, -3.0360107421875, -2.93487548828125, -2.833740234375, -2.73260498046875, -2.6314697265625, -2.53033447265625, -2.42919921875, -2.32806396484375, -2.2269287109375, -2.12579345703125, -2.024658203125, -1.92352294921875, -1.8223876953125, -1.72125244140625, -1.6201171875, -1.51898193359375, -1.4178466796875, -1.31671142578125, -1.215576171875, -1.11444091796875, -1.0133056640625, -0.91217041015625, -0.81103515625, -0.70989990234375, -0.6087646484375, -0.50762939453125, -0.406494140625, -0.30535888671875, -0.2042236328125, -0.10308837890625, -0.001953125, 0.09918212890625, 0.2003173828125, 0.30145263671875, 0.402587890625, 0.50372314453125, 0.6048583984375, 0.70599365234375, 0.80712890625, 0.90826416015625, 1.0093994140625, 1.11053466796875, 1.211669921875, 1.31280517578125, 1.4139404296875, 1.51507568359375, 1.6162109375, 1.71734619140625, 1.8184814453125, 1.91961669921875, 2.020751953125, 2.12188720703125, 2.2230224609375, 2.32415771484375, 2.42529296875, 2.52642822265625, 2.6275634765625, 2.72869873046875, 2.829833984375, 2.93096923828125, 3.0321044921875, 3.13323974609375, 3.234375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 6.0, 1.0, 12.0, 34.0, 43.0, 94.0, 161.0, 186.0, 189.0, 149.0, 78.0, 26.0, 17.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.10785484313965, -21.94831085205078, -20.788766860961914, -19.629222869873047, -18.469680786132812, -17.310136795043945, -16.150592803955078, -14.991049766540527, -13.83150577545166, -12.671961784362793, -11.512418746948242, -10.352874755859375, -9.193330764770508, -8.033787727355957, -6.87424373626709, -5.714700698852539, -4.555156707763672, -3.395613193511963, -2.236069440841675, -1.0765256881713867, 0.08301782608032227, 1.2425613403320312, 2.4021053314208984, 3.561648368835449, 4.721192359924316, 5.880735874176025, 7.040279388427734, 8.199823379516602, 9.359367370605469, 10.51891040802002, 11.678454399108887, 12.837997436523438, 13.997539520263672, 15.157083511352539, 16.316627502441406, 17.47616958618164, 18.635713577270508, 19.795257568359375, 20.954801559448242, 22.11434555053711, 23.273887634277344, 24.43343162536621, 25.592975616455078, 26.752517700195312, 27.91206169128418, 29.071605682373047, 30.231149673461914, 31.39069366455078, 32.55023956298828, 33.709781646728516, 34.869327545166016, 36.02886962890625, 37.18841552734375, 38.347957611083984, 39.50749969482422, 40.66704559326172, 41.82658767700195, 42.98612976074219, 44.14567565917969, 45.30521774291992, 46.46476364135742, 47.624305725097656, 48.783851623535156, 49.94339370727539, 51.102935791015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 9.0, 8.0, 16.0, 20.0, 20.0, 22.0, 39.0, 32.0, 38.0, 47.0, 45.0, 50.0, 52.0, 59.0, 62.0, 51.0, 51.0, 50.0, 58.0, 41.0, 41.0, 36.0, 27.0, 23.0, 22.0, 14.0, 9.0, 11.0, 14.0, 6.0, 4.0, 10.0, 0.0, 6.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.380228042602539, -11.859716415405273, -11.339204788208008, -10.818693161010742, -10.298181533813477, -9.777669906616211, -9.257158279418945, -8.73664665222168, -8.216135025024414, -7.695623397827148, -7.175111770629883, -6.654600143432617, -6.134088516235352, -5.613576889038086, -5.093064785003662, -4.5725531578063965, -4.052041053771973, -3.531529426574707, -3.0110177993774414, -2.4905059337615967, -1.969994306564331, -1.4494826793670654, -0.9289708137512207, -0.4084591865539551, 0.11205244064331055, 0.632564127445221, 1.1530758142471313, 1.6735875606536865, 2.194099187850952, 2.7146108150482178, 3.2351226806640625, 3.755634307861328, 4.276145935058594, 4.796657562255859, 5.317169189453125, 5.837680816650391, 6.358192443847656, 6.878704071044922, 7.399216175079346, 7.919727802276611, 8.440238952636719, 8.960750579833984, 9.48126220703125, 10.001773834228516, 10.522285461425781, 11.042797088623047, 11.563308715820312, 12.083820343017578, 12.60433292388916, 13.124844551086426, 13.645356178283691, 14.165867805480957, 14.686379432678223, 15.206891059875488, 15.72740364074707, 16.247915267944336, 16.7684268951416, 17.288938522338867, 17.809450149536133, 18.3299617767334, 18.850473403930664, 19.37098503112793, 19.891496658325195, 20.41200828552246, 20.932519912719727]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 7.0, 5.0, 9.0, 15.0, 28.0, 26.0, 44.0, 45.0, 49.0, 84.0, 130.0, 214.0, 303.0, 471.0, 912.0, 1815.0, 4298.0, 11933.0, 38116.0, 141802.0, 473137.0, 274610.0, 67828.0, 20019.0, 6905.0, 2762.0, 1193.0, 649.0, 375.0, 237.0, 153.0, 84.0, 73.0, 73.0, 39.0, 27.0, 27.0, 12.0, 12.0, 7.0, 9.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.5, -16.96533203125, -16.4306640625, -15.89599609375, -15.361328125, -14.82666015625, -14.2919921875, -13.75732421875, -13.22265625, -12.68798828125, -12.1533203125, -11.61865234375, -11.083984375, -10.54931640625, -10.0146484375, -9.47998046875, -8.9453125, -8.41064453125, -7.8759765625, -7.34130859375, -6.806640625, -6.27197265625, -5.7373046875, -5.20263671875, -4.66796875, -4.13330078125, -3.5986328125, -3.06396484375, -2.529296875, -1.99462890625, -1.4599609375, -0.92529296875, -0.390625, 0.14404296875, 0.6787109375, 1.21337890625, 1.748046875, 2.28271484375, 2.8173828125, 3.35205078125, 3.88671875, 4.42138671875, 4.9560546875, 5.49072265625, 6.025390625, 6.56005859375, 7.0947265625, 7.62939453125, 8.1640625, 8.69873046875, 9.2333984375, 9.76806640625, 10.302734375, 10.83740234375, 11.3720703125, 11.90673828125, 12.44140625, 12.97607421875, 13.5107421875, 14.04541015625, 14.580078125, 15.11474609375, 15.6494140625, 16.18408203125, 16.71875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 12.0, 24.0, 28.0, 36.0, 43.0, 61.0, 85.0, 111.0, 94.0, 112.0, 89.0, 76.0, 57.0, 50.0, 42.0, 28.0, 12.0, 10.0, 6.0, 3.0, 8.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.8828125, -2.8168792724609375, -2.750946044921875, -2.6850128173828125, -2.61907958984375, -2.5531463623046875, -2.487213134765625, -2.4212799072265625, -2.3553466796875, -2.2894134521484375, -2.223480224609375, -2.1575469970703125, -2.09161376953125, -2.0256805419921875, -1.959747314453125, -1.8938140869140625, -1.827880859375, -1.7619476318359375, -1.696014404296875, -1.6300811767578125, -1.56414794921875, -1.4982147216796875, -1.432281494140625, -1.3663482666015625, -1.3004150390625, -1.2344818115234375, -1.168548583984375, -1.1026153564453125, -1.03668212890625, -0.9707489013671875, -0.904815673828125, -0.8388824462890625, -0.77294921875, -0.7070159912109375, -0.641082763671875, -0.5751495361328125, -0.50921630859375, -0.4432830810546875, -0.377349853515625, -0.3114166259765625, -0.2454833984375, -0.1795501708984375, -0.113616943359375, -0.0476837158203125, 0.01824951171875, 0.0841827392578125, 0.150115966796875, 0.2160491943359375, 0.281982421875, 0.3479156494140625, 0.413848876953125, 0.4797821044921875, 0.54571533203125, 0.6116485595703125, 0.677581787109375, 0.7435150146484375, 0.8094482421875, 0.8753814697265625, 0.941314697265625, 1.0072479248046875, 1.07318115234375, 1.1391143798828125, 1.205047607421875, 1.2709808349609375, 1.3369140625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 10.0, 7.0, 9.0, 10.0, 12.0, 15.0, 14.0, 27.0, 43.0, 48.0, 68.0, 107.0, 135.0, 237.0, 313.0, 600.0, 965.0, 2003.0, 4672.0, 12323.0, 36868.0, 125439.0, 384489.0, 330549.0, 100539.0, 30336.0, 10273.0, 4129.0, 1847.0, 907.0, 522.0, 331.0, 208.0, 122.0, 101.0, 60.0, 54.0, 49.0, 36.0, 27.0, 16.0, 11.0, 8.0, 10.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.875, -14.377685546875, -13.88037109375, -13.383056640625, -12.8857421875, -12.388427734375, -11.89111328125, -11.393798828125, -10.896484375, -10.399169921875, -9.90185546875, -9.404541015625, -8.9072265625, -8.409912109375, -7.91259765625, -7.415283203125, -6.91796875, -6.420654296875, -5.92333984375, -5.426025390625, -4.9287109375, -4.431396484375, -3.93408203125, -3.436767578125, -2.939453125, -2.442138671875, -1.94482421875, -1.447509765625, -0.9501953125, -0.452880859375, 0.04443359375, 0.541748046875, 1.0390625, 1.536376953125, 2.03369140625, 2.531005859375, 3.0283203125, 3.525634765625, 4.02294921875, 4.520263671875, 5.017578125, 5.514892578125, 6.01220703125, 6.509521484375, 7.0068359375, 7.504150390625, 8.00146484375, 8.498779296875, 8.99609375, 9.493408203125, 9.99072265625, 10.488037109375, 10.9853515625, 11.482666015625, 11.97998046875, 12.477294921875, 12.974609375, 13.471923828125, 13.96923828125, 14.466552734375, 14.9638671875, 15.461181640625, 15.95849609375, 16.455810546875, 16.953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 6.0, 2.0, 7.0, 10.0, 13.0, 14.0, 13.0, 16.0, 15.0, 21.0, 29.0, 28.0, 37.0, 38.0, 37.0, 37.0, 35.0, 47.0, 50.0, 55.0, 46.0, 41.0, 43.0, 45.0, 40.0, 44.0, 31.0, 32.0, 28.0, 29.0, 20.0, 11.0, 11.0, 11.0, 8.0, 14.0, 6.0, 6.0, 5.0, 6.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.32421875, -7.06890869140625, -6.8135986328125, -6.55828857421875, -6.302978515625, -6.04766845703125, -5.7923583984375, -5.53704833984375, -5.28173828125, -5.02642822265625, -4.7711181640625, -4.51580810546875, -4.260498046875, -4.00518798828125, -3.7498779296875, -3.49456787109375, -3.2392578125, -2.98394775390625, -2.7286376953125, -2.47332763671875, -2.218017578125, -1.96270751953125, -1.7073974609375, -1.45208740234375, -1.19677734375, -0.94146728515625, -0.6861572265625, -0.43084716796875, -0.175537109375, 0.07977294921875, 0.3350830078125, 0.59039306640625, 0.845703125, 1.10101318359375, 1.3563232421875, 1.61163330078125, 1.866943359375, 2.12225341796875, 2.3775634765625, 2.63287353515625, 2.88818359375, 3.14349365234375, 3.3988037109375, 3.65411376953125, 3.909423828125, 4.16473388671875, 4.4200439453125, 4.67535400390625, 4.9306640625, 5.18597412109375, 5.4412841796875, 5.69659423828125, 5.951904296875, 6.20721435546875, 6.4625244140625, 6.71783447265625, 6.97314453125, 7.22845458984375, 7.4837646484375, 7.73907470703125, 7.994384765625, 8.24969482421875, 8.5050048828125, 8.76031494140625, 9.015625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 9.0, 9.0, 13.0, 36.0, 31.0, 51.0, 79.0, 103.0, 210.0, 448.0, 870.0, 2238.0, 6717.0, 24025.0, 99964.0, 423339.0, 374594.0, 85384.0, 21017.0, 5773.0, 1992.0, 786.0, 350.0, 191.0, 99.0, 68.0, 42.0, 33.0, 31.0, 13.0, 7.0, 11.0, 5.0, 6.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.96875, -17.4688720703125, -16.968994140625, -16.4691162109375, -15.96923828125, -15.4693603515625, -14.969482421875, -14.4696044921875, -13.9697265625, -13.4698486328125, -12.969970703125, -12.4700927734375, -11.97021484375, -11.4703369140625, -10.970458984375, -10.4705810546875, -9.970703125, -9.4708251953125, -8.970947265625, -8.4710693359375, -7.97119140625, -7.4713134765625, -6.971435546875, -6.4715576171875, -5.9716796875, -5.4718017578125, -4.971923828125, -4.4720458984375, -3.97216796875, -3.4722900390625, -2.972412109375, -2.4725341796875, -1.97265625, -1.4727783203125, -0.972900390625, -0.4730224609375, 0.02685546875, 0.5267333984375, 1.026611328125, 1.5264892578125, 2.0263671875, 2.5262451171875, 3.026123046875, 3.5260009765625, 4.02587890625, 4.5257568359375, 5.025634765625, 5.5255126953125, 6.025390625, 6.5252685546875, 7.025146484375, 7.5250244140625, 8.02490234375, 8.5247802734375, 9.024658203125, 9.5245361328125, 10.0244140625, 10.5242919921875, 11.024169921875, 11.5240478515625, 12.02392578125, 12.5238037109375, 13.023681640625, 13.5235595703125, 14.0234375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 12.0, 5.0, 9.0, 8.0, 11.0, 11.0, 10.0, 22.0, 19.0, 36.0, 39.0, 41.0, 46.0, 70.0, 81.0, 112.0, 99.0, 61.0, 67.0, 58.0, 40.0, 25.0, 25.0, 24.0, 15.0, 6.0, 5.0, 5.0, 9.0, 5.0, 3.0, 3.0, 5.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.001453399658203125, -0.0014092177152633667, -0.0013650357723236084, -0.00132085382938385, -0.0012766718864440918, -0.0012324899435043335, -0.0011883080005645752, -0.001144126057624817, -0.0010999441146850586, -0.0010557621717453003, -0.001011580228805542, -0.0009673982858657837, -0.0009232163429260254, -0.0008790343999862671, -0.0008348524570465088, -0.0007906705141067505, -0.0007464885711669922, -0.0007023066282272339, -0.0006581246852874756, -0.0006139427423477173, -0.000569760799407959, -0.0005255788564682007, -0.0004813969135284424, -0.0004372149705886841, -0.0003930330276489258, -0.0003488510847091675, -0.0003046691417694092, -0.0002604871988296509, -0.00021630525588989258, -0.00017212331295013428, -0.00012794137001037598, -8.375942707061768e-05, -3.9577484130859375e-05, 4.604458808898926e-06, 4.8786401748657227e-05, 9.296834468841553e-05, 0.00013715028762817383, 0.00018133223056793213, 0.00022551417350769043, 0.00026969611644744873, 0.00031387805938720703, 0.00035806000232696533, 0.00040224194526672363, 0.00044642388820648193, 0.0004906058311462402, 0.0005347877740859985, 0.0005789697170257568, 0.0006231516599655151, 0.0006673336029052734, 0.0007115155458450317, 0.00075569748878479, 0.0007998794317245483, 0.0008440613746643066, 0.0008882433176040649, 0.0009324252605438232, 0.0009766072034835815, 0.0010207891464233398, 0.0010649710893630981, 0.0011091530323028564, 0.0011533349752426147, 0.001197516918182373, 0.0012416988611221313, 0.0012858808040618896, 0.001330062747001648, 0.0013742446899414062]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 8.0, 6.0, 8.0, 14.0, 24.0, 29.0, 42.0, 74.0, 114.0, 202.0, 402.0, 800.0, 1782.0, 5003.0, 16189.0, 66501.0, 387106.0, 461757.0, 79841.0, 19124.0, 5658.0, 2054.0, 840.0, 424.0, 244.0, 102.0, 76.0, 42.0, 21.0, 25.0, 9.0, 8.0, 5.0, 5.0, 3.0, 3.0, 3.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-21.671875, -21.07080078125, -20.4697265625, -19.86865234375, -19.267578125, -18.66650390625, -18.0654296875, -17.46435546875, -16.86328125, -16.26220703125, -15.6611328125, -15.06005859375, -14.458984375, -13.85791015625, -13.2568359375, -12.65576171875, -12.0546875, -11.45361328125, -10.8525390625, -10.25146484375, -9.650390625, -9.04931640625, -8.4482421875, -7.84716796875, -7.24609375, -6.64501953125, -6.0439453125, -5.44287109375, -4.841796875, -4.24072265625, -3.6396484375, -3.03857421875, -2.4375, -1.83642578125, -1.2353515625, -0.63427734375, -0.033203125, 0.56787109375, 1.1689453125, 1.77001953125, 2.37109375, 2.97216796875, 3.5732421875, 4.17431640625, 4.775390625, 5.37646484375, 5.9775390625, 6.57861328125, 7.1796875, 7.78076171875, 8.3818359375, 8.98291015625, 9.583984375, 10.18505859375, 10.7861328125, 11.38720703125, 11.98828125, 12.58935546875, 13.1904296875, 13.79150390625, 14.392578125, 14.99365234375, 15.5947265625, 16.19580078125, 16.796875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 2.0, 2.0, 1.0, 9.0, 5.0, 8.0, 9.0, 9.0, 28.0, 23.0, 31.0, 36.0, 65.0, 62.0, 86.0, 118.0, 95.0, 97.0, 78.0, 62.0, 31.0, 28.0, 21.0, 20.0, 18.0, 11.0, 9.0, 13.0, 6.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.375, -9.10675048828125, -8.8385009765625, -8.57025146484375, -8.302001953125, -8.03375244140625, -7.7655029296875, -7.49725341796875, -7.22900390625, -6.96075439453125, -6.6925048828125, -6.42425537109375, -6.156005859375, -5.88775634765625, -5.6195068359375, -5.35125732421875, -5.0830078125, -4.81475830078125, -4.5465087890625, -4.27825927734375, -4.010009765625, -3.74176025390625, -3.4735107421875, -3.20526123046875, -2.93701171875, -2.66876220703125, -2.4005126953125, -2.13226318359375, -1.864013671875, -1.59576416015625, -1.3275146484375, -1.05926513671875, -0.791015625, -0.52276611328125, -0.2545166015625, 0.01373291015625, 0.281982421875, 0.55023193359375, 0.8184814453125, 1.08673095703125, 1.35498046875, 1.62322998046875, 1.8914794921875, 2.15972900390625, 2.427978515625, 2.69622802734375, 2.9644775390625, 3.23272705078125, 3.5009765625, 3.76922607421875, 4.0374755859375, 4.30572509765625, 4.573974609375, 4.84222412109375, 5.1104736328125, 5.37872314453125, 5.64697265625, 5.91522216796875, 6.1834716796875, 6.45172119140625, 6.719970703125, 6.98822021484375, 7.2564697265625, 7.52471923828125, 7.79296875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 3.0, 5.0, 16.0, 20.0, 48.0, 76.0, 137.0, 165.0, 204.0, 138.0, 79.0, 36.0, 29.0, 18.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-148.98036193847656, -144.6322479248047, -140.28414916992188, -135.93603515625, -131.58792114257812, -127.23981475830078, -122.89170837402344, -118.54359436035156, -114.19548797607422, -109.84738159179688, -105.499267578125, -101.15116119384766, -96.80305480957031, -92.45494079589844, -88.1068344116211, -83.75872802734375, -79.41061401367188, -75.06250762939453, -70.71439361572266, -66.36628723144531, -62.0181770324707, -57.670066833496094, -53.32196044921875, -48.97385025024414, -44.62574005126953, -40.27762985229492, -35.92951965332031, -31.58141326904297, -27.23330307006836, -22.88519287109375, -18.537084579467773, -14.188976287841797, -9.84088134765625, -5.492772102355957, -1.144662857055664, 3.203446388244629, 7.551555633544922, 11.899665832519531, 16.247774124145508, 20.595882415771484, 24.943992614746094, 29.292102813720703, 33.64021301269531, 37.988319396972656, 42.336429595947266, 46.684539794921875, 51.03264617919922, 55.38075637817383, 59.72886657714844, 64.07697296142578, 68.42508697509766, 72.773193359375, 77.12130737304688, 81.46941375732422, 85.81752014160156, 90.16563415527344, 94.51374053955078, 98.86184692382812, 103.2099609375, 107.55806732177734, 111.90617370605469, 116.25428771972656, 120.6023941040039, 124.95050048828125, 129.29861450195312]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 5.0, 5.0, 7.0, 12.0, 13.0, 17.0, 18.0, 22.0, 30.0, 30.0, 35.0, 52.0, 41.0, 42.0, 50.0, 66.0, 63.0, 58.0, 46.0, 51.0, 49.0, 51.0, 35.0, 30.0, 25.0, 28.0, 26.0, 15.0, 18.0, 16.0, 8.0, 5.0, 9.0, 6.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-76.22288513183594, -73.91661834716797, -71.6103515625, -69.30408477783203, -66.99781799316406, -64.6915512084961, -62.385284423828125, -60.079017639160156, -57.77275085449219, -55.46648406982422, -53.16021728515625, -50.85395050048828, -48.54768371582031, -46.241416931152344, -43.935150146484375, -41.628883361816406, -39.32261276245117, -37.0163459777832, -34.710079193115234, -32.403812408447266, -30.097545623779297, -27.791278839111328, -25.485010147094727, -23.178743362426758, -20.87247657775879, -18.56620979309082, -16.25994300842285, -13.953675270080566, -11.647408485412598, -9.341141700744629, -7.034873962402344, -4.728607177734375, -2.4223403930664062, -0.1160733699798584, 2.1901936531066895, 4.496460914611816, 6.802727699279785, 9.108994483947754, 11.415262222290039, 13.721529006958008, 16.027795791625977, 18.334062576293945, 20.640329360961914, 22.946598052978516, 25.252864837646484, 27.559131622314453, 29.865398406982422, 32.17166519165039, 34.47793197631836, 36.78419876098633, 39.0904655456543, 41.396732330322266, 43.702999114990234, 46.0092658996582, 48.31553649902344, 50.621803283691406, 52.928070068359375, 55.234336853027344, 57.54060363769531, 59.84687042236328, 62.15313720703125, 64.45940399169922, 66.76567077636719, 69.07193756103516, 71.37820434570312]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 0.0, 0.0, 5.0, 5.0, 8.0, 10.0, 6.0, 6.0, 16.0, 25.0, 37.0, 32.0, 60.0, 63.0, 111.0, 154.0, 223.0, 338.0, 565.0, 993.0, 2021.0, 4594.0, 14486.0, 78625.0, 2861533.0, 1147720.0, 64432.0, 12128.0, 3512.0, 1375.0, 598.0, 253.0, 141.0, 73.0, 53.0, 28.0, 12.0, 14.0, 10.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-49.09375, -47.864501953125, -46.63525390625, -45.406005859375, -44.1767578125, -42.947509765625, -41.71826171875, -40.489013671875, -39.259765625, -38.030517578125, -36.80126953125, -35.572021484375, -34.3427734375, -33.113525390625, -31.88427734375, -30.655029296875, -29.42578125, -28.196533203125, -26.96728515625, -25.738037109375, -24.5087890625, -23.279541015625, -22.05029296875, -20.821044921875, -19.591796875, -18.362548828125, -17.13330078125, -15.904052734375, -14.6748046875, -13.445556640625, -12.21630859375, -10.987060546875, -9.7578125, -8.528564453125, -7.29931640625, -6.070068359375, -4.8408203125, -3.611572265625, -2.38232421875, -1.153076171875, 0.076171875, 1.305419921875, 2.53466796875, 3.763916015625, 4.9931640625, 6.222412109375, 7.45166015625, 8.680908203125, 9.91015625, 11.139404296875, 12.36865234375, 13.597900390625, 14.8271484375, 16.056396484375, 17.28564453125, 18.514892578125, 19.744140625, 20.973388671875, 22.20263671875, 23.431884765625, 24.6611328125, 25.890380859375, 27.11962890625, 28.348876953125, 29.578125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 13.0, 25.0, 31.0, 54.0, 68.0, 103.0, 90.0, 117.0, 124.0, 88.0, 71.0, 65.0, 51.0, 33.0, 26.0, 9.0, 8.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.951171875, -3.854095458984375, -3.75701904296875, -3.659942626953125, -3.5628662109375, -3.465789794921875, -3.36871337890625, -3.271636962890625, -3.174560546875, -3.077484130859375, -2.98040771484375, -2.883331298828125, -2.7862548828125, -2.689178466796875, -2.59210205078125, -2.495025634765625, -2.39794921875, -2.300872802734375, -2.20379638671875, -2.106719970703125, -2.0096435546875, -1.912567138671875, -1.81549072265625, -1.718414306640625, -1.621337890625, -1.524261474609375, -1.42718505859375, -1.330108642578125, -1.2330322265625, -1.135955810546875, -1.03887939453125, -0.941802978515625, -0.8447265625, -0.747650146484375, -0.65057373046875, -0.553497314453125, -0.4564208984375, -0.359344482421875, -0.26226806640625, -0.165191650390625, -0.068115234375, 0.028961181640625, 0.12603759765625, 0.223114013671875, 0.3201904296875, 0.417266845703125, 0.51434326171875, 0.611419677734375, 0.70849609375, 0.805572509765625, 0.90264892578125, 0.999725341796875, 1.0968017578125, 1.193878173828125, 1.29095458984375, 1.388031005859375, 1.485107421875, 1.582183837890625, 1.67926025390625, 1.776336669921875, 1.8734130859375, 1.970489501953125, 2.06756591796875, 2.164642333984375, 2.26171875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 9.0, 9.0, 19.0, 46.0, 65.0, 109.0, 330.0, 804.0, 2691.0, 12782.0, 112649.0, 3515481.0, 511030.0, 30732.0, 5217.0, 1398.0, 475.0, 239.0, 93.0, 57.0, 37.0, 8.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.09375, -54.52392578125, -52.9541015625, -51.38427734375, -49.814453125, -48.24462890625, -46.6748046875, -45.10498046875, -43.53515625, -41.96533203125, -40.3955078125, -38.82568359375, -37.255859375, -35.68603515625, -34.1162109375, -32.54638671875, -30.9765625, -29.40673828125, -27.8369140625, -26.26708984375, -24.697265625, -23.12744140625, -21.5576171875, -19.98779296875, -18.41796875, -16.84814453125, -15.2783203125, -13.70849609375, -12.138671875, -10.56884765625, -8.9990234375, -7.42919921875, -5.859375, -4.28955078125, -2.7197265625, -1.14990234375, 0.419921875, 1.98974609375, 3.5595703125, 5.12939453125, 6.69921875, 8.26904296875, 9.8388671875, 11.40869140625, 12.978515625, 14.54833984375, 16.1181640625, 17.68798828125, 19.2578125, 20.82763671875, 22.3974609375, 23.96728515625, 25.537109375, 27.10693359375, 28.6767578125, 30.24658203125, 31.81640625, 33.38623046875, 34.9560546875, 36.52587890625, 38.095703125, 39.66552734375, 41.2353515625, 42.80517578125, 44.375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 13.0, 12.0, 22.0, 25.0, 34.0, 49.0, 92.0, 125.0, 218.0, 446.0, 1312.0, 841.0, 336.0, 190.0, 127.0, 73.0, 44.0, 34.0, 23.0, 15.0, 12.0, 4.0, 3.0, 1.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.898193359375, -7.67138671875, -7.444580078125, -7.2177734375, -6.990966796875, -6.76416015625, -6.537353515625, -6.310546875, -6.083740234375, -5.85693359375, -5.630126953125, -5.4033203125, -5.176513671875, -4.94970703125, -4.722900390625, -4.49609375, -4.269287109375, -4.04248046875, -3.815673828125, -3.5888671875, -3.362060546875, -3.13525390625, -2.908447265625, -2.681640625, -2.454833984375, -2.22802734375, -2.001220703125, -1.7744140625, -1.547607421875, -1.32080078125, -1.093994140625, -0.8671875, -0.640380859375, -0.41357421875, -0.186767578125, 0.0400390625, 0.266845703125, 0.49365234375, 0.720458984375, 0.947265625, 1.174072265625, 1.40087890625, 1.627685546875, 1.8544921875, 2.081298828125, 2.30810546875, 2.534912109375, 2.76171875, 2.988525390625, 3.21533203125, 3.442138671875, 3.6689453125, 3.895751953125, 4.12255859375, 4.349365234375, 4.576171875, 4.802978515625, 5.02978515625, 5.256591796875, 5.4833984375, 5.710205078125, 5.93701171875, 6.163818359375, 6.390625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 14.0, 13.0, 35.0, 92.0, 175.0, 227.0, 185.0, 143.0, 85.0, 25.0, 8.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-117.08839416503906, -114.83235931396484, -112.57633209228516, -110.32029724121094, -108.06426239013672, -105.80823516845703, -103.55220031738281, -101.2961654663086, -99.0401382446289, -96.78410339355469, -94.528076171875, -92.27204132080078, -90.01600646972656, -87.75997924804688, -85.50394439697266, -83.24790954589844, -80.99188232421875, -78.73584747314453, -76.47982025146484, -74.22378540039062, -71.9677505493164, -69.71172332763672, -67.4556884765625, -65.19965362548828, -62.94361877441406, -60.68758773803711, -58.43155288696289, -56.17552185058594, -53.919490814208984, -51.66345977783203, -49.40742492675781, -47.15139389038086, -44.895355224609375, -42.63932418823242, -40.3832893371582, -38.12725830078125, -35.8712272644043, -33.615196228027344, -31.359161376953125, -29.103130340576172, -26.84709930419922, -24.591066360473633, -22.33503532409668, -20.079002380371094, -17.82297134399414, -15.566938400268555, -13.310905456542969, -11.0548734664917, -8.79884147644043, -6.54280948638916, -4.286777019500732, -2.0307445526123047, 0.22528743743896484, 2.4813194274902344, 4.73735237121582, 6.99338436126709, 9.24941635131836, 11.505448341369629, 13.761480331420898, 16.017513275146484, 18.273544311523438, 20.529577255249023, 22.78561019897461, 25.041641235351562, 27.29767417907715]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 9.0, 6.0, 8.0, 15.0, 18.0, 11.0, 19.0, 22.0, 28.0, 25.0, 30.0, 25.0, 26.0, 40.0, 39.0, 44.0, 49.0, 39.0, 43.0, 33.0, 40.0, 64.0, 44.0, 41.0, 48.0, 36.0, 30.0, 35.0, 24.0, 16.0, 22.0, 10.0, 13.0, 8.0, 10.0, 9.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.254213333129883, -25.470956802368164, -24.687698364257812, -23.904441833496094, -23.121185302734375, -22.337926864624023, -21.554670333862305, -20.771411895751953, -19.988155364990234, -19.204898834228516, -18.421640396118164, -17.638383865356445, -16.855125427246094, -16.071868896484375, -15.288612365722656, -14.505354881286621, -13.722097396850586, -12.93883991241455, -12.155582427978516, -11.372325897216797, -10.589068412780762, -9.805810928344727, -9.022554397583008, -8.239296913146973, -7.4560394287109375, -6.672781944274902, -5.889524936676025, -5.106267929077148, -4.323010444641113, -3.5397531986236572, -2.756495952606201, -1.9732389450073242, -1.1899833679199219, -0.4067261219024658, 0.37653112411499023, 1.1597883701324463, 1.9430456161499023, 2.7263028621673584, 3.5095601081848145, 4.292817115783691, 5.076074600219727, 5.859332084655762, 6.642589092254639, 7.425846099853516, 8.20910358428955, 8.992361068725586, 9.775617599487305, 10.55887508392334, 11.342132568359375, 12.12539005279541, 12.908647537231445, 13.691904067993164, 14.4751615524292, 15.258419036865234, 16.041675567626953, 16.824932098388672, 17.608190536499023, 18.391447067260742, 19.174705505371094, 19.957962036132812, 20.74121856689453, 21.524477005004883, 22.3077335357666, 23.090991973876953, 23.874248504638672]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 6.0, 8.0, 5.0, 10.0, 10.0, 25.0, 22.0, 40.0, 43.0, 45.0, 104.0, 128.0, 209.0, 335.0, 547.0, 1071.0, 2251.0, 5937.0, 15702.0, 47059.0, 141891.0, 357928.0, 305531.0, 111171.0, 36980.0, 12537.0, 4697.0, 2017.0, 917.0, 462.0, 283.0, 176.0, 133.0, 68.0, 57.0, 41.0, 36.0, 17.0, 18.0, 14.0, 9.0, 3.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-17.734375, -17.2110595703125, -16.687744140625, -16.1644287109375, -15.64111328125, -15.1177978515625, -14.594482421875, -14.0711669921875, -13.5478515625, -13.0245361328125, -12.501220703125, -11.9779052734375, -11.45458984375, -10.9312744140625, -10.407958984375, -9.8846435546875, -9.361328125, -8.8380126953125, -8.314697265625, -7.7913818359375, -7.26806640625, -6.7447509765625, -6.221435546875, -5.6981201171875, -5.1748046875, -4.6514892578125, -4.128173828125, -3.6048583984375, -3.08154296875, -2.5582275390625, -2.034912109375, -1.5115966796875, -0.98828125, -0.4649658203125, 0.058349609375, 0.5816650390625, 1.10498046875, 1.6282958984375, 2.151611328125, 2.6749267578125, 3.1982421875, 3.7215576171875, 4.244873046875, 4.7681884765625, 5.29150390625, 5.8148193359375, 6.338134765625, 6.8614501953125, 7.384765625, 7.9080810546875, 8.431396484375, 8.9547119140625, 9.47802734375, 10.0013427734375, 10.524658203125, 11.0479736328125, 11.5712890625, 12.0946044921875, 12.617919921875, 13.1412353515625, 13.66455078125, 14.1878662109375, 14.711181640625, 15.2344970703125, 15.7578125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 8.0, 14.0, 20.0, 24.0, 35.0, 35.0, 65.0, 49.0, 63.0, 64.0, 78.0, 77.0, 84.0, 89.0, 62.0, 53.0, 64.0, 24.0, 29.0, 15.0, 11.0, 9.0, 12.0, 6.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.81640625, -3.7277984619140625, -3.639190673828125, -3.5505828857421875, -3.46197509765625, -3.3733673095703125, -3.284759521484375, -3.1961517333984375, -3.1075439453125, -3.0189361572265625, -2.930328369140625, -2.8417205810546875, -2.75311279296875, -2.6645050048828125, -2.575897216796875, -2.4872894287109375, -2.398681640625, -2.3100738525390625, -2.221466064453125, -2.1328582763671875, -2.04425048828125, -1.9556427001953125, -1.867034912109375, -1.7784271240234375, -1.6898193359375, -1.6012115478515625, -1.512603759765625, -1.4239959716796875, -1.33538818359375, -1.2467803955078125, -1.158172607421875, -1.0695648193359375, -0.98095703125, -0.8923492431640625, -0.803741455078125, -0.7151336669921875, -0.62652587890625, -0.5379180908203125, -0.449310302734375, -0.3607025146484375, -0.2720947265625, -0.1834869384765625, -0.094879150390625, -0.0062713623046875, 0.08233642578125, 0.1709442138671875, 0.259552001953125, 0.3481597900390625, 0.436767578125, 0.5253753662109375, 0.613983154296875, 0.7025909423828125, 0.79119873046875, 0.8798065185546875, 0.968414306640625, 1.0570220947265625, 1.1456298828125, 1.2342376708984375, 1.322845458984375, 1.4114532470703125, 1.50006103515625, 1.5886688232421875, 1.677276611328125, 1.7658843994140625, 1.8544921875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 8.0, 13.0, 7.0, 20.0, 19.0, 18.0, 33.0, 41.0, 51.0, 75.0, 89.0, 144.0, 177.0, 306.0, 405.0, 662.0, 1130.0, 2067.0, 3892.0, 8247.0, 19208.0, 50337.0, 140519.0, 358524.0, 290649.0, 104792.0, 37907.0, 14986.0, 6585.0, 3220.0, 1669.0, 957.0, 581.0, 347.0, 242.0, 172.0, 99.0, 109.0, 63.0, 63.0, 24.0, 29.0, 18.0, 14.0, 13.0, 7.0, 9.0, 3.0, 4.0, 0.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-18.09375, -17.52587890625, -16.9580078125, -16.39013671875, -15.822265625, -15.25439453125, -14.6865234375, -14.11865234375, -13.55078125, -12.98291015625, -12.4150390625, -11.84716796875, -11.279296875, -10.71142578125, -10.1435546875, -9.57568359375, -9.0078125, -8.43994140625, -7.8720703125, -7.30419921875, -6.736328125, -6.16845703125, -5.6005859375, -5.03271484375, -4.46484375, -3.89697265625, -3.3291015625, -2.76123046875, -2.193359375, -1.62548828125, -1.0576171875, -0.48974609375, 0.078125, 0.64599609375, 1.2138671875, 1.78173828125, 2.349609375, 2.91748046875, 3.4853515625, 4.05322265625, 4.62109375, 5.18896484375, 5.7568359375, 6.32470703125, 6.892578125, 7.46044921875, 8.0283203125, 8.59619140625, 9.1640625, 9.73193359375, 10.2998046875, 10.86767578125, 11.435546875, 12.00341796875, 12.5712890625, 13.13916015625, 13.70703125, 14.27490234375, 14.8427734375, 15.41064453125, 15.978515625, 16.54638671875, 17.1142578125, 17.68212890625, 18.25]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0, 6.0, 8.0, 19.0, 13.0, 6.0, 14.0, 22.0, 27.0, 33.0, 27.0, 34.0, 35.0, 47.0, 60.0, 48.0, 47.0, 50.0, 55.0, 33.0, 45.0, 57.0, 39.0, 38.0, 46.0, 33.0, 26.0, 19.0, 19.0, 17.0, 13.0, 7.0, 12.0, 9.0, 6.0, 6.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3046875, -11.86767578125, -11.4306640625, -10.99365234375, -10.556640625, -10.11962890625, -9.6826171875, -9.24560546875, -8.80859375, -8.37158203125, -7.9345703125, -7.49755859375, -7.060546875, -6.62353515625, -6.1865234375, -5.74951171875, -5.3125, -4.87548828125, -4.4384765625, -4.00146484375, -3.564453125, -3.12744140625, -2.6904296875, -2.25341796875, -1.81640625, -1.37939453125, -0.9423828125, -0.50537109375, -0.068359375, 0.36865234375, 0.8056640625, 1.24267578125, 1.6796875, 2.11669921875, 2.5537109375, 2.99072265625, 3.427734375, 3.86474609375, 4.3017578125, 4.73876953125, 5.17578125, 5.61279296875, 6.0498046875, 6.48681640625, 6.923828125, 7.36083984375, 7.7978515625, 8.23486328125, 8.671875, 9.10888671875, 9.5458984375, 9.98291015625, 10.419921875, 10.85693359375, 11.2939453125, 11.73095703125, 12.16796875, 12.60498046875, 13.0419921875, 13.47900390625, 13.916015625, 14.35302734375, 14.7900390625, 15.22705078125, 15.6640625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 4.0, 12.0, 15.0, 18.0, 38.0, 55.0, 64.0, 99.0, 148.0, 236.0, 371.0, 653.0, 1185.0, 2173.0, 4298.0, 9130.0, 20738.0, 49181.0, 124468.0, 328038.0, 309094.0, 115485.0, 45873.0, 19349.0, 8690.0, 4139.0, 2150.0, 1175.0, 634.0, 375.0, 216.0, 138.0, 77.0, 61.0, 47.0, 29.0, 18.0, 21.0, 16.0, 13.0, 5.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-10.15625, -9.87384033203125, -9.5914306640625, -9.30902099609375, -9.026611328125, -8.74420166015625, -8.4617919921875, -8.17938232421875, -7.89697265625, -7.61456298828125, -7.3321533203125, -7.04974365234375, -6.767333984375, -6.48492431640625, -6.2025146484375, -5.92010498046875, -5.6376953125, -5.35528564453125, -5.0728759765625, -4.79046630859375, -4.508056640625, -4.22564697265625, -3.9432373046875, -3.66082763671875, -3.37841796875, -3.09600830078125, -2.8135986328125, -2.53118896484375, -2.248779296875, -1.96636962890625, -1.6839599609375, -1.40155029296875, -1.119140625, -0.83673095703125, -0.5543212890625, -0.27191162109375, 0.010498046875, 0.29290771484375, 0.5753173828125, 0.85772705078125, 1.14013671875, 1.42254638671875, 1.7049560546875, 1.98736572265625, 2.269775390625, 2.55218505859375, 2.8345947265625, 3.11700439453125, 3.3994140625, 3.68182373046875, 3.9642333984375, 4.24664306640625, 4.529052734375, 4.81146240234375, 5.0938720703125, 5.37628173828125, 5.65869140625, 5.94110107421875, 6.2235107421875, 6.50592041015625, 6.788330078125, 7.07073974609375, 7.3531494140625, 7.63555908203125, 7.91796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 7.0, 2.0, 12.0, 8.0, 4.0, 13.0, 18.0, 8.0, 13.0, 23.0, 26.0, 22.0, 29.0, 51.0, 69.0, 115.0, 117.0, 104.0, 69.0, 41.0, 53.0, 30.0, 28.0, 27.0, 15.0, 11.0, 12.0, 7.0, 12.0, 9.0, 8.0, 5.0, 7.0, 6.0, 3.0, 3.0, 7.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0018377304077148438, -0.0017860978841781616, -0.0017344653606414795, -0.0016828328371047974, -0.0016312003135681152, -0.001579567790031433, -0.001527935266494751, -0.0014763027429580688, -0.0014246702194213867, -0.0013730376958847046, -0.0013214051723480225, -0.0012697726488113403, -0.0012181401252746582, -0.001166507601737976, -0.001114875078201294, -0.0010632425546646118, -0.0010116100311279297, -0.0009599775075912476, -0.0009083449840545654, -0.0008567124605178833, -0.0008050799369812012, -0.000753447413444519, -0.0007018148899078369, -0.0006501823663711548, -0.0005985498428344727, -0.0005469173192977905, -0.0004952847957611084, -0.00044365227222442627, -0.00039201974868774414, -0.000340387225151062, -0.0002887547016143799, -0.00023712217807769775, -0.00018548965454101562, -0.0001338571310043335, -8.222460746765137e-05, -3.059208393096924e-05, 2.104043960571289e-05, 7.267296314239502e-05, 0.00012430548667907715, 0.00017593801021575928, 0.0002275705337524414, 0.00027920305728912354, 0.00033083558082580566, 0.0003824681043624878, 0.0004341006278991699, 0.00048573315143585205, 0.0005373656749725342, 0.0005889981985092163, 0.0006406307220458984, 0.0006922632455825806, 0.0007438957691192627, 0.0007955282926559448, 0.000847160816192627, 0.0008987933397293091, 0.0009504258632659912, 0.0010020583868026733, 0.0010536909103393555, 0.0011053234338760376, 0.0011569559574127197, 0.0012085884809494019, 0.001260221004486084, 0.0013118535280227661, 0.0013634860515594482, 0.0014151185750961304, 0.0014667510986328125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 5.0, 2.0, 7.0, 10.0, 21.0, 16.0, 28.0, 35.0, 56.0, 73.0, 114.0, 161.0, 242.0, 430.0, 774.0, 1462.0, 3205.0, 7440.0, 20411.0, 64783.0, 252636.0, 501435.0, 133132.0, 38787.0, 13090.0, 5127.0, 2335.0, 1114.0, 648.0, 335.0, 195.0, 130.0, 88.0, 75.0, 40.0, 33.0, 26.0, 17.0, 12.0, 8.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.96875, -12.52587890625, -12.0830078125, -11.64013671875, -11.197265625, -10.75439453125, -10.3115234375, -9.86865234375, -9.42578125, -8.98291015625, -8.5400390625, -8.09716796875, -7.654296875, -7.21142578125, -6.7685546875, -6.32568359375, -5.8828125, -5.43994140625, -4.9970703125, -4.55419921875, -4.111328125, -3.66845703125, -3.2255859375, -2.78271484375, -2.33984375, -1.89697265625, -1.4541015625, -1.01123046875, -0.568359375, -0.12548828125, 0.3173828125, 0.76025390625, 1.203125, 1.64599609375, 2.0888671875, 2.53173828125, 2.974609375, 3.41748046875, 3.8603515625, 4.30322265625, 4.74609375, 5.18896484375, 5.6318359375, 6.07470703125, 6.517578125, 6.96044921875, 7.4033203125, 7.84619140625, 8.2890625, 8.73193359375, 9.1748046875, 9.61767578125, 10.060546875, 10.50341796875, 10.9462890625, 11.38916015625, 11.83203125, 12.27490234375, 12.7177734375, 13.16064453125, 13.603515625, 14.04638671875, 14.4892578125, 14.93212890625, 15.375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 4.0, 6.0, 5.0, 4.0, 6.0, 4.0, 18.0, 13.0, 15.0, 18.0, 18.0, 37.0, 29.0, 42.0, 53.0, 59.0, 69.0, 83.0, 80.0, 70.0, 58.0, 44.0, 53.0, 30.0, 35.0, 24.0, 15.0, 22.0, 9.0, 11.0, 12.0, 6.0, 11.0, 6.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.01171875, -6.79290771484375, -6.5740966796875, -6.35528564453125, -6.136474609375, -5.91766357421875, -5.6988525390625, -5.48004150390625, -5.26123046875, -5.04241943359375, -4.8236083984375, -4.60479736328125, -4.385986328125, -4.16717529296875, -3.9483642578125, -3.72955322265625, -3.5107421875, -3.29193115234375, -3.0731201171875, -2.85430908203125, -2.635498046875, -2.41668701171875, -2.1978759765625, -1.97906494140625, -1.76025390625, -1.54144287109375, -1.3226318359375, -1.10382080078125, -0.885009765625, -0.66619873046875, -0.4473876953125, -0.22857666015625, -0.009765625, 0.20904541015625, 0.4278564453125, 0.64666748046875, 0.865478515625, 1.08428955078125, 1.3031005859375, 1.52191162109375, 1.74072265625, 1.95953369140625, 2.1783447265625, 2.39715576171875, 2.615966796875, 2.83477783203125, 3.0535888671875, 3.27239990234375, 3.4912109375, 3.71002197265625, 3.9288330078125, 4.14764404296875, 4.366455078125, 4.58526611328125, 4.8040771484375, 5.02288818359375, 5.24169921875, 5.46051025390625, 5.6793212890625, 5.89813232421875, 6.116943359375, 6.33575439453125, 6.5545654296875, 6.77337646484375, 6.9921875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 8.0, 12.0, 16.0, 38.0, 49.0, 58.0, 86.0, 104.0, 112.0, 127.0, 98.0, 80.0, 59.0, 40.0, 28.0, 29.0, 11.0, 9.0, 9.0, 5.0, 5.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-106.07269287109375, -102.42373657226562, -98.77478790283203, -95.1258316040039, -91.47688293457031, -87.82792663574219, -84.17897033691406, -80.53001403808594, -76.88106536865234, -73.23210906982422, -69.58316040039062, -65.9342041015625, -62.28525161743164, -58.63629913330078, -54.987342834472656, -51.3383903503418, -47.68943786621094, -44.04048538208008, -40.39153289794922, -36.742576599121094, -33.093624114990234, -29.444671630859375, -25.795717239379883, -22.14676284790039, -18.49781036376953, -14.848856925964355, -11.19990348815918, -7.550950050354004, -3.901996612548828, -0.25304412841796875, 3.3959102630615234, 7.044864654541016, 10.693817138671875, 14.34277057647705, 17.991724014282227, 21.64067840576172, 25.289630889892578, 28.938583374023438, 32.58753967285156, 36.23649215698242, 39.88544464111328, 43.53439712524414, 47.183349609375, 50.832305908203125, 54.481258392333984, 58.130210876464844, 61.77916717529297, 65.42811584472656, 69.07707214355469, 72.72602844238281, 76.3749771118164, 80.02393341064453, 83.67288208007812, 87.32183837890625, 90.97079467773438, 94.6197509765625, 98.2686996459961, 101.91765594482422, 105.56660461425781, 109.21556091308594, 112.86451721191406, 116.51346588134766, 120.16242218017578, 123.81137084960938, 127.4603271484375]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 10.0, 3.0, 9.0, 7.0, 7.0, 11.0, 17.0, 18.0, 17.0, 25.0, 23.0, 34.0, 38.0, 41.0, 39.0, 45.0, 55.0, 42.0, 45.0, 50.0, 45.0, 48.0, 38.0, 42.0, 39.0, 36.0, 35.0, 24.0, 35.0, 21.0, 22.0, 12.0, 16.0, 16.0, 12.0, 6.0, 1.0, 7.0, 4.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-96.41365051269531, -93.451171875, -90.48869323730469, -87.52621459960938, -84.5637435913086, -81.60126495361328, -78.63878631591797, -75.67630767822266, -72.71383666992188, -69.75135803222656, -66.78887939453125, -63.8264045715332, -60.863929748535156, -57.901451110839844, -54.93897247314453, -51.97649383544922, -49.014015197753906, -46.051536560058594, -43.08906173706055, -40.126583099365234, -37.16410827636719, -34.201629638671875, -31.239151000976562, -28.276674270629883, -25.314197540283203, -22.351720809936523, -19.389244079589844, -16.42676544189453, -13.464288711547852, -10.501811981201172, -7.539333343505859, -4.57685661315918, -1.6143798828125, 1.348097324371338, 4.310574531555176, 7.273052215576172, 10.235528945922852, 13.198005676269531, 16.160484313964844, 19.122961044311523, 22.085437774658203, 25.047914505004883, 28.010391235351562, 30.972869873046875, 33.93534851074219, 36.897823333740234, 39.86030197143555, 42.822776794433594, 45.785255432128906, 48.74773406982422, 51.710208892822266, 54.67268753051758, 57.635162353515625, 60.59764099121094, 63.56011962890625, 66.52259826660156, 69.48507690429688, 72.44755554199219, 75.4100341796875, 78.37251281738281, 81.3349838256836, 84.2974624633789, 87.25994110107422, 90.22241973876953, 93.18489074707031]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 3.0, 5.0, 9.0, 11.0, 9.0, 18.0, 23.0, 49.0, 59.0, 105.0, 157.0, 338.0, 665.0, 1667.0, 4888.0, 21297.0, 200803.0, 3806195.0, 135716.0, 16496.0, 3698.0, 1162.0, 474.0, 173.0, 105.0, 57.0, 31.0, 24.0, 20.0, 9.0, 12.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-56.90625, -55.595947265625, -54.28564453125, -52.975341796875, -51.6650390625, -50.354736328125, -49.04443359375, -47.734130859375, -46.423828125, -45.113525390625, -43.80322265625, -42.492919921875, -41.1826171875, -39.872314453125, -38.56201171875, -37.251708984375, -35.94140625, -34.631103515625, -33.32080078125, -32.010498046875, -30.7001953125, -29.389892578125, -28.07958984375, -26.769287109375, -25.458984375, -24.148681640625, -22.83837890625, -21.528076171875, -20.2177734375, -18.907470703125, -17.59716796875, -16.286865234375, -14.9765625, -13.666259765625, -12.35595703125, -11.045654296875, -9.7353515625, -8.425048828125, -7.11474609375, -5.804443359375, -4.494140625, -3.183837890625, -1.87353515625, -0.563232421875, 0.7470703125, 2.057373046875, 3.36767578125, 4.677978515625, 5.98828125, 7.298583984375, 8.60888671875, 9.919189453125, 11.2294921875, 12.539794921875, 13.85009765625, 15.160400390625, 16.470703125, 17.781005859375, 19.09130859375, 20.401611328125, 21.7119140625, 23.022216796875, 24.33251953125, 25.642822265625, 26.953125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 9.0, 5.0, 12.0, 15.0, 16.0, 30.0, 36.0, 48.0, 40.0, 51.0, 64.0, 74.0, 73.0, 85.0, 91.0, 62.0, 60.0, 64.0, 45.0, 40.0, 17.0, 12.0, 19.0, 14.0, 8.0, 5.0, 6.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.6064453125, -4.494140625, -4.3818359375, -4.26953125, -4.1572265625, -4.044921875, -3.9326171875, -3.8203125, -3.7080078125, -3.595703125, -3.4833984375, -3.37109375, -3.2587890625, -3.146484375, -3.0341796875, -2.921875, -2.8095703125, -2.697265625, -2.5849609375, -2.47265625, -2.3603515625, -2.248046875, -2.1357421875, -2.0234375, -1.9111328125, -1.798828125, -1.6865234375, -1.57421875, -1.4619140625, -1.349609375, -1.2373046875, -1.125, -1.0126953125, -0.900390625, -0.7880859375, -0.67578125, -0.5634765625, -0.451171875, -0.3388671875, -0.2265625, -0.1142578125, -0.001953125, 0.1103515625, 0.22265625, 0.3349609375, 0.447265625, 0.5595703125, 0.671875, 0.7841796875, 0.896484375, 1.0087890625, 1.12109375, 1.2333984375, 1.345703125, 1.4580078125, 1.5703125, 1.6826171875, 1.794921875, 1.9072265625, 2.01953125, 2.1318359375, 2.244140625, 2.3564453125, 2.46875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 10.0, 14.0, 24.0, 54.0, 72.0, 109.0, 198.0, 332.0, 778.0, 1857.0, 4829.0, 14686.0, 58498.0, 445392.0, 3374665.0, 236509.0, 38830.0, 10497.0, 3749.0, 1448.0, 688.0, 380.0, 218.0, 152.0, 98.0, 64.0, 41.0, 34.0, 13.0, 16.0, 7.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-36.875, -35.861083984375, -34.84716796875, -33.833251953125, -32.8193359375, -31.805419921875, -30.79150390625, -29.777587890625, -28.763671875, -27.749755859375, -26.73583984375, -25.721923828125, -24.7080078125, -23.694091796875, -22.68017578125, -21.666259765625, -20.65234375, -19.638427734375, -18.62451171875, -17.610595703125, -16.5966796875, -15.582763671875, -14.56884765625, -13.554931640625, -12.541015625, -11.527099609375, -10.51318359375, -9.499267578125, -8.4853515625, -7.471435546875, -6.45751953125, -5.443603515625, -4.4296875, -3.415771484375, -2.40185546875, -1.387939453125, -0.3740234375, 0.639892578125, 1.65380859375, 2.667724609375, 3.681640625, 4.695556640625, 5.70947265625, 6.723388671875, 7.7373046875, 8.751220703125, 9.76513671875, 10.779052734375, 11.79296875, 12.806884765625, 13.82080078125, 14.834716796875, 15.8486328125, 16.862548828125, 17.87646484375, 18.890380859375, 19.904296875, 20.918212890625, 21.93212890625, 22.946044921875, 23.9599609375, 24.973876953125, 25.98779296875, 27.001708984375, 28.015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 1.0, 3.0, 8.0, 7.0, 10.0, 5.0, 18.0, 16.0, 22.0, 31.0, 42.0, 70.0, 100.0, 165.0, 324.0, 985.0, 1327.0, 374.0, 200.0, 128.0, 74.0, 57.0, 23.0, 21.0, 28.0, 10.0, 9.0, 7.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.79296875, -4.54144287109375, -4.2899169921875, -4.03839111328125, -3.786865234375, -3.53533935546875, -3.2838134765625, -3.03228759765625, -2.78076171875, -2.52923583984375, -2.2777099609375, -2.02618408203125, -1.774658203125, -1.52313232421875, -1.2716064453125, -1.02008056640625, -0.7685546875, -0.51702880859375, -0.2655029296875, -0.01397705078125, 0.237548828125, 0.48907470703125, 0.7406005859375, 0.99212646484375, 1.24365234375, 1.49517822265625, 1.7467041015625, 1.99822998046875, 2.249755859375, 2.50128173828125, 2.7528076171875, 3.00433349609375, 3.255859375, 3.50738525390625, 3.7589111328125, 4.01043701171875, 4.261962890625, 4.51348876953125, 4.7650146484375, 5.01654052734375, 5.26806640625, 5.51959228515625, 5.7711181640625, 6.02264404296875, 6.274169921875, 6.52569580078125, 6.7772216796875, 7.02874755859375, 7.2802734375, 7.53179931640625, 7.7833251953125, 8.03485107421875, 8.286376953125, 8.53790283203125, 8.7894287109375, 9.04095458984375, 9.29248046875, 9.54400634765625, 9.7955322265625, 10.04705810546875, 10.298583984375, 10.55010986328125, 10.8016357421875, 11.05316162109375, 11.3046875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 12.0, 18.0, 16.0, 26.0, 68.0, 104.0, 131.0, 173.0, 137.0, 128.0, 81.0, 40.0, 30.0, 15.0, 6.0, 5.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.09375, -62.28982162475586, -60.48588943481445, -58.68196105957031, -56.878028869628906, -55.074100494384766, -53.270172119140625, -51.46623992919922, -49.66231155395508, -47.85838317871094, -46.05445098876953, -44.25052261352539, -42.44659423828125, -40.642662048339844, -38.8387336730957, -37.03480529785156, -35.230873107910156, -33.426944732666016, -31.62301254272461, -29.81908416748047, -28.015153884887695, -26.211223602294922, -24.40729522705078, -22.603364944458008, -20.799434661865234, -18.99550437927246, -17.191574096679688, -15.387645721435547, -13.583715438842773, -11.77978515625, -9.975855827331543, -8.171926498413086, -6.3679962158203125, -4.564066410064697, -2.760136604309082, -0.9562067985534668, 0.8477230072021484, 2.651653289794922, 4.455582618713379, 6.259511947631836, 8.06344223022461, 9.867372512817383, 11.67130184173584, 13.475231170654297, 15.27916145324707, 17.083091735839844, 18.887020111083984, 20.690950393676758, 22.49488067626953, 24.298810958862305, 26.102741241455078, 27.90666961669922, 29.710599899291992, 31.514530181884766, 33.318458557128906, 35.12239074707031, 36.92631912231445, 38.730247497558594, 40.5341796875, 42.33810806274414, 44.14203643798828, 45.94596862792969, 47.74989700317383, 49.55382537841797, 51.357757568359375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 10.0, 14.0, 17.0, 11.0, 18.0, 19.0, 18.0, 26.0, 24.0, 31.0, 15.0, 31.0, 36.0, 35.0, 29.0, 34.0, 43.0, 45.0, 45.0, 44.0, 40.0, 36.0, 40.0, 38.0, 38.0, 35.0, 34.0, 25.0, 21.0, 24.0, 14.0, 7.0, 14.0, 21.0, 9.0, 13.0, 10.0, 11.0, 5.0, 4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-25.883262634277344, -25.136049270629883, -24.388835906982422, -23.64162254333496, -22.8944091796875, -22.14719581604004, -21.399982452392578, -20.652767181396484, -19.905555725097656, -19.158342361450195, -18.411128997802734, -17.663915634155273, -16.916702270507812, -16.16948890686035, -15.422274589538574, -14.675061225891113, -13.927846908569336, -13.180633544921875, -12.433420181274414, -11.686206817626953, -10.938993453979492, -10.191780090332031, -9.444565773010254, -8.697352409362793, -7.950139045715332, -7.202925682067871, -6.45571231842041, -5.708498477935791, -4.96128511428833, -4.214071750640869, -3.46685791015625, -2.719644546508789, -1.9724311828613281, -1.2252177000045776, -0.47800421714782715, 0.2692093849182129, 1.0164227485656738, 1.7636361122131348, 2.510849952697754, 3.258063316345215, 4.005276679992676, 4.752490043640137, 5.499703407287598, 6.246917247772217, 6.994130611419678, 7.741343975067139, 8.488557815551758, 9.235771179199219, 9.98298454284668, 10.73019790649414, 11.477411270141602, 12.224624633789062, 12.971837997436523, 13.719051361083984, 14.466265678405762, 15.213479042053223, 15.960692405700684, 16.70790672302246, 17.455120086669922, 18.202333450317383, 18.949546813964844, 19.696760177612305, 20.443973541259766, 21.191186904907227, 21.938400268554688]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 8.0, 4.0, 8.0, 17.0, 16.0, 23.0, 41.0, 42.0, 50.0, 67.0, 130.0, 167.0, 300.0, 568.0, 978.0, 1751.0, 3356.0, 6471.0, 13029.0, 27054.0, 56299.0, 118641.0, 226418.0, 276957.0, 162012.0, 79210.0, 37692.0, 18217.0, 8956.0, 4632.0, 2347.0, 1216.0, 736.0, 384.0, 209.0, 167.0, 97.0, 69.0, 59.0, 43.0, 29.0, 27.0, 15.0, 16.0, 11.0, 5.0, 5.0, 2.0, 4.0], "bins": [-12.8984375, -12.56103515625, -12.2236328125, -11.88623046875, -11.548828125, -11.21142578125, -10.8740234375, -10.53662109375, -10.19921875, -9.86181640625, -9.5244140625, -9.18701171875, -8.849609375, -8.51220703125, -8.1748046875, -7.83740234375, -7.5, -7.16259765625, -6.8251953125, -6.48779296875, -6.150390625, -5.81298828125, -5.4755859375, -5.13818359375, -4.80078125, -4.46337890625, -4.1259765625, -3.78857421875, -3.451171875, -3.11376953125, -2.7763671875, -2.43896484375, -2.1015625, -1.76416015625, -1.4267578125, -1.08935546875, -0.751953125, -0.41455078125, -0.0771484375, 0.26025390625, 0.59765625, 0.93505859375, 1.2724609375, 1.60986328125, 1.947265625, 2.28466796875, 2.6220703125, 2.95947265625, 3.296875, 3.63427734375, 3.9716796875, 4.30908203125, 4.646484375, 4.98388671875, 5.3212890625, 5.65869140625, 5.99609375, 6.33349609375, 6.6708984375, 7.00830078125, 7.345703125, 7.68310546875, 8.0205078125, 8.35791015625, 8.6953125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 6.0, 13.0, 17.0, 16.0, 20.0, 23.0, 31.0, 25.0, 39.0, 38.0, 53.0, 43.0, 58.0, 58.0, 58.0, 66.0, 71.0, 50.0, 49.0, 59.0, 42.0, 35.0, 22.0, 23.0, 22.0, 15.0, 13.0, 8.0, 9.0, 3.0, 3.0, 9.0, 2.0, 2.0, 3.0], "bins": [-4.140625, -4.0455474853515625, -3.950469970703125, -3.8553924560546875, -3.76031494140625, -3.6652374267578125, -3.570159912109375, -3.4750823974609375, -3.3800048828125, -3.2849273681640625, -3.189849853515625, -3.0947723388671875, -2.99969482421875, -2.9046173095703125, -2.809539794921875, -2.7144622802734375, -2.619384765625, -2.5243072509765625, -2.429229736328125, -2.3341522216796875, -2.23907470703125, -2.1439971923828125, -2.048919677734375, -1.9538421630859375, -1.8587646484375, -1.7636871337890625, -1.668609619140625, -1.5735321044921875, -1.47845458984375, -1.3833770751953125, -1.288299560546875, -1.1932220458984375, -1.09814453125, -1.0030670166015625, -0.907989501953125, -0.8129119873046875, -0.71783447265625, -0.6227569580078125, -0.527679443359375, -0.4326019287109375, -0.3375244140625, -0.2424468994140625, -0.147369384765625, -0.0522918701171875, 0.04278564453125, 0.1378631591796875, 0.232940673828125, 0.3280181884765625, 0.423095703125, 0.5181732177734375, 0.613250732421875, 0.7083282470703125, 0.80340576171875, 0.8984832763671875, 0.993560791015625, 1.0886383056640625, 1.1837158203125, 1.2787933349609375, 1.373870849609375, 1.4689483642578125, 1.56402587890625, 1.6591033935546875, 1.754180908203125, 1.8492584228515625, 1.9443359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 8.0, 14.0, 15.0, 25.0, 32.0, 41.0, 50.0, 108.0, 102.0, 152.0, 263.0, 368.0, 569.0, 948.0, 1537.0, 2645.0, 4783.0, 9518.0, 19694.0, 45088.0, 107683.0, 244781.0, 321861.0, 162505.0, 67779.0, 29181.0, 13320.0, 6560.0, 3486.0, 1970.0, 1185.0, 726.0, 463.0, 334.0, 232.0, 154.0, 117.0, 63.0, 46.0, 43.0, 38.0, 16.0, 18.0, 11.0, 6.0, 5.0, 5.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0], "bins": [-14.140625, -13.7152099609375, -13.289794921875, -12.8643798828125, -12.43896484375, -12.0135498046875, -11.588134765625, -11.1627197265625, -10.7373046875, -10.3118896484375, -9.886474609375, -9.4610595703125, -9.03564453125, -8.6102294921875, -8.184814453125, -7.7593994140625, -7.333984375, -6.9085693359375, -6.483154296875, -6.0577392578125, -5.63232421875, -5.2069091796875, -4.781494140625, -4.3560791015625, -3.9306640625, -3.5052490234375, -3.079833984375, -2.6544189453125, -2.22900390625, -1.8035888671875, -1.378173828125, -0.9527587890625, -0.52734375, -0.1019287109375, 0.323486328125, 0.7489013671875, 1.17431640625, 1.5997314453125, 2.025146484375, 2.4505615234375, 2.8759765625, 3.3013916015625, 3.726806640625, 4.1522216796875, 4.57763671875, 5.0030517578125, 5.428466796875, 5.8538818359375, 6.279296875, 6.7047119140625, 7.130126953125, 7.5555419921875, 7.98095703125, 8.4063720703125, 8.831787109375, 9.2572021484375, 9.6826171875, 10.1080322265625, 10.533447265625, 10.9588623046875, 11.38427734375, 11.8096923828125, 12.235107421875, 12.6605224609375, 13.0859375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 4.0, 3.0, 11.0, 10.0, 10.0, 12.0, 17.0, 18.0, 31.0, 29.0, 31.0, 41.0, 45.0, 48.0, 57.0, 50.0, 62.0, 51.0, 48.0, 51.0, 46.0, 44.0, 48.0, 39.0, 29.0, 33.0, 25.0, 11.0, 19.0, 20.0, 14.0, 7.0, 7.0, 11.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2578125, -13.7381591796875, -13.218505859375, -12.6988525390625, -12.17919921875, -11.6595458984375, -11.139892578125, -10.6202392578125, -10.1005859375, -9.5809326171875, -9.061279296875, -8.5416259765625, -8.02197265625, -7.5023193359375, -6.982666015625, -6.4630126953125, -5.943359375, -5.4237060546875, -4.904052734375, -4.3843994140625, -3.86474609375, -3.3450927734375, -2.825439453125, -2.3057861328125, -1.7861328125, -1.2664794921875, -0.746826171875, -0.2271728515625, 0.29248046875, 0.8121337890625, 1.331787109375, 1.8514404296875, 2.37109375, 2.8907470703125, 3.410400390625, 3.9300537109375, 4.44970703125, 4.9693603515625, 5.489013671875, 6.0086669921875, 6.5283203125, 7.0479736328125, 7.567626953125, 8.0872802734375, 8.60693359375, 9.1265869140625, 9.646240234375, 10.1658935546875, 10.685546875, 11.2052001953125, 11.724853515625, 12.2445068359375, 12.76416015625, 13.2838134765625, 13.803466796875, 14.3231201171875, 14.8427734375, 15.3624267578125, 15.882080078125, 16.4017333984375, 16.92138671875, 17.4410400390625, 17.960693359375, 18.4803466796875, 19.0]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [9.0, 4.0, 3.0, 9.0, 7.0, 10.0, 6.0, 18.0, 17.0, 29.0, 29.0, 64.0, 70.0, 101.0, 152.0, 259.0, 444.0, 857.0, 1758.0, 4285.0, 11703.0, 37229.0, 130444.0, 388931.0, 326909.0, 100161.0, 28910.0, 9295.0, 3548.0, 1448.0, 732.0, 383.0, 222.0, 169.0, 99.0, 57.0, 36.0, 39.0, 29.0, 24.0, 19.0, 13.0, 10.0, 6.0, 4.0, 9.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7578125, -5.516845703125, -5.27587890625, -5.034912109375, -4.7939453125, -4.552978515625, -4.31201171875, -4.071044921875, -3.830078125, -3.589111328125, -3.34814453125, -3.107177734375, -2.8662109375, -2.625244140625, -2.38427734375, -2.143310546875, -1.90234375, -1.661376953125, -1.42041015625, -1.179443359375, -0.9384765625, -0.697509765625, -0.45654296875, -0.215576171875, 0.025390625, 0.266357421875, 0.50732421875, 0.748291015625, 0.9892578125, 1.230224609375, 1.47119140625, 1.712158203125, 1.953125, 2.194091796875, 2.43505859375, 2.676025390625, 2.9169921875, 3.157958984375, 3.39892578125, 3.639892578125, 3.880859375, 4.121826171875, 4.36279296875, 4.603759765625, 4.8447265625, 5.085693359375, 5.32666015625, 5.567626953125, 5.80859375, 6.049560546875, 6.29052734375, 6.531494140625, 6.7724609375, 7.013427734375, 7.25439453125, 7.495361328125, 7.736328125, 7.977294921875, 8.21826171875, 8.459228515625, 8.7001953125, 8.941162109375, 9.18212890625, 9.423095703125, 9.6640625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 7.0, 6.0, 7.0, 9.0, 13.0, 12.0, 8.0, 15.0, 17.0, 26.0, 30.0, 37.0, 32.0, 31.0, 40.0, 63.0, 75.0, 101.0, 92.0, 59.0, 40.0, 35.0, 38.0, 29.0, 30.0, 23.0, 19.0, 23.0, 16.0, 14.0, 13.0, 11.0, 5.0, 3.0, 11.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009675025939941406, -0.0009347125887870789, -0.0009019225835800171, -0.0008691325783729553, -0.0008363425731658936, -0.0008035525679588318, -0.00077076256275177, -0.0007379725575447083, -0.0007051825523376465, -0.0006723925471305847, -0.000639602541923523, -0.0006068125367164612, -0.0005740225315093994, -0.0005412325263023376, -0.0005084425210952759, -0.0004756525158882141, -0.00044286251068115234, -0.0004100725054740906, -0.0003772825002670288, -0.00034449249505996704, -0.0003117024898529053, -0.0002789124846458435, -0.00024612247943878174, -0.00021333247423171997, -0.0001805424690246582, -0.00014775246381759644, -0.00011496245861053467, -8.21724534034729e-05, -4.938244819641113e-05, -1.6592442989349365e-05, 1.6197562217712402e-05, 4.898756742477417e-05, 8.177757263183594e-05, 0.0001145675778388977, 0.00014735758304595947, 0.00018014758825302124, 0.000212937593460083, 0.0002457275986671448, 0.00027851760387420654, 0.0003113076090812683, 0.0003440976142883301, 0.00037688761949539185, 0.0004096776247024536, 0.0004424676299095154, 0.00047525763511657715, 0.0005080476403236389, 0.0005408376455307007, 0.0005736276507377625, 0.0006064176559448242, 0.000639207661151886, 0.0006719976663589478, 0.0007047876715660095, 0.0007375776767730713, 0.0007703676819801331, 0.0008031576871871948, 0.0008359476923942566, 0.0008687376976013184, 0.0009015277028083801, 0.0009343177080154419, 0.0009671077132225037, 0.0009998977184295654, 0.0010326877236366272, 0.001065477728843689, 0.0010982677340507507, 0.0011310577392578125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 8.0, 14.0, 19.0, 31.0, 38.0, 52.0, 83.0, 100.0, 197.0, 247.0, 475.0, 782.0, 1336.0, 2605.0, 5336.0, 12733.0, 34766.0, 105974.0, 317597.0, 365971.0, 130214.0, 42189.0, 14879.0, 6093.0, 2893.0, 1590.0, 888.0, 490.0, 281.0, 208.0, 112.0, 101.0, 67.0, 42.0, 28.0, 27.0, 21.0, 8.0, 12.0, 6.0, 8.0, 1.0, 3.0, 3.0, 1.0, 6.0, 1.0, 5.0, 1.0, 1.0], "bins": [-7.6484375, -7.41729736328125, -7.1861572265625, -6.95501708984375, -6.723876953125, -6.49273681640625, -6.2615966796875, -6.03045654296875, -5.79931640625, -5.56817626953125, -5.3370361328125, -5.10589599609375, -4.874755859375, -4.64361572265625, -4.4124755859375, -4.18133544921875, -3.9501953125, -3.71905517578125, -3.4879150390625, -3.25677490234375, -3.025634765625, -2.79449462890625, -2.5633544921875, -2.33221435546875, -2.10107421875, -1.86993408203125, -1.6387939453125, -1.40765380859375, -1.176513671875, -0.94537353515625, -0.7142333984375, -0.48309326171875, -0.251953125, -0.02081298828125, 0.2103271484375, 0.44146728515625, 0.672607421875, 0.90374755859375, 1.1348876953125, 1.36602783203125, 1.59716796875, 1.82830810546875, 2.0594482421875, 2.29058837890625, 2.521728515625, 2.75286865234375, 2.9840087890625, 3.21514892578125, 3.4462890625, 3.67742919921875, 3.9085693359375, 4.13970947265625, 4.370849609375, 4.60198974609375, 4.8331298828125, 5.06427001953125, 5.29541015625, 5.52655029296875, 5.7576904296875, 5.98883056640625, 6.219970703125, 6.45111083984375, 6.6822509765625, 6.91339111328125, 7.14453125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 8.0, 14.0, 23.0, 16.0, 19.0, 33.0, 54.0, 48.0, 65.0, 76.0, 88.0, 91.0, 79.0, 76.0, 64.0, 71.0, 52.0, 18.0, 34.0, 20.0, 8.0, 7.0, 5.0, 7.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.8359375, -7.6160888671875, -7.396240234375, -7.1763916015625, -6.95654296875, -6.7366943359375, -6.516845703125, -6.2969970703125, -6.0771484375, -5.8572998046875, -5.637451171875, -5.4176025390625, -5.19775390625, -4.9779052734375, -4.758056640625, -4.5382080078125, -4.318359375, -4.0985107421875, -3.878662109375, -3.6588134765625, -3.43896484375, -3.2191162109375, -2.999267578125, -2.7794189453125, -2.5595703125, -2.3397216796875, -2.119873046875, -1.9000244140625, -1.68017578125, -1.4603271484375, -1.240478515625, -1.0206298828125, -0.80078125, -0.5809326171875, -0.361083984375, -0.1412353515625, 0.07861328125, 0.2984619140625, 0.518310546875, 0.7381591796875, 0.9580078125, 1.1778564453125, 1.397705078125, 1.6175537109375, 1.83740234375, 2.0572509765625, 2.277099609375, 2.4969482421875, 2.716796875, 2.9366455078125, 3.156494140625, 3.3763427734375, 3.59619140625, 3.8160400390625, 4.035888671875, 4.2557373046875, 4.4755859375, 4.6954345703125, 4.915283203125, 5.1351318359375, 5.35498046875, 5.5748291015625, 5.794677734375, 6.0145263671875, 6.234375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 7.0, 12.0, 12.0, 18.0, 40.0, 50.0, 114.0, 116.0, 155.0, 156.0, 107.0, 73.0, 52.0, 38.0, 18.0, 11.0, 7.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-157.15682983398438, -153.20716857910156, -149.2575225830078, -145.307861328125, -141.35821533203125, -137.40855407714844, -133.4589080810547, -129.50924682617188, -125.55960083007812, -121.60994720458984, -117.66029357910156, -113.71063995361328, -109.760986328125, -105.81133270263672, -101.86167907714844, -97.91202545166016, -93.96237182617188, -90.0127182006836, -86.06306457519531, -82.11341094970703, -78.16375732421875, -74.21410369873047, -70.26445007324219, -66.3147964477539, -62.365135192871094, -58.41548156738281, -54.46582794189453, -50.51617431640625, -46.56652069091797, -42.61686706542969, -38.667213439941406, -34.717559814453125, -30.767906188964844, -26.818252563476562, -22.86859893798828, -18.9189453125, -14.969290733337402, -11.019636154174805, -7.069982528686523, -3.120328903198242, 0.8293247222900391, 4.77897834777832, 8.728631973266602, 12.6782865524292, 16.627941131591797, 20.577594757080078, 24.52724838256836, 28.47690200805664, 32.42655563354492, 36.3762092590332, 40.325862884521484, 44.275516510009766, 48.22517013549805, 52.174827575683594, 56.124481201171875, 60.074134826660156, 64.02378845214844, 67.97344207763672, 71.923095703125, 75.87274932861328, 79.82240295410156, 83.77205657958984, 87.72171020507812, 91.6713638305664, 95.62101745605469]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 9.0, 4.0, 6.0, 4.0, 21.0, 17.0, 20.0, 20.0, 36.0, 35.0, 37.0, 38.0, 51.0, 46.0, 58.0, 59.0, 55.0, 62.0, 53.0, 51.0, 46.0, 43.0, 38.0, 34.0, 25.0, 20.0, 22.0, 22.0, 20.0, 14.0, 10.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.13690185546875, -66.1010513305664, -63.0651969909668, -60.02934265136719, -56.99348831176758, -53.95763397216797, -50.921783447265625, -47.885929107666016, -44.850074768066406, -41.8142204284668, -38.77836990356445, -35.742515563964844, -32.706661224365234, -29.670808792114258, -26.63495635986328, -23.599102020263672, -20.563251495361328, -17.52739906311035, -14.491544723510742, -11.455692291259766, -8.419838905334473, -5.38398551940918, -2.348133087158203, 0.6877212524414062, 3.723573684692383, 6.759427070617676, 9.795280456542969, 12.831132888793945, 15.866986274719238, 18.90283966064453, 21.938692092895508, 24.974546432495117, 28.010398864746094, 31.04625129699707, 34.08210372924805, 37.117958068847656, 40.153812408447266, 43.189666748046875, 46.22551727294922, 49.26137161254883, 52.29722595214844, 55.33308029174805, 58.36893081665039, 61.40478515625, 64.44063568115234, 67.47649383544922, 70.51234436035156, 73.54820251464844, 76.58404541015625, 79.6198959350586, 82.65575408935547, 85.69160461425781, 88.72745513916016, 91.76331329345703, 94.79916381835938, 97.83502197265625, 100.8708724975586, 103.90672302246094, 106.94258117675781, 109.97843170166016, 113.0142822265625, 116.05014038085938, 119.08599090576172, 122.12184143066406, 125.15769958496094]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 20.0, 11.0, 16.0, 28.0, 46.0, 52.0, 100.0, 142.0, 229.0, 427.0, 696.0, 1256.0, 2507.0, 5246.0, 12704.0, 38009.0, 200166.0, 3635649.0, 230856.0, 41345.0, 13534.0, 5583.0, 2570.0, 1326.0, 740.0, 405.0, 234.0, 133.0, 93.0, 51.0, 28.0, 18.0, 16.0, 17.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.703125, -19.1485595703125, -18.593994140625, -18.0394287109375, -17.48486328125, -16.9302978515625, -16.375732421875, -15.8211669921875, -15.2666015625, -14.7120361328125, -14.157470703125, -13.6029052734375, -13.04833984375, -12.4937744140625, -11.939208984375, -11.3846435546875, -10.830078125, -10.2755126953125, -9.720947265625, -9.1663818359375, -8.61181640625, -8.0572509765625, -7.502685546875, -6.9481201171875, -6.3935546875, -5.8389892578125, -5.284423828125, -4.7298583984375, -4.17529296875, -3.6207275390625, -3.066162109375, -2.5115966796875, -1.95703125, -1.4024658203125, -0.847900390625, -0.2933349609375, 0.26123046875, 0.8157958984375, 1.370361328125, 1.9249267578125, 2.4794921875, 3.0340576171875, 3.588623046875, 4.1431884765625, 4.69775390625, 5.2523193359375, 5.806884765625, 6.3614501953125, 6.916015625, 7.4705810546875, 8.025146484375, 8.5797119140625, 9.13427734375, 9.6888427734375, 10.243408203125, 10.7979736328125, 11.3525390625, 11.9071044921875, 12.461669921875, 13.0162353515625, 13.57080078125, 14.1253662109375, 14.679931640625, 15.2344970703125, 15.7890625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 8.0, 6.0, 9.0, 13.0, 26.0, 30.0, 24.0, 34.0, 43.0, 49.0, 55.0, 52.0, 50.0, 74.0, 65.0, 51.0, 84.0, 50.0, 64.0, 43.0, 43.0, 27.0, 30.0, 21.0, 11.0, 8.0, 14.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2734375, -4.167236328125, -4.06103515625, -3.954833984375, -3.8486328125, -3.742431640625, -3.63623046875, -3.530029296875, -3.423828125, -3.317626953125, -3.21142578125, -3.105224609375, -2.9990234375, -2.892822265625, -2.78662109375, -2.680419921875, -2.57421875, -2.468017578125, -2.36181640625, -2.255615234375, -2.1494140625, -2.043212890625, -1.93701171875, -1.830810546875, -1.724609375, -1.618408203125, -1.51220703125, -1.406005859375, -1.2998046875, -1.193603515625, -1.08740234375, -0.981201171875, -0.875, -0.768798828125, -0.66259765625, -0.556396484375, -0.4501953125, -0.343994140625, -0.23779296875, -0.131591796875, -0.025390625, 0.080810546875, 0.18701171875, 0.293212890625, 0.3994140625, 0.505615234375, 0.61181640625, 0.718017578125, 0.82421875, 0.930419921875, 1.03662109375, 1.142822265625, 1.2490234375, 1.355224609375, 1.46142578125, 1.567626953125, 1.673828125, 1.780029296875, 1.88623046875, 1.992431640625, 2.0986328125, 2.204833984375, 2.31103515625, 2.417236328125, 2.5234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 9.0, 11.0, 19.0, 29.0, 34.0, 78.0, 98.0, 135.0, 253.0, 392.0, 598.0, 988.0, 1583.0, 3003.0, 6243.0, 14394.0, 41780.0, 159554.0, 2262233.0, 1493357.0, 144788.0, 38628.0, 13690.0, 5767.0, 2797.0, 1490.0, 863.0, 503.0, 322.0, 206.0, 144.0, 112.0, 62.0, 44.0, 25.0, 18.0, 9.0, 8.0, 7.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.59375, -17.090576171875, -16.58740234375, -16.084228515625, -15.5810546875, -15.077880859375, -14.57470703125, -14.071533203125, -13.568359375, -13.065185546875, -12.56201171875, -12.058837890625, -11.5556640625, -11.052490234375, -10.54931640625, -10.046142578125, -9.54296875, -9.039794921875, -8.53662109375, -8.033447265625, -7.5302734375, -7.027099609375, -6.52392578125, -6.020751953125, -5.517578125, -5.014404296875, -4.51123046875, -4.008056640625, -3.5048828125, -3.001708984375, -2.49853515625, -1.995361328125, -1.4921875, -0.989013671875, -0.48583984375, 0.017333984375, 0.5205078125, 1.023681640625, 1.52685546875, 2.030029296875, 2.533203125, 3.036376953125, 3.53955078125, 4.042724609375, 4.5458984375, 5.049072265625, 5.55224609375, 6.055419921875, 6.55859375, 7.061767578125, 7.56494140625, 8.068115234375, 8.5712890625, 9.074462890625, 9.57763671875, 10.080810546875, 10.583984375, 11.087158203125, 11.59033203125, 12.093505859375, 12.5966796875, 13.099853515625, 13.60302734375, 14.106201171875, 14.609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 7.0, 9.0, 7.0, 6.0, 9.0, 20.0, 29.0, 40.0, 51.0, 89.0, 148.0, 317.0, 1041.0, 1434.0, 383.0, 181.0, 98.0, 73.0, 34.0, 34.0, 13.0, 16.0, 10.0, 9.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.80078125, -5.61419677734375, -5.4276123046875, -5.24102783203125, -5.054443359375, -4.86785888671875, -4.6812744140625, -4.49468994140625, -4.30810546875, -4.12152099609375, -3.9349365234375, -3.74835205078125, -3.561767578125, -3.37518310546875, -3.1885986328125, -3.00201416015625, -2.8154296875, -2.62884521484375, -2.4422607421875, -2.25567626953125, -2.069091796875, -1.88250732421875, -1.6959228515625, -1.50933837890625, -1.32275390625, -1.13616943359375, -0.9495849609375, -0.76300048828125, -0.576416015625, -0.38983154296875, -0.2032470703125, -0.01666259765625, 0.169921875, 0.35650634765625, 0.5430908203125, 0.72967529296875, 0.916259765625, 1.10284423828125, 1.2894287109375, 1.47601318359375, 1.66259765625, 1.84918212890625, 2.0357666015625, 2.22235107421875, 2.408935546875, 2.59552001953125, 2.7821044921875, 2.96868896484375, 3.1552734375, 3.34185791015625, 3.5284423828125, 3.71502685546875, 3.901611328125, 4.08819580078125, 4.2747802734375, 4.46136474609375, 4.64794921875, 4.83453369140625, 5.0211181640625, 5.20770263671875, 5.394287109375, 5.58087158203125, 5.7674560546875, 5.95404052734375, 6.140625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 5.0, 10.0, 30.0, 84.0, 214.0, 291.0, 233.0, 100.0, 29.0, 9.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-135.7429656982422, -133.20912170410156, -130.67526245117188, -128.14141845703125, -125.6075668334961, -123.07371520996094, -120.53986358642578, -118.00601196289062, -115.47216796875, -112.93831634521484, -110.40446472167969, -107.87062072753906, -105.3367691040039, -102.80291748046875, -100.2690658569336, -97.73521423339844, -95.20137023925781, -92.66751861572266, -90.1336669921875, -87.59982299804688, -85.06597137451172, -82.53211975097656, -79.9982681274414, -77.46441650390625, -74.9305648803711, -72.39671325683594, -69.86286163330078, -67.32901763916016, -64.795166015625, -62.261314392089844, -59.72746276855469, -57.1936149597168, -54.65976333618164, -52.125911712646484, -49.592063903808594, -47.05821228027344, -44.52436447143555, -41.99051284790039, -39.4566650390625, -36.922813415527344, -34.38896179199219, -31.855112075805664, -29.32126235961914, -26.787410736083984, -24.253562927246094, -21.719711303710938, -19.185861587524414, -16.65201187133789, -14.1181640625, -11.584314346313477, -9.050464630126953, -6.516613960266113, -3.98276424407959, -1.4489145278930664, 1.0849361419677734, 3.618785858154297, 6.15263557434082, 8.686485290527344, 11.220335006713867, 13.754185676574707, 16.288036346435547, 18.821884155273438, 21.355735778808594, 23.889585494995117, 26.42343521118164]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 9.0, 6.0, 11.0, 14.0, 18.0, 27.0, 32.0, 46.0, 31.0, 41.0, 52.0, 65.0, 78.0, 55.0, 66.0, 54.0, 68.0, 59.0, 39.0, 56.0, 32.0, 35.0, 22.0, 22.0, 20.0, 13.0, 11.0, 7.0, 3.0, 5.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0], "bins": [-31.299800872802734, -30.542741775512695, -29.785682678222656, -29.02862548828125, -28.27156639099121, -27.514507293701172, -26.757448196411133, -26.000389099121094, -25.243331909179688, -24.48627281188965, -23.72921371459961, -22.972156524658203, -22.215097427368164, -21.458038330078125, -20.700979232788086, -19.943920135498047, -19.186861038208008, -18.42980194091797, -17.67274284362793, -16.91568374633789, -16.158626556396484, -15.401567459106445, -14.644508361816406, -13.887449264526367, -13.130391120910645, -12.373332023620605, -11.616273880004883, -10.859214782714844, -10.102155685424805, -9.345097541809082, -8.588038444519043, -7.830979824066162, -7.073921203613281, -6.3168625831604, -5.5598039627075195, -4.8027448654174805, -4.0456862449646, -3.2886276245117188, -2.5315685272216797, -1.7745099067687988, -1.017451286315918, -0.26039254665374756, 0.49666619300842285, 1.2537250518798828, 2.0107836723327637, 2.7678422927856445, 3.5249013900756836, 4.2819600105285645, 5.039018630981445, 5.796077251434326, 6.553135871887207, 7.310194969177246, 8.067253112792969, 8.824312210083008, 9.581371307373047, 10.338430404663086, 11.095488548278809, 11.852547645568848, 12.60960578918457, 13.36666488647461, 14.123723983764648, 14.880782127380371, 15.63784122467041, 16.394899368286133, 17.151958465576172]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 7.0, 12.0, 11.0, 9.0, 16.0, 19.0, 35.0, 48.0, 87.0, 118.0, 219.0, 343.0, 558.0, 1144.0, 1993.0, 3828.0, 7886.0, 16771.0, 36886.0, 81388.0, 172695.0, 295911.0, 224315.0, 109908.0, 50128.0, 22923.0, 10503.0, 5041.0, 2573.0, 1360.0, 706.0, 408.0, 257.0, 150.0, 83.0, 61.0, 37.0, 36.0, 22.0, 20.0, 8.0, 10.0, 5.0, 2.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.375, -10.0369873046875, -9.698974609375, -9.3609619140625, -9.02294921875, -8.6849365234375, -8.346923828125, -8.0089111328125, -7.6708984375, -7.3328857421875, -6.994873046875, -6.6568603515625, -6.31884765625, -5.9808349609375, -5.642822265625, -5.3048095703125, -4.966796875, -4.6287841796875, -4.290771484375, -3.9527587890625, -3.61474609375, -3.2767333984375, -2.938720703125, -2.6007080078125, -2.2626953125, -1.9246826171875, -1.586669921875, -1.2486572265625, -0.91064453125, -0.5726318359375, -0.234619140625, 0.1033935546875, 0.44140625, 0.7794189453125, 1.117431640625, 1.4554443359375, 1.79345703125, 2.1314697265625, 2.469482421875, 2.8074951171875, 3.1455078125, 3.4835205078125, 3.821533203125, 4.1595458984375, 4.49755859375, 4.8355712890625, 5.173583984375, 5.5115966796875, 5.849609375, 6.1876220703125, 6.525634765625, 6.8636474609375, 7.20166015625, 7.5396728515625, 7.877685546875, 8.2156982421875, 8.5537109375, 8.8917236328125, 9.229736328125, 9.5677490234375, 9.90576171875, 10.2437744140625, 10.581787109375, 10.9197998046875, 11.2578125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 16.0, 20.0, 20.0, 25.0, 19.0, 37.0, 43.0, 49.0, 43.0, 36.0, 48.0, 69.0, 62.0, 65.0, 74.0, 45.0, 41.0, 53.0, 48.0, 43.0, 23.0, 22.0, 26.0, 20.0, 13.0, 7.0, 6.0, 11.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0], "bins": [-4.2265625, -4.1278076171875, -4.029052734375, -3.9302978515625, -3.83154296875, -3.7327880859375, -3.634033203125, -3.5352783203125, -3.4365234375, -3.3377685546875, -3.239013671875, -3.1402587890625, -3.04150390625, -2.9427490234375, -2.843994140625, -2.7452392578125, -2.646484375, -2.5477294921875, -2.448974609375, -2.3502197265625, -2.25146484375, -2.1527099609375, -2.053955078125, -1.9552001953125, -1.8564453125, -1.7576904296875, -1.658935546875, -1.5601806640625, -1.46142578125, -1.3626708984375, -1.263916015625, -1.1651611328125, -1.06640625, -0.9676513671875, -0.868896484375, -0.7701416015625, -0.67138671875, -0.5726318359375, -0.473876953125, -0.3751220703125, -0.2763671875, -0.1776123046875, -0.078857421875, 0.0198974609375, 0.11865234375, 0.2174072265625, 0.316162109375, 0.4149169921875, 0.513671875, 0.6124267578125, 0.711181640625, 0.8099365234375, 0.90869140625, 1.0074462890625, 1.106201171875, 1.2049560546875, 1.3037109375, 1.4024658203125, 1.501220703125, 1.5999755859375, 1.69873046875, 1.7974853515625, 1.896240234375, 1.9949951171875, 2.09375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 11.0, 21.0, 21.0, 17.0, 28.0, 49.0, 62.0, 70.0, 128.0, 172.0, 299.0, 438.0, 727.0, 1237.0, 2328.0, 4876.0, 11311.0, 28138.0, 78415.0, 215134.0, 389614.0, 198074.0, 71259.0, 25912.0, 10216.0, 4672.0, 2188.0, 1167.0, 689.0, 409.0, 262.0, 186.0, 115.0, 87.0, 59.0, 47.0, 30.0, 20.0, 13.0, 15.0, 8.0, 6.0, 3.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0], "bins": [-14.0859375, -13.6771240234375, -13.268310546875, -12.8594970703125, -12.45068359375, -12.0418701171875, -11.633056640625, -11.2242431640625, -10.8154296875, -10.4066162109375, -9.997802734375, -9.5889892578125, -9.18017578125, -8.7713623046875, -8.362548828125, -7.9537353515625, -7.544921875, -7.1361083984375, -6.727294921875, -6.3184814453125, -5.90966796875, -5.5008544921875, -5.092041015625, -4.6832275390625, -4.2744140625, -3.8656005859375, -3.456787109375, -3.0479736328125, -2.63916015625, -2.2303466796875, -1.821533203125, -1.4127197265625, -1.00390625, -0.5950927734375, -0.186279296875, 0.2225341796875, 0.63134765625, 1.0401611328125, 1.448974609375, 1.8577880859375, 2.2666015625, 2.6754150390625, 3.084228515625, 3.4930419921875, 3.90185546875, 4.3106689453125, 4.719482421875, 5.1282958984375, 5.537109375, 5.9459228515625, 6.354736328125, 6.7635498046875, 7.17236328125, 7.5811767578125, 7.989990234375, 8.3988037109375, 8.8076171875, 9.2164306640625, 9.625244140625, 10.0340576171875, 10.44287109375, 10.8516845703125, 11.260498046875, 11.6693115234375, 12.078125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 2.0, 5.0, 8.0, 14.0, 3.0, 8.0, 8.0, 15.0, 13.0, 22.0, 19.0, 26.0, 29.0, 25.0, 42.0, 35.0, 39.0, 42.0, 34.0, 36.0, 35.0, 47.0, 40.0, 42.0, 45.0, 39.0, 43.0, 43.0, 30.0, 26.0, 28.0, 23.0, 20.0, 15.0, 9.0, 12.0, 18.0, 13.0, 8.0, 8.0, 10.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.9296875, -9.596435546875, -9.26318359375, -8.929931640625, -8.5966796875, -8.263427734375, -7.93017578125, -7.596923828125, -7.263671875, -6.930419921875, -6.59716796875, -6.263916015625, -5.9306640625, -5.597412109375, -5.26416015625, -4.930908203125, -4.59765625, -4.264404296875, -3.93115234375, -3.597900390625, -3.2646484375, -2.931396484375, -2.59814453125, -2.264892578125, -1.931640625, -1.598388671875, -1.26513671875, -0.931884765625, -0.5986328125, -0.265380859375, 0.06787109375, 0.401123046875, 0.734375, 1.067626953125, 1.40087890625, 1.734130859375, 2.0673828125, 2.400634765625, 2.73388671875, 3.067138671875, 3.400390625, 3.733642578125, 4.06689453125, 4.400146484375, 4.7333984375, 5.066650390625, 5.39990234375, 5.733154296875, 6.06640625, 6.399658203125, 6.73291015625, 7.066162109375, 7.3994140625, 7.732666015625, 8.06591796875, 8.399169921875, 8.732421875, 9.065673828125, 9.39892578125, 9.732177734375, 10.0654296875, 10.398681640625, 10.73193359375, 11.065185546875, 11.3984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 7.0, 9.0, 15.0, 34.0, 71.0, 158.0, 418.0, 1245.0, 5408.0, 35350.0, 352617.0, 578589.0, 63470.0, 8464.0, 1780.0, 557.0, 193.0, 85.0, 33.0, 17.0, 16.0, 6.0, 3.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.234375, -14.8450927734375, -14.455810546875, -14.0665283203125, -13.67724609375, -13.2879638671875, -12.898681640625, -12.5093994140625, -12.1201171875, -11.7308349609375, -11.341552734375, -10.9522705078125, -10.56298828125, -10.1737060546875, -9.784423828125, -9.3951416015625, -9.005859375, -8.6165771484375, -8.227294921875, -7.8380126953125, -7.44873046875, -7.0594482421875, -6.670166015625, -6.2808837890625, -5.8916015625, -5.5023193359375, -5.113037109375, -4.7237548828125, -4.33447265625, -3.9451904296875, -3.555908203125, -3.1666259765625, -2.77734375, -2.3880615234375, -1.998779296875, -1.6094970703125, -1.22021484375, -0.8309326171875, -0.441650390625, -0.0523681640625, 0.3369140625, 0.7261962890625, 1.115478515625, 1.5047607421875, 1.89404296875, 2.2833251953125, 2.672607421875, 3.0618896484375, 3.451171875, 3.8404541015625, 4.229736328125, 4.6190185546875, 5.00830078125, 5.3975830078125, 5.786865234375, 6.1761474609375, 6.5654296875, 6.9547119140625, 7.343994140625, 7.7332763671875, 8.12255859375, 8.5118408203125, 8.901123046875, 9.2904052734375, 9.6796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 12.0, 5.0, 11.0, 10.0, 13.0, 10.0, 23.0, 26.0, 30.0, 37.0, 55.0, 81.0, 112.0, 139.0, 114.0, 80.0, 48.0, 39.0, 38.0, 27.0, 20.0, 12.0, 15.0, 8.0, 8.0, 3.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017251968383789062, -0.0016801655292510986, -0.001635134220123291, -0.0015901029109954834, -0.0015450716018676758, -0.0015000402927398682, -0.0014550089836120605, -0.001409977674484253, -0.0013649463653564453, -0.0013199150562286377, -0.00127488374710083, -0.0012298524379730225, -0.0011848211288452148, -0.0011397898197174072, -0.0010947585105895996, -0.001049727201461792, -0.0010046958923339844, -0.0009596645832061768, -0.0009146332740783691, -0.0008696019649505615, -0.0008245706558227539, -0.0007795393466949463, -0.0007345080375671387, -0.0006894767284393311, -0.0006444454193115234, -0.0005994141101837158, -0.0005543828010559082, -0.0005093514919281006, -0.00046432018280029297, -0.00041928887367248535, -0.00037425756454467773, -0.0003292262554168701, -0.0002841949462890625, -0.00023916363716125488, -0.00019413232803344727, -0.00014910101890563965, -0.00010406970977783203, -5.9038400650024414e-05, -1.4007091522216797e-05, 3.102421760559082e-05, 7.605552673339844e-05, 0.00012108683586120605, 0.00016611814498901367, 0.0002111494541168213, 0.0002561807632446289, 0.0003012120723724365, 0.00034624338150024414, 0.00039127469062805176, 0.0004363059997558594, 0.000481337308883667, 0.0005263686180114746, 0.0005713999271392822, 0.0006164312362670898, 0.0006614625453948975, 0.0007064938545227051, 0.0007515251636505127, 0.0007965564727783203, 0.0008415877819061279, 0.0008866190910339355, 0.0009316504001617432, 0.0009766817092895508, 0.0010217130184173584, 0.001066744327545166, 0.0011117756366729736, 0.0011568069458007812]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 13.0, 21.0, 30.0, 58.0, 102.0, 171.0, 311.0, 640.0, 1673.0, 5375.0, 24355.0, 176053.0, 692659.0, 122014.0, 18249.0, 4204.0, 1332.0, 587.0, 301.0, 158.0, 83.0, 48.0, 38.0, 15.0, 15.0, 7.0, 9.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.7890625, -12.39453125, -12.0, -11.60546875, -11.2109375, -10.81640625, -10.421875, -10.02734375, -9.6328125, -9.23828125, -8.84375, -8.44921875, -8.0546875, -7.66015625, -7.265625, -6.87109375, -6.4765625, -6.08203125, -5.6875, -5.29296875, -4.8984375, -4.50390625, -4.109375, -3.71484375, -3.3203125, -2.92578125, -2.53125, -2.13671875, -1.7421875, -1.34765625, -0.953125, -0.55859375, -0.1640625, 0.23046875, 0.625, 1.01953125, 1.4140625, 1.80859375, 2.203125, 2.59765625, 2.9921875, 3.38671875, 3.78125, 4.17578125, 4.5703125, 4.96484375, 5.359375, 5.75390625, 6.1484375, 6.54296875, 6.9375, 7.33203125, 7.7265625, 8.12109375, 8.515625, 8.91015625, 9.3046875, 9.69921875, 10.09375, 10.48828125, 10.8828125, 11.27734375, 11.671875, 12.06640625, 12.4609375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 8.0, 7.0, 13.0, 22.0, 14.0, 32.0, 45.0, 74.0, 87.0, 120.0, 137.0, 125.0, 85.0, 53.0, 50.0, 46.0, 18.0, 19.0, 9.0, 13.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6484375, -6.39794921875, -6.1474609375, -5.89697265625, -5.646484375, -5.39599609375, -5.1455078125, -4.89501953125, -4.64453125, -4.39404296875, -4.1435546875, -3.89306640625, -3.642578125, -3.39208984375, -3.1416015625, -2.89111328125, -2.640625, -2.39013671875, -2.1396484375, -1.88916015625, -1.638671875, -1.38818359375, -1.1376953125, -0.88720703125, -0.63671875, -0.38623046875, -0.1357421875, 0.11474609375, 0.365234375, 0.61572265625, 0.8662109375, 1.11669921875, 1.3671875, 1.61767578125, 1.8681640625, 2.11865234375, 2.369140625, 2.61962890625, 2.8701171875, 3.12060546875, 3.37109375, 3.62158203125, 3.8720703125, 4.12255859375, 4.373046875, 4.62353515625, 4.8740234375, 5.12451171875, 5.375, 5.62548828125, 5.8759765625, 6.12646484375, 6.376953125, 6.62744140625, 6.8779296875, 7.12841796875, 7.37890625, 7.62939453125, 7.8798828125, 8.13037109375, 8.380859375, 8.63134765625, 8.8818359375, 9.13232421875, 9.3828125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 18.0, 23.0, 45.0, 83.0, 143.0, 172.0, 170.0, 148.0, 90.0, 42.0, 32.0, 13.0, 8.0, 5.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.83692932128906, -137.397705078125, -132.95849609375, -128.51927185058594, -124.08004760742188, -119.64082336425781, -115.20160675048828, -110.76239013671875, -106.32316589355469, -101.88394165039062, -97.4447250366211, -93.00550842285156, -88.5662841796875, -84.12705993652344, -79.6878433227539, -75.24862670898438, -70.80940246582031, -66.37017822265625, -61.93096160888672, -57.49174118041992, -53.052520751953125, -48.61330032348633, -44.17407989501953, -39.734859466552734, -35.29563903808594, -30.85641860961914, -26.417198181152344, -21.977977752685547, -17.53875732421875, -13.099536895751953, -8.660316467285156, -4.221096038818359, 0.2181396484375, 4.657360076904297, 9.096580505371094, 13.53580093383789, 17.975021362304688, 22.414241790771484, 26.85346221923828, 31.292682647705078, 35.731903076171875, 40.17112350463867, 44.61034393310547, 49.049564361572266, 53.48878479003906, 57.92800521850586, 62.367225646972656, 66.80644226074219, 71.24566650390625, 75.68489074707031, 80.12410736083984, 84.56332397460938, 89.00254821777344, 93.4417724609375, 97.88098907470703, 102.32020568847656, 106.75942993164062, 111.19865417480469, 115.63787078857422, 120.07708740234375, 124.51631164550781, 128.95553588867188, 133.39474487304688, 137.83396911621094, 142.273193359375]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 6.0, 9.0, 8.0, 5.0, 9.0, 12.0, 7.0, 17.0, 24.0, 31.0, 19.0, 31.0, 35.0, 23.0, 39.0, 23.0, 40.0, 42.0, 37.0, 37.0, 37.0, 43.0, 43.0, 55.0, 53.0, 26.0, 41.0, 33.0, 29.0, 24.0, 36.0, 23.0, 14.0, 9.0, 23.0, 10.0, 9.0, 6.0, 2.0, 2.0, 7.0, 9.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-55.4637451171875, -53.53178405761719, -51.599822998046875, -49.66786193847656, -47.73590087890625, -45.80393981933594, -43.871978759765625, -41.94002151489258, -40.008060455322266, -38.07609939575195, -36.14413833618164, -34.21217727661133, -32.280216217041016, -30.348257064819336, -28.416296005249023, -26.484336853027344, -24.5523738861084, -22.620412826538086, -20.688451766967773, -18.756492614746094, -16.82453155517578, -14.892570495605469, -12.960609436035156, -11.02864933013916, -9.096688270568848, -7.164727687835693, -5.232767105102539, -3.3008060455322266, -1.3688454627990723, 0.563115119934082, 2.4950761795043945, 4.427036285400391, 6.358997344970703, 8.290958404541016, 10.222918510437012, 12.154879570007324, 14.08683967590332, 16.018800735473633, 17.950761795043945, 19.882720947265625, 21.814682006835938, 23.74664306640625, 25.678604125976562, 27.610565185546875, 29.542524337768555, 31.474485397338867, 33.40644836425781, 35.33840560913086, 37.27037048339844, 39.20233154296875, 41.13429260253906, 43.066253662109375, 44.99821472167969, 46.93017578125, 48.86213684082031, 50.79409408569336, 52.72605514526367, 54.658016204833984, 56.5899772644043, 58.52193832397461, 60.45389938354492, 62.38585662841797, 64.31781768798828, 66.2497787475586, 68.1817398071289]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 6.0, 4.0, 12.0, 17.0, 25.0, 32.0, 49.0, 81.0, 110.0, 154.0, 282.0, 457.0, 761.0, 1406.0, 2593.0, 5568.0, 12903.0, 35093.0, 125368.0, 1723787.0, 2093684.0, 130645.0, 36169.0, 13395.0, 5666.0, 2835.0, 1333.0, 727.0, 419.0, 254.0, 162.0, 99.0, 55.0, 37.0, 27.0, 27.0, 14.0, 8.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.3984375, -14.9708251953125, -14.543212890625, -14.1156005859375, -13.68798828125, -13.2603759765625, -12.832763671875, -12.4051513671875, -11.9775390625, -11.5499267578125, -11.122314453125, -10.6947021484375, -10.26708984375, -9.8394775390625, -9.411865234375, -8.9842529296875, -8.556640625, -8.1290283203125, -7.701416015625, -7.2738037109375, -6.84619140625, -6.4185791015625, -5.990966796875, -5.5633544921875, -5.1357421875, -4.7081298828125, -4.280517578125, -3.8529052734375, -3.42529296875, -2.9976806640625, -2.570068359375, -2.1424560546875, -1.71484375, -1.2872314453125, -0.859619140625, -0.4320068359375, -0.00439453125, 0.4232177734375, 0.850830078125, 1.2784423828125, 1.7060546875, 2.1336669921875, 2.561279296875, 2.9888916015625, 3.41650390625, 3.8441162109375, 4.271728515625, 4.6993408203125, 5.126953125, 5.5545654296875, 5.982177734375, 6.4097900390625, 6.83740234375, 7.2650146484375, 7.692626953125, 8.1202392578125, 8.5478515625, 8.9754638671875, 9.403076171875, 9.8306884765625, 10.25830078125, 10.6859130859375, 11.113525390625, 11.5411376953125, 11.96875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 5.0, 10.0, 14.0, 23.0, 30.0, 25.0, 36.0, 38.0, 53.0, 53.0, 44.0, 43.0, 69.0, 60.0, 69.0, 66.0, 43.0, 68.0, 50.0, 43.0, 34.0, 36.0, 22.0, 22.0, 7.0, 7.0, 7.0, 6.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-4.078125, -3.977630615234375, -3.87713623046875, -3.776641845703125, -3.6761474609375, -3.575653076171875, -3.47515869140625, -3.374664306640625, -3.274169921875, -3.173675537109375, -3.07318115234375, -2.972686767578125, -2.8721923828125, -2.771697998046875, -2.67120361328125, -2.570709228515625, -2.47021484375, -2.369720458984375, -2.26922607421875, -2.168731689453125, -2.0682373046875, -1.967742919921875, -1.86724853515625, -1.766754150390625, -1.666259765625, -1.565765380859375, -1.46527099609375, -1.364776611328125, -1.2642822265625, -1.163787841796875, -1.06329345703125, -0.962799072265625, -0.8623046875, -0.761810302734375, -0.66131591796875, -0.560821533203125, -0.4603271484375, -0.359832763671875, -0.25933837890625, -0.158843994140625, -0.058349609375, 0.042144775390625, 0.14263916015625, 0.243133544921875, 0.3436279296875, 0.444122314453125, 0.54461669921875, 0.645111083984375, 0.74560546875, 0.846099853515625, 0.94659423828125, 1.047088623046875, 1.1475830078125, 1.248077392578125, 1.34857177734375, 1.449066162109375, 1.549560546875, 1.650054931640625, 1.75054931640625, 1.851043701171875, 1.9515380859375, 2.052032470703125, 2.15252685546875, 2.253021240234375, 2.353515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 7.0, 4.0, 7.0, 9.0, 12.0, 15.0, 16.0, 27.0, 51.0, 70.0, 100.0, 149.0, 251.0, 367.0, 586.0, 1117.0, 1921.0, 3581.0, 7316.0, 16553.0, 43002.0, 141856.0, 786028.0, 2722212.0, 335258.0, 82095.0, 28064.0, 11524.0, 5522.0, 2819.0, 1442.0, 898.0, 463.0, 343.0, 177.0, 120.0, 86.0, 63.0, 44.0, 37.0, 22.0, 17.0, 12.0, 9.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-12.6953125, -12.33544921875, -11.9755859375, -11.61572265625, -11.255859375, -10.89599609375, -10.5361328125, -10.17626953125, -9.81640625, -9.45654296875, -9.0966796875, -8.73681640625, -8.376953125, -8.01708984375, -7.6572265625, -7.29736328125, -6.9375, -6.57763671875, -6.2177734375, -5.85791015625, -5.498046875, -5.13818359375, -4.7783203125, -4.41845703125, -4.05859375, -3.69873046875, -3.3388671875, -2.97900390625, -2.619140625, -2.25927734375, -1.8994140625, -1.53955078125, -1.1796875, -0.81982421875, -0.4599609375, -0.10009765625, 0.259765625, 0.61962890625, 0.9794921875, 1.33935546875, 1.69921875, 2.05908203125, 2.4189453125, 2.77880859375, 3.138671875, 3.49853515625, 3.8583984375, 4.21826171875, 4.578125, 4.93798828125, 5.2978515625, 5.65771484375, 6.017578125, 6.37744140625, 6.7373046875, 7.09716796875, 7.45703125, 7.81689453125, 8.1767578125, 8.53662109375, 8.896484375, 9.25634765625, 9.6162109375, 9.97607421875, 10.3359375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 8.0, 8.0, 10.0, 15.0, 14.0, 24.0, 48.0, 73.0, 85.0, 143.0, 245.0, 482.0, 1189.0, 738.0, 365.0, 205.0, 131.0, 82.0, 45.0, 33.0, 22.0, 25.0, 22.0, 13.0, 4.0, 9.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9140625, -4.72991943359375, -4.5457763671875, -4.36163330078125, -4.177490234375, -3.99334716796875, -3.8092041015625, -3.62506103515625, -3.44091796875, -3.25677490234375, -3.0726318359375, -2.88848876953125, -2.704345703125, -2.52020263671875, -2.3360595703125, -2.15191650390625, -1.9677734375, -1.78363037109375, -1.5994873046875, -1.41534423828125, -1.231201171875, -1.04705810546875, -0.8629150390625, -0.67877197265625, -0.49462890625, -0.31048583984375, -0.1263427734375, 0.05780029296875, 0.241943359375, 0.42608642578125, 0.6102294921875, 0.79437255859375, 0.978515625, 1.16265869140625, 1.3468017578125, 1.53094482421875, 1.715087890625, 1.89923095703125, 2.0833740234375, 2.26751708984375, 2.45166015625, 2.63580322265625, 2.8199462890625, 3.00408935546875, 3.188232421875, 3.37237548828125, 3.5565185546875, 3.74066162109375, 3.9248046875, 4.10894775390625, 4.2930908203125, 4.47723388671875, 4.661376953125, 4.84552001953125, 5.0296630859375, 5.21380615234375, 5.39794921875, 5.58209228515625, 5.7662353515625, 5.95037841796875, 6.134521484375, 6.31866455078125, 6.5028076171875, 6.68695068359375, 6.87109375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 9.0, 14.0, 15.0, 24.0, 52.0, 84.0, 79.0, 127.0, 145.0, 105.0, 100.0, 79.0, 61.0, 46.0, 29.0, 8.0, 8.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.97651290893555, -38.51361083984375, -37.05070877075195, -35.587806701660156, -34.12490463256836, -32.66200256347656, -31.199098587036133, -29.736196517944336, -28.27329444885254, -26.810392379760742, -25.347490310668945, -23.884586334228516, -22.42168426513672, -20.958782196044922, -19.495880126953125, -18.032978057861328, -16.57007598876953, -15.107173919677734, -13.644271850585938, -12.181368827819824, -10.718466758728027, -9.25556468963623, -7.792661666870117, -6.32975959777832, -4.866857528686523, -3.4039552211761475, -1.9410529136657715, -0.4781503677368164, 0.9847517013549805, 2.4476537704467773, 3.9105567932128906, 5.3734588623046875, 6.836357116699219, 8.299259185791016, 9.762161254882812, 11.225064277648926, 12.687966346740723, 14.15086841583252, 15.613771438598633, 17.07667350769043, 18.539575576782227, 20.002477645874023, 21.46537971496582, 22.92828369140625, 24.391185760498047, 25.854087829589844, 27.31698989868164, 28.779891967773438, 30.242794036865234, 31.70569610595703, 33.16859817504883, 34.631500244140625, 36.09440231323242, 37.55730438232422, 39.02021026611328, 40.48310852050781, 41.946014404296875, 43.40891647338867, 44.87181854248047, 46.334720611572266, 47.79762268066406, 49.26052474975586, 50.723426818847656, 52.18633270263672, 53.64923095703125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 6.0, 5.0, 2.0, 5.0, 13.0, 12.0, 18.0, 11.0, 18.0, 20.0, 21.0, 28.0, 22.0, 27.0, 34.0, 34.0, 33.0, 43.0, 46.0, 35.0, 47.0, 50.0, 40.0, 40.0, 42.0, 25.0, 42.0, 31.0, 25.0, 32.0, 20.0, 28.0, 24.0, 26.0, 13.0, 14.0, 14.0, 8.0, 15.0, 5.0, 9.0, 9.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.687936782836914, -20.018146514892578, -19.348358154296875, -18.67856788635254, -18.008777618408203, -17.338987350463867, -16.66919708251953, -15.999408721923828, -15.329618453979492, -14.659828186035156, -13.990038871765137, -13.320249557495117, -12.650459289550781, -11.980669021606445, -11.310879707336426, -10.641090393066406, -9.97130012512207, -9.301509857177734, -8.631720542907715, -7.961930751800537, -7.292140960693359, -6.622351169586182, -5.952561378479004, -5.282771587371826, -4.612981796264648, -3.9431920051574707, -3.273402214050293, -2.6036124229431152, -1.9338226318359375, -1.2640328407287598, -0.594243049621582, 0.0755467414855957, 0.7453384399414062, 1.415128231048584, 2.0849180221557617, 2.7547078132629395, 3.424497604370117, 4.094287395477295, 4.764077186584473, 5.43386697769165, 6.103656768798828, 6.773446559906006, 7.443236351013184, 8.113025665283203, 8.782815933227539, 9.452606201171875, 10.122395515441895, 10.792184829711914, 11.46197509765625, 12.131765365600586, 12.801554679870605, 13.471343994140625, 14.141134262084961, 14.810924530029297, 15.480713844299316, 16.150503158569336, 16.820293426513672, 17.490083694458008, 18.159873962402344, 18.829662322998047, 19.499452590942383, 20.16924285888672, 20.839031219482422, 21.508821487426758, 22.178611755371094]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 8.0, 9.0, 5.0, 13.0, 26.0, 38.0, 51.0, 97.0, 154.0, 242.0, 492.0, 880.0, 2094.0, 5065.0, 13942.0, 41274.0, 121938.0, 352358.0, 334496.0, 114642.0, 38907.0, 13304.0, 4694.0, 1891.0, 876.0, 433.0, 234.0, 139.0, 100.0, 59.0, 32.0, 22.0, 16.0, 9.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.703125, -15.17919921875, -14.6552734375, -14.13134765625, -13.607421875, -13.08349609375, -12.5595703125, -12.03564453125, -11.51171875, -10.98779296875, -10.4638671875, -9.93994140625, -9.416015625, -8.89208984375, -8.3681640625, -7.84423828125, -7.3203125, -6.79638671875, -6.2724609375, -5.74853515625, -5.224609375, -4.70068359375, -4.1767578125, -3.65283203125, -3.12890625, -2.60498046875, -2.0810546875, -1.55712890625, -1.033203125, -0.50927734375, 0.0146484375, 0.53857421875, 1.0625, 1.58642578125, 2.1103515625, 2.63427734375, 3.158203125, 3.68212890625, 4.2060546875, 4.72998046875, 5.25390625, 5.77783203125, 6.3017578125, 6.82568359375, 7.349609375, 7.87353515625, 8.3974609375, 8.92138671875, 9.4453125, 9.96923828125, 10.4931640625, 11.01708984375, 11.541015625, 12.06494140625, 12.5888671875, 13.11279296875, 13.63671875, 14.16064453125, 14.6845703125, 15.20849609375, 15.732421875, 16.25634765625, 16.7802734375, 17.30419921875, 17.828125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 6.0, 11.0, 18.0, 26.0, 25.0, 17.0, 33.0, 52.0, 58.0, 50.0, 57.0, 68.0, 56.0, 80.0, 63.0, 59.0, 62.0, 47.0, 50.0, 37.0, 29.0, 29.0, 19.0, 15.0, 10.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-4.359375, -4.253326416015625, -4.14727783203125, -4.041229248046875, -3.9351806640625, -3.829132080078125, -3.72308349609375, -3.617034912109375, -3.510986328125, -3.404937744140625, -3.29888916015625, -3.192840576171875, -3.0867919921875, -2.980743408203125, -2.87469482421875, -2.768646240234375, -2.66259765625, -2.556549072265625, -2.45050048828125, -2.344451904296875, -2.2384033203125, -2.132354736328125, -2.02630615234375, -1.920257568359375, -1.814208984375, -1.708160400390625, -1.60211181640625, -1.496063232421875, -1.3900146484375, -1.283966064453125, -1.17791748046875, -1.071868896484375, -0.9658203125, -0.859771728515625, -0.75372314453125, -0.647674560546875, -0.5416259765625, -0.435577392578125, -0.32952880859375, -0.223480224609375, -0.117431640625, -0.011383056640625, 0.09466552734375, 0.200714111328125, 0.3067626953125, 0.412811279296875, 0.51885986328125, 0.624908447265625, 0.73095703125, 0.837005615234375, 0.94305419921875, 1.049102783203125, 1.1551513671875, 1.261199951171875, 1.36724853515625, 1.473297119140625, 1.579345703125, 1.685394287109375, 1.79144287109375, 1.897491455078125, 2.0035400390625, 2.109588623046875, 2.21563720703125, 2.321685791015625, 2.427734375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 10.0, 16.0, 22.0, 37.0, 75.0, 99.0, 147.0, 240.0, 458.0, 980.0, 2232.0, 5597.0, 14792.0, 44471.0, 141750.0, 418010.0, 285664.0, 88680.0, 28558.0, 9949.0, 3676.0, 1497.0, 727.0, 350.0, 195.0, 118.0, 64.0, 36.0, 19.0, 23.0, 13.0, 12.0, 10.0, 7.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.171875, -13.6962890625, -13.220703125, -12.7451171875, -12.26953125, -11.7939453125, -11.318359375, -10.8427734375, -10.3671875, -9.8916015625, -9.416015625, -8.9404296875, -8.46484375, -7.9892578125, -7.513671875, -7.0380859375, -6.5625, -6.0869140625, -5.611328125, -5.1357421875, -4.66015625, -4.1845703125, -3.708984375, -3.2333984375, -2.7578125, -2.2822265625, -1.806640625, -1.3310546875, -0.85546875, -0.3798828125, 0.095703125, 0.5712890625, 1.046875, 1.5224609375, 1.998046875, 2.4736328125, 2.94921875, 3.4248046875, 3.900390625, 4.3759765625, 4.8515625, 5.3271484375, 5.802734375, 6.2783203125, 6.75390625, 7.2294921875, 7.705078125, 8.1806640625, 8.65625, 9.1318359375, 9.607421875, 10.0830078125, 10.55859375, 11.0341796875, 11.509765625, 11.9853515625, 12.4609375, 12.9365234375, 13.412109375, 13.8876953125, 14.36328125, 14.8388671875, 15.314453125, 15.7900390625, 16.265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 9.0, 10.0, 15.0, 16.0, 16.0, 20.0, 12.0, 16.0, 25.0, 24.0, 29.0, 26.0, 36.0, 31.0, 28.0, 43.0, 51.0, 34.0, 51.0, 31.0, 42.0, 43.0, 38.0, 31.0, 37.0, 38.0, 33.0, 28.0, 29.0, 22.0, 22.0, 9.0, 11.0, 13.0, 14.0, 11.0, 12.0, 2.0, 8.0, 7.0, 1.0, 5.0, 6.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.046875, -10.710205078125, -10.37353515625, -10.036865234375, -9.7001953125, -9.363525390625, -9.02685546875, -8.690185546875, -8.353515625, -8.016845703125, -7.68017578125, -7.343505859375, -7.0068359375, -6.670166015625, -6.33349609375, -5.996826171875, -5.66015625, -5.323486328125, -4.98681640625, -4.650146484375, -4.3134765625, -3.976806640625, -3.64013671875, -3.303466796875, -2.966796875, -2.630126953125, -2.29345703125, -1.956787109375, -1.6201171875, -1.283447265625, -0.94677734375, -0.610107421875, -0.2734375, 0.063232421875, 0.39990234375, 0.736572265625, 1.0732421875, 1.409912109375, 1.74658203125, 2.083251953125, 2.419921875, 2.756591796875, 3.09326171875, 3.429931640625, 3.7666015625, 4.103271484375, 4.43994140625, 4.776611328125, 5.11328125, 5.449951171875, 5.78662109375, 6.123291015625, 6.4599609375, 6.796630859375, 7.13330078125, 7.469970703125, 7.806640625, 8.143310546875, 8.47998046875, 8.816650390625, 9.1533203125, 9.489990234375, 9.82666015625, 10.163330078125, 10.5]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 5.0, 7.0, 8.0, 15.0, 25.0, 37.0, 74.0, 123.0, 284.0, 855.0, 3396.0, 20196.0, 212573.0, 723437.0, 75395.0, 9305.0, 1799.0, 539.0, 205.0, 90.0, 56.0, 43.0, 28.0, 8.0, 12.0, 8.0, 2.0, 5.0, 7.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7421875, -12.2576904296875, -11.773193359375, -11.2886962890625, -10.80419921875, -10.3197021484375, -9.835205078125, -9.3507080078125, -8.8662109375, -8.3817138671875, -7.897216796875, -7.4127197265625, -6.92822265625, -6.4437255859375, -5.959228515625, -5.4747314453125, -4.990234375, -4.5057373046875, -4.021240234375, -3.5367431640625, -3.05224609375, -2.5677490234375, -2.083251953125, -1.5987548828125, -1.1142578125, -0.6297607421875, -0.145263671875, 0.3392333984375, 0.82373046875, 1.3082275390625, 1.792724609375, 2.2772216796875, 2.76171875, 3.2462158203125, 3.730712890625, 4.2152099609375, 4.69970703125, 5.1842041015625, 5.668701171875, 6.1531982421875, 6.6376953125, 7.1221923828125, 7.606689453125, 8.0911865234375, 8.57568359375, 9.0601806640625, 9.544677734375, 10.0291748046875, 10.513671875, 10.9981689453125, 11.482666015625, 11.9671630859375, 12.45166015625, 12.9361572265625, 13.420654296875, 13.9051513671875, 14.3896484375, 14.8741455078125, 15.358642578125, 15.8431396484375, 16.32763671875, 16.8121337890625, 17.296630859375, 17.7811279296875, 18.265625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 5.0, 9.0, 1.0, 2.0, 10.0, 10.0, 15.0, 18.0, 22.0, 19.0, 28.0, 27.0, 46.0, 66.0, 105.0, 143.0, 124.0, 99.0, 58.0, 34.0, 31.0, 28.0, 15.0, 15.0, 12.0, 8.0, 14.0, 5.0, 7.0, 5.0, 5.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0012731552124023438, -0.0012291669845581055, -0.0011851787567138672, -0.001141190528869629, -0.0010972023010253906, -0.0010532140731811523, -0.001009225845336914, -0.0009652376174926758, -0.0009212493896484375, -0.0008772611618041992, -0.0008332729339599609, -0.0007892847061157227, -0.0007452964782714844, -0.0007013082504272461, -0.0006573200225830078, -0.0006133317947387695, -0.0005693435668945312, -0.000525355339050293, -0.0004813671112060547, -0.0004373788833618164, -0.0003933906555175781, -0.00034940242767333984, -0.00030541419982910156, -0.0002614259719848633, -0.000217437744140625, -0.00017344951629638672, -0.00012946128845214844, -8.547306060791016e-05, -4.1484832763671875e-05, 2.5033950805664062e-06, 4.649162292480469e-05, 9.047985076904297e-05, 0.00013446807861328125, 0.00017845630645751953, 0.0002224445343017578, 0.0002664327621459961, 0.0003104209899902344, 0.00035440921783447266, 0.00039839744567871094, 0.0004423856735229492, 0.0004863739013671875, 0.0005303621292114258, 0.0005743503570556641, 0.0006183385848999023, 0.0006623268127441406, 0.0007063150405883789, 0.0007503032684326172, 0.0007942914962768555, 0.0008382797241210938, 0.000882267951965332, 0.0009262561798095703, 0.0009702444076538086, 0.0010142326354980469, 0.0010582208633422852, 0.0011022090911865234, 0.0011461973190307617, 0.001190185546875, 0.0012341737747192383, 0.0012781620025634766, 0.0013221502304077148, 0.0013661384582519531, 0.0014101266860961914, 0.0014541149139404297, 0.001498103141784668, 0.0015420913696289062]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 12.0, 10.0, 13.0, 25.0, 16.0, 42.0, 47.0, 56.0, 97.0, 169.0, 252.0, 433.0, 748.0, 1327.0, 3027.0, 7764.0, 24759.0, 109996.0, 556113.0, 271184.0, 49894.0, 13200.0, 4834.0, 2058.0, 1002.0, 548.0, 295.0, 190.0, 123.0, 101.0, 65.0, 45.0, 32.0, 19.0, 15.0, 11.0, 9.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.9296875, -8.6295166015625, -8.329345703125, -8.0291748046875, -7.72900390625, -7.4288330078125, -7.128662109375, -6.8284912109375, -6.5283203125, -6.2281494140625, -5.927978515625, -5.6278076171875, -5.32763671875, -5.0274658203125, -4.727294921875, -4.4271240234375, -4.126953125, -3.8267822265625, -3.526611328125, -3.2264404296875, -2.92626953125, -2.6260986328125, -2.325927734375, -2.0257568359375, -1.7255859375, -1.4254150390625, -1.125244140625, -0.8250732421875, -0.52490234375, -0.2247314453125, 0.075439453125, 0.3756103515625, 0.67578125, 0.9759521484375, 1.276123046875, 1.5762939453125, 1.87646484375, 2.1766357421875, 2.476806640625, 2.7769775390625, 3.0771484375, 3.3773193359375, 3.677490234375, 3.9776611328125, 4.27783203125, 4.5780029296875, 4.878173828125, 5.1783447265625, 5.478515625, 5.7786865234375, 6.078857421875, 6.3790283203125, 6.67919921875, 6.9793701171875, 7.279541015625, 7.5797119140625, 7.8798828125, 8.1800537109375, 8.480224609375, 8.7803955078125, 9.08056640625, 9.3807373046875, 9.680908203125, 9.9810791015625, 10.28125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 5.0, 7.0, 12.0, 10.0, 22.0, 44.0, 67.0, 84.0, 129.0, 185.0, 142.0, 92.0, 65.0, 48.0, 29.0, 17.0, 9.0, 7.0, 8.0, 1.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3359375, -8.0228271484375, -7.709716796875, -7.3966064453125, -7.08349609375, -6.7703857421875, -6.457275390625, -6.1441650390625, -5.8310546875, -5.5179443359375, -5.204833984375, -4.8917236328125, -4.57861328125, -4.2655029296875, -3.952392578125, -3.6392822265625, -3.326171875, -3.0130615234375, -2.699951171875, -2.3868408203125, -2.07373046875, -1.7606201171875, -1.447509765625, -1.1343994140625, -0.8212890625, -0.5081787109375, -0.195068359375, 0.1180419921875, 0.43115234375, 0.7442626953125, 1.057373046875, 1.3704833984375, 1.68359375, 1.9967041015625, 2.309814453125, 2.6229248046875, 2.93603515625, 3.2491455078125, 3.562255859375, 3.8753662109375, 4.1884765625, 4.5015869140625, 4.814697265625, 5.1278076171875, 5.44091796875, 5.7540283203125, 6.067138671875, 6.3802490234375, 6.693359375, 7.0064697265625, 7.319580078125, 7.6326904296875, 7.94580078125, 8.2589111328125, 8.572021484375, 8.8851318359375, 9.1982421875, 9.5113525390625, 9.824462890625, 10.1375732421875, 10.45068359375, 10.7637939453125, 11.076904296875, 11.3900146484375, 11.703125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 3.0, 4.0, 9.0, 12.0, 13.0, 27.0, 36.0, 54.0, 60.0, 88.0, 106.0, 111.0, 93.0, 100.0, 86.0, 55.0, 47.0, 30.0, 26.0, 13.0, 12.0, 3.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-106.55751037597656, -103.81463623046875, -101.07176971435547, -98.32889556884766, -95.58602142333984, -92.84314727783203, -90.10028076171875, -87.35740661621094, -84.61453247070312, -81.87165832519531, -79.12879180908203, -76.38591766357422, -73.6430435180664, -70.9001693725586, -68.15730285644531, -65.4144287109375, -62.67155838012695, -59.928688049316406, -57.185813903808594, -54.44294357299805, -51.700069427490234, -48.95719909667969, -46.214324951171875, -43.47145462036133, -40.72858428955078, -37.985713958740234, -35.24283981323242, -32.499969482421875, -29.757095336914062, -27.014225006103516, -24.271352767944336, -21.528480529785156, -18.785606384277344, -16.042734146118164, -13.299861907958984, -10.556990623474121, -7.814118385314941, -5.071246147155762, -2.3283748626708984, 0.41449737548828125, 3.157369613647461, 5.900241851806641, 8.64311408996582, 11.385985374450684, 14.128857612609863, 16.87173080444336, 19.614601135253906, 22.357473373413086, 25.100345611572266, 27.843217849731445, 30.586090087890625, 33.32896041870117, 36.071834564208984, 38.81470489501953, 41.557579040527344, 44.30044937133789, 47.04331970214844, 49.786190032958984, 52.5290641784668, 55.271934509277344, 58.014808654785156, 60.7576789855957, 63.50054931640625, 66.24342346191406, 68.98629760742188]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 1.0, 4.0, 6.0, 9.0, 13.0, 16.0, 17.0, 14.0, 20.0, 16.0, 23.0, 30.0, 36.0, 40.0, 26.0, 35.0, 44.0, 45.0, 29.0, 45.0, 44.0, 43.0, 40.0, 53.0, 37.0, 46.0, 37.0, 30.0, 32.0, 25.0, 30.0, 16.0, 18.0, 14.0, 14.0, 6.0, 9.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0], "bins": [-68.12063598632812, -66.09707641601562, -64.07352447509766, -62.04996871948242, -60.02641296386719, -58.00285720825195, -55.97930145263672, -53.95574188232422, -51.93218994140625, -49.908634185791016, -47.88507843017578, -45.86152267456055, -43.83796691894531, -41.81441116333008, -39.790855407714844, -37.767295837402344, -35.74374008178711, -33.720184326171875, -31.69662857055664, -29.673072814941406, -27.649517059326172, -25.625961303710938, -23.60240364074707, -21.578847885131836, -19.5552921295166, -17.531736373901367, -15.508180618286133, -13.484623908996582, -11.461068153381348, -9.437512397766113, -7.4139556884765625, -5.390399932861328, -3.3668479919433594, -1.343291997909546, 0.6802639961242676, 2.70382022857666, 4.7273759841918945, 6.750931739807129, 8.77448844909668, 10.798044204711914, 12.821599960327148, 14.845155715942383, 16.868711471557617, 18.892269134521484, 20.91582489013672, 22.939380645751953, 24.962936401367188, 26.986492156982422, 29.010047912597656, 31.03360366821289, 33.057159423828125, 35.08071517944336, 37.104270935058594, 39.12782669067383, 41.15138244628906, 43.17494201660156, 45.19849395751953, 47.222049713134766, 49.24560546875, 51.269161224365234, 53.29271697998047, 55.3162727355957, 57.33982849121094, 59.36338806152344, 61.38694381713867]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 9.0, 4.0, 8.0, 11.0, 13.0, 28.0, 29.0, 33.0, 71.0, 85.0, 134.0, 167.0, 318.0, 403.0, 653.0, 1147.0, 2001.0, 3910.0, 8254.0, 20065.0, 63135.0, 375856.0, 3457425.0, 188854.0, 43184.0, 14821.0, 6223.0, 3153.0, 1662.0, 936.0, 546.0, 390.0, 253.0, 159.0, 103.0, 65.0, 45.0, 41.0, 30.0, 16.0, 11.0, 12.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0], "bins": [-13.4921875, -13.1209716796875, -12.749755859375, -12.3785400390625, -12.00732421875, -11.6361083984375, -11.264892578125, -10.8936767578125, -10.5224609375, -10.1512451171875, -9.780029296875, -9.4088134765625, -9.03759765625, -8.6663818359375, -8.295166015625, -7.9239501953125, -7.552734375, -7.1815185546875, -6.810302734375, -6.4390869140625, -6.06787109375, -5.6966552734375, -5.325439453125, -4.9542236328125, -4.5830078125, -4.2117919921875, -3.840576171875, -3.4693603515625, -3.09814453125, -2.7269287109375, -2.355712890625, -1.9844970703125, -1.61328125, -1.2420654296875, -0.870849609375, -0.4996337890625, -0.12841796875, 0.2427978515625, 0.614013671875, 0.9852294921875, 1.3564453125, 1.7276611328125, 2.098876953125, 2.4700927734375, 2.84130859375, 3.2125244140625, 3.583740234375, 3.9549560546875, 4.326171875, 4.6973876953125, 5.068603515625, 5.4398193359375, 5.81103515625, 6.1822509765625, 6.553466796875, 6.9246826171875, 7.2958984375, 7.6671142578125, 8.038330078125, 8.4095458984375, 8.78076171875, 9.1519775390625, 9.523193359375, 9.8944091796875, 10.265625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 5.0, 7.0, 12.0, 16.0, 24.0, 14.0, 29.0, 39.0, 55.0, 55.0, 60.0, 65.0, 65.0, 71.0, 75.0, 50.0, 72.0, 62.0, 51.0, 56.0, 31.0, 21.0, 17.0, 15.0, 11.0, 6.0, 9.0, 4.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.34765625, -4.22900390625, -4.1103515625, -3.99169921875, -3.873046875, -3.75439453125, -3.6357421875, -3.51708984375, -3.3984375, -3.27978515625, -3.1611328125, -3.04248046875, -2.923828125, -2.80517578125, -2.6865234375, -2.56787109375, -2.44921875, -2.33056640625, -2.2119140625, -2.09326171875, -1.974609375, -1.85595703125, -1.7373046875, -1.61865234375, -1.5, -1.38134765625, -1.2626953125, -1.14404296875, -1.025390625, -0.90673828125, -0.7880859375, -0.66943359375, -0.55078125, -0.43212890625, -0.3134765625, -0.19482421875, -0.076171875, 0.04248046875, 0.1611328125, 0.27978515625, 0.3984375, 0.51708984375, 0.6357421875, 0.75439453125, 0.873046875, 0.99169921875, 1.1103515625, 1.22900390625, 1.34765625, 1.46630859375, 1.5849609375, 1.70361328125, 1.822265625, 1.94091796875, 2.0595703125, 2.17822265625, 2.296875, 2.41552734375, 2.5341796875, 2.65283203125, 2.771484375, 2.89013671875, 3.0087890625, 3.12744140625, 3.24609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 9.0, 9.0, 14.0, 18.0, 36.0, 75.0, 102.0, 199.0, 348.0, 599.0, 1143.0, 2076.0, 4284.0, 9580.0, 24231.0, 75963.0, 396053.0, 3163475.0, 397384.0, 76263.0, 24317.0, 9574.0, 4111.0, 2075.0, 1045.0, 549.0, 316.0, 180.0, 103.0, 68.0, 36.0, 26.0, 18.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.714599609375, -8.35888671875, -8.003173828125, -7.6474609375, -7.291748046875, -6.93603515625, -6.580322265625, -6.224609375, -5.868896484375, -5.51318359375, -5.157470703125, -4.8017578125, -4.446044921875, -4.09033203125, -3.734619140625, -3.37890625, -3.023193359375, -2.66748046875, -2.311767578125, -1.9560546875, -1.600341796875, -1.24462890625, -0.888916015625, -0.533203125, -0.177490234375, 0.17822265625, 0.533935546875, 0.8896484375, 1.245361328125, 1.60107421875, 1.956787109375, 2.3125, 2.668212890625, 3.02392578125, 3.379638671875, 3.7353515625, 4.091064453125, 4.44677734375, 4.802490234375, 5.158203125, 5.513916015625, 5.86962890625, 6.225341796875, 6.5810546875, 6.936767578125, 7.29248046875, 7.648193359375, 8.00390625, 8.359619140625, 8.71533203125, 9.071044921875, 9.4267578125, 9.782470703125, 10.13818359375, 10.493896484375, 10.849609375, 11.205322265625, 11.56103515625, 11.916748046875, 12.2724609375, 12.628173828125, 12.98388671875, 13.339599609375, 13.6953125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 3.0, 7.0, 5.0, 7.0, 8.0, 12.0, 14.0, 22.0, 22.0, 38.0, 43.0, 86.0, 112.0, 232.0, 379.0, 1095.0, 949.0, 385.0, 234.0, 129.0, 63.0, 62.0, 43.0, 27.0, 8.0, 16.0, 19.0, 11.0, 6.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.33984375, -4.212005615234375, -4.08416748046875, -3.956329345703125, -3.8284912109375, -3.700653076171875, -3.57281494140625, -3.444976806640625, -3.317138671875, -3.189300537109375, -3.06146240234375, -2.933624267578125, -2.8057861328125, -2.677947998046875, -2.55010986328125, -2.422271728515625, -2.29443359375, -2.166595458984375, -2.03875732421875, -1.910919189453125, -1.7830810546875, -1.655242919921875, -1.52740478515625, -1.399566650390625, -1.271728515625, -1.143890380859375, -1.01605224609375, -0.888214111328125, -0.7603759765625, -0.632537841796875, -0.50469970703125, -0.376861572265625, -0.2490234375, -0.121185302734375, 0.00665283203125, 0.134490966796875, 0.2623291015625, 0.390167236328125, 0.51800537109375, 0.645843505859375, 0.773681640625, 0.901519775390625, 1.02935791015625, 1.157196044921875, 1.2850341796875, 1.412872314453125, 1.54071044921875, 1.668548583984375, 1.79638671875, 1.924224853515625, 2.05206298828125, 2.179901123046875, 2.3077392578125, 2.435577392578125, 2.56341552734375, 2.691253662109375, 2.819091796875, 2.946929931640625, 3.07476806640625, 3.202606201171875, 3.3304443359375, 3.458282470703125, 3.58612060546875, 3.713958740234375, 3.841796875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 10.0, 15.0, 30.0, 39.0, 51.0, 68.0, 80.0, 123.0, 86.0, 109.0, 95.0, 77.0, 71.0, 51.0, 34.0, 17.0, 11.0, 10.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.805009841918945, -28.969240188598633, -28.13347053527832, -27.297700881958008, -26.461933135986328, -25.626163482666016, -24.790393829345703, -23.95462417602539, -23.118854522705078, -22.283084869384766, -21.447315216064453, -20.61154556274414, -19.775775909423828, -18.940006256103516, -18.104238510131836, -17.268468856811523, -16.43269920349121, -15.596929550170898, -14.761159896850586, -13.92539119720459, -13.089621543884277, -12.253851890563965, -11.418083190917969, -10.582313537597656, -9.746543884277344, -8.910774230957031, -8.075004577636719, -7.239235877990723, -6.40346622467041, -5.567696571350098, -4.731927394866943, -3.896158218383789, -3.0603866577148438, -2.2246172428131104, -1.388847827911377, -0.5530784130096436, 0.28269100189208984, 1.1184606552124023, 1.9542298316955566, 2.789999008178711, 3.6257686614990234, 4.461538314819336, 5.29730749130249, 6.1330766677856445, 6.968846321105957, 7.8046159744262695, 8.640384674072266, 9.476154327392578, 10.31192398071289, 11.147693634033203, 11.983463287353516, 12.819231986999512, 13.655001640319824, 14.490771293640137, 15.326539993286133, 16.162309646606445, 16.998079299926758, 17.83384895324707, 18.669618606567383, 19.505388259887695, 20.341156005859375, 21.176925659179688, 22.0126953125, 22.848464965820312, 23.684234619140625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 11.0, 8.0, 10.0, 18.0, 18.0, 20.0, 21.0, 25.0, 34.0, 31.0, 32.0, 37.0, 42.0, 48.0, 61.0, 57.0, 58.0, 62.0, 37.0, 47.0, 45.0, 32.0, 39.0, 40.0, 26.0, 25.0, 18.0, 19.0, 13.0, 12.0, 8.0, 10.0, 10.0, 11.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.24041748046875, -13.703510284423828, -13.166603088378906, -12.629695892333984, -12.092788696289062, -11.55588150024414, -11.018974304199219, -10.482067108154297, -9.945159912109375, -9.408252716064453, -8.871345520019531, -8.33443832397461, -7.7975311279296875, -7.260623931884766, -6.723716735839844, -6.186809539794922, -5.64990234375, -5.112995147705078, -4.576087951660156, -4.039180755615234, -3.5022735595703125, -2.9653663635253906, -2.4284591674804688, -1.8915519714355469, -1.354644775390625, -0.8177375793457031, -0.28083038330078125, 0.2560768127441406, 0.7929840087890625, 1.3298912048339844, 1.8667984008789062, 2.403705596923828, 2.940614700317383, 3.4775218963623047, 4.014429092407227, 4.551336288452148, 5.08824348449707, 5.625150680541992, 6.162057876586914, 6.698965072631836, 7.235872268676758, 7.77277946472168, 8.309686660766602, 8.846593856811523, 9.383501052856445, 9.920408248901367, 10.457315444946289, 10.994222640991211, 11.531129837036133, 12.068037033081055, 12.604944229125977, 13.141851425170898, 13.67875862121582, 14.215665817260742, 14.752573013305664, 15.289480209350586, 15.826387405395508, 16.36329460144043, 16.90020179748535, 17.437108993530273, 17.974016189575195, 18.510923385620117, 19.04783058166504, 19.58473777770996, 20.121644973754883]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 6.0, 7.0, 14.0, 17.0, 22.0, 31.0, 68.0, 72.0, 140.0, 227.0, 360.0, 611.0, 1123.0, 1996.0, 3845.0, 8014.0, 16938.0, 38607.0, 89340.0, 207744.0, 342103.0, 189963.0, 81663.0, 34647.0, 15520.0, 7406.0, 3672.0, 1907.0, 1036.0, 535.0, 324.0, 213.0, 119.0, 95.0, 43.0, 39.0, 28.0, 17.0, 14.0, 9.0, 12.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.6484375, -11.2239990234375, -10.799560546875, -10.3751220703125, -9.95068359375, -9.5262451171875, -9.101806640625, -8.6773681640625, -8.2529296875, -7.8284912109375, -7.404052734375, -6.9796142578125, -6.55517578125, -6.1307373046875, -5.706298828125, -5.2818603515625, -4.857421875, -4.4329833984375, -4.008544921875, -3.5841064453125, -3.15966796875, -2.7352294921875, -2.310791015625, -1.8863525390625, -1.4619140625, -1.0374755859375, -0.613037109375, -0.1885986328125, 0.23583984375, 0.6602783203125, 1.084716796875, 1.5091552734375, 1.93359375, 2.3580322265625, 2.782470703125, 3.2069091796875, 3.63134765625, 4.0557861328125, 4.480224609375, 4.9046630859375, 5.3291015625, 5.7535400390625, 6.177978515625, 6.6024169921875, 7.02685546875, 7.4512939453125, 7.875732421875, 8.3001708984375, 8.724609375, 9.1490478515625, 9.573486328125, 9.9979248046875, 10.42236328125, 10.8468017578125, 11.271240234375, 11.6956787109375, 12.1201171875, 12.5445556640625, 12.968994140625, 13.3934326171875, 13.81787109375, 14.2423095703125, 14.666748046875, 15.0911865234375, 15.515625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 6.0, 6.0, 10.0, 14.0, 16.0, 23.0, 22.0, 30.0, 46.0, 47.0, 66.0, 44.0, 57.0, 71.0, 61.0, 54.0, 64.0, 65.0, 45.0, 43.0, 40.0, 40.0, 43.0, 21.0, 21.0, 9.0, 7.0, 8.0, 6.0, 4.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.880859375, -3.774993896484375, -3.66912841796875, -3.563262939453125, -3.4573974609375, -3.351531982421875, -3.24566650390625, -3.139801025390625, -3.033935546875, -2.928070068359375, -2.82220458984375, -2.716339111328125, -2.6104736328125, -2.504608154296875, -2.39874267578125, -2.292877197265625, -2.18701171875, -2.081146240234375, -1.97528076171875, -1.869415283203125, -1.7635498046875, -1.657684326171875, -1.55181884765625, -1.445953369140625, -1.340087890625, -1.234222412109375, -1.12835693359375, -1.022491455078125, -0.9166259765625, -0.810760498046875, -0.70489501953125, -0.599029541015625, -0.4931640625, -0.387298583984375, -0.28143310546875, -0.175567626953125, -0.0697021484375, 0.036163330078125, 0.14202880859375, 0.247894287109375, 0.353759765625, 0.459625244140625, 0.56549072265625, 0.671356201171875, 0.7772216796875, 0.883087158203125, 0.98895263671875, 1.094818115234375, 1.20068359375, 1.306549072265625, 1.41241455078125, 1.518280029296875, 1.6241455078125, 1.730010986328125, 1.83587646484375, 1.941741943359375, 2.047607421875, 2.153472900390625, 2.25933837890625, 2.365203857421875, 2.4710693359375, 2.576934814453125, 2.68280029296875, 2.788665771484375, 2.89453125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 12.0, 17.0, 16.0, 36.0, 28.0, 61.0, 73.0, 98.0, 140.0, 217.0, 321.0, 454.0, 747.0, 1342.0, 2774.0, 6107.0, 15375.0, 42155.0, 117616.0, 306314.0, 339077.0, 135212.0, 48844.0, 17542.0, 6911.0, 3090.0, 1544.0, 803.0, 472.0, 361.0, 220.0, 173.0, 107.0, 76.0, 51.0, 36.0, 32.0, 15.0, 24.0, 11.0, 13.0, 8.0, 4.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-12.546875, -12.16748046875, -11.7880859375, -11.40869140625, -11.029296875, -10.64990234375, -10.2705078125, -9.89111328125, -9.51171875, -9.13232421875, -8.7529296875, -8.37353515625, -7.994140625, -7.61474609375, -7.2353515625, -6.85595703125, -6.4765625, -6.09716796875, -5.7177734375, -5.33837890625, -4.958984375, -4.57958984375, -4.2001953125, -3.82080078125, -3.44140625, -3.06201171875, -2.6826171875, -2.30322265625, -1.923828125, -1.54443359375, -1.1650390625, -0.78564453125, -0.40625, -0.02685546875, 0.3525390625, 0.73193359375, 1.111328125, 1.49072265625, 1.8701171875, 2.24951171875, 2.62890625, 3.00830078125, 3.3876953125, 3.76708984375, 4.146484375, 4.52587890625, 4.9052734375, 5.28466796875, 5.6640625, 6.04345703125, 6.4228515625, 6.80224609375, 7.181640625, 7.56103515625, 7.9404296875, 8.31982421875, 8.69921875, 9.07861328125, 9.4580078125, 9.83740234375, 10.216796875, 10.59619140625, 10.9755859375, 11.35498046875, 11.734375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 5.0, 8.0, 13.0, 16.0, 14.0, 21.0, 37.0, 31.0, 40.0, 37.0, 50.0, 56.0, 50.0, 56.0, 53.0, 51.0, 55.0, 46.0, 50.0, 48.0, 34.0, 43.0, 30.0, 29.0, 22.0, 21.0, 18.0, 9.0, 15.0, 9.0, 4.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1484375, -11.726318359375, -11.30419921875, -10.882080078125, -10.4599609375, -10.037841796875, -9.61572265625, -9.193603515625, -8.771484375, -8.349365234375, -7.92724609375, -7.505126953125, -7.0830078125, -6.660888671875, -6.23876953125, -5.816650390625, -5.39453125, -4.972412109375, -4.55029296875, -4.128173828125, -3.7060546875, -3.283935546875, -2.86181640625, -2.439697265625, -2.017578125, -1.595458984375, -1.17333984375, -0.751220703125, -0.3291015625, 0.093017578125, 0.51513671875, 0.937255859375, 1.359375, 1.781494140625, 2.20361328125, 2.625732421875, 3.0478515625, 3.469970703125, 3.89208984375, 4.314208984375, 4.736328125, 5.158447265625, 5.58056640625, 6.002685546875, 6.4248046875, 6.846923828125, 7.26904296875, 7.691162109375, 8.11328125, 8.535400390625, 8.95751953125, 9.379638671875, 9.8017578125, 10.223876953125, 10.64599609375, 11.068115234375, 11.490234375, 11.912353515625, 12.33447265625, 12.756591796875, 13.1787109375, 13.600830078125, 14.02294921875, 14.445068359375, 14.8671875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 6.0, 12.0, 12.0, 23.0, 19.0, 36.0, 75.0, 93.0, 154.0, 269.0, 494.0, 850.0, 1561.0, 3162.0, 6846.0, 16054.0, 46628.0, 172638.0, 485599.0, 222194.0, 57251.0, 19166.0, 7815.0, 3651.0, 1718.0, 930.0, 489.0, 299.0, 178.0, 110.0, 75.0, 43.0, 27.0, 21.0, 12.0, 14.0, 9.0, 11.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.91015625, -7.66741943359375, -7.4246826171875, -7.18194580078125, -6.939208984375, -6.69647216796875, -6.4537353515625, -6.21099853515625, -5.96826171875, -5.72552490234375, -5.4827880859375, -5.24005126953125, -4.997314453125, -4.75457763671875, -4.5118408203125, -4.26910400390625, -4.0263671875, -3.78363037109375, -3.5408935546875, -3.29815673828125, -3.055419921875, -2.81268310546875, -2.5699462890625, -2.32720947265625, -2.08447265625, -1.84173583984375, -1.5989990234375, -1.35626220703125, -1.113525390625, -0.87078857421875, -0.6280517578125, -0.38531494140625, -0.142578125, 0.10015869140625, 0.3428955078125, 0.58563232421875, 0.828369140625, 1.07110595703125, 1.3138427734375, 1.55657958984375, 1.79931640625, 2.04205322265625, 2.2847900390625, 2.52752685546875, 2.770263671875, 3.01300048828125, 3.2557373046875, 3.49847412109375, 3.7412109375, 3.98394775390625, 4.2266845703125, 4.46942138671875, 4.712158203125, 4.95489501953125, 5.1976318359375, 5.44036865234375, 5.68310546875, 5.92584228515625, 6.1685791015625, 6.41131591796875, 6.654052734375, 6.89678955078125, 7.1395263671875, 7.38226318359375, 7.625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 10.0, 10.0, 11.0, 9.0, 12.0, 14.0, 20.0, 31.0, 42.0, 41.0, 50.0, 70.0, 142.0, 144.0, 110.0, 58.0, 58.0, 38.0, 33.0, 18.0, 15.0, 12.0, 9.0, 10.0, 14.0, 6.0, 1.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00148773193359375, -0.0014365911483764648, -0.0013854503631591797, -0.0013343095779418945, -0.0012831687927246094, -0.0012320280075073242, -0.001180887222290039, -0.001129746437072754, -0.0010786056518554688, -0.0010274648666381836, -0.0009763240814208984, -0.0009251832962036133, -0.0008740425109863281, -0.000822901725769043, -0.0007717609405517578, -0.0007206201553344727, -0.0006694793701171875, -0.0006183385848999023, -0.0005671977996826172, -0.000516057014465332, -0.0004649162292480469, -0.0004137754440307617, -0.00036263465881347656, -0.0003114938735961914, -0.00026035308837890625, -0.0002092123031616211, -0.00015807151794433594, -0.00010693073272705078, -5.5789947509765625e-05, -4.649162292480469e-06, 4.649162292480469e-05, 9.763240814208984e-05, 0.000148773193359375, 0.00019991397857666016, 0.0002510547637939453, 0.00030219554901123047, 0.0003533363342285156, 0.0004044771194458008, 0.00045561790466308594, 0.0005067586898803711, 0.0005578994750976562, 0.0006090402603149414, 0.0006601810455322266, 0.0007113218307495117, 0.0007624626159667969, 0.000813603401184082, 0.0008647441864013672, 0.0009158849716186523, 0.0009670257568359375, 0.0010181665420532227, 0.0010693073272705078, 0.001120448112487793, 0.0011715888977050781, 0.0012227296829223633, 0.0012738704681396484, 0.0013250112533569336, 0.0013761520385742188, 0.001427292823791504, 0.001478433609008789, 0.0015295743942260742, 0.0015807151794433594, 0.0016318559646606445, 0.0016829967498779297, 0.0017341375350952148, 0.0017852783203125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 9.0, 11.0, 17.0, 17.0, 31.0, 51.0, 78.0, 114.0, 208.0, 380.0, 803.0, 2010.0, 5398.0, 17116.0, 72650.0, 588651.0, 301219.0, 41896.0, 11265.0, 3707.0, 1484.0, 670.0, 293.0, 158.0, 112.0, 65.0, 46.0, 32.0, 24.0, 14.0, 12.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.3671875, -11.966064453125, -11.56494140625, -11.163818359375, -10.7626953125, -10.361572265625, -9.96044921875, -9.559326171875, -9.158203125, -8.757080078125, -8.35595703125, -7.954833984375, -7.5537109375, -7.152587890625, -6.75146484375, -6.350341796875, -5.94921875, -5.548095703125, -5.14697265625, -4.745849609375, -4.3447265625, -3.943603515625, -3.54248046875, -3.141357421875, -2.740234375, -2.339111328125, -1.93798828125, -1.536865234375, -1.1357421875, -0.734619140625, -0.33349609375, 0.067626953125, 0.46875, 0.869873046875, 1.27099609375, 1.672119140625, 2.0732421875, 2.474365234375, 2.87548828125, 3.276611328125, 3.677734375, 4.078857421875, 4.47998046875, 4.881103515625, 5.2822265625, 5.683349609375, 6.08447265625, 6.485595703125, 6.88671875, 7.287841796875, 7.68896484375, 8.090087890625, 8.4912109375, 8.892333984375, 9.29345703125, 9.694580078125, 10.095703125, 10.496826171875, 10.89794921875, 11.299072265625, 11.7001953125, 12.101318359375, 12.50244140625, 12.903564453125, 13.3046875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 4.0, 3.0, 7.0, 13.0, 5.0, 10.0, 20.0, 17.0, 19.0, 29.0, 62.0, 66.0, 92.0, 133.0, 120.0, 119.0, 83.0, 48.0, 40.0, 24.0, 12.0, 20.0, 11.0, 8.0, 8.0, 7.0, 3.0, 1.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.51171875, -7.25445556640625, -6.9971923828125, -6.73992919921875, -6.482666015625, -6.22540283203125, -5.9681396484375, -5.71087646484375, -5.45361328125, -5.19635009765625, -4.9390869140625, -4.68182373046875, -4.424560546875, -4.16729736328125, -3.9100341796875, -3.65277099609375, -3.3955078125, -3.13824462890625, -2.8809814453125, -2.62371826171875, -2.366455078125, -2.10919189453125, -1.8519287109375, -1.59466552734375, -1.33740234375, -1.08013916015625, -0.8228759765625, -0.56561279296875, -0.308349609375, -0.05108642578125, 0.2061767578125, 0.46343994140625, 0.720703125, 0.97796630859375, 1.2352294921875, 1.49249267578125, 1.749755859375, 2.00701904296875, 2.2642822265625, 2.52154541015625, 2.77880859375, 3.03607177734375, 3.2933349609375, 3.55059814453125, 3.807861328125, 4.06512451171875, 4.3223876953125, 4.57965087890625, 4.8369140625, 5.09417724609375, 5.3514404296875, 5.60870361328125, 5.865966796875, 6.12322998046875, 6.3804931640625, 6.63775634765625, 6.89501953125, 7.15228271484375, 7.4095458984375, 7.66680908203125, 7.924072265625, 8.18133544921875, 8.4385986328125, 8.69586181640625, 8.953125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 1.0, 5.0, 9.0, 28.0, 31.0, 60.0, 63.0, 131.0, 143.0, 133.0, 108.0, 98.0, 75.0, 36.0, 32.0, 24.0, 9.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.35137939453125, -72.9698715209961, -69.58836364746094, -66.20685577392578, -62.82535171508789, -59.443843841552734, -56.06233596801758, -52.68083190917969, -49.29932403564453, -45.917816162109375, -42.53630828857422, -39.15480041503906, -35.77329635620117, -32.391788482666016, -29.01028060913086, -25.628774642944336, -22.247264862060547, -18.86575698852539, -15.484251022338867, -12.102743148803711, -8.721236228942871, -5.339729309082031, -1.958221435546875, 1.4232845306396484, 4.804792404174805, 8.186299324035645, 11.567806243896484, 14.94931411743164, 18.330821990966797, 21.71232795715332, 25.093835830688477, 28.475341796875, 31.856849670410156, 35.23835754394531, 38.61986541748047, 42.001373291015625, 45.382877349853516, 48.76438522338867, 52.14589309692383, 55.52739715576172, 58.908905029296875, 62.29041290283203, 65.67192077636719, 69.05342864990234, 72.4349365234375, 75.81643676757812, 79.19795227050781, 82.57945251464844, 85.96096801757812, 89.34247589111328, 92.72398376464844, 96.1054916381836, 99.48699951171875, 102.86849975585938, 106.25001525878906, 109.63151550292969, 113.01302337646484, 116.39453125, 119.77603912353516, 123.15754699707031, 126.53905487060547, 129.92056274414062, 133.30206298828125, 136.68357849121094, 140.06507873535156]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 7.0, 4.0, 5.0, 10.0, 4.0, 9.0, 16.0, 8.0, 16.0, 19.0, 24.0, 16.0, 24.0, 29.0, 25.0, 22.0, 32.0, 30.0, 39.0, 40.0, 32.0, 35.0, 42.0, 40.0, 49.0, 50.0, 38.0, 38.0, 43.0, 28.0, 33.0, 37.0, 22.0, 20.0, 16.0, 10.0, 24.0, 19.0, 8.0, 6.0, 7.0, 7.0, 4.0, 6.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-57.708396911621094, -55.993080139160156, -54.27776336669922, -52.56244659423828, -50.847129821777344, -49.131813049316406, -47.41649627685547, -45.70117950439453, -43.985862731933594, -42.270545959472656, -40.55522918701172, -38.83991241455078, -37.124595642089844, -35.409278869628906, -33.69396209716797, -31.97864532470703, -30.263328552246094, -28.548011779785156, -26.83269500732422, -25.11737823486328, -23.402061462402344, -21.686744689941406, -19.97142791748047, -18.25611114501953, -16.540794372558594, -14.825477600097656, -13.110160827636719, -11.394844055175781, -9.679527282714844, -7.964210510253906, -6.248893737792969, -4.533576965332031, -2.818256378173828, -1.1029396057128906, 0.6123771667480469, 2.3276939392089844, 4.043010711669922, 5.758327484130859, 7.473644256591797, 9.188961029052734, 10.904277801513672, 12.61959457397461, 14.334911346435547, 16.050228118896484, 17.765544891357422, 19.48086166381836, 21.196178436279297, 22.911495208740234, 24.626811981201172, 26.34212875366211, 28.057445526123047, 29.772762298583984, 31.488079071044922, 33.20339584350586, 34.9187126159668, 36.634029388427734, 38.34934616088867, 40.06466293334961, 41.77997970581055, 43.495296478271484, 45.21061325073242, 46.92593002319336, 48.6412467956543, 50.356563568115234, 52.07188034057617]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 12.0, 11.0, 22.0, 25.0, 48.0, 64.0, 90.0, 122.0, 199.0, 314.0, 554.0, 1057.0, 2046.0, 4324.0, 10906.0, 34561.0, 189647.0, 3515955.0, 359953.0, 49769.0, 14057.0, 5388.0, 2399.0, 1185.0, 635.0, 347.0, 194.0, 125.0, 76.0, 47.0, 39.0, 32.0, 23.0, 10.0, 8.0, 8.0, 6.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.609375, -17.085693359375, -16.56201171875, -16.038330078125, -15.5146484375, -14.990966796875, -14.46728515625, -13.943603515625, -13.419921875, -12.896240234375, -12.37255859375, -11.848876953125, -11.3251953125, -10.801513671875, -10.27783203125, -9.754150390625, -9.23046875, -8.706787109375, -8.18310546875, -7.659423828125, -7.1357421875, -6.612060546875, -6.08837890625, -5.564697265625, -5.041015625, -4.517333984375, -3.99365234375, -3.469970703125, -2.9462890625, -2.422607421875, -1.89892578125, -1.375244140625, -0.8515625, -0.327880859375, 0.19580078125, 0.719482421875, 1.2431640625, 1.766845703125, 2.29052734375, 2.814208984375, 3.337890625, 3.861572265625, 4.38525390625, 4.908935546875, 5.4326171875, 5.956298828125, 6.47998046875, 7.003662109375, 7.52734375, 8.051025390625, 8.57470703125, 9.098388671875, 9.6220703125, 10.145751953125, 10.66943359375, 11.193115234375, 11.716796875, 12.240478515625, 12.76416015625, 13.287841796875, 13.8115234375, 14.335205078125, 14.85888671875, 15.382568359375, 15.90625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 9.0, 6.0, 14.0, 9.0, 11.0, 27.0, 21.0, 35.0, 27.0, 37.0, 61.0, 38.0, 51.0, 65.0, 61.0, 77.0, 58.0, 60.0, 58.0, 55.0, 35.0, 42.0, 33.0, 29.0, 18.0, 15.0, 14.0, 10.0, 3.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.931640625, -3.82568359375, -3.7197265625, -3.61376953125, -3.5078125, -3.40185546875, -3.2958984375, -3.18994140625, -3.083984375, -2.97802734375, -2.8720703125, -2.76611328125, -2.66015625, -2.55419921875, -2.4482421875, -2.34228515625, -2.236328125, -2.13037109375, -2.0244140625, -1.91845703125, -1.8125, -1.70654296875, -1.6005859375, -1.49462890625, -1.388671875, -1.28271484375, -1.1767578125, -1.07080078125, -0.96484375, -0.85888671875, -0.7529296875, -0.64697265625, -0.541015625, -0.43505859375, -0.3291015625, -0.22314453125, -0.1171875, -0.01123046875, 0.0947265625, 0.20068359375, 0.306640625, 0.41259765625, 0.5185546875, 0.62451171875, 0.73046875, 0.83642578125, 0.9423828125, 1.04833984375, 1.154296875, 1.26025390625, 1.3662109375, 1.47216796875, 1.578125, 1.68408203125, 1.7900390625, 1.89599609375, 2.001953125, 2.10791015625, 2.2138671875, 2.31982421875, 2.42578125, 2.53173828125, 2.6376953125, 2.74365234375, 2.849609375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 3.0, 11.0, 13.0, 20.0, 27.0, 56.0, 100.0, 133.0, 216.0, 420.0, 734.0, 1327.0, 2507.0, 4854.0, 10061.0, 22645.0, 62673.0, 236404.0, 2126202.0, 1437807.0, 194602.0, 54002.0, 20470.0, 9021.0, 4518.0, 2430.0, 1310.0, 709.0, 393.0, 245.0, 150.0, 80.0, 61.0, 29.0, 19.0, 17.0, 9.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1484375, -8.832275390625, -8.51611328125, -8.199951171875, -7.8837890625, -7.567626953125, -7.25146484375, -6.935302734375, -6.619140625, -6.302978515625, -5.98681640625, -5.670654296875, -5.3544921875, -5.038330078125, -4.72216796875, -4.406005859375, -4.08984375, -3.773681640625, -3.45751953125, -3.141357421875, -2.8251953125, -2.509033203125, -2.19287109375, -1.876708984375, -1.560546875, -1.244384765625, -0.92822265625, -0.612060546875, -0.2958984375, 0.020263671875, 0.33642578125, 0.652587890625, 0.96875, 1.284912109375, 1.60107421875, 1.917236328125, 2.2333984375, 2.549560546875, 2.86572265625, 3.181884765625, 3.498046875, 3.814208984375, 4.13037109375, 4.446533203125, 4.7626953125, 5.078857421875, 5.39501953125, 5.711181640625, 6.02734375, 6.343505859375, 6.65966796875, 6.975830078125, 7.2919921875, 7.608154296875, 7.92431640625, 8.240478515625, 8.556640625, 8.872802734375, 9.18896484375, 9.505126953125, 9.8212890625, 10.137451171875, 10.45361328125, 10.769775390625, 11.0859375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 10.0, 12.0, 8.0, 10.0, 16.0, 28.0, 22.0, 45.0, 55.0, 86.0, 109.0, 172.0, 325.0, 538.0, 950.0, 654.0, 320.0, 207.0, 135.0, 104.0, 72.0, 30.0, 30.0, 21.0, 15.0, 18.0, 12.0, 8.0, 4.0, 7.0, 7.0, 4.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.921875, -3.77996826171875, -3.6380615234375, -3.49615478515625, -3.354248046875, -3.21234130859375, -3.0704345703125, -2.92852783203125, -2.78662109375, -2.64471435546875, -2.5028076171875, -2.36090087890625, -2.218994140625, -2.07708740234375, -1.9351806640625, -1.79327392578125, -1.6513671875, -1.50946044921875, -1.3675537109375, -1.22564697265625, -1.083740234375, -0.94183349609375, -0.7999267578125, -0.65802001953125, -0.51611328125, -0.37420654296875, -0.2322998046875, -0.09039306640625, 0.051513671875, 0.19342041015625, 0.3353271484375, 0.47723388671875, 0.619140625, 0.76104736328125, 0.9029541015625, 1.04486083984375, 1.186767578125, 1.32867431640625, 1.4705810546875, 1.61248779296875, 1.75439453125, 1.89630126953125, 2.0382080078125, 2.18011474609375, 2.322021484375, 2.46392822265625, 2.6058349609375, 2.74774169921875, 2.8896484375, 3.03155517578125, 3.1734619140625, 3.31536865234375, 3.457275390625, 3.59918212890625, 3.7410888671875, 3.88299560546875, 4.02490234375, 4.16680908203125, 4.3087158203125, 4.45062255859375, 4.592529296875, 4.73443603515625, 4.8763427734375, 5.01824951171875, 5.16015625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 7.0, 5.0, 15.0, 36.0, 36.0, 78.0, 96.0, 121.0, 127.0, 143.0, 110.0, 89.0, 52.0, 29.0, 22.0, 19.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-62.25694274902344, -60.917850494384766, -59.578758239746094, -58.23966979980469, -56.900577545166016, -55.561485290527344, -54.22239303588867, -52.88330078125, -51.544212341308594, -50.20512008666992, -48.86602783203125, -47.526939392089844, -46.18784713745117, -44.8487548828125, -43.50966262817383, -42.170570373535156, -40.831478118896484, -39.49238586425781, -38.15329360961914, -36.81420135498047, -35.47511291503906, -34.13602066040039, -32.79692840576172, -31.457836151123047, -30.118745803833008, -28.779653549194336, -27.440563201904297, -26.101470947265625, -24.762378692626953, -23.423288345336914, -22.084196090698242, -20.745105743408203, -19.4060115814209, -18.066919326782227, -16.727828979492188, -15.388736724853516, -14.04964542388916, -12.710554122924805, -11.371461868286133, -10.032370567321777, -8.693279266357422, -7.354187965393066, -6.015096187591553, -4.676004409790039, -3.3369131088256836, -1.9978218078613281, -0.6587295532226562, 0.6803617477416992, 2.0194530487060547, 3.3585445880889893, 4.697636127471924, 6.0367279052734375, 7.375819206237793, 8.714910507202148, 10.05400276184082, 11.393094062805176, 12.732185363769531, 14.071276664733887, 15.410367965698242, 16.749460220336914, 18.088550567626953, 19.427642822265625, 20.766735076904297, 22.10582733154297, 23.444917678833008]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 1.0, 4.0, 5.0, 9.0, 11.0, 8.0, 6.0, 18.0, 8.0, 20.0, 17.0, 18.0, 26.0, 44.0, 28.0, 26.0, 33.0, 39.0, 47.0, 49.0, 44.0, 45.0, 42.0, 40.0, 40.0, 40.0, 40.0, 31.0, 27.0, 32.0, 19.0, 23.0, 31.0, 25.0, 11.0, 17.0, 15.0, 12.0, 11.0, 11.0, 5.0, 3.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.653610229492188, -17.060409545898438, -16.467206954956055, -15.874006271362305, -15.280805587768555, -14.687603950500488, -14.094402313232422, -13.501201629638672, -12.908000946044922, -12.314799308776855, -11.721598625183105, -11.128396987915039, -10.535196304321289, -9.941994667053223, -9.348793029785156, -8.755592346191406, -8.16239070892334, -7.569189548492432, -6.975988388061523, -6.382786750793457, -5.789586067199707, -5.196384429931641, -4.603183269500732, -4.009982109069824, -3.416780948638916, -2.823579788208008, -2.2303786277770996, -1.6371772289276123, -1.043976068496704, -0.4507749080657959, 0.1424264907836914, 0.7356276512145996, 1.3288288116455078, 1.922029972076416, 2.515231132507324, 3.1084325313568115, 3.7016336917877197, 4.294835090637207, 4.888036251068115, 5.481237411499023, 6.074438571929932, 6.66763973236084, 7.260840892791748, 7.854042053222656, 8.447243690490723, 9.040444374084473, 9.633646011352539, 10.226846694946289, 10.820048332214355, 11.413249969482422, 12.006450653076172, 12.599652290344238, 13.192852973937988, 13.786054611206055, 14.379255294799805, 14.972456932067871, 15.565658569335938, 16.158859252929688, 16.75206184387207, 17.34526252746582, 17.93846321105957, 18.53166389465332, 19.124866485595703, 19.718067169189453, 20.311267852783203]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 7.0, 7.0, 10.0, 8.0, 19.0, 27.0, 40.0, 59.0, 102.0, 165.0, 293.0, 516.0, 878.0, 1787.0, 3583.0, 7536.0, 16413.0, 39691.0, 107358.0, 400660.0, 318841.0, 89251.0, 33878.0, 14357.0, 6419.0, 3089.0, 1580.0, 818.0, 476.0, 266.0, 151.0, 105.0, 65.0, 28.0, 23.0, 15.0, 12.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5078125, -15.03662109375, -14.5654296875, -14.09423828125, -13.623046875, -13.15185546875, -12.6806640625, -12.20947265625, -11.73828125, -11.26708984375, -10.7958984375, -10.32470703125, -9.853515625, -9.38232421875, -8.9111328125, -8.43994140625, -7.96875, -7.49755859375, -7.0263671875, -6.55517578125, -6.083984375, -5.61279296875, -5.1416015625, -4.67041015625, -4.19921875, -3.72802734375, -3.2568359375, -2.78564453125, -2.314453125, -1.84326171875, -1.3720703125, -0.90087890625, -0.4296875, 0.04150390625, 0.5126953125, 0.98388671875, 1.455078125, 1.92626953125, 2.3974609375, 2.86865234375, 3.33984375, 3.81103515625, 4.2822265625, 4.75341796875, 5.224609375, 5.69580078125, 6.1669921875, 6.63818359375, 7.109375, 7.58056640625, 8.0517578125, 8.52294921875, 8.994140625, 9.46533203125, 9.9365234375, 10.40771484375, 10.87890625, 11.35009765625, 11.8212890625, 12.29248046875, 12.763671875, 13.23486328125, 13.7060546875, 14.17724609375, 14.6484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 5.0, 14.0, 10.0, 14.0, 29.0, 25.0, 42.0, 52.0, 49.0, 60.0, 54.0, 72.0, 78.0, 52.0, 66.0, 69.0, 66.0, 51.0, 50.0, 44.0, 22.0, 15.0, 16.0, 15.0, 7.0, 5.0, 6.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.31640625, -4.19610595703125, -4.0758056640625, -3.95550537109375, -3.835205078125, -3.71490478515625, -3.5946044921875, -3.47430419921875, -3.35400390625, -3.23370361328125, -3.1134033203125, -2.99310302734375, -2.872802734375, -2.75250244140625, -2.6322021484375, -2.51190185546875, -2.3916015625, -2.27130126953125, -2.1510009765625, -2.03070068359375, -1.910400390625, -1.79010009765625, -1.6697998046875, -1.54949951171875, -1.42919921875, -1.30889892578125, -1.1885986328125, -1.06829833984375, -0.947998046875, -0.82769775390625, -0.7073974609375, -0.58709716796875, -0.466796875, -0.34649658203125, -0.2261962890625, -0.10589599609375, 0.014404296875, 0.13470458984375, 0.2550048828125, 0.37530517578125, 0.49560546875, 0.61590576171875, 0.7362060546875, 0.85650634765625, 0.976806640625, 1.09710693359375, 1.2174072265625, 1.33770751953125, 1.4580078125, 1.57830810546875, 1.6986083984375, 1.81890869140625, 1.939208984375, 2.05950927734375, 2.1798095703125, 2.30010986328125, 2.42041015625, 2.54071044921875, 2.6610107421875, 2.78131103515625, 2.901611328125, 3.02191162109375, 3.1422119140625, 3.26251220703125, 3.3828125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 7.0, 5.0, 5.0, 6.0, 13.0, 9.0, 19.0, 27.0, 40.0, 44.0, 63.0, 96.0, 125.0, 219.0, 320.0, 559.0, 1170.0, 2829.0, 7897.0, 27722.0, 123244.0, 613721.0, 209754.0, 42264.0, 11253.0, 3752.0, 1470.0, 728.0, 407.0, 253.0, 181.0, 100.0, 64.0, 62.0, 34.0, 25.0, 23.0, 18.0, 12.0, 5.0, 7.0, 1.0, 2.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.609375, -19.026611328125, -18.44384765625, -17.861083984375, -17.2783203125, -16.695556640625, -16.11279296875, -15.530029296875, -14.947265625, -14.364501953125, -13.78173828125, -13.198974609375, -12.6162109375, -12.033447265625, -11.45068359375, -10.867919921875, -10.28515625, -9.702392578125, -9.11962890625, -8.536865234375, -7.9541015625, -7.371337890625, -6.78857421875, -6.205810546875, -5.623046875, -5.040283203125, -4.45751953125, -3.874755859375, -3.2919921875, -2.709228515625, -2.12646484375, -1.543701171875, -0.9609375, -0.378173828125, 0.20458984375, 0.787353515625, 1.3701171875, 1.952880859375, 2.53564453125, 3.118408203125, 3.701171875, 4.283935546875, 4.86669921875, 5.449462890625, 6.0322265625, 6.614990234375, 7.19775390625, 7.780517578125, 8.36328125, 8.946044921875, 9.52880859375, 10.111572265625, 10.6943359375, 11.277099609375, 11.85986328125, 12.442626953125, 13.025390625, 13.608154296875, 14.19091796875, 14.773681640625, 15.3564453125, 15.939208984375, 16.52197265625, 17.104736328125, 17.6875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 8.0, 5.0, 2.0, 5.0, 7.0, 11.0, 11.0, 23.0, 24.0, 31.0, 34.0, 34.0, 42.0, 47.0, 49.0, 51.0, 53.0, 68.0, 50.0, 65.0, 51.0, 45.0, 45.0, 27.0, 40.0, 44.0, 25.0, 18.0, 28.0, 18.0, 13.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.6744384765625, -11.231689453125, -10.7889404296875, -10.34619140625, -9.9034423828125, -9.460693359375, -9.0179443359375, -8.5751953125, -8.1324462890625, -7.689697265625, -7.2469482421875, -6.80419921875, -6.3614501953125, -5.918701171875, -5.4759521484375, -5.033203125, -4.5904541015625, -4.147705078125, -3.7049560546875, -3.26220703125, -2.8194580078125, -2.376708984375, -1.9339599609375, -1.4912109375, -1.0484619140625, -0.605712890625, -0.1629638671875, 0.27978515625, 0.7225341796875, 1.165283203125, 1.6080322265625, 2.05078125, 2.4935302734375, 2.936279296875, 3.3790283203125, 3.82177734375, 4.2645263671875, 4.707275390625, 5.1500244140625, 5.5927734375, 6.0355224609375, 6.478271484375, 6.9210205078125, 7.36376953125, 7.8065185546875, 8.249267578125, 8.6920166015625, 9.134765625, 9.5775146484375, 10.020263671875, 10.4630126953125, 10.90576171875, 11.3485107421875, 11.791259765625, 12.2340087890625, 12.6767578125, 13.1195068359375, 13.562255859375, 14.0050048828125, 14.44775390625, 14.8905029296875, 15.333251953125, 15.7760009765625, 16.21875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 11.0, 14.0, 17.0, 37.0, 55.0, 151.0, 390.0, 1559.0, 12929.0, 235608.0, 766106.0, 28057.0, 2706.0, 524.0, 191.0, 80.0, 38.0, 22.0, 12.0, 12.0, 8.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.234375, -15.5888671875, -14.943359375, -14.2978515625, -13.65234375, -13.0068359375, -12.361328125, -11.7158203125, -11.0703125, -10.4248046875, -9.779296875, -9.1337890625, -8.48828125, -7.8427734375, -7.197265625, -6.5517578125, -5.90625, -5.2607421875, -4.615234375, -3.9697265625, -3.32421875, -2.6787109375, -2.033203125, -1.3876953125, -0.7421875, -0.0966796875, 0.548828125, 1.1943359375, 1.83984375, 2.4853515625, 3.130859375, 3.7763671875, 4.421875, 5.0673828125, 5.712890625, 6.3583984375, 7.00390625, 7.6494140625, 8.294921875, 8.9404296875, 9.5859375, 10.2314453125, 10.876953125, 11.5224609375, 12.16796875, 12.8134765625, 13.458984375, 14.1044921875, 14.75, 15.3955078125, 16.041015625, 16.6865234375, 17.33203125, 17.9775390625, 18.623046875, 19.2685546875, 19.9140625, 20.5595703125, 21.205078125, 21.8505859375, 22.49609375, 23.1416015625, 23.787109375, 24.4326171875, 25.078125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 6.0, 5.0, 6.0, 13.0, 10.0, 14.0, 11.0, 22.0, 26.0, 36.0, 30.0, 94.0, 171.0, 212.0, 115.0, 47.0, 34.0, 25.0, 18.0, 19.0, 10.0, 18.0, 4.0, 6.0, 7.0, 6.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.001926422119140625, -0.0018717795610427856, -0.0018171370029449463, -0.001762494444847107, -0.0017078518867492676, -0.0016532093286514282, -0.0015985667705535889, -0.0015439242124557495, -0.0014892816543579102, -0.0014346390962600708, -0.0013799965381622314, -0.001325353980064392, -0.0012707114219665527, -0.0012160688638687134, -0.001161426305770874, -0.0011067837476730347, -0.0010521411895751953, -0.000997498631477356, -0.0009428560733795166, -0.0008882135152816772, -0.0008335709571838379, -0.0007789283990859985, -0.0007242858409881592, -0.0006696432828903198, -0.0006150007247924805, -0.0005603581666946411, -0.0005057156085968018, -0.0004510730504989624, -0.00039643049240112305, -0.0003417879343032837, -0.00028714537620544434, -0.00023250281810760498, -0.00017786026000976562, -0.00012321770191192627, -6.857514381408691e-05, -1.3932585716247559e-05, 4.07099723815918e-05, 9.535253047943115e-05, 0.0001499950885772705, 0.00020463764667510986, 0.0002592802047729492, 0.0003139227628707886, 0.00036856532096862793, 0.0004232078790664673, 0.00047785043716430664, 0.000532492995262146, 0.0005871355533599854, 0.0006417781114578247, 0.0006964206695556641, 0.0007510632276535034, 0.0008057057857513428, 0.0008603483438491821, 0.0009149909019470215, 0.0009696334600448608, 0.0010242760181427002, 0.0010789185762405396, 0.001133561134338379, 0.0011882036924362183, 0.0012428462505340576, 0.001297488808631897, 0.0013521313667297363, 0.0014067739248275757, 0.001461416482925415, 0.0015160590410232544, 0.0015707015991210938]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 7.0, 17.0, 16.0, 35.0, 41.0, 69.0, 135.0, 294.0, 671.0, 1802.0, 7284.0, 52681.0, 833387.0, 132713.0, 14667.0, 2896.0, 983.0, 399.0, 206.0, 95.0, 60.0, 33.0, 20.0, 12.0, 5.0, 4.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.265625, -13.71044921875, -13.1552734375, -12.60009765625, -12.044921875, -11.48974609375, -10.9345703125, -10.37939453125, -9.82421875, -9.26904296875, -8.7138671875, -8.15869140625, -7.603515625, -7.04833984375, -6.4931640625, -5.93798828125, -5.3828125, -4.82763671875, -4.2724609375, -3.71728515625, -3.162109375, -2.60693359375, -2.0517578125, -1.49658203125, -0.94140625, -0.38623046875, 0.1689453125, 0.72412109375, 1.279296875, 1.83447265625, 2.3896484375, 2.94482421875, 3.5, 4.05517578125, 4.6103515625, 5.16552734375, 5.720703125, 6.27587890625, 6.8310546875, 7.38623046875, 7.94140625, 8.49658203125, 9.0517578125, 9.60693359375, 10.162109375, 10.71728515625, 11.2724609375, 11.82763671875, 12.3828125, 12.93798828125, 13.4931640625, 14.04833984375, 14.603515625, 15.15869140625, 15.7138671875, 16.26904296875, 16.82421875, 17.37939453125, 17.9345703125, 18.48974609375, 19.044921875, 19.60009765625, 20.1552734375, 20.71044921875, 21.265625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 4.0, 7.0, 14.0, 17.0, 19.0, 38.0, 53.0, 127.0, 283.0, 199.0, 83.0, 44.0, 22.0, 19.0, 17.0, 11.0, 9.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.9140625, -9.5284423828125, -9.142822265625, -8.7572021484375, -8.37158203125, -7.9859619140625, -7.600341796875, -7.2147216796875, -6.8291015625, -6.4434814453125, -6.057861328125, -5.6722412109375, -5.28662109375, -4.9010009765625, -4.515380859375, -4.1297607421875, -3.744140625, -3.3585205078125, -2.972900390625, -2.5872802734375, -2.20166015625, -1.8160400390625, -1.430419921875, -1.0447998046875, -0.6591796875, -0.2735595703125, 0.112060546875, 0.4976806640625, 0.88330078125, 1.2689208984375, 1.654541015625, 2.0401611328125, 2.42578125, 2.8114013671875, 3.197021484375, 3.5826416015625, 3.96826171875, 4.3538818359375, 4.739501953125, 5.1251220703125, 5.5107421875, 5.8963623046875, 6.281982421875, 6.6676025390625, 7.05322265625, 7.4388427734375, 7.824462890625, 8.2100830078125, 8.595703125, 8.9813232421875, 9.366943359375, 9.7525634765625, 10.13818359375, 10.5238037109375, 10.909423828125, 11.2950439453125, 11.6806640625, 12.0662841796875, 12.451904296875, 12.8375244140625, 13.22314453125, 13.6087646484375, 13.994384765625, 14.3800048828125, 14.765625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 19.0, 74.0, 143.0, 228.0, 249.0, 169.0, 67.0, 28.0, 12.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-254.49009704589844, -247.62008666992188, -240.75009155273438, -233.8800811767578, -227.01007080078125, -220.14007568359375, -213.2700653076172, -206.40005493164062, -199.53005981445312, -192.66004943847656, -185.79005432128906, -178.9200439453125, -172.050048828125, -165.18003845214844, -158.31002807617188, -151.44003295898438, -144.5700225830078, -137.70001220703125, -130.83001708984375, -123.96000671386719, -117.09000396728516, -110.22000122070312, -103.34999084472656, -96.47998809814453, -89.6099853515625, -82.73998260498047, -75.86997985839844, -68.99996948242188, -62.129966735839844, -55.25996398925781, -48.389957427978516, -41.51995086669922, -34.64996337890625, -27.779958724975586, -20.909954071044922, -14.039949417114258, -7.169944763183594, -0.2999420166015625, 6.570064544677734, 13.440071105957031, 20.310073852539062, 27.180078506469727, 34.05008316040039, 40.92008972167969, 47.79009246826172, 54.66009521484375, 61.53010177612305, 68.40010833740234, 75.27011108398438, 82.1401138305664, 89.01011657714844, 95.880126953125, 102.75012969970703, 109.62013244628906, 116.49014282226562, 123.36014556884766, 130.2301483154297, 137.10015869140625, 143.97015380859375, 150.8401641845703, 157.71017456054688, 164.58016967773438, 171.45018005371094, 178.3201904296875, 185.190185546875]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 5.0, 3.0, 5.0, 6.0, 8.0, 10.0, 14.0, 12.0, 22.0, 24.0, 18.0, 38.0, 26.0, 25.0, 37.0, 34.0, 34.0, 44.0, 38.0, 50.0, 39.0, 41.0, 58.0, 30.0, 43.0, 40.0, 36.0, 39.0, 30.0, 24.0, 30.0, 20.0, 35.0, 14.0, 15.0, 11.0, 9.0, 9.0, 5.0, 4.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-66.76054382324219, -64.84466552734375, -62.92879104614258, -61.012916564941406, -59.097042083740234, -57.18116760253906, -55.265289306640625, -53.34941482543945, -51.43354034423828, -49.51766586303711, -47.60178756713867, -45.6859130859375, -43.77003860473633, -41.854164123535156, -39.93828582763672, -38.02241134643555, -36.10653305053711, -34.19065856933594, -32.2747802734375, -30.358905792236328, -28.443031311035156, -26.52715492248535, -24.611278533935547, -22.695404052734375, -20.77952766418457, -18.863651275634766, -16.947776794433594, -15.031900405883789, -13.1160249710083, -11.200149536132812, -9.284273147583008, -7.3683977127075195, -5.452518463134766, -3.5366427898406982, -1.6207671165466309, 0.2951087951660156, 2.210984230041504, 4.126859664916992, 6.042736053466797, 7.958611488342285, 9.874486923217773, 11.790362358093262, 13.70623779296875, 15.622114181518555, 17.53799057006836, 19.45386505126953, 21.369741439819336, 23.28561782836914, 25.201492309570312, 27.117368698120117, 29.03324317932129, 30.949119567871094, 32.864994049072266, 34.78086853027344, 36.696746826171875, 38.61262130737305, 40.52849578857422, 42.44437026977539, 44.36024856567383, 46.276123046875, 48.19199752807617, 50.107872009277344, 52.02375030517578, 53.93962478637695, 55.85550308227539]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 10.0, 12.0, 20.0, 25.0, 27.0, 39.0, 67.0, 76.0, 109.0, 184.0, 296.0, 491.0, 793.0, 1316.0, 2451.0, 4786.0, 9819.0, 22889.0, 67573.0, 343001.0, 3330379.0, 305200.0, 63589.0, 21758.0, 9246.0, 4486.0, 2408.0, 1292.0, 753.0, 445.0, 280.0, 149.0, 95.0, 72.0, 39.0, 38.0, 20.0, 11.0, 9.0, 5.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.9921875, -13.5863037109375, -13.180419921875, -12.7745361328125, -12.36865234375, -11.9627685546875, -11.556884765625, -11.1510009765625, -10.7451171875, -10.3392333984375, -9.933349609375, -9.5274658203125, -9.12158203125, -8.7156982421875, -8.309814453125, -7.9039306640625, -7.498046875, -7.0921630859375, -6.686279296875, -6.2803955078125, -5.87451171875, -5.4686279296875, -5.062744140625, -4.6568603515625, -4.2509765625, -3.8450927734375, -3.439208984375, -3.0333251953125, -2.62744140625, -2.2215576171875, -1.815673828125, -1.4097900390625, -1.00390625, -0.5980224609375, -0.192138671875, 0.2137451171875, 0.61962890625, 1.0255126953125, 1.431396484375, 1.8372802734375, 2.2431640625, 2.6490478515625, 3.054931640625, 3.4608154296875, 3.86669921875, 4.2725830078125, 4.678466796875, 5.0843505859375, 5.490234375, 5.8961181640625, 6.302001953125, 6.7078857421875, 7.11376953125, 7.5196533203125, 7.925537109375, 8.3314208984375, 8.7373046875, 9.1431884765625, 9.549072265625, 9.9549560546875, 10.36083984375, 10.7667236328125, 11.172607421875, 11.5784912109375, 11.984375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 12.0, 16.0, 17.0, 23.0, 33.0, 38.0, 47.0, 60.0, 68.0, 59.0, 71.0, 59.0, 70.0, 68.0, 71.0, 51.0, 58.0, 55.0, 34.0, 27.0, 15.0, 15.0, 10.0, 4.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1640625, -5.027069091796875, -4.89007568359375, -4.753082275390625, -4.6160888671875, -4.479095458984375, -4.34210205078125, -4.205108642578125, -4.068115234375, -3.931121826171875, -3.79412841796875, -3.657135009765625, -3.5201416015625, -3.383148193359375, -3.24615478515625, -3.109161376953125, -2.97216796875, -2.835174560546875, -2.69818115234375, -2.561187744140625, -2.4241943359375, -2.287200927734375, -2.15020751953125, -2.013214111328125, -1.876220703125, -1.739227294921875, -1.60223388671875, -1.465240478515625, -1.3282470703125, -1.191253662109375, -1.05426025390625, -0.917266845703125, -0.7802734375, -0.643280029296875, -0.50628662109375, -0.369293212890625, -0.2322998046875, -0.095306396484375, 0.04168701171875, 0.178680419921875, 0.315673828125, 0.452667236328125, 0.58966064453125, 0.726654052734375, 0.8636474609375, 1.000640869140625, 1.13763427734375, 1.274627685546875, 1.41162109375, 1.548614501953125, 1.68560791015625, 1.822601318359375, 1.9595947265625, 2.096588134765625, 2.23358154296875, 2.370574951171875, 2.507568359375, 2.644561767578125, 2.78155517578125, 2.918548583984375, 3.0555419921875, 3.192535400390625, 3.32952880859375, 3.466522216796875, 3.603515625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 10.0, 12.0, 16.0, 18.0, 29.0, 39.0, 72.0, 101.0, 137.0, 208.0, 407.0, 617.0, 1102.0, 1924.0, 3473.0, 7353.0, 15952.0, 42602.0, 165397.0, 1891068.0, 1826654.0, 163784.0, 42355.0, 15865.0, 6970.0, 3515.0, 1855.0, 1082.0, 625.0, 347.0, 226.0, 132.0, 95.0, 73.0, 38.0, 31.0, 26.0, 17.0, 12.0, 13.0, 5.0, 4.0, 5.0, 1.0, 0.0, 3.0, 2.0, 6.0], "bins": [-13.71875, -13.337646484375, -12.95654296875, -12.575439453125, -12.1943359375, -11.813232421875, -11.43212890625, -11.051025390625, -10.669921875, -10.288818359375, -9.90771484375, -9.526611328125, -9.1455078125, -8.764404296875, -8.38330078125, -8.002197265625, -7.62109375, -7.239990234375, -6.85888671875, -6.477783203125, -6.0966796875, -5.715576171875, -5.33447265625, -4.953369140625, -4.572265625, -4.191162109375, -3.81005859375, -3.428955078125, -3.0478515625, -2.666748046875, -2.28564453125, -1.904541015625, -1.5234375, -1.142333984375, -0.76123046875, -0.380126953125, 0.0009765625, 0.382080078125, 0.76318359375, 1.144287109375, 1.525390625, 1.906494140625, 2.28759765625, 2.668701171875, 3.0498046875, 3.430908203125, 3.81201171875, 4.193115234375, 4.57421875, 4.955322265625, 5.33642578125, 5.717529296875, 6.0986328125, 6.479736328125, 6.86083984375, 7.241943359375, 7.623046875, 8.004150390625, 8.38525390625, 8.766357421875, 9.1474609375, 9.528564453125, 9.90966796875, 10.290771484375, 10.671875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 7.0, 7.0, 10.0, 19.0, 8.0, 18.0, 40.0, 38.0, 91.0, 136.0, 288.0, 693.0, 1544.0, 585.0, 248.0, 132.0, 77.0, 44.0, 16.0, 23.0, 10.0, 9.0, 12.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.53515625, -5.31744384765625, -5.0997314453125, -4.88201904296875, -4.664306640625, -4.44659423828125, -4.2288818359375, -4.01116943359375, -3.79345703125, -3.57574462890625, -3.3580322265625, -3.14031982421875, -2.922607421875, -2.70489501953125, -2.4871826171875, -2.26947021484375, -2.0517578125, -1.83404541015625, -1.6163330078125, -1.39862060546875, -1.180908203125, -0.96319580078125, -0.7454833984375, -0.52777099609375, -0.31005859375, -0.09234619140625, 0.1253662109375, 0.34307861328125, 0.560791015625, 0.77850341796875, 0.9962158203125, 1.21392822265625, 1.431640625, 1.64935302734375, 1.8670654296875, 2.08477783203125, 2.302490234375, 2.52020263671875, 2.7379150390625, 2.95562744140625, 3.17333984375, 3.39105224609375, 3.6087646484375, 3.82647705078125, 4.044189453125, 4.26190185546875, 4.4796142578125, 4.69732666015625, 4.9150390625, 5.13275146484375, 5.3504638671875, 5.56817626953125, 5.785888671875, 6.00360107421875, 6.2213134765625, 6.43902587890625, 6.65673828125, 6.87445068359375, 7.0921630859375, 7.30987548828125, 7.527587890625, 7.74530029296875, 7.9630126953125, 8.18072509765625, 8.3984375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 10.0, 11.0, 27.0, 42.0, 63.0, 80.0, 125.0, 131.0, 152.0, 120.0, 92.0, 61.0, 34.0, 19.0, 15.0, 8.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.06793212890625, -44.725563049316406, -43.38319778442383, -42.040828704833984, -40.698463439941406, -39.35609436035156, -38.013729095458984, -36.67136001586914, -35.32899475097656, -33.98662567138672, -32.64426040649414, -31.30189323425293, -29.95952606201172, -28.617158889770508, -27.274791717529297, -25.932422637939453, -24.590055465698242, -23.24768829345703, -21.90532112121582, -20.56295394897461, -19.2205867767334, -17.878219604492188, -16.535850524902344, -15.19348430633545, -13.851117134094238, -12.508749961853027, -11.166382789611816, -9.824014663696289, -8.481647491455078, -7.139280796051025, -5.796913146972656, -4.454545974731445, -3.1121788024902344, -1.7698115110397339, -0.4274442195892334, 0.9149231910705566, 2.2572903633117676, 3.5996575355529785, 4.942025184631348, 6.284392356872559, 7.6267595291137695, 8.96912670135498, 10.311493873596191, 11.653861999511719, 12.99622917175293, 14.33859634399414, 15.680963516235352, 17.023330688476562, 18.365697860717773, 19.708065032958984, 21.050432205200195, 22.392799377441406, 23.735166549682617, 25.077533721923828, 26.419902801513672, 27.76226806640625, 29.104637145996094, 30.447004318237305, 31.789371490478516, 33.13174057006836, 34.47410583496094, 35.81647491455078, 37.15884017944336, 38.5012092590332, 39.84357452392578]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 7.0, 10.0, 10.0, 12.0, 14.0, 21.0, 17.0, 22.0, 29.0, 25.0, 31.0, 35.0, 44.0, 38.0, 25.0, 29.0, 39.0, 36.0, 33.0, 58.0, 39.0, 51.0, 36.0, 33.0, 34.0, 31.0, 30.0, 31.0, 23.0, 21.0, 18.0, 15.0, 15.0, 16.0, 11.0, 8.0, 8.0, 8.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.29275894165039, -16.720579147338867, -16.148399353027344, -15.576218605041504, -15.004037857055664, -14.43185806274414, -13.859678268432617, -13.287498474121094, -12.715317726135254, -12.14313793182373, -11.57095718383789, -10.998777389526367, -10.426597595214844, -9.854416847229004, -9.28223705291748, -8.71005630493164, -8.137876510620117, -7.5656962394714355, -6.993515968322754, -6.4213361740112305, -5.849155902862549, -5.276975631713867, -4.704795837402344, -4.132615566253662, -3.5604352951049805, -2.988255023956299, -2.4160749912261963, -1.8438948392868042, -1.271714687347412, -0.6995344161987305, -0.12735438346862793, 0.4448256492614746, 1.0170059204101562, 1.5891860723495483, 2.1613662242889404, 2.733546257019043, 3.3057265281677246, 3.8779067993164062, 4.45008659362793, 5.022266864776611, 5.594447135925293, 6.166627407073975, 6.738807678222656, 7.31098747253418, 7.883167743682861, 8.455348014831543, 9.027527809143066, 9.599708557128906, 10.17188835144043, 10.744068145751953, 11.316248893737793, 11.888428688049316, 12.460609436035156, 13.03278923034668, 13.604969024658203, 14.177148818969727, 14.749329566955566, 15.32150936126709, 15.89369010925293, 16.465869903564453, 17.038049697875977, 17.6102294921875, 18.182411193847656, 18.75459098815918, 19.326770782470703]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 10.0, 11.0, 22.0, 13.0, 34.0, 38.0, 65.0, 98.0, 130.0, 220.0, 366.0, 629.0, 1250.0, 2497.0, 4967.0, 10508.0, 23039.0, 50197.0, 125097.0, 402288.0, 270684.0, 85719.0, 37353.0, 17317.0, 8030.0, 3694.0, 1858.0, 983.0, 539.0, 326.0, 194.0, 140.0, 76.0, 39.0, 34.0, 29.0, 19.0, 15.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0], "bins": [-14.1328125, -13.7489013671875, -13.364990234375, -12.9810791015625, -12.59716796875, -12.2132568359375, -11.829345703125, -11.4454345703125, -11.0615234375, -10.6776123046875, -10.293701171875, -9.9097900390625, -9.52587890625, -9.1419677734375, -8.758056640625, -8.3741455078125, -7.990234375, -7.6063232421875, -7.222412109375, -6.8385009765625, -6.45458984375, -6.0706787109375, -5.686767578125, -5.3028564453125, -4.9189453125, -4.5350341796875, -4.151123046875, -3.7672119140625, -3.38330078125, -2.9993896484375, -2.615478515625, -2.2315673828125, -1.84765625, -1.4637451171875, -1.079833984375, -0.6959228515625, -0.31201171875, 0.0718994140625, 0.455810546875, 0.8397216796875, 1.2236328125, 1.6075439453125, 1.991455078125, 2.3753662109375, 2.75927734375, 3.1431884765625, 3.527099609375, 3.9110107421875, 4.294921875, 4.6788330078125, 5.062744140625, 5.4466552734375, 5.83056640625, 6.2144775390625, 6.598388671875, 6.9822998046875, 7.3662109375, 7.7501220703125, 8.134033203125, 8.5179443359375, 8.90185546875, 9.2857666015625, 9.669677734375, 10.0535888671875, 10.4375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 10.0, 16.0, 13.0, 11.0, 21.0, 36.0, 46.0, 43.0, 37.0, 53.0, 51.0, 61.0, 59.0, 59.0, 58.0, 56.0, 54.0, 55.0, 45.0, 45.0, 39.0, 30.0, 27.0, 20.0, 10.0, 6.0, 11.0, 5.0, 8.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.01171875, -3.895416259765625, -3.77911376953125, -3.662811279296875, -3.5465087890625, -3.430206298828125, -3.31390380859375, -3.197601318359375, -3.081298828125, -2.964996337890625, -2.84869384765625, -2.732391357421875, -2.6160888671875, -2.499786376953125, -2.38348388671875, -2.267181396484375, -2.15087890625, -2.034576416015625, -1.91827392578125, -1.801971435546875, -1.6856689453125, -1.569366455078125, -1.45306396484375, -1.336761474609375, -1.220458984375, -1.104156494140625, -0.98785400390625, -0.871551513671875, -0.7552490234375, -0.638946533203125, -0.52264404296875, -0.406341552734375, -0.2900390625, -0.173736572265625, -0.05743408203125, 0.058868408203125, 0.1751708984375, 0.291473388671875, 0.40777587890625, 0.524078369140625, 0.640380859375, 0.756683349609375, 0.87298583984375, 0.989288330078125, 1.1055908203125, 1.221893310546875, 1.33819580078125, 1.454498291015625, 1.57080078125, 1.687103271484375, 1.80340576171875, 1.919708251953125, 2.0360107421875, 2.152313232421875, 2.26861572265625, 2.384918212890625, 2.501220703125, 2.617523193359375, 2.73382568359375, 2.850128173828125, 2.9664306640625, 3.082733154296875, 3.19903564453125, 3.315338134765625, 3.431640625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 10.0, 8.0, 16.0, 16.0, 18.0, 30.0, 30.0, 42.0, 82.0, 80.0, 143.0, 264.0, 562.0, 1228.0, 2922.0, 7550.0, 20582.0, 64269.0, 429683.0, 423983.0, 63578.0, 20574.0, 7574.0, 2879.0, 1110.0, 540.0, 277.0, 169.0, 98.0, 69.0, 43.0, 36.0, 26.0, 19.0, 10.0, 10.0, 7.0, 8.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-19.34375, -18.791015625, -18.23828125, -17.685546875, -17.1328125, -16.580078125, -16.02734375, -15.474609375, -14.921875, -14.369140625, -13.81640625, -13.263671875, -12.7109375, -12.158203125, -11.60546875, -11.052734375, -10.5, -9.947265625, -9.39453125, -8.841796875, -8.2890625, -7.736328125, -7.18359375, -6.630859375, -6.078125, -5.525390625, -4.97265625, -4.419921875, -3.8671875, -3.314453125, -2.76171875, -2.208984375, -1.65625, -1.103515625, -0.55078125, 0.001953125, 0.5546875, 1.107421875, 1.66015625, 2.212890625, 2.765625, 3.318359375, 3.87109375, 4.423828125, 4.9765625, 5.529296875, 6.08203125, 6.634765625, 7.1875, 7.740234375, 8.29296875, 8.845703125, 9.3984375, 9.951171875, 10.50390625, 11.056640625, 11.609375, 12.162109375, 12.71484375, 13.267578125, 13.8203125, 14.373046875, 14.92578125, 15.478515625, 16.03125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 5.0, 8.0, 6.0, 4.0, 10.0, 9.0, 7.0, 13.0, 17.0, 25.0, 16.0, 29.0, 31.0, 45.0, 42.0, 44.0, 53.0, 52.0, 57.0, 67.0, 46.0, 50.0, 47.0, 44.0, 50.0, 47.0, 23.0, 31.0, 18.0, 22.0, 18.0, 9.0, 10.0, 7.0, 7.0, 6.0, 4.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.5625, -12.146484375, -11.73046875, -11.314453125, -10.8984375, -10.482421875, -10.06640625, -9.650390625, -9.234375, -8.818359375, -8.40234375, -7.986328125, -7.5703125, -7.154296875, -6.73828125, -6.322265625, -5.90625, -5.490234375, -5.07421875, -4.658203125, -4.2421875, -3.826171875, -3.41015625, -2.994140625, -2.578125, -2.162109375, -1.74609375, -1.330078125, -0.9140625, -0.498046875, -0.08203125, 0.333984375, 0.75, 1.166015625, 1.58203125, 1.998046875, 2.4140625, 2.830078125, 3.24609375, 3.662109375, 4.078125, 4.494140625, 4.91015625, 5.326171875, 5.7421875, 6.158203125, 6.57421875, 6.990234375, 7.40625, 7.822265625, 8.23828125, 8.654296875, 9.0703125, 9.486328125, 9.90234375, 10.318359375, 10.734375, 11.150390625, 11.56640625, 11.982421875, 12.3984375, 12.814453125, 13.23046875, 13.646484375, 14.0625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 9.0, 21.0, 25.0, 39.0, 72.0, 119.0, 301.0, 636.0, 1920.0, 5702.0, 18623.0, 59382.0, 499081.0, 385433.0, 52698.0, 16613.0, 5124.0, 1585.0, 670.0, 258.0, 100.0, 58.0, 28.0, 19.0, 20.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.390625, -5.13330078125, -4.8759765625, -4.61865234375, -4.361328125, -4.10400390625, -3.8466796875, -3.58935546875, -3.33203125, -3.07470703125, -2.8173828125, -2.56005859375, -2.302734375, -2.04541015625, -1.7880859375, -1.53076171875, -1.2734375, -1.01611328125, -0.7587890625, -0.50146484375, -0.244140625, 0.01318359375, 0.2705078125, 0.52783203125, 0.78515625, 1.04248046875, 1.2998046875, 1.55712890625, 1.814453125, 2.07177734375, 2.3291015625, 2.58642578125, 2.84375, 3.10107421875, 3.3583984375, 3.61572265625, 3.873046875, 4.13037109375, 4.3876953125, 4.64501953125, 4.90234375, 5.15966796875, 5.4169921875, 5.67431640625, 5.931640625, 6.18896484375, 6.4462890625, 6.70361328125, 6.9609375, 7.21826171875, 7.4755859375, 7.73291015625, 7.990234375, 8.24755859375, 8.5048828125, 8.76220703125, 9.01953125, 9.27685546875, 9.5341796875, 9.79150390625, 10.048828125, 10.30615234375, 10.5634765625, 10.82080078125, 11.078125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 2.0, 7.0, 5.0, 8.0, 10.0, 8.0, 20.0, 23.0, 22.0, 47.0, 252.0, 383.0, 99.0, 37.0, 22.0, 15.0, 11.0, 13.0, 13.0, 7.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013904571533203125, -0.0012923777103424072, -0.001194298267364502, -0.0010962188243865967, -0.0009981393814086914, -0.0009000599384307861, -0.0008019804954528809, -0.0007039010524749756, -0.0006058216094970703, -0.000507742166519165, -0.00040966272354125977, -0.0003115832805633545, -0.00021350383758544922, -0.00011542439460754395, -1.7344951629638672e-05, 8.07344913482666e-05, 0.00017881393432617188, 0.00027689337730407715, 0.0003749728202819824, 0.0004730522632598877, 0.000571131706237793, 0.0006692111492156982, 0.0007672905921936035, 0.0008653700351715088, 0.0009634494781494141, 0.0010615289211273193, 0.0011596083641052246, 0.0012576878070831299, 0.0013557672500610352, 0.0014538466930389404, 0.0015519261360168457, 0.001650005578994751, 0.0017480850219726562, 0.0018461644649505615, 0.0019442439079284668, 0.002042323350906372, 0.0021404027938842773, 0.0022384822368621826, 0.002336561679840088, 0.002434641122817993, 0.0025327205657958984, 0.0026308000087738037, 0.002728879451751709, 0.0028269588947296143, 0.0029250383377075195, 0.003023117780685425, 0.00312119722366333, 0.0032192766666412354, 0.0033173561096191406, 0.003415435552597046, 0.003513514995574951, 0.0036115944385528564, 0.0037096738815307617, 0.003807753324508667, 0.0039058327674865723, 0.0040039122104644775, 0.004101991653442383, 0.004200071096420288, 0.004298150539398193, 0.004396229982376099, 0.004494309425354004, 0.004592388868331909, 0.0046904683113098145, 0.00478854775428772, 0.004886627197265625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 9.0, 8.0, 14.0, 35.0, 26.0, 69.0, 99.0, 209.0, 375.0, 762.0, 2156.0, 6662.0, 22826.0, 90831.0, 765097.0, 120273.0, 26977.0, 7859.0, 2512.0, 910.0, 367.0, 179.0, 104.0, 68.0, 42.0, 30.0, 17.0, 10.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.53125, -10.25091552734375, -9.9705810546875, -9.69024658203125, -9.409912109375, -9.12957763671875, -8.8492431640625, -8.56890869140625, -8.28857421875, -8.00823974609375, -7.7279052734375, -7.44757080078125, -7.167236328125, -6.88690185546875, -6.6065673828125, -6.32623291015625, -6.0458984375, -5.76556396484375, -5.4852294921875, -5.20489501953125, -4.924560546875, -4.64422607421875, -4.3638916015625, -4.08355712890625, -3.80322265625, -3.52288818359375, -3.2425537109375, -2.96221923828125, -2.681884765625, -2.40155029296875, -2.1212158203125, -1.84088134765625, -1.560546875, -1.28021240234375, -0.9998779296875, -0.71954345703125, -0.439208984375, -0.15887451171875, 0.1214599609375, 0.40179443359375, 0.68212890625, 0.96246337890625, 1.2427978515625, 1.52313232421875, 1.803466796875, 2.08380126953125, 2.3641357421875, 2.64447021484375, 2.9248046875, 3.20513916015625, 3.4854736328125, 3.76580810546875, 4.046142578125, 4.32647705078125, 4.6068115234375, 4.88714599609375, 5.16748046875, 5.44781494140625, 5.7281494140625, 6.00848388671875, 6.288818359375, 6.56915283203125, 6.8494873046875, 7.12982177734375, 7.41015625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 8.0, 12.0, 11.0, 16.0, 20.0, 33.0, 38.0, 108.0, 184.0, 242.0, 145.0, 65.0, 30.0, 24.0, 15.0, 15.0, 10.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.21875, -10.96484375, -10.7109375, -10.45703125, -10.203125, -9.94921875, -9.6953125, -9.44140625, -9.1875, -8.93359375, -8.6796875, -8.42578125, -8.171875, -7.91796875, -7.6640625, -7.41015625, -7.15625, -6.90234375, -6.6484375, -6.39453125, -6.140625, -5.88671875, -5.6328125, -5.37890625, -5.125, -4.87109375, -4.6171875, -4.36328125, -4.109375, -3.85546875, -3.6015625, -3.34765625, -3.09375, -2.83984375, -2.5859375, -2.33203125, -2.078125, -1.82421875, -1.5703125, -1.31640625, -1.0625, -0.80859375, -0.5546875, -0.30078125, -0.046875, 0.20703125, 0.4609375, 0.71484375, 0.96875, 1.22265625, 1.4765625, 1.73046875, 1.984375, 2.23828125, 2.4921875, 2.74609375, 3.0, 3.25390625, 3.5078125, 3.76171875, 4.015625, 4.26953125, 4.5234375, 4.77734375, 5.03125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 3.0, 16.0, 21.0, 33.0, 44.0, 59.0, 104.0, 109.0, 117.0, 123.0, 103.0, 84.0, 59.0, 38.0, 27.0, 26.0, 19.0, 8.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.19029235839844, -64.12901306152344, -61.06774139404297, -58.006465911865234, -54.9451904296875, -51.883914947509766, -48.82263946533203, -45.76136016845703, -42.70008850097656, -39.63881301879883, -36.577537536621094, -33.51626205444336, -30.454986572265625, -27.39371109008789, -24.332433700561523, -21.27115821838379, -18.209880828857422, -15.148605346679688, -12.087329864501953, -9.026053428649902, -5.964777946472168, -2.9035024642944336, 0.1577739715576172, 3.2190494537353516, 6.280324935913086, 9.34160041809082, 12.402875900268555, 15.464152336120605, 18.525428771972656, 21.58670425415039, 24.647979736328125, 27.70925521850586, 30.770530700683594, 33.83180618286133, 36.89308166503906, 39.9543571472168, 43.01563262939453, 46.076908111572266, 49.13818359375, 52.199462890625, 55.26073455810547, 58.3220100402832, 61.38328552246094, 64.44456481933594, 67.5058364868164, 70.5671157836914, 73.62838745117188, 76.68966674804688, 79.75094604492188, 82.81222534179688, 85.87349700927734, 88.93477630615234, 91.99604797363281, 95.05732727050781, 98.11859893798828, 101.17987823486328, 104.24114990234375, 107.30242919921875, 110.36370086669922, 113.42498016357422, 116.48625183105469, 119.54753112792969, 122.60880279541016, 125.67008209228516, 128.73135375976562]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 10.0, 5.0, 6.0, 5.0, 9.0, 8.0, 13.0, 9.0, 16.0, 20.0, 23.0, 26.0, 33.0, 33.0, 28.0, 30.0, 38.0, 41.0, 30.0, 44.0, 49.0, 48.0, 46.0, 38.0, 50.0, 49.0, 40.0, 34.0, 27.0, 25.0, 26.0, 29.0, 23.0, 15.0, 18.0, 19.0, 8.0, 11.0, 5.0, 6.0, 4.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.872650146484375, -56.1311149597168, -54.38957595825195, -52.648040771484375, -50.90650177001953, -49.16496658325195, -47.423431396484375, -45.68189239501953, -43.94035720825195, -42.198822021484375, -40.45728302001953, -38.71574783325195, -36.974212646484375, -35.23267364501953, -33.49113845825195, -31.749601364135742, -30.00806427001953, -28.26652717590332, -26.52499008178711, -24.78345489501953, -23.04191780090332, -21.30038070678711, -19.55884552001953, -17.81730842590332, -16.07577133178711, -14.334234237670898, -12.592698097229004, -10.85116195678711, -9.109624862670898, -7.3680877685546875, -5.626551628112793, -3.8850154876708984, -2.143482208251953, -0.4019455909729004, 1.3395910263061523, 3.081127643585205, 4.822664260864258, 6.564201354980469, 8.305737495422363, 10.047273635864258, 11.788810729980469, 13.53034782409668, 15.271883964538574, 17.01342010498047, 18.75495719909668, 20.49649429321289, 22.23802947998047, 23.97956657409668, 25.72110366821289, 27.4626407623291, 29.204177856445312, 30.94571304321289, 32.68724822998047, 34.42878723144531, 36.17032241821289, 37.91185760498047, 39.65339660644531, 41.39493179321289, 43.136470794677734, 44.87800598144531, 46.619544982910156, 48.361080169677734, 50.10261535644531, 51.844154357910156, 53.585689544677734]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 4.0, 6.0, 2.0, 11.0, 4.0, 12.0, 22.0, 22.0, 28.0, 61.0, 85.0, 139.0, 235.0, 321.0, 609.0, 1048.0, 2047.0, 4037.0, 8232.0, 19156.0, 53166.0, 239539.0, 3369557.0, 383114.0, 69541.0, 23406.0, 9923.0, 4797.0, 2287.0, 1216.0, 720.0, 376.0, 220.0, 116.0, 79.0, 58.0, 30.0, 16.0, 18.0, 10.0, 6.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.453125, -17.904052734375, -17.35498046875, -16.805908203125, -16.2568359375, -15.707763671875, -15.15869140625, -14.609619140625, -14.060546875, -13.511474609375, -12.96240234375, -12.413330078125, -11.8642578125, -11.315185546875, -10.76611328125, -10.217041015625, -9.66796875, -9.118896484375, -8.56982421875, -8.020751953125, -7.4716796875, -6.922607421875, -6.37353515625, -5.824462890625, -5.275390625, -4.726318359375, -4.17724609375, -3.628173828125, -3.0791015625, -2.530029296875, -1.98095703125, -1.431884765625, -0.8828125, -0.333740234375, 0.21533203125, 0.764404296875, 1.3134765625, 1.862548828125, 2.41162109375, 2.960693359375, 3.509765625, 4.058837890625, 4.60791015625, 5.156982421875, 5.7060546875, 6.255126953125, 6.80419921875, 7.353271484375, 7.90234375, 8.451416015625, 9.00048828125, 9.549560546875, 10.0986328125, 10.647705078125, 11.19677734375, 11.745849609375, 12.294921875, 12.843994140625, 13.39306640625, 13.942138671875, 14.4912109375, 15.040283203125, 15.58935546875, 16.138427734375, 16.6875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 11.0, 11.0, 18.0, 27.0, 31.0, 32.0, 43.0, 47.0, 40.0, 61.0, 60.0, 70.0, 71.0, 54.0, 51.0, 58.0, 57.0, 51.0, 45.0, 34.0, 29.0, 32.0, 18.0, 16.0, 5.0, 6.0, 12.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.015625, -4.8824462890625, -4.749267578125, -4.6160888671875, -4.48291015625, -4.3497314453125, -4.216552734375, -4.0833740234375, -3.9501953125, -3.8170166015625, -3.683837890625, -3.5506591796875, -3.41748046875, -3.2843017578125, -3.151123046875, -3.0179443359375, -2.884765625, -2.7515869140625, -2.618408203125, -2.4852294921875, -2.35205078125, -2.2188720703125, -2.085693359375, -1.9525146484375, -1.8193359375, -1.6861572265625, -1.552978515625, -1.4197998046875, -1.28662109375, -1.1534423828125, -1.020263671875, -0.8870849609375, -0.75390625, -0.6207275390625, -0.487548828125, -0.3543701171875, -0.22119140625, -0.0880126953125, 0.045166015625, 0.1783447265625, 0.3115234375, 0.4447021484375, 0.577880859375, 0.7110595703125, 0.84423828125, 0.9774169921875, 1.110595703125, 1.2437744140625, 1.376953125, 1.5101318359375, 1.643310546875, 1.7764892578125, 1.90966796875, 2.0428466796875, 2.176025390625, 2.3092041015625, 2.4423828125, 2.5755615234375, 2.708740234375, 2.8419189453125, 2.97509765625, 3.1082763671875, 3.241455078125, 3.3746337890625, 3.5078125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 16.0, 21.0, 14.0, 31.0, 72.0, 94.0, 148.0, 287.0, 504.0, 848.0, 1484.0, 3053.0, 6121.0, 13811.0, 35051.0, 117224.0, 809706.0, 2903752.0, 211922.0, 54005.0, 19325.0, 8424.0, 3993.0, 1995.0, 1057.0, 584.0, 292.0, 198.0, 109.0, 60.0, 28.0, 24.0, 14.0, 8.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.21875, -13.731689453125, -13.24462890625, -12.757568359375, -12.2705078125, -11.783447265625, -11.29638671875, -10.809326171875, -10.322265625, -9.835205078125, -9.34814453125, -8.861083984375, -8.3740234375, -7.886962890625, -7.39990234375, -6.912841796875, -6.42578125, -5.938720703125, -5.45166015625, -4.964599609375, -4.4775390625, -3.990478515625, -3.50341796875, -3.016357421875, -2.529296875, -2.042236328125, -1.55517578125, -1.068115234375, -0.5810546875, -0.093994140625, 0.39306640625, 0.880126953125, 1.3671875, 1.854248046875, 2.34130859375, 2.828369140625, 3.3154296875, 3.802490234375, 4.28955078125, 4.776611328125, 5.263671875, 5.750732421875, 6.23779296875, 6.724853515625, 7.2119140625, 7.698974609375, 8.18603515625, 8.673095703125, 9.16015625, 9.647216796875, 10.13427734375, 10.621337890625, 11.1083984375, 11.595458984375, 12.08251953125, 12.569580078125, 13.056640625, 13.543701171875, 14.03076171875, 14.517822265625, 15.0048828125, 15.491943359375, 15.97900390625, 16.466064453125, 16.953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 3.0, 4.0, 2.0, 13.0, 7.0, 9.0, 11.0, 20.0, 23.0, 28.0, 35.0, 69.0, 108.0, 157.0, 269.0, 669.0, 1477.0, 473.0, 226.0, 116.0, 104.0, 76.0, 29.0, 35.0, 24.0, 13.0, 9.0, 9.0, 9.0, 13.0, 6.0, 3.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.51953125, -6.32415771484375, -6.1287841796875, -5.93341064453125, -5.738037109375, -5.54266357421875, -5.3472900390625, -5.15191650390625, -4.95654296875, -4.76116943359375, -4.5657958984375, -4.37042236328125, -4.175048828125, -3.97967529296875, -3.7843017578125, -3.58892822265625, -3.3935546875, -3.19818115234375, -3.0028076171875, -2.80743408203125, -2.612060546875, -2.41668701171875, -2.2213134765625, -2.02593994140625, -1.83056640625, -1.63519287109375, -1.4398193359375, -1.24444580078125, -1.049072265625, -0.85369873046875, -0.6583251953125, -0.46295166015625, -0.267578125, -0.07220458984375, 0.1231689453125, 0.31854248046875, 0.513916015625, 0.70928955078125, 0.9046630859375, 1.10003662109375, 1.29541015625, 1.49078369140625, 1.6861572265625, 1.88153076171875, 2.076904296875, 2.27227783203125, 2.4676513671875, 2.66302490234375, 2.8583984375, 3.05377197265625, 3.2491455078125, 3.44451904296875, 3.639892578125, 3.83526611328125, 4.0306396484375, 4.22601318359375, 4.42138671875, 4.61676025390625, 4.8121337890625, 5.00750732421875, 5.202880859375, 5.39825439453125, 5.5936279296875, 5.78900146484375, 5.984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 13.0, 26.0, 78.0, 181.0, 263.0, 250.0, 137.0, 38.0, 10.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.16787719726562, -127.96488952636719, -124.76190185546875, -121.55892181396484, -118.3559341430664, -115.15294647216797, -111.94995880126953, -108.74697875976562, -105.54399108886719, -102.34100341796875, -99.13801574707031, -95.9350357055664, -92.73204803466797, -89.52906036376953, -86.3260726928711, -83.12309265136719, -79.92010498046875, -76.71711730957031, -73.51412963867188, -70.31114959716797, -67.10816192626953, -63.905174255371094, -60.702186584472656, -57.499202728271484, -54.29621124267578, -51.093223571777344, -47.89023971557617, -44.687252044677734, -41.48426818847656, -38.281280517578125, -35.07829284667969, -31.875308990478516, -28.672325134277344, -25.46933937072754, -22.266353607177734, -19.063365936279297, -15.860381126403809, -12.657394409179688, -9.454408645629883, -6.251422882080078, -3.0484371185302734, 0.15454888343811035, 3.357534885406494, 6.560521125793457, 9.763506889343262, 12.966493606567383, 16.169479370117188, 19.372465133666992, 22.575450897216797, 25.7784366607666, 28.981422424316406, 32.184410095214844, 35.387393951416016, 38.59038162231445, 41.793365478515625, 44.99635314941406, 48.1993408203125, 51.40232849121094, 54.60531234741211, 57.80830001831055, 61.01128387451172, 64.21427154541016, 67.4172592163086, 70.6202392578125, 73.82322692871094]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 1.0, 5.0, 8.0, 12.0, 15.0, 11.0, 22.0, 25.0, 36.0, 43.0, 36.0, 38.0, 53.0, 55.0, 66.0, 71.0, 55.0, 66.0, 51.0, 43.0, 32.0, 41.0, 51.0, 38.0, 23.0, 20.0, 17.0, 18.0, 14.0, 8.0, 10.0, 4.0, 4.0, 3.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.87667465209961, -30.93840217590332, -30.0001277923584, -29.06185531616211, -28.123580932617188, -27.1853084564209, -26.24703598022461, -25.308761596679688, -24.370487213134766, -23.432214736938477, -22.493940353393555, -21.555667877197266, -20.617393493652344, -19.679121017456055, -18.740848541259766, -17.802574157714844, -16.864301681518555, -15.92602825164795, -14.987754821777344, -14.049482345581055, -13.111207962036133, -12.172935485839844, -11.234662055969238, -10.296388626098633, -9.358115196228027, -8.419841766357422, -7.481568336486816, -6.543295383453369, -5.605021953582764, -4.666748523712158, -3.728475570678711, -2.7902021408081055, -1.8519287109375, -0.9136554002761841, 0.024617910385131836, 0.9628911018371582, 1.9011645317077637, 2.839437961578369, 3.7777109146118164, 4.715984344482422, 5.654257774353027, 6.592531204223633, 7.530804634094238, 8.469078063964844, 9.407350540161133, 10.345624923706055, 11.283897399902344, 12.22217082977295, 13.160444259643555, 14.09871768951416, 15.036991119384766, 15.975263595581055, 16.913537979125977, 17.851810455322266, 18.790084838867188, 19.728357315063477, 20.666629791259766, 21.604902267456055, 22.543176651000977, 23.481449127197266, 24.419723510742188, 25.357995986938477, 26.296268463134766, 27.234542846679688, 28.17281723022461]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 8.0, 8.0, 16.0, 22.0, 35.0, 56.0, 99.0, 197.0, 332.0, 666.0, 1351.0, 2971.0, 7591.0, 19788.0, 53273.0, 132387.0, 353033.0, 294993.0, 110141.0, 44071.0, 16401.0, 6259.0, 2485.0, 1109.0, 548.0, 294.0, 176.0, 83.0, 54.0, 30.0, 31.0, 16.0, 10.0, 7.0, 2.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.6875, -16.22265625, -15.7578125, -15.29296875, -14.828125, -14.36328125, -13.8984375, -13.43359375, -12.96875, -12.50390625, -12.0390625, -11.57421875, -11.109375, -10.64453125, -10.1796875, -9.71484375, -9.25, -8.78515625, -8.3203125, -7.85546875, -7.390625, -6.92578125, -6.4609375, -5.99609375, -5.53125, -5.06640625, -4.6015625, -4.13671875, -3.671875, -3.20703125, -2.7421875, -2.27734375, -1.8125, -1.34765625, -0.8828125, -0.41796875, 0.046875, 0.51171875, 0.9765625, 1.44140625, 1.90625, 2.37109375, 2.8359375, 3.30078125, 3.765625, 4.23046875, 4.6953125, 5.16015625, 5.625, 6.08984375, 6.5546875, 7.01953125, 7.484375, 7.94921875, 8.4140625, 8.87890625, 9.34375, 9.80859375, 10.2734375, 10.73828125, 11.203125, 11.66796875, 12.1328125, 12.59765625, 13.0625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 8.0, 13.0, 16.0, 18.0, 21.0, 32.0, 46.0, 48.0, 55.0, 61.0, 49.0, 61.0, 66.0, 64.0, 56.0, 59.0, 51.0, 62.0, 49.0, 47.0, 32.0, 17.0, 22.0, 14.0, 10.0, 5.0, 9.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.703125, -4.564208984375, -4.42529296875, -4.286376953125, -4.1474609375, -4.008544921875, -3.86962890625, -3.730712890625, -3.591796875, -3.452880859375, -3.31396484375, -3.175048828125, -3.0361328125, -2.897216796875, -2.75830078125, -2.619384765625, -2.48046875, -2.341552734375, -2.20263671875, -2.063720703125, -1.9248046875, -1.785888671875, -1.64697265625, -1.508056640625, -1.369140625, -1.230224609375, -1.09130859375, -0.952392578125, -0.8134765625, -0.674560546875, -0.53564453125, -0.396728515625, -0.2578125, -0.118896484375, 0.02001953125, 0.158935546875, 0.2978515625, 0.436767578125, 0.57568359375, 0.714599609375, 0.853515625, 0.992431640625, 1.13134765625, 1.270263671875, 1.4091796875, 1.548095703125, 1.68701171875, 1.825927734375, 1.96484375, 2.103759765625, 2.24267578125, 2.381591796875, 2.5205078125, 2.659423828125, 2.79833984375, 2.937255859375, 3.076171875, 3.215087890625, 3.35400390625, 3.492919921875, 3.6318359375, 3.770751953125, 3.90966796875, 4.048583984375, 4.1875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 11.0, 9.0, 12.0, 22.0, 30.0, 44.0, 58.0, 78.0, 118.0, 115.0, 227.0, 307.0, 487.0, 784.0, 1540.0, 4126.0, 17961.0, 87702.0, 456090.0, 382351.0, 74120.0, 15198.0, 3663.0, 1325.0, 697.0, 466.0, 319.0, 196.0, 164.0, 82.0, 64.0, 52.0, 41.0, 21.0, 26.0, 13.0, 9.0, 6.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.5625, -17.962646484375, -17.36279296875, -16.762939453125, -16.1630859375, -15.563232421875, -14.96337890625, -14.363525390625, -13.763671875, -13.163818359375, -12.56396484375, -11.964111328125, -11.3642578125, -10.764404296875, -10.16455078125, -9.564697265625, -8.96484375, -8.364990234375, -7.76513671875, -7.165283203125, -6.5654296875, -5.965576171875, -5.36572265625, -4.765869140625, -4.166015625, -3.566162109375, -2.96630859375, -2.366455078125, -1.7666015625, -1.166748046875, -0.56689453125, 0.032958984375, 0.6328125, 1.232666015625, 1.83251953125, 2.432373046875, 3.0322265625, 3.632080078125, 4.23193359375, 4.831787109375, 5.431640625, 6.031494140625, 6.63134765625, 7.231201171875, 7.8310546875, 8.430908203125, 9.03076171875, 9.630615234375, 10.23046875, 10.830322265625, 11.43017578125, 12.030029296875, 12.6298828125, 13.229736328125, 13.82958984375, 14.429443359375, 15.029296875, 15.629150390625, 16.22900390625, 16.828857421875, 17.4287109375, 18.028564453125, 18.62841796875, 19.228271484375, 19.828125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 6.0, 10.0, 8.0, 15.0, 15.0, 17.0, 31.0, 30.0, 21.0, 39.0, 35.0, 47.0, 32.0, 42.0, 55.0, 65.0, 41.0, 50.0, 61.0, 41.0, 57.0, 44.0, 34.0, 31.0, 39.0, 27.0, 27.0, 16.0, 12.0, 16.0, 2.0, 8.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.875, -17.3690185546875, -16.863037109375, -16.3570556640625, -15.85107421875, -15.3450927734375, -14.839111328125, -14.3331298828125, -13.8271484375, -13.3211669921875, -12.815185546875, -12.3092041015625, -11.80322265625, -11.2972412109375, -10.791259765625, -10.2852783203125, -9.779296875, -9.2733154296875, -8.767333984375, -8.2613525390625, -7.75537109375, -7.2493896484375, -6.743408203125, -6.2374267578125, -5.7314453125, -5.2254638671875, -4.719482421875, -4.2135009765625, -3.70751953125, -3.2015380859375, -2.695556640625, -2.1895751953125, -1.68359375, -1.1776123046875, -0.671630859375, -0.1656494140625, 0.34033203125, 0.8463134765625, 1.352294921875, 1.8582763671875, 2.3642578125, 2.8702392578125, 3.376220703125, 3.8822021484375, 4.38818359375, 4.8941650390625, 5.400146484375, 5.9061279296875, 6.412109375, 6.9180908203125, 7.424072265625, 7.9300537109375, 8.43603515625, 8.9420166015625, 9.447998046875, 9.9539794921875, 10.4599609375, 10.9659423828125, 11.471923828125, 11.9779052734375, 12.48388671875, 12.9898681640625, 13.495849609375, 14.0018310546875, 14.5078125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 11.0, 15.0, 26.0, 35.0, 64.0, 117.0, 181.0, 420.0, 1007.0, 2732.0, 9164.0, 36757.0, 147573.0, 580930.0, 200705.0, 50476.0, 12554.0, 3562.0, 1200.0, 477.0, 233.0, 147.0, 64.0, 34.0, 26.0, 16.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.37109375, -7.08331298828125, -6.7955322265625, -6.50775146484375, -6.219970703125, -5.93218994140625, -5.6444091796875, -5.35662841796875, -5.06884765625, -4.78106689453125, -4.4932861328125, -4.20550537109375, -3.917724609375, -3.62994384765625, -3.3421630859375, -3.05438232421875, -2.7666015625, -2.47882080078125, -2.1910400390625, -1.90325927734375, -1.615478515625, -1.32769775390625, -1.0399169921875, -0.75213623046875, -0.46435546875, -0.17657470703125, 0.1112060546875, 0.39898681640625, 0.686767578125, 0.97454833984375, 1.2623291015625, 1.55010986328125, 1.837890625, 2.12567138671875, 2.4134521484375, 2.70123291015625, 2.989013671875, 3.27679443359375, 3.5645751953125, 3.85235595703125, 4.14013671875, 4.42791748046875, 4.7156982421875, 5.00347900390625, 5.291259765625, 5.57904052734375, 5.8668212890625, 6.15460205078125, 6.4423828125, 6.73016357421875, 7.0179443359375, 7.30572509765625, 7.593505859375, 7.88128662109375, 8.1690673828125, 8.45684814453125, 8.74462890625, 9.03240966796875, 9.3201904296875, 9.60797119140625, 9.895751953125, 10.18353271484375, 10.4713134765625, 10.75909423828125, 11.046875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 10.0, 6.0, 4.0, 2.0, 4.0, 6.0, 12.0, 8.0, 17.0, 12.0, 19.0, 11.0, 17.0, 21.0, 25.0, 34.0, 45.0, 43.0, 67.0, 147.0, 121.0, 76.0, 48.0, 34.0, 28.0, 27.0, 20.0, 25.0, 14.0, 12.0, 16.0, 12.0, 4.0, 13.0, 6.0, 10.0, 8.0, 6.0, 5.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001369476318359375, -0.0013265162706375122, -0.0012835562229156494, -0.0012405961751937866, -0.0011976361274719238, -0.001154676079750061, -0.0011117160320281982, -0.0010687559843063354, -0.0010257959365844727, -0.0009828358888626099, -0.0009398758411407471, -0.0008969157934188843, -0.0008539557456970215, -0.0008109956979751587, -0.0007680356502532959, -0.0007250756025314331, -0.0006821155548095703, -0.0006391555070877075, -0.0005961954593658447, -0.0005532354116439819, -0.0005102753639221191, -0.00046731531620025635, -0.00042435526847839355, -0.00038139522075653076, -0.00033843517303466797, -0.0002954751253128052, -0.0002525150775909424, -0.0002095550298690796, -0.0001665949821472168, -0.000123634934425354, -8.067488670349121e-05, -3.771483898162842e-05, 5.245208740234375e-06, 4.820525646209717e-05, 9.116530418395996e-05, 0.00013412535190582275, 0.00017708539962768555, 0.00022004544734954834, 0.00026300549507141113, 0.0003059655427932739, 0.0003489255905151367, 0.0003918856382369995, 0.0004348456859588623, 0.0004778057336807251, 0.0005207657814025879, 0.0005637258291244507, 0.0006066858768463135, 0.0006496459245681763, 0.0006926059722900391, 0.0007355660200119019, 0.0007785260677337646, 0.0008214861154556274, 0.0008644461631774902, 0.000907406210899353, 0.0009503662586212158, 0.0009933263063430786, 0.0010362863540649414, 0.0010792464017868042, 0.001122206449508667, 0.0011651664972305298, 0.0012081265449523926, 0.0012510865926742554, 0.0012940466403961182, 0.001337006688117981, 0.0013799667358398438]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 10.0, 15.0, 21.0, 30.0, 57.0, 81.0, 153.0, 256.0, 406.0, 802.0, 1825.0, 5432.0, 21310.0, 105514.0, 567489.0, 276343.0, 51783.0, 11191.0, 3211.0, 1228.0, 596.0, 325.0, 180.0, 91.0, 64.0, 29.0, 29.0, 24.0, 18.0, 7.0, 7.0, 6.0, 4.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1875, -10.84619140625, -10.5048828125, -10.16357421875, -9.822265625, -9.48095703125, -9.1396484375, -8.79833984375, -8.45703125, -8.11572265625, -7.7744140625, -7.43310546875, -7.091796875, -6.75048828125, -6.4091796875, -6.06787109375, -5.7265625, -5.38525390625, -5.0439453125, -4.70263671875, -4.361328125, -4.02001953125, -3.6787109375, -3.33740234375, -2.99609375, -2.65478515625, -2.3134765625, -1.97216796875, -1.630859375, -1.28955078125, -0.9482421875, -0.60693359375, -0.265625, 0.07568359375, 0.4169921875, 0.75830078125, 1.099609375, 1.44091796875, 1.7822265625, 2.12353515625, 2.46484375, 2.80615234375, 3.1474609375, 3.48876953125, 3.830078125, 4.17138671875, 4.5126953125, 4.85400390625, 5.1953125, 5.53662109375, 5.8779296875, 6.21923828125, 6.560546875, 6.90185546875, 7.2431640625, 7.58447265625, 7.92578125, 8.26708984375, 8.6083984375, 8.94970703125, 9.291015625, 9.63232421875, 9.9736328125, 10.31494140625, 10.65625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 1.0, 5.0, 1.0, 6.0, 5.0, 3.0, 7.0, 6.0, 7.0, 9.0, 13.0, 14.0, 28.0, 23.0, 30.0, 30.0, 48.0, 54.0, 64.0, 85.0, 90.0, 103.0, 85.0, 40.0, 44.0, 35.0, 33.0, 26.0, 21.0, 17.0, 12.0, 13.0, 11.0, 9.0, 7.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.99609375, -4.78497314453125, -4.5738525390625, -4.36273193359375, -4.151611328125, -3.94049072265625, -3.7293701171875, -3.51824951171875, -3.30712890625, -3.09600830078125, -2.8848876953125, -2.67376708984375, -2.462646484375, -2.25152587890625, -2.0404052734375, -1.82928466796875, -1.6181640625, -1.40704345703125, -1.1959228515625, -0.98480224609375, -0.773681640625, -0.56256103515625, -0.3514404296875, -0.14031982421875, 0.07080078125, 0.28192138671875, 0.4930419921875, 0.70416259765625, 0.915283203125, 1.12640380859375, 1.3375244140625, 1.54864501953125, 1.759765625, 1.97088623046875, 2.1820068359375, 2.39312744140625, 2.604248046875, 2.81536865234375, 3.0264892578125, 3.23760986328125, 3.44873046875, 3.65985107421875, 3.8709716796875, 4.08209228515625, 4.293212890625, 4.50433349609375, 4.7154541015625, 4.92657470703125, 5.1376953125, 5.34881591796875, 5.5599365234375, 5.77105712890625, 5.982177734375, 6.19329833984375, 6.4044189453125, 6.61553955078125, 6.82666015625, 7.03778076171875, 7.2489013671875, 7.46002197265625, 7.671142578125, 7.88226318359375, 8.0933837890625, 8.30450439453125, 8.515625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 3.0, 9.0, 11.0, 28.0, 53.0, 104.0, 157.0, 185.0, 158.0, 144.0, 88.0, 37.0, 14.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-242.6143341064453, -236.9787139892578, -231.3430938720703, -225.7074737548828, -220.0718536376953, -214.4362335205078, -208.8006134033203, -203.1649932861328, -197.5293731689453, -191.8937530517578, -186.2581329345703, -180.6225128173828, -174.9868927001953, -169.3512725830078, -163.7156524658203, -158.0800323486328, -152.44439697265625, -146.80877685546875, -141.17315673828125, -135.53753662109375, -129.90191650390625, -124.26629638671875, -118.63067626953125, -112.99505615234375, -107.35943603515625, -101.72381591796875, -96.08819580078125, -90.45257568359375, -84.81695556640625, -79.18133544921875, -73.54571533203125, -67.91009521484375, -62.27446746826172, -56.63884735107422, -51.00322723388672, -45.36760711669922, -39.73198699951172, -34.09636688232422, -28.460742950439453, -22.825122833251953, -17.189502716064453, -11.553882598876953, -5.918261528015137, -0.2826404571533203, 5.35297966003418, 10.98859977722168, 16.624221801757812, 22.259841918945312, 27.895462036132812, 33.53108215332031, 39.16670227050781, 44.80232238769531, 50.43794250488281, 56.07356262207031, 61.70918655395508, 67.34480285644531, 72.98042297363281, 78.61604309082031, 84.25166320800781, 89.88728332519531, 95.52290344238281, 101.15852355957031, 106.79414367675781, 112.42976379394531, 118.06539154052734]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 9.0, 8.0, 3.0, 15.0, 18.0, 14.0, 17.0, 18.0, 16.0, 23.0, 21.0, 30.0, 32.0, 30.0, 35.0, 41.0, 49.0, 44.0, 34.0, 48.0, 46.0, 39.0, 42.0, 43.0, 47.0, 35.0, 25.0, 39.0, 33.0, 30.0, 13.0, 17.0, 16.0, 18.0, 5.0, 9.0, 9.0, 5.0, 5.0, 8.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.42166137695312, -71.0766372680664, -68.73160552978516, -66.38658142089844, -64.04154968261719, -61.69652557373047, -59.35150146484375, -57.006473541259766, -54.66144561767578, -52.3164176940918, -49.97138977050781, -47.626365661621094, -45.28133773803711, -42.936309814453125, -40.591285705566406, -38.24625778198242, -35.90122985839844, -33.55620193481445, -31.2111759185791, -28.86614990234375, -26.521121978759766, -24.17609405517578, -21.83106803894043, -19.486042022705078, -17.141014099121094, -14.795987129211426, -12.450960159301758, -10.10593318939209, -7.760906219482422, -5.415879249572754, -3.070852279663086, -0.7258262634277344, 1.6192092895507812, 3.964236259460449, 6.309263229370117, 8.654290199279785, 10.999317169189453, 13.344344139099121, 15.689371109008789, 18.03439712524414, 20.379425048828125, 22.72445297241211, 25.06947898864746, 27.414505004882812, 29.759532928466797, 32.10456085205078, 34.4495849609375, 36.794612884521484, 39.13964080810547, 41.48466873168945, 43.82969665527344, 46.174720764160156, 48.51974868774414, 50.864776611328125, 53.209800720214844, 55.55482864379883, 57.89985656738281, 60.2448844909668, 62.58991241455078, 64.9349365234375, 67.27996826171875, 69.62499237060547, 71.97001647949219, 74.31504821777344, 76.66007232666016]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 8.0, 8.0, 11.0, 17.0, 21.0, 22.0, 40.0, 71.0, 95.0, 148.0, 254.0, 421.0, 790.0, 1441.0, 2620.0, 5332.0, 11031.0, 25919.0, 70864.0, 267471.0, 2625719.0, 938156.0, 158296.0, 48721.0, 18928.0, 8629.0, 4269.0, 2181.0, 1152.0, 700.0, 374.0, 221.0, 142.0, 74.0, 56.0, 24.0, 17.0, 21.0, 3.0, 5.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1171875, -12.7293701171875, -12.341552734375, -11.9537353515625, -11.56591796875, -11.1781005859375, -10.790283203125, -10.4024658203125, -10.0146484375, -9.6268310546875, -9.239013671875, -8.8511962890625, -8.46337890625, -8.0755615234375, -7.687744140625, -7.2999267578125, -6.912109375, -6.5242919921875, -6.136474609375, -5.7486572265625, -5.36083984375, -4.9730224609375, -4.585205078125, -4.1973876953125, -3.8095703125, -3.4217529296875, -3.033935546875, -2.6461181640625, -2.25830078125, -1.8704833984375, -1.482666015625, -1.0948486328125, -0.70703125, -0.3192138671875, 0.068603515625, 0.4564208984375, 0.84423828125, 1.2320556640625, 1.619873046875, 2.0076904296875, 2.3955078125, 2.7833251953125, 3.171142578125, 3.5589599609375, 3.94677734375, 4.3345947265625, 4.722412109375, 5.1102294921875, 5.498046875, 5.8858642578125, 6.273681640625, 6.6614990234375, 7.04931640625, 7.4371337890625, 7.824951171875, 8.2127685546875, 8.6005859375, 8.9884033203125, 9.376220703125, 9.7640380859375, 10.15185546875, 10.5396728515625, 10.927490234375, 11.3153076171875, 11.703125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 14.0, 9.0, 18.0, 23.0, 33.0, 31.0, 35.0, 35.0, 55.0, 50.0, 54.0, 71.0, 59.0, 65.0, 72.0, 65.0, 59.0, 46.0, 34.0, 35.0, 29.0, 25.0, 30.0, 12.0, 9.0, 7.0, 6.0, 7.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.71484375, -4.576171875, -4.4375, -4.298828125, -4.16015625, -4.021484375, -3.8828125, -3.744140625, -3.60546875, -3.466796875, -3.328125, -3.189453125, -3.05078125, -2.912109375, -2.7734375, -2.634765625, -2.49609375, -2.357421875, -2.21875, -2.080078125, -1.94140625, -1.802734375, -1.6640625, -1.525390625, -1.38671875, -1.248046875, -1.109375, -0.970703125, -0.83203125, -0.693359375, -0.5546875, -0.416015625, -0.27734375, -0.138671875, 0.0, 0.138671875, 0.27734375, 0.416015625, 0.5546875, 0.693359375, 0.83203125, 0.970703125, 1.109375, 1.248046875, 1.38671875, 1.525390625, 1.6640625, 1.802734375, 1.94140625, 2.080078125, 2.21875, 2.357421875, 2.49609375, 2.634765625, 2.7734375, 2.912109375, 3.05078125, 3.189453125, 3.328125, 3.466796875, 3.60546875, 3.744140625, 3.8828125, 4.021484375, 4.16015625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 8.0, 12.0, 15.0, 45.0, 41.0, 81.0, 98.0, 156.0, 280.0, 459.0, 824.0, 1504.0, 2870.0, 6087.0, 13132.0, 30932.0, 83482.0, 270308.0, 1324342.0, 1954990.0, 338585.0, 100515.0, 36282.0, 15099.0, 6928.0, 3320.0, 1751.0, 882.0, 462.0, 289.0, 186.0, 106.0, 71.0, 53.0, 27.0, 17.0, 14.0, 6.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.181640625, -7.85546875, -7.529296875, -7.203125, -6.876953125, -6.55078125, -6.224609375, -5.8984375, -5.572265625, -5.24609375, -4.919921875, -4.59375, -4.267578125, -3.94140625, -3.615234375, -3.2890625, -2.962890625, -2.63671875, -2.310546875, -1.984375, -1.658203125, -1.33203125, -1.005859375, -0.6796875, -0.353515625, -0.02734375, 0.298828125, 0.625, 0.951171875, 1.27734375, 1.603515625, 1.9296875, 2.255859375, 2.58203125, 2.908203125, 3.234375, 3.560546875, 3.88671875, 4.212890625, 4.5390625, 4.865234375, 5.19140625, 5.517578125, 5.84375, 6.169921875, 6.49609375, 6.822265625, 7.1484375, 7.474609375, 7.80078125, 8.126953125, 8.453125, 8.779296875, 9.10546875, 9.431640625, 9.7578125, 10.083984375, 10.41015625, 10.736328125, 11.0625, 11.388671875, 11.71484375, 12.041015625, 12.3671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 6.0, 10.0, 18.0, 20.0, 18.0, 35.0, 68.0, 95.0, 142.0, 221.0, 379.0, 886.0, 977.0, 473.0, 270.0, 167.0, 96.0, 59.0, 31.0, 29.0, 21.0, 13.0, 13.0, 7.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.1015625, -10.8311767578125, -10.560791015625, -10.2904052734375, -10.02001953125, -9.7496337890625, -9.479248046875, -9.2088623046875, -8.9384765625, -8.6680908203125, -8.397705078125, -8.1273193359375, -7.85693359375, -7.5865478515625, -7.316162109375, -7.0457763671875, -6.775390625, -6.5050048828125, -6.234619140625, -5.9642333984375, -5.69384765625, -5.4234619140625, -5.153076171875, -4.8826904296875, -4.6123046875, -4.3419189453125, -4.071533203125, -3.8011474609375, -3.53076171875, -3.2603759765625, -2.989990234375, -2.7196044921875, -2.44921875, -2.1788330078125, -1.908447265625, -1.6380615234375, -1.36767578125, -1.0972900390625, -0.826904296875, -0.5565185546875, -0.2861328125, -0.0157470703125, 0.254638671875, 0.5250244140625, 0.79541015625, 1.0657958984375, 1.336181640625, 1.6065673828125, 1.876953125, 2.1473388671875, 2.417724609375, 2.6881103515625, 2.95849609375, 3.2288818359375, 3.499267578125, 3.7696533203125, 4.0400390625, 4.3104248046875, 4.580810546875, 4.8511962890625, 5.12158203125, 5.3919677734375, 5.662353515625, 5.9327392578125, 6.203125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 8.0, 8.0, 17.0, 12.0, 34.0, 47.0, 69.0, 92.0, 113.0, 118.0, 130.0, 101.0, 74.0, 64.0, 41.0, 25.0, 22.0, 14.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.33293914794922, -58.6876335144043, -57.04232406616211, -55.39701843261719, -53.751712799072266, -52.106407165527344, -50.461097717285156, -48.815792083740234, -47.17048645019531, -45.52518081665039, -43.8798713684082, -42.23456573486328, -40.58926010131836, -38.94395446777344, -37.29864501953125, -35.65333938598633, -34.008033752441406, -32.362728118896484, -30.71742057800293, -29.072113037109375, -27.426807403564453, -25.7814998626709, -24.136192321777344, -22.490886688232422, -20.845577239990234, -19.20026969909668, -17.554964065551758, -15.909656524658203, -14.264350891113281, -12.619043350219727, -10.973736763000488, -9.32843017578125, -7.683124542236328, -6.03781795501709, -4.392511367797852, -2.747204303741455, -1.1018977165222168, 0.5434093475341797, 2.188715934753418, 3.8340225219726562, 5.4793291091918945, 7.124635696411133, 8.769942283630371, 10.41524887084961, 12.060556411743164, 13.705862998962402, 15.35116958618164, 16.996475219726562, 18.641782760620117, 20.287090301513672, 21.932395935058594, 23.57770347595215, 25.22300910949707, 26.868316650390625, 28.513622283935547, 30.1589298248291, 31.804237365722656, 33.44954299926758, 35.094852447509766, 36.74015808105469, 38.38546371459961, 40.03076934814453, 41.67607879638672, 43.32138442993164, 44.96669006347656]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 4.0, 6.0, 3.0, 9.0, 9.0, 15.0, 18.0, 27.0, 17.0, 29.0, 35.0, 37.0, 39.0, 40.0, 41.0, 41.0, 55.0, 42.0, 54.0, 49.0, 43.0, 46.0, 38.0, 33.0, 47.0, 32.0, 29.0, 37.0, 19.0, 16.0, 13.0, 16.0, 11.0, 11.0, 8.0, 9.0, 8.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.20871353149414, -26.219411849975586, -25.23011016845703, -24.240806579589844, -23.25150489807129, -22.262203216552734, -21.27290153503418, -20.283599853515625, -19.294296264648438, -18.304994583129883, -17.315692901611328, -16.32638931274414, -15.337087631225586, -14.347785949707031, -13.358484268188477, -12.369182586669922, -11.379880905151367, -10.390579223632812, -9.401276588439941, -8.411974906921387, -7.422672748565674, -6.433370590209961, -5.444068908691406, -4.454766750335693, -3.4654645919799805, -2.4761624336242676, -1.4868605136871338, -0.49755859375, 0.4917435646057129, 1.4810457229614258, 2.4703474044799805, 3.4596495628356934, 4.448951721191406, 5.438253879547119, 6.427556037902832, 7.416857719421387, 8.406160354614258, 9.395462036132812, 10.384763717651367, 11.374065399169922, 12.363368034362793, 13.352669715881348, 14.341972351074219, 15.331274032592773, 16.320575714111328, 17.309879302978516, 18.299179077148438, 19.288482666015625, 20.27778434753418, 21.267086029052734, 22.25638771057129, 23.245689392089844, 24.23499298095703, 25.224294662475586, 26.21359634399414, 27.202898025512695, 28.19219970703125, 29.181501388549805, 30.17080307006836, 31.160106658935547, 32.14940643310547, 33.138710021972656, 34.128013610839844, 35.117313385009766, 36.10661697387695]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 6.0, 9.0, 8.0, 21.0, 23.0, 31.0, 46.0, 94.0, 145.0, 278.0, 469.0, 938.0, 1647.0, 3537.0, 8498.0, 20922.0, 53434.0, 130691.0, 257050.0, 287000.0, 165324.0, 70614.0, 27430.0, 11044.0, 4752.0, 2115.0, 1053.0, 617.0, 283.0, 176.0, 92.0, 64.0, 39.0, 25.0, 23.0, 12.0, 13.0, 7.0, 3.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.9898681640625, -11.628173828125, -11.2664794921875, -10.90478515625, -10.5430908203125, -10.181396484375, -9.8197021484375, -9.4580078125, -9.0963134765625, -8.734619140625, -8.3729248046875, -8.01123046875, -7.6495361328125, -7.287841796875, -6.9261474609375, -6.564453125, -6.2027587890625, -5.841064453125, -5.4793701171875, -5.11767578125, -4.7559814453125, -4.394287109375, -4.0325927734375, -3.6708984375, -3.3092041015625, -2.947509765625, -2.5858154296875, -2.22412109375, -1.8624267578125, -1.500732421875, -1.1390380859375, -0.77734375, -0.4156494140625, -0.053955078125, 0.3077392578125, 0.66943359375, 1.0311279296875, 1.392822265625, 1.7545166015625, 2.1162109375, 2.4779052734375, 2.839599609375, 3.2012939453125, 3.56298828125, 3.9246826171875, 4.286376953125, 4.6480712890625, 5.009765625, 5.3714599609375, 5.733154296875, 6.0948486328125, 6.45654296875, 6.8182373046875, 7.179931640625, 7.5416259765625, 7.9033203125, 8.2650146484375, 8.626708984375, 8.9884033203125, 9.35009765625, 9.7117919921875, 10.073486328125, 10.4351806640625, 10.796875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 3.0, 12.0, 14.0, 24.0, 23.0, 17.0, 33.0, 56.0, 38.0, 54.0, 64.0, 72.0, 60.0, 65.0, 63.0, 61.0, 59.0, 48.0, 52.0, 42.0, 43.0, 23.0, 20.0, 15.0, 12.0, 6.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76171875, -4.61004638671875, -4.4583740234375, -4.30670166015625, -4.155029296875, -4.00335693359375, -3.8516845703125, -3.70001220703125, -3.54833984375, -3.39666748046875, -3.2449951171875, -3.09332275390625, -2.941650390625, -2.78997802734375, -2.6383056640625, -2.48663330078125, -2.3349609375, -2.18328857421875, -2.0316162109375, -1.87994384765625, -1.728271484375, -1.57659912109375, -1.4249267578125, -1.27325439453125, -1.12158203125, -0.96990966796875, -0.8182373046875, -0.66656494140625, -0.514892578125, -0.36322021484375, -0.2115478515625, -0.05987548828125, 0.091796875, 0.24346923828125, 0.3951416015625, 0.54681396484375, 0.698486328125, 0.85015869140625, 1.0018310546875, 1.15350341796875, 1.30517578125, 1.45684814453125, 1.6085205078125, 1.76019287109375, 1.911865234375, 2.06353759765625, 2.2152099609375, 2.36688232421875, 2.5185546875, 2.67022705078125, 2.8218994140625, 2.97357177734375, 3.125244140625, 3.27691650390625, 3.4285888671875, 3.58026123046875, 3.73193359375, 3.88360595703125, 4.0352783203125, 4.18695068359375, 4.338623046875, 4.49029541015625, 4.6419677734375, 4.79364013671875, 4.9453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 6.0, 6.0, 11.0, 9.0, 25.0, 40.0, 45.0, 57.0, 87.0, 107.0, 179.0, 319.0, 509.0, 823.0, 1583.0, 4367.0, 18373.0, 112397.0, 539275.0, 306371.0, 49464.0, 8966.0, 2500.0, 1200.0, 634.0, 409.0, 275.0, 165.0, 101.0, 69.0, 46.0, 40.0, 24.0, 19.0, 15.0, 10.0, 8.0, 9.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.50830078125, -16.8291015625, -16.14990234375, -15.470703125, -14.79150390625, -14.1123046875, -13.43310546875, -12.75390625, -12.07470703125, -11.3955078125, -10.71630859375, -10.037109375, -9.35791015625, -8.6787109375, -7.99951171875, -7.3203125, -6.64111328125, -5.9619140625, -5.28271484375, -4.603515625, -3.92431640625, -3.2451171875, -2.56591796875, -1.88671875, -1.20751953125, -0.5283203125, 0.15087890625, 0.830078125, 1.50927734375, 2.1884765625, 2.86767578125, 3.546875, 4.22607421875, 4.9052734375, 5.58447265625, 6.263671875, 6.94287109375, 7.6220703125, 8.30126953125, 8.98046875, 9.65966796875, 10.3388671875, 11.01806640625, 11.697265625, 12.37646484375, 13.0556640625, 13.73486328125, 14.4140625, 15.09326171875, 15.7724609375, 16.45166015625, 17.130859375, 17.81005859375, 18.4892578125, 19.16845703125, 19.84765625, 20.52685546875, 21.2060546875, 21.88525390625, 22.564453125, 23.24365234375, 23.9228515625, 24.60205078125, 25.28125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 4.0, 6.0, 12.0, 7.0, 12.0, 7.0, 19.0, 32.0, 13.0, 23.0, 30.0, 34.0, 53.0, 48.0, 45.0, 43.0, 49.0, 46.0, 52.0, 52.0, 48.0, 46.0, 49.0, 41.0, 43.0, 34.0, 24.0, 17.0, 24.0, 14.0, 13.0, 15.0, 2.0, 9.0, 4.0, 8.0, 8.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.84375, -18.2216796875, -17.599609375, -16.9775390625, -16.35546875, -15.7333984375, -15.111328125, -14.4892578125, -13.8671875, -13.2451171875, -12.623046875, -12.0009765625, -11.37890625, -10.7568359375, -10.134765625, -9.5126953125, -8.890625, -8.2685546875, -7.646484375, -7.0244140625, -6.40234375, -5.7802734375, -5.158203125, -4.5361328125, -3.9140625, -3.2919921875, -2.669921875, -2.0478515625, -1.42578125, -0.8037109375, -0.181640625, 0.4404296875, 1.0625, 1.6845703125, 2.306640625, 2.9287109375, 3.55078125, 4.1728515625, 4.794921875, 5.4169921875, 6.0390625, 6.6611328125, 7.283203125, 7.9052734375, 8.52734375, 9.1494140625, 9.771484375, 10.3935546875, 11.015625, 11.6376953125, 12.259765625, 12.8818359375, 13.50390625, 14.1259765625, 14.748046875, 15.3701171875, 15.9921875, 16.6142578125, 17.236328125, 17.8583984375, 18.48046875, 19.1025390625, 19.724609375, 20.3466796875, 20.96875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 8.0, 12.0, 21.0, 23.0, 52.0, 79.0, 160.0, 330.0, 954.0, 3389.0, 19033.0, 130057.0, 578949.0, 267062.0, 39552.0, 6460.0, 1466.0, 489.0, 220.0, 99.0, 58.0, 28.0, 12.0, 13.0, 9.0, 7.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0], "bins": [-10.2734375, -9.9154052734375, -9.557373046875, -9.1993408203125, -8.84130859375, -8.4832763671875, -8.125244140625, -7.7672119140625, -7.4091796875, -7.0511474609375, -6.693115234375, -6.3350830078125, -5.97705078125, -5.6190185546875, -5.260986328125, -4.9029541015625, -4.544921875, -4.1868896484375, -3.828857421875, -3.4708251953125, -3.11279296875, -2.7547607421875, -2.396728515625, -2.0386962890625, -1.6806640625, -1.3226318359375, -0.964599609375, -0.6065673828125, -0.24853515625, 0.1094970703125, 0.467529296875, 0.8255615234375, 1.18359375, 1.5416259765625, 1.899658203125, 2.2576904296875, 2.61572265625, 2.9737548828125, 3.331787109375, 3.6898193359375, 4.0478515625, 4.4058837890625, 4.763916015625, 5.1219482421875, 5.47998046875, 5.8380126953125, 6.196044921875, 6.5540771484375, 6.912109375, 7.2701416015625, 7.628173828125, 7.9862060546875, 8.34423828125, 8.7022705078125, 9.060302734375, 9.4183349609375, 9.7763671875, 10.1343994140625, 10.492431640625, 10.8504638671875, 11.20849609375, 11.5665283203125, 11.924560546875, 12.2825927734375, 12.640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 5.0, 4.0, 4.0, 6.0, 5.0, 13.0, 8.0, 10.0, 18.0, 18.0, 20.0, 26.0, 30.0, 32.0, 44.0, 53.0, 59.0, 51.0, 83.0, 62.0, 76.0, 55.0, 49.0, 42.0, 35.0, 36.0, 18.0, 27.0, 29.0, 16.0, 18.0, 9.0, 10.0, 3.0, 8.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0013256072998046875, -0.0012833178043365479, -0.0012410283088684082, -0.0011987388134002686, -0.001156449317932129, -0.0011141598224639893, -0.0010718703269958496, -0.00102958083152771, -0.0009872913360595703, -0.0009450018405914307, -0.000902712345123291, -0.0008604228496551514, -0.0008181333541870117, -0.0007758438587188721, -0.0007335543632507324, -0.0006912648677825928, -0.0006489753723144531, -0.0006066858768463135, -0.0005643963813781738, -0.0005221068859100342, -0.00047981739044189453, -0.0004375278949737549, -0.00039523839950561523, -0.0003529489040374756, -0.00031065940856933594, -0.0002683699131011963, -0.00022608041763305664, -0.000183790922164917, -0.00014150142669677734, -9.92119312286377e-05, -5.692243576049805e-05, -1.4632940292358398e-05, 2.765655517578125e-05, 6.99460506439209e-05, 0.00011223554611206055, 0.0001545250415802002, 0.00019681453704833984, 0.0002391040325164795, 0.00028139352798461914, 0.0003236830234527588, 0.00036597251892089844, 0.0004082620143890381, 0.00045055150985717773, 0.0004928410053253174, 0.000535130500793457, 0.0005774199962615967, 0.0006197094917297363, 0.000661998987197876, 0.0007042884826660156, 0.0007465779781341553, 0.0007888674736022949, 0.0008311569690704346, 0.0008734464645385742, 0.0009157359600067139, 0.0009580254554748535, 0.0010003149509429932, 0.0010426044464111328, 0.0010848939418792725, 0.0011271834373474121, 0.0011694729328155518, 0.0012117624282836914, 0.001254051923751831, 0.0012963414192199707, 0.0013386309146881104, 0.00138092041015625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 7.0, 4.0, 9.0, 25.0, 36.0, 39.0, 49.0, 88.0, 138.0, 237.0, 372.0, 721.0, 1451.0, 3340.0, 11083.0, 47753.0, 199857.0, 490855.0, 220175.0, 52967.0, 12181.0, 3728.0, 1521.0, 746.0, 419.0, 276.0, 166.0, 108.0, 64.0, 61.0, 32.0, 19.0, 14.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.015625, -7.7347412109375, -7.453857421875, -7.1729736328125, -6.89208984375, -6.6112060546875, -6.330322265625, -6.0494384765625, -5.7685546875, -5.4876708984375, -5.206787109375, -4.9259033203125, -4.64501953125, -4.3641357421875, -4.083251953125, -3.8023681640625, -3.521484375, -3.2406005859375, -2.959716796875, -2.6788330078125, -2.39794921875, -2.1170654296875, -1.836181640625, -1.5552978515625, -1.2744140625, -0.9935302734375, -0.712646484375, -0.4317626953125, -0.15087890625, 0.1300048828125, 0.410888671875, 0.6917724609375, 0.97265625, 1.2535400390625, 1.534423828125, 1.8153076171875, 2.09619140625, 2.3770751953125, 2.657958984375, 2.9388427734375, 3.2197265625, 3.5006103515625, 3.781494140625, 4.0623779296875, 4.34326171875, 4.6241455078125, 4.905029296875, 5.1859130859375, 5.466796875, 5.7476806640625, 6.028564453125, 6.3094482421875, 6.59033203125, 6.8712158203125, 7.152099609375, 7.4329833984375, 7.7138671875, 7.9947509765625, 8.275634765625, 8.5565185546875, 8.83740234375, 9.1182861328125, 9.399169921875, 9.6800537109375, 9.9609375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 6.0, 8.0, 9.0, 11.0, 24.0, 18.0, 24.0, 25.0, 33.0, 39.0, 38.0, 49.0, 53.0, 78.0, 80.0, 81.0, 68.0, 62.0, 45.0, 60.0, 43.0, 27.0, 21.0, 12.0, 19.0, 15.0, 12.0, 8.0, 8.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4140625, -6.1849365234375, -5.955810546875, -5.7266845703125, -5.49755859375, -5.2684326171875, -5.039306640625, -4.8101806640625, -4.5810546875, -4.3519287109375, -4.122802734375, -3.8936767578125, -3.66455078125, -3.4354248046875, -3.206298828125, -2.9771728515625, -2.748046875, -2.5189208984375, -2.289794921875, -2.0606689453125, -1.83154296875, -1.6024169921875, -1.373291015625, -1.1441650390625, -0.9150390625, -0.6859130859375, -0.456787109375, -0.2276611328125, 0.00146484375, 0.2305908203125, 0.459716796875, 0.6888427734375, 0.91796875, 1.1470947265625, 1.376220703125, 1.6053466796875, 1.83447265625, 2.0635986328125, 2.292724609375, 2.5218505859375, 2.7509765625, 2.9801025390625, 3.209228515625, 3.4383544921875, 3.66748046875, 3.8966064453125, 4.125732421875, 4.3548583984375, 4.583984375, 4.8131103515625, 5.042236328125, 5.2713623046875, 5.50048828125, 5.7296142578125, 5.958740234375, 6.1878662109375, 6.4169921875, 6.6461181640625, 6.875244140625, 7.1043701171875, 7.33349609375, 7.5626220703125, 7.791748046875, 8.0208740234375, 8.25]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 6.0, 9.0, 27.0, 68.0, 162.0, 283.0, 259.0, 139.0, 44.0, 8.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.36935424804688, -74.14250946044922, -64.91566467285156, -55.688812255859375, -46.46196746826172, -37.23512268066406, -28.00827407836914, -18.78142547607422, -9.554580688476562, -0.32773399353027344, 8.899112701416016, 18.125959396362305, 27.352806091308594, 36.57965087890625, 45.80649948120117, 55.033348083496094, 64.26019287109375, 73.4870376586914, 82.71388244628906, 91.94073486328125, 101.1675796508789, 110.39442443847656, 119.62127685546875, 128.84811401367188, 138.07496643066406, 147.30181884765625, 156.52865600585938, 165.75550842285156, 174.98236083984375, 184.20919799804688, 193.43605041503906, 202.66290283203125, 211.88973999023438, 221.11659240722656, 230.3434295654297, 239.57028198242188, 248.797119140625, 258.02398681640625, 267.2508239746094, 276.4776611328125, 285.70452880859375, 294.9313659667969, 304.1582336425781, 313.38507080078125, 322.6119079589844, 331.8387451171875, 341.06561279296875, 350.2924499511719, 359.519287109375, 368.7461242675781, 377.9729919433594, 387.1998291015625, 396.4266662597656, 405.65350341796875, 414.88037109375, 424.1072082519531, 433.33404541015625, 442.5608825683594, 451.7877502441406, 461.01458740234375, 470.2414245605469, 479.46826171875, 488.69512939453125, 497.9219665527344, 507.1488342285156]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 6.0, 9.0, 8.0, 7.0, 5.0, 14.0, 13.0, 19.0, 26.0, 24.0, 26.0, 26.0, 34.0, 38.0, 41.0, 43.0, 53.0, 44.0, 52.0, 43.0, 44.0, 43.0, 51.0, 45.0, 38.0, 33.0, 34.0, 25.0, 33.0, 21.0, 16.0, 18.0, 20.0, 13.0, 4.0, 7.0, 6.0, 2.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-84.62775421142578, -81.8919677734375, -79.15618896484375, -76.42040252685547, -73.68462371826172, -70.94883728027344, -68.21305847167969, -65.4772720336914, -62.74148941040039, -60.005706787109375, -57.26992416381836, -54.534141540527344, -51.79835510253906, -49.06257629394531, -46.32678985595703, -43.591007232666016, -40.855224609375, -38.119441986083984, -35.38365936279297, -32.64787292480469, -29.912092208862305, -27.17630958557129, -24.44052505493164, -21.704742431640625, -18.96895980834961, -16.233177185058594, -13.497393608093262, -10.76161003112793, -8.025827407836914, -5.290044784545898, -2.55426025390625, 0.18152236938476562, 2.9173049926757812, 5.653088092803955, 8.388871192932129, 11.124654769897461, 13.860437393188477, 16.596220016479492, 19.33200454711914, 22.067787170410156, 24.803569793701172, 27.539352416992188, 30.275135040283203, 33.01091766357422, 35.7467041015625, 38.48248291015625, 41.21826934814453, 43.95405197143555, 46.68983459472656, 49.42561721801758, 52.161399841308594, 54.897186279296875, 57.632965087890625, 60.368751525878906, 63.10453414916992, 65.84031677246094, 68.57609558105469, 71.31188201904297, 74.04766082763672, 76.783447265625, 79.51922607421875, 82.25501251220703, 84.99079895019531, 87.72657775878906, 90.46236419677734]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 6.0, 11.0, 16.0, 19.0, 23.0, 42.0, 48.0, 62.0, 86.0, 146.0, 222.0, 319.0, 472.0, 793.0, 1212.0, 1871.0, 3316.0, 6165.0, 12619.0, 30491.0, 95204.0, 3482194.0, 439447.0, 71242.0, 24686.0, 10606.0, 5264.0, 2906.0, 1669.0, 1106.0, 637.0, 425.0, 287.0, 203.0, 135.0, 83.0, 56.0, 56.0, 40.0, 23.0, 24.0, 9.0, 12.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.3515625, -11.95166015625, -11.5517578125, -11.15185546875, -10.751953125, -10.35205078125, -9.9521484375, -9.55224609375, -9.15234375, -8.75244140625, -8.3525390625, -7.95263671875, -7.552734375, -7.15283203125, -6.7529296875, -6.35302734375, -5.953125, -5.55322265625, -5.1533203125, -4.75341796875, -4.353515625, -3.95361328125, -3.5537109375, -3.15380859375, -2.75390625, -2.35400390625, -1.9541015625, -1.55419921875, -1.154296875, -0.75439453125, -0.3544921875, 0.04541015625, 0.4453125, 0.84521484375, 1.2451171875, 1.64501953125, 2.044921875, 2.44482421875, 2.8447265625, 3.24462890625, 3.64453125, 4.04443359375, 4.4443359375, 4.84423828125, 5.244140625, 5.64404296875, 6.0439453125, 6.44384765625, 6.84375, 7.24365234375, 7.6435546875, 8.04345703125, 8.443359375, 8.84326171875, 9.2431640625, 9.64306640625, 10.04296875, 10.44287109375, 10.8427734375, 11.24267578125, 11.642578125, 12.04248046875, 12.4423828125, 12.84228515625, 13.2421875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 7.0, 5.0, 12.0, 12.0, 20.0, 19.0, 33.0, 39.0, 47.0, 51.0, 44.0, 55.0, 65.0, 67.0, 60.0, 51.0, 71.0, 53.0, 57.0, 42.0, 43.0, 32.0, 23.0, 25.0, 12.0, 11.0, 3.0, 10.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40625, -5.2432861328125, -5.080322265625, -4.9173583984375, -4.75439453125, -4.5914306640625, -4.428466796875, -4.2655029296875, -4.1025390625, -3.9395751953125, -3.776611328125, -3.6136474609375, -3.45068359375, -3.2877197265625, -3.124755859375, -2.9617919921875, -2.798828125, -2.6358642578125, -2.472900390625, -2.3099365234375, -2.14697265625, -1.9840087890625, -1.821044921875, -1.6580810546875, -1.4951171875, -1.3321533203125, -1.169189453125, -1.0062255859375, -0.84326171875, -0.6802978515625, -0.517333984375, -0.3543701171875, -0.19140625, -0.0284423828125, 0.134521484375, 0.2974853515625, 0.46044921875, 0.6234130859375, 0.786376953125, 0.9493408203125, 1.1123046875, 1.2752685546875, 1.438232421875, 1.6011962890625, 1.76416015625, 1.9271240234375, 2.090087890625, 2.2530517578125, 2.416015625, 2.5789794921875, 2.741943359375, 2.9049072265625, 3.06787109375, 3.2308349609375, 3.393798828125, 3.5567626953125, 3.7197265625, 3.8826904296875, 4.045654296875, 4.2086181640625, 4.37158203125, 4.5345458984375, 4.697509765625, 4.8604736328125, 5.0234375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 10.0, 7.0, 14.0, 26.0, 33.0, 61.0, 103.0, 200.0, 351.0, 855.0, 2501.0, 8676.0, 48014.0, 3388619.0, 695998.0, 37614.0, 7524.0, 2176.0, 823.0, 301.0, 149.0, 90.0, 40.0, 43.0, 21.0, 17.0, 6.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.125, -19.34912109375, -18.5732421875, -17.79736328125, -17.021484375, -16.24560546875, -15.4697265625, -14.69384765625, -13.91796875, -13.14208984375, -12.3662109375, -11.59033203125, -10.814453125, -10.03857421875, -9.2626953125, -8.48681640625, -7.7109375, -6.93505859375, -6.1591796875, -5.38330078125, -4.607421875, -3.83154296875, -3.0556640625, -2.27978515625, -1.50390625, -0.72802734375, 0.0478515625, 0.82373046875, 1.599609375, 2.37548828125, 3.1513671875, 3.92724609375, 4.703125, 5.47900390625, 6.2548828125, 7.03076171875, 7.806640625, 8.58251953125, 9.3583984375, 10.13427734375, 10.91015625, 11.68603515625, 12.4619140625, 13.23779296875, 14.013671875, 14.78955078125, 15.5654296875, 16.34130859375, 17.1171875, 17.89306640625, 18.6689453125, 19.44482421875, 20.220703125, 20.99658203125, 21.7724609375, 22.54833984375, 23.32421875, 24.10009765625, 24.8759765625, 25.65185546875, 26.427734375, 27.20361328125, 27.9794921875, 28.75537109375, 29.53125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 4.0, 2.0, 13.0, 12.0, 18.0, 33.0, 49.0, 87.0, 141.0, 302.0, 2610.0, 409.0, 146.0, 89.0, 43.0, 33.0, 15.0, 20.0, 14.0, 11.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.41796875, -4.3092041015625, -4.200439453125, -4.0916748046875, -3.98291015625, -3.8741455078125, -3.765380859375, -3.6566162109375, -3.5478515625, -3.4390869140625, -3.330322265625, -3.2215576171875, -3.11279296875, -3.0040283203125, -2.895263671875, -2.7864990234375, -2.677734375, -2.5689697265625, -2.460205078125, -2.3514404296875, -2.24267578125, -2.1339111328125, -2.025146484375, -1.9163818359375, -1.8076171875, -1.6988525390625, -1.590087890625, -1.4813232421875, -1.37255859375, -1.2637939453125, -1.155029296875, -1.0462646484375, -0.9375, -0.8287353515625, -0.719970703125, -0.6112060546875, -0.50244140625, -0.3936767578125, -0.284912109375, -0.1761474609375, -0.0673828125, 0.0413818359375, 0.150146484375, 0.2589111328125, 0.36767578125, 0.4764404296875, 0.585205078125, 0.6939697265625, 0.802734375, 0.9114990234375, 1.020263671875, 1.1290283203125, 1.23779296875, 1.3465576171875, 1.455322265625, 1.5640869140625, 1.6728515625, 1.7816162109375, 1.890380859375, 1.9991455078125, 2.10791015625, 2.2166748046875, 2.325439453125, 2.4342041015625, 2.54296875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 13.0, 7.0, 16.0, 21.0, 46.0, 55.0, 81.0, 92.0, 124.0, 142.0, 114.0, 93.0, 73.0, 46.0, 36.0, 17.0, 10.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.40271759033203, -21.832439422607422, -21.262161254882812, -20.691883087158203, -20.121604919433594, -19.551326751708984, -18.981048583984375, -18.410770416259766, -17.840492248535156, -17.270214080810547, -16.699935913085938, -16.129657745361328, -15.559379577636719, -14.98910140991211, -14.4188232421875, -13.84854507446289, -13.278267860412598, -12.707989692687988, -12.137711524963379, -11.56743335723877, -10.99715518951416, -10.42687702178955, -9.856599807739258, -9.286321640014648, -8.716043472290039, -8.14576530456543, -7.57548713684082, -7.005208969116211, -6.434930801391602, -5.864652633666992, -5.294374942779541, -4.724096775054932, -4.153818130493164, -3.5835399627685547, -3.0132617950439453, -2.442983865737915, -1.8727056980133057, -1.3024275302886963, -0.732149600982666, -0.16187143325805664, 0.40840673446655273, 0.9786848425865173, 1.548962950706482, 2.1192409992218018, 2.689519166946411, 3.2597973346710205, 3.830075263977051, 4.40035343170166, 4.9706315994262695, 5.540909767150879, 6.111187934875488, 6.681466102600098, 7.251744270324707, 7.822022438049316, 8.39229965209961, 8.962577819824219, 9.532855987548828, 10.103134155273438, 10.673412322998047, 11.243690490722656, 11.813968658447266, 12.384246826171875, 12.954524993896484, 13.524803161621094, 14.095081329345703]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 8.0, 6.0, 10.0, 11.0, 10.0, 13.0, 14.0, 18.0, 21.0, 14.0, 23.0, 21.0, 32.0, 27.0, 32.0, 31.0, 39.0, 26.0, 47.0, 38.0, 40.0, 45.0, 40.0, 39.0, 22.0, 35.0, 40.0, 38.0, 34.0, 32.0, 34.0, 23.0, 26.0, 19.0, 15.0, 13.0, 16.0, 16.0, 7.0, 8.0, 2.0, 2.0, 3.0, 7.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1619720458984375, -5.936976432800293, -5.711980819702148, -5.486985206604004, -5.261989593505859, -5.036993980407715, -4.81199836730957, -4.587002754211426, -4.362007141113281, -4.137011528015137, -3.912015914916992, -3.6870203018188477, -3.462024688720703, -3.2370290756225586, -3.012033462524414, -2.7870378494262695, -2.562042236328125, -2.3370466232299805, -2.112051010131836, -1.8870553970336914, -1.6620597839355469, -1.4370641708374023, -1.2120685577392578, -0.9870729446411133, -0.7620773315429688, -0.5370817184448242, -0.3120861053466797, -0.08709049224853516, 0.13790512084960938, 0.3629007339477539, 0.5878963470458984, 0.812891960144043, 1.0378875732421875, 1.262883186340332, 1.4878787994384766, 1.712874412536621, 1.9378700256347656, 2.16286563873291, 2.3878612518310547, 2.612856864929199, 2.8378524780273438, 3.0628480911254883, 3.287843704223633, 3.5128393173217773, 3.737834930419922, 3.9628305435180664, 4.187826156616211, 4.4128217697143555, 4.6378173828125, 4.8628129959106445, 5.087808609008789, 5.312804222106934, 5.537799835205078, 5.762795448303223, 5.987791061401367, 6.212786674499512, 6.437782287597656, 6.662777900695801, 6.887773513793945, 7.11276912689209, 7.337764739990234, 7.562760353088379, 7.787755966186523, 8.012751579284668, 8.237747192382812]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 8.0, 18.0, 31.0, 47.0, 73.0, 170.0, 309.0, 659.0, 1553.0, 4607.0, 14274.0, 45791.0, 135887.0, 303766.0, 317052.0, 149207.0, 50778.0, 16101.0, 5048.0, 1803.0, 723.0, 291.0, 151.0, 88.0, 47.0, 23.0, 16.0, 8.0, 6.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.03125, -14.6142578125, -14.197265625, -13.7802734375, -13.36328125, -12.9462890625, -12.529296875, -12.1123046875, -11.6953125, -11.2783203125, -10.861328125, -10.4443359375, -10.02734375, -9.6103515625, -9.193359375, -8.7763671875, -8.359375, -7.9423828125, -7.525390625, -7.1083984375, -6.69140625, -6.2744140625, -5.857421875, -5.4404296875, -5.0234375, -4.6064453125, -4.189453125, -3.7724609375, -3.35546875, -2.9384765625, -2.521484375, -2.1044921875, -1.6875, -1.2705078125, -0.853515625, -0.4365234375, -0.01953125, 0.3974609375, 0.814453125, 1.2314453125, 1.6484375, 2.0654296875, 2.482421875, 2.8994140625, 3.31640625, 3.7333984375, 4.150390625, 4.5673828125, 4.984375, 5.4013671875, 5.818359375, 6.2353515625, 6.65234375, 7.0693359375, 7.486328125, 7.9033203125, 8.3203125, 8.7373046875, 9.154296875, 9.5712890625, 9.98828125, 10.4052734375, 10.822265625, 11.2392578125, 11.65625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 8.0, 13.0, 16.0, 23.0, 31.0, 36.0, 35.0, 43.0, 49.0, 49.0, 52.0, 61.0, 70.0, 50.0, 67.0, 56.0, 68.0, 50.0, 34.0, 29.0, 36.0, 33.0, 17.0, 17.0, 10.0, 13.0, 6.0, 2.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.540771484375, -5.36669921875, -5.192626953125, -5.0185546875, -4.844482421875, -4.67041015625, -4.496337890625, -4.322265625, -4.148193359375, -3.97412109375, -3.800048828125, -3.6259765625, -3.451904296875, -3.27783203125, -3.103759765625, -2.9296875, -2.755615234375, -2.58154296875, -2.407470703125, -2.2333984375, -2.059326171875, -1.88525390625, -1.711181640625, -1.537109375, -1.363037109375, -1.18896484375, -1.014892578125, -0.8408203125, -0.666748046875, -0.49267578125, -0.318603515625, -0.14453125, 0.029541015625, 0.20361328125, 0.377685546875, 0.5517578125, 0.725830078125, 0.89990234375, 1.073974609375, 1.248046875, 1.422119140625, 1.59619140625, 1.770263671875, 1.9443359375, 2.118408203125, 2.29248046875, 2.466552734375, 2.640625, 2.814697265625, 2.98876953125, 3.162841796875, 3.3369140625, 3.510986328125, 3.68505859375, 3.859130859375, 4.033203125, 4.207275390625, 4.38134765625, 4.555419921875, 4.7294921875, 4.903564453125, 5.07763671875, 5.251708984375, 5.42578125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 7.0, 8.0, 9.0, 21.0, 31.0, 40.0, 60.0, 90.0, 124.0, 173.0, 292.0, 426.0, 738.0, 1495.0, 4539.0, 26102.0, 226015.0, 640451.0, 126234.0, 15423.0, 3129.0, 1201.0, 704.0, 395.0, 276.0, 182.0, 119.0, 68.0, 44.0, 30.0, 30.0, 24.0, 16.0, 10.0, 6.0, 7.0, 7.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-23.53125, -22.80419921875, -22.0771484375, -21.35009765625, -20.623046875, -19.89599609375, -19.1689453125, -18.44189453125, -17.71484375, -16.98779296875, -16.2607421875, -15.53369140625, -14.806640625, -14.07958984375, -13.3525390625, -12.62548828125, -11.8984375, -11.17138671875, -10.4443359375, -9.71728515625, -8.990234375, -8.26318359375, -7.5361328125, -6.80908203125, -6.08203125, -5.35498046875, -4.6279296875, -3.90087890625, -3.173828125, -2.44677734375, -1.7197265625, -0.99267578125, -0.265625, 0.46142578125, 1.1884765625, 1.91552734375, 2.642578125, 3.36962890625, 4.0966796875, 4.82373046875, 5.55078125, 6.27783203125, 7.0048828125, 7.73193359375, 8.458984375, 9.18603515625, 9.9130859375, 10.64013671875, 11.3671875, 12.09423828125, 12.8212890625, 13.54833984375, 14.275390625, 15.00244140625, 15.7294921875, 16.45654296875, 17.18359375, 17.91064453125, 18.6376953125, 19.36474609375, 20.091796875, 20.81884765625, 21.5458984375, 22.27294921875, 23.0]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 5.0, 2.0, 1.0, 7.0, 8.0, 11.0, 7.0, 13.0, 13.0, 26.0, 22.0, 27.0, 30.0, 45.0, 27.0, 31.0, 40.0, 46.0, 47.0, 53.0, 57.0, 53.0, 57.0, 51.0, 42.0, 45.0, 35.0, 39.0, 21.0, 19.0, 36.0, 16.0, 18.0, 12.0, 10.0, 3.0, 4.0, 5.0, 3.0, 7.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-25.4375, -24.696044921875, -23.95458984375, -23.213134765625, -22.4716796875, -21.730224609375, -20.98876953125, -20.247314453125, -19.505859375, -18.764404296875, -18.02294921875, -17.281494140625, -16.5400390625, -15.798583984375, -15.05712890625, -14.315673828125, -13.57421875, -12.832763671875, -12.09130859375, -11.349853515625, -10.6083984375, -9.866943359375, -9.12548828125, -8.384033203125, -7.642578125, -6.901123046875, -6.15966796875, -5.418212890625, -4.6767578125, -3.935302734375, -3.19384765625, -2.452392578125, -1.7109375, -0.969482421875, -0.22802734375, 0.513427734375, 1.2548828125, 1.996337890625, 2.73779296875, 3.479248046875, 4.220703125, 4.962158203125, 5.70361328125, 6.445068359375, 7.1865234375, 7.927978515625, 8.66943359375, 9.410888671875, 10.15234375, 10.893798828125, 11.63525390625, 12.376708984375, 13.1181640625, 13.859619140625, 14.60107421875, 15.342529296875, 16.083984375, 16.825439453125, 17.56689453125, 18.308349609375, 19.0498046875, 19.791259765625, 20.53271484375, 21.274169921875, 22.015625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 10.0, 12.0, 17.0, 32.0, 81.0, 132.0, 344.0, 973.0, 4357.0, 40227.0, 576901.0, 395627.0, 25239.0, 3206.0, 811.0, 287.0, 136.0, 62.0, 37.0, 24.0, 11.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.265625, -12.8221435546875, -12.378662109375, -11.9351806640625, -11.49169921875, -11.0482177734375, -10.604736328125, -10.1612548828125, -9.7177734375, -9.2742919921875, -8.830810546875, -8.3873291015625, -7.94384765625, -7.5003662109375, -7.056884765625, -6.6134033203125, -6.169921875, -5.7264404296875, -5.282958984375, -4.8394775390625, -4.39599609375, -3.9525146484375, -3.509033203125, -3.0655517578125, -2.6220703125, -2.1785888671875, -1.735107421875, -1.2916259765625, -0.84814453125, -0.4046630859375, 0.038818359375, 0.4822998046875, 0.92578125, 1.3692626953125, 1.812744140625, 2.2562255859375, 2.69970703125, 3.1431884765625, 3.586669921875, 4.0301513671875, 4.4736328125, 4.9171142578125, 5.360595703125, 5.8040771484375, 6.24755859375, 6.6910400390625, 7.134521484375, 7.5780029296875, 8.021484375, 8.4649658203125, 8.908447265625, 9.3519287109375, 9.79541015625, 10.2388916015625, 10.682373046875, 11.1258544921875, 11.5693359375, 12.0128173828125, 12.456298828125, 12.8997802734375, 13.34326171875, 13.7867431640625, 14.230224609375, 14.6737060546875, 15.1171875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 8.0, 7.0, 7.0, 10.0, 20.0, 23.0, 27.0, 34.0, 34.0, 51.0, 41.0, 47.0, 78.0, 59.0, 67.0, 66.0, 81.0, 60.0, 68.0, 34.0, 31.0, 34.0, 25.0, 19.0, 9.0, 13.0, 11.0, 10.0, 4.0, 4.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0012292861938476562, -0.0011877268552780151, -0.001146167516708374, -0.001104608178138733, -0.0010630488395690918, -0.0010214895009994507, -0.0009799301624298096, -0.0009383708238601685, -0.0008968114852905273, -0.0008552521467208862, -0.0008136928081512451, -0.000772133469581604, -0.0007305741310119629, -0.0006890147924423218, -0.0006474554538726807, -0.0006058961153030396, -0.0005643367767333984, -0.0005227774381637573, -0.0004812180995941162, -0.0004396587610244751, -0.000398099422454834, -0.00035654008388519287, -0.00031498074531555176, -0.00027342140674591064, -0.00023186206817626953, -0.00019030272960662842, -0.0001487433910369873, -0.00010718405246734619, -6.562471389770508e-05, -2.4065375328063965e-05, 1.749396324157715e-05, 5.905330181121826e-05, 0.00010061264038085938, 0.0001421719789505005, 0.0001837313175201416, 0.00022529065608978271, 0.00026684999465942383, 0.00030840933322906494, 0.00034996867179870605, 0.00039152801036834717, 0.0004330873489379883, 0.0004746466875076294, 0.0005162060260772705, 0.0005577653646469116, 0.0005993247032165527, 0.0006408840417861938, 0.000682443380355835, 0.0007240027189254761, 0.0007655620574951172, 0.0008071213960647583, 0.0008486807346343994, 0.0008902400732040405, 0.0009317994117736816, 0.0009733587503433228, 0.0010149180889129639, 0.001056477427482605, 0.001098036766052246, 0.0011395961046218872, 0.0011811554431915283, 0.0012227147817611694, 0.0012642741203308105, 0.0013058334589004517, 0.0013473927974700928, 0.0013889521360397339, 0.001430511474609375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 11.0, 2.0, 13.0, 11.0, 21.0, 28.0, 44.0, 95.0, 193.0, 428.0, 1190.0, 4019.0, 33412.0, 579998.0, 402108.0, 21843.0, 3431.0, 984.0, 370.0, 172.0, 73.0, 41.0, 22.0, 19.0, 7.0, 6.0, 5.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5546875, -15.0673828125, -14.580078125, -14.0927734375, -13.60546875, -13.1181640625, -12.630859375, -12.1435546875, -11.65625, -11.1689453125, -10.681640625, -10.1943359375, -9.70703125, -9.2197265625, -8.732421875, -8.2451171875, -7.7578125, -7.2705078125, -6.783203125, -6.2958984375, -5.80859375, -5.3212890625, -4.833984375, -4.3466796875, -3.859375, -3.3720703125, -2.884765625, -2.3974609375, -1.91015625, -1.4228515625, -0.935546875, -0.4482421875, 0.0390625, 0.5263671875, 1.013671875, 1.5009765625, 1.98828125, 2.4755859375, 2.962890625, 3.4501953125, 3.9375, 4.4248046875, 4.912109375, 5.3994140625, 5.88671875, 6.3740234375, 6.861328125, 7.3486328125, 7.8359375, 8.3232421875, 8.810546875, 9.2978515625, 9.78515625, 10.2724609375, 10.759765625, 11.2470703125, 11.734375, 12.2216796875, 12.708984375, 13.1962890625, 13.68359375, 14.1708984375, 14.658203125, 15.1455078125, 15.6328125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 10.0, 20.0, 25.0, 33.0, 61.0, 81.0, 109.0, 162.0, 130.0, 109.0, 93.0, 63.0, 41.0, 26.0, 9.0, 9.0, 5.0, 4.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.96875, -15.4984130859375, -15.028076171875, -14.5577392578125, -14.08740234375, -13.6170654296875, -13.146728515625, -12.6763916015625, -12.2060546875, -11.7357177734375, -11.265380859375, -10.7950439453125, -10.32470703125, -9.8543701171875, -9.384033203125, -8.9136962890625, -8.443359375, -7.9730224609375, -7.502685546875, -7.0323486328125, -6.56201171875, -6.0916748046875, -5.621337890625, -5.1510009765625, -4.6806640625, -4.2103271484375, -3.739990234375, -3.2696533203125, -2.79931640625, -2.3289794921875, -1.858642578125, -1.3883056640625, -0.91796875, -0.4476318359375, 0.022705078125, 0.4930419921875, 0.96337890625, 1.4337158203125, 1.904052734375, 2.3743896484375, 2.8447265625, 3.3150634765625, 3.785400390625, 4.2557373046875, 4.72607421875, 5.1964111328125, 5.666748046875, 6.1370849609375, 6.607421875, 7.0777587890625, 7.548095703125, 8.0184326171875, 8.48876953125, 8.9591064453125, 9.429443359375, 9.8997802734375, 10.3701171875, 10.8404541015625, 11.310791015625, 11.7811279296875, 12.25146484375, 12.7218017578125, 13.192138671875, 13.6624755859375, 14.1328125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 20.0, 30.0, 65.0, 136.0, 222.0, 194.0, 158.0, 95.0, 52.0, 15.0, 10.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-214.3706817626953, -207.46087646484375, -200.5510711669922, -193.6412811279297, -186.73147583007812, -179.82167053222656, -172.911865234375, -166.0020751953125, -159.09226989746094, -152.18246459960938, -145.2726593017578, -138.3628692626953, -131.45306396484375, -124.54325866699219, -117.63345336914062, -110.7236557006836, -103.81385040283203, -96.90404510498047, -89.99424743652344, -83.08444213867188, -76.17464447021484, -69.26483917236328, -62.355037689208984, -55.44523620605469, -48.53543472290039, -41.625633239746094, -34.7158317565918, -27.806028366088867, -20.89622688293457, -13.98642349243164, -7.076622009277344, -0.16682052612304688, 6.74298095703125, 13.652782440185547, 20.562583923339844, 27.472387313842773, 34.38218688964844, 41.2919921875, 48.2017936706543, 55.111595153808594, 62.02139663696289, 68.93119812011719, 75.84100341796875, 82.75080108642578, 89.66060638427734, 96.57040405273438, 103.48020935058594, 110.3900146484375, 117.29981231689453, 124.2096176147461, 131.11941528320312, 138.0292205810547, 144.93902587890625, 151.84881591796875, 158.7586212158203, 165.66842651367188, 172.57823181152344, 179.488037109375, 186.39784240722656, 193.30763244628906, 200.21743774414062, 207.1272430419922, 214.03704833984375, 220.94683837890625, 227.8566436767578]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 4.0, 7.0, 5.0, 6.0, 11.0, 11.0, 15.0, 11.0, 21.0, 21.0, 22.0, 23.0, 25.0, 26.0, 35.0, 33.0, 39.0, 34.0, 34.0, 44.0, 47.0, 44.0, 42.0, 44.0, 36.0, 30.0, 38.0, 41.0, 30.0, 25.0, 29.0, 23.0, 22.0, 14.0, 20.0, 17.0, 17.0, 10.0, 9.0, 9.0, 7.0, 7.0, 5.0, 1.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-84.09310913085938, -81.26773834228516, -78.44236755371094, -75.61700439453125, -72.79163360595703, -69.96626281738281, -67.14089965820312, -64.3155288696289, -61.49015808105469, -58.66478729248047, -55.839420318603516, -53.01405334472656, -50.188682556152344, -47.363311767578125, -44.53794479370117, -41.71257781982422, -38.88720703125, -36.06183624267578, -33.23646926879883, -30.411100387573242, -27.585731506347656, -24.76036262512207, -21.934993743896484, -19.1096248626709, -16.284255981445312, -13.458887100219727, -10.63351821899414, -7.808149337768555, -4.982780456542969, -2.157411575317383, 0.6679573059082031, 3.493326187133789, 6.318695068359375, 9.144063949584961, 11.969432830810547, 14.794801712036133, 17.62017059326172, 20.445539474487305, 23.27090835571289, 26.096277236938477, 28.921646118164062, 31.74701499938965, 34.572383880615234, 37.39775085449219, 40.223121643066406, 43.048492431640625, 45.87385940551758, 48.69922637939453, 51.52459716796875, 54.34996795654297, 57.17533493041992, 60.000701904296875, 62.826072692871094, 65.65144348144531, 68.476806640625, 71.30217742919922, 74.12754821777344, 76.95291900634766, 79.77828979492188, 82.60365295410156, 85.42902374267578, 88.25439453125, 91.07975769042969, 93.9051284790039, 96.73049926757812]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 2.0, 3.0, 7.0, 13.0, 17.0, 34.0, 51.0, 82.0, 147.0, 240.0, 474.0, 814.0, 1575.0, 3240.0, 6766.0, 16633.0, 48644.0, 248068.0, 3682112.0, 129377.0, 33181.0, 12343.0, 5115.0, 2513.0, 1307.0, 671.0, 374.0, 207.0, 106.0, 70.0, 35.0, 18.0, 20.0, 5.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.412841796875, -11.98974609375, -11.566650390625, -11.1435546875, -10.720458984375, -10.29736328125, -9.874267578125, -9.451171875, -9.028076171875, -8.60498046875, -8.181884765625, -7.7587890625, -7.335693359375, -6.91259765625, -6.489501953125, -6.06640625, -5.643310546875, -5.22021484375, -4.797119140625, -4.3740234375, -3.950927734375, -3.52783203125, -3.104736328125, -2.681640625, -2.258544921875, -1.83544921875, -1.412353515625, -0.9892578125, -0.566162109375, -0.14306640625, 0.280029296875, 0.703125, 1.126220703125, 1.54931640625, 1.972412109375, 2.3955078125, 2.818603515625, 3.24169921875, 3.664794921875, 4.087890625, 4.510986328125, 4.93408203125, 5.357177734375, 5.7802734375, 6.203369140625, 6.62646484375, 7.049560546875, 7.47265625, 7.895751953125, 8.31884765625, 8.741943359375, 9.1650390625, 9.588134765625, 10.01123046875, 10.434326171875, 10.857421875, 11.280517578125, 11.70361328125, 12.126708984375, 12.5498046875, 12.972900390625, 13.39599609375, 13.819091796875, 14.2421875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 18.0, 13.0, 16.0, 24.0, 33.0, 38.0, 42.0, 36.0, 58.0, 48.0, 53.0, 65.0, 58.0, 54.0, 61.0, 50.0, 45.0, 46.0, 43.0, 40.0, 34.0, 17.0, 28.0, 11.0, 13.0, 11.0, 8.0, 7.0, 10.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4375, -6.27178955078125, -6.1060791015625, -5.94036865234375, -5.774658203125, -5.60894775390625, -5.4432373046875, -5.27752685546875, -5.11181640625, -4.94610595703125, -4.7803955078125, -4.61468505859375, -4.448974609375, -4.28326416015625, -4.1175537109375, -3.95184326171875, -3.7861328125, -3.62042236328125, -3.4547119140625, -3.28900146484375, -3.123291015625, -2.95758056640625, -2.7918701171875, -2.62615966796875, -2.46044921875, -2.29473876953125, -2.1290283203125, -1.96331787109375, -1.797607421875, -1.63189697265625, -1.4661865234375, -1.30047607421875, -1.134765625, -0.96905517578125, -0.8033447265625, -0.63763427734375, -0.471923828125, -0.30621337890625, -0.1405029296875, 0.02520751953125, 0.19091796875, 0.35662841796875, 0.5223388671875, 0.68804931640625, 0.853759765625, 1.01947021484375, 1.1851806640625, 1.35089111328125, 1.5166015625, 1.68231201171875, 1.8480224609375, 2.01373291015625, 2.179443359375, 2.34515380859375, 2.5108642578125, 2.67657470703125, 2.84228515625, 3.00799560546875, 3.1737060546875, 3.33941650390625, 3.505126953125, 3.67083740234375, 3.8365478515625, 4.00225830078125, 4.16796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 6.0, 15.0, 17.0, 19.0, 29.0, 60.0, 58.0, 100.0, 210.0, 380.0, 747.0, 1474.0, 3675.0, 10129.0, 34229.0, 190010.0, 3672728.0, 224334.0, 38042.0, 11035.0, 3812.0, 1563.0, 721.0, 335.0, 216.0, 124.0, 80.0, 41.0, 22.0, 21.0, 15.0, 12.0, 7.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2265625, -14.7279052734375, -14.229248046875, -13.7305908203125, -13.23193359375, -12.7332763671875, -12.234619140625, -11.7359619140625, -11.2373046875, -10.7386474609375, -10.239990234375, -9.7413330078125, -9.24267578125, -8.7440185546875, -8.245361328125, -7.7467041015625, -7.248046875, -6.7493896484375, -6.250732421875, -5.7520751953125, -5.25341796875, -4.7547607421875, -4.256103515625, -3.7574462890625, -3.2587890625, -2.7601318359375, -2.261474609375, -1.7628173828125, -1.26416015625, -0.7655029296875, -0.266845703125, 0.2318115234375, 0.73046875, 1.2291259765625, 1.727783203125, 2.2264404296875, 2.72509765625, 3.2237548828125, 3.722412109375, 4.2210693359375, 4.7197265625, 5.2183837890625, 5.717041015625, 6.2156982421875, 6.71435546875, 7.2130126953125, 7.711669921875, 8.2103271484375, 8.708984375, 9.2076416015625, 9.706298828125, 10.2049560546875, 10.70361328125, 11.2022705078125, 11.700927734375, 12.1995849609375, 12.6982421875, 13.1968994140625, 13.695556640625, 14.1942138671875, 14.69287109375, 15.1915283203125, 15.690185546875, 16.1888427734375, 16.6875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 4.0, 9.0, 18.0, 17.0, 28.0, 23.0, 47.0, 67.0, 135.0, 266.0, 1598.0, 1219.0, 232.0, 138.0, 85.0, 44.0, 43.0, 20.0, 15.0, 14.0, 9.0, 10.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08984375, -2.986846923828125, -2.88385009765625, -2.780853271484375, -2.6778564453125, -2.574859619140625, -2.47186279296875, -2.368865966796875, -2.265869140625, -2.162872314453125, -2.05987548828125, -1.956878662109375, -1.8538818359375, -1.750885009765625, -1.64788818359375, -1.544891357421875, -1.44189453125, -1.338897705078125, -1.23590087890625, -1.132904052734375, -1.0299072265625, -0.926910400390625, -0.82391357421875, -0.720916748046875, -0.617919921875, -0.514923095703125, -0.41192626953125, -0.308929443359375, -0.2059326171875, -0.102935791015625, 6.103515625e-05, 0.103057861328125, 0.2060546875, 0.309051513671875, 0.41204833984375, 0.515045166015625, 0.6180419921875, 0.721038818359375, 0.82403564453125, 0.927032470703125, 1.030029296875, 1.133026123046875, 1.23602294921875, 1.339019775390625, 1.4420166015625, 1.545013427734375, 1.64801025390625, 1.751007080078125, 1.85400390625, 1.957000732421875, 2.05999755859375, 2.162994384765625, 2.2659912109375, 2.368988037109375, 2.47198486328125, 2.574981689453125, 2.677978515625, 2.780975341796875, 2.88397216796875, 2.986968994140625, 3.0899658203125, 3.192962646484375, 3.29595947265625, 3.398956298828125, 3.501953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 6.0, 10.0, 13.0, 24.0, 17.0, 30.0, 27.0, 48.0, 54.0, 65.0, 75.0, 75.0, 74.0, 78.0, 80.0, 64.0, 50.0, 46.0, 26.0, 30.0, 28.0, 20.0, 14.0, 9.0, 4.0, 10.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.424139022827148, -13.043779373168945, -12.663419723510742, -12.283060073852539, -11.902700424194336, -11.522340774536133, -11.14198112487793, -10.761621475219727, -10.381261825561523, -10.00090217590332, -9.620542526245117, -9.240182876586914, -8.859823226928711, -8.479463577270508, -8.099103927612305, -7.718743801116943, -7.338383674621582, -6.958024024963379, -6.577664375305176, -6.197304725646973, -5.8169450759887695, -5.436585426330566, -5.056225299835205, -4.675865650177002, -4.295506000518799, -3.9151463508605957, -3.5347867012023926, -3.1544268131256104, -2.7740671634674072, -2.393707513809204, -2.013347625732422, -1.6329879760742188, -1.252629280090332, -0.8722695708274841, -0.49190986156463623, -0.11155009269714355, 0.26880955696105957, 0.6491692066192627, 1.029529094696045, 1.409888744354248, 1.7902483940124512, 2.1706080436706543, 2.5509676933288574, 2.9313275814056396, 3.3116872310638428, 3.692046880722046, 4.072406768798828, 4.452766418457031, 4.833126068115234, 5.2134857177734375, 5.593845367431641, 5.974205017089844, 6.354564666748047, 6.73492431640625, 7.115284442901611, 7.4956440925598145, 7.876003742218018, 8.256363868713379, 8.636723518371582, 9.017083168029785, 9.397442817687988, 9.777802467346191, 10.158162117004395, 10.538521766662598, 10.9188814163208]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 11.0, 8.0, 15.0, 11.0, 9.0, 12.0, 24.0, 19.0, 27.0, 36.0, 32.0, 20.0, 28.0, 33.0, 47.0, 39.0, 41.0, 36.0, 51.0, 48.0, 37.0, 41.0, 37.0, 39.0, 32.0, 30.0, 34.0, 28.0, 31.0, 27.0, 18.0, 17.0, 8.0, 17.0, 15.0, 11.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.556029319763184, -8.2909574508667, -8.025885581970215, -7.760814189910889, -7.4957427978515625, -7.230670928955078, -6.965599060058594, -6.700527191162109, -6.435455799102783, -6.170383930206299, -5.905312538146973, -5.640240669250488, -5.375168800354004, -5.110097408294678, -4.845025539398193, -4.579954147338867, -4.314882278442383, -4.049810409545898, -3.7847390174865723, -3.519667148590088, -3.2545955181121826, -2.9895238876342773, -2.724452018737793, -2.4593803882598877, -2.1943087577819824, -1.9292371273040771, -1.6641653776168823, -1.3990936279296875, -1.1340219974517822, -0.868950366973877, -0.6038786172866821, -0.3388068675994873, -0.07373428344726562, 0.19133740663528442, 0.4564090967178345, 0.7214807868003845, 0.9865524768829346, 1.2516241073608398, 1.5166958570480347, 1.7817676067352295, 2.0468392372131348, 2.31191086769104, 2.5769824981689453, 2.8420543670654297, 3.107125997543335, 3.3721976280212402, 3.6372694969177246, 3.90234112739563, 4.167412757873535, 4.4324846267700195, 4.697556018829346, 4.96262788772583, 5.227699279785156, 5.492771148681641, 5.757843017578125, 6.022914886474609, 6.2879862785339355, 6.55305814743042, 6.818129539489746, 7.0832014083862305, 7.348273277282715, 7.613344669342041, 7.878416538238525, 8.143487930297852, 8.408559799194336]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 5.0, 7.0, 14.0, 17.0, 28.0, 34.0, 53.0, 75.0, 123.0, 155.0, 275.0, 445.0, 748.0, 1360.0, 2458.0, 4503.0, 9043.0, 17594.0, 34730.0, 67237.0, 122328.0, 187981.0, 213572.0, 168349.0, 103479.0, 55380.0, 28130.0, 14187.0, 7423.0, 3944.0, 2045.0, 1147.0, 670.0, 366.0, 213.0, 166.0, 93.0, 64.0, 40.0, 26.0, 14.0, 13.0, 5.0, 6.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-6.91796875, -6.7041015625, -6.490234375, -6.2763671875, -6.0625, -5.8486328125, -5.634765625, -5.4208984375, -5.20703125, -4.9931640625, -4.779296875, -4.5654296875, -4.3515625, -4.1376953125, -3.923828125, -3.7099609375, -3.49609375, -3.2822265625, -3.068359375, -2.8544921875, -2.640625, -2.4267578125, -2.212890625, -1.9990234375, -1.78515625, -1.5712890625, -1.357421875, -1.1435546875, -0.9296875, -0.7158203125, -0.501953125, -0.2880859375, -0.07421875, 0.1396484375, 0.353515625, 0.5673828125, 0.78125, 0.9951171875, 1.208984375, 1.4228515625, 1.63671875, 1.8505859375, 2.064453125, 2.2783203125, 2.4921875, 2.7060546875, 2.919921875, 3.1337890625, 3.34765625, 3.5615234375, 3.775390625, 3.9892578125, 4.203125, 4.4169921875, 4.630859375, 4.8447265625, 5.05859375, 5.2724609375, 5.486328125, 5.7001953125, 5.9140625, 6.1279296875, 6.341796875, 6.5556640625, 6.76953125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 10.0, 13.0, 21.0, 28.0, 28.0, 30.0, 31.0, 37.0, 44.0, 46.0, 45.0, 51.0, 66.0, 59.0, 51.0, 54.0, 35.0, 29.0, 52.0, 50.0, 48.0, 24.0, 21.0, 21.0, 15.0, 16.0, 10.0, 9.0, 9.0, 10.0, 8.0, 4.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.52734375, -5.36810302734375, -5.2088623046875, -5.04962158203125, -4.890380859375, -4.73114013671875, -4.5718994140625, -4.41265869140625, -4.25341796875, -4.09417724609375, -3.9349365234375, -3.77569580078125, -3.616455078125, -3.45721435546875, -3.2979736328125, -3.13873291015625, -2.9794921875, -2.82025146484375, -2.6610107421875, -2.50177001953125, -2.342529296875, -2.18328857421875, -2.0240478515625, -1.86480712890625, -1.70556640625, -1.54632568359375, -1.3870849609375, -1.22784423828125, -1.068603515625, -0.90936279296875, -0.7501220703125, -0.59088134765625, -0.431640625, -0.27239990234375, -0.1131591796875, 0.04608154296875, 0.205322265625, 0.36456298828125, 0.5238037109375, 0.68304443359375, 0.84228515625, 1.00152587890625, 1.1607666015625, 1.32000732421875, 1.479248046875, 1.63848876953125, 1.7977294921875, 1.95697021484375, 2.1162109375, 2.27545166015625, 2.4346923828125, 2.59393310546875, 2.753173828125, 2.91241455078125, 3.0716552734375, 3.23089599609375, 3.39013671875, 3.54937744140625, 3.7086181640625, 3.86785888671875, 4.027099609375, 4.18634033203125, 4.3455810546875, 4.50482177734375, 4.6640625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 6.0, 19.0, 18.0, 28.0, 45.0, 61.0, 100.0, 184.0, 287.0, 595.0, 1036.0, 2470.0, 11650.0, 168349.0, 780380.0, 72353.0, 7054.0, 1894.0, 875.0, 454.0, 247.0, 154.0, 88.0, 63.0, 46.0, 25.0, 15.0, 11.0, 11.0, 10.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.234375, -26.33740234375, -25.4404296875, -24.54345703125, -23.646484375, -22.74951171875, -21.8525390625, -20.95556640625, -20.05859375, -19.16162109375, -18.2646484375, -17.36767578125, -16.470703125, -15.57373046875, -14.6767578125, -13.77978515625, -12.8828125, -11.98583984375, -11.0888671875, -10.19189453125, -9.294921875, -8.39794921875, -7.5009765625, -6.60400390625, -5.70703125, -4.81005859375, -3.9130859375, -3.01611328125, -2.119140625, -1.22216796875, -0.3251953125, 0.57177734375, 1.46875, 2.36572265625, 3.2626953125, 4.15966796875, 5.056640625, 5.95361328125, 6.8505859375, 7.74755859375, 8.64453125, 9.54150390625, 10.4384765625, 11.33544921875, 12.232421875, 13.12939453125, 14.0263671875, 14.92333984375, 15.8203125, 16.71728515625, 17.6142578125, 18.51123046875, 19.408203125, 20.30517578125, 21.2021484375, 22.09912109375, 22.99609375, 23.89306640625, 24.7900390625, 25.68701171875, 26.583984375, 27.48095703125, 28.3779296875, 29.27490234375, 30.171875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 6.0, 10.0, 12.0, 8.0, 16.0, 21.0, 29.0, 33.0, 47.0, 58.0, 61.0, 65.0, 63.0, 68.0, 73.0, 74.0, 54.0, 48.0, 57.0, 36.0, 42.0, 29.0, 22.0, 16.0, 9.0, 14.0, 9.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.4375, -34.452392578125, -33.46728515625, -32.482177734375, -31.4970703125, -30.511962890625, -29.52685546875, -28.541748046875, -27.556640625, -26.571533203125, -25.58642578125, -24.601318359375, -23.6162109375, -22.631103515625, -21.64599609375, -20.660888671875, -19.67578125, -18.690673828125, -17.70556640625, -16.720458984375, -15.7353515625, -14.750244140625, -13.76513671875, -12.780029296875, -11.794921875, -10.809814453125, -9.82470703125, -8.839599609375, -7.8544921875, -6.869384765625, -5.88427734375, -4.899169921875, -3.9140625, -2.928955078125, -1.94384765625, -0.958740234375, 0.0263671875, 1.011474609375, 1.99658203125, 2.981689453125, 3.966796875, 4.951904296875, 5.93701171875, 6.922119140625, 7.9072265625, 8.892333984375, 9.87744140625, 10.862548828125, 11.84765625, 12.832763671875, 13.81787109375, 14.802978515625, 15.7880859375, 16.773193359375, 17.75830078125, 18.743408203125, 19.728515625, 20.713623046875, 21.69873046875, 22.683837890625, 23.6689453125, 24.654052734375, 25.63916015625, 26.624267578125, 27.609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 4.0, 8.0, 6.0, 13.0, 15.0, 23.0, 30.0, 40.0, 53.0, 81.0, 136.0, 213.0, 358.0, 669.0, 1444.0, 3950.0, 14411.0, 81926.0, 565462.0, 322687.0, 42815.0, 9000.0, 2742.0, 1070.0, 524.0, 312.0, 182.0, 108.0, 71.0, 54.0, 38.0, 17.0, 24.0, 10.0, 16.0, 11.0, 8.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5859375, -9.2939453125, -9.001953125, -8.7099609375, -8.41796875, -8.1259765625, -7.833984375, -7.5419921875, -7.25, -6.9580078125, -6.666015625, -6.3740234375, -6.08203125, -5.7900390625, -5.498046875, -5.2060546875, -4.9140625, -4.6220703125, -4.330078125, -4.0380859375, -3.74609375, -3.4541015625, -3.162109375, -2.8701171875, -2.578125, -2.2861328125, -1.994140625, -1.7021484375, -1.41015625, -1.1181640625, -0.826171875, -0.5341796875, -0.2421875, 0.0498046875, 0.341796875, 0.6337890625, 0.92578125, 1.2177734375, 1.509765625, 1.8017578125, 2.09375, 2.3857421875, 2.677734375, 2.9697265625, 3.26171875, 3.5537109375, 3.845703125, 4.1376953125, 4.4296875, 4.7216796875, 5.013671875, 5.3056640625, 5.59765625, 5.8896484375, 6.181640625, 6.4736328125, 6.765625, 7.0576171875, 7.349609375, 7.6416015625, 7.93359375, 8.2255859375, 8.517578125, 8.8095703125, 9.1015625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 5.0, 7.0, 10.0, 11.0, 18.0, 21.0, 28.0, 40.0, 41.0, 69.0, 80.0, 108.0, 116.0, 104.0, 75.0, 60.0, 53.0, 30.0, 27.0, 15.0, 15.0, 16.0, 10.0, 10.0, 4.0, 11.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00179290771484375, -0.0017375648021697998, -0.0016822218894958496, -0.0016268789768218994, -0.0015715360641479492, -0.001516193151473999, -0.0014608502388000488, -0.0014055073261260986, -0.0013501644134521484, -0.0012948215007781982, -0.001239478588104248, -0.0011841356754302979, -0.0011287927627563477, -0.0010734498500823975, -0.0010181069374084473, -0.0009627640247344971, -0.0009074211120605469, -0.0008520781993865967, -0.0007967352867126465, -0.0007413923740386963, -0.0006860494613647461, -0.0006307065486907959, -0.0005753636360168457, -0.0005200207233428955, -0.0004646778106689453, -0.0004093348979949951, -0.0003539919853210449, -0.0002986490726470947, -0.00024330615997314453, -0.00018796324729919434, -0.00013262033462524414, -7.727742195129395e-05, -2.193450927734375e-05, 3.3408403396606445e-05, 8.875131607055664e-05, 0.00014409422874450684, 0.00019943714141845703, 0.0002547800540924072, 0.0003101229667663574, 0.0003654658794403076, 0.0004208087921142578, 0.000476151704788208, 0.0005314946174621582, 0.0005868375301361084, 0.0006421804428100586, 0.0006975233554840088, 0.000752866268157959, 0.0008082091808319092, 0.0008635520935058594, 0.0009188950061798096, 0.0009742379188537598, 0.00102958083152771, 0.0010849237442016602, 0.0011402666568756104, 0.0011956095695495605, 0.0012509524822235107, 0.001306295394897461, 0.0013616383075714111, 0.0014169812202453613, 0.0014723241329193115, 0.0015276670455932617, 0.001583009958267212, 0.0016383528709411621, 0.0016936957836151123, 0.0017490386962890625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 6.0, 10.0, 14.0, 25.0, 36.0, 49.0, 82.0, 124.0, 227.0, 455.0, 976.0, 2626.0, 11552.0, 112069.0, 759626.0, 142230.0, 13330.0, 2915.0, 1120.0, 459.0, 237.0, 129.0, 98.0, 42.0, 32.0, 23.0, 13.0, 15.0, 8.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7890625, -10.3973388671875, -10.005615234375, -9.6138916015625, -9.22216796875, -8.8304443359375, -8.438720703125, -8.0469970703125, -7.6552734375, -7.2635498046875, -6.871826171875, -6.4801025390625, -6.08837890625, -5.6966552734375, -5.304931640625, -4.9132080078125, -4.521484375, -4.1297607421875, -3.738037109375, -3.3463134765625, -2.95458984375, -2.5628662109375, -2.171142578125, -1.7794189453125, -1.3876953125, -0.9959716796875, -0.604248046875, -0.2125244140625, 0.17919921875, 0.5709228515625, 0.962646484375, 1.3543701171875, 1.74609375, 2.1378173828125, 2.529541015625, 2.9212646484375, 3.31298828125, 3.7047119140625, 4.096435546875, 4.4881591796875, 4.8798828125, 5.2716064453125, 5.663330078125, 6.0550537109375, 6.44677734375, 6.8385009765625, 7.230224609375, 7.6219482421875, 8.013671875, 8.4053955078125, 8.797119140625, 9.1888427734375, 9.58056640625, 9.9722900390625, 10.364013671875, 10.7557373046875, 11.1474609375, 11.5391845703125, 11.930908203125, 12.3226318359375, 12.71435546875, 13.1060791015625, 13.497802734375, 13.8895263671875, 14.28125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 4.0, 14.0, 9.0, 9.0, 16.0, 25.0, 31.0, 32.0, 50.0, 59.0, 61.0, 63.0, 92.0, 88.0, 90.0, 71.0, 63.0, 31.0, 39.0, 31.0, 22.0, 19.0, 14.0, 13.0, 4.0, 7.0, 4.0, 4.0, 6.0, 1.0, 8.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.0859375, -6.8497314453125, -6.613525390625, -6.3773193359375, -6.14111328125, -5.9049072265625, -5.668701171875, -5.4324951171875, -5.1962890625, -4.9600830078125, -4.723876953125, -4.4876708984375, -4.25146484375, -4.0152587890625, -3.779052734375, -3.5428466796875, -3.306640625, -3.0704345703125, -2.834228515625, -2.5980224609375, -2.36181640625, -2.1256103515625, -1.889404296875, -1.6531982421875, -1.4169921875, -1.1807861328125, -0.944580078125, -0.7083740234375, -0.47216796875, -0.2359619140625, 0.000244140625, 0.2364501953125, 0.47265625, 0.7088623046875, 0.945068359375, 1.1812744140625, 1.41748046875, 1.6536865234375, 1.889892578125, 2.1260986328125, 2.3623046875, 2.5985107421875, 2.834716796875, 3.0709228515625, 3.30712890625, 3.5433349609375, 3.779541015625, 4.0157470703125, 4.251953125, 4.4881591796875, 4.724365234375, 4.9605712890625, 5.19677734375, 5.4329833984375, 5.669189453125, 5.9053955078125, 6.1416015625, 6.3778076171875, 6.614013671875, 6.8502197265625, 7.08642578125, 7.3226318359375, 7.558837890625, 7.7950439453125, 8.03125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 2.0, 4.0, 7.0, 20.0, 30.0, 58.0, 105.0, 104.0, 144.0, 134.0, 137.0, 94.0, 60.0, 39.0, 33.0, 6.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-196.7230224609375, -192.2137908935547, -187.70455932617188, -183.19534301757812, -178.6861114501953, -174.1768798828125, -169.6676483154297, -165.15841674804688, -160.64920043945312, -156.1399688720703, -151.6307373046875, -147.12152099609375, -142.61228942871094, -138.10305786132812, -133.5938262939453, -129.0845947265625, -124.57537078857422, -120.0661392211914, -115.55691528320312, -111.04768371582031, -106.53845977783203, -102.02922821044922, -97.52000427246094, -93.01077270507812, -88.50154113769531, -83.9923095703125, -79.48308563232422, -74.9738540649414, -70.46463012695312, -65.95539855957031, -61.446170806884766, -56.93694305419922, -52.42771911621094, -47.91849136352539, -43.409263610839844, -38.90003204345703, -34.39080810546875, -29.88157844543457, -25.37234878540039, -20.863121032714844, -16.353893280029297, -11.84466552734375, -7.335436820983887, -2.8262081146240234, 1.6830196380615234, 6.19224739074707, 10.70147705078125, 15.210704803466797, 19.719932556152344, 24.22916030883789, 28.738388061523438, 33.24761962890625, 37.75684356689453, 42.266075134277344, 46.77530288696289, 51.28453063964844, 55.793758392333984, 60.30298614501953, 64.81221771240234, 69.32144165039062, 73.83067321777344, 78.33989715576172, 82.84912872314453, 87.35835266113281, 91.86758422851562]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 6.0, 10.0, 4.0, 13.0, 14.0, 12.0, 37.0, 24.0, 29.0, 31.0, 30.0, 38.0, 35.0, 47.0, 58.0, 66.0, 45.0, 51.0, 51.0, 47.0, 44.0, 44.0, 43.0, 42.0, 28.0, 29.0, 20.0, 21.0, 14.0, 16.0, 12.0, 7.0, 10.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.01398468017578, -86.9566879272461, -83.89939880371094, -80.84210205078125, -77.7848129272461, -74.7275161743164, -71.67022705078125, -68.61293029785156, -65.5556411743164, -62.498348236083984, -59.44105529785156, -56.38376235961914, -53.32646942138672, -50.2691764831543, -47.211883544921875, -44.15458679199219, -41.097293853759766, -38.040000915527344, -34.98270797729492, -31.9254150390625, -28.868122100830078, -25.810829162597656, -22.7535343170166, -19.69624137878418, -16.638948440551758, -13.581655502319336, -10.524362564086914, -7.467068672180176, -4.409775733947754, -1.352482795715332, 1.7048110961914062, 4.762104034423828, 7.81939697265625, 10.876689910888672, 13.933982849121094, 16.991275787353516, 20.048568725585938, 23.10586166381836, 26.163156509399414, 29.220449447631836, 32.277740478515625, 35.33503341674805, 38.39232635498047, 41.44961929321289, 44.50691223144531, 47.564205169677734, 50.621498107910156, 53.678794860839844, 56.736087799072266, 59.79338073730469, 62.85067367553711, 65.90796661376953, 68.96526336669922, 72.02255249023438, 75.07984924316406, 78.13713836669922, 81.1944351196289, 84.2517318725586, 87.30902099609375, 90.36631774902344, 93.4236068725586, 96.48090362548828, 99.53819274902344, 102.59548950195312, 105.65277862548828]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 3.0, 5.0, 11.0, 7.0, 25.0, 25.0, 38.0, 51.0, 66.0, 91.0, 119.0, 176.0, 242.0, 422.0, 721.0, 1152.0, 2021.0, 3906.0, 8345.0, 20223.0, 66590.0, 3746149.0, 271533.0, 43230.0, 15064.0, 6501.0, 3149.0, 1663.0, 991.0, 607.0, 363.0, 232.0, 183.0, 105.0, 74.0, 60.0, 43.0, 26.0, 19.0, 16.0, 12.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.078125, -12.691650390625, -12.30517578125, -11.918701171875, -11.5322265625, -11.145751953125, -10.75927734375, -10.372802734375, -9.986328125, -9.599853515625, -9.21337890625, -8.826904296875, -8.4404296875, -8.053955078125, -7.66748046875, -7.281005859375, -6.89453125, -6.508056640625, -6.12158203125, -5.735107421875, -5.3486328125, -4.962158203125, -4.57568359375, -4.189208984375, -3.802734375, -3.416259765625, -3.02978515625, -2.643310546875, -2.2568359375, -1.870361328125, -1.48388671875, -1.097412109375, -0.7109375, -0.324462890625, 0.06201171875, 0.448486328125, 0.8349609375, 1.221435546875, 1.60791015625, 1.994384765625, 2.380859375, 2.767333984375, 3.15380859375, 3.540283203125, 3.9267578125, 4.313232421875, 4.69970703125, 5.086181640625, 5.47265625, 5.859130859375, 6.24560546875, 6.632080078125, 7.0185546875, 7.405029296875, 7.79150390625, 8.177978515625, 8.564453125, 8.950927734375, 9.33740234375, 9.723876953125, 10.1103515625, 10.496826171875, 10.88330078125, 11.269775390625, 11.65625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 6.0, 10.0, 15.0, 15.0, 21.0, 26.0, 36.0, 35.0, 50.0, 48.0, 58.0, 70.0, 67.0, 66.0, 59.0, 60.0, 58.0, 53.0, 50.0, 37.0, 37.0, 19.0, 24.0, 15.0, 6.0, 16.0, 9.0, 11.0, 7.0, 9.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.48046875, -7.2862548828125, -7.092041015625, -6.8978271484375, -6.70361328125, -6.5093994140625, -6.315185546875, -6.1209716796875, -5.9267578125, -5.7325439453125, -5.538330078125, -5.3441162109375, -5.14990234375, -4.9556884765625, -4.761474609375, -4.5672607421875, -4.373046875, -4.1788330078125, -3.984619140625, -3.7904052734375, -3.59619140625, -3.4019775390625, -3.207763671875, -3.0135498046875, -2.8193359375, -2.6251220703125, -2.430908203125, -2.2366943359375, -2.04248046875, -1.8482666015625, -1.654052734375, -1.4598388671875, -1.265625, -1.0714111328125, -0.877197265625, -0.6829833984375, -0.48876953125, -0.2945556640625, -0.100341796875, 0.0938720703125, 0.2880859375, 0.4822998046875, 0.676513671875, 0.8707275390625, 1.06494140625, 1.2591552734375, 1.453369140625, 1.6475830078125, 1.841796875, 2.0360107421875, 2.230224609375, 2.4244384765625, 2.61865234375, 2.8128662109375, 3.007080078125, 3.2012939453125, 3.3955078125, 3.5897216796875, 3.783935546875, 3.9781494140625, 4.17236328125, 4.3665771484375, 4.560791015625, 4.7550048828125, 4.94921875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 12.0, 19.0, 45.0, 81.0, 142.0, 280.0, 557.0, 1094.0, 2286.0, 5497.0, 16683.0, 74912.0, 3689133.0, 345719.0, 39747.0, 10715.0, 3940.0, 1744.0, 802.0, 421.0, 205.0, 95.0, 61.0, 38.0, 26.0, 12.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6328125, -14.157958984375, -13.68310546875, -13.208251953125, -12.7333984375, -12.258544921875, -11.78369140625, -11.308837890625, -10.833984375, -10.359130859375, -9.88427734375, -9.409423828125, -8.9345703125, -8.459716796875, -7.98486328125, -7.510009765625, -7.03515625, -6.560302734375, -6.08544921875, -5.610595703125, -5.1357421875, -4.660888671875, -4.18603515625, -3.711181640625, -3.236328125, -2.761474609375, -2.28662109375, -1.811767578125, -1.3369140625, -0.862060546875, -0.38720703125, 0.087646484375, 0.5625, 1.037353515625, 1.51220703125, 1.987060546875, 2.4619140625, 2.936767578125, 3.41162109375, 3.886474609375, 4.361328125, 4.836181640625, 5.31103515625, 5.785888671875, 6.2607421875, 6.735595703125, 7.21044921875, 7.685302734375, 8.16015625, 8.635009765625, 9.10986328125, 9.584716796875, 10.0595703125, 10.534423828125, 11.00927734375, 11.484130859375, 11.958984375, 12.433837890625, 12.90869140625, 13.383544921875, 13.8583984375, 14.333251953125, 14.80810546875, 15.282958984375, 15.7578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 5.0, 7.0, 2.0, 6.0, 8.0, 7.0, 22.0, 29.0, 49.0, 69.0, 89.0, 206.0, 2627.0, 542.0, 149.0, 84.0, 55.0, 33.0, 27.0, 13.0, 10.0, 11.0, 3.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.59765625, -3.502655029296875, -3.40765380859375, -3.312652587890625, -3.2176513671875, -3.122650146484375, -3.02764892578125, -2.932647705078125, -2.837646484375, -2.742645263671875, -2.64764404296875, -2.552642822265625, -2.4576416015625, -2.362640380859375, -2.26763916015625, -2.172637939453125, -2.07763671875, -1.982635498046875, -1.88763427734375, -1.792633056640625, -1.6976318359375, -1.602630615234375, -1.50762939453125, -1.412628173828125, -1.317626953125, -1.222625732421875, -1.12762451171875, -1.032623291015625, -0.9376220703125, -0.842620849609375, -0.74761962890625, -0.652618408203125, -0.5576171875, -0.462615966796875, -0.36761474609375, -0.272613525390625, -0.1776123046875, -0.082611083984375, 0.01239013671875, 0.107391357421875, 0.202392578125, 0.297393798828125, 0.39239501953125, 0.487396240234375, 0.5823974609375, 0.677398681640625, 0.77239990234375, 0.867401123046875, 0.96240234375, 1.057403564453125, 1.15240478515625, 1.247406005859375, 1.3424072265625, 1.437408447265625, 1.53240966796875, 1.627410888671875, 1.722412109375, 1.817413330078125, 1.91241455078125, 2.007415771484375, 2.1024169921875, 2.197418212890625, 2.29241943359375, 2.387420654296875, 2.482421875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 6.0, 9.0, 23.0, 39.0, 66.0, 86.0, 132.0, 139.0, 142.0, 120.0, 81.0, 65.0, 38.0, 20.0, 9.0, 7.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.356361389160156, -21.773834228515625, -21.191307067871094, -20.608779907226562, -20.02625274658203, -19.4437255859375, -18.86119842529297, -18.278671264648438, -17.696144104003906, -17.113616943359375, -16.531089782714844, -15.948562622070312, -15.366035461425781, -14.78350830078125, -14.200980186462402, -13.618453025817871, -13.035924911499023, -12.453397750854492, -11.870870590209961, -11.28834342956543, -10.705816268920898, -10.123289108276367, -9.54076099395752, -8.958233833312988, -8.375706672668457, -7.793179512023926, -7.2106523513793945, -6.628124713897705, -6.045597553253174, -5.463070392608643, -4.880542755126953, -4.298015594482422, -3.715486526489258, -3.1329593658447266, -2.550431966781616, -1.9679046869277954, -1.3853774070739746, -0.8028502464294434, -0.220322847366333, 0.36220455169677734, 0.9447317123413086, 1.5272589921951294, 2.10978627204895, 2.6923136711120605, 3.274840831756592, 3.857367992401123, 4.4398956298828125, 5.022422790527344, 5.604949951171875, 6.187477111816406, 6.7700042724609375, 7.352531909942627, 7.935059070587158, 8.517585754394531, 9.100113868713379, 9.68264102935791, 10.265168190002441, 10.847695350646973, 11.430222511291504, 12.012749671936035, 12.595277786254883, 13.177804946899414, 13.760332107543945, 14.342859268188477, 14.925386428833008]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 7.0, 2.0, 6.0, 5.0, 4.0, 7.0, 8.0, 6.0, 10.0, 19.0, 13.0, 16.0, 23.0, 21.0, 37.0, 28.0, 34.0, 32.0, 31.0, 38.0, 38.0, 42.0, 43.0, 40.0, 35.0, 37.0, 38.0, 38.0, 42.0, 40.0, 34.0, 28.0, 24.0, 35.0, 34.0, 12.0, 19.0, 18.0, 17.0, 9.0, 9.0, 6.0, 5.0, 8.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-7.941380500793457, -7.705964088439941, -7.470547676086426, -7.23513126373291, -6.9997148513793945, -6.764298439025879, -6.528882026672363, -6.293465614318848, -6.058049201965332, -5.822632789611816, -5.587216377258301, -5.351799964904785, -5.1163835525512695, -4.880967140197754, -4.645550727844238, -4.410134315490723, -4.174718379974365, -3.9393019676208496, -3.703885555267334, -3.4684691429138184, -3.2330527305603027, -2.997636318206787, -2.7622201442718506, -2.526803731918335, -2.2913873195648193, -2.0559709072113037, -1.820554494857788, -1.585138201713562, -1.3497217893600464, -1.1143053770065308, -0.8788890838623047, -0.6434726715087891, -0.40805578231811523, -0.172639399766922, 0.06277698278427124, 0.2981933355331421, 0.5336097478866577, 0.7690261602401733, 1.0044424533843994, 1.239858865737915, 1.4752752780914307, 1.7106916904449463, 1.946108102798462, 2.1815242767333984, 2.416940689086914, 2.6523571014404297, 2.8877735137939453, 3.123189926147461, 3.3586063385009766, 3.594022750854492, 3.829439163208008, 4.064855575561523, 4.300271987915039, 4.535688400268555, 4.77110481262207, 5.006521224975586, 5.241937637329102, 5.477354049682617, 5.712770462036133, 5.948186874389648, 6.183603286743164, 6.41901969909668, 6.654436111450195, 6.889852523803711, 7.125268459320068]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 4.0, 6.0, 10.0, 12.0, 26.0, 18.0, 37.0, 52.0, 99.0, 149.0, 340.0, 639.0, 1326.0, 3334.0, 8982.0, 26626.0, 81042.0, 224408.0, 375750.0, 211532.0, 75483.0, 24591.0, 8310.0, 3164.0, 1239.0, 610.0, 297.0, 185.0, 98.0, 65.0, 34.0, 32.0, 19.0, 12.0, 12.0, 4.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7890625, -7.470703125, -7.15234375, -6.833984375, -6.515625, -6.197265625, -5.87890625, -5.560546875, -5.2421875, -4.923828125, -4.60546875, -4.287109375, -3.96875, -3.650390625, -3.33203125, -3.013671875, -2.6953125, -2.376953125, -2.05859375, -1.740234375, -1.421875, -1.103515625, -0.78515625, -0.466796875, -0.1484375, 0.169921875, 0.48828125, 0.806640625, 1.125, 1.443359375, 1.76171875, 2.080078125, 2.3984375, 2.716796875, 3.03515625, 3.353515625, 3.671875, 3.990234375, 4.30859375, 4.626953125, 4.9453125, 5.263671875, 5.58203125, 5.900390625, 6.21875, 6.537109375, 6.85546875, 7.173828125, 7.4921875, 7.810546875, 8.12890625, 8.447265625, 8.765625, 9.083984375, 9.40234375, 9.720703125, 10.0390625, 10.357421875, 10.67578125, 10.994140625, 11.3125, 11.630859375, 11.94921875, 12.267578125, 12.5859375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 6.0, 12.0, 7.0, 18.0, 18.0, 21.0, 37.0, 37.0, 33.0, 45.0, 41.0, 55.0, 62.0, 70.0, 67.0, 70.0, 51.0, 47.0, 59.0, 44.0, 34.0, 33.0, 22.0, 19.0, 26.0, 19.0, 7.0, 7.0, 10.0, 5.0, 10.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-8.0, -7.80706787109375, -7.6141357421875, -7.42120361328125, -7.228271484375, -7.03533935546875, -6.8424072265625, -6.64947509765625, -6.45654296875, -6.26361083984375, -6.0706787109375, -5.87774658203125, -5.684814453125, -5.49188232421875, -5.2989501953125, -5.10601806640625, -4.9130859375, -4.72015380859375, -4.5272216796875, -4.33428955078125, -4.141357421875, -3.94842529296875, -3.7554931640625, -3.56256103515625, -3.36962890625, -3.17669677734375, -2.9837646484375, -2.79083251953125, -2.597900390625, -2.40496826171875, -2.2120361328125, -2.01910400390625, -1.826171875, -1.63323974609375, -1.4403076171875, -1.24737548828125, -1.054443359375, -0.86151123046875, -0.6685791015625, -0.47564697265625, -0.28271484375, -0.08978271484375, 0.1031494140625, 0.29608154296875, 0.489013671875, 0.68194580078125, 0.8748779296875, 1.06781005859375, 1.2607421875, 1.45367431640625, 1.6466064453125, 1.83953857421875, 2.032470703125, 2.22540283203125, 2.4183349609375, 2.61126708984375, 2.80419921875, 2.99713134765625, 3.1900634765625, 3.38299560546875, 3.575927734375, 3.76885986328125, 3.9617919921875, 4.15472412109375, 4.34765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 3.0, 4.0, 19.0, 13.0, 20.0, 30.0, 61.0, 73.0, 147.0, 262.0, 498.0, 882.0, 1928.0, 7959.0, 165320.0, 830248.0, 34227.0, 3961.0, 1378.0, 631.0, 382.0, 212.0, 94.0, 67.0, 41.0, 26.0, 10.0, 13.0, 12.0, 3.0, 7.0, 7.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-33.75, -32.70458984375, -31.6591796875, -30.61376953125, -29.568359375, -28.52294921875, -27.4775390625, -26.43212890625, -25.38671875, -24.34130859375, -23.2958984375, -22.25048828125, -21.205078125, -20.15966796875, -19.1142578125, -18.06884765625, -17.0234375, -15.97802734375, -14.9326171875, -13.88720703125, -12.841796875, -11.79638671875, -10.7509765625, -9.70556640625, -8.66015625, -7.61474609375, -6.5693359375, -5.52392578125, -4.478515625, -3.43310546875, -2.3876953125, -1.34228515625, -0.296875, 0.74853515625, 1.7939453125, 2.83935546875, 3.884765625, 4.93017578125, 5.9755859375, 7.02099609375, 8.06640625, 9.11181640625, 10.1572265625, 11.20263671875, 12.248046875, 13.29345703125, 14.3388671875, 15.38427734375, 16.4296875, 17.47509765625, 18.5205078125, 19.56591796875, 20.611328125, 21.65673828125, 22.7021484375, 23.74755859375, 24.79296875, 25.83837890625, 26.8837890625, 27.92919921875, 28.974609375, 30.02001953125, 31.0654296875, 32.11083984375, 33.15625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 8.0, 4.0, 7.0, 15.0, 18.0, 28.0, 30.0, 50.0, 65.0, 61.0, 85.0, 100.0, 109.0, 103.0, 77.0, 68.0, 51.0, 31.0, 28.0, 27.0, 11.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.34375, -58.6865234375, -57.029296875, -55.3720703125, -53.71484375, -52.0576171875, -50.400390625, -48.7431640625, -47.0859375, -45.4287109375, -43.771484375, -42.1142578125, -40.45703125, -38.7998046875, -37.142578125, -35.4853515625, -33.828125, -32.1708984375, -30.513671875, -28.8564453125, -27.19921875, -25.5419921875, -23.884765625, -22.2275390625, -20.5703125, -18.9130859375, -17.255859375, -15.5986328125, -13.94140625, -12.2841796875, -10.626953125, -8.9697265625, -7.3125, -5.6552734375, -3.998046875, -2.3408203125, -0.68359375, 0.9736328125, 2.630859375, 4.2880859375, 5.9453125, 7.6025390625, 9.259765625, 10.9169921875, 12.57421875, 14.2314453125, 15.888671875, 17.5458984375, 19.203125, 20.8603515625, 22.517578125, 24.1748046875, 25.83203125, 27.4892578125, 29.146484375, 30.8037109375, 32.4609375, 34.1181640625, 35.775390625, 37.4326171875, 39.08984375, 40.7470703125, 42.404296875, 44.0615234375, 45.71875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 11.0, 6.0, 7.0, 11.0, 13.0, 28.0, 35.0, 45.0, 59.0, 100.0, 177.0, 321.0, 637.0, 1883.0, 15324.0, 698892.0, 319424.0, 8868.0, 1491.0, 516.0, 247.0, 157.0, 95.0, 55.0, 38.0, 29.0, 19.0, 14.0, 9.0, 5.0, 7.0, 3.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-19.84375, -19.275146484375, -18.70654296875, -18.137939453125, -17.5693359375, -17.000732421875, -16.43212890625, -15.863525390625, -15.294921875, -14.726318359375, -14.15771484375, -13.589111328125, -13.0205078125, -12.451904296875, -11.88330078125, -11.314697265625, -10.74609375, -10.177490234375, -9.60888671875, -9.040283203125, -8.4716796875, -7.903076171875, -7.33447265625, -6.765869140625, -6.197265625, -5.628662109375, -5.06005859375, -4.491455078125, -3.9228515625, -3.354248046875, -2.78564453125, -2.217041015625, -1.6484375, -1.079833984375, -0.51123046875, 0.057373046875, 0.6259765625, 1.194580078125, 1.76318359375, 2.331787109375, 2.900390625, 3.468994140625, 4.03759765625, 4.606201171875, 5.1748046875, 5.743408203125, 6.31201171875, 6.880615234375, 7.44921875, 8.017822265625, 8.58642578125, 9.155029296875, 9.7236328125, 10.292236328125, 10.86083984375, 11.429443359375, 11.998046875, 12.566650390625, 13.13525390625, 13.703857421875, 14.2724609375, 14.841064453125, 15.40966796875, 15.978271484375, 16.546875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 8.0, 5.0, 5.0, 11.0, 16.0, 11.0, 22.0, 31.0, 31.0, 41.0, 49.0, 63.0, 82.0, 115.0, 100.0, 89.0, 62.0, 43.0, 45.0, 33.0, 33.0, 22.0, 15.0, 13.0, 13.0, 11.0, 8.0, 10.0, 4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011892318725585938, -0.0011435449123382568, -0.00109785795211792, -0.001052170991897583, -0.001006484031677246, -0.0009607970714569092, -0.0009151101112365723, -0.0008694231510162354, -0.0008237361907958984, -0.0007780492305755615, -0.0007323622703552246, -0.0006866753101348877, -0.0006409883499145508, -0.0005953013896942139, -0.000549614429473877, -0.00050392746925354, -0.0004582405090332031, -0.0004125535488128662, -0.0003668665885925293, -0.0003211796283721924, -0.00027549266815185547, -0.00022980570793151855, -0.00018411874771118164, -0.00013843178749084473, -9.274482727050781e-05, -4.70578670501709e-05, -1.3709068298339844e-06, 4.431605339050293e-05, 9.000301361083984e-05, 0.00013568997383117676, 0.00018137693405151367, 0.00022706389427185059, 0.0002727508544921875, 0.0003184378147125244, 0.00036412477493286133, 0.00040981173515319824, 0.00045549869537353516, 0.0005011856555938721, 0.000546872615814209, 0.0005925595760345459, 0.0006382465362548828, 0.0006839334964752197, 0.0007296204566955566, 0.0007753074169158936, 0.0008209943771362305, 0.0008666813373565674, 0.0009123682975769043, 0.0009580552577972412, 0.0010037422180175781, 0.001049429178237915, 0.001095116138458252, 0.0011408030986785889, 0.0011864900588989258, 0.0012321770191192627, 0.0012778639793395996, 0.0013235509395599365, 0.0013692378997802734, 0.0014149248600006104, 0.0014606118202209473, 0.0015062987804412842, 0.001551985740661621, 0.001597672700881958, 0.001643359661102295, 0.0016890466213226318, 0.0017347335815429688]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 14.0, 13.0, 15.0, 23.0, 16.0, 43.0, 68.0, 89.0, 154.0, 224.0, 461.0, 876.0, 2029.0, 6517.0, 38160.0, 515571.0, 440702.0, 33778.0, 5899.0, 1892.0, 862.0, 411.0, 259.0, 137.0, 100.0, 56.0, 38.0, 26.0, 32.0, 17.0, 8.0, 9.0, 7.0, 7.0, 8.0, 3.0, 0.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0], "bins": [-13.359375, -12.998046875, -12.63671875, -12.275390625, -11.9140625, -11.552734375, -11.19140625, -10.830078125, -10.46875, -10.107421875, -9.74609375, -9.384765625, -9.0234375, -8.662109375, -8.30078125, -7.939453125, -7.578125, -7.216796875, -6.85546875, -6.494140625, -6.1328125, -5.771484375, -5.41015625, -5.048828125, -4.6875, -4.326171875, -3.96484375, -3.603515625, -3.2421875, -2.880859375, -2.51953125, -2.158203125, -1.796875, -1.435546875, -1.07421875, -0.712890625, -0.3515625, 0.009765625, 0.37109375, 0.732421875, 1.09375, 1.455078125, 1.81640625, 2.177734375, 2.5390625, 2.900390625, 3.26171875, 3.623046875, 3.984375, 4.345703125, 4.70703125, 5.068359375, 5.4296875, 5.791015625, 6.15234375, 6.513671875, 6.875, 7.236328125, 7.59765625, 7.958984375, 8.3203125, 8.681640625, 9.04296875, 9.404296875, 9.765625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 6.0, 1.0, 7.0, 18.0, 17.0, 16.0, 21.0, 36.0, 63.0, 60.0, 100.0, 110.0, 103.0, 105.0, 92.0, 62.0, 42.0, 31.0, 26.0, 22.0, 10.0, 11.0, 10.0, 4.0, 9.0, 7.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7265625, -11.3856201171875, -11.044677734375, -10.7037353515625, -10.36279296875, -10.0218505859375, -9.680908203125, -9.3399658203125, -8.9990234375, -8.6580810546875, -8.317138671875, -7.9761962890625, -7.63525390625, -7.2943115234375, -6.953369140625, -6.6124267578125, -6.271484375, -5.9305419921875, -5.589599609375, -5.2486572265625, -4.90771484375, -4.5667724609375, -4.225830078125, -3.8848876953125, -3.5439453125, -3.2030029296875, -2.862060546875, -2.5211181640625, -2.18017578125, -1.8392333984375, -1.498291015625, -1.1573486328125, -0.81640625, -0.4754638671875, -0.134521484375, 0.2064208984375, 0.54736328125, 0.8883056640625, 1.229248046875, 1.5701904296875, 1.9111328125, 2.2520751953125, 2.593017578125, 2.9339599609375, 3.27490234375, 3.6158447265625, 3.956787109375, 4.2977294921875, 4.638671875, 4.9796142578125, 5.320556640625, 5.6614990234375, 6.00244140625, 6.3433837890625, 6.684326171875, 7.0252685546875, 7.3662109375, 7.7071533203125, 8.048095703125, 8.3890380859375, 8.72998046875, 9.0709228515625, 9.411865234375, 9.7528076171875, 10.09375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 53.0, 310.0, 431.0, 151.0, 27.0, 11.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-609.361083984375, -596.2040405273438, -583.0469970703125, -569.889892578125, -556.7328491210938, -543.5758056640625, -530.4187622070312, -517.2616577148438, -504.1046142578125, -490.94757080078125, -477.7904968261719, -464.6334533691406, -451.47637939453125, -438.3193359375, -425.1622619628906, -412.0052185058594, -398.84814453125, -385.69110107421875, -372.5340270996094, -359.3769836425781, -346.21990966796875, -333.0628662109375, -319.9057922363281, -306.7487487792969, -293.5917053222656, -280.4346618652344, -267.277587890625, -254.1205291748047, -240.96347045898438, -227.80642700195312, -214.64935302734375, -201.4923095703125, -188.33523559570312, -175.1781768798828, -162.0211181640625, -148.8640594482422, -135.70700073242188, -122.5499496459961, -109.39289093017578, -96.23583221435547, -83.07877349853516, -69.92171478271484, -56.76465606689453, -43.607601165771484, -30.450542449951172, -17.293487548828125, -4.1364288330078125, 9.0206298828125, 22.177688598632812, 35.334747314453125, 48.49180603027344, 61.648860931396484, 74.80592346191406, 87.96297454833984, 101.12003326416016, 114.27709197998047, 127.43415069580078, 140.59120178222656, 153.74826049804688, 166.9053192138672, 180.0623779296875, 193.2194366455078, 206.37649536132812, 219.53355407714844, 232.69061279296875]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 11.0, 14.0, 17.0, 14.0, 22.0, 23.0, 30.0, 22.0, 29.0, 45.0, 46.0, 43.0, 46.0, 53.0, 49.0, 43.0, 44.0, 50.0, 46.0, 51.0, 50.0, 43.0, 35.0, 23.0, 19.0, 36.0, 18.0, 13.0, 14.0, 9.0, 10.0, 2.0, 6.0, 7.0, 1.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.31135559082031, -90.91300201416016, -87.51464080810547, -84.11628723144531, -80.71792602539062, -77.31957244873047, -73.92121887207031, -70.52285766601562, -67.12449645996094, -63.726139068603516, -60.327781677246094, -56.92942810058594, -53.53106689453125, -50.132713317871094, -46.73435592651367, -43.33599853515625, -39.937644958496094, -36.53928756713867, -33.14093017578125, -29.74257469177246, -26.34421730041504, -22.945859909057617, -19.547504425048828, -16.149147033691406, -12.750789642333984, -9.352432250976562, -5.954075813293457, -2.5557193756103516, 0.8426380157470703, 4.240995407104492, 7.639350891113281, 11.037708282470703, 14.436058044433594, 17.834415435791016, 21.232772827148438, 24.631128311157227, 28.02948570251465, 31.42784309387207, 34.82619857788086, 38.22455596923828, 41.6229133605957, 45.021270751953125, 48.41962814331055, 51.81798553466797, 55.216339111328125, 58.61470031738281, 62.01305389404297, 65.41140747070312, 68.80976867675781, 72.20812225341797, 75.60648345947266, 79.00483703613281, 82.4031982421875, 85.80155181884766, 89.19990539550781, 92.5982666015625, 95.99662780761719, 99.39498138427734, 102.79334259033203, 106.19169616699219, 109.59005737304688, 112.98841094970703, 116.38676452636719, 119.78512573242188, 123.18347930908203]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 7.0, 17.0, 28.0, 51.0, 57.0, 100.0, 149.0, 292.0, 527.0, 1095.0, 2422.0, 5955.0, 18319.0, 81078.0, 3380544.0, 620771.0, 58975.0, 14682.0, 4998.0, 2109.0, 967.0, 480.0, 284.0, 154.0, 89.0, 58.0, 27.0, 21.0, 8.0, 6.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5625, -13.1624755859375, -12.762451171875, -12.3624267578125, -11.96240234375, -11.5623779296875, -11.162353515625, -10.7623291015625, -10.3623046875, -9.9622802734375, -9.562255859375, -9.1622314453125, -8.76220703125, -8.3621826171875, -7.962158203125, -7.5621337890625, -7.162109375, -6.7620849609375, -6.362060546875, -5.9620361328125, -5.56201171875, -5.1619873046875, -4.761962890625, -4.3619384765625, -3.9619140625, -3.5618896484375, -3.161865234375, -2.7618408203125, -2.36181640625, -1.9617919921875, -1.561767578125, -1.1617431640625, -0.76171875, -0.3616943359375, 0.038330078125, 0.4383544921875, 0.83837890625, 1.2384033203125, 1.638427734375, 2.0384521484375, 2.4384765625, 2.8385009765625, 3.238525390625, 3.6385498046875, 4.03857421875, 4.4385986328125, 4.838623046875, 5.2386474609375, 5.638671875, 6.0386962890625, 6.438720703125, 6.8387451171875, 7.23876953125, 7.6387939453125, 8.038818359375, 8.4388427734375, 8.8388671875, 9.2388916015625, 9.638916015625, 10.0389404296875, 10.43896484375, 10.8389892578125, 11.239013671875, 11.6390380859375, 12.0390625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 8.0, 3.0, 7.0, 10.0, 9.0, 18.0, 29.0, 29.0, 33.0, 39.0, 38.0, 47.0, 61.0, 64.0, 71.0, 73.0, 47.0, 70.0, 49.0, 59.0, 42.0, 36.0, 37.0, 27.0, 20.0, 16.0, 16.0, 11.0, 3.0, 9.0, 6.0, 5.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6640625, -6.46575927734375, -6.2674560546875, -6.06915283203125, -5.870849609375, -5.67254638671875, -5.4742431640625, -5.27593994140625, -5.07763671875, -4.87933349609375, -4.6810302734375, -4.48272705078125, -4.284423828125, -4.08612060546875, -3.8878173828125, -3.68951416015625, -3.4912109375, -3.29290771484375, -3.0946044921875, -2.89630126953125, -2.697998046875, -2.49969482421875, -2.3013916015625, -2.10308837890625, -1.90478515625, -1.70648193359375, -1.5081787109375, -1.30987548828125, -1.111572265625, -0.91326904296875, -0.7149658203125, -0.51666259765625, -0.318359375, -0.12005615234375, 0.0782470703125, 0.27655029296875, 0.474853515625, 0.67315673828125, 0.8714599609375, 1.06976318359375, 1.26806640625, 1.46636962890625, 1.6646728515625, 1.86297607421875, 2.061279296875, 2.25958251953125, 2.4578857421875, 2.65618896484375, 2.8544921875, 3.05279541015625, 3.2510986328125, 3.44940185546875, 3.647705078125, 3.84600830078125, 4.0443115234375, 4.24261474609375, 4.44091796875, 4.63922119140625, 4.8375244140625, 5.03582763671875, 5.234130859375, 5.43243408203125, 5.6307373046875, 5.82904052734375, 6.02734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 9.0, 9.0, 7.0, 17.0, 34.0, 32.0, 47.0, 66.0, 81.0, 119.0, 197.0, 330.0, 570.0, 1018.0, 2047.0, 4877.0, 13711.0, 49922.0, 330536.0, 3541395.0, 194328.0, 36403.0, 10718.0, 3934.0, 1724.0, 833.0, 485.0, 294.0, 161.0, 114.0, 79.0, 54.0, 35.0, 28.0, 20.0, 12.0, 11.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.7578125, -11.4158935546875, -11.073974609375, -10.7320556640625, -10.39013671875, -10.0482177734375, -9.706298828125, -9.3643798828125, -9.0224609375, -8.6805419921875, -8.338623046875, -7.9967041015625, -7.65478515625, -7.3128662109375, -6.970947265625, -6.6290283203125, -6.287109375, -5.9451904296875, -5.603271484375, -5.2613525390625, -4.91943359375, -4.5775146484375, -4.235595703125, -3.8936767578125, -3.5517578125, -3.2098388671875, -2.867919921875, -2.5260009765625, -2.18408203125, -1.8421630859375, -1.500244140625, -1.1583251953125, -0.81640625, -0.4744873046875, -0.132568359375, 0.2093505859375, 0.55126953125, 0.8931884765625, 1.235107421875, 1.5770263671875, 1.9189453125, 2.2608642578125, 2.602783203125, 2.9447021484375, 3.28662109375, 3.6285400390625, 3.970458984375, 4.3123779296875, 4.654296875, 4.9962158203125, 5.338134765625, 5.6800537109375, 6.02197265625, 6.3638916015625, 6.705810546875, 7.0477294921875, 7.3896484375, 7.7315673828125, 8.073486328125, 8.4154052734375, 8.75732421875, 9.0992431640625, 9.441162109375, 9.7830810546875, 10.125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 4.0, 4.0, 2.0, 6.0, 13.0, 15.0, 12.0, 20.0, 37.0, 64.0, 84.0, 161.0, 374.0, 1892.0, 739.0, 282.0, 132.0, 79.0, 45.0, 42.0, 20.0, 12.0, 9.0, 7.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0234375, -4.86529541015625, -4.7071533203125, -4.54901123046875, -4.390869140625, -4.23272705078125, -4.0745849609375, -3.91644287109375, -3.75830078125, -3.60015869140625, -3.4420166015625, -3.28387451171875, -3.125732421875, -2.96759033203125, -2.8094482421875, -2.65130615234375, -2.4931640625, -2.33502197265625, -2.1768798828125, -2.01873779296875, -1.860595703125, -1.70245361328125, -1.5443115234375, -1.38616943359375, -1.22802734375, -1.06988525390625, -0.9117431640625, -0.75360107421875, -0.595458984375, -0.43731689453125, -0.2791748046875, -0.12103271484375, 0.037109375, 0.19525146484375, 0.3533935546875, 0.51153564453125, 0.669677734375, 0.82781982421875, 0.9859619140625, 1.14410400390625, 1.30224609375, 1.46038818359375, 1.6185302734375, 1.77667236328125, 1.934814453125, 2.09295654296875, 2.2510986328125, 2.40924072265625, 2.5673828125, 2.72552490234375, 2.8836669921875, 3.04180908203125, 3.199951171875, 3.35809326171875, 3.5162353515625, 3.67437744140625, 3.83251953125, 3.99066162109375, 4.1488037109375, 4.30694580078125, 4.465087890625, 4.62322998046875, 4.7813720703125, 4.93951416015625, 5.09765625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 7.0, 8.0, 19.0, 32.0, 56.0, 93.0, 143.0, 171.0, 161.0, 121.0, 79.0, 45.0, 28.0, 10.0, 11.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.189285278320312, -29.023456573486328, -27.85762596130371, -26.691795349121094, -25.52596664428711, -24.360137939453125, -23.194307327270508, -22.02847671508789, -20.862648010253906, -19.696819305419922, -18.530988693237305, -17.365158081054688, -16.199329376220703, -15.033499717712402, -13.867670059204102, -12.7018404006958, -11.5360107421875, -10.3701810836792, -9.204351425170898, -8.038521766662598, -6.872692108154297, -5.706862449645996, -4.541032791137695, -3.3752031326293945, -2.2093734741210938, -1.043543815612793, 0.12228584289550781, 1.2881155014038086, 2.4539451599121094, 3.61977481842041, 4.785604476928711, 5.951434135437012, 7.1172637939453125, 8.283093452453613, 9.448923110961914, 10.614752769470215, 11.780582427978516, 12.946412086486816, 14.112241744995117, 15.278071403503418, 16.44390106201172, 17.609729766845703, 18.77556037902832, 19.941390991210938, 21.107219696044922, 22.273048400878906, 23.438879013061523, 24.60470962524414, 25.770538330078125, 26.93636703491211, 28.102197647094727, 29.268028259277344, 30.433856964111328, 31.599685668945312, 32.76551818847656, 33.93134689331055, 35.09717559814453, 36.263004302978516, 37.4288330078125, 38.59466552734375, 39.760494232177734, 40.92632293701172, 42.09215545654297, 43.25798416137695, 44.42381286621094]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 7.0, 8.0, 3.0, 9.0, 9.0, 10.0, 12.0, 15.0, 17.0, 16.0, 21.0, 29.0, 23.0, 23.0, 38.0, 41.0, 42.0, 47.0, 38.0, 51.0, 49.0, 48.0, 41.0, 48.0, 38.0, 36.0, 44.0, 28.0, 37.0, 18.0, 27.0, 23.0, 17.0, 12.0, 21.0, 12.0, 11.0, 3.0, 11.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0], "bins": [-15.86805248260498, -15.43425464630127, -15.000456809997559, -14.566658973693848, -14.132862091064453, -13.699064254760742, -13.265266418457031, -12.83146858215332, -12.39767074584961, -11.963872909545898, -11.530075073242188, -11.096277236938477, -10.662479400634766, -10.228681564331055, -9.79488468170166, -9.36108684539795, -8.927289009094238, -8.493491172790527, -8.059693336486816, -7.625895977020264, -7.192098140716553, -6.758300304412842, -6.324502944946289, -5.890705108642578, -5.456907272338867, -5.023109436035156, -4.589311599731445, -4.155514240264893, -3.7217164039611816, -3.2879185676574707, -2.854120969772339, -2.420323371887207, -1.9865245819091797, -1.5527268648147583, -1.118929147720337, -0.6851314306259155, -0.25133371353149414, 0.1824641227722168, 0.6162617206573486, 1.0500593185424805, 1.4838571548461914, 1.9176548719406128, 2.351452589035034, 2.785250186920166, 3.219048023223877, 3.652845859527588, 4.086643218994141, 4.520441055297852, 4.9542388916015625, 5.388036727905273, 5.821834564208984, 6.255631923675537, 6.689429759979248, 7.123227596282959, 7.557024955749512, 7.990822792053223, 8.424620628356934, 8.858418464660645, 9.292216300964355, 9.726014137268066, 10.159811019897461, 10.593608856201172, 11.027406692504883, 11.461204528808594, 11.895002365112305]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 8.0, 13.0, 14.0, 25.0, 39.0, 87.0, 200.0, 411.0, 1093.0, 3343.0, 12296.0, 54078.0, 231076.0, 522627.0, 170588.0, 39300.0, 9207.0, 2650.0, 840.0, 321.0, 159.0, 81.0, 40.0, 24.0, 14.0, 4.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.703125, -18.189208984375, -17.67529296875, -17.161376953125, -16.6474609375, -16.133544921875, -15.61962890625, -15.105712890625, -14.591796875, -14.077880859375, -13.56396484375, -13.050048828125, -12.5361328125, -12.022216796875, -11.50830078125, -10.994384765625, -10.48046875, -9.966552734375, -9.45263671875, -8.938720703125, -8.4248046875, -7.910888671875, -7.39697265625, -6.883056640625, -6.369140625, -5.855224609375, -5.34130859375, -4.827392578125, -4.3134765625, -3.799560546875, -3.28564453125, -2.771728515625, -2.2578125, -1.743896484375, -1.22998046875, -0.716064453125, -0.2021484375, 0.311767578125, 0.82568359375, 1.339599609375, 1.853515625, 2.367431640625, 2.88134765625, 3.395263671875, 3.9091796875, 4.423095703125, 4.93701171875, 5.450927734375, 5.96484375, 6.478759765625, 6.99267578125, 7.506591796875, 8.0205078125, 8.534423828125, 9.04833984375, 9.562255859375, 10.076171875, 10.590087890625, 11.10400390625, 11.617919921875, 12.1318359375, 12.645751953125, 13.15966796875, 13.673583984375, 14.1875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 7.0, 12.0, 21.0, 23.0, 25.0, 38.0, 34.0, 37.0, 46.0, 50.0, 58.0, 67.0, 66.0, 66.0, 57.0, 66.0, 54.0, 43.0, 50.0, 27.0, 36.0, 22.0, 20.0, 16.0, 15.0, 6.0, 7.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.56463623046875, -6.3597412109375, -6.15484619140625, -5.949951171875, -5.74505615234375, -5.5401611328125, -5.33526611328125, -5.13037109375, -4.92547607421875, -4.7205810546875, -4.51568603515625, -4.310791015625, -4.10589599609375, -3.9010009765625, -3.69610595703125, -3.4912109375, -3.28631591796875, -3.0814208984375, -2.87652587890625, -2.671630859375, -2.46673583984375, -2.2618408203125, -2.05694580078125, -1.85205078125, -1.64715576171875, -1.4422607421875, -1.23736572265625, -1.032470703125, -0.82757568359375, -0.6226806640625, -0.41778564453125, -0.212890625, -0.00799560546875, 0.1968994140625, 0.40179443359375, 0.606689453125, 0.81158447265625, 1.0164794921875, 1.22137451171875, 1.42626953125, 1.63116455078125, 1.8360595703125, 2.04095458984375, 2.245849609375, 2.45074462890625, 2.6556396484375, 2.86053466796875, 3.0654296875, 3.27032470703125, 3.4752197265625, 3.68011474609375, 3.885009765625, 4.08990478515625, 4.2947998046875, 4.49969482421875, 4.70458984375, 4.90948486328125, 5.1143798828125, 5.31927490234375, 5.524169921875, 5.72906494140625, 5.9339599609375, 6.13885498046875, 6.34375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 1.0, 7.0, 8.0, 9.0, 12.0, 14.0, 24.0, 33.0, 34.0, 47.0, 75.0, 99.0, 180.0, 338.0, 586.0, 1309.0, 3581.0, 17951.0, 396338.0, 596699.0, 23920.0, 4152.0, 1483.0, 676.0, 380.0, 205.0, 115.0, 76.0, 51.0, 47.0, 20.0, 20.0, 19.0, 13.0, 13.0, 7.0, 7.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.53125, -34.517822265625, -33.50439453125, -32.490966796875, -31.4775390625, -30.464111328125, -29.45068359375, -28.437255859375, -27.423828125, -26.410400390625, -25.39697265625, -24.383544921875, -23.3701171875, -22.356689453125, -21.34326171875, -20.329833984375, -19.31640625, -18.302978515625, -17.28955078125, -16.276123046875, -15.2626953125, -14.249267578125, -13.23583984375, -12.222412109375, -11.208984375, -10.195556640625, -9.18212890625, -8.168701171875, -7.1552734375, -6.141845703125, -5.12841796875, -4.114990234375, -3.1015625, -2.088134765625, -1.07470703125, -0.061279296875, 0.9521484375, 1.965576171875, 2.97900390625, 3.992431640625, 5.005859375, 6.019287109375, 7.03271484375, 8.046142578125, 9.0595703125, 10.072998046875, 11.08642578125, 12.099853515625, 13.11328125, 14.126708984375, 15.14013671875, 16.153564453125, 17.1669921875, 18.180419921875, 19.19384765625, 20.207275390625, 21.220703125, 22.234130859375, 23.24755859375, 24.260986328125, 25.2744140625, 26.287841796875, 27.30126953125, 28.314697265625, 29.328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 5.0, 6.0, 8.0, 8.0, 19.0, 34.0, 49.0, 65.0, 74.0, 97.0, 103.0, 93.0, 96.0, 88.0, 69.0, 57.0, 37.0, 26.0, 26.0, 10.0, 5.0, 9.0, 3.0, 4.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25, -33.80322265625, -32.3564453125, -30.90966796875, -29.462890625, -28.01611328125, -26.5693359375, -25.12255859375, -23.67578125, -22.22900390625, -20.7822265625, -19.33544921875, -17.888671875, -16.44189453125, -14.9951171875, -13.54833984375, -12.1015625, -10.65478515625, -9.2080078125, -7.76123046875, -6.314453125, -4.86767578125, -3.4208984375, -1.97412109375, -0.52734375, 0.91943359375, 2.3662109375, 3.81298828125, 5.259765625, 6.70654296875, 8.1533203125, 9.60009765625, 11.046875, 12.49365234375, 13.9404296875, 15.38720703125, 16.833984375, 18.28076171875, 19.7275390625, 21.17431640625, 22.62109375, 24.06787109375, 25.5146484375, 26.96142578125, 28.408203125, 29.85498046875, 31.3017578125, 32.74853515625, 34.1953125, 35.64208984375, 37.0888671875, 38.53564453125, 39.982421875, 41.42919921875, 42.8759765625, 44.32275390625, 45.76953125, 47.21630859375, 48.6630859375, 50.10986328125, 51.556640625, 53.00341796875, 54.4501953125, 55.89697265625, 57.34375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 9.0, 7.0, 11.0, 8.0, 14.0, 19.0, 32.0, 42.0, 48.0, 71.0, 95.0, 161.0, 285.0, 479.0, 846.0, 2268.0, 6788.0, 30944.0, 187334.0, 668714.0, 120530.0, 21137.0, 5104.0, 1734.0, 778.0, 394.0, 234.0, 112.0, 101.0, 54.0, 46.0, 37.0, 32.0, 20.0, 18.0, 19.0, 8.0, 5.0, 8.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0625, -7.8280029296875, -7.593505859375, -7.3590087890625, -7.12451171875, -6.8900146484375, -6.655517578125, -6.4210205078125, -6.1865234375, -5.9520263671875, -5.717529296875, -5.4830322265625, -5.24853515625, -5.0140380859375, -4.779541015625, -4.5450439453125, -4.310546875, -4.0760498046875, -3.841552734375, -3.6070556640625, -3.37255859375, -3.1380615234375, -2.903564453125, -2.6690673828125, -2.4345703125, -2.2000732421875, -1.965576171875, -1.7310791015625, -1.49658203125, -1.2620849609375, -1.027587890625, -0.7930908203125, -0.55859375, -0.3240966796875, -0.089599609375, 0.1448974609375, 0.37939453125, 0.6138916015625, 0.848388671875, 1.0828857421875, 1.3173828125, 1.5518798828125, 1.786376953125, 2.0208740234375, 2.25537109375, 2.4898681640625, 2.724365234375, 2.9588623046875, 3.193359375, 3.4278564453125, 3.662353515625, 3.8968505859375, 4.13134765625, 4.3658447265625, 4.600341796875, 4.8348388671875, 5.0693359375, 5.3038330078125, 5.538330078125, 5.7728271484375, 6.00732421875, 6.2418212890625, 6.476318359375, 6.7108154296875, 6.9453125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 3.0, 5.0, 6.0, 12.0, 7.0, 13.0, 7.0, 12.0, 19.0, 19.0, 15.0, 20.0, 26.0, 28.0, 35.0, 33.0, 31.0, 79.0, 111.0, 99.0, 81.0, 42.0, 37.0, 36.0, 39.0, 25.0, 21.0, 32.0, 17.0, 22.0, 11.0, 7.0, 12.0, 7.0, 0.0, 4.0, 5.0, 2.0, 3.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0015230178833007812, -0.0014805346727371216, -0.001438051462173462, -0.0013955682516098022, -0.0013530850410461426, -0.001310601830482483, -0.0012681186199188232, -0.0012256354093551636, -0.001183152198791504, -0.0011406689882278442, -0.0010981857776641846, -0.001055702567100525, -0.0010132193565368652, -0.0009707361459732056, -0.0009282529354095459, -0.0008857697248458862, -0.0008432865142822266, -0.0008008033037185669, -0.0007583200931549072, -0.0007158368825912476, -0.0006733536720275879, -0.0006308704614639282, -0.0005883872509002686, -0.0005459040403366089, -0.0005034208297729492, -0.00046093761920928955, -0.0004184544086456299, -0.0003759711980819702, -0.00033348798751831055, -0.0002910047769546509, -0.0002485215663909912, -0.00020603835582733154, -0.00016355514526367188, -0.00012107193470001221, -7.858872413635254e-05, -3.610551357269287e-05, 6.377696990966797e-06, 4.8860907554626465e-05, 9.134411811828613e-05, 0.0001338273286819458, 0.00017631053924560547, 0.00021879374980926514, 0.0002612769603729248, 0.00030376017093658447, 0.00034624338150024414, 0.0003887265920639038, 0.0004312098026275635, 0.00047369301319122314, 0.0005161762237548828, 0.0005586594343185425, 0.0006011426448822021, 0.0006436258554458618, 0.0006861090660095215, 0.0007285922765731812, 0.0007710754871368408, 0.0008135586977005005, 0.0008560419082641602, 0.0008985251188278198, 0.0009410083293914795, 0.0009834915399551392, 0.0010259747505187988, 0.0010684579610824585, 0.0011109411716461182, 0.0011534243822097778, 0.0011959075927734375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 8.0, 24.0, 13.0, 26.0, 30.0, 44.0, 59.0, 116.0, 207.0, 359.0, 927.0, 2320.0, 8684.0, 65442.0, 807223.0, 143922.0, 13627.0, 3285.0, 1196.0, 465.0, 219.0, 129.0, 79.0, 41.0, 32.0, 26.0, 13.0, 11.0, 7.0, 4.0, 3.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7734375, -12.382080078125, -11.99072265625, -11.599365234375, -11.2080078125, -10.816650390625, -10.42529296875, -10.033935546875, -9.642578125, -9.251220703125, -8.85986328125, -8.468505859375, -8.0771484375, -7.685791015625, -7.29443359375, -6.903076171875, -6.51171875, -6.120361328125, -5.72900390625, -5.337646484375, -4.9462890625, -4.554931640625, -4.16357421875, -3.772216796875, -3.380859375, -2.989501953125, -2.59814453125, -2.206787109375, -1.8154296875, -1.424072265625, -1.03271484375, -0.641357421875, -0.25, 0.141357421875, 0.53271484375, 0.924072265625, 1.3154296875, 1.706787109375, 2.09814453125, 2.489501953125, 2.880859375, 3.272216796875, 3.66357421875, 4.054931640625, 4.4462890625, 4.837646484375, 5.22900390625, 5.620361328125, 6.01171875, 6.403076171875, 6.79443359375, 7.185791015625, 7.5771484375, 7.968505859375, 8.35986328125, 8.751220703125, 9.142578125, 9.533935546875, 9.92529296875, 10.316650390625, 10.7080078125, 11.099365234375, 11.49072265625, 11.882080078125, 12.2734375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 6.0, 14.0, 13.0, 12.0, 32.0, 47.0, 36.0, 62.0, 76.0, 96.0, 116.0, 106.0, 89.0, 68.0, 39.0, 40.0, 32.0, 17.0, 21.0, 12.0, 16.0, 9.0, 4.0, 7.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.5078125, -9.24285888671875, -8.9779052734375, -8.71295166015625, -8.447998046875, -8.18304443359375, -7.9180908203125, -7.65313720703125, -7.38818359375, -7.12322998046875, -6.8582763671875, -6.59332275390625, -6.328369140625, -6.06341552734375, -5.7984619140625, -5.53350830078125, -5.2685546875, -5.00360107421875, -4.7386474609375, -4.47369384765625, -4.208740234375, -3.94378662109375, -3.6788330078125, -3.41387939453125, -3.14892578125, -2.88397216796875, -2.6190185546875, -2.35406494140625, -2.089111328125, -1.82415771484375, -1.5592041015625, -1.29425048828125, -1.029296875, -0.76434326171875, -0.4993896484375, -0.23443603515625, 0.030517578125, 0.29547119140625, 0.5604248046875, 0.82537841796875, 1.09033203125, 1.35528564453125, 1.6202392578125, 1.88519287109375, 2.150146484375, 2.41510009765625, 2.6800537109375, 2.94500732421875, 3.2099609375, 3.47491455078125, 3.7398681640625, 4.00482177734375, 4.269775390625, 4.53472900390625, 4.7996826171875, 5.06463623046875, 5.32958984375, 5.59454345703125, 5.8594970703125, 6.12445068359375, 6.389404296875, 6.65435791015625, 6.9193115234375, 7.18426513671875, 7.44921875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 9.0, 16.0, 84.0, 273.0, 357.0, 201.0, 45.0, 11.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-369.8257751464844, -358.3690185546875, -346.9122314453125, -335.4554748535156, -323.99871826171875, -312.54193115234375, -301.0851745605469, -289.62841796875, -278.171630859375, -266.7148742675781, -255.2581024169922, -243.80133056640625, -232.34457397460938, -220.88780212402344, -209.4310302734375, -197.97427368164062, -186.51751708984375, -175.0607452392578, -163.60398864746094, -152.147216796875, -140.69046020507812, -129.2336883544922, -117.77691650390625, -106.32015228271484, -94.86338806152344, -83.40662384033203, -71.94985961914062, -60.49308776855469, -49.03632354736328, -37.579559326171875, -26.122787475585938, -14.666023254394531, -3.209228515625, 8.247537612915039, 19.704303741455078, 31.16107177734375, 42.617835998535156, 54.07460021972656, 65.5313720703125, 76.9881362915039, 88.44490051269531, 99.90166473388672, 111.35842895507812, 122.81520080566406, 134.27197265625, 145.72872924804688, 157.1855010986328, 168.64227294921875, 180.09902954101562, 191.55580139160156, 203.01255798339844, 214.46932983398438, 225.92608642578125, 237.3828582763672, 248.83963012695312, 260.29638671875, 271.753173828125, 283.2099304199219, 294.6667175292969, 306.12347412109375, 317.5802307128906, 329.0369873046875, 340.4937744140625, 351.9505310058594, 363.40728759765625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 6.0, 8.0, 7.0, 8.0, 9.0, 10.0, 16.0, 18.0, 21.0, 23.0, 25.0, 32.0, 31.0, 32.0, 32.0, 46.0, 44.0, 61.0, 50.0, 45.0, 57.0, 50.0, 52.0, 40.0, 41.0, 31.0, 31.0, 35.0, 23.0, 18.0, 14.0, 18.0, 11.0, 12.0, 8.0, 15.0, 5.0, 7.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.42587280273438, -112.06140899658203, -108.69695281982422, -105.33248901367188, -101.96803283691406, -98.60356903076172, -95.23910522460938, -91.87464904785156, -88.51019287109375, -85.1457290649414, -81.7812728881836, -78.41680908203125, -75.05235290527344, -71.6878890991211, -68.32342529296875, -64.95896911621094, -61.594505310058594, -58.230045318603516, -54.86558532714844, -51.501121520996094, -48.13666534423828, -44.77220153808594, -41.40774154663086, -38.04328155517578, -34.6788215637207, -31.314361572265625, -27.949901580810547, -24.585439682006836, -21.220979690551758, -17.85651969909668, -14.492057800292969, -11.12759780883789, -7.7631378173828125, -4.398677349090576, -1.0342168807983398, 2.3302440643310547, 5.694704055786133, 9.059164047241211, 12.423625946044922, 15.7880859375, 19.152545928955078, 22.517005920410156, 25.881465911865234, 29.245927810668945, 32.610389709472656, 35.97484588623047, 39.33930969238281, 42.70376968383789, 46.06822967529297, 49.43268966674805, 52.797149658203125, 56.16161346435547, 59.52606964111328, 62.890533447265625, 66.25498962402344, 69.61945343017578, 72.98391723632812, 76.34838104248047, 79.71283721923828, 83.07730102539062, 86.44175720214844, 89.80622100830078, 93.17068481445312, 96.53514099121094, 99.89959716796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 11.0, 17.0, 30.0, 49.0, 74.0, 153.0, 315.0, 795.0, 2179.0, 8142.0, 39648.0, 412697.0, 3287175.0, 392949.0, 38223.0, 8068.0, 2293.0, 788.0, 327.0, 149.0, 72.0, 48.0, 30.0, 14.0, 12.0, 10.0, 6.0, 0.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.015625, -9.6375732421875, -9.259521484375, -8.8814697265625, -8.50341796875, -8.1253662109375, -7.747314453125, -7.3692626953125, -6.9912109375, -6.6131591796875, -6.235107421875, -5.8570556640625, -5.47900390625, -5.1009521484375, -4.722900390625, -4.3448486328125, -3.966796875, -3.5887451171875, -3.210693359375, -2.8326416015625, -2.45458984375, -2.0765380859375, -1.698486328125, -1.3204345703125, -0.9423828125, -0.5643310546875, -0.186279296875, 0.1917724609375, 0.56982421875, 0.9478759765625, 1.325927734375, 1.7039794921875, 2.08203125, 2.4600830078125, 2.838134765625, 3.2161865234375, 3.59423828125, 3.9722900390625, 4.350341796875, 4.7283935546875, 5.1064453125, 5.4844970703125, 5.862548828125, 6.2406005859375, 6.61865234375, 6.9967041015625, 7.374755859375, 7.7528076171875, 8.130859375, 8.5089111328125, 8.886962890625, 9.2650146484375, 9.64306640625, 10.0211181640625, 10.399169921875, 10.7772216796875, 11.1552734375, 11.5333251953125, 11.911376953125, 12.2894287109375, 12.66748046875, 13.0455322265625, 13.423583984375, 13.8016357421875, 14.1796875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 11.0, 17.0, 23.0, 21.0, 18.0, 47.0, 50.0, 50.0, 52.0, 71.0, 85.0, 64.0, 66.0, 71.0, 76.0, 57.0, 47.0, 39.0, 39.0, 22.0, 22.0, 10.0, 15.0, 3.0, 7.0, 9.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0625, -6.84063720703125, -6.6187744140625, -6.39691162109375, -6.175048828125, -5.95318603515625, -5.7313232421875, -5.50946044921875, -5.28759765625, -5.06573486328125, -4.8438720703125, -4.62200927734375, -4.400146484375, -4.17828369140625, -3.9564208984375, -3.73455810546875, -3.5126953125, -3.29083251953125, -3.0689697265625, -2.84710693359375, -2.625244140625, -2.40338134765625, -2.1815185546875, -1.95965576171875, -1.73779296875, -1.51593017578125, -1.2940673828125, -1.07220458984375, -0.850341796875, -0.62847900390625, -0.4066162109375, -0.18475341796875, 0.037109375, 0.25897216796875, 0.4808349609375, 0.70269775390625, 0.924560546875, 1.14642333984375, 1.3682861328125, 1.59014892578125, 1.81201171875, 2.03387451171875, 2.2557373046875, 2.47760009765625, 2.699462890625, 2.92132568359375, 3.1431884765625, 3.36505126953125, 3.5869140625, 3.80877685546875, 4.0306396484375, 4.25250244140625, 4.474365234375, 4.69622802734375, 4.9180908203125, 5.13995361328125, 5.36181640625, 5.58367919921875, 5.8055419921875, 6.02740478515625, 6.249267578125, 6.47113037109375, 6.6929931640625, 6.91485595703125, 7.13671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 6.0, 7.0, 13.0, 22.0, 22.0, 30.0, 42.0, 62.0, 153.0, 304.0, 700.0, 1927.0, 6335.0, 27122.0, 196030.0, 2952091.0, 919750.0, 70347.0, 13513.0, 3649.0, 1201.0, 454.0, 219.0, 97.0, 51.0, 33.0, 21.0, 21.0, 12.0, 10.0, 6.0, 4.0, 5.0, 7.0, 0.0, 3.0, 1.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-13.4453125, -13.047119140625, -12.64892578125, -12.250732421875, -11.8525390625, -11.454345703125, -11.05615234375, -10.657958984375, -10.259765625, -9.861572265625, -9.46337890625, -9.065185546875, -8.6669921875, -8.268798828125, -7.87060546875, -7.472412109375, -7.07421875, -6.676025390625, -6.27783203125, -5.879638671875, -5.4814453125, -5.083251953125, -4.68505859375, -4.286865234375, -3.888671875, -3.490478515625, -3.09228515625, -2.694091796875, -2.2958984375, -1.897705078125, -1.49951171875, -1.101318359375, -0.703125, -0.304931640625, 0.09326171875, 0.491455078125, 0.8896484375, 1.287841796875, 1.68603515625, 2.084228515625, 2.482421875, 2.880615234375, 3.27880859375, 3.677001953125, 4.0751953125, 4.473388671875, 4.87158203125, 5.269775390625, 5.66796875, 6.066162109375, 6.46435546875, 6.862548828125, 7.2607421875, 7.658935546875, 8.05712890625, 8.455322265625, 8.853515625, 9.251708984375, 9.64990234375, 10.048095703125, 10.4462890625, 10.844482421875, 11.24267578125, 11.640869140625, 12.0390625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 8.0, 3.0, 9.0, 18.0, 30.0, 31.0, 55.0, 65.0, 107.0, 158.0, 243.0, 398.0, 625.0, 713.0, 552.0, 359.0, 261.0, 142.0, 100.0, 62.0, 35.0, 34.0, 15.0, 10.0, 8.0, 11.0, 10.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-13.3671875, -13.0093994140625, -12.651611328125, -12.2938232421875, -11.93603515625, -11.5782470703125, -11.220458984375, -10.8626708984375, -10.5048828125, -10.1470947265625, -9.789306640625, -9.4315185546875, -9.07373046875, -8.7159423828125, -8.358154296875, -8.0003662109375, -7.642578125, -7.2847900390625, -6.927001953125, -6.5692138671875, -6.21142578125, -5.8536376953125, -5.495849609375, -5.1380615234375, -4.7802734375, -4.4224853515625, -4.064697265625, -3.7069091796875, -3.34912109375, -2.9913330078125, -2.633544921875, -2.2757568359375, -1.91796875, -1.5601806640625, -1.202392578125, -0.8446044921875, -0.48681640625, -0.1290283203125, 0.228759765625, 0.5865478515625, 0.9443359375, 1.3021240234375, 1.659912109375, 2.0177001953125, 2.37548828125, 2.7332763671875, 3.091064453125, 3.4488525390625, 3.806640625, 4.1644287109375, 4.522216796875, 4.8800048828125, 5.23779296875, 5.5955810546875, 5.953369140625, 6.3111572265625, 6.6689453125, 7.0267333984375, 7.384521484375, 7.7423095703125, 8.10009765625, 8.4578857421875, 8.815673828125, 9.1734619140625, 9.53125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 7.0, 13.0, 26.0, 44.0, 61.0, 108.0, 156.0, 155.0, 146.0, 103.0, 76.0, 45.0, 23.0, 10.0, 11.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.26039123535156, -76.82545471191406, -73.39051055908203, -69.95556640625, -66.5206298828125, -63.085689544677734, -59.65074920654297, -56.2158088684082, -52.78086853027344, -49.34592819213867, -45.910987854003906, -42.47604751586914, -39.041107177734375, -35.60616683959961, -32.171226501464844, -28.736286163330078, -25.301345825195312, -21.866405487060547, -18.43146514892578, -14.996524810791016, -11.56158447265625, -8.126644134521484, -4.691703796386719, -1.2567634582519531, 2.1781768798828125, 5.613117218017578, 9.048057556152344, 12.48299789428711, 15.917938232421875, 19.35287857055664, 22.787818908691406, 26.222759246826172, 29.657699584960938, 33.0926399230957, 36.52758026123047, 39.962520599365234, 43.3974609375, 46.832401275634766, 50.26734161376953, 53.7022819519043, 57.13722229003906, 60.57216262817383, 64.0071029663086, 67.44204711914062, 70.87698364257812, 74.31192016601562, 77.74686431884766, 81.18180847167969, 84.61674499511719, 88.05168151855469, 91.48662567138672, 94.92156982421875, 98.35650634765625, 101.79144287109375, 105.22638702392578, 108.66133117675781, 112.09626770019531, 115.53120422363281, 118.96614837646484, 122.40109252929688, 125.83602905273438, 129.27096557617188, 132.70590209960938, 136.14085388183594, 139.57579040527344]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 7.0, 3.0, 3.0, 10.0, 6.0, 12.0, 7.0, 13.0, 19.0, 16.0, 19.0, 18.0, 32.0, 28.0, 28.0, 37.0, 37.0, 46.0, 42.0, 36.0, 44.0, 48.0, 49.0, 45.0, 36.0, 46.0, 50.0, 40.0, 31.0, 37.0, 35.0, 28.0, 25.0, 12.0, 13.0, 9.0, 11.0, 10.0, 8.0, 2.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-49.0355224609375, -47.66252899169922, -46.28953552246094, -44.91653823852539, -43.54354476928711, -42.17055130004883, -40.79755401611328, -39.424560546875, -38.05156707763672, -36.67857360839844, -35.305580139160156, -33.93258285522461, -32.55958938598633, -31.186595916748047, -29.813600540161133, -28.44060516357422, -27.067611694335938, -25.694618225097656, -24.321622848510742, -22.948627471923828, -21.575634002685547, -20.202640533447266, -18.82964515686035, -17.456649780273438, -16.083656311035156, -14.710661888122559, -13.337667465209961, -11.964673042297363, -10.591678619384766, -9.218684196472168, -7.84568977355957, -6.472695350646973, -5.099700927734375, -3.7267065048217773, -2.3537120819091797, -0.980717658996582, 0.3922767639160156, 1.7652711868286133, 3.138265609741211, 4.511260032653809, 5.884254455566406, 7.257248878479004, 8.630243301391602, 10.0032377243042, 11.376232147216797, 12.749226570129395, 14.122220993041992, 15.49521541595459, 16.868209838867188, 18.24120330810547, 19.614198684692383, 20.987194061279297, 22.360187530517578, 23.73318099975586, 25.106176376342773, 26.479171752929688, 27.85216522216797, 29.22515869140625, 30.598154067993164, 31.971149444580078, 33.34414291381836, 34.71713638305664, 36.09013366699219, 37.46312713623047, 38.83612060546875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 6.0, 13.0, 8.0, 19.0, 31.0, 60.0, 75.0, 160.0, 301.0, 560.0, 1225.0, 2622.0, 6502.0, 18666.0, 60053.0, 228104.0, 506938.0, 156426.0, 43684.0, 13867.0, 4999.0, 2106.0, 1039.0, 489.0, 246.0, 144.0, 80.0, 40.0, 33.0, 15.0, 10.0, 5.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.796875, -12.37548828125, -11.9541015625, -11.53271484375, -11.111328125, -10.68994140625, -10.2685546875, -9.84716796875, -9.42578125, -9.00439453125, -8.5830078125, -8.16162109375, -7.740234375, -7.31884765625, -6.8974609375, -6.47607421875, -6.0546875, -5.63330078125, -5.2119140625, -4.79052734375, -4.369140625, -3.94775390625, -3.5263671875, -3.10498046875, -2.68359375, -2.26220703125, -1.8408203125, -1.41943359375, -0.998046875, -0.57666015625, -0.1552734375, 0.26611328125, 0.6875, 1.10888671875, 1.5302734375, 1.95166015625, 2.373046875, 2.79443359375, 3.2158203125, 3.63720703125, 4.05859375, 4.47998046875, 4.9013671875, 5.32275390625, 5.744140625, 6.16552734375, 6.5869140625, 7.00830078125, 7.4296875, 7.85107421875, 8.2724609375, 8.69384765625, 9.115234375, 9.53662109375, 9.9580078125, 10.37939453125, 10.80078125, 11.22216796875, 11.6435546875, 12.06494140625, 12.486328125, 12.90771484375, 13.3291015625, 13.75048828125, 14.171875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 8.0, 10.0, 16.0, 14.0, 29.0, 42.0, 48.0, 65.0, 58.0, 69.0, 49.0, 77.0, 92.0, 74.0, 77.0, 49.0, 54.0, 38.0, 31.0, 33.0, 18.0, 17.0, 10.0, 11.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.128173828125, -7.88916015625, -7.650146484375, -7.4111328125, -7.172119140625, -6.93310546875, -6.694091796875, -6.455078125, -6.216064453125, -5.97705078125, -5.738037109375, -5.4990234375, -5.260009765625, -5.02099609375, -4.781982421875, -4.54296875, -4.303955078125, -4.06494140625, -3.825927734375, -3.5869140625, -3.347900390625, -3.10888671875, -2.869873046875, -2.630859375, -2.391845703125, -2.15283203125, -1.913818359375, -1.6748046875, -1.435791015625, -1.19677734375, -0.957763671875, -0.71875, -0.479736328125, -0.24072265625, -0.001708984375, 0.2373046875, 0.476318359375, 0.71533203125, 0.954345703125, 1.193359375, 1.432373046875, 1.67138671875, 1.910400390625, 2.1494140625, 2.388427734375, 2.62744140625, 2.866455078125, 3.10546875, 3.344482421875, 3.58349609375, 3.822509765625, 4.0615234375, 4.300537109375, 4.53955078125, 4.778564453125, 5.017578125, 5.256591796875, 5.49560546875, 5.734619140625, 5.9736328125, 6.212646484375, 6.45166015625, 6.690673828125, 6.9296875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 5.0, 8.0, 9.0, 8.0, 14.0, 27.0, 34.0, 62.0, 60.0, 118.0, 178.0, 340.0, 611.0, 1400.0, 4338.0, 28146.0, 807777.0, 189169.0, 11393.0, 2703.0, 1020.0, 459.0, 248.0, 129.0, 91.0, 62.0, 39.0, 36.0, 21.0, 16.0, 8.0, 2.0, 9.0, 2.0, 1.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.28125, -33.130859375, -31.98046875, -30.830078125, -29.6796875, -28.529296875, -27.37890625, -26.228515625, -25.078125, -23.927734375, -22.77734375, -21.626953125, -20.4765625, -19.326171875, -18.17578125, -17.025390625, -15.875, -14.724609375, -13.57421875, -12.423828125, -11.2734375, -10.123046875, -8.97265625, -7.822265625, -6.671875, -5.521484375, -4.37109375, -3.220703125, -2.0703125, -0.919921875, 0.23046875, 1.380859375, 2.53125, 3.681640625, 4.83203125, 5.982421875, 7.1328125, 8.283203125, 9.43359375, 10.583984375, 11.734375, 12.884765625, 14.03515625, 15.185546875, 16.3359375, 17.486328125, 18.63671875, 19.787109375, 20.9375, 22.087890625, 23.23828125, 24.388671875, 25.5390625, 26.689453125, 27.83984375, 28.990234375, 30.140625, 31.291015625, 32.44140625, 33.591796875, 34.7421875, 35.892578125, 37.04296875, 38.193359375, 39.34375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 3.0, 13.0, 11.0, 15.0, 24.0, 27.0, 39.0, 48.0, 42.0, 74.0, 90.0, 91.0, 91.0, 77.0, 85.0, 67.0, 56.0, 35.0, 32.0, 19.0, 10.0, 6.0, 4.0, 6.0, 2.0, 7.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.46875, -33.2509765625, -32.033203125, -30.8154296875, -29.59765625, -28.3798828125, -27.162109375, -25.9443359375, -24.7265625, -23.5087890625, -22.291015625, -21.0732421875, -19.85546875, -18.6376953125, -17.419921875, -16.2021484375, -14.984375, -13.7666015625, -12.548828125, -11.3310546875, -10.11328125, -8.8955078125, -7.677734375, -6.4599609375, -5.2421875, -4.0244140625, -2.806640625, -1.5888671875, -0.37109375, 0.8466796875, 2.064453125, 3.2822265625, 4.5, 5.7177734375, 6.935546875, 8.1533203125, 9.37109375, 10.5888671875, 11.806640625, 13.0244140625, 14.2421875, 15.4599609375, 16.677734375, 17.8955078125, 19.11328125, 20.3310546875, 21.548828125, 22.7666015625, 23.984375, 25.2021484375, 26.419921875, 27.6376953125, 28.85546875, 30.0732421875, 31.291015625, 32.5087890625, 33.7265625, 34.9443359375, 36.162109375, 37.3798828125, 38.59765625, 39.8154296875, 41.033203125, 42.2509765625, 43.46875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 5.0, 5.0, 8.0, 12.0, 16.0, 15.0, 10.0, 24.0, 34.0, 45.0, 99.0, 145.0, 243.0, 603.0, 1717.0, 9626.0, 172810.0, 835672.0, 22869.0, 2968.0, 804.0, 355.0, 173.0, 87.0, 62.0, 43.0, 28.0, 15.0, 26.0, 7.0, 8.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.2978515625, -16.705078125, -16.1123046875, -15.51953125, -14.9267578125, -14.333984375, -13.7412109375, -13.1484375, -12.5556640625, -11.962890625, -11.3701171875, -10.77734375, -10.1845703125, -9.591796875, -8.9990234375, -8.40625, -7.8134765625, -7.220703125, -6.6279296875, -6.03515625, -5.4423828125, -4.849609375, -4.2568359375, -3.6640625, -3.0712890625, -2.478515625, -1.8857421875, -1.29296875, -0.7001953125, -0.107421875, 0.4853515625, 1.078125, 1.6708984375, 2.263671875, 2.8564453125, 3.44921875, 4.0419921875, 4.634765625, 5.2275390625, 5.8203125, 6.4130859375, 7.005859375, 7.5986328125, 8.19140625, 8.7841796875, 9.376953125, 9.9697265625, 10.5625, 11.1552734375, 11.748046875, 12.3408203125, 12.93359375, 13.5263671875, 14.119140625, 14.7119140625, 15.3046875, 15.8974609375, 16.490234375, 17.0830078125, 17.67578125, 18.2685546875, 18.861328125, 19.4541015625, 20.046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 6.0, 9.0, 13.0, 15.0, 13.0, 23.0, 43.0, 51.0, 76.0, 174.0, 213.0, 124.0, 58.0, 37.0, 25.0, 22.0, 20.0, 18.0, 14.0, 5.0, 8.0, 4.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0031757354736328125, -0.0030856430530548096, -0.0029955506324768066, -0.0029054582118988037, -0.0028153657913208008, -0.002725273370742798, -0.002635180950164795, -0.002545088529586792, -0.002454996109008789, -0.002364903688430786, -0.002274811267852783, -0.0021847188472747803, -0.0020946264266967773, -0.0020045340061187744, -0.0019144415855407715, -0.0018243491649627686, -0.0017342567443847656, -0.0016441643238067627, -0.0015540719032287598, -0.0014639794826507568, -0.001373887062072754, -0.001283794641494751, -0.001193702220916748, -0.0011036098003387451, -0.0010135173797607422, -0.0009234249591827393, -0.0008333325386047363, -0.0007432401180267334, -0.0006531476974487305, -0.0005630552768707275, -0.0004729628562927246, -0.0003828704357147217, -0.00029277801513671875, -0.00020268559455871582, -0.00011259317398071289, -2.250075340270996e-05, 6.759166717529297e-05, 0.0001576840877532959, 0.00024777650833129883, 0.00033786892890930176, 0.0004279613494873047, 0.0005180537700653076, 0.0006081461906433105, 0.0006982386112213135, 0.0007883310317993164, 0.0008784234523773193, 0.0009685158729553223, 0.0010586082935333252, 0.0011487007141113281, 0.001238793134689331, 0.001328885555267334, 0.001418977975845337, 0.0015090703964233398, 0.0015991628170013428, 0.0016892552375793457, 0.0017793476581573486, 0.0018694400787353516, 0.0019595324993133545, 0.0020496249198913574, 0.0021397173404693604, 0.0022298097610473633, 0.002319902181625366, 0.002409994602203369, 0.002500087022781372, 0.002590179443359375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 3.0, 5.0, 5.0, 13.0, 16.0, 20.0, 46.0, 45.0, 61.0, 108.0, 142.0, 274.0, 451.0, 1002.0, 2324.0, 7116.0, 30545.0, 697677.0, 277595.0, 21705.0, 5494.0, 1917.0, 922.0, 399.0, 205.0, 153.0, 99.0, 65.0, 45.0, 29.0, 22.0, 15.0, 9.0, 8.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.734375, -17.1953125, -16.65625, -16.1171875, -15.578125, -15.0390625, -14.5, -13.9609375, -13.421875, -12.8828125, -12.34375, -11.8046875, -11.265625, -10.7265625, -10.1875, -9.6484375, -9.109375, -8.5703125, -8.03125, -7.4921875, -6.953125, -6.4140625, -5.875, -5.3359375, -4.796875, -4.2578125, -3.71875, -3.1796875, -2.640625, -2.1015625, -1.5625, -1.0234375, -0.484375, 0.0546875, 0.59375, 1.1328125, 1.671875, 2.2109375, 2.75, 3.2890625, 3.828125, 4.3671875, 4.90625, 5.4453125, 5.984375, 6.5234375, 7.0625, 7.6015625, 8.140625, 8.6796875, 9.21875, 9.7578125, 10.296875, 10.8359375, 11.375, 11.9140625, 12.453125, 12.9921875, 13.53125, 14.0703125, 14.609375, 15.1484375, 15.6875, 16.2265625, 16.765625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 2.0, 7.0, 19.0, 16.0, 32.0, 59.0, 100.0, 160.0, 221.0, 146.0, 80.0, 38.0, 25.0, 16.0, 16.0, 9.0, 10.0, 8.0, 5.0, 3.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.234375, -17.7159423828125, -17.197509765625, -16.6790771484375, -16.16064453125, -15.6422119140625, -15.123779296875, -14.6053466796875, -14.0869140625, -13.5684814453125, -13.050048828125, -12.5316162109375, -12.01318359375, -11.4947509765625, -10.976318359375, -10.4578857421875, -9.939453125, -9.4210205078125, -8.902587890625, -8.3841552734375, -7.86572265625, -7.3472900390625, -6.828857421875, -6.3104248046875, -5.7919921875, -5.2735595703125, -4.755126953125, -4.2366943359375, -3.71826171875, -3.1998291015625, -2.681396484375, -2.1629638671875, -1.64453125, -1.1260986328125, -0.607666015625, -0.0892333984375, 0.42919921875, 0.9476318359375, 1.466064453125, 1.9844970703125, 2.5029296875, 3.0213623046875, 3.539794921875, 4.0582275390625, 4.57666015625, 5.0950927734375, 5.613525390625, 6.1319580078125, 6.650390625, 7.1688232421875, 7.687255859375, 8.2056884765625, 8.72412109375, 9.2425537109375, 9.760986328125, 10.2794189453125, 10.7978515625, 11.3162841796875, 11.834716796875, 12.3531494140625, 12.87158203125, 13.3900146484375, 13.908447265625, 14.4268798828125, 14.9453125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 8.0, 10.0, 24.0, 77.0, 167.0, 308.0, 203.0, 118.0, 50.0, 13.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.7328338623047, -156.73707580566406, -148.74131774902344, -140.7455596923828, -132.74981689453125, -124.7540512084961, -116.75830078125, -108.76254272460938, -100.76678466796875, -92.77102661132812, -84.7752685546875, -76.7795181274414, -68.78376007080078, -60.788002014160156, -52.7922477722168, -44.79649353027344, -36.80073547363281, -28.80497932434082, -20.809223175048828, -12.813467025756836, -4.817710876464844, 3.1780471801757812, 11.17380142211914, 19.1695556640625, 27.165313720703125, 35.16107177734375, 43.15682601928711, 51.15258026123047, 59.148338317871094, 67.14409637451172, 75.13984680175781, 83.13560485839844, 91.13134765625, 99.12710571289062, 107.12286376953125, 115.11861419677734, 123.11437225341797, 131.11013793945312, 139.1058807373047, 147.1016387939453, 155.09739685058594, 163.09315490722656, 171.0889129638672, 179.0846710205078, 187.08041381835938, 195.076171875, 203.07192993164062, 211.06768798828125, 219.06344604492188, 227.0592041015625, 235.05496215820312, 243.05072021484375, 251.04647827148438, 259.042236328125, 267.0379943847656, 275.03375244140625, 283.02947998046875, 291.0252380371094, 299.02099609375, 307.0167541503906, 315.01251220703125, 323.0082702636719, 331.0040283203125, 338.999755859375, 346.99554443359375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 6.0, 12.0, 11.0, 18.0, 19.0, 19.0, 25.0, 29.0, 42.0, 46.0, 53.0, 53.0, 61.0, 78.0, 66.0, 62.0, 61.0, 54.0, 52.0, 41.0, 38.0, 26.0, 26.0, 20.0, 20.0, 13.0, 14.0, 13.0, 8.0, 4.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.6919937133789, -92.19994354248047, -88.70789337158203, -85.2158432006836, -81.72379302978516, -78.23174285888672, -74.73970031738281, -71.24765014648438, -67.75559997558594, -64.2635498046875, -60.77149963378906, -57.279449462890625, -53.78739929199219, -50.29534912109375, -46.80330276489258, -43.31125259399414, -39.81919860839844, -36.3271484375, -32.83509826660156, -29.343050003051758, -25.85099983215332, -22.358949661254883, -18.866901397705078, -15.37485122680664, -11.882801055908203, -8.390750885009766, -4.8987016677856445, -1.4066524505615234, 2.085397720336914, 5.577447891235352, 9.069496154785156, 12.561546325683594, 16.0535888671875, 19.545639038085938, 23.037689208984375, 26.52973747253418, 30.021787643432617, 33.51383972167969, 37.00588607788086, 40.4979362487793, 43.989986419677734, 47.48203659057617, 50.97408676147461, 54.46613311767578, 57.95818328857422, 61.450233459472656, 64.9422836303711, 68.43433380126953, 71.92638397216797, 75.4184341430664, 78.91048431396484, 82.40253448486328, 85.89458465576172, 89.38663482666016, 92.87867736816406, 96.3707275390625, 99.86277770996094, 103.35482788085938, 106.84687805175781, 110.33892822265625, 113.83097839355469, 117.32302856445312, 120.81507873535156, 124.30712890625, 127.79917907714844]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 9.0, 9.0, 25.0, 36.0, 48.0, 59.0, 106.0, 183.0, 315.0, 790.0, 5425.0, 529010.0, 3641297.0, 14667.0, 1391.0, 396.0, 182.0, 114.0, 68.0, 53.0, 33.0, 14.0, 9.0, 7.0, 7.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.921875, -30.92919921875, -29.9365234375, -28.94384765625, -27.951171875, -26.95849609375, -25.9658203125, -24.97314453125, -23.98046875, -22.98779296875, -21.9951171875, -21.00244140625, -20.009765625, -19.01708984375, -18.0244140625, -17.03173828125, -16.0390625, -15.04638671875, -14.0537109375, -13.06103515625, -12.068359375, -11.07568359375, -10.0830078125, -9.09033203125, -8.09765625, -7.10498046875, -6.1123046875, -5.11962890625, -4.126953125, -3.13427734375, -2.1416015625, -1.14892578125, -0.15625, 0.83642578125, 1.8291015625, 2.82177734375, 3.814453125, 4.80712890625, 5.7998046875, 6.79248046875, 7.78515625, 8.77783203125, 9.7705078125, 10.76318359375, 11.755859375, 12.74853515625, 13.7412109375, 14.73388671875, 15.7265625, 16.71923828125, 17.7119140625, 18.70458984375, 19.697265625, 20.68994140625, 21.6826171875, 22.67529296875, 23.66796875, 24.66064453125, 25.6533203125, 26.64599609375, 27.638671875, 28.63134765625, 29.6240234375, 30.61669921875, 31.609375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 11.0, 10.0, 26.0, 26.0, 26.0, 53.0, 43.0, 72.0, 65.0, 99.0, 92.0, 80.0, 65.0, 83.0, 61.0, 38.0, 32.0, 33.0, 22.0, 17.0, 15.0, 7.0, 9.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.8458251953125, -7.582275390625, -7.3187255859375, -7.05517578125, -6.7916259765625, -6.528076171875, -6.2645263671875, -6.0009765625, -5.7374267578125, -5.473876953125, -5.2103271484375, -4.94677734375, -4.6832275390625, -4.419677734375, -4.1561279296875, -3.892578125, -3.6290283203125, -3.365478515625, -3.1019287109375, -2.83837890625, -2.5748291015625, -2.311279296875, -2.0477294921875, -1.7841796875, -1.5206298828125, -1.257080078125, -0.9935302734375, -0.72998046875, -0.4664306640625, -0.202880859375, 0.0606689453125, 0.32421875, 0.5877685546875, 0.851318359375, 1.1148681640625, 1.37841796875, 1.6419677734375, 1.905517578125, 2.1690673828125, 2.4326171875, 2.6961669921875, 2.959716796875, 3.2232666015625, 3.48681640625, 3.7503662109375, 4.013916015625, 4.2774658203125, 4.541015625, 4.8045654296875, 5.068115234375, 5.3316650390625, 5.59521484375, 5.8587646484375, 6.122314453125, 6.3858642578125, 6.6494140625, 6.9129638671875, 7.176513671875, 7.4400634765625, 7.70361328125, 7.9671630859375, 8.230712890625, 8.4942626953125, 8.7578125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 15.0, 17.0, 34.0, 69.0, 135.0, 265.0, 494.0, 1065.0, 2766.0, 8404.0, 32048.0, 201777.0, 2262665.0, 1512579.0, 135012.0, 25204.0, 7257.0, 2530.0, 976.0, 435.0, 219.0, 129.0, 58.0, 54.0, 26.0, 20.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.328125, -11.9847412109375, -11.641357421875, -11.2979736328125, -10.95458984375, -10.6112060546875, -10.267822265625, -9.9244384765625, -9.5810546875, -9.2376708984375, -8.894287109375, -8.5509033203125, -8.20751953125, -7.8641357421875, -7.520751953125, -7.1773681640625, -6.833984375, -6.4906005859375, -6.147216796875, -5.8038330078125, -5.46044921875, -5.1170654296875, -4.773681640625, -4.4302978515625, -4.0869140625, -3.7435302734375, -3.400146484375, -3.0567626953125, -2.71337890625, -2.3699951171875, -2.026611328125, -1.6832275390625, -1.33984375, -0.9964599609375, -0.653076171875, -0.3096923828125, 0.03369140625, 0.3770751953125, 0.720458984375, 1.0638427734375, 1.4072265625, 1.7506103515625, 2.093994140625, 2.4373779296875, 2.78076171875, 3.1241455078125, 3.467529296875, 3.8109130859375, 4.154296875, 4.4976806640625, 4.841064453125, 5.1844482421875, 5.52783203125, 5.8712158203125, 6.214599609375, 6.5579833984375, 6.9013671875, 7.2447509765625, 7.588134765625, 7.9315185546875, 8.27490234375, 8.6182861328125, 8.961669921875, 9.3050537109375, 9.6484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 3.0, 7.0, 10.0, 9.0, 15.0, 28.0, 53.0, 42.0, 136.0, 187.0, 248.0, 384.0, 547.0, 662.0, 551.0, 394.0, 275.0, 180.0, 104.0, 71.0, 41.0, 33.0, 23.0, 19.0, 10.0, 12.0, 11.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.8004150390625, -8.468017578125, -8.1356201171875, -7.80322265625, -7.4708251953125, -7.138427734375, -6.8060302734375, -6.4736328125, -6.1412353515625, -5.808837890625, -5.4764404296875, -5.14404296875, -4.8116455078125, -4.479248046875, -4.1468505859375, -3.814453125, -3.4820556640625, -3.149658203125, -2.8172607421875, -2.48486328125, -2.1524658203125, -1.820068359375, -1.4876708984375, -1.1552734375, -0.8228759765625, -0.490478515625, -0.1580810546875, 0.17431640625, 0.5067138671875, 0.839111328125, 1.1715087890625, 1.50390625, 1.8363037109375, 2.168701171875, 2.5010986328125, 2.83349609375, 3.1658935546875, 3.498291015625, 3.8306884765625, 4.1630859375, 4.4954833984375, 4.827880859375, 5.1602783203125, 5.49267578125, 5.8250732421875, 6.157470703125, 6.4898681640625, 6.822265625, 7.1546630859375, 7.487060546875, 7.8194580078125, 8.15185546875, 8.4842529296875, 8.816650390625, 9.1490478515625, 9.4814453125, 9.8138427734375, 10.146240234375, 10.4786376953125, 10.81103515625, 11.1434326171875, 11.475830078125, 11.8082275390625, 12.140625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 8.0, 8.0, 10.0, 32.0, 95.0, 159.0, 218.0, 221.0, 139.0, 55.0, 25.0, 13.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.59634399414062, -109.3470458984375, -105.09774780273438, -100.84845733642578, -96.59915924072266, -92.34986114501953, -88.10057067871094, -83.85127258300781, -79.60197448730469, -75.35267639160156, -71.10337829589844, -66.85408782958984, -62.60478973388672, -58.355491638183594, -54.106197357177734, -49.856903076171875, -45.60760498046875, -41.358306884765625, -37.109012603759766, -32.859718322753906, -28.61042022705078, -24.36112403869629, -20.111827850341797, -15.862531661987305, -11.613235473632812, -7.36393928527832, -3.114643096923828, 1.134653091430664, 5.383949279785156, 9.633245468139648, 13.88254165649414, 18.131837844848633, 22.381118774414062, 26.630414962768555, 30.879711151123047, 35.129005432128906, 39.37830352783203, 43.627601623535156, 47.876895904541016, 52.126190185546875, 56.37548828125, 60.624786376953125, 64.87408447265625, 69.12337493896484, 73.37267303466797, 77.6219711303711, 81.87126159667969, 86.12055969238281, 90.36985778808594, 94.61915588378906, 98.86845397949219, 103.11774444580078, 107.3670425415039, 111.61634063720703, 115.86563110351562, 120.11492919921875, 124.36422729492188, 128.613525390625, 132.86282348632812, 137.11212158203125, 141.36141967773438, 145.61070251464844, 149.86000061035156, 154.1092987060547, 158.3585968017578]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 14.0, 10.0, 22.0, 21.0, 20.0, 36.0, 33.0, 35.0, 32.0, 40.0, 51.0, 56.0, 54.0, 50.0, 70.0, 47.0, 56.0, 50.0, 43.0, 37.0, 40.0, 28.0, 30.0, 18.0, 20.0, 17.0, 11.0, 13.0, 11.0, 10.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-55.51289367675781, -53.9188117980957, -52.32473373413086, -50.73065185546875, -49.136573791503906, -47.5424919128418, -45.94841003417969, -44.354331970214844, -42.760250091552734, -41.166168212890625, -39.57209014892578, -37.97800827026367, -36.38393020629883, -34.78984832763672, -33.195770263671875, -31.601688385009766, -30.00760841369629, -28.413528442382812, -26.819448471069336, -25.22536849975586, -23.63128662109375, -22.037206649780273, -20.443126678466797, -18.849044799804688, -17.254966735839844, -15.660886764526367, -14.066805839538574, -12.472725868225098, -10.878644943237305, -9.284564971923828, -7.690485000610352, -6.096404075622559, -4.502323150634766, -2.908242702484131, -1.3141624927520752, 0.27991771697998047, 1.8739981651306152, 3.46807861328125, 5.062158584594727, 6.6562395095825195, 8.250319480895996, 9.844399452209473, 11.438480377197266, 13.032560348510742, 14.626640319824219, 16.220722198486328, 17.814800262451172, 19.40888214111328, 21.002962112426758, 22.597042083740234, 24.19112205505371, 25.785202026367188, 27.379283905029297, 28.973363876342773, 30.56744384765625, 32.16152572631836, 33.7556037902832, 35.34968566894531, 36.943763732910156, 38.537845611572266, 40.13192367553711, 41.72600555419922, 43.32008361816406, 44.91416549682617, 46.50824737548828]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 8.0, 13.0, 10.0, 15.0, 24.0, 24.0, 30.0, 43.0, 66.0, 124.0, 198.0, 322.0, 606.0, 1201.0, 2575.0, 6418.0, 17184.0, 52053.0, 198953.0, 518808.0, 175842.0, 47328.0, 15834.0, 5987.0, 2464.0, 1076.0, 550.0, 298.0, 172.0, 99.0, 75.0, 41.0, 34.0, 20.0, 18.0, 14.0, 9.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.109375, -14.6949462890625, -14.280517578125, -13.8660888671875, -13.45166015625, -13.0372314453125, -12.622802734375, -12.2083740234375, -11.7939453125, -11.3795166015625, -10.965087890625, -10.5506591796875, -10.13623046875, -9.7218017578125, -9.307373046875, -8.8929443359375, -8.478515625, -8.0640869140625, -7.649658203125, -7.2352294921875, -6.82080078125, -6.4063720703125, -5.991943359375, -5.5775146484375, -5.1630859375, -4.7486572265625, -4.334228515625, -3.9197998046875, -3.50537109375, -3.0909423828125, -2.676513671875, -2.2620849609375, -1.84765625, -1.4332275390625, -1.018798828125, -0.6043701171875, -0.18994140625, 0.2244873046875, 0.638916015625, 1.0533447265625, 1.4677734375, 1.8822021484375, 2.296630859375, 2.7110595703125, 3.12548828125, 3.5399169921875, 3.954345703125, 4.3687744140625, 4.783203125, 5.1976318359375, 5.612060546875, 6.0264892578125, 6.44091796875, 6.8553466796875, 7.269775390625, 7.6842041015625, 8.0986328125, 8.5130615234375, 8.927490234375, 9.3419189453125, 9.75634765625, 10.1707763671875, 10.585205078125, 10.9996337890625, 11.4140625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 6.0, 13.0, 10.0, 17.0, 16.0, 17.0, 36.0, 29.0, 46.0, 46.0, 63.0, 47.0, 61.0, 62.0, 68.0, 65.0, 59.0, 58.0, 56.0, 39.0, 32.0, 22.0, 19.0, 18.0, 14.0, 18.0, 7.0, 6.0, 11.0, 13.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.94921875, -7.74578857421875, -7.5423583984375, -7.33892822265625, -7.135498046875, -6.93206787109375, -6.7286376953125, -6.52520751953125, -6.32177734375, -6.11834716796875, -5.9149169921875, -5.71148681640625, -5.508056640625, -5.30462646484375, -5.1011962890625, -4.89776611328125, -4.6943359375, -4.49090576171875, -4.2874755859375, -4.08404541015625, -3.880615234375, -3.67718505859375, -3.4737548828125, -3.27032470703125, -3.06689453125, -2.86346435546875, -2.6600341796875, -2.45660400390625, -2.253173828125, -2.04974365234375, -1.8463134765625, -1.64288330078125, -1.439453125, -1.23602294921875, -1.0325927734375, -0.82916259765625, -0.625732421875, -0.42230224609375, -0.2188720703125, -0.01544189453125, 0.18798828125, 0.39141845703125, 0.5948486328125, 0.79827880859375, 1.001708984375, 1.20513916015625, 1.4085693359375, 1.61199951171875, 1.8154296875, 2.01885986328125, 2.2222900390625, 2.42572021484375, 2.629150390625, 2.83258056640625, 3.0360107421875, 3.23944091796875, 3.44287109375, 3.64630126953125, 3.8497314453125, 4.05316162109375, 4.256591796875, 4.46002197265625, 4.6634521484375, 4.86688232421875, 5.0703125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 6.0, 13.0, 14.0, 18.0, 26.0, 47.0, 69.0, 107.0, 211.0, 403.0, 813.0, 1857.0, 5785.0, 25838.0, 222328.0, 710396.0, 64290.0, 10928.0, 3063.0, 1115.0, 559.0, 245.0, 158.0, 86.0, 53.0, 36.0, 21.0, 19.0, 15.0, 10.0, 4.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.765625, -18.982421875, -18.19921875, -17.416015625, -16.6328125, -15.849609375, -15.06640625, -14.283203125, -13.5, -12.716796875, -11.93359375, -11.150390625, -10.3671875, -9.583984375, -8.80078125, -8.017578125, -7.234375, -6.451171875, -5.66796875, -4.884765625, -4.1015625, -3.318359375, -2.53515625, -1.751953125, -0.96875, -0.185546875, 0.59765625, 1.380859375, 2.1640625, 2.947265625, 3.73046875, 4.513671875, 5.296875, 6.080078125, 6.86328125, 7.646484375, 8.4296875, 9.212890625, 9.99609375, 10.779296875, 11.5625, 12.345703125, 13.12890625, 13.912109375, 14.6953125, 15.478515625, 16.26171875, 17.044921875, 17.828125, 18.611328125, 19.39453125, 20.177734375, 20.9609375, 21.744140625, 22.52734375, 23.310546875, 24.09375, 24.876953125, 25.66015625, 26.443359375, 27.2265625, 28.009765625, 28.79296875, 29.576171875, 30.359375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 5.0, 6.0, 8.0, 17.0, 17.0, 24.0, 35.0, 39.0, 48.0, 69.0, 59.0, 77.0, 82.0, 70.0, 63.0, 81.0, 64.0, 69.0, 40.0, 35.0, 31.0, 20.0, 6.0, 12.0, 11.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.0625, -37.853515625, -36.64453125, -35.435546875, -34.2265625, -33.017578125, -31.80859375, -30.599609375, -29.390625, -28.181640625, -26.97265625, -25.763671875, -24.5546875, -23.345703125, -22.13671875, -20.927734375, -19.71875, -18.509765625, -17.30078125, -16.091796875, -14.8828125, -13.673828125, -12.46484375, -11.255859375, -10.046875, -8.837890625, -7.62890625, -6.419921875, -5.2109375, -4.001953125, -2.79296875, -1.583984375, -0.375, 0.833984375, 2.04296875, 3.251953125, 4.4609375, 5.669921875, 6.87890625, 8.087890625, 9.296875, 10.505859375, 11.71484375, 12.923828125, 14.1328125, 15.341796875, 16.55078125, 17.759765625, 18.96875, 20.177734375, 21.38671875, 22.595703125, 23.8046875, 25.013671875, 26.22265625, 27.431640625, 28.640625, 29.849609375, 31.05859375, 32.267578125, 33.4765625, 34.685546875, 35.89453125, 37.103515625, 38.3125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 7.0, 18.0, 25.0, 22.0, 39.0, 44.0, 76.0, 148.0, 378.0, 1030.0, 4948.0, 72386.0, 936819.0, 28135.0, 3034.0, 768.0, 306.0, 136.0, 85.0, 50.0, 34.0, 12.0, 15.0, 11.0, 6.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.3125, -26.493896484375, -25.67529296875, -24.856689453125, -24.0380859375, -23.219482421875, -22.40087890625, -21.582275390625, -20.763671875, -19.945068359375, -19.12646484375, -18.307861328125, -17.4892578125, -16.670654296875, -15.85205078125, -15.033447265625, -14.21484375, -13.396240234375, -12.57763671875, -11.759033203125, -10.9404296875, -10.121826171875, -9.30322265625, -8.484619140625, -7.666015625, -6.847412109375, -6.02880859375, -5.210205078125, -4.3916015625, -3.572998046875, -2.75439453125, -1.935791015625, -1.1171875, -0.298583984375, 0.52001953125, 1.338623046875, 2.1572265625, 2.975830078125, 3.79443359375, 4.613037109375, 5.431640625, 6.250244140625, 7.06884765625, 7.887451171875, 8.7060546875, 9.524658203125, 10.34326171875, 11.161865234375, 11.98046875, 12.799072265625, 13.61767578125, 14.436279296875, 15.2548828125, 16.073486328125, 16.89208984375, 17.710693359375, 18.529296875, 19.347900390625, 20.16650390625, 20.985107421875, 21.8037109375, 22.622314453125, 23.44091796875, 24.259521484375, 25.078125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 1.0, 6.0, 9.0, 4.0, 5.0, 4.0, 10.0, 13.0, 32.0, 30.0, 58.0, 77.0, 172.0, 188.0, 143.0, 72.0, 45.0, 36.0, 29.0, 16.0, 10.0, 8.0, 7.0, 2.0, 5.0, 6.0, 3.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002471923828125, -0.002378016710281372, -0.002284109592437744, -0.002190202474594116, -0.0020962953567504883, -0.0020023882389068604, -0.0019084811210632324, -0.0018145740032196045, -0.0017206668853759766, -0.0016267597675323486, -0.0015328526496887207, -0.0014389455318450928, -0.0013450384140014648, -0.001251131296157837, -0.001157224178314209, -0.001063317060470581, -0.0009694099426269531, -0.0008755028247833252, -0.0007815957069396973, -0.0006876885890960693, -0.0005937814712524414, -0.0004998743534088135, -0.00040596723556518555, -0.0003120601177215576, -0.0002181529998779297, -0.00012424588203430176, -3.0338764190673828e-05, 6.35683536529541e-05, 0.00015747547149658203, 0.00025138258934020996, 0.0003452897071838379, 0.0004391968250274658, 0.0005331039428710938, 0.0006270110607147217, 0.0007209181785583496, 0.0008148252964019775, 0.0009087324142456055, 0.0010026395320892334, 0.0010965466499328613, 0.0011904537677764893, 0.0012843608856201172, 0.0013782680034637451, 0.001472175121307373, 0.001566082239151001, 0.001659989356994629, 0.0017538964748382568, 0.0018478035926818848, 0.0019417107105255127, 0.0020356178283691406, 0.0021295249462127686, 0.0022234320640563965, 0.0023173391819000244, 0.0024112462997436523, 0.0025051534175872803, 0.002599060535430908, 0.002692967653274536, 0.002786874771118164, 0.002880781888961792, 0.00297468900680542, 0.003068596124649048, 0.0031625032424926758, 0.0032564103603363037, 0.0033503174781799316, 0.0034442245960235596, 0.0035381317138671875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 5.0, 1.0, 3.0, 4.0, 4.0, 3.0, 18.0, 23.0, 31.0, 35.0, 76.0, 140.0, 291.0, 556.0, 1307.0, 3371.0, 12111.0, 147460.0, 845143.0, 28540.0, 5811.0, 1977.0, 847.0, 352.0, 208.0, 84.0, 54.0, 35.0, 23.0, 17.0, 13.0, 2.0, 5.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-19.484375, -18.81787109375, -18.1513671875, -17.48486328125, -16.818359375, -16.15185546875, -15.4853515625, -14.81884765625, -14.15234375, -13.48583984375, -12.8193359375, -12.15283203125, -11.486328125, -10.81982421875, -10.1533203125, -9.48681640625, -8.8203125, -8.15380859375, -7.4873046875, -6.82080078125, -6.154296875, -5.48779296875, -4.8212890625, -4.15478515625, -3.48828125, -2.82177734375, -2.1552734375, -1.48876953125, -0.822265625, -0.15576171875, 0.5107421875, 1.17724609375, 1.84375, 2.51025390625, 3.1767578125, 3.84326171875, 4.509765625, 5.17626953125, 5.8427734375, 6.50927734375, 7.17578125, 7.84228515625, 8.5087890625, 9.17529296875, 9.841796875, 10.50830078125, 11.1748046875, 11.84130859375, 12.5078125, 13.17431640625, 13.8408203125, 14.50732421875, 15.173828125, 15.84033203125, 16.5068359375, 17.17333984375, 17.83984375, 18.50634765625, 19.1728515625, 19.83935546875, 20.505859375, 21.17236328125, 21.8388671875, 22.50537109375, 23.171875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 10.0, 15.0, 13.0, 20.0, 55.0, 50.0, 95.0, 113.0, 175.0, 135.0, 110.0, 77.0, 32.0, 32.0, 8.0, 11.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.75, -13.3172607421875, -12.884521484375, -12.4517822265625, -12.01904296875, -11.5863037109375, -11.153564453125, -10.7208251953125, -10.2880859375, -9.8553466796875, -9.422607421875, -8.9898681640625, -8.55712890625, -8.1243896484375, -7.691650390625, -7.2589111328125, -6.826171875, -6.3934326171875, -5.960693359375, -5.5279541015625, -5.09521484375, -4.6624755859375, -4.229736328125, -3.7969970703125, -3.3642578125, -2.9315185546875, -2.498779296875, -2.0660400390625, -1.63330078125, -1.2005615234375, -0.767822265625, -0.3350830078125, 0.09765625, 0.5303955078125, 0.963134765625, 1.3958740234375, 1.82861328125, 2.2613525390625, 2.694091796875, 3.1268310546875, 3.5595703125, 3.9923095703125, 4.425048828125, 4.8577880859375, 5.29052734375, 5.7232666015625, 6.156005859375, 6.5887451171875, 7.021484375, 7.4542236328125, 7.886962890625, 8.3197021484375, 8.75244140625, 9.1851806640625, 9.617919921875, 10.0506591796875, 10.4833984375, 10.9161376953125, 11.348876953125, 11.7816162109375, 12.21435546875, 12.6470947265625, 13.079833984375, 13.5125732421875, 13.9453125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 9.0, 35.0, 117.0, 258.0, 353.0, 155.0, 37.0, 17.0, 6.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-297.60223388671875, -288.0688171386719, -278.535400390625, -269.0019836425781, -259.46856689453125, -249.93515014648438, -240.40174865722656, -230.8683319091797, -221.3349151611328, -211.80149841308594, -202.26808166503906, -192.7346649169922, -183.20126342773438, -173.6678466796875, -164.13442993164062, -154.60101318359375, -145.06759643554688, -135.5341796875, -126.00076293945312, -116.46735382080078, -106.9339370727539, -97.40052032470703, -87.86711120605469, -78.33369445800781, -68.80027770996094, -59.26686096191406, -49.73344802856445, -40.200035095214844, -30.66661834716797, -21.133201599121094, -11.599788665771484, -2.066375732421875, 7.467010498046875, 17.000425338745117, 26.53384017944336, 36.06725311279297, 45.600669860839844, 55.13408660888672, 64.66749572753906, 74.20091247558594, 83.73432922363281, 93.26774597167969, 102.80116271972656, 112.3345718383789, 121.86798858642578, 131.40139770507812, 140.934814453125, 150.46823120117188, 160.00164794921875, 169.53506469726562, 179.0684814453125, 188.60189819335938, 198.13531494140625, 207.66873168945312, 217.20213317871094, 226.7355499267578, 236.2689666748047, 245.80238342285156, 255.33580017089844, 264.86920166015625, 274.4026184082031, 283.93603515625, 293.4694519042969, 303.00286865234375, 312.5362854003906]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 5.0, 13.0, 8.0, 13.0, 51.0, 38.0, 48.0, 59.0, 81.0, 74.0, 111.0, 118.0, 84.0, 70.0, 55.0, 38.0, 48.0, 26.0, 23.0, 9.0, 9.0, 10.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-264.48590087890625, -258.87890625, -253.2719268798828, -247.66493225097656, -242.0579376220703, -236.45095825195312, -230.84396362304688, -225.23696899414062, -219.62998962402344, -214.0229949951172, -208.416015625, -202.80902099609375, -197.2020263671875, -191.5950469970703, -185.98805236816406, -180.38107299804688, -174.77407836914062, -169.16708374023438, -163.5601043701172, -157.95310974121094, -152.3461151123047, -146.7391357421875, -141.13214111328125, -135.525146484375, -129.91815185546875, -124.31116485595703, -118.70417022705078, -113.09718322753906, -107.49019622802734, -101.88320922851562, -96.27621459960938, -90.66922760009766, -85.0622329711914, -79.45524597167969, -73.84825134277344, -68.24126434326172, -62.63427734375, -57.027286529541016, -51.42029571533203, -45.81330871582031, -40.20631790161133, -34.599327087402344, -28.992340087890625, -23.38534927368164, -17.77836036682129, -12.171371459960938, -6.564380645751953, -0.9573936462402344, 4.64959716796875, 10.256586074829102, 15.86357593536377, 21.470565795898438, 27.07755470275879, 32.68454360961914, 38.291534423828125, 43.898521423339844, 49.50551223754883, 55.11250305175781, 60.71949005126953, 66.32647705078125, 71.9334716796875, 77.54045867919922, 83.14744567871094, 88.75444030761719, 94.3614273071289]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 8.0, 2.0, 6.0, 9.0, 13.0, 11.0, 16.0, 22.0, 29.0, 26.0, 47.0, 59.0, 63.0, 93.0, 134.0, 190.0, 261.0, 561.0, 1254.0, 4110.0, 25301.0, 460080.0, 3427704.0, 246400.0, 19985.0, 4670.0, 1815.0, 774.0, 325.0, 134.0, 66.0, 48.0, 24.0, 10.0, 13.0, 5.0, 3.0, 1.0, 0.0, 2.0, 4.0], "bins": [-22.90625, -22.40185546875, -21.8974609375, -21.39306640625, -20.888671875, -20.38427734375, -19.8798828125, -19.37548828125, -18.87109375, -18.36669921875, -17.8623046875, -17.35791015625, -16.853515625, -16.34912109375, -15.8447265625, -15.34033203125, -14.8359375, -14.33154296875, -13.8271484375, -13.32275390625, -12.818359375, -12.31396484375, -11.8095703125, -11.30517578125, -10.80078125, -10.29638671875, -9.7919921875, -9.28759765625, -8.783203125, -8.27880859375, -7.7744140625, -7.27001953125, -6.765625, -6.26123046875, -5.7568359375, -5.25244140625, -4.748046875, -4.24365234375, -3.7392578125, -3.23486328125, -2.73046875, -2.22607421875, -1.7216796875, -1.21728515625, -0.712890625, -0.20849609375, 0.2958984375, 0.80029296875, 1.3046875, 1.80908203125, 2.3134765625, 2.81787109375, 3.322265625, 3.82666015625, 4.3310546875, 4.83544921875, 5.33984375, 5.84423828125, 6.3486328125, 6.85302734375, 7.357421875, 7.86181640625, 8.3662109375, 8.87060546875, 9.375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 9.0, 23.0, 52.0, 105.0, 162.0, 161.0, 181.0, 122.0, 92.0, 45.0, 32.0, 14.0, 3.0, 6.0], "bins": [-31.515625, -30.9515380859375, -30.387451171875, -29.8233642578125, -29.25927734375, -28.6951904296875, -28.131103515625, -27.5670166015625, -27.0029296875, -26.4388427734375, -25.874755859375, -25.3106689453125, -24.74658203125, -24.1824951171875, -23.618408203125, -23.0543212890625, -22.490234375, -21.9261474609375, -21.362060546875, -20.7979736328125, -20.23388671875, -19.6697998046875, -19.105712890625, -18.5416259765625, -17.9775390625, -17.4134521484375, -16.849365234375, -16.2852783203125, -15.72119140625, -15.1571044921875, -14.593017578125, -14.0289306640625, -13.46484375, -12.9007568359375, -12.336669921875, -11.7725830078125, -11.20849609375, -10.6444091796875, -10.080322265625, -9.5162353515625, -8.9521484375, -8.3880615234375, -7.823974609375, -7.2598876953125, -6.69580078125, -6.1317138671875, -5.567626953125, -5.0035400390625, -4.439453125, -3.8753662109375, -3.311279296875, -2.7471923828125, -2.18310546875, -1.6190185546875, -1.054931640625, -0.4908447265625, 0.0732421875, 0.6373291015625, 1.201416015625, 1.7655029296875, 2.32958984375, 2.8936767578125, 3.457763671875, 4.0218505859375, 4.5859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 4.0, 8.0, 10.0, 16.0, 27.0, 27.0, 42.0, 55.0, 90.0, 164.0, 315.0, 890.0, 2966.0, 13385.0, 94721.0, 1488504.0, 2404728.0, 158357.0, 22367.0, 4904.0, 1393.0, 534.0, 272.0, 113.0, 101.0, 81.0, 51.0, 35.0, 19.0, 26.0, 20.0, 13.0, 11.0, 13.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.1015625, -13.633056640625, -13.16455078125, -12.696044921875, -12.2275390625, -11.759033203125, -11.29052734375, -10.822021484375, -10.353515625, -9.885009765625, -9.41650390625, -8.947998046875, -8.4794921875, -8.010986328125, -7.54248046875, -7.073974609375, -6.60546875, -6.136962890625, -5.66845703125, -5.199951171875, -4.7314453125, -4.262939453125, -3.79443359375, -3.325927734375, -2.857421875, -2.388916015625, -1.92041015625, -1.451904296875, -0.9833984375, -0.514892578125, -0.04638671875, 0.422119140625, 0.890625, 1.359130859375, 1.82763671875, 2.296142578125, 2.7646484375, 3.233154296875, 3.70166015625, 4.170166015625, 4.638671875, 5.107177734375, 5.57568359375, 6.044189453125, 6.5126953125, 6.981201171875, 7.44970703125, 7.918212890625, 8.38671875, 8.855224609375, 9.32373046875, 9.792236328125, 10.2607421875, 10.729248046875, 11.19775390625, 11.666259765625, 12.134765625, 12.603271484375, 13.07177734375, 13.540283203125, 14.0087890625, 14.477294921875, 14.94580078125, 15.414306640625, 15.8828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 6.0, 11.0, 12.0, 29.0, 33.0, 69.0, 80.0, 120.0, 220.0, 285.0, 371.0, 550.0, 604.0, 488.0, 358.0, 230.0, 178.0, 120.0, 82.0, 61.0, 48.0, 33.0, 20.0, 15.0, 7.0, 8.0, 12.0, 5.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.234375, -9.815185546875, -9.39599609375, -8.976806640625, -8.5576171875, -8.138427734375, -7.71923828125, -7.300048828125, -6.880859375, -6.461669921875, -6.04248046875, -5.623291015625, -5.2041015625, -4.784912109375, -4.36572265625, -3.946533203125, -3.52734375, -3.108154296875, -2.68896484375, -2.269775390625, -1.8505859375, -1.431396484375, -1.01220703125, -0.593017578125, -0.173828125, 0.245361328125, 0.66455078125, 1.083740234375, 1.5029296875, 1.922119140625, 2.34130859375, 2.760498046875, 3.1796875, 3.598876953125, 4.01806640625, 4.437255859375, 4.8564453125, 5.275634765625, 5.69482421875, 6.114013671875, 6.533203125, 6.952392578125, 7.37158203125, 7.790771484375, 8.2099609375, 8.629150390625, 9.04833984375, 9.467529296875, 9.88671875, 10.305908203125, 10.72509765625, 11.144287109375, 11.5634765625, 11.982666015625, 12.40185546875, 12.821044921875, 13.240234375, 13.659423828125, 14.07861328125, 14.497802734375, 14.9169921875, 15.336181640625, 15.75537109375, 16.174560546875, 16.59375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 12.0, 32.0, 66.0, 153.0, 204.0, 210.0, 139.0, 96.0, 34.0, 20.0, 10.0, 3.0, 1.0, 5.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.64988708496094, -181.1382293701172, -174.62655639648438, -168.11489868164062, -161.60324096679688, -155.09156799316406, -148.5799102783203, -142.0682373046875, -135.55657958984375, -129.044921875, -122.53324890136719, -116.02159118652344, -109.50992584228516, -102.99826049804688, -96.48660278320312, -89.97493743896484, -83.46327209472656, -76.95160675048828, -70.43994140625, -63.92828369140625, -57.41661834716797, -50.90495300292969, -44.39329147338867, -37.881629943847656, -31.369964599609375, -24.858301162719727, -18.346637725830078, -11.83497428894043, -5.323310852050781, 1.1883544921875, 7.700016021728516, 14.211677551269531, 20.72332763671875, 27.2349910736084, 33.74665451049805, 40.25831604003906, 46.769981384277344, 53.281646728515625, 59.79330825805664, 66.30496978759766, 72.81663513183594, 79.32830047607422, 85.8399658203125, 92.35162353515625, 98.86328887939453, 105.37495422363281, 111.88661193847656, 118.39827728271484, 124.90994262695312, 131.42160034179688, 137.9332733154297, 144.44493103027344, 150.95660400390625, 157.46826171875, 163.97991943359375, 170.4915771484375, 177.0032501220703, 183.51490783691406, 190.02658081054688, 196.53823852539062, 203.04989624023438, 209.5615692138672, 216.07322692871094, 222.58489990234375, 229.0965576171875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 4.0, 23.0, 25.0, 46.0, 56.0, 99.0, 111.0, 111.0, 119.0, 109.0, 88.0, 74.0, 65.0, 32.0, 29.0, 10.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.91571044921875, -124.40957641601562, -118.9034423828125, -113.39730834960938, -107.89118194580078, -102.38504791259766, -96.87891387939453, -91.37278747558594, -85.86665344238281, -80.36051940917969, -74.85438537597656, -69.34825134277344, -63.842124938964844, -58.33599090576172, -52.829856872558594, -47.323726654052734, -41.817588806152344, -36.31145477294922, -30.80532455444336, -25.299190521240234, -19.793058395385742, -14.28692626953125, -8.780792236328125, -3.2746620178222656, 2.2314720153808594, 7.73760461807251, 13.24373722076416, 18.74987030029297, 24.25600242614746, 29.762134552001953, 35.26826858520508, 40.77439880371094, 46.28053283691406, 51.78666687011719, 57.29279708862305, 62.79893112182617, 68.30506134033203, 73.81119537353516, 79.31732940673828, 84.82345581054688, 90.32958984375, 95.83572387695312, 101.34185791015625, 106.84799194335938, 112.35411834716797, 117.8602523803711, 123.36638641357422, 128.8725128173828, 134.378662109375, 139.88479614257812, 145.39093017578125, 150.89706420898438, 156.4031982421875, 161.90933227539062, 167.41546630859375, 172.9215850830078, 178.42771911621094, 183.93385314941406, 189.4399871826172, 194.9461212158203, 200.45225524902344, 205.9583740234375, 211.46450805664062, 216.97064208984375, 222.47677612304688]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 5.0, 4.0, 3.0, 7.0, 8.0, 13.0, 11.0, 13.0, 30.0, 30.0, 49.0, 70.0, 106.0, 146.0, 270.0, 499.0, 959.0, 2380.0, 7296.0, 29643.0, 134500.0, 525074.0, 270205.0, 57476.0, 13158.0, 3655.0, 1348.0, 609.0, 356.0, 220.0, 140.0, 75.0, 52.0, 42.0, 34.0, 28.0, 12.0, 16.0, 6.0, 8.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.9140625, -13.3511962890625, -12.788330078125, -12.2254638671875, -11.66259765625, -11.0997314453125, -10.536865234375, -9.9739990234375, -9.4111328125, -8.8482666015625, -8.285400390625, -7.7225341796875, -7.15966796875, -6.5968017578125, -6.033935546875, -5.4710693359375, -4.908203125, -4.3453369140625, -3.782470703125, -3.2196044921875, -2.65673828125, -2.0938720703125, -1.531005859375, -0.9681396484375, -0.4052734375, 0.1575927734375, 0.720458984375, 1.2833251953125, 1.84619140625, 2.4090576171875, 2.971923828125, 3.5347900390625, 4.09765625, 4.6605224609375, 5.223388671875, 5.7862548828125, 6.34912109375, 6.9119873046875, 7.474853515625, 8.0377197265625, 8.6005859375, 9.1634521484375, 9.726318359375, 10.2891845703125, 10.85205078125, 11.4149169921875, 11.977783203125, 12.5406494140625, 13.103515625, 13.6663818359375, 14.229248046875, 14.7921142578125, 15.35498046875, 15.9178466796875, 16.480712890625, 17.0435791015625, 17.6064453125, 18.1693115234375, 18.732177734375, 19.2950439453125, 19.85791015625, 20.4207763671875, 20.983642578125, 21.5465087890625, 22.109375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 14.0, 15.0, 12.0, 36.0, 27.0, 47.0, 39.0, 65.0, 64.0, 89.0, 71.0, 93.0, 73.0, 65.0, 69.0, 62.0, 46.0, 29.0, 29.0, 25.0, 10.0, 9.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.203125, -10.924072265625, -10.64501953125, -10.365966796875, -10.0869140625, -9.807861328125, -9.52880859375, -9.249755859375, -8.970703125, -8.691650390625, -8.41259765625, -8.133544921875, -7.8544921875, -7.575439453125, -7.29638671875, -7.017333984375, -6.73828125, -6.459228515625, -6.18017578125, -5.901123046875, -5.6220703125, -5.343017578125, -5.06396484375, -4.784912109375, -4.505859375, -4.226806640625, -3.94775390625, -3.668701171875, -3.3896484375, -3.110595703125, -2.83154296875, -2.552490234375, -2.2734375, -1.994384765625, -1.71533203125, -1.436279296875, -1.1572265625, -0.878173828125, -0.59912109375, -0.320068359375, -0.041015625, 0.238037109375, 0.51708984375, 0.796142578125, 1.0751953125, 1.354248046875, 1.63330078125, 1.912353515625, 2.19140625, 2.470458984375, 2.74951171875, 3.028564453125, 3.3076171875, 3.586669921875, 3.86572265625, 4.144775390625, 4.423828125, 4.702880859375, 4.98193359375, 5.260986328125, 5.5400390625, 5.819091796875, 6.09814453125, 6.377197265625, 6.65625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 8.0, 8.0, 14.0, 17.0, 27.0, 48.0, 77.0, 148.0, 249.0, 482.0, 1025.0, 2529.0, 8839.0, 99918.0, 868641.0, 55788.0, 6807.0, 2088.0, 867.0, 400.0, 229.0, 138.0, 68.0, 46.0, 26.0, 21.0, 9.0, 14.0, 9.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.90625, -46.55322265625, -45.2001953125, -43.84716796875, -42.494140625, -41.14111328125, -39.7880859375, -38.43505859375, -37.08203125, -35.72900390625, -34.3759765625, -33.02294921875, -31.669921875, -30.31689453125, -28.9638671875, -27.61083984375, -26.2578125, -24.90478515625, -23.5517578125, -22.19873046875, -20.845703125, -19.49267578125, -18.1396484375, -16.78662109375, -15.43359375, -14.08056640625, -12.7275390625, -11.37451171875, -10.021484375, -8.66845703125, -7.3154296875, -5.96240234375, -4.609375, -3.25634765625, -1.9033203125, -0.55029296875, 0.802734375, 2.15576171875, 3.5087890625, 4.86181640625, 6.21484375, 7.56787109375, 8.9208984375, 10.27392578125, 11.626953125, 12.97998046875, 14.3330078125, 15.68603515625, 17.0390625, 18.39208984375, 19.7451171875, 21.09814453125, 22.451171875, 23.80419921875, 25.1572265625, 26.51025390625, 27.86328125, 29.21630859375, 30.5693359375, 31.92236328125, 33.275390625, 34.62841796875, 35.9814453125, 37.33447265625, 38.6875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 8.0, 9.0, 10.0, 11.0, 19.0, 23.0, 28.0, 30.0, 48.0, 43.0, 49.0, 45.0, 57.0, 53.0, 68.0, 71.0, 68.0, 59.0, 42.0, 46.0, 37.0, 37.0, 28.0, 19.0, 26.0, 14.0, 9.0, 3.0, 4.0, 6.0, 6.0, 2.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-35.59375, -34.560302734375, -33.52685546875, -32.493408203125, -31.4599609375, -30.426513671875, -29.39306640625, -28.359619140625, -27.326171875, -26.292724609375, -25.25927734375, -24.225830078125, -23.1923828125, -22.158935546875, -21.12548828125, -20.092041015625, -19.05859375, -18.025146484375, -16.99169921875, -15.958251953125, -14.9248046875, -13.891357421875, -12.85791015625, -11.824462890625, -10.791015625, -9.757568359375, -8.72412109375, -7.690673828125, -6.6572265625, -5.623779296875, -4.59033203125, -3.556884765625, -2.5234375, -1.489990234375, -0.45654296875, 0.576904296875, 1.6103515625, 2.643798828125, 3.67724609375, 4.710693359375, 5.744140625, 6.777587890625, 7.81103515625, 8.844482421875, 9.8779296875, 10.911376953125, 11.94482421875, 12.978271484375, 14.01171875, 15.045166015625, 16.07861328125, 17.112060546875, 18.1455078125, 19.178955078125, 20.21240234375, 21.245849609375, 22.279296875, 23.312744140625, 24.34619140625, 25.379638671875, 26.4130859375, 27.446533203125, 28.47998046875, 29.513427734375, 30.546875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 3.0, 4.0, 8.0, 13.0, 15.0, 14.0, 27.0, 48.0, 59.0, 81.0, 110.0, 223.0, 400.0, 726.0, 1689.0, 4581.0, 16483.0, 104224.0, 819144.0, 79643.0, 13786.0, 4046.0, 1502.0, 687.0, 416.0, 196.0, 128.0, 88.0, 51.0, 35.0, 38.0, 29.0, 13.0, 4.0, 10.0, 6.0, 2.0, 1.0, 3.0, 1.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.59375, -17.067626953125, -16.54150390625, -16.015380859375, -15.4892578125, -14.963134765625, -14.43701171875, -13.910888671875, -13.384765625, -12.858642578125, -12.33251953125, -11.806396484375, -11.2802734375, -10.754150390625, -10.22802734375, -9.701904296875, -9.17578125, -8.649658203125, -8.12353515625, -7.597412109375, -7.0712890625, -6.545166015625, -6.01904296875, -5.492919921875, -4.966796875, -4.440673828125, -3.91455078125, -3.388427734375, -2.8623046875, -2.336181640625, -1.81005859375, -1.283935546875, -0.7578125, -0.231689453125, 0.29443359375, 0.820556640625, 1.3466796875, 1.872802734375, 2.39892578125, 2.925048828125, 3.451171875, 3.977294921875, 4.50341796875, 5.029541015625, 5.5556640625, 6.081787109375, 6.60791015625, 7.134033203125, 7.66015625, 8.186279296875, 8.71240234375, 9.238525390625, 9.7646484375, 10.290771484375, 10.81689453125, 11.343017578125, 11.869140625, 12.395263671875, 12.92138671875, 13.447509765625, 13.9736328125, 14.499755859375, 15.02587890625, 15.552001953125, 16.078125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 5.0, 3.0, 5.0, 11.0, 10.0, 13.0, 18.0, 20.0, 29.0, 34.0, 32.0, 56.0, 76.0, 118.0, 197.0, 91.0, 58.0, 46.0, 28.0, 32.0, 20.0, 14.0, 9.0, 12.0, 3.0, 4.0, 5.0, 6.0, 7.0, 3.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030059814453125, -0.002906888723373413, -0.002807796001434326, -0.0027087032794952393, -0.0026096105575561523, -0.0025105178356170654, -0.0024114251136779785, -0.0023123323917388916, -0.0022132396697998047, -0.0021141469478607178, -0.002015054225921631, -0.001915961503982544, -0.001816868782043457, -0.0017177760601043701, -0.0016186833381652832, -0.0015195906162261963, -0.0014204978942871094, -0.0013214051723480225, -0.0012223124504089355, -0.0011232197284698486, -0.0010241270065307617, -0.0009250342845916748, -0.0008259415626525879, -0.000726848840713501, -0.0006277561187744141, -0.0005286633968353271, -0.00042957067489624023, -0.0003304779529571533, -0.0002313852310180664, -0.0001322925090789795, -3.319978713989258e-05, 6.589293479919434e-05, 0.00016498565673828125, 0.00026407837867736816, 0.0003631711006164551, 0.000462263822555542, 0.0005613565444946289, 0.0006604492664337158, 0.0007595419883728027, 0.0008586347103118896, 0.0009577274322509766, 0.0010568201541900635, 0.0011559128761291504, 0.0012550055980682373, 0.0013540983200073242, 0.0014531910419464111, 0.001552283763885498, 0.001651376485824585, 0.0017504692077636719, 0.0018495619297027588, 0.0019486546516418457, 0.0020477473735809326, 0.0021468400955200195, 0.0022459328174591064, 0.0023450255393981934, 0.0024441182613372803, 0.002543210983276367, 0.002642303705215454, 0.002741396427154541, 0.002840489149093628, 0.002939581871032715, 0.0030386745929718018, 0.0031377673149108887, 0.0032368600368499756, 0.0033359527587890625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 6.0, 8.0, 14.0, 20.0, 27.0, 35.0, 57.0, 70.0, 101.0, 162.0, 346.0, 559.0, 1205.0, 3334.0, 11407.0, 66124.0, 878067.0, 69215.0, 11759.0, 3389.0, 1257.0, 563.0, 329.0, 181.0, 109.0, 79.0, 36.0, 22.0, 19.0, 23.0, 9.0, 6.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-28.9375, -28.205078125, -27.47265625, -26.740234375, -26.0078125, -25.275390625, -24.54296875, -23.810546875, -23.078125, -22.345703125, -21.61328125, -20.880859375, -20.1484375, -19.416015625, -18.68359375, -17.951171875, -17.21875, -16.486328125, -15.75390625, -15.021484375, -14.2890625, -13.556640625, -12.82421875, -12.091796875, -11.359375, -10.626953125, -9.89453125, -9.162109375, -8.4296875, -7.697265625, -6.96484375, -6.232421875, -5.5, -4.767578125, -4.03515625, -3.302734375, -2.5703125, -1.837890625, -1.10546875, -0.373046875, 0.359375, 1.091796875, 1.82421875, 2.556640625, 3.2890625, 4.021484375, 4.75390625, 5.486328125, 6.21875, 6.951171875, 7.68359375, 8.416015625, 9.1484375, 9.880859375, 10.61328125, 11.345703125, 12.078125, 12.810546875, 13.54296875, 14.275390625, 15.0078125, 15.740234375, 16.47265625, 17.205078125, 17.9375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 10.0, 10.0, 11.0, 12.0, 17.0, 13.0, 25.0, 45.0, 63.0, 84.0, 149.0, 158.0, 137.0, 64.0, 53.0, 35.0, 26.0, 17.0, 13.0, 6.0, 6.0, 4.0, 10.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.515625, -16.020263671875, -15.52490234375, -15.029541015625, -14.5341796875, -14.038818359375, -13.54345703125, -13.048095703125, -12.552734375, -12.057373046875, -11.56201171875, -11.066650390625, -10.5712890625, -10.075927734375, -9.58056640625, -9.085205078125, -8.58984375, -8.094482421875, -7.59912109375, -7.103759765625, -6.6083984375, -6.113037109375, -5.61767578125, -5.122314453125, -4.626953125, -4.131591796875, -3.63623046875, -3.140869140625, -2.6455078125, -2.150146484375, -1.65478515625, -1.159423828125, -0.6640625, -0.168701171875, 0.32666015625, 0.822021484375, 1.3173828125, 1.812744140625, 2.30810546875, 2.803466796875, 3.298828125, 3.794189453125, 4.28955078125, 4.784912109375, 5.2802734375, 5.775634765625, 6.27099609375, 6.766357421875, 7.26171875, 7.757080078125, 8.25244140625, 8.747802734375, 9.2431640625, 9.738525390625, 10.23388671875, 10.729248046875, 11.224609375, 11.719970703125, 12.21533203125, 12.710693359375, 13.2060546875, 13.701416015625, 14.19677734375, 14.692138671875, 15.1875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 18.0, 37.0, 82.0, 204.0, 311.0, 192.0, 80.0, 30.0, 17.0, 9.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.33547973632812, -226.72068786621094, -217.10589599609375, -207.49110412597656, -197.87631225585938, -188.26153564453125, -178.64674377441406, -169.03195190429688, -159.4171600341797, -149.8023681640625, -140.1875762939453, -130.57278442382812, -120.95800018310547, -111.34320831298828, -101.72842407226562, -92.11363220214844, -82.49884033203125, -72.88404846191406, -63.26926040649414, -53.65447235107422, -44.03968048095703, -34.424888610839844, -24.810100555419922, -15.1953125, -5.5805206298828125, 4.034269332885742, 13.649059295654297, 23.26384925842285, 32.878639221191406, 42.493431091308594, 52.108219146728516, 61.72300720214844, 71.33782958984375, 80.95262145996094, 90.56741333007812, 100.18219757080078, 109.79698944091797, 119.41178131103516, 129.0265655517578, 138.641357421875, 148.2561492919922, 157.87094116210938, 167.48573303222656, 177.10052490234375, 186.71530151367188, 196.33010864257812, 205.94488525390625, 215.55967712402344, 225.17446899414062, 234.7892608642578, 244.404052734375, 254.0188446044922, 263.6336364746094, 273.2484130859375, 282.86322021484375, 292.4779968261719, 302.0927734375, 311.7075500488281, 321.3223571777344, 330.9371337890625, 340.55194091796875, 350.1667175292969, 359.7815246582031, 369.39630126953125, 379.0111083984375]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 9.0, 3.0, 9.0, 16.0, 9.0, 10.0, 13.0, 15.0, 17.0, 16.0, 15.0, 31.0, 15.0, 34.0, 22.0, 26.0, 36.0, 34.0, 43.0, 48.0, 52.0, 66.0, 54.0, 52.0, 38.0, 29.0, 31.0, 40.0, 19.0, 31.0, 21.0, 20.0, 17.0, 16.0, 22.0, 14.0, 9.0, 10.0, 8.0, 7.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-94.78917694091797, -91.79435729980469, -88.7995376586914, -85.80471801757812, -82.80989074707031, -79.81507110595703, -76.82025146484375, -73.82543182373047, -70.83061218261719, -67.8357925415039, -64.84097290039062, -61.84614944458008, -58.8513298034668, -55.856510162353516, -52.86168670654297, -49.86686706542969, -46.872047424316406, -43.877227783203125, -40.882408142089844, -37.8875846862793, -34.892765045166016, -31.897945404052734, -28.90312385559082, -25.908302307128906, -22.913482666015625, -19.918663024902344, -16.92384147644043, -13.929020881652832, -10.934200286865234, -7.939379692077637, -4.944559097290039, -1.949737548828125, 1.0450897216796875, 4.039910316467285, 7.034730911254883, 10.02955150604248, 13.024372100830078, 16.01919174194336, 19.014013290405273, 22.008834838867188, 25.00365447998047, 27.99847412109375, 30.993295669555664, 33.98811721801758, 36.98293685913086, 39.97775650024414, 42.97257995605469, 45.96739959716797, 48.96221923828125, 51.95703887939453, 54.95185852050781, 57.94668197631836, 60.94150161743164, 63.93632125854492, 66.93114471435547, 69.92596435546875, 72.92078399658203, 75.91560363769531, 78.9104232788086, 81.90524291992188, 84.90007019042969, 87.89488983154297, 90.88970947265625, 93.88452911376953, 96.87934875488281]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 5.0, 0.0, 2.0, 3.0, 3.0, 8.0, 7.0, 2.0, 8.0, 18.0, 24.0, 39.0, 43.0, 68.0, 79.0, 137.0, 235.0, 462.0, 1070.0, 3230.0, 22021.0, 1274756.0, 2847376.0, 37428.0, 4860.0, 1349.0, 536.0, 205.0, 124.0, 65.0, 45.0, 28.0, 20.0, 12.0, 10.0, 3.0, 9.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.578125, -30.79052734375, -30.0029296875, -29.21533203125, -28.427734375, -27.64013671875, -26.8525390625, -26.06494140625, -25.27734375, -24.48974609375, -23.7021484375, -22.91455078125, -22.126953125, -21.33935546875, -20.5517578125, -19.76416015625, -18.9765625, -18.18896484375, -17.4013671875, -16.61376953125, -15.826171875, -15.03857421875, -14.2509765625, -13.46337890625, -12.67578125, -11.88818359375, -11.1005859375, -10.31298828125, -9.525390625, -8.73779296875, -7.9501953125, -7.16259765625, -6.375, -5.58740234375, -4.7998046875, -4.01220703125, -3.224609375, -2.43701171875, -1.6494140625, -0.86181640625, -0.07421875, 0.71337890625, 1.5009765625, 2.28857421875, 3.076171875, 3.86376953125, 4.6513671875, 5.43896484375, 6.2265625, 7.01416015625, 7.8017578125, 8.58935546875, 9.376953125, 10.16455078125, 10.9521484375, 11.73974609375, 12.52734375, 13.31494140625, 14.1025390625, 14.89013671875, 15.677734375, 16.46533203125, 17.2529296875, 18.04052734375, 18.828125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 7.0, 5.0, 13.0, 12.0, 34.0, 33.0, 54.0, 76.0, 88.0, 100.0, 107.0, 106.0, 93.0, 92.0, 48.0, 46.0, 30.0, 27.0, 20.0, 13.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.140625, -12.78369140625, -12.4267578125, -12.06982421875, -11.712890625, -11.35595703125, -10.9990234375, -10.64208984375, -10.28515625, -9.92822265625, -9.5712890625, -9.21435546875, -8.857421875, -8.50048828125, -8.1435546875, -7.78662109375, -7.4296875, -7.07275390625, -6.7158203125, -6.35888671875, -6.001953125, -5.64501953125, -5.2880859375, -4.93115234375, -4.57421875, -4.21728515625, -3.8603515625, -3.50341796875, -3.146484375, -2.78955078125, -2.4326171875, -2.07568359375, -1.71875, -1.36181640625, -1.0048828125, -0.64794921875, -0.291015625, 0.06591796875, 0.4228515625, 0.77978515625, 1.13671875, 1.49365234375, 1.8505859375, 2.20751953125, 2.564453125, 2.92138671875, 3.2783203125, 3.63525390625, 3.9921875, 4.34912109375, 4.7060546875, 5.06298828125, 5.419921875, 5.77685546875, 6.1337890625, 6.49072265625, 6.84765625, 7.20458984375, 7.5615234375, 7.91845703125, 8.275390625, 8.63232421875, 8.9892578125, 9.34619140625, 9.703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 10.0, 6.0, 17.0, 19.0, 39.0, 81.0, 136.0, 301.0, 824.0, 3884.0, 331397.0, 3842517.0, 12757.0, 1323.0, 436.0, 205.0, 123.0, 77.0, 56.0, 38.0, 19.0, 10.0, 7.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.1875, -34.62744140625, -33.0673828125, -31.50732421875, -29.947265625, -28.38720703125, -26.8271484375, -25.26708984375, -23.70703125, -22.14697265625, -20.5869140625, -19.02685546875, -17.466796875, -15.90673828125, -14.3466796875, -12.78662109375, -11.2265625, -9.66650390625, -8.1064453125, -6.54638671875, -4.986328125, -3.42626953125, -1.8662109375, -0.30615234375, 1.25390625, 2.81396484375, 4.3740234375, 5.93408203125, 7.494140625, 9.05419921875, 10.6142578125, 12.17431640625, 13.734375, 15.29443359375, 16.8544921875, 18.41455078125, 19.974609375, 21.53466796875, 23.0947265625, 24.65478515625, 26.21484375, 27.77490234375, 29.3349609375, 30.89501953125, 32.455078125, 34.01513671875, 35.5751953125, 37.13525390625, 38.6953125, 40.25537109375, 41.8154296875, 43.37548828125, 44.935546875, 46.49560546875, 48.0556640625, 49.61572265625, 51.17578125, 52.73583984375, 54.2958984375, 55.85595703125, 57.416015625, 58.97607421875, 60.5361328125, 62.09619140625, 63.65625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 7.0, 5.0, 17.0, 20.0, 45.0, 112.0, 332.0, 949.0, 1441.0, 709.0, 266.0, 107.0, 37.0, 19.0, 15.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.796875, -17.714111328125, -16.63134765625, -15.548583984375, -14.4658203125, -13.383056640625, -12.30029296875, -11.217529296875, -10.134765625, -9.052001953125, -7.96923828125, -6.886474609375, -5.8037109375, -4.720947265625, -3.63818359375, -2.555419921875, -1.47265625, -0.389892578125, 0.69287109375, 1.775634765625, 2.8583984375, 3.941162109375, 5.02392578125, 6.106689453125, 7.189453125, 8.272216796875, 9.35498046875, 10.437744140625, 11.5205078125, 12.603271484375, 13.68603515625, 14.768798828125, 15.8515625, 16.934326171875, 18.01708984375, 19.099853515625, 20.1826171875, 21.265380859375, 22.34814453125, 23.430908203125, 24.513671875, 25.596435546875, 26.67919921875, 27.761962890625, 28.8447265625, 29.927490234375, 31.01025390625, 32.093017578125, 33.17578125, 34.258544921875, 35.34130859375, 36.424072265625, 37.5068359375, 38.589599609375, 39.67236328125, 40.755126953125, 41.837890625, 42.920654296875, 44.00341796875, 45.086181640625, 46.1689453125, 47.251708984375, 48.33447265625, 49.417236328125, 50.5]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 37.0, 126.0, 301.0, 318.0, 122.0, 45.0, 23.0, 9.0, 5.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-426.604248046875, -415.3379211425781, -404.07159423828125, -392.8052978515625, -381.5389709472656, -370.27264404296875, -359.0063171386719, -347.739990234375, -336.47369384765625, -325.2073669433594, -313.9410400390625, -302.67474365234375, -291.4084167480469, -280.14208984375, -268.8757629394531, -257.60943603515625, -246.34312438964844, -235.07679748535156, -223.81048583984375, -212.54415893554688, -201.27784729003906, -190.0115203857422, -178.74520874023438, -167.4788818359375, -156.21255493164062, -144.94622802734375, -133.67991638183594, -122.41358947753906, -111.14727783203125, -99.88095092773438, -88.61463165283203, -77.34831237792969, -66.08200073242188, -54.81568145751953, -43.54936218261719, -32.28303909301758, -21.016719818115234, -9.75040054321289, 1.5159225463867188, 12.782241821289062, 24.048561096191406, 35.31488037109375, 46.581199645996094, 57.8475227355957, 69.11384582519531, 80.38015747070312, 91.646484375, 102.91280364990234, 114.17912292480469, 125.44544219970703, 136.71176147460938, 147.97808837890625, 159.24440002441406, 170.51072692871094, 181.77703857421875, 193.04336547851562, 204.3096923828125, 215.57601928710938, 226.8423309326172, 238.10865783691406, 249.37496948242188, 260.64129638671875, 271.9076232910156, 283.1739501953125, 294.44024658203125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 10.0, 12.0, 11.0, 12.0, 11.0, 28.0, 25.0, 38.0, 34.0, 52.0, 69.0, 49.0, 60.0, 79.0, 47.0, 62.0, 72.0, 65.0, 55.0, 49.0, 43.0, 30.0, 30.0, 12.0, 11.0, 13.0, 10.0, 5.0, 3.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.90958404541016, -68.54634857177734, -65.18312072753906, -61.81988525390625, -58.4566535949707, -55.093421936035156, -51.730186462402344, -48.3669548034668, -45.00372314453125, -41.6404914855957, -38.277259826660156, -34.914024353027344, -31.550792694091797, -28.18756103515625, -24.82432746887207, -21.46109390258789, -18.097862243652344, -14.73462963104248, -11.371397018432617, -8.008164405822754, -4.644931793212891, -1.2817001342773438, 2.081533432006836, 5.444766998291016, 8.807998657226562, 12.171231269836426, 15.534463882446289, 18.89769744873047, 22.260929107666016, 25.624160766601562, 28.987394332885742, 32.35062789916992, 35.7138671875, 39.07709884643555, 42.440330505371094, 45.803565979003906, 49.16679763793945, 52.530029296875, 55.89326477050781, 59.25649642944336, 62.619728088378906, 65.98296356201172, 69.34619140625, 72.70942687988281, 76.07266235351562, 79.4358901977539, 82.79912567138672, 86.162353515625, 89.52558898925781, 92.88882446289062, 96.2520523071289, 99.61528778076172, 102.978515625, 106.34175109863281, 109.70498657226562, 113.06822204589844, 116.43144989013672, 119.79468536376953, 123.15791320800781, 126.52114868164062, 129.88438415527344, 133.24761962890625, 136.61083984375, 139.9740753173828, 143.33731079101562]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 12.0, 14.0, 17.0, 24.0, 41.0, 57.0, 94.0, 156.0, 285.0, 555.0, 1358.0, 4615.0, 23578.0, 215561.0, 701864.0, 83843.0, 11688.0, 2727.0, 980.0, 427.0, 248.0, 134.0, 83.0, 64.0, 32.0, 30.0, 13.0, 10.0, 7.0, 9.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.671875, -26.7587890625, -25.845703125, -24.9326171875, -24.01953125, -23.1064453125, -22.193359375, -21.2802734375, -20.3671875, -19.4541015625, -18.541015625, -17.6279296875, -16.71484375, -15.8017578125, -14.888671875, -13.9755859375, -13.0625, -12.1494140625, -11.236328125, -10.3232421875, -9.41015625, -8.4970703125, -7.583984375, -6.6708984375, -5.7578125, -4.8447265625, -3.931640625, -3.0185546875, -2.10546875, -1.1923828125, -0.279296875, 0.6337890625, 1.546875, 2.4599609375, 3.373046875, 4.2861328125, 5.19921875, 6.1123046875, 7.025390625, 7.9384765625, 8.8515625, 9.7646484375, 10.677734375, 11.5908203125, 12.50390625, 13.4169921875, 14.330078125, 15.2431640625, 16.15625, 17.0693359375, 17.982421875, 18.8955078125, 19.80859375, 20.7216796875, 21.634765625, 22.5478515625, 23.4609375, 24.3740234375, 25.287109375, 26.2001953125, 27.11328125, 28.0263671875, 28.939453125, 29.8525390625, 30.765625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 3.0, 6.0, 8.0, 11.0, 20.0, 20.0, 18.0, 46.0, 47.0, 52.0, 63.0, 72.0, 66.0, 93.0, 62.0, 77.0, 71.0, 51.0, 57.0, 35.0, 30.0, 33.0, 17.0, 13.0, 8.0, 11.0, 6.0, 4.0, 3.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9453125, -6.65576171875, -6.3662109375, -6.07666015625, -5.787109375, -5.49755859375, -5.2080078125, -4.91845703125, -4.62890625, -4.33935546875, -4.0498046875, -3.76025390625, -3.470703125, -3.18115234375, -2.8916015625, -2.60205078125, -2.3125, -2.02294921875, -1.7333984375, -1.44384765625, -1.154296875, -0.86474609375, -0.5751953125, -0.28564453125, 0.00390625, 0.29345703125, 0.5830078125, 0.87255859375, 1.162109375, 1.45166015625, 1.7412109375, 2.03076171875, 2.3203125, 2.60986328125, 2.8994140625, 3.18896484375, 3.478515625, 3.76806640625, 4.0576171875, 4.34716796875, 4.63671875, 4.92626953125, 5.2158203125, 5.50537109375, 5.794921875, 6.08447265625, 6.3740234375, 6.66357421875, 6.953125, 7.24267578125, 7.5322265625, 7.82177734375, 8.111328125, 8.40087890625, 8.6904296875, 8.97998046875, 9.26953125, 9.55908203125, 9.8486328125, 10.13818359375, 10.427734375, 10.71728515625, 11.0068359375, 11.29638671875, 11.5859375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 3.0, 3.0, 8.0, 6.0, 12.0, 19.0, 26.0, 32.0, 76.0, 109.0, 162.0, 309.0, 682.0, 1645.0, 5477.0, 34524.0, 831680.0, 156626.0, 12129.0, 2879.0, 1090.0, 428.0, 250.0, 148.0, 90.0, 43.0, 36.0, 23.0, 14.0, 14.0, 3.0, 3.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.78125, -49.23095703125, -47.6806640625, -46.13037109375, -44.580078125, -43.02978515625, -41.4794921875, -39.92919921875, -38.37890625, -36.82861328125, -35.2783203125, -33.72802734375, -32.177734375, -30.62744140625, -29.0771484375, -27.52685546875, -25.9765625, -24.42626953125, -22.8759765625, -21.32568359375, -19.775390625, -18.22509765625, -16.6748046875, -15.12451171875, -13.57421875, -12.02392578125, -10.4736328125, -8.92333984375, -7.373046875, -5.82275390625, -4.2724609375, -2.72216796875, -1.171875, 0.37841796875, 1.9287109375, 3.47900390625, 5.029296875, 6.57958984375, 8.1298828125, 9.68017578125, 11.23046875, 12.78076171875, 14.3310546875, 15.88134765625, 17.431640625, 18.98193359375, 20.5322265625, 22.08251953125, 23.6328125, 25.18310546875, 26.7333984375, 28.28369140625, 29.833984375, 31.38427734375, 32.9345703125, 34.48486328125, 36.03515625, 37.58544921875, 39.1357421875, 40.68603515625, 42.236328125, 43.78662109375, 45.3369140625, 46.88720703125, 48.4375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 8.0, 14.0, 15.0, 12.0, 14.0, 36.0, 52.0, 49.0, 51.0, 60.0, 60.0, 74.0, 88.0, 72.0, 75.0, 51.0, 61.0, 38.0, 43.0, 26.0, 25.0, 25.0, 17.0, 13.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-48.59375, -47.30908203125, -46.0244140625, -44.73974609375, -43.455078125, -42.17041015625, -40.8857421875, -39.60107421875, -38.31640625, -37.03173828125, -35.7470703125, -34.46240234375, -33.177734375, -31.89306640625, -30.6083984375, -29.32373046875, -28.0390625, -26.75439453125, -25.4697265625, -24.18505859375, -22.900390625, -21.61572265625, -20.3310546875, -19.04638671875, -17.76171875, -16.47705078125, -15.1923828125, -13.90771484375, -12.623046875, -11.33837890625, -10.0537109375, -8.76904296875, -7.484375, -6.19970703125, -4.9150390625, -3.63037109375, -2.345703125, -1.06103515625, 0.2236328125, 1.50830078125, 2.79296875, 4.07763671875, 5.3623046875, 6.64697265625, 7.931640625, 9.21630859375, 10.5009765625, 11.78564453125, 13.0703125, 14.35498046875, 15.6396484375, 16.92431640625, 18.208984375, 19.49365234375, 20.7783203125, 22.06298828125, 23.34765625, 24.63232421875, 25.9169921875, 27.20166015625, 28.486328125, 29.77099609375, 31.0556640625, 32.34033203125, 33.625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 3.0, 9.0, 7.0, 8.0, 14.0, 26.0, 28.0, 44.0, 67.0, 131.0, 200.0, 404.0, 1008.0, 2713.0, 10626.0, 55241.0, 840549.0, 113169.0, 17600.0, 4131.0, 1343.0, 564.0, 253.0, 156.0, 106.0, 47.0, 25.0, 18.0, 16.0, 20.0, 6.0, 7.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.515625, -21.88427734375, -21.2529296875, -20.62158203125, -19.990234375, -19.35888671875, -18.7275390625, -18.09619140625, -17.46484375, -16.83349609375, -16.2021484375, -15.57080078125, -14.939453125, -14.30810546875, -13.6767578125, -13.04541015625, -12.4140625, -11.78271484375, -11.1513671875, -10.52001953125, -9.888671875, -9.25732421875, -8.6259765625, -7.99462890625, -7.36328125, -6.73193359375, -6.1005859375, -5.46923828125, -4.837890625, -4.20654296875, -3.5751953125, -2.94384765625, -2.3125, -1.68115234375, -1.0498046875, -0.41845703125, 0.212890625, 0.84423828125, 1.4755859375, 2.10693359375, 2.73828125, 3.36962890625, 4.0009765625, 4.63232421875, 5.263671875, 5.89501953125, 6.5263671875, 7.15771484375, 7.7890625, 8.42041015625, 9.0517578125, 9.68310546875, 10.314453125, 10.94580078125, 11.5771484375, 12.20849609375, 12.83984375, 13.47119140625, 14.1025390625, 14.73388671875, 15.365234375, 15.99658203125, 16.6279296875, 17.25927734375, 17.890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 6.0, 6.0, 8.0, 7.0, 12.0, 18.0, 26.0, 38.0, 46.0, 137.0, 244.0, 183.0, 80.0, 43.0, 33.0, 20.0, 12.0, 16.0, 9.0, 9.0, 10.0, 6.0, 3.0, 8.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004852294921875, -0.004694581031799316, -0.004536867141723633, -0.004379153251647949, -0.004221439361572266, -0.004063725471496582, -0.0039060115814208984, -0.003748297691345215, -0.0035905838012695312, -0.0034328699111938477, -0.003275156021118164, -0.0031174421310424805, -0.002959728240966797, -0.0028020143508911133, -0.0026443004608154297, -0.002486586570739746, -0.0023288726806640625, -0.002171158790588379, -0.0020134449005126953, -0.0018557310104370117, -0.0016980171203613281, -0.0015403032302856445, -0.001382589340209961, -0.0012248754501342773, -0.0010671615600585938, -0.0009094476699829102, -0.0007517337799072266, -0.000594019889831543, -0.0004363059997558594, -0.0002785921096801758, -0.00012087821960449219, 3.6835670471191406e-05, 0.000194549560546875, 0.0003522634506225586, 0.0005099773406982422, 0.0006676912307739258, 0.0008254051208496094, 0.000983119010925293, 0.0011408329010009766, 0.0012985467910766602, 0.0014562606811523438, 0.0016139745712280273, 0.001771688461303711, 0.0019294023513793945, 0.002087116241455078, 0.0022448301315307617, 0.0024025440216064453, 0.002560257911682129, 0.0027179718017578125, 0.002875685691833496, 0.0030333995819091797, 0.0031911134719848633, 0.003348827362060547, 0.0035065412521362305, 0.003664255142211914, 0.0038219690322875977, 0.003979682922363281, 0.004137396812438965, 0.0042951107025146484, 0.004452824592590332, 0.004610538482666016, 0.004768252372741699, 0.004925966262817383, 0.005083680152893066, 0.00524139404296875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 8.0, 6.0, 4.0, 4.0, 11.0, 7.0, 14.0, 16.0, 32.0, 41.0, 63.0, 102.0, 147.0, 258.0, 440.0, 799.0, 1624.0, 4139.0, 12372.0, 44256.0, 653687.0, 280087.0, 33911.0, 10057.0, 3404.0, 1385.0, 681.0, 372.0, 194.0, 145.0, 98.0, 62.0, 37.0, 25.0, 15.0, 22.0, 7.0, 3.0, 7.0, 7.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6328125, -12.1043701171875, -11.575927734375, -11.0474853515625, -10.51904296875, -9.9906005859375, -9.462158203125, -8.9337158203125, -8.4052734375, -7.8768310546875, -7.348388671875, -6.8199462890625, -6.29150390625, -5.7630615234375, -5.234619140625, -4.7061767578125, -4.177734375, -3.6492919921875, -3.120849609375, -2.5924072265625, -2.06396484375, -1.5355224609375, -1.007080078125, -0.4786376953125, 0.0498046875, 0.5782470703125, 1.106689453125, 1.6351318359375, 2.16357421875, 2.6920166015625, 3.220458984375, 3.7489013671875, 4.27734375, 4.8057861328125, 5.334228515625, 5.8626708984375, 6.39111328125, 6.9195556640625, 7.447998046875, 7.9764404296875, 8.5048828125, 9.0333251953125, 9.561767578125, 10.0902099609375, 10.61865234375, 11.1470947265625, 11.675537109375, 12.2039794921875, 12.732421875, 13.2608642578125, 13.789306640625, 14.3177490234375, 14.84619140625, 15.3746337890625, 15.903076171875, 16.4315185546875, 16.9599609375, 17.4884033203125, 18.016845703125, 18.5452880859375, 19.07373046875, 19.6021728515625, 20.130615234375, 20.6590576171875, 21.1875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 1.0, 4.0, 10.0, 5.0, 8.0, 12.0, 11.0, 10.0, 17.0, 18.0, 18.0, 28.0, 38.0, 60.0, 81.0, 117.0, 142.0, 124.0, 82.0, 51.0, 42.0, 29.0, 16.0, 17.0, 11.0, 3.0, 7.0, 7.0, 5.0, 4.0, 3.0, 5.0, 1.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-14.4375, -14.0418701171875, -13.646240234375, -13.2506103515625, -12.85498046875, -12.4593505859375, -12.063720703125, -11.6680908203125, -11.2724609375, -10.8768310546875, -10.481201171875, -10.0855712890625, -9.68994140625, -9.2943115234375, -8.898681640625, -8.5030517578125, -8.107421875, -7.7117919921875, -7.316162109375, -6.9205322265625, -6.52490234375, -6.1292724609375, -5.733642578125, -5.3380126953125, -4.9423828125, -4.5467529296875, -4.151123046875, -3.7554931640625, -3.35986328125, -2.9642333984375, -2.568603515625, -2.1729736328125, -1.77734375, -1.3817138671875, -0.986083984375, -0.5904541015625, -0.19482421875, 0.2008056640625, 0.596435546875, 0.9920654296875, 1.3876953125, 1.7833251953125, 2.178955078125, 2.5745849609375, 2.97021484375, 3.3658447265625, 3.761474609375, 4.1571044921875, 4.552734375, 4.9483642578125, 5.343994140625, 5.7396240234375, 6.13525390625, 6.5308837890625, 6.926513671875, 7.3221435546875, 7.7177734375, 8.1134033203125, 8.509033203125, 8.9046630859375, 9.30029296875, 9.6959228515625, 10.091552734375, 10.4871826171875, 10.8828125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 8.0, 21.0, 56.0, 188.0, 428.0, 191.0, 56.0, 17.0, 11.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-454.3094482421875, -441.15740966796875, -428.00537109375, -414.85333251953125, -401.7012939453125, -388.54925537109375, -375.397216796875, -362.24517822265625, -349.0931396484375, -335.94110107421875, -322.7890625, -309.63702392578125, -296.4849853515625, -283.33294677734375, -270.180908203125, -257.02886962890625, -243.87680053710938, -230.72476196289062, -217.57272338867188, -204.42068481445312, -191.26864624023438, -178.11660766601562, -164.9645538330078, -151.81251525878906, -138.6604766845703, -125.50843811035156, -112.35639953613281, -99.20435333251953, -86.05231475830078, -72.90027618408203, -59.74822998046875, -46.59619140625, -33.44415283203125, -20.292112350463867, -7.140071868896484, 6.011970520019531, 19.16400909423828, 32.31604766845703, 45.46809387207031, 58.62013244628906, 71.77217102050781, 84.92420959472656, 98.07624816894531, 111.2282943725586, 124.38033294677734, 137.53237915039062, 150.68441772460938, 163.83645629882812, 176.98849487304688, 190.14053344726562, 203.29257202148438, 216.44461059570312, 229.59664916992188, 242.74868774414062, 255.90074157714844, 269.05279541015625, 282.204833984375, 295.35687255859375, 308.5089111328125, 321.66094970703125, 334.81298828125, 347.96502685546875, 361.1170654296875, 374.26910400390625, 387.421142578125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 6.0, 6.0, 3.0, 10.0, 9.0, 16.0, 18.0, 15.0, 22.0, 27.0, 35.0, 24.0, 42.0, 43.0, 53.0, 63.0, 87.0, 73.0, 70.0, 62.0, 42.0, 45.0, 37.0, 33.0, 30.0, 18.0, 29.0, 15.0, 11.0, 11.0, 19.0, 10.0, 3.0, 5.0, 1.0, 5.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.85374450683594, -149.58627319335938, -145.31878662109375, -141.0513153076172, -136.78384399414062, -132.51637268066406, -128.2489013671875, -123.98141479492188, -119.71394348144531, -115.44647216796875, -111.17899322509766, -106.91151428222656, -102.64404296875, -98.37657165527344, -94.10909271240234, -89.84161376953125, -85.57414245605469, -81.30667114257812, -77.03919219970703, -72.77171325683594, -68.50424194335938, -64.23677062988281, -59.96929168701172, -55.70181655883789, -51.43434143066406, -47.166866302490234, -42.899391174316406, -38.63191604614258, -34.36444091796875, -30.096965789794922, -25.829490661621094, -21.562015533447266, -17.29454803466797, -13.02707290649414, -8.759597778320312, -4.492122650146484, -0.22464752197265625, 4.042827606201172, 8.310302734375, 12.577777862548828, 16.845252990722656, 21.112728118896484, 25.380203247070312, 29.64767837524414, 33.91515350341797, 38.1826286315918, 42.450103759765625, 46.71757888793945, 50.98505401611328, 55.25252914428711, 59.52000427246094, 63.787479400634766, 68.0549545288086, 72.32243347167969, 76.58990478515625, 80.85737609863281, 85.1248550415039, 89.392333984375, 93.65980529785156, 97.92727661132812, 102.19475555419922, 106.46223449707031, 110.72970581054688, 114.99717712402344, 119.26465606689453]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 11.0, 11.0, 15.0, 13.0, 28.0, 32.0, 60.0, 78.0, 123.0, 212.0, 384.0, 830.0, 1973.0, 6722.0, 49776.0, 3128045.0, 974278.0, 24343.0, 4528.0, 1528.0, 596.0, 293.0, 161.0, 70.0, 59.0, 30.0, 20.0, 17.0, 13.0, 8.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.546875, -20.74462890625, -19.9423828125, -19.14013671875, -18.337890625, -17.53564453125, -16.7333984375, -15.93115234375, -15.12890625, -14.32666015625, -13.5244140625, -12.72216796875, -11.919921875, -11.11767578125, -10.3154296875, -9.51318359375, -8.7109375, -7.90869140625, -7.1064453125, -6.30419921875, -5.501953125, -4.69970703125, -3.8974609375, -3.09521484375, -2.29296875, -1.49072265625, -0.6884765625, 0.11376953125, 0.916015625, 1.71826171875, 2.5205078125, 3.32275390625, 4.125, 4.92724609375, 5.7294921875, 6.53173828125, 7.333984375, 8.13623046875, 8.9384765625, 9.74072265625, 10.54296875, 11.34521484375, 12.1474609375, 12.94970703125, 13.751953125, 14.55419921875, 15.3564453125, 16.15869140625, 16.9609375, 17.76318359375, 18.5654296875, 19.36767578125, 20.169921875, 20.97216796875, 21.7744140625, 22.57666015625, 23.37890625, 24.18115234375, 24.9833984375, 25.78564453125, 26.587890625, 27.39013671875, 28.1923828125, 28.99462890625, 29.796875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 8.0, 8.0, 13.0, 17.0, 19.0, 39.0, 46.0, 59.0, 73.0, 67.0, 89.0, 84.0, 87.0, 88.0, 70.0, 58.0, 46.0, 45.0, 34.0, 15.0, 10.0, 15.0, 6.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7109375, -10.36181640625, -10.0126953125, -9.66357421875, -9.314453125, -8.96533203125, -8.6162109375, -8.26708984375, -7.91796875, -7.56884765625, -7.2197265625, -6.87060546875, -6.521484375, -6.17236328125, -5.8232421875, -5.47412109375, -5.125, -4.77587890625, -4.4267578125, -4.07763671875, -3.728515625, -3.37939453125, -3.0302734375, -2.68115234375, -2.33203125, -1.98291015625, -1.6337890625, -1.28466796875, -0.935546875, -0.58642578125, -0.2373046875, 0.11181640625, 0.4609375, 0.81005859375, 1.1591796875, 1.50830078125, 1.857421875, 2.20654296875, 2.5556640625, 2.90478515625, 3.25390625, 3.60302734375, 3.9521484375, 4.30126953125, 4.650390625, 4.99951171875, 5.3486328125, 5.69775390625, 6.046875, 6.39599609375, 6.7451171875, 7.09423828125, 7.443359375, 7.79248046875, 8.1416015625, 8.49072265625, 8.83984375, 9.18896484375, 9.5380859375, 9.88720703125, 10.236328125, 10.58544921875, 10.9345703125, 11.28369140625, 11.6328125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 11.0, 15.0, 32.0, 55.0, 95.0, 147.0, 300.0, 1337.0, 4086133.0, 105079.0, 728.0, 178.0, 78.0, 40.0, 23.0, 14.0, 9.0, 8.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-216.625, -210.75390625, -204.8828125, -199.01171875, -193.140625, -187.26953125, -181.3984375, -175.52734375, -169.65625, -163.78515625, -157.9140625, -152.04296875, -146.171875, -140.30078125, -134.4296875, -128.55859375, -122.6875, -116.81640625, -110.9453125, -105.07421875, -99.203125, -93.33203125, -87.4609375, -81.58984375, -75.71875, -69.84765625, -63.9765625, -58.10546875, -52.234375, -46.36328125, -40.4921875, -34.62109375, -28.75, -22.87890625, -17.0078125, -11.13671875, -5.265625, 0.60546875, 6.4765625, 12.34765625, 18.21875, 24.08984375, 29.9609375, 35.83203125, 41.703125, 47.57421875, 53.4453125, 59.31640625, 65.1875, 71.05859375, 76.9296875, 82.80078125, 88.671875, 94.54296875, 100.4140625, 106.28515625, 112.15625, 118.02734375, 123.8984375, 129.76953125, 135.640625, 141.51171875, 147.3828125, 153.25390625, 159.125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 29.0, 133.0, 1262.0, 2331.0, 254.0, 50.0, 10.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.75, -129.224853515625, -126.69970703125, -124.174560546875, -121.6494140625, -119.124267578125, -116.59912109375, -114.073974609375, -111.548828125, -109.023681640625, -106.49853515625, -103.973388671875, -101.4482421875, -98.923095703125, -96.39794921875, -93.872802734375, -91.34765625, -88.822509765625, -86.29736328125, -83.772216796875, -81.2470703125, -78.721923828125, -76.19677734375, -73.671630859375, -71.146484375, -68.621337890625, -66.09619140625, -63.571044921875, -61.0458984375, -58.520751953125, -55.99560546875, -53.470458984375, -50.9453125, -48.420166015625, -45.89501953125, -43.369873046875, -40.8447265625, -38.319580078125, -35.79443359375, -33.269287109375, -30.744140625, -28.218994140625, -25.69384765625, -23.168701171875, -20.6435546875, -18.118408203125, -15.59326171875, -13.068115234375, -10.54296875, -8.017822265625, -5.49267578125, -2.967529296875, -0.4423828125, 2.082763671875, 4.60791015625, 7.133056640625, 9.658203125, 12.183349609375, 14.70849609375, 17.233642578125, 19.7587890625, 22.283935546875, 24.80908203125, 27.334228515625, 29.859375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 6.0, 8.0, 30.0, 90.0, 292.0, 401.0, 114.0, 35.0, 7.0, 9.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-593.7481079101562, -574.734130859375, -555.7200927734375, -536.7061157226562, -517.692138671875, -498.6781311035156, -479.66412353515625, -460.650146484375, -441.63616943359375, -422.6221618652344, -403.6081848144531, -384.59417724609375, -365.5802001953125, -346.5661926269531, -327.55218505859375, -308.5382080078125, -289.5242004394531, -270.51019287109375, -251.4962158203125, -232.48220825195312, -213.46823120117188, -194.4542236328125, -175.4402313232422, -156.42623901367188, -137.41224670410156, -118.39825439453125, -99.38426208496094, -80.3702621459961, -61.35626983642578, -42.34227752685547, -23.328277587890625, -4.3142852783203125, 14.69970703125, 33.71369934082031, 52.72769546508789, 71.74169158935547, 90.75568389892578, 109.7696762084961, 128.78367614746094, 147.79766845703125, 166.81166076660156, 185.82565307617188, 204.8396453857422, 223.8536376953125, 242.86764526367188, 261.8816223144531, 280.8956298828125, 299.90960693359375, 318.9236145019531, 337.9376220703125, 356.95159912109375, 375.9656066894531, 394.9795837402344, 413.99359130859375, 433.007568359375, 452.0215759277344, 471.03558349609375, 490.0495910644531, 509.0635681152344, 528.0775756835938, 547.091552734375, 566.1055297851562, 585.1195678710938, 604.133544921875, 623.1475219726562]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 9.0, 11.0, 19.0, 22.0, 35.0, 38.0, 40.0, 37.0, 70.0, 62.0, 52.0, 77.0, 57.0, 87.0, 59.0, 58.0, 53.0, 42.0, 39.0, 31.0, 17.0, 24.0, 18.0, 13.0, 6.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-215.36094665527344, -210.1773681640625, -204.9937744140625, -199.81019592285156, -194.62661743164062, -189.4430389404297, -184.25946044921875, -179.07586669921875, -173.8922882080078, -168.70870971679688, -163.52511596679688, -158.34153747558594, -153.157958984375, -147.97438049316406, -142.79080200195312, -137.60720825195312, -132.4236297607422, -127.24005126953125, -122.05646514892578, -116.87287902832031, -111.68930053710938, -106.50572204589844, -101.32213592529297, -96.1385498046875, -90.95497131347656, -85.77139282226562, -80.58780670166016, -75.40422058105469, -70.22064208984375, -65.03706359863281, -59.853477478027344, -54.66989517211914, -49.48631286621094, -44.302730560302734, -39.11914825439453, -33.93556594848633, -28.751983642578125, -23.568401336669922, -18.38481903076172, -13.201236724853516, -8.017654418945312, -2.8340721130371094, 2.3495101928710938, 7.533092498779297, 12.7166748046875, 17.900257110595703, 23.083839416503906, 28.26742172241211, 33.45100402832031, 38.634586334228516, 43.81816864013672, 49.00175094604492, 54.185333251953125, 59.36891555786133, 64.55249786376953, 69.736083984375, 74.91966247558594, 80.10324096679688, 85.28682708740234, 90.47041320800781, 95.65399169921875, 100.83757019042969, 106.02115631103516, 111.20474243164062, 116.38832092285156]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 2.0, 7.0, 3.0, 8.0, 8.0, 12.0, 18.0, 31.0, 37.0, 39.0, 84.0, 145.0, 232.0, 499.0, 1265.0, 3824.0, 16142.0, 103006.0, 671583.0, 215536.0, 27231.0, 5767.0, 1716.0, 663.0, 297.0, 159.0, 75.0, 44.0, 28.0, 24.0, 17.0, 19.0, 8.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.75, -21.927490234375, -21.10498046875, -20.282470703125, -19.4599609375, -18.637451171875, -17.81494140625, -16.992431640625, -16.169921875, -15.347412109375, -14.52490234375, -13.702392578125, -12.8798828125, -12.057373046875, -11.23486328125, -10.412353515625, -9.58984375, -8.767333984375, -7.94482421875, -7.122314453125, -6.2998046875, -5.477294921875, -4.65478515625, -3.832275390625, -3.009765625, -2.187255859375, -1.36474609375, -0.542236328125, 0.2802734375, 1.102783203125, 1.92529296875, 2.747802734375, 3.5703125, 4.392822265625, 5.21533203125, 6.037841796875, 6.8603515625, 7.682861328125, 8.50537109375, 9.327880859375, 10.150390625, 10.972900390625, 11.79541015625, 12.617919921875, 13.4404296875, 14.262939453125, 15.08544921875, 15.907958984375, 16.73046875, 17.552978515625, 18.37548828125, 19.197998046875, 20.0205078125, 20.843017578125, 21.66552734375, 22.488037109375, 23.310546875, 24.133056640625, 24.95556640625, 25.778076171875, 26.6005859375, 27.423095703125, 28.24560546875, 29.068115234375, 29.890625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 3.0, 9.0, 13.0, 8.0, 20.0, 18.0, 27.0, 27.0, 27.0, 45.0, 49.0, 60.0, 65.0, 65.0, 63.0, 65.0, 48.0, 51.0, 58.0, 50.0, 45.0, 31.0, 22.0, 22.0, 25.0, 18.0, 14.0, 17.0, 10.0, 7.0, 1.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.6796875, -11.3458251953125, -11.011962890625, -10.6781005859375, -10.34423828125, -10.0103759765625, -9.676513671875, -9.3426513671875, -9.0087890625, -8.6749267578125, -8.341064453125, -8.0072021484375, -7.67333984375, -7.3394775390625, -7.005615234375, -6.6717529296875, -6.337890625, -6.0040283203125, -5.670166015625, -5.3363037109375, -5.00244140625, -4.6685791015625, -4.334716796875, -4.0008544921875, -3.6669921875, -3.3331298828125, -2.999267578125, -2.6654052734375, -2.33154296875, -1.9976806640625, -1.663818359375, -1.3299560546875, -0.99609375, -0.6622314453125, -0.328369140625, 0.0054931640625, 0.33935546875, 0.6732177734375, 1.007080078125, 1.3409423828125, 1.6748046875, 2.0086669921875, 2.342529296875, 2.6763916015625, 3.01025390625, 3.3441162109375, 3.677978515625, 4.0118408203125, 4.345703125, 4.6795654296875, 5.013427734375, 5.3472900390625, 5.68115234375, 6.0150146484375, 6.348876953125, 6.6827392578125, 7.0166015625, 7.3504638671875, 7.684326171875, 8.0181884765625, 8.35205078125, 8.6859130859375, 9.019775390625, 9.3536376953125, 9.6875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 3.0, 1.0, 9.0, 8.0, 14.0, 31.0, 50.0, 82.0, 175.0, 504.0, 1740.0, 9554.0, 100718.0, 854254.0, 71659.0, 7471.0, 1472.0, 435.0, 173.0, 92.0, 35.0, 19.0, 20.0, 11.0, 8.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.1875, -45.8173828125, -44.447265625, -43.0771484375, -41.70703125, -40.3369140625, -38.966796875, -37.5966796875, -36.2265625, -34.8564453125, -33.486328125, -32.1162109375, -30.74609375, -29.3759765625, -28.005859375, -26.6357421875, -25.265625, -23.8955078125, -22.525390625, -21.1552734375, -19.78515625, -18.4150390625, -17.044921875, -15.6748046875, -14.3046875, -12.9345703125, -11.564453125, -10.1943359375, -8.82421875, -7.4541015625, -6.083984375, -4.7138671875, -3.34375, -1.9736328125, -0.603515625, 0.7666015625, 2.13671875, 3.5068359375, 4.876953125, 6.2470703125, 7.6171875, 8.9873046875, 10.357421875, 11.7275390625, 13.09765625, 14.4677734375, 15.837890625, 17.2080078125, 18.578125, 19.9482421875, 21.318359375, 22.6884765625, 24.05859375, 25.4287109375, 26.798828125, 28.1689453125, 29.5390625, 30.9091796875, 32.279296875, 33.6494140625, 35.01953125, 36.3896484375, 37.759765625, 39.1298828125, 40.5]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 9.0, 4.0, 6.0, 10.0, 13.0, 12.0, 20.0, 20.0, 33.0, 33.0, 44.0, 54.0, 52.0, 52.0, 58.0, 60.0, 59.0, 68.0, 58.0, 54.0, 47.0, 36.0, 38.0, 32.0, 29.0, 17.0, 19.0, 15.0, 8.0, 3.0, 10.0, 3.0, 7.0, 3.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.09375, -47.64697265625, -46.2001953125, -44.75341796875, -43.306640625, -41.85986328125, -40.4130859375, -38.96630859375, -37.51953125, -36.07275390625, -34.6259765625, -33.17919921875, -31.732421875, -30.28564453125, -28.8388671875, -27.39208984375, -25.9453125, -24.49853515625, -23.0517578125, -21.60498046875, -20.158203125, -18.71142578125, -17.2646484375, -15.81787109375, -14.37109375, -12.92431640625, -11.4775390625, -10.03076171875, -8.583984375, -7.13720703125, -5.6904296875, -4.24365234375, -2.796875, -1.35009765625, 0.0966796875, 1.54345703125, 2.990234375, 4.43701171875, 5.8837890625, 7.33056640625, 8.77734375, 10.22412109375, 11.6708984375, 13.11767578125, 14.564453125, 16.01123046875, 17.4580078125, 18.90478515625, 20.3515625, 21.79833984375, 23.2451171875, 24.69189453125, 26.138671875, 27.58544921875, 29.0322265625, 30.47900390625, 31.92578125, 33.37255859375, 34.8193359375, 36.26611328125, 37.712890625, 39.15966796875, 40.6064453125, 42.05322265625, 43.5]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 4.0, 7.0, 13.0, 12.0, 14.0, 27.0, 20.0, 54.0, 100.0, 195.0, 469.0, 1324.0, 4853.0, 20867.0, 167931.0, 770089.0, 66960.0, 11164.0, 2879.0, 901.0, 366.0, 134.0, 58.0, 34.0, 22.0, 12.0, 13.0, 3.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.7578125, -11.4248046875, -11.091796875, -10.7587890625, -10.42578125, -10.0927734375, -9.759765625, -9.4267578125, -9.09375, -8.7607421875, -8.427734375, -8.0947265625, -7.76171875, -7.4287109375, -7.095703125, -6.7626953125, -6.4296875, -6.0966796875, -5.763671875, -5.4306640625, -5.09765625, -4.7646484375, -4.431640625, -4.0986328125, -3.765625, -3.4326171875, -3.099609375, -2.7666015625, -2.43359375, -2.1005859375, -1.767578125, -1.4345703125, -1.1015625, -0.7685546875, -0.435546875, -0.1025390625, 0.23046875, 0.5634765625, 0.896484375, 1.2294921875, 1.5625, 1.8955078125, 2.228515625, 2.5615234375, 2.89453125, 3.2275390625, 3.560546875, 3.8935546875, 4.2265625, 4.5595703125, 4.892578125, 5.2255859375, 5.55859375, 5.8916015625, 6.224609375, 6.5576171875, 6.890625, 7.2236328125, 7.556640625, 7.8896484375, 8.22265625, 8.5556640625, 8.888671875, 9.2216796875, 9.5546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 6.0, 4.0, 9.0, 7.0, 13.0, 15.0, 21.0, 21.0, 58.0, 82.0, 96.0, 137.0, 127.0, 117.0, 89.0, 54.0, 29.0, 26.0, 14.0, 15.0, 13.0, 11.0, 6.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00228118896484375, -0.0022122561931610107, -0.0021433234214782715, -0.0020743906497955322, -0.002005457878112793, -0.0019365251064300537, -0.0018675923347473145, -0.0017986595630645752, -0.001729726791381836, -0.0016607940196990967, -0.0015918612480163574, -0.0015229284763336182, -0.001453995704650879, -0.0013850629329681396, -0.0013161301612854004, -0.0012471973896026611, -0.0011782646179199219, -0.0011093318462371826, -0.0010403990745544434, -0.0009714663028717041, -0.0009025335311889648, -0.0008336007595062256, -0.0007646679878234863, -0.0006957352161407471, -0.0006268024444580078, -0.0005578696727752686, -0.0004889369010925293, -0.00042000412940979004, -0.0003510713577270508, -0.0002821385860443115, -0.00021320581436157227, -0.000144273042678833, -7.534027099609375e-05, -6.407499313354492e-06, 6.252527236938477e-05, 0.00013145804405212402, 0.00020039081573486328, 0.00026932358741760254, 0.0003382563591003418, 0.00040718913078308105, 0.0004761219024658203, 0.0005450546741485596, 0.0006139874458312988, 0.0006829202175140381, 0.0007518529891967773, 0.0008207857608795166, 0.0008897185325622559, 0.0009586513042449951, 0.0010275840759277344, 0.0010965168476104736, 0.0011654496192932129, 0.0012343823909759521, 0.0013033151626586914, 0.0013722479343414307, 0.00144118070602417, 0.0015101134777069092, 0.0015790462493896484, 0.0016479790210723877, 0.001716911792755127, 0.0017858445644378662, 0.0018547773361206055, 0.0019237101078033447, 0.001992642879486084, 0.0020615756511688232, 0.0021305084228515625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 3.0, 9.0, 3.0, 7.0, 11.0, 13.0, 20.0, 42.0, 81.0, 165.0, 336.0, 815.0, 2202.0, 6805.0, 29013.0, 247367.0, 689884.0, 55578.0, 10970.0, 3241.0, 1109.0, 465.0, 185.0, 83.0, 51.0, 35.0, 19.0, 14.0, 8.0, 11.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.5, -12.1446533203125, -11.789306640625, -11.4339599609375, -11.07861328125, -10.7232666015625, -10.367919921875, -10.0125732421875, -9.6572265625, -9.3018798828125, -8.946533203125, -8.5911865234375, -8.23583984375, -7.8804931640625, -7.525146484375, -7.1697998046875, -6.814453125, -6.4591064453125, -6.103759765625, -5.7484130859375, -5.39306640625, -5.0377197265625, -4.682373046875, -4.3270263671875, -3.9716796875, -3.6163330078125, -3.260986328125, -2.9056396484375, -2.55029296875, -2.1949462890625, -1.839599609375, -1.4842529296875, -1.12890625, -0.7735595703125, -0.418212890625, -0.0628662109375, 0.29248046875, 0.6478271484375, 1.003173828125, 1.3585205078125, 1.7138671875, 2.0692138671875, 2.424560546875, 2.7799072265625, 3.13525390625, 3.4906005859375, 3.845947265625, 4.2012939453125, 4.556640625, 4.9119873046875, 5.267333984375, 5.6226806640625, 5.97802734375, 6.3333740234375, 6.688720703125, 7.0440673828125, 7.3994140625, 7.7547607421875, 8.110107421875, 8.4654541015625, 8.82080078125, 9.1761474609375, 9.531494140625, 9.8868408203125, 10.2421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 1.0, 8.0, 3.0, 8.0, 3.0, 6.0, 6.0, 22.0, 27.0, 23.0, 28.0, 42.0, 49.0, 68.0, 97.0, 97.0, 118.0, 85.0, 78.0, 57.0, 48.0, 31.0, 20.0, 17.0, 10.0, 6.0, 12.0, 10.0, 7.0, 3.0, 3.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1640625, -7.91668701171875, -7.6693115234375, -7.42193603515625, -7.174560546875, -6.92718505859375, -6.6798095703125, -6.43243408203125, -6.18505859375, -5.93768310546875, -5.6903076171875, -5.44293212890625, -5.195556640625, -4.94818115234375, -4.7008056640625, -4.45343017578125, -4.2060546875, -3.95867919921875, -3.7113037109375, -3.46392822265625, -3.216552734375, -2.96917724609375, -2.7218017578125, -2.47442626953125, -2.22705078125, -1.97967529296875, -1.7322998046875, -1.48492431640625, -1.237548828125, -0.99017333984375, -0.7427978515625, -0.49542236328125, -0.248046875, -0.00067138671875, 0.2467041015625, 0.49407958984375, 0.741455078125, 0.98883056640625, 1.2362060546875, 1.48358154296875, 1.73095703125, 1.97833251953125, 2.2257080078125, 2.47308349609375, 2.720458984375, 2.96783447265625, 3.2152099609375, 3.46258544921875, 3.7099609375, 3.95733642578125, 4.2047119140625, 4.45208740234375, 4.699462890625, 4.94683837890625, 5.1942138671875, 5.44158935546875, 5.68896484375, 5.93634033203125, 6.1837158203125, 6.43109130859375, 6.678466796875, 6.92584228515625, 7.1732177734375, 7.42059326171875, 7.66796875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 3.0, 0.0, 5.0, 9.0, 10.0, 16.0, 23.0, 48.0, 84.0, 159.0, 301.0, 157.0, 86.0, 45.0, 21.0, 13.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-299.7222900390625, -292.5058898925781, -285.28948974609375, -278.0730895996094, -270.856689453125, -263.6402893066406, -256.42388916015625, -249.20750427246094, -241.99110412597656, -234.7747039794922, -227.5583038330078, -220.34190368652344, -213.12551879882812, -205.90911865234375, -198.69271850585938, -191.476318359375, -184.25991821289062, -177.04351806640625, -169.82711791992188, -162.6107177734375, -155.39431762695312, -148.17791748046875, -140.96153259277344, -133.74513244628906, -126.52873229980469, -119.31233215332031, -112.09593200683594, -104.8795394897461, -97.66313934326172, -90.44673919677734, -83.2303466796875, -76.01394653320312, -68.79754638671875, -61.581146240234375, -54.364749908447266, -47.148353576660156, -39.93195343017578, -32.715553283691406, -25.499156951904297, -18.282760620117188, -11.066360473632812, -3.8499622344970703, 3.366436004638672, 10.582834243774414, 17.799232482910156, 25.01563262939453, 32.23202896118164, 39.44842529296875, 46.664825439453125, 53.8812255859375, 61.09762191772461, 68.31401824951172, 75.5304183959961, 82.74681854248047, 89.96321105957031, 97.17961120605469, 104.39601135253906, 111.61241149902344, 118.82881164550781, 126.04520416259766, 133.2615966796875, 140.47799682617188, 147.69439697265625, 154.91079711914062, 162.127197265625]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 10.0, 5.0, 1.0, 7.0, 7.0, 15.0, 8.0, 11.0, 13.0, 19.0, 18.0, 22.0, 23.0, 26.0, 24.0, 33.0, 43.0, 48.0, 80.0, 95.0, 91.0, 54.0, 41.0, 33.0, 37.0, 34.0, 25.0, 22.0, 34.0, 18.0, 18.0, 9.0, 13.0, 15.0, 13.0, 11.0, 6.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-172.39007568359375, -166.42596435546875, -160.46185302734375, -154.4977569580078, -148.5336456298828, -142.5695343017578, -136.60543823242188, -130.64132690429688, -124.67721557617188, -118.71310424804688, -112.7490005493164, -106.78489685058594, -100.82078552246094, -94.85667419433594, -88.89257049560547, -82.928466796875, -76.96435546875, -71.000244140625, -65.03614044189453, -59.0720329284668, -53.10792541503906, -47.14381790161133, -41.179710388183594, -35.21560287475586, -29.251495361328125, -23.28738784790039, -17.323280334472656, -11.359172821044922, -5.3950653076171875, 0.5690422058105469, 6.533149719238281, 12.497257232666016, 18.46136474609375, 24.425472259521484, 30.38957977294922, 36.35368728637695, 42.31779479980469, 48.28190231323242, 54.246009826660156, 60.21011734008789, 66.17422485351562, 72.13833618164062, 78.1024398803711, 84.06654357910156, 90.03065490722656, 95.99476623535156, 101.95886993408203, 107.9229736328125, 113.8870849609375, 119.8511962890625, 125.81529998779297, 131.77940368652344, 137.74351501464844, 143.70762634277344, 149.67172241210938, 155.63583374023438, 161.59994506835938, 167.56405639648438, 173.52816772460938, 179.4922637939453, 185.4563751220703, 191.4204864501953, 197.38458251953125, 203.34869384765625, 209.31280517578125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 5.0, 3.0, 2.0, 7.0, 8.0, 10.0, 15.0, 14.0, 23.0, 36.0, 48.0, 72.0, 113.0, 160.0, 241.0, 465.0, 800.0, 1650.0, 3840.0, 12809.0, 94839.0, 2188692.0, 1795372.0, 77642.0, 10957.0, 3382.0, 1416.0, 751.0, 361.0, 181.0, 135.0, 95.0, 56.0, 31.0, 25.0, 14.0, 8.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-22.484375, -21.9610595703125, -21.437744140625, -20.9144287109375, -20.39111328125, -19.8677978515625, -19.344482421875, -18.8211669921875, -18.2978515625, -17.7745361328125, -17.251220703125, -16.7279052734375, -16.20458984375, -15.6812744140625, -15.157958984375, -14.6346435546875, -14.111328125, -13.5880126953125, -13.064697265625, -12.5413818359375, -12.01806640625, -11.4947509765625, -10.971435546875, -10.4481201171875, -9.9248046875, -9.4014892578125, -8.878173828125, -8.3548583984375, -7.83154296875, -7.3082275390625, -6.784912109375, -6.2615966796875, -5.73828125, -5.2149658203125, -4.691650390625, -4.1683349609375, -3.64501953125, -3.1217041015625, -2.598388671875, -2.0750732421875, -1.5517578125, -1.0284423828125, -0.505126953125, 0.0181884765625, 0.54150390625, 1.0648193359375, 1.588134765625, 2.1114501953125, 2.634765625, 3.1580810546875, 3.681396484375, 4.2047119140625, 4.72802734375, 5.2513427734375, 5.774658203125, 6.2979736328125, 6.8212890625, 7.3446044921875, 7.867919921875, 8.3912353515625, 8.91455078125, 9.4378662109375, 9.961181640625, 10.4844970703125, 11.0078125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 10.0, 6.0, 12.0, 18.0, 30.0, 14.0, 26.0, 28.0, 29.0, 40.0, 41.0, 63.0, 58.0, 56.0, 54.0, 69.0, 63.0, 48.0, 45.0, 48.0, 42.0, 41.0, 26.0, 27.0, 17.0, 22.0, 11.0, 10.0, 10.0, 8.0, 3.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.19921875, -6.91192626953125, -6.6246337890625, -6.33734130859375, -6.050048828125, -5.76275634765625, -5.4754638671875, -5.18817138671875, -4.90087890625, -4.61358642578125, -4.3262939453125, -4.03900146484375, -3.751708984375, -3.46441650390625, -3.1771240234375, -2.88983154296875, -2.6025390625, -2.31524658203125, -2.0279541015625, -1.74066162109375, -1.453369140625, -1.16607666015625, -0.8787841796875, -0.59149169921875, -0.30419921875, -0.01690673828125, 0.2703857421875, 0.55767822265625, 0.844970703125, 1.13226318359375, 1.4195556640625, 1.70684814453125, 1.994140625, 2.28143310546875, 2.5687255859375, 2.85601806640625, 3.143310546875, 3.43060302734375, 3.7178955078125, 4.00518798828125, 4.29248046875, 4.57977294921875, 4.8670654296875, 5.15435791015625, 5.441650390625, 5.72894287109375, 6.0162353515625, 6.30352783203125, 6.5908203125, 6.87811279296875, 7.1654052734375, 7.45269775390625, 7.739990234375, 8.02728271484375, 8.3145751953125, 8.60186767578125, 8.88916015625, 9.17645263671875, 9.4637451171875, 9.75103759765625, 10.038330078125, 10.32562255859375, 10.6129150390625, 10.90020751953125, 11.1875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 7.0, 19.0, 29.0, 74.0, 143.0, 388.0, 1333.0, 12638.0, 4115811.0, 60902.0, 2096.0, 492.0, 189.0, 82.0, 35.0, 20.0, 14.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.125, -73.0185546875, -70.912109375, -68.8056640625, -66.69921875, -64.5927734375, -62.486328125, -60.3798828125, -58.2734375, -56.1669921875, -54.060546875, -51.9541015625, -49.84765625, -47.7412109375, -45.634765625, -43.5283203125, -41.421875, -39.3154296875, -37.208984375, -35.1025390625, -32.99609375, -30.8896484375, -28.783203125, -26.6767578125, -24.5703125, -22.4638671875, -20.357421875, -18.2509765625, -16.14453125, -14.0380859375, -11.931640625, -9.8251953125, -7.71875, -5.6123046875, -3.505859375, -1.3994140625, 0.70703125, 2.8134765625, 4.919921875, 7.0263671875, 9.1328125, 11.2392578125, 13.345703125, 15.4521484375, 17.55859375, 19.6650390625, 21.771484375, 23.8779296875, 25.984375, 28.0908203125, 30.197265625, 32.3037109375, 34.41015625, 36.5166015625, 38.623046875, 40.7294921875, 42.8359375, 44.9423828125, 47.048828125, 49.1552734375, 51.26171875, 53.3681640625, 55.474609375, 57.5810546875, 59.6875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 5.0, 14.0, 8.0, 26.0, 22.0, 64.0, 132.0, 289.0, 702.0, 1184.0, 897.0, 390.0, 172.0, 69.0, 29.0, 30.0, 14.0, 9.0, 4.0, 9.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-36.5625, -35.7255859375, -34.888671875, -34.0517578125, -33.21484375, -32.3779296875, -31.541015625, -30.7041015625, -29.8671875, -29.0302734375, -28.193359375, -27.3564453125, -26.51953125, -25.6826171875, -24.845703125, -24.0087890625, -23.171875, -22.3349609375, -21.498046875, -20.6611328125, -19.82421875, -18.9873046875, -18.150390625, -17.3134765625, -16.4765625, -15.6396484375, -14.802734375, -13.9658203125, -13.12890625, -12.2919921875, -11.455078125, -10.6181640625, -9.78125, -8.9443359375, -8.107421875, -7.2705078125, -6.43359375, -5.5966796875, -4.759765625, -3.9228515625, -3.0859375, -2.2490234375, -1.412109375, -0.5751953125, 0.26171875, 1.0986328125, 1.935546875, 2.7724609375, 3.609375, 4.4462890625, 5.283203125, 6.1201171875, 6.95703125, 7.7939453125, 8.630859375, 9.4677734375, 10.3046875, 11.1416015625, 11.978515625, 12.8154296875, 13.65234375, 14.4892578125, 15.326171875, 16.1630859375, 17.0]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 18.0, 37.0, 95.0, 238.0, 283.0, 182.0, 95.0, 31.0, 12.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-422.3249816894531, -413.2271423339844, -404.1292724609375, -395.03143310546875, -385.93359375, -376.83575439453125, -367.7379150390625, -358.6400451660156, -349.5422058105469, -340.4443664550781, -331.34649658203125, -322.2486572265625, -313.15081787109375, -304.052978515625, -294.95513916015625, -285.8572692871094, -276.7594299316406, -267.6615905761719, -258.563720703125, -249.46588134765625, -240.3680419921875, -231.27020263671875, -222.17234802246094, -213.07449340820312, -203.97665405273438, -194.87881469726562, -185.7809600830078, -176.68310546875, -167.58526611328125, -158.4874267578125, -149.3895721435547, -140.29171752929688, -131.19386291503906, -122.09601593017578, -112.9981689453125, -103.90032196044922, -94.80247497558594, -85.70462799072266, -76.60678100585938, -67.5089340209961, -58.41108703613281, -49.31324005126953, -40.21539306640625, -31.11754608154297, -22.019699096679688, -12.921852111816406, -3.824005126953125, 5.273841857910156, 14.371688842773438, 23.46953582763672, 32.5673828125, 41.66522979736328, 50.76307678222656, 59.860923767089844, 68.95877075195312, 78.0566177368164, 87.15446472167969, 96.25231170654297, 105.35015869140625, 114.44800567626953, 123.54585266113281, 132.64370727539062, 141.74154663085938, 150.83938598632812, 159.93724060058594]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 9.0, 13.0, 23.0, 25.0, 26.0, 30.0, 36.0, 49.0, 62.0, 61.0, 63.0, 61.0, 59.0, 66.0, 71.0, 67.0, 55.0, 59.0, 45.0, 33.0, 28.0, 16.0, 14.0, 8.0, 9.0, 8.0, 4.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.92166137695312, -100.23426818847656, -96.54688262939453, -92.85948944091797, -89.17210388183594, -85.48471069335938, -81.79731750488281, -78.10993194580078, -74.42253875732422, -70.73514556884766, -67.04776000976562, -63.36036682128906, -59.672977447509766, -55.98558807373047, -52.29819869995117, -48.610809326171875, -44.92341995239258, -41.23603057861328, -37.548641204833984, -33.86125183105469, -30.173858642578125, -26.486469268798828, -22.79907989501953, -19.1116886138916, -15.424299240112305, -11.736908912658691, -8.049518585205078, -4.362129211425781, -0.674738883972168, 3.0126514434814453, 6.700040817260742, 10.387432098388672, 14.074821472167969, 17.762210845947266, 21.449602127075195, 25.136991500854492, 28.824382781982422, 32.51177215576172, 36.199161529541016, 39.88655090332031, 43.573944091796875, 47.26133346557617, 50.94872283935547, 54.63611602783203, 58.32350540161133, 62.010894775390625, 65.69828796386719, 69.38567352294922, 73.07305908203125, 76.76045227050781, 80.44783782958984, 84.1352310180664, 87.82261657714844, 91.510009765625, 95.19740295410156, 98.8847885131836, 102.57218170166016, 106.25957489013672, 109.94696044921875, 113.63435363769531, 117.32173919677734, 121.0091323852539, 124.69651794433594, 128.3839111328125, 132.07130432128906]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 9.0, 12.0, 20.0, 22.0, 55.0, 75.0, 170.0, 310.0, 672.0, 1785.0, 5972.0, 26538.0, 177879.0, 660630.0, 143695.0, 22575.0, 5161.0, 1648.0, 625.0, 300.0, 159.0, 80.0, 54.0, 29.0, 27.0, 7.0, 11.0, 8.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0], "bins": [-27.140625, -26.48583984375, -25.8310546875, -25.17626953125, -24.521484375, -23.86669921875, -23.2119140625, -22.55712890625, -21.90234375, -21.24755859375, -20.5927734375, -19.93798828125, -19.283203125, -18.62841796875, -17.9736328125, -17.31884765625, -16.6640625, -16.00927734375, -15.3544921875, -14.69970703125, -14.044921875, -13.39013671875, -12.7353515625, -12.08056640625, -11.42578125, -10.77099609375, -10.1162109375, -9.46142578125, -8.806640625, -8.15185546875, -7.4970703125, -6.84228515625, -6.1875, -5.53271484375, -4.8779296875, -4.22314453125, -3.568359375, -2.91357421875, -2.2587890625, -1.60400390625, -0.94921875, -0.29443359375, 0.3603515625, 1.01513671875, 1.669921875, 2.32470703125, 2.9794921875, 3.63427734375, 4.2890625, 4.94384765625, 5.5986328125, 6.25341796875, 6.908203125, 7.56298828125, 8.2177734375, 8.87255859375, 9.52734375, 10.18212890625, 10.8369140625, 11.49169921875, 12.146484375, 12.80126953125, 13.4560546875, 14.11083984375, 14.765625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 7.0, 12.0, 11.0, 14.0, 24.0, 24.0, 22.0, 39.0, 43.0, 65.0, 63.0, 66.0, 72.0, 76.0, 56.0, 70.0, 62.0, 53.0, 51.0, 36.0, 27.0, 15.0, 19.0, 21.0, 14.0, 8.0, 12.0, 5.0, 4.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.15625, -10.79296875, -10.4296875, -10.06640625, -9.703125, -9.33984375, -8.9765625, -8.61328125, -8.25, -7.88671875, -7.5234375, -7.16015625, -6.796875, -6.43359375, -6.0703125, -5.70703125, -5.34375, -4.98046875, -4.6171875, -4.25390625, -3.890625, -3.52734375, -3.1640625, -2.80078125, -2.4375, -2.07421875, -1.7109375, -1.34765625, -0.984375, -0.62109375, -0.2578125, 0.10546875, 0.46875, 0.83203125, 1.1953125, 1.55859375, 1.921875, 2.28515625, 2.6484375, 3.01171875, 3.375, 3.73828125, 4.1015625, 4.46484375, 4.828125, 5.19140625, 5.5546875, 5.91796875, 6.28125, 6.64453125, 7.0078125, 7.37109375, 7.734375, 8.09765625, 8.4609375, 8.82421875, 9.1875, 9.55078125, 9.9140625, 10.27734375, 10.640625, 11.00390625, 11.3671875, 11.73046875, 12.09375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 5.0, 5.0, 7.0, 9.0, 11.0, 19.0, 22.0, 20.0, 30.0, 31.0, 69.0, 106.0, 153.0, 220.0, 408.0, 747.0, 1816.0, 4838.0, 16274.0, 75992.0, 646081.0, 245828.0, 39946.0, 9848.0, 3265.0, 1278.0, 556.0, 324.0, 199.0, 138.0, 81.0, 59.0, 46.0, 26.0, 23.0, 15.0, 12.0, 12.0, 11.0, 6.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-19.453125, -18.800537109375, -18.14794921875, -17.495361328125, -16.8427734375, -16.190185546875, -15.53759765625, -14.885009765625, -14.232421875, -13.579833984375, -12.92724609375, -12.274658203125, -11.6220703125, -10.969482421875, -10.31689453125, -9.664306640625, -9.01171875, -8.359130859375, -7.70654296875, -7.053955078125, -6.4013671875, -5.748779296875, -5.09619140625, -4.443603515625, -3.791015625, -3.138427734375, -2.48583984375, -1.833251953125, -1.1806640625, -0.528076171875, 0.12451171875, 0.777099609375, 1.4296875, 2.082275390625, 2.73486328125, 3.387451171875, 4.0400390625, 4.692626953125, 5.34521484375, 5.997802734375, 6.650390625, 7.302978515625, 7.95556640625, 8.608154296875, 9.2607421875, 9.913330078125, 10.56591796875, 11.218505859375, 11.87109375, 12.523681640625, 13.17626953125, 13.828857421875, 14.4814453125, 15.134033203125, 15.78662109375, 16.439208984375, 17.091796875, 17.744384765625, 18.39697265625, 19.049560546875, 19.7021484375, 20.354736328125, 21.00732421875, 21.659912109375, 22.3125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 9.0, 6.0, 8.0, 9.0, 7.0, 10.0, 16.0, 17.0, 24.0, 35.0, 38.0, 35.0, 44.0, 39.0, 63.0, 78.0, 67.0, 75.0, 49.0, 63.0, 49.0, 52.0, 35.0, 27.0, 19.0, 22.0, 19.0, 21.0, 14.0, 13.0, 14.0, 4.0, 4.0, 6.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.8125, -41.52783203125, -40.2431640625, -38.95849609375, -37.673828125, -36.38916015625, -35.1044921875, -33.81982421875, -32.53515625, -31.25048828125, -29.9658203125, -28.68115234375, -27.396484375, -26.11181640625, -24.8271484375, -23.54248046875, -22.2578125, -20.97314453125, -19.6884765625, -18.40380859375, -17.119140625, -15.83447265625, -14.5498046875, -13.26513671875, -11.98046875, -10.69580078125, -9.4111328125, -8.12646484375, -6.841796875, -5.55712890625, -4.2724609375, -2.98779296875, -1.703125, -0.41845703125, 0.8662109375, 2.15087890625, 3.435546875, 4.72021484375, 6.0048828125, 7.28955078125, 8.57421875, 9.85888671875, 11.1435546875, 12.42822265625, 13.712890625, 14.99755859375, 16.2822265625, 17.56689453125, 18.8515625, 20.13623046875, 21.4208984375, 22.70556640625, 23.990234375, 25.27490234375, 26.5595703125, 27.84423828125, 29.12890625, 30.41357421875, 31.6982421875, 32.98291015625, 34.267578125, 35.55224609375, 36.8369140625, 38.12158203125, 39.40625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 6.0, 6.0, 12.0, 16.0, 19.0, 22.0, 43.0, 60.0, 119.0, 224.0, 478.0, 1284.0, 4397.0, 20152.0, 149027.0, 798105.0, 59628.0, 10613.0, 2753.0, 858.0, 328.0, 172.0, 84.0, 46.0, 25.0, 26.0, 14.0, 11.0, 7.0, 4.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.9453125, -10.643798828125, -10.34228515625, -10.040771484375, -9.7392578125, -9.437744140625, -9.13623046875, -8.834716796875, -8.533203125, -8.231689453125, -7.93017578125, -7.628662109375, -7.3271484375, -7.025634765625, -6.72412109375, -6.422607421875, -6.12109375, -5.819580078125, -5.51806640625, -5.216552734375, -4.9150390625, -4.613525390625, -4.31201171875, -4.010498046875, -3.708984375, -3.407470703125, -3.10595703125, -2.804443359375, -2.5029296875, -2.201416015625, -1.89990234375, -1.598388671875, -1.296875, -0.995361328125, -0.69384765625, -0.392333984375, -0.0908203125, 0.210693359375, 0.51220703125, 0.813720703125, 1.115234375, 1.416748046875, 1.71826171875, 2.019775390625, 2.3212890625, 2.622802734375, 2.92431640625, 3.225830078125, 3.52734375, 3.828857421875, 4.13037109375, 4.431884765625, 4.7333984375, 5.034912109375, 5.33642578125, 5.637939453125, 5.939453125, 6.240966796875, 6.54248046875, 6.843994140625, 7.1455078125, 7.447021484375, 7.74853515625, 8.050048828125, 8.3515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 8.0, 3.0, 8.0, 2.0, 3.0, 5.0, 10.0, 8.0, 13.0, 14.0, 15.0, 23.0, 38.0, 45.0, 100.0, 91.0, 124.0, 141.0, 84.0, 71.0, 41.0, 33.0, 30.0, 19.0, 23.0, 19.0, 8.0, 6.0, 5.0, 5.0, 6.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018568038940429688, -0.001801997423171997, -0.0017471909523010254, -0.0016923844814300537, -0.001637578010559082, -0.0015827715396881104, -0.0015279650688171387, -0.001473158597946167, -0.0014183521270751953, -0.0013635456562042236, -0.001308739185333252, -0.0012539327144622803, -0.0011991262435913086, -0.001144319772720337, -0.0010895133018493652, -0.0010347068309783936, -0.0009799003601074219, -0.0009250938892364502, -0.0008702874183654785, -0.0008154809474945068, -0.0007606744766235352, -0.0007058680057525635, -0.0006510615348815918, -0.0005962550640106201, -0.0005414485931396484, -0.00048664212226867676, -0.0004318356513977051, -0.0003770291805267334, -0.0003222227096557617, -0.00026741623878479004, -0.00021260976791381836, -0.00015780329704284668, -0.000102996826171875, -4.819035530090332e-05, 6.616115570068359e-06, 6.142258644104004e-05, 0.00011622905731201172, 0.0001710355281829834, 0.00022584199905395508, 0.00028064846992492676, 0.00033545494079589844, 0.0003902614116668701, 0.0004450678825378418, 0.0004998743534088135, 0.0005546808242797852, 0.0006094872951507568, 0.0006642937660217285, 0.0007191002368927002, 0.0007739067077636719, 0.0008287131786346436, 0.0008835196495056152, 0.0009383261203765869, 0.0009931325912475586, 0.0010479390621185303, 0.001102745532989502, 0.0011575520038604736, 0.0012123584747314453, 0.001267164945602417, 0.0013219714164733887, 0.0013767778873443604, 0.001431584358215332, 0.0014863908290863037, 0.0015411972999572754, 0.001596003770828247, 0.0016508102416992188]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 4.0, 6.0, 22.0, 33.0, 50.0, 67.0, 100.0, 168.0, 355.0, 706.0, 1746.0, 4476.0, 15302.0, 71248.0, 768506.0, 149556.0, 25080.0, 6898.0, 2310.0, 960.0, 428.0, 206.0, 123.0, 67.0, 40.0, 28.0, 23.0, 12.0, 9.0, 9.0, 5.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.0546875, -10.76885986328125, -10.4830322265625, -10.19720458984375, -9.911376953125, -9.62554931640625, -9.3397216796875, -9.05389404296875, -8.76806640625, -8.48223876953125, -8.1964111328125, -7.91058349609375, -7.624755859375, -7.33892822265625, -7.0531005859375, -6.76727294921875, -6.4814453125, -6.19561767578125, -5.9097900390625, -5.62396240234375, -5.338134765625, -5.05230712890625, -4.7664794921875, -4.48065185546875, -4.19482421875, -3.90899658203125, -3.6231689453125, -3.33734130859375, -3.051513671875, -2.76568603515625, -2.4798583984375, -2.19403076171875, -1.908203125, -1.62237548828125, -1.3365478515625, -1.05072021484375, -0.764892578125, -0.47906494140625, -0.1932373046875, 0.09259033203125, 0.37841796875, 0.66424560546875, 0.9500732421875, 1.23590087890625, 1.521728515625, 1.80755615234375, 2.0933837890625, 2.37921142578125, 2.6650390625, 2.95086669921875, 3.2366943359375, 3.52252197265625, 3.808349609375, 4.09417724609375, 4.3800048828125, 4.66583251953125, 4.95166015625, 5.23748779296875, 5.5233154296875, 5.80914306640625, 6.094970703125, 6.38079833984375, 6.6666259765625, 6.95245361328125, 7.23828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 5.0, 7.0, 4.0, 8.0, 11.0, 5.0, 14.0, 15.0, 17.0, 11.0, 17.0, 30.0, 30.0, 36.0, 59.0, 73.0, 85.0, 96.0, 99.0, 69.0, 75.0, 43.0, 42.0, 29.0, 23.0, 22.0, 18.0, 6.0, 14.0, 6.0, 4.0, 7.0, 6.0, 2.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.6015625, -5.42083740234375, -5.2401123046875, -5.05938720703125, -4.878662109375, -4.69793701171875, -4.5172119140625, -4.33648681640625, -4.15576171875, -3.97503662109375, -3.7943115234375, -3.61358642578125, -3.432861328125, -3.25213623046875, -3.0714111328125, -2.89068603515625, -2.7099609375, -2.52923583984375, -2.3485107421875, -2.16778564453125, -1.987060546875, -1.80633544921875, -1.6256103515625, -1.44488525390625, -1.26416015625, -1.08343505859375, -0.9027099609375, -0.72198486328125, -0.541259765625, -0.36053466796875, -0.1798095703125, 0.00091552734375, 0.181640625, 0.36236572265625, 0.5430908203125, 0.72381591796875, 0.904541015625, 1.08526611328125, 1.2659912109375, 1.44671630859375, 1.62744140625, 1.80816650390625, 1.9888916015625, 2.16961669921875, 2.350341796875, 2.53106689453125, 2.7117919921875, 2.89251708984375, 3.0732421875, 3.25396728515625, 3.4346923828125, 3.61541748046875, 3.796142578125, 3.97686767578125, 4.1575927734375, 4.33831787109375, 4.51904296875, 4.69976806640625, 4.8804931640625, 5.06121826171875, 5.241943359375, 5.42266845703125, 5.6033935546875, 5.78411865234375, 5.96484375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 12.0, 28.0, 54.0, 135.0, 360.0, 223.0, 95.0, 43.0, 19.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.0602264404297, -130.32791137695312, -122.59558868408203, -114.86326599121094, -107.13095092773438, -99.39862823486328, -91.66630554199219, -83.93399047851562, -76.20166778564453, -68.46934509277344, -60.737030029296875, -53.00470733642578, -45.27238845825195, -37.540069580078125, -29.80774688720703, -22.075428009033203, -14.343109130859375, -6.6107892990112305, 1.121530532836914, 8.853851318359375, 16.586170196533203, 24.31848907470703, 32.050811767578125, 39.78313064575195, 47.51544952392578, 55.24776840209961, 62.98008728027344, 70.71240997314453, 78.44473266601562, 86.17704772949219, 93.90937042236328, 101.64169311523438, 109.37399291992188, 117.10631561279297, 124.83863067626953, 132.57095336914062, 140.3032684326172, 148.03558349609375, 155.76791381835938, 163.50022888183594, 171.2325439453125, 178.96485900878906, 186.6971893310547, 194.42950439453125, 202.1618194580078, 209.89413452148438, 217.62646484375, 225.35877990722656, 233.0911102294922, 240.82342529296875, 248.55575561523438, 256.2880859375, 264.0203857421875, 271.7527160644531, 279.48504638671875, 287.21734619140625, 294.9496765136719, 302.6820068359375, 310.414306640625, 318.1466369628906, 325.87896728515625, 333.61126708984375, 341.3435974121094, 349.075927734375, 356.8082275390625]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 5.0, 13.0, 16.0, 17.0, 11.0, 16.0, 22.0, 22.0, 42.0, 27.0, 28.0, 44.0, 43.0, 61.0, 116.0, 88.0, 69.0, 53.0, 44.0, 39.0, 27.0, 32.0, 26.0, 34.0, 18.0, 12.0, 18.0, 8.0, 8.0, 4.0, 4.0, 5.0, 9.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-172.89117431640625, -168.11264038085938, -163.3341064453125, -158.55555725097656, -153.7770233154297, -148.9984893798828, -144.21995544433594, -139.44142150878906, -134.66287231445312, -129.88433837890625, -125.10579681396484, -120.32726287841797, -115.54872131347656, -110.77018737792969, -105.99165344238281, -101.21311950683594, -96.43458557128906, -91.65605163574219, -86.87751007080078, -82.0989761352539, -77.3204345703125, -72.54190063476562, -67.76336669921875, -62.98482894897461, -58.20629119873047, -53.42775344848633, -48.64921569824219, -43.87068176269531, -39.09214401245117, -34.31360626220703, -29.535070419311523, -24.756534576416016, -19.977996826171875, -15.19946002960205, -10.420923233032227, -5.642386436462402, -0.8638496398925781, 3.9146881103515625, 8.69322395324707, 13.471759796142578, 18.25029754638672, 23.02883529663086, 27.807371139526367, 32.585906982421875, 37.364444732666016, 42.142982482910156, 46.92151641845703, 51.70005416870117, 56.47859191894531, 61.25712966918945, 66.0356674194336, 70.81420135498047, 75.59274291992188, 80.37127685546875, 85.14981079101562, 89.9283447265625, 94.7068862915039, 99.48542022705078, 104.26396179199219, 109.04249572753906, 113.82102966308594, 118.59957122802734, 123.37810516357422, 128.15664672851562, 132.9351806640625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 6.0, 9.0, 10.0, 10.0, 15.0, 17.0, 24.0, 42.0, 50.0, 78.0, 89.0, 148.0, 228.0, 323.0, 522.0, 905.0, 1650.0, 3522.0, 9584.0, 41263.0, 445361.0, 3083767.0, 538955.0, 48515.0, 10578.0, 4064.0, 1906.0, 999.0, 581.0, 396.0, 210.0, 145.0, 94.0, 72.0, 45.0, 31.0, 20.0, 14.0, 13.0, 4.0, 4.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.84375, -14.373046875, -13.90234375, -13.431640625, -12.9609375, -12.490234375, -12.01953125, -11.548828125, -11.078125, -10.607421875, -10.13671875, -9.666015625, -9.1953125, -8.724609375, -8.25390625, -7.783203125, -7.3125, -6.841796875, -6.37109375, -5.900390625, -5.4296875, -4.958984375, -4.48828125, -4.017578125, -3.546875, -3.076171875, -2.60546875, -2.134765625, -1.6640625, -1.193359375, -0.72265625, -0.251953125, 0.21875, 0.689453125, 1.16015625, 1.630859375, 2.1015625, 2.572265625, 3.04296875, 3.513671875, 3.984375, 4.455078125, 4.92578125, 5.396484375, 5.8671875, 6.337890625, 6.80859375, 7.279296875, 7.75, 8.220703125, 8.69140625, 9.162109375, 9.6328125, 10.103515625, 10.57421875, 11.044921875, 11.515625, 11.986328125, 12.45703125, 12.927734375, 13.3984375, 13.869140625, 14.33984375, 14.810546875, 15.28125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 12.0, 5.0, 12.0, 23.0, 34.0, 25.0, 45.0, 48.0, 75.0, 65.0, 67.0, 74.0, 66.0, 89.0, 52.0, 70.0, 55.0, 37.0, 26.0, 31.0, 22.0, 26.0, 19.0, 8.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.921875, -14.5303955078125, -14.138916015625, -13.7474365234375, -13.35595703125, -12.9644775390625, -12.572998046875, -12.1815185546875, -11.7900390625, -11.3985595703125, -11.007080078125, -10.6156005859375, -10.22412109375, -9.8326416015625, -9.441162109375, -9.0496826171875, -8.658203125, -8.2667236328125, -7.875244140625, -7.4837646484375, -7.09228515625, -6.7008056640625, -6.309326171875, -5.9178466796875, -5.5263671875, -5.1348876953125, -4.743408203125, -4.3519287109375, -3.96044921875, -3.5689697265625, -3.177490234375, -2.7860107421875, -2.39453125, -2.0030517578125, -1.611572265625, -1.2200927734375, -0.82861328125, -0.4371337890625, -0.045654296875, 0.3458251953125, 0.7373046875, 1.1287841796875, 1.520263671875, 1.9117431640625, 2.30322265625, 2.6947021484375, 3.086181640625, 3.4776611328125, 3.869140625, 4.2606201171875, 4.652099609375, 5.0435791015625, 5.43505859375, 5.8265380859375, 6.218017578125, 6.6094970703125, 7.0009765625, 7.3924560546875, 7.783935546875, 8.1754150390625, 8.56689453125, 8.9583740234375, 9.349853515625, 9.7413330078125, 10.1328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 16.0, 32.0, 76.0, 185.0, 387.0, 990.0, 4189256.0, 2556.0, 455.0, 186.0, 87.0, 30.0, 17.0, 9.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-288.5, -280.62109375, -272.7421875, -264.86328125, -256.984375, -249.10546875, -241.2265625, -233.34765625, -225.46875, -217.58984375, -209.7109375, -201.83203125, -193.953125, -186.07421875, -178.1953125, -170.31640625, -162.4375, -154.55859375, -146.6796875, -138.80078125, -130.921875, -123.04296875, -115.1640625, -107.28515625, -99.40625, -91.52734375, -83.6484375, -75.76953125, -67.890625, -60.01171875, -52.1328125, -44.25390625, -36.375, -28.49609375, -20.6171875, -12.73828125, -4.859375, 3.01953125, 10.8984375, 18.77734375, 26.65625, 34.53515625, 42.4140625, 50.29296875, 58.171875, 66.05078125, 73.9296875, 81.80859375, 89.6875, 97.56640625, 105.4453125, 113.32421875, 121.203125, 129.08203125, 136.9609375, 144.83984375, 152.71875, 160.59765625, 168.4765625, 176.35546875, 184.234375, 192.11328125, 199.9921875, 207.87109375, 215.75]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 41.0, 377.0, 3223.0, 392.0, 33.0, 14.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.625, -137.0654296875, -133.505859375, -129.9462890625, -126.38671875, -122.8271484375, -119.267578125, -115.7080078125, -112.1484375, -108.5888671875, -105.029296875, -101.4697265625, -97.91015625, -94.3505859375, -90.791015625, -87.2314453125, -83.671875, -80.1123046875, -76.552734375, -72.9931640625, -69.43359375, -65.8740234375, -62.314453125, -58.7548828125, -55.1953125, -51.6357421875, -48.076171875, -44.5166015625, -40.95703125, -37.3974609375, -33.837890625, -30.2783203125, -26.71875, -23.1591796875, -19.599609375, -16.0400390625, -12.48046875, -8.9208984375, -5.361328125, -1.8017578125, 1.7578125, 5.3173828125, 8.876953125, 12.4365234375, 15.99609375, 19.5556640625, 23.115234375, 26.6748046875, 30.234375, 33.7939453125, 37.353515625, 40.9130859375, 44.47265625, 48.0322265625, 51.591796875, 55.1513671875, 58.7109375, 62.2705078125, 65.830078125, 69.3896484375, 72.94921875, 76.5087890625, 80.068359375, 83.6279296875, 87.1875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 6.0, 13.0, 43.0, 94.0, 210.0, 346.0, 174.0, 69.0, 26.0, 9.0, 8.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-518.0595703125, -505.5362854003906, -493.0130310058594, -480.48974609375, -467.96649169921875, -455.4432067871094, -442.919921875, -430.39666748046875, -417.8733825683594, -405.35009765625, -392.82684326171875, -380.3035583496094, -367.7802734375, -355.25701904296875, -342.7337341308594, -330.21044921875, -317.68719482421875, -305.1639099121094, -292.6406555175781, -280.11737060546875, -267.5941162109375, -255.07083129882812, -242.54754638671875, -230.02427673339844, -217.50100708007812, -204.9777374267578, -192.4544677734375, -179.93118286132812, -167.4079132080078, -154.8846435546875, -142.36135864257812, -129.8380889892578, -117.3148193359375, -104.79154968261719, -92.26827239990234, -79.7449951171875, -67.22172546386719, -54.69845199584961, -42.17517852783203, -29.651901245117188, -17.128631591796875, -4.605358123779297, 7.917915344238281, 20.44118881225586, 32.96446228027344, 45.487735748291016, 58.011009216308594, 70.53428649902344, 83.05755615234375, 95.58082580566406, 108.1041030883789, 120.62738037109375, 133.15065002441406, 145.67391967773438, 158.19720458984375, 170.72047424316406, 183.24374389648438, 195.7670135498047, 208.290283203125, 220.81356811523438, 233.3368377685547, 245.860107421875, 258.3833923339844, 270.90667724609375, 283.429931640625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 2.0, 11.0, 10.0, 10.0, 12.0, 17.0, 18.0, 33.0, 30.0, 31.0, 38.0, 40.0, 51.0, 49.0, 53.0, 47.0, 52.0, 46.0, 49.0, 41.0, 44.0, 41.0, 41.0, 44.0, 31.0, 24.0, 21.0, 23.0, 11.0, 10.0, 13.0, 18.0, 11.0, 9.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-89.17119598388672, -85.4741439819336, -81.77708435058594, -78.08003234863281, -74.38298034667969, -70.68592834472656, -66.9888687133789, -63.29181671142578, -59.59476089477539, -55.897705078125, -52.200653076171875, -48.503597259521484, -44.806541442871094, -41.10948944091797, -37.41243362426758, -33.71537780761719, -30.018325805664062, -26.321271896362305, -22.624217987060547, -18.927162170410156, -15.230108261108398, -11.53305435180664, -7.83599853515625, -4.138944625854492, -0.4418907165527344, 3.2551636695861816, 6.952218055725098, 10.649272918701172, 14.34632682800293, 18.043380737304688, 21.740436553955078, 25.437490463256836, 29.134552001953125, 32.831607818603516, 36.52865982055664, 40.22571563720703, 43.922767639160156, 47.61982345581055, 51.31687927246094, 55.01393127441406, 58.71098709106445, 62.408042907714844, 66.10509490966797, 69.80215454101562, 73.49920654296875, 77.19625854492188, 80.893310546875, 84.59037017822266, 88.28742218017578, 91.9844741821289, 95.68153381347656, 99.37858581542969, 103.07563781738281, 106.77268981933594, 110.4697494506836, 114.16680145263672, 117.86386108398438, 121.5609130859375, 125.25797271728516, 128.95501708984375, 132.65208435058594, 136.34913635253906, 140.0461883544922, 143.7432403564453, 147.44029235839844]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 13.0, 10.0, 16.0, 16.0, 26.0, 52.0, 83.0, 144.0, 236.0, 469.0, 845.0, 1809.0, 4215.0, 11686.0, 40976.0, 212993.0, 596536.0, 134247.0, 28806.0, 8789.0, 3375.0, 1533.0, 745.0, 420.0, 193.0, 132.0, 74.0, 45.0, 34.0, 14.0, 5.0, 8.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.546875, -23.832763671875, -23.11865234375, -22.404541015625, -21.6904296875, -20.976318359375, -20.26220703125, -19.548095703125, -18.833984375, -18.119873046875, -17.40576171875, -16.691650390625, -15.9775390625, -15.263427734375, -14.54931640625, -13.835205078125, -13.12109375, -12.406982421875, -11.69287109375, -10.978759765625, -10.2646484375, -9.550537109375, -8.83642578125, -8.122314453125, -7.408203125, -6.694091796875, -5.97998046875, -5.265869140625, -4.5517578125, -3.837646484375, -3.12353515625, -2.409423828125, -1.6953125, -0.981201171875, -0.26708984375, 0.447021484375, 1.1611328125, 1.875244140625, 2.58935546875, 3.303466796875, 4.017578125, 4.731689453125, 5.44580078125, 6.159912109375, 6.8740234375, 7.588134765625, 8.30224609375, 9.016357421875, 9.73046875, 10.444580078125, 11.15869140625, 11.872802734375, 12.5869140625, 13.301025390625, 14.01513671875, 14.729248046875, 15.443359375, 16.157470703125, 16.87158203125, 17.585693359375, 18.2998046875, 19.013916015625, 19.72802734375, 20.442138671875, 21.15625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 4.0, 0.0, 3.0, 10.0, 7.0, 8.0, 14.0, 23.0, 9.0, 23.0, 22.0, 34.0, 32.0, 36.0, 30.0, 49.0, 60.0, 78.0, 52.0, 51.0, 61.0, 48.0, 43.0, 47.0, 57.0, 34.0, 25.0, 23.0, 23.0, 21.0, 21.0, 11.0, 11.0, 7.0, 5.0, 7.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.078125, -10.7435302734375, -10.408935546875, -10.0743408203125, -9.73974609375, -9.4051513671875, -9.070556640625, -8.7359619140625, -8.4013671875, -8.0667724609375, -7.732177734375, -7.3975830078125, -7.06298828125, -6.7283935546875, -6.393798828125, -6.0592041015625, -5.724609375, -5.3900146484375, -5.055419921875, -4.7208251953125, -4.38623046875, -4.0516357421875, -3.717041015625, -3.3824462890625, -3.0478515625, -2.7132568359375, -2.378662109375, -2.0440673828125, -1.70947265625, -1.3748779296875, -1.040283203125, -0.7056884765625, -0.37109375, -0.0364990234375, 0.298095703125, 0.6326904296875, 0.96728515625, 1.3018798828125, 1.636474609375, 1.9710693359375, 2.3056640625, 2.6402587890625, 2.974853515625, 3.3094482421875, 3.64404296875, 3.9786376953125, 4.313232421875, 4.6478271484375, 4.982421875, 5.3170166015625, 5.651611328125, 5.9862060546875, 6.32080078125, 6.6553955078125, 6.989990234375, 7.3245849609375, 7.6591796875, 7.9937744140625, 8.328369140625, 8.6629638671875, 8.99755859375, 9.3321533203125, 9.666748046875, 10.0013427734375, 10.3359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 9.0, 8.0, 6.0, 15.0, 18.0, 32.0, 43.0, 68.0, 97.0, 179.0, 326.0, 721.0, 1952.0, 8018.0, 75017.0, 885070.0, 65956.0, 7572.0, 1944.0, 699.0, 314.0, 160.0, 105.0, 67.0, 46.0, 30.0, 16.0, 18.0, 9.0, 10.0, 9.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.1875, -45.81884765625, -44.4501953125, -43.08154296875, -41.712890625, -40.34423828125, -38.9755859375, -37.60693359375, -36.23828125, -34.86962890625, -33.5009765625, -32.13232421875, -30.763671875, -29.39501953125, -28.0263671875, -26.65771484375, -25.2890625, -23.92041015625, -22.5517578125, -21.18310546875, -19.814453125, -18.44580078125, -17.0771484375, -15.70849609375, -14.33984375, -12.97119140625, -11.6025390625, -10.23388671875, -8.865234375, -7.49658203125, -6.1279296875, -4.75927734375, -3.390625, -2.02197265625, -0.6533203125, 0.71533203125, 2.083984375, 3.45263671875, 4.8212890625, 6.18994140625, 7.55859375, 8.92724609375, 10.2958984375, 11.66455078125, 13.033203125, 14.40185546875, 15.7705078125, 17.13916015625, 18.5078125, 19.87646484375, 21.2451171875, 22.61376953125, 23.982421875, 25.35107421875, 26.7197265625, 28.08837890625, 29.45703125, 30.82568359375, 32.1943359375, 33.56298828125, 34.931640625, 36.30029296875, 37.6689453125, 39.03759765625, 40.40625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 3.0, 7.0, 7.0, 9.0, 9.0, 12.0, 29.0, 20.0, 38.0, 31.0, 59.0, 63.0, 65.0, 83.0, 57.0, 69.0, 58.0, 66.0, 61.0, 48.0, 55.0, 33.0, 32.0, 18.0, 19.0, 16.0, 10.0, 10.0, 7.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.75, -52.01513671875, -50.2802734375, -48.54541015625, -46.810546875, -45.07568359375, -43.3408203125, -41.60595703125, -39.87109375, -38.13623046875, -36.4013671875, -34.66650390625, -32.931640625, -31.19677734375, -29.4619140625, -27.72705078125, -25.9921875, -24.25732421875, -22.5224609375, -20.78759765625, -19.052734375, -17.31787109375, -15.5830078125, -13.84814453125, -12.11328125, -10.37841796875, -8.6435546875, -6.90869140625, -5.173828125, -3.43896484375, -1.7041015625, 0.03076171875, 1.765625, 3.50048828125, 5.2353515625, 6.97021484375, 8.705078125, 10.43994140625, 12.1748046875, 13.90966796875, 15.64453125, 17.37939453125, 19.1142578125, 20.84912109375, 22.583984375, 24.31884765625, 26.0537109375, 27.78857421875, 29.5234375, 31.25830078125, 32.9931640625, 34.72802734375, 36.462890625, 38.19775390625, 39.9326171875, 41.66748046875, 43.40234375, 45.13720703125, 46.8720703125, 48.60693359375, 50.341796875, 52.07666015625, 53.8115234375, 55.54638671875, 57.28125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 6.0, 11.0, 5.0, 13.0, 13.0, 24.0, 35.0, 63.0, 73.0, 130.0, 226.0, 352.0, 701.0, 1302.0, 3317.0, 10928.0, 70430.0, 889336.0, 56502.0, 9401.0, 2889.0, 1261.0, 617.0, 325.0, 211.0, 123.0, 75.0, 47.0, 27.0, 36.0, 17.0, 14.0, 12.0, 5.0, 10.0, 6.0, 2.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.52099609375, -17.8701171875, -17.21923828125, -16.568359375, -15.91748046875, -15.2666015625, -14.61572265625, -13.96484375, -13.31396484375, -12.6630859375, -12.01220703125, -11.361328125, -10.71044921875, -10.0595703125, -9.40869140625, -8.7578125, -8.10693359375, -7.4560546875, -6.80517578125, -6.154296875, -5.50341796875, -4.8525390625, -4.20166015625, -3.55078125, -2.89990234375, -2.2490234375, -1.59814453125, -0.947265625, -0.29638671875, 0.3544921875, 1.00537109375, 1.65625, 2.30712890625, 2.9580078125, 3.60888671875, 4.259765625, 4.91064453125, 5.5615234375, 6.21240234375, 6.86328125, 7.51416015625, 8.1650390625, 8.81591796875, 9.466796875, 10.11767578125, 10.7685546875, 11.41943359375, 12.0703125, 12.72119140625, 13.3720703125, 14.02294921875, 14.673828125, 15.32470703125, 15.9755859375, 16.62646484375, 17.27734375, 17.92822265625, 18.5791015625, 19.22998046875, 19.880859375, 20.53173828125, 21.1826171875, 21.83349609375, 22.484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 4.0, 2.0, 5.0, 8.0, 7.0, 14.0, 18.0, 32.0, 65.0, 124.0, 233.0, 220.0, 89.0, 53.0, 37.0, 21.0, 14.0, 17.0, 4.0, 5.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.004871368408203125, -0.0046836137771606445, -0.004495859146118164, -0.004308104515075684, -0.004120349884033203, -0.003932595252990723, -0.003744840621948242, -0.0035570859909057617, -0.0033693313598632812, -0.0031815767288208008, -0.0029938220977783203, -0.00280606746673584, -0.0026183128356933594, -0.002430558204650879, -0.0022428035736083984, -0.002055048942565918, -0.0018672943115234375, -0.001679539680480957, -0.0014917850494384766, -0.001304030418395996, -0.0011162757873535156, -0.0009285211563110352, -0.0007407665252685547, -0.0005530118942260742, -0.00036525726318359375, -0.00017750263214111328, 1.0251998901367188e-05, 0.00019800662994384766, 0.0003857612609863281, 0.0005735158920288086, 0.0007612705230712891, 0.0009490251541137695, 0.00113677978515625, 0.0013245344161987305, 0.001512289047241211, 0.0017000436782836914, 0.0018877983093261719, 0.0020755529403686523, 0.002263307571411133, 0.0024510622024536133, 0.0026388168334960938, 0.0028265714645385742, 0.0030143260955810547, 0.003202080726623535, 0.0033898353576660156, 0.003577589988708496, 0.0037653446197509766, 0.003953099250793457, 0.0041408538818359375, 0.004328608512878418, 0.0045163631439208984, 0.004704117774963379, 0.004891872406005859, 0.00507962703704834, 0.00526738166809082, 0.005455136299133301, 0.005642890930175781, 0.005830645561218262, 0.006018400192260742, 0.006206154823303223, 0.006393909454345703, 0.006581664085388184, 0.006769418716430664, 0.0069571733474731445, 0.007144927978515625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 7.0, 13.0, 9.0, 9.0, 20.0, 30.0, 56.0, 54.0, 122.0, 218.0, 428.0, 950.0, 2720.0, 8929.0, 43075.0, 818992.0, 146894.0, 18292.0, 4760.0, 1526.0, 650.0, 301.0, 179.0, 114.0, 65.0, 45.0, 24.0, 15.0, 13.0, 15.0, 5.0, 3.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.8125, -16.265869140625, -15.71923828125, -15.172607421875, -14.6259765625, -14.079345703125, -13.53271484375, -12.986083984375, -12.439453125, -11.892822265625, -11.34619140625, -10.799560546875, -10.2529296875, -9.706298828125, -9.15966796875, -8.613037109375, -8.06640625, -7.519775390625, -6.97314453125, -6.426513671875, -5.8798828125, -5.333251953125, -4.78662109375, -4.239990234375, -3.693359375, -3.146728515625, -2.60009765625, -2.053466796875, -1.5068359375, -0.960205078125, -0.41357421875, 0.133056640625, 0.6796875, 1.226318359375, 1.77294921875, 2.319580078125, 2.8662109375, 3.412841796875, 3.95947265625, 4.506103515625, 5.052734375, 5.599365234375, 6.14599609375, 6.692626953125, 7.2392578125, 7.785888671875, 8.33251953125, 8.879150390625, 9.42578125, 9.972412109375, 10.51904296875, 11.065673828125, 11.6123046875, 12.158935546875, 12.70556640625, 13.252197265625, 13.798828125, 14.345458984375, 14.89208984375, 15.438720703125, 15.9853515625, 16.531982421875, 17.07861328125, 17.625244140625, 18.171875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 5.0, 8.0, 18.0, 11.0, 5.0, 18.0, 22.0, 23.0, 36.0, 56.0, 74.0, 102.0, 119.0, 117.0, 81.0, 66.0, 54.0, 36.0, 20.0, 20.0, 13.0, 12.0, 12.0, 12.0, 8.0, 3.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.125, -8.774169921875, -8.42333984375, -8.072509765625, -7.7216796875, -7.370849609375, -7.02001953125, -6.669189453125, -6.318359375, -5.967529296875, -5.61669921875, -5.265869140625, -4.9150390625, -4.564208984375, -4.21337890625, -3.862548828125, -3.51171875, -3.160888671875, -2.81005859375, -2.459228515625, -2.1083984375, -1.757568359375, -1.40673828125, -1.055908203125, -0.705078125, -0.354248046875, -0.00341796875, 0.347412109375, 0.6982421875, 1.049072265625, 1.39990234375, 1.750732421875, 2.1015625, 2.452392578125, 2.80322265625, 3.154052734375, 3.5048828125, 3.855712890625, 4.20654296875, 4.557373046875, 4.908203125, 5.259033203125, 5.60986328125, 5.960693359375, 6.3115234375, 6.662353515625, 7.01318359375, 7.364013671875, 7.71484375, 8.065673828125, 8.41650390625, 8.767333984375, 9.1181640625, 9.468994140625, 9.81982421875, 10.170654296875, 10.521484375, 10.872314453125, 11.22314453125, 11.573974609375, 11.9248046875, 12.275634765625, 12.62646484375, 12.977294921875, 13.328125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 11.0, 120.0, 677.0, 142.0, 34.0, 13.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-572.6337890625, -539.8124389648438, -506.99102783203125, -474.169677734375, -441.3482971191406, -408.52691650390625, -375.70556640625, -342.8841857910156, -310.06280517578125, -277.2414245605469, -244.42005920410156, -211.59869384765625, -178.77731323242188, -145.9559326171875, -113.13456726074219, -80.31320190429688, -47.4918212890625, -14.670448303222656, 18.150924682617188, 50.97229766845703, 83.79367065429688, 116.61505126953125, 149.43641662597656, 182.25778198242188, 215.07916259765625, 247.90054321289062, 280.721923828125, 313.54327392578125, 346.3646545410156, 379.18603515625, 412.00738525390625, 444.8287658691406, 477.6502685546875, 510.4716491699219, 543.2930297851562, 576.1143798828125, 608.935791015625, 641.7571411132812, 674.5784912109375, 707.39990234375, 740.2212524414062, 773.0426025390625, 805.864013671875, 838.6853637695312, 871.5067138671875, 904.328125, 937.1494750976562, 969.9708251953125, 1002.792236328125, 1035.6136474609375, 1068.4349365234375, 1101.25634765625, 1134.0777587890625, 1166.899169921875, 1199.720458984375, 1232.5418701171875, 1265.36328125, 1298.1846923828125, 1331.0059814453125, 1363.827392578125, 1396.6488037109375, 1429.47021484375, 1462.29150390625, 1495.1129150390625, 1527.9342041015625]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 9.0, 12.0, 17.0, 9.0, 14.0, 15.0, 19.0, 21.0, 20.0, 28.0, 24.0, 31.0, 41.0, 63.0, 95.0, 147.0, 94.0, 49.0, 32.0, 24.0, 31.0, 32.0, 16.0, 17.0, 23.0, 23.0, 13.0, 18.0, 9.0, 14.0, 10.0, 2.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-193.44381713867188, -187.4773712158203, -181.5109405517578, -175.54449462890625, -169.57806396484375, -163.6116180419922, -157.64517211914062, -151.67874145507812, -145.71229553222656, -139.745849609375, -133.7794189453125, -127.81297302246094, -121.8465347290039, -115.88009643554688, -109.91365051269531, -103.94721221923828, -97.98077392578125, -92.01433563232422, -86.04789733886719, -80.08145141601562, -74.1150131225586, -68.14857482910156, -62.182132720947266, -56.21569061279297, -50.24925231933594, -44.282814025878906, -38.31637191772461, -32.34992980957031, -26.38349151611328, -20.417051315307617, -14.450611114501953, -8.484169006347656, -2.5177154541015625, 3.4487247467041016, 9.415164947509766, 15.38160514831543, 21.348045349121094, 27.314485549926758, 33.28092575073242, 39.24736785888672, 45.21380615234375, 51.18024444580078, 57.14668655395508, 63.113128662109375, 69.0795669555664, 75.04600524902344, 81.012451171875, 86.97888946533203, 92.94532775878906, 98.9117660522461, 104.87820434570312, 110.84465026855469, 116.81108856201172, 122.77752685546875, 128.7439727783203, 134.71041870117188, 140.67684936523438, 146.64329528808594, 152.60972595214844, 158.576171875, 164.5426025390625, 170.50904846191406, 176.47549438476562, 182.44192504882812, 188.4083709716797]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 10.0, 36.0, 56.0, 85.0, 203.0, 346.0, 723.0, 1692.0, 5161.0, 23533.0, 440905.0, 3484168.0, 214387.0, 16712.0, 3899.0, 1332.0, 503.0, 256.0, 110.0, 67.0, 53.0, 24.0, 11.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.5, -45.2890625, -44.078125, -42.8671875, -41.65625, -40.4453125, -39.234375, -38.0234375, -36.8125, -35.6015625, -34.390625, -33.1796875, -31.96875, -30.7578125, -29.546875, -28.3359375, -27.125, -25.9140625, -24.703125, -23.4921875, -22.28125, -21.0703125, -19.859375, -18.6484375, -17.4375, -16.2265625, -15.015625, -13.8046875, -12.59375, -11.3828125, -10.171875, -8.9609375, -7.75, -6.5390625, -5.328125, -4.1171875, -2.90625, -1.6953125, -0.484375, 0.7265625, 1.9375, 3.1484375, 4.359375, 5.5703125, 6.78125, 7.9921875, 9.203125, 10.4140625, 11.625, 12.8359375, 14.046875, 15.2578125, 16.46875, 17.6796875, 18.890625, 20.1015625, 21.3125, 22.5234375, 23.734375, 24.9453125, 26.15625, 27.3671875, 28.578125, 29.7890625, 31.0]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 11.0, 10.0, 15.0, 12.0, 18.0, 17.0, 26.0, 18.0, 31.0, 30.0, 33.0, 49.0, 42.0, 42.0, 38.0, 55.0, 56.0, 52.0, 54.0, 45.0, 41.0, 41.0, 38.0, 31.0, 24.0, 18.0, 33.0, 23.0, 20.0, 11.0, 14.0, 11.0, 7.0, 8.0, 5.0, 3.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.6171875, -9.3333740234375, -9.049560546875, -8.7657470703125, -8.48193359375, -8.1981201171875, -7.914306640625, -7.6304931640625, -7.3466796875, -7.0628662109375, -6.779052734375, -6.4952392578125, -6.21142578125, -5.9276123046875, -5.643798828125, -5.3599853515625, -5.076171875, -4.7923583984375, -4.508544921875, -4.2247314453125, -3.94091796875, -3.6571044921875, -3.373291015625, -3.0894775390625, -2.8056640625, -2.5218505859375, -2.238037109375, -1.9542236328125, -1.67041015625, -1.3865966796875, -1.102783203125, -0.8189697265625, -0.53515625, -0.2513427734375, 0.032470703125, 0.3162841796875, 0.60009765625, 0.8839111328125, 1.167724609375, 1.4515380859375, 1.7353515625, 2.0191650390625, 2.302978515625, 2.5867919921875, 2.87060546875, 3.1544189453125, 3.438232421875, 3.7220458984375, 4.005859375, 4.2896728515625, 4.573486328125, 4.8572998046875, 5.14111328125, 5.4249267578125, 5.708740234375, 5.9925537109375, 6.2763671875, 6.5601806640625, 6.843994140625, 7.1278076171875, 7.41162109375, 7.6954345703125, 7.979248046875, 8.2630615234375, 8.546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 4.0, 14.0, 14.0, 37.0, 69.0, 170.0, 566.0, 3195.0, 3884979.0, 302017.0, 2361.0, 528.0, 172.0, 90.0, 28.0, 15.0, 11.0, 2.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-221.875, -215.697265625, -209.51953125, -203.341796875, -197.1640625, -190.986328125, -184.80859375, -178.630859375, -172.453125, -166.275390625, -160.09765625, -153.919921875, -147.7421875, -141.564453125, -135.38671875, -129.208984375, -123.03125, -116.853515625, -110.67578125, -104.498046875, -98.3203125, -92.142578125, -85.96484375, -79.787109375, -73.609375, -67.431640625, -61.25390625, -55.076171875, -48.8984375, -42.720703125, -36.54296875, -30.365234375, -24.1875, -18.009765625, -11.83203125, -5.654296875, 0.5234375, 6.701171875, 12.87890625, 19.056640625, 25.234375, 31.412109375, 37.58984375, 43.767578125, 49.9453125, 56.123046875, 62.30078125, 68.478515625, 74.65625, 80.833984375, 87.01171875, 93.189453125, 99.3671875, 105.544921875, 111.72265625, 117.900390625, 124.078125, 130.255859375, 136.43359375, 142.611328125, 148.7890625, 154.966796875, 161.14453125, 167.322265625, 173.5]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 11.0, 29.0, 53.0, 129.0, 258.0, 586.0, 1213.0, 972.0, 452.0, 199.0, 72.0, 38.0, 25.0, 14.0, 9.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.25, -33.150390625, -31.05078125, -28.951171875, -26.8515625, -24.751953125, -22.65234375, -20.552734375, -18.453125, -16.353515625, -14.25390625, -12.154296875, -10.0546875, -7.955078125, -5.85546875, -3.755859375, -1.65625, 0.443359375, 2.54296875, 4.642578125, 6.7421875, 8.841796875, 10.94140625, 13.041015625, 15.140625, 17.240234375, 19.33984375, 21.439453125, 23.5390625, 25.638671875, 27.73828125, 29.837890625, 31.9375, 34.037109375, 36.13671875, 38.236328125, 40.3359375, 42.435546875, 44.53515625, 46.634765625, 48.734375, 50.833984375, 52.93359375, 55.033203125, 57.1328125, 59.232421875, 61.33203125, 63.431640625, 65.53125, 67.630859375, 69.73046875, 71.830078125, 73.9296875, 76.029296875, 78.12890625, 80.228515625, 82.328125, 84.427734375, 86.52734375, 88.626953125, 90.7265625, 92.826171875, 94.92578125, 97.025390625, 99.125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 2.0, 14.0, 15.0, 37.0, 106.0, 253.0, 265.0, 160.0, 57.0, 38.0, 18.0, 7.0, 7.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-432.15667724609375, -412.7328796386719, -393.3091125488281, -373.88531494140625, -354.4615478515625, -335.0377502441406, -315.61395263671875, -296.190185546875, -276.7663879394531, -257.34259033203125, -237.9188232421875, -218.49502563476562, -199.0712432861328, -179.6474609375, -160.22366333007812, -140.7998809814453, -121.3760986328125, -101.95231628417969, -82.52852630615234, -63.104740142822266, -43.68095397949219, -24.257171630859375, -4.833381652832031, 14.590408325195312, 34.014190673828125, 53.4379768371582, 72.86176300048828, 92.28555297851562, 111.70933532714844, 131.13311767578125, 150.55691528320312, 169.98069763183594, 189.404541015625, 208.8283233642578, 228.25210571289062, 247.6759033203125, 267.09967041015625, 286.5234680175781, 305.947265625, 325.37103271484375, 344.7948303222656, 364.2186279296875, 383.64239501953125, 403.0661926269531, 422.489990234375, 441.91375732421875, 461.3375549316406, 480.7613525390625, 500.18511962890625, 519.60888671875, 539.03271484375, 558.4564819335938, 577.8802490234375, 597.3040771484375, 616.7278442382812, 636.151611328125, 655.575439453125, 674.9992065429688, 694.4230346679688, 713.8468017578125, 733.2705688476562, 752.6943359375, 772.1181640625, 791.5419311523438, 810.9656982421875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 12.0, 14.0, 15.0, 14.0, 22.0, 21.0, 21.0, 26.0, 42.0, 57.0, 56.0, 66.0, 67.0, 74.0, 93.0, 77.0, 58.0, 52.0, 48.0, 35.0, 29.0, 23.0, 10.0, 17.0, 8.0, 9.0, 6.0, 5.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-321.7721862792969, -313.84332275390625, -305.91448974609375, -297.9856262207031, -290.0567626953125, -282.1279296875, -274.1990661621094, -266.2702331542969, -258.34136962890625, -250.4125213623047, -242.48367309570312, -234.5548095703125, -226.62596130371094, -218.69711303710938, -210.76824951171875, -202.8394012451172, -194.91055297851562, -186.98170471191406, -179.0528564453125, -171.12399291992188, -163.1951446533203, -155.26629638671875, -147.33743286132812, -139.40858459472656, -131.479736328125, -123.55088806152344, -115.62203216552734, -107.69317626953125, -99.76432800292969, -91.83547973632812, -83.90662384033203, -75.97776794433594, -68.04891967773438, -60.12006759643555, -52.19121551513672, -44.26236343383789, -36.33351135253906, -28.404659271240234, -20.475807189941406, -12.546955108642578, -4.61810302734375, 3.310749053955078, 11.239601135253906, 19.168453216552734, 27.097305297851562, 35.02615737915039, 42.95500946044922, 50.88386154174805, 58.812713623046875, 66.74156188964844, 74.67041778564453, 82.59927368164062, 90.52812194824219, 98.45697021484375, 106.38582611083984, 114.31468200683594, 122.2435302734375, 130.17237854003906, 138.10122680664062, 146.03009033203125, 153.9589385986328, 161.88778686523438, 169.816650390625, 177.74549865722656, 185.67434692382812]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 6.0, 16.0, 16.0, 36.0, 50.0, 79.0, 158.0, 302.0, 620.0, 1539.0, 4420.0, 17360.0, 126827.0, 786811.0, 90033.0, 13876.0, 3862.0, 1353.0, 568.0, 268.0, 134.0, 70.0, 48.0, 35.0, 21.0, 11.0, 7.0, 9.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.53125, -38.41552734375, -37.2998046875, -36.18408203125, -35.068359375, -33.95263671875, -32.8369140625, -31.72119140625, -30.60546875, -29.48974609375, -28.3740234375, -27.25830078125, -26.142578125, -25.02685546875, -23.9111328125, -22.79541015625, -21.6796875, -20.56396484375, -19.4482421875, -18.33251953125, -17.216796875, -16.10107421875, -14.9853515625, -13.86962890625, -12.75390625, -11.63818359375, -10.5224609375, -9.40673828125, -8.291015625, -7.17529296875, -6.0595703125, -4.94384765625, -3.828125, -2.71240234375, -1.5966796875, -0.48095703125, 0.634765625, 1.75048828125, 2.8662109375, 3.98193359375, 5.09765625, 6.21337890625, 7.3291015625, 8.44482421875, 9.560546875, 10.67626953125, 11.7919921875, 12.90771484375, 14.0234375, 15.13916015625, 16.2548828125, 17.37060546875, 18.486328125, 19.60205078125, 20.7177734375, 21.83349609375, 22.94921875, 24.06494140625, 25.1806640625, 26.29638671875, 27.412109375, 28.52783203125, 29.6435546875, 30.75927734375, 31.875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 12.0, 16.0, 20.0, 21.0, 22.0, 38.0, 57.0, 82.0, 80.0, 72.0, 94.0, 104.0, 85.0, 77.0, 57.0, 55.0, 29.0, 28.0, 17.0, 15.0, 7.0, 8.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.0625, -22.33203125, -21.6015625, -20.87109375, -20.140625, -19.41015625, -18.6796875, -17.94921875, -17.21875, -16.48828125, -15.7578125, -15.02734375, -14.296875, -13.56640625, -12.8359375, -12.10546875, -11.375, -10.64453125, -9.9140625, -9.18359375, -8.453125, -7.72265625, -6.9921875, -6.26171875, -5.53125, -4.80078125, -4.0703125, -3.33984375, -2.609375, -1.87890625, -1.1484375, -0.41796875, 0.3125, 1.04296875, 1.7734375, 2.50390625, 3.234375, 3.96484375, 4.6953125, 5.42578125, 6.15625, 6.88671875, 7.6171875, 8.34765625, 9.078125, 9.80859375, 10.5390625, 11.26953125, 12.0, 12.73046875, 13.4609375, 14.19140625, 14.921875, 15.65234375, 16.3828125, 17.11328125, 17.84375, 18.57421875, 19.3046875, 20.03515625, 20.765625, 21.49609375, 22.2265625, 22.95703125, 23.6875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 18.0, 18.0, 34.0, 57.0, 118.0, 280.0, 738.0, 4148.0, 166671.0, 867474.0, 7221.0, 1062.0, 318.0, 152.0, 86.0, 39.0, 42.0, 26.0, 14.0, 11.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.125, -63.21533203125, -61.3056640625, -59.39599609375, -57.486328125, -55.57666015625, -53.6669921875, -51.75732421875, -49.84765625, -47.93798828125, -46.0283203125, -44.11865234375, -42.208984375, -40.29931640625, -38.3896484375, -36.47998046875, -34.5703125, -32.66064453125, -30.7509765625, -28.84130859375, -26.931640625, -25.02197265625, -23.1123046875, -21.20263671875, -19.29296875, -17.38330078125, -15.4736328125, -13.56396484375, -11.654296875, -9.74462890625, -7.8349609375, -5.92529296875, -4.015625, -2.10595703125, -0.1962890625, 1.71337890625, 3.623046875, 5.53271484375, 7.4423828125, 9.35205078125, 11.26171875, 13.17138671875, 15.0810546875, 16.99072265625, 18.900390625, 20.81005859375, 22.7197265625, 24.62939453125, 26.5390625, 28.44873046875, 30.3583984375, 32.26806640625, 34.177734375, 36.08740234375, 37.9970703125, 39.90673828125, 41.81640625, 43.72607421875, 45.6357421875, 47.54541015625, 49.455078125, 51.36474609375, 53.2744140625, 55.18408203125, 57.09375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 2.0, 5.0, 9.0, 7.0, 9.0, 11.0, 16.0, 30.0, 24.0, 33.0, 48.0, 48.0, 52.0, 85.0, 94.0, 91.0, 75.0, 58.0, 62.0, 47.0, 31.0, 25.0, 17.0, 22.0, 23.0, 19.0, 8.0, 14.0, 3.0, 7.0, 8.0, 2.0, 5.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.25, -62.36474609375, -60.4794921875, -58.59423828125, -56.708984375, -54.82373046875, -52.9384765625, -51.05322265625, -49.16796875, -47.28271484375, -45.3974609375, -43.51220703125, -41.626953125, -39.74169921875, -37.8564453125, -35.97119140625, -34.0859375, -32.20068359375, -30.3154296875, -28.43017578125, -26.544921875, -24.65966796875, -22.7744140625, -20.88916015625, -19.00390625, -17.11865234375, -15.2333984375, -13.34814453125, -11.462890625, -9.57763671875, -7.6923828125, -5.80712890625, -3.921875, -2.03662109375, -0.1513671875, 1.73388671875, 3.619140625, 5.50439453125, 7.3896484375, 9.27490234375, 11.16015625, 13.04541015625, 14.9306640625, 16.81591796875, 18.701171875, 20.58642578125, 22.4716796875, 24.35693359375, 26.2421875, 28.12744140625, 30.0126953125, 31.89794921875, 33.783203125, 35.66845703125, 37.5537109375, 39.43896484375, 41.32421875, 43.20947265625, 45.0947265625, 46.97998046875, 48.865234375, 50.75048828125, 52.6357421875, 54.52099609375, 56.40625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 6.0, 0.0, 4.0, 3.0, 4.0, 10.0, 8.0, 5.0, 6.0, 12.0, 19.0, 25.0, 49.0, 88.0, 196.0, 399.0, 900.0, 2960.0, 13844.0, 330772.0, 679985.0, 14512.0, 3013.0, 897.0, 357.0, 218.0, 98.0, 58.0, 34.0, 30.0, 12.0, 10.0, 11.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.31640625, -7.01165771484375, -6.7069091796875, -6.40216064453125, -6.097412109375, -5.79266357421875, -5.4879150390625, -5.18316650390625, -4.87841796875, -4.57366943359375, -4.2689208984375, -3.96417236328125, -3.659423828125, -3.35467529296875, -3.0499267578125, -2.74517822265625, -2.4404296875, -2.13568115234375, -1.8309326171875, -1.52618408203125, -1.221435546875, -0.91668701171875, -0.6119384765625, -0.30718994140625, -0.00244140625, 0.30230712890625, 0.6070556640625, 0.91180419921875, 1.216552734375, 1.52130126953125, 1.8260498046875, 2.13079833984375, 2.435546875, 2.74029541015625, 3.0450439453125, 3.34979248046875, 3.654541015625, 3.95928955078125, 4.2640380859375, 4.56878662109375, 4.87353515625, 5.17828369140625, 5.4830322265625, 5.78778076171875, 6.092529296875, 6.39727783203125, 6.7020263671875, 7.00677490234375, 7.3115234375, 7.61627197265625, 7.9210205078125, 8.22576904296875, 8.530517578125, 8.83526611328125, 9.1400146484375, 9.44476318359375, 9.74951171875, 10.05426025390625, 10.3590087890625, 10.66375732421875, 10.968505859375, 11.27325439453125, 11.5780029296875, 11.88275146484375, 12.1875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 7.0, 12.0, 21.0, 24.0, 50.0, 105.0, 243.0, 274.0, 101.0, 53.0, 37.0, 19.0, 16.0, 6.0, 9.0, 5.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00452423095703125, -0.004405617713928223, -0.004287004470825195, -0.004168391227722168, -0.004049777984619141, -0.003931164741516113, -0.003812551498413086, -0.0036939382553100586, -0.0035753250122070312, -0.003456711769104004, -0.0033380985260009766, -0.0032194852828979492, -0.003100872039794922, -0.0029822587966918945, -0.002863645553588867, -0.00274503231048584, -0.0026264190673828125, -0.002507805824279785, -0.002389192581176758, -0.0022705793380737305, -0.002151966094970703, -0.0020333528518676758, -0.0019147396087646484, -0.001796126365661621, -0.0016775131225585938, -0.0015588998794555664, -0.001440286636352539, -0.0013216733932495117, -0.0012030601501464844, -0.001084446907043457, -0.0009658336639404297, -0.0008472204208374023, -0.000728607177734375, -0.0006099939346313477, -0.0004913806915283203, -0.00037276744842529297, -0.0002541542053222656, -0.00013554096221923828, -1.6927719116210938e-05, 0.0001016855239868164, 0.00022029876708984375, 0.0003389120101928711, 0.00045752525329589844, 0.0005761384963989258, 0.0006947517395019531, 0.0008133649826049805, 0.0009319782257080078, 0.0010505914688110352, 0.0011692047119140625, 0.0012878179550170898, 0.0014064311981201172, 0.0015250444412231445, 0.0016436576843261719, 0.0017622709274291992, 0.0018808841705322266, 0.001999497413635254, 0.0021181106567382812, 0.0022367238998413086, 0.002355337142944336, 0.0024739503860473633, 0.0025925636291503906, 0.002711176872253418, 0.0028297901153564453, 0.0029484033584594727, 0.0030670166015625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 13.0, 10.0, 19.0, 28.0, 51.0, 81.0, 132.0, 243.0, 507.0, 1102.0, 2558.0, 7880.0, 48011.0, 936325.0, 39649.0, 7290.0, 2474.0, 1059.0, 498.0, 258.0, 141.0, 67.0, 39.0, 26.0, 14.0, 14.0, 15.0, 8.0, 10.0, 5.0, 6.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2890625, -10.9412841796875, -10.593505859375, -10.2457275390625, -9.89794921875, -9.5501708984375, -9.202392578125, -8.8546142578125, -8.5068359375, -8.1590576171875, -7.811279296875, -7.4635009765625, -7.11572265625, -6.7679443359375, -6.420166015625, -6.0723876953125, -5.724609375, -5.3768310546875, -5.029052734375, -4.6812744140625, -4.33349609375, -3.9857177734375, -3.637939453125, -3.2901611328125, -2.9423828125, -2.5946044921875, -2.246826171875, -1.8990478515625, -1.55126953125, -1.2034912109375, -0.855712890625, -0.5079345703125, -0.16015625, 0.1876220703125, 0.535400390625, 0.8831787109375, 1.23095703125, 1.5787353515625, 1.926513671875, 2.2742919921875, 2.6220703125, 2.9698486328125, 3.317626953125, 3.6654052734375, 4.01318359375, 4.3609619140625, 4.708740234375, 5.0565185546875, 5.404296875, 5.7520751953125, 6.099853515625, 6.4476318359375, 6.79541015625, 7.1431884765625, 7.490966796875, 7.8387451171875, 8.1865234375, 8.5343017578125, 8.882080078125, 9.2298583984375, 9.57763671875, 9.9254150390625, 10.273193359375, 10.6209716796875, 10.96875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 6.0, 7.0, 7.0, 10.0, 10.0, 13.0, 16.0, 26.0, 34.0, 67.0, 98.0, 150.0, 151.0, 109.0, 78.0, 57.0, 32.0, 24.0, 15.0, 14.0, 10.0, 8.0, 8.0, 8.0, 6.0, 6.0, 5.0, 5.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.15625, -5.946044921875, -5.73583984375, -5.525634765625, -5.3154296875, -5.105224609375, -4.89501953125, -4.684814453125, -4.474609375, -4.264404296875, -4.05419921875, -3.843994140625, -3.6337890625, -3.423583984375, -3.21337890625, -3.003173828125, -2.79296875, -2.582763671875, -2.37255859375, -2.162353515625, -1.9521484375, -1.741943359375, -1.53173828125, -1.321533203125, -1.111328125, -0.901123046875, -0.69091796875, -0.480712890625, -0.2705078125, -0.060302734375, 0.14990234375, 0.360107421875, 0.5703125, 0.780517578125, 0.99072265625, 1.200927734375, 1.4111328125, 1.621337890625, 1.83154296875, 2.041748046875, 2.251953125, 2.462158203125, 2.67236328125, 2.882568359375, 3.0927734375, 3.302978515625, 3.51318359375, 3.723388671875, 3.93359375, 4.143798828125, 4.35400390625, 4.564208984375, 4.7744140625, 4.984619140625, 5.19482421875, 5.405029296875, 5.615234375, 5.825439453125, 6.03564453125, 6.245849609375, 6.4560546875, 6.666259765625, 6.87646484375, 7.086669921875, 7.296875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 10.0, 17.0, 104.0, 566.0, 201.0, 59.0, 21.0, 15.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.60238647460938, -142.18923950195312, -125.77609252929688, -109.36295318603516, -92.9498062133789, -76.53665924072266, -60.12351989746094, -43.71037292480469, -27.297225952148438, -10.88408088684082, 5.529064178466797, 21.94220733642578, 38.35535430908203, 54.76850128173828, 71.181640625, 87.59478759765625, 104.0079345703125, 120.42108154296875, 136.834228515625, 153.24737548828125, 169.6605224609375, 186.07366943359375, 202.48680114746094, 218.8999481201172, 235.31309509277344, 251.7262420654297, 268.1393737792969, 284.5525207519531, 300.9656677246094, 317.3788146972656, 333.7919616699219, 350.2051086425781, 366.61822509765625, 383.0313720703125, 399.44451904296875, 415.857666015625, 432.27081298828125, 448.6839599609375, 465.09710693359375, 481.51025390625, 497.92340087890625, 514.3365478515625, 530.7496948242188, 547.162841796875, 563.5759887695312, 579.9891357421875, 596.4022827148438, 612.8154296875, 629.228515625, 645.6416625976562, 662.0548095703125, 678.4679565429688, 694.881103515625, 711.2942504882812, 727.7073974609375, 744.1205444335938, 760.53369140625, 776.9468383789062, 793.3599853515625, 809.7731323242188, 826.186279296875, 842.5994262695312, 859.0125732421875, 875.4257202148438, 891.8388671875]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 5.0, 6.0, 5.0, 2.0, 10.0, 10.0, 13.0, 15.0, 21.0, 20.0, 9.0, 29.0, 105.0, 97.0, 74.0, 46.0, 62.0, 108.0, 118.0, 41.0, 22.0, 24.0, 21.0, 18.0, 19.0, 13.0, 21.0, 5.0, 13.0, 4.0, 7.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-181.88784790039062, -176.7776336669922, -171.66741943359375, -166.5572052001953, -161.44699096679688, -156.33677673339844, -151.2265625, -146.11634826660156, -141.00613403320312, -135.8959197998047, -130.78570556640625, -125.67549133300781, -120.56527709960938, -115.45506286621094, -110.3448486328125, -105.23463439941406, -100.12442779541016, -95.01421356201172, -89.90399932861328, -84.79378509521484, -79.6835708618164, -74.57335662841797, -69.46315002441406, -64.35293579101562, -59.24271774291992, -54.132503509521484, -49.02228927612305, -43.912078857421875, -38.80186462402344, -33.691650390625, -28.581436157226562, -23.471221923828125, -18.361007690429688, -13.25079345703125, -8.140580177307129, -3.030366897583008, 2.0798473358154297, 7.190061569213867, 12.300273895263672, 17.41048812866211, 22.520702362060547, 27.630916595458984, 32.74113082885742, 37.851341247558594, 42.96155548095703, 48.07176971435547, 53.181983947753906, 58.292198181152344, 63.40241241455078, 68.51262664794922, 73.62284088134766, 78.7330551147461, 83.84326934814453, 88.95348358154297, 94.06369018554688, 99.17390441894531, 104.28411865234375, 109.39433288574219, 114.50454711914062, 119.61476135253906, 124.7249755859375, 129.83518981933594, 134.94540405273438, 140.0556182861328, 145.16583251953125]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 14.0, 13.0, 32.0, 32.0, 54.0, 60.0, 88.0, 326.0, 119.0, 75.0, 55.0, 39.0, 34.0, 20.0, 11.0, 7.0, 6.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.78125, -23.94482421875, -23.1083984375, -22.27197265625, -21.435546875, -20.59912109375, -19.7626953125, -18.92626953125, -18.08984375, -17.25341796875, -16.4169921875, -15.58056640625, -14.744140625, -13.90771484375, -13.0712890625, -12.23486328125, -11.3984375, -10.56201171875, -9.7255859375, -8.88916015625, -8.052734375, -7.21630859375, -6.3798828125, -5.54345703125, -4.70703125, -3.87060546875, -3.0341796875, -2.19775390625, -1.361328125, -0.52490234375, 0.3115234375, 1.14794921875, 1.984375, 2.82080078125, 3.6572265625, 4.49365234375, 5.330078125, 6.16650390625, 7.0029296875, 7.83935546875, 8.67578125, 9.51220703125, 10.3486328125, 11.18505859375, 12.021484375, 12.85791015625, 13.6943359375, 14.53076171875, 15.3671875, 16.20361328125, 17.0400390625, 17.87646484375, 18.712890625, 19.54931640625, 20.3857421875, 21.22216796875, 22.05859375, 22.89501953125, 23.7314453125, 24.56787109375, 25.404296875, 26.24072265625, 27.0771484375, 27.91357421875, 28.75]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 6.0, 12.0, 9.0, 7.0, 18.0, 30.0, 40.0, 68.0, 130.0, 403.0, 1817.0, 243606.0, 8139432.0, 2196.0, 451.0, 164.0, 79.0, 24.0, 33.0, 31.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-249.75706481933594, -241.95896911621094, -234.16085815429688, -226.36276245117188, -218.5646514892578, -210.7665557861328, -202.96844482421875, -195.17034912109375, -187.3722381591797, -179.5741424560547, -171.77603149414062, -163.97793579101562, -156.17982482910156, -148.38172912597656, -140.5836181640625, -132.7855224609375, -124.98741912841797, -117.18931579589844, -109.3912124633789, -101.59310913085938, -93.79500579833984, -85.99690246582031, -78.19880676269531, -70.40069580078125, -62.602596282958984, -54.80449295043945, -47.00638961791992, -39.208290100097656, -31.410184860229492, -23.612083435058594, -15.813980102539062, -8.015876770019531, -0.2177734375, 7.580329418182373, 15.378432273864746, 23.17653465270996, 30.974637985229492, 38.77273941040039, 46.57084274291992, 54.36894607543945, 62.167049407958984, 69.96514892578125, 77.76325225830078, 85.56135559082031, 93.35945892333984, 101.15756225585938, 108.9556655883789, 116.75376892089844, 124.55187225341797, 132.3499755859375, 140.1480712890625, 147.94618225097656, 155.74427795410156, 163.54238891601562, 171.34048461914062, 179.1385955810547, 186.9366912841797, 194.7347869873047, 202.53289794921875, 210.33099365234375, 218.1291046142578, 225.9272003173828, 233.72531127929688, 241.52340698242188, 249.32151794433594]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 2.0, 5.0, 4.0, 9.0, 8.0, 7.0, 5.0, 1.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-248.71612548828125, -240.24270629882812, -231.76930236816406, -223.2958984375, -214.82247924804688, -206.34906005859375, -197.8756561279297, -189.40225219726562, -180.9288330078125, -172.45541381835938, -163.9820098876953, -155.50860595703125, -147.03518676757812, -138.561767578125, -130.08836364746094, -121.61495208740234, -113.14154052734375, -104.66812896728516, -96.19471740722656, -87.72130584716797, -79.24789428710938, -70.77448272705078, -62.30107116699219, -53.827659606933594, -45.354248046875, -36.880836486816406, -28.407424926757812, -19.93401336669922, -11.460601806640625, -2.9871902465820312, 5.4862213134765625, 13.959632873535156, 22.433013916015625, 30.90642547607422, 39.37983703613281, 47.853248596191406, 56.32666015625, 64.8000717163086, 73.27348327636719, 81.74689483642578, 90.22030639648438, 98.69371795654297, 107.16712951660156, 115.64054107666016, 124.11395263671875, 132.58737182617188, 141.06077575683594, 149.5341796875, 158.00759887695312, 166.48101806640625, 174.9544219970703, 183.42782592773438, 191.9012451171875, 200.37466430664062, 208.8480682373047, 217.32147216796875, 225.79489135742188, 234.268310546875, 242.74171447753906, 251.21511840820312, 259.68853759765625, 268.1619567871094, 276.6353759765625, 285.1087646484375, 293.5821838378906]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 1.0, 8.0, 12.0, 4.0, 12.0, 17.0, 16.0, 22.0, 22.0, 18.0, 28.0, 41.0, 27.0, 64.0, 58.0, 68.0, 62.0, 53.0, 63.0, 61.0, 47.0, 40.0, 42.0, 34.0, 28.0, 34.0, 20.0, 21.0, 12.0, 14.0, 9.0, 15.0, 6.0, 5.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-7.734375, -7.5419921875, -7.349609375, -7.1572265625, -6.96484375, -6.7724609375, -6.580078125, -6.3876953125, -6.1953125, -6.0029296875, -5.810546875, -5.6181640625, -5.42578125, -5.2333984375, -5.041015625, -4.8486328125, -4.65625, -4.4638671875, -4.271484375, -4.0791015625, -3.88671875, -3.6943359375, -3.501953125, -3.3095703125, -3.1171875, -2.9248046875, -2.732421875, -2.5400390625, -2.34765625, -2.1552734375, -1.962890625, -1.7705078125, -1.578125, -1.3857421875, -1.193359375, -1.0009765625, -0.80859375, -0.6162109375, -0.423828125, -0.2314453125, -0.0390625, 0.1533203125, 0.345703125, 0.5380859375, 0.73046875, 0.9228515625, 1.115234375, 1.3076171875, 1.5, 1.6923828125, 1.884765625, 2.0771484375, 2.26953125, 2.4619140625, 2.654296875, 2.8466796875, 3.0390625, 3.2314453125, 3.423828125, 3.6162109375, 3.80859375, 4.0009765625, 4.193359375, 4.3857421875, 4.578125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 4.0, 11.0, 9.0, 26.0, 29.0, 52.0, 78.0, 160.0, 272.0, 437.0, 776.0, 1500.0, 3262.0, 7860.0, 22523.0, 73059.0, 204190.0, 142578.0, 43141.0, 14016.0, 5315.0, 2440.0, 1107.0, 577.0, 303.0, 208.0, 115.0, 73.0, 36.0, 26.0, 14.0, 16.0, 9.0, 7.0, 7.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-90.6875, -87.7412109375, -84.794921875, -81.8486328125, -78.90234375, -75.9560546875, -73.009765625, -70.0634765625, -67.1171875, -64.1708984375, -61.224609375, -58.2783203125, -55.33203125, -52.3857421875, -49.439453125, -46.4931640625, -43.546875, -40.6005859375, -37.654296875, -34.7080078125, -31.76171875, -28.8154296875, -25.869140625, -22.9228515625, -19.9765625, -17.0302734375, -14.083984375, -11.1376953125, -8.19140625, -5.2451171875, -2.298828125, 0.6474609375, 3.59375, 6.5400390625, 9.486328125, 12.4326171875, 15.37890625, 18.3251953125, 21.271484375, 24.2177734375, 27.1640625, 30.1103515625, 33.056640625, 36.0029296875, 38.94921875, 41.8955078125, 44.841796875, 47.7880859375, 50.734375, 53.6806640625, 56.626953125, 59.5732421875, 62.51953125, 65.4658203125, 68.412109375, 71.3583984375, 74.3046875, 77.2509765625, 80.197265625, 83.1435546875, 86.08984375, 89.0361328125, 91.982421875, 94.9287109375, 97.875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 6.0, 6.0, 7.0, 7.0, 7.0, 12.0, 17.0, 22.0, 31.0, 40.0, 69.0, 72.0, 68.0, 97.0, 94.0, 100.0, 82.0, 67.0, 47.0, 34.0, 19.0, 28.0, 18.0, 10.0, 11.0, 7.0, 7.0, 4.0, 2.0, 5.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-23.515625, -22.8997802734375, -22.283935546875, -21.6680908203125, -21.05224609375, -20.4364013671875, -19.820556640625, -19.2047119140625, -18.5888671875, -17.9730224609375, -17.357177734375, -16.7413330078125, -16.12548828125, -15.5096435546875, -14.893798828125, -14.2779541015625, -13.662109375, -13.0462646484375, -12.430419921875, -11.8145751953125, -11.19873046875, -10.5828857421875, -9.967041015625, -9.3511962890625, -8.7353515625, -8.1195068359375, -7.503662109375, -6.8878173828125, -6.27197265625, -5.6561279296875, -5.040283203125, -4.4244384765625, -3.80859375, -3.1927490234375, -2.576904296875, -1.9610595703125, -1.34521484375, -0.7293701171875, -0.113525390625, 0.5023193359375, 1.1181640625, 1.7340087890625, 2.349853515625, 2.9656982421875, 3.58154296875, 4.1973876953125, 4.813232421875, 5.4290771484375, 6.044921875, 6.6607666015625, 7.276611328125, 7.8924560546875, 8.50830078125, 9.1241455078125, 9.739990234375, 10.3558349609375, 10.9716796875, 11.5875244140625, 12.203369140625, 12.8192138671875, 13.43505859375, 14.0509033203125, 14.666748046875, 15.2825927734375, 15.8984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 9.0, 9.0, 32.0, 60.0, 101.0, 131.0, 64.0, 32.0, 17.0, 14.0, 10.0, 9.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0], "bins": [-309.65032958984375, -303.609375, -297.56842041015625, -291.5274658203125, -285.48651123046875, -279.445556640625, -273.40460205078125, -267.3636474609375, -261.32269287109375, -255.28173828125, -249.24078369140625, -243.1998291015625, -237.15887451171875, -231.11793518066406, -225.0769805908203, -219.03602600097656, -212.99508666992188, -206.95413208007812, -200.91317749023438, -194.87222290039062, -188.83126831054688, -182.7903289794922, -176.74937438964844, -170.7084197998047, -164.66746520996094, -158.6265106201172, -152.58555603027344, -146.5446014404297, -140.503662109375, -134.46270751953125, -128.4217529296875, -122.38079833984375, -116.33984375, -110.29888916015625, -104.2579345703125, -98.21698760986328, -92.17603302001953, -86.13507843017578, -80.09413146972656, -74.05317687988281, -68.01222229003906, -61.97126770019531, -55.93031692504883, -49.889366149902344, -43.848411560058594, -37.807456970214844, -31.76650619506836, -25.725555419921875, -19.684600830078125, -13.643648147583008, -7.602695465087891, -1.5617427825927734, 4.479209899902344, 10.520162582397461, 16.561115264892578, 22.602066040039062, 28.643020629882812, 34.68397521972656, 40.72492599487305, 46.76587677001953, 52.80683135986328, 58.84778594970703, 64.88873291015625, 70.9296875, 76.97064208984375]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 7.0, 6.0, 2.0, 8.0, 12.0, 22.0, 27.0, 50.0, 52.0, 85.0, 67.0, 39.0, 35.0, 24.0, 17.0, 7.0, 7.0, 5.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-187.84454345703125, -183.61148071289062, -179.37843322753906, -175.14537048339844, -170.91232299804688, -166.67926025390625, -162.4462127685547, -158.21315002441406, -153.9801025390625, -149.74703979492188, -145.5139923095703, -141.2809295654297, -137.04788208007812, -132.8148193359375, -128.58177185058594, -124.34870910644531, -120.11564636230469, -115.8825912475586, -111.6495361328125, -107.4164810180664, -103.18342590332031, -98.95036315917969, -94.7173080444336, -90.4842529296875, -86.2511978149414, -82.01814270019531, -77.78508758544922, -73.55203247070312, -69.3189697265625, -65.08592224121094, -60.85285949707031, -56.61980438232422, -52.386749267578125, -48.15369415283203, -43.92063903808594, -39.68758010864258, -35.454524993896484, -31.22146987915039, -26.988412857055664, -22.755355834960938, -18.522300720214844, -14.289244651794434, -10.056188583374023, -5.823132514953613, -1.5900764465332031, 2.6429786682128906, 6.876035690307617, 11.109092712402344, 15.342147827148438, 19.57520294189453, 23.808259963989258, 28.041316986083984, 32.27437210083008, 36.50742721557617, 40.74048614501953, 44.973541259765625, 49.20659637451172, 53.43965148925781, 57.672706604003906, 61.905765533447266, 66.13882446289062, 70.37187194824219, 74.60493469238281, 78.8379898071289, 83.071044921875]}, "eval/loss": 3.480835437774658, "eval/wer": 0.7460729869099564, "eval/runtime": 649.7344, "eval/samples_per_second": 4.066, "eval/steps_per_second": 0.509} \ No newline at end of file