diff --git "a/wandb/run-20220301_200256-37laivn6/files/wandb-summary.json" "b/wandb/run-20220301_200256-37laivn6/files/wandb-summary.json" --- "a/wandb/run-20220301_200256-37laivn6/files/wandb-summary.json" +++ "b/wandb/run-20220301_200256-37laivn6/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 3.9803, "train/learning_rate": 7.653061224489796e-07, "train/epoch": 1.0, "train/global_step": 892, "_runtime": 7639, "_timestamp": 1646172615, "_step": 894, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 14.0, 45.0, 311.0, 523.0, 99.0, 20.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.67470169067383, -27.166728973388672, -20.65875816345215, -14.150787353515625, -7.642814636230469, -1.1348419189453125, 5.373126983642578, 11.881099700927734, 18.38907241821289, 24.897045135498047, 31.40501594543457, 37.912986755371094, 44.42095947265625, 50.928932189941406, 57.4369010925293, 63.94487380981445, 70.45285034179688, 76.96082305908203, 83.46879577636719, 89.97676086425781, 96.4847412109375, 102.99270629882812, 109.50067901611328, 116.00865173339844, 122.51661682128906, 129.0245819091797, 135.53256225585938, 142.04052734375, 148.5485076904297, 155.0564727783203, 161.564453125, 168.07241821289062, 174.58038330078125, 181.08834838867188, 187.59632873535156, 194.1042938232422, 200.61227416992188, 207.1202392578125, 213.62820434570312, 220.1361846923828, 226.6441650390625, 233.15213012695312, 239.6601104736328, 246.16807556152344, 252.67605590820312, 259.18402099609375, 265.6919860839844, 272.199951171875, 278.70794677734375, 285.2159118652344, 291.723876953125, 298.23187255859375, 304.7398376464844, 311.247802734375, 317.7557678222656, 324.26373291015625, 330.7716979980469, 337.2796630859375, 343.7876281738281, 350.2956237792969, 356.8035888671875, 363.3115539550781, 369.81951904296875, 376.3275146484375, 382.8354797363281]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 3.0, 5.0, 4.0, 6.0, 8.0, 11.0, 11.0, 6.0, 17.0, 11.0, 17.0, 24.0, 19.0, 25.0, 20.0, 35.0, 35.0, 34.0, 50.0, 50.0, 57.0, 63.0, 77.0, 57.0, 44.0, 38.0, 38.0, 39.0, 23.0, 33.0, 23.0, 21.0, 16.0, 10.0, 12.0, 15.0, 11.0, 4.0, 8.0, 5.0, 8.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.06948852539062, -100.24678039550781, -97.42407989501953, -94.60137176513672, -91.77867126464844, -88.95596313476562, -86.13325500488281, -83.310546875, -80.48784637451172, -77.6651382446289, -74.84243774414062, -72.01972961425781, -69.197021484375, -66.37432098388672, -63.551612854003906, -60.72890853881836, -57.90620422363281, -55.083499908447266, -52.26079559326172, -49.438087463378906, -46.61538314819336, -43.79267883300781, -40.969970703125, -38.14726638793945, -35.324562072753906, -32.50185775756836, -29.67915153503418, -26.8564453125, -24.033740997314453, -21.211036682128906, -18.388330459594727, -15.565624237060547, -12.742919921875, -9.920214653015137, -7.097509384155273, -4.27480411529541, -1.4520988464355469, 1.3706064224243164, 4.19331169128418, 7.016017913818359, 9.838722229003906, 12.66142749786377, 15.484132766723633, 18.306838989257812, 21.12954330444336, 23.952247619628906, 26.774953842163086, 29.597660064697266, 32.42036437988281, 35.24306869506836, 38.065773010253906, 40.88848114013672, 43.711185455322266, 46.53388977050781, 49.356597900390625, 52.17930221557617, 55.00200653076172, 57.824710845947266, 60.64741516113281, 63.470123291015625, 66.29283142089844, 69.11553192138672, 71.93824005126953, 74.76094055175781, 77.58364868164062]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 5.0, 7.0, 9.0, 9.0, 14.0, 11.0, 10.0, 17.0, 18.0, 29.0, 22.0, 24.0, 28.0, 38.0, 33.0, 45.0, 41.0, 62.0, 65.0, 55.0, 62.0, 50.0, 37.0, 45.0, 35.0, 30.0, 31.0, 17.0, 17.0, 24.0, 15.0, 20.0, 7.0, 12.0, 9.0, 6.0, 6.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-4.01171875, -3.9049072265625, -3.798095703125, -3.6912841796875, -3.58447265625, -3.4776611328125, -3.370849609375, -3.2640380859375, -3.1572265625, -3.0504150390625, -2.943603515625, -2.8367919921875, -2.72998046875, -2.6231689453125, -2.516357421875, -2.4095458984375, -2.302734375, -2.1959228515625, -2.089111328125, -1.9822998046875, -1.87548828125, -1.7686767578125, -1.661865234375, -1.5550537109375, -1.4482421875, -1.3414306640625, -1.234619140625, -1.1278076171875, -1.02099609375, -0.9141845703125, -0.807373046875, -0.7005615234375, -0.59375, -0.4869384765625, -0.380126953125, -0.2733154296875, -0.16650390625, -0.0596923828125, 0.047119140625, 0.1539306640625, 0.2607421875, 0.3675537109375, 0.474365234375, 0.5811767578125, 0.68798828125, 0.7947998046875, 0.901611328125, 1.0084228515625, 1.115234375, 1.2220458984375, 1.328857421875, 1.4356689453125, 1.54248046875, 1.6492919921875, 1.756103515625, 1.8629150390625, 1.9697265625, 2.0765380859375, 2.183349609375, 2.2901611328125, 2.39697265625, 2.5037841796875, 2.610595703125, 2.7174072265625, 2.82421875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 5.0, 5.0, 9.0, 7.0, 21.0, 17.0, 31.0, 25.0, 43.0, 47.0, 79.0, 80.0, 117.0, 204.0, 272.0, 393.0, 616.0, 1065.0, 1927.0, 3802.0, 8734.0, 22726.0, 90580.0, 3263722.0, 728831.0, 45439.0, 14006.0, 5592.0, 2468.0, 1351.0, 716.0, 447.0, 294.0, 176.0, 110.0, 92.0, 62.0, 40.0, 29.0, 31.0, 18.0, 11.0, 14.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0], "bins": [-23.59375, -22.969482421875, -22.34521484375, -21.720947265625, -21.0966796875, -20.472412109375, -19.84814453125, -19.223876953125, -18.599609375, -17.975341796875, -17.35107421875, -16.726806640625, -16.1025390625, -15.478271484375, -14.85400390625, -14.229736328125, -13.60546875, -12.981201171875, -12.35693359375, -11.732666015625, -11.1083984375, -10.484130859375, -9.85986328125, -9.235595703125, -8.611328125, -7.987060546875, -7.36279296875, -6.738525390625, -6.1142578125, -5.489990234375, -4.86572265625, -4.241455078125, -3.6171875, -2.992919921875, -2.36865234375, -1.744384765625, -1.1201171875, -0.495849609375, 0.12841796875, 0.752685546875, 1.376953125, 2.001220703125, 2.62548828125, 3.249755859375, 3.8740234375, 4.498291015625, 5.12255859375, 5.746826171875, 6.37109375, 6.995361328125, 7.61962890625, 8.243896484375, 8.8681640625, 9.492431640625, 10.11669921875, 10.740966796875, 11.365234375, 11.989501953125, 12.61376953125, 13.238037109375, 13.8623046875, 14.486572265625, 15.11083984375, 15.735107421875, 16.359375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 12.0, 3.0, 11.0, 10.0, 10.0, 7.0, 26.0, 22.0, 48.0, 56.0, 68.0, 119.0, 185.0, 340.0, 615.0, 920.0, 646.0, 327.0, 211.0, 116.0, 98.0, 67.0, 46.0, 27.0, 28.0, 18.0, 15.0, 10.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.640625, -15.1103515625, -14.580078125, -14.0498046875, -13.51953125, -12.9892578125, -12.458984375, -11.9287109375, -11.3984375, -10.8681640625, -10.337890625, -9.8076171875, -9.27734375, -8.7470703125, -8.216796875, -7.6865234375, -7.15625, -6.6259765625, -6.095703125, -5.5654296875, -5.03515625, -4.5048828125, -3.974609375, -3.4443359375, -2.9140625, -2.3837890625, -1.853515625, -1.3232421875, -0.79296875, -0.2626953125, 0.267578125, 0.7978515625, 1.328125, 1.8583984375, 2.388671875, 2.9189453125, 3.44921875, 3.9794921875, 4.509765625, 5.0400390625, 5.5703125, 6.1005859375, 6.630859375, 7.1611328125, 7.69140625, 8.2216796875, 8.751953125, 9.2822265625, 9.8125, 10.3427734375, 10.873046875, 11.4033203125, 11.93359375, 12.4638671875, 12.994140625, 13.5244140625, 14.0546875, 14.5849609375, 15.115234375, 15.6455078125, 16.17578125, 16.7060546875, 17.236328125, 17.7666015625, 18.296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 7.0, 14.0, 14.0, 20.0, 20.0, 30.0, 28.0, 46.0, 75.0, 104.0, 175.0, 263.0, 450.0, 1315.0, 5967.0, 56379.0, 3534433.0, 566313.0, 23347.0, 3269.0, 905.0, 376.0, 242.0, 145.0, 90.0, 70.0, 48.0, 41.0, 29.0, 26.0, 7.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.90625, -45.33349609375, -43.7607421875, -42.18798828125, -40.615234375, -39.04248046875, -37.4697265625, -35.89697265625, -34.32421875, -32.75146484375, -31.1787109375, -29.60595703125, -28.033203125, -26.46044921875, -24.8876953125, -23.31494140625, -21.7421875, -20.16943359375, -18.5966796875, -17.02392578125, -15.451171875, -13.87841796875, -12.3056640625, -10.73291015625, -9.16015625, -7.58740234375, -6.0146484375, -4.44189453125, -2.869140625, -1.29638671875, 0.2763671875, 1.84912109375, 3.421875, 4.99462890625, 6.5673828125, 8.14013671875, 9.712890625, 11.28564453125, 12.8583984375, 14.43115234375, 16.00390625, 17.57666015625, 19.1494140625, 20.72216796875, 22.294921875, 23.86767578125, 25.4404296875, 27.01318359375, 28.5859375, 30.15869140625, 31.7314453125, 33.30419921875, 34.876953125, 36.44970703125, 38.0224609375, 39.59521484375, 41.16796875, 42.74072265625, 44.3134765625, 45.88623046875, 47.458984375, 49.03173828125, 50.6044921875, 52.17724609375, 53.75]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 9.0, 21.0, 104.0, 483.0, 332.0, 53.0, 13.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.2529296875, -266.1778869628906, -260.10284423828125, -254.02780151367188, -247.9527587890625, -241.87771606445312, -235.80267333984375, -229.72763061523438, -223.652587890625, -217.57754516601562, -211.50250244140625, -205.42745971679688, -199.3524169921875, -193.27737426757812, -187.20233154296875, -181.12728881835938, -175.05223083496094, -168.97718811035156, -162.9021453857422, -156.8271026611328, -150.75205993652344, -144.67701721191406, -138.60195922851562, -132.52691650390625, -126.4518814086914, -120.37683868408203, -114.30179595947266, -108.22674560546875, -102.15170288085938, -96.07666015625, -90.00161743164062, -83.92657470703125, -77.85153198242188, -71.7764892578125, -65.70144653320312, -59.626399993896484, -53.55135726928711, -47.476314544677734, -41.401268005371094, -35.32622528076172, -29.251182556152344, -23.17613983154297, -17.10109519958496, -11.026050567626953, -4.951007843017578, 1.1240348815917969, 7.1990814208984375, 13.274124145507812, 19.349166870117188, 25.424209594726562, 31.49925422668457, 37.57429885864258, 43.64934158325195, 49.72438430786133, 55.79943084716797, 61.874473571777344, 67.94951629638672, 74.0245590209961, 80.09960174560547, 86.17465209960938, 92.24969482421875, 98.32473754882812, 104.3997802734375, 110.47482299804688, 116.54986572265625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 2.0, 9.0, 9.0, 14.0, 15.0, 16.0, 13.0, 29.0, 26.0, 23.0, 25.0, 31.0, 28.0, 37.0, 28.0, 40.0, 34.0, 44.0, 59.0, 58.0, 45.0, 36.0, 36.0, 42.0, 28.0, 40.0, 28.0, 32.0, 34.0, 22.0, 19.0, 21.0, 12.0, 11.0, 13.0, 8.0, 3.0, 9.0, 4.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-48.5851936340332, -47.16765213012695, -45.7501106262207, -44.33256912231445, -42.9150276184082, -41.49748611450195, -40.0799446105957, -38.66240310668945, -37.2448616027832, -35.82732009887695, -34.4097785949707, -32.99223709106445, -31.574695587158203, -30.157154083251953, -28.739612579345703, -27.322071075439453, -25.904531478881836, -24.486989974975586, -23.069448471069336, -21.651906967163086, -20.234365463256836, -18.816823959350586, -17.39928436279297, -15.981741905212402, -14.564200401306152, -13.146658897399902, -11.729117393493652, -10.311576843261719, -8.894035339355469, -7.4764933586120605, -6.058952331542969, -4.641410827636719, -3.2238693237304688, -1.8063279390335083, -0.38878655433654785, 1.028754711151123, 2.446296215057373, 3.863837718963623, 5.281378746032715, 6.698920249938965, 8.116461753845215, 9.534003257751465, 10.951544761657715, 12.369085311889648, 13.786626815795898, 15.204168319702148, 16.6217098236084, 18.03925132751465, 19.4567928314209, 20.87433433532715, 22.2918758392334, 23.70941734313965, 25.1269588470459, 26.54450035095215, 27.962039947509766, 29.379581451416016, 30.797122955322266, 32.214664459228516, 33.632205963134766, 35.049747467041016, 36.467288970947266, 37.884830474853516, 39.302371978759766, 40.719913482666016, 42.137454986572266]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 9.0, 3.0, 9.0, 7.0, 9.0, 12.0, 14.0, 11.0, 22.0, 23.0, 23.0, 35.0, 31.0, 48.0, 41.0, 66.0, 49.0, 41.0, 44.0, 60.0, 57.0, 50.0, 49.0, 45.0, 33.0, 33.0, 37.0, 21.0, 27.0, 12.0, 14.0, 12.0, 10.0, 9.0, 10.0, 2.0, 4.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.3046875, -4.186553955078125, -4.06842041015625, -3.950286865234375, -3.8321533203125, -3.714019775390625, -3.59588623046875, -3.477752685546875, -3.359619140625, -3.241485595703125, -3.12335205078125, -3.005218505859375, -2.8870849609375, -2.768951416015625, -2.65081787109375, -2.532684326171875, -2.41455078125, -2.296417236328125, -2.17828369140625, -2.060150146484375, -1.9420166015625, -1.823883056640625, -1.70574951171875, -1.587615966796875, -1.469482421875, -1.351348876953125, -1.23321533203125, -1.115081787109375, -0.9969482421875, -0.878814697265625, -0.76068115234375, -0.642547607421875, -0.5244140625, -0.406280517578125, -0.28814697265625, -0.170013427734375, -0.0518798828125, 0.066253662109375, 0.18438720703125, 0.302520751953125, 0.420654296875, 0.538787841796875, 0.65692138671875, 0.775054931640625, 0.8931884765625, 1.011322021484375, 1.12945556640625, 1.247589111328125, 1.36572265625, 1.483856201171875, 1.60198974609375, 1.720123291015625, 1.8382568359375, 1.956390380859375, 2.07452392578125, 2.192657470703125, 2.310791015625, 2.428924560546875, 2.54705810546875, 2.665191650390625, 2.7833251953125, 2.901458740234375, 3.01959228515625, 3.137725830078125, 3.255859375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 7.0, 10.0, 16.0, 26.0, 28.0, 48.0, 75.0, 117.0, 157.0, 211.0, 338.0, 458.0, 631.0, 960.0, 1513.0, 2313.0, 3592.0, 5436.0, 8635.0, 14289.0, 24015.0, 43710.0, 85741.0, 185679.0, 324605.0, 168142.0, 78243.0, 39973.0, 22379.0, 13286.0, 8343.0, 5485.0, 3345.0, 2240.0, 1490.0, 998.0, 623.0, 455.0, 277.0, 205.0, 145.0, 86.0, 60.0, 53.0, 46.0, 18.0, 15.0, 9.0, 6.0, 2.0, 7.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.1474609375, -0.1430511474609375, -0.138641357421875, -0.1342315673828125, -0.12982177734375, -0.1254119873046875, -0.121002197265625, -0.1165924072265625, -0.1121826171875, -0.1077728271484375, -0.103363037109375, -0.0989532470703125, -0.09454345703125, -0.0901336669921875, -0.085723876953125, -0.0813140869140625, -0.076904296875, -0.0724945068359375, -0.068084716796875, -0.0636749267578125, -0.05926513671875, -0.0548553466796875, -0.050445556640625, -0.0460357666015625, -0.0416259765625, -0.0372161865234375, -0.032806396484375, -0.0283966064453125, -0.02398681640625, -0.0195770263671875, -0.015167236328125, -0.0107574462890625, -0.00634765625, -0.0019378662109375, 0.002471923828125, 0.0068817138671875, 0.01129150390625, 0.0157012939453125, 0.020111083984375, 0.0245208740234375, 0.0289306640625, 0.0333404541015625, 0.037750244140625, 0.0421600341796875, 0.04656982421875, 0.0509796142578125, 0.055389404296875, 0.0597991943359375, 0.064208984375, 0.0686187744140625, 0.073028564453125, 0.0774383544921875, 0.08184814453125, 0.0862579345703125, 0.090667724609375, 0.0950775146484375, 0.0994873046875, 0.1038970947265625, 0.108306884765625, 0.1127166748046875, 0.11712646484375, 0.1215362548828125, 0.125946044921875, 0.1303558349609375, 0.134765625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 5.0, 6.0, 13.0, 10.0, 12.0, 18.0, 14.0, 27.0, 39.0, 30.0, 42.0, 22.0, 36.0, 43.0, 41.0, 39.0, 36.0, 43.0, 1076.0, 50.0, 41.0, 44.0, 38.0, 33.0, 30.0, 30.0, 26.0, 26.0, 19.0, 17.0, 15.0, 21.0, 15.0, 7.0, 11.0, 10.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.138702392578125, -2.06842041015625, -1.998138427734375, -1.9278564453125, -1.857574462890625, -1.78729248046875, -1.717010498046875, -1.646728515625, -1.576446533203125, -1.50616455078125, -1.435882568359375, -1.3656005859375, -1.295318603515625, -1.22503662109375, -1.154754638671875, -1.08447265625, -1.014190673828125, -0.94390869140625, -0.873626708984375, -0.8033447265625, -0.733062744140625, -0.66278076171875, -0.592498779296875, -0.522216796875, -0.451934814453125, -0.38165283203125, -0.311370849609375, -0.2410888671875, -0.170806884765625, -0.10052490234375, -0.030242919921875, 0.0400390625, 0.110321044921875, 0.18060302734375, 0.250885009765625, 0.3211669921875, 0.391448974609375, 0.46173095703125, 0.532012939453125, 0.602294921875, 0.672576904296875, 0.74285888671875, 0.813140869140625, 0.8834228515625, 0.953704833984375, 1.02398681640625, 1.094268798828125, 1.16455078125, 1.234832763671875, 1.30511474609375, 1.375396728515625, 1.4456787109375, 1.515960693359375, 1.58624267578125, 1.656524658203125, 1.726806640625, 1.797088623046875, 1.86737060546875, 1.937652587890625, 2.0079345703125, 2.078216552734375, 2.14849853515625, 2.218780517578125, 2.2890625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 9.0, 12.0, 13.0, 20.0, 24.0, 24.0, 48.0, 57.0, 87.0, 138.0, 193.0, 277.0, 402.0, 574.0, 799.0, 1236.0, 1902.0, 2943.0, 4486.0, 7195.0, 11760.0, 19573.0, 33257.0, 57766.0, 104129.0, 199266.0, 1318704.0, 143786.0, 77899.0, 44167.0, 25558.0, 15186.0, 9211.0, 5821.0, 3682.0, 2255.0, 1528.0, 998.0, 668.0, 453.0, 311.0, 221.0, 152.0, 106.0, 63.0, 49.0, 45.0, 22.0, 23.0, 11.0, 4.0, 12.0, 2.0, 6.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.1075439453125, -0.10420989990234375, -0.1008758544921875, -0.09754180908203125, -0.094207763671875, -0.09087371826171875, -0.0875396728515625, -0.08420562744140625, -0.08087158203125, -0.07753753662109375, -0.0742034912109375, -0.07086944580078125, -0.067535400390625, -0.06420135498046875, -0.0608673095703125, -0.05753326416015625, -0.05419921875, -0.05086517333984375, -0.0475311279296875, -0.04419708251953125, -0.040863037109375, -0.03752899169921875, -0.0341949462890625, -0.03086090087890625, -0.02752685546875, -0.02419281005859375, -0.0208587646484375, -0.01752471923828125, -0.014190673828125, -0.01085662841796875, -0.0075225830078125, -0.00418853759765625, -0.0008544921875, 0.00247955322265625, 0.0058135986328125, 0.00914764404296875, 0.012481689453125, 0.01581573486328125, 0.0191497802734375, 0.02248382568359375, 0.02581787109375, 0.02915191650390625, 0.0324859619140625, 0.03582000732421875, 0.039154052734375, 0.04248809814453125, 0.0458221435546875, 0.04915618896484375, 0.052490234375, 0.05582427978515625, 0.0591583251953125, 0.06249237060546875, 0.065826416015625, 0.06916046142578125, 0.0724945068359375, 0.07582855224609375, 0.07916259765625, 0.08249664306640625, 0.0858306884765625, 0.08916473388671875, 0.092498779296875, 0.09583282470703125, 0.0991668701171875, 0.10250091552734375, 0.1058349609375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 6.0, 4.0, 12.0, 7.0, 8.0, 11.0, 18.0, 35.0, 38.0, 53.0, 63.0, 75.0, 98.0, 124.0, 99.0, 87.0, 48.0, 46.0, 33.0, 28.0, 26.0, 17.0, 21.0, 10.0, 11.0, 6.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013017654418945312, -0.00012670084834098816, -0.0001232251524925232, -0.00011974945664405823, -0.00011627376079559326, -0.0001127980649471283, -0.00010932236909866333, -0.00010584667325019836, -0.0001023709774017334, -9.889528155326843e-05, -9.541958570480347e-05, -9.19438898563385e-05, -8.846819400787354e-05, -8.499249815940857e-05, -8.15168023109436e-05, -7.804110646247864e-05, -7.456541061401367e-05, -7.10897147655487e-05, -6.761401891708374e-05, -6.413832306861877e-05, -6.066262722015381e-05, -5.718693137168884e-05, -5.371123552322388e-05, -5.023553967475891e-05, -4.6759843826293945e-05, -4.328414797782898e-05, -3.9808452129364014e-05, -3.633275628089905e-05, -3.285706043243408e-05, -2.9381364583969116e-05, -2.590566873550415e-05, -2.2429972887039185e-05, -1.895427703857422e-05, -1.5478581190109253e-05, -1.2002885341644287e-05, -8.527189493179321e-06, -5.0514936447143555e-06, -1.5757977962493896e-06, 1.8998980522155762e-06, 5.375593900680542e-06, 8.851289749145508e-06, 1.2326985597610474e-05, 1.580268144607544e-05, 1.9278377294540405e-05, 2.275407314300537e-05, 2.6229768991470337e-05, 2.9705464839935303e-05, 3.318116068840027e-05, 3.6656856536865234e-05, 4.01325523853302e-05, 4.3608248233795166e-05, 4.708394408226013e-05, 5.05596399307251e-05, 5.4035335779190063e-05, 5.751103162765503e-05, 6.0986727476119995e-05, 6.446242332458496e-05, 6.793811917304993e-05, 7.141381502151489e-05, 7.488951086997986e-05, 7.836520671844482e-05, 8.184090256690979e-05, 8.531659841537476e-05, 8.879229426383972e-05, 9.226799011230469e-05]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 10.0, 8.0, 9.0, 22.0, 20.0, 24.0, 31.0, 47.0, 92.0, 120.0, 156.0, 275.0, 441.0, 3745.0, 1025156.0, 16854.0, 594.0, 293.0, 187.0, 123.0, 83.0, 62.0, 50.0, 41.0, 32.0, 17.0, 13.0, 10.0, 9.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022945404052734375, -0.002228289842605591, -0.002162039279937744, -0.0020957887172698975, -0.0020295381546020508, -0.001963287591934204, -0.0018970370292663574, -0.0018307864665985107, -0.001764535903930664, -0.0016982853412628174, -0.0016320347785949707, -0.001565784215927124, -0.0014995336532592773, -0.0014332830905914307, -0.001367032527923584, -0.0013007819652557373, -0.0012345314025878906, -0.001168280839920044, -0.0011020302772521973, -0.0010357797145843506, -0.0009695291519165039, -0.0009032785892486572, -0.0008370280265808105, -0.0007707774639129639, -0.0007045269012451172, -0.0006382763385772705, -0.0005720257759094238, -0.0005057752132415771, -0.00043952465057373047, -0.0003732740879058838, -0.0003070235252380371, -0.00024077296257019043, -0.00017452239990234375, -0.00010827183723449707, -4.202127456665039e-05, 2.422928810119629e-05, 9.047985076904297e-05, 0.00015673041343688965, 0.00022298097610473633, 0.000289231538772583, 0.0003554821014404297, 0.00042173266410827637, 0.00048798322677612305, 0.0005542337894439697, 0.0006204843521118164, 0.0006867349147796631, 0.0007529854774475098, 0.0008192360401153564, 0.0008854866027832031, 0.0009517371654510498, 0.0010179877281188965, 0.0010842382907867432, 0.0011504888534545898, 0.0012167394161224365, 0.0012829899787902832, 0.0013492405414581299, 0.0014154911041259766, 0.0014817416667938232, 0.00154799222946167, 0.0016142427921295166, 0.0016804933547973633, 0.00174674391746521, 0.0018129944801330566, 0.0018792450428009033, 0.00194549560546875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 48.0, 523.0, 425.0, 22.0], "bins": [-0.0006569771212525666, -0.0006463686586357653, -0.000635760254226625, -0.0006251517916098237, -0.0006145433289930224, -0.0006039348663762212, -0.0005933264037594199, -0.0005827179993502796, -0.0005721095367334783, -0.000561501074116677, -0.0005508926697075367, -0.0005402842070907354, -0.0005296757444739342, -0.0005190672818571329, -0.0005084588192403316, -0.0004978504148311913, -0.00048724195221439004, -0.0004766334895975888, -0.00046602505608461797, -0.00045541662257164717, -0.0004448081599548459, -0.00043419969733804464, -0.00042359126382507384, -0.00041298283031210303, -0.00040237436769530177, -0.0003917659050785005, -0.0003811574715655297, -0.0003705490380525589, -0.00035994057543575764, -0.0003493321128189564, -0.00033872367930598557, -0.00032811524579301476, -0.00031750675407238305, -0.00030689832055941224, -0.000296289857942611, -0.0002856813953258097, -0.0002750729618128389, -0.0002644645282998681, -0.00025385606568306684, -0.0002432476176181808, -0.00023263916955329478, -0.00022203072148840874, -0.0002114222734235227, -0.00020081382535863668, -0.00019020537729375064, -0.0001795969292288646, -0.00016898848116397858, -0.00015838003309909254, -0.0001477715850342065, -0.00013716313696932048, -0.00012655468890443444, -0.00011594624083954841, -0.00010533779277466238, -9.472934470977634e-05, -8.412089664489031e-05, -7.351244858000427e-05, -6.290400051511824e-05, -5.229555245023221e-05, -4.1687104385346174e-05, -3.107865632046014e-05, -2.0470208255574107e-05, -9.861760190688074e-06, 7.466878741979599e-07, 1.1355135939083993e-05, 2.1963582184980623e-05]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 3.0, 8.0, 3.0, 6.0, 3.0, 9.0, 14.0, 14.0, 11.0, 11.0, 11.0, 23.0, 18.0, 36.0, 27.0, 29.0, 22.0, 35.0, 42.0, 28.0, 40.0, 45.0, 40.0, 46.0, 49.0, 40.0, 42.0, 32.0, 39.0, 35.0, 26.0, 28.0, 24.0, 34.0, 18.0, 20.0, 13.0, 16.0, 14.0, 11.0, 10.0, 3.0, 5.0, 11.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.910064697265625e-05, -3.782566636800766e-05, -3.655068576335907e-05, -3.527570515871048e-05, -3.400072455406189e-05, -3.27257439494133e-05, -3.145076334476471e-05, -3.017578274011612e-05, -2.890080213546753e-05, -2.762582153081894e-05, -2.635084092617035e-05, -2.507586032152176e-05, -2.380087971687317e-05, -2.252589911222458e-05, -2.125091850757599e-05, -1.99759379029274e-05, -1.870095729827881e-05, -1.742597669363022e-05, -1.615099608898163e-05, -1.4876015484333038e-05, -1.3601034879684448e-05, -1.2326054275035858e-05, -1.1051073670387268e-05, -9.776093065738678e-06, -8.501112461090088e-06, -7.226131856441498e-06, -5.951151251792908e-06, -4.676170647144318e-06, -3.4011900424957275e-06, -2.1262094378471375e-06, -8.512288331985474e-07, 4.237517714500427e-07, 1.6987323760986328e-06, 2.973712980747223e-06, 4.248693585395813e-06, 5.523674190044403e-06, 6.798654794692993e-06, 8.073635399341583e-06, 9.348616003990173e-06, 1.0623596608638763e-05, 1.1898577213287354e-05, 1.3173557817935944e-05, 1.4448538422584534e-05, 1.5723519027233124e-05, 1.6998499631881714e-05, 1.8273480236530304e-05, 1.9548460841178894e-05, 2.0823441445827484e-05, 2.2098422050476074e-05, 2.3373402655124664e-05, 2.4648383259773254e-05, 2.5923363864421844e-05, 2.7198344469070435e-05, 2.8473325073719025e-05, 2.9748305678367615e-05, 3.1023286283016205e-05, 3.2298266887664795e-05, 3.3573247492313385e-05, 3.4848228096961975e-05, 3.6123208701610565e-05, 3.7398189306259155e-05, 3.8673169910907745e-05, 3.9948150515556335e-05, 4.1223131120204926e-05, 4.2498111724853516e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 9.0, 3.0, 9.0, 7.0, 9.0, 12.0, 14.0, 11.0, 22.0, 23.0, 23.0, 35.0, 31.0, 48.0, 41.0, 66.0, 49.0, 41.0, 44.0, 60.0, 57.0, 50.0, 49.0, 45.0, 33.0, 33.0, 37.0, 21.0, 27.0, 12.0, 14.0, 12.0, 10.0, 9.0, 10.0, 2.0, 4.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.3046875, -4.186553955078125, -4.06842041015625, -3.950286865234375, -3.8321533203125, -3.714019775390625, -3.59588623046875, -3.477752685546875, -3.359619140625, -3.241485595703125, -3.12335205078125, -3.005218505859375, -2.8870849609375, -2.768951416015625, -2.65081787109375, -2.532684326171875, -2.41455078125, -2.296417236328125, -2.17828369140625, -2.060150146484375, -1.9420166015625, -1.823883056640625, -1.70574951171875, -1.587615966796875, -1.469482421875, -1.351348876953125, -1.23321533203125, -1.115081787109375, -0.9969482421875, -0.878814697265625, -0.76068115234375, -0.642547607421875, -0.5244140625, -0.406280517578125, -0.28814697265625, -0.170013427734375, -0.0518798828125, 0.066253662109375, 0.18438720703125, 0.302520751953125, 0.420654296875, 0.538787841796875, 0.65692138671875, 0.775054931640625, 0.8931884765625, 1.011322021484375, 1.12945556640625, 1.247589111328125, 1.36572265625, 1.483856201171875, 1.60198974609375, 1.720123291015625, 1.8382568359375, 1.956390380859375, 2.07452392578125, 2.192657470703125, 2.310791015625, 2.428924560546875, 2.54705810546875, 2.665191650390625, 2.7833251953125, 2.901458740234375, 3.01959228515625, 3.137725830078125, 3.255859375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 8.0, 14.0, 19.0, 29.0, 27.0, 40.0, 80.0, 77.0, 107.0, 149.0, 215.0, 282.0, 418.0, 654.0, 918.0, 1387.0, 2292.0, 3716.0, 6622.0, 13633.0, 34254.0, 136741.0, 618647.0, 158254.0, 37408.0, 14608.0, 6999.0, 3900.0, 2311.0, 1540.0, 975.0, 677.0, 424.0, 324.0, 209.0, 182.0, 116.0, 91.0, 52.0, 43.0, 33.0, 23.0, 10.0, 9.0, 14.0, 2.0, 4.0, 3.0, 0.0, 1.0, 4.0], "bins": [-11.921875, -11.58642578125, -11.2509765625, -10.91552734375, -10.580078125, -10.24462890625, -9.9091796875, -9.57373046875, -9.23828125, -8.90283203125, -8.5673828125, -8.23193359375, -7.896484375, -7.56103515625, -7.2255859375, -6.89013671875, -6.5546875, -6.21923828125, -5.8837890625, -5.54833984375, -5.212890625, -4.87744140625, -4.5419921875, -4.20654296875, -3.87109375, -3.53564453125, -3.2001953125, -2.86474609375, -2.529296875, -2.19384765625, -1.8583984375, -1.52294921875, -1.1875, -0.85205078125, -0.5166015625, -0.18115234375, 0.154296875, 0.48974609375, 0.8251953125, 1.16064453125, 1.49609375, 1.83154296875, 2.1669921875, 2.50244140625, 2.837890625, 3.17333984375, 3.5087890625, 3.84423828125, 4.1796875, 4.51513671875, 4.8505859375, 5.18603515625, 5.521484375, 5.85693359375, 6.1923828125, 6.52783203125, 6.86328125, 7.19873046875, 7.5341796875, 7.86962890625, 8.205078125, 8.54052734375, 8.8759765625, 9.21142578125, 9.546875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 9.0, 6.0, 17.0, 12.0, 13.0, 12.0, 22.0, 24.0, 28.0, 46.0, 33.0, 48.0, 47.0, 64.0, 77.0, 182.0, 1654.0, 262.0, 88.0, 60.0, 49.0, 36.0, 33.0, 32.0, 28.0, 38.0, 18.0, 17.0, 21.0, 18.0, 9.0, 13.0, 6.0, 5.0, 8.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.40625, -13.9903564453125, -13.574462890625, -13.1585693359375, -12.74267578125, -12.3267822265625, -11.910888671875, -11.4949951171875, -11.0791015625, -10.6632080078125, -10.247314453125, -9.8314208984375, -9.41552734375, -8.9996337890625, -8.583740234375, -8.1678466796875, -7.751953125, -7.3360595703125, -6.920166015625, -6.5042724609375, -6.08837890625, -5.6724853515625, -5.256591796875, -4.8406982421875, -4.4248046875, -4.0089111328125, -3.593017578125, -3.1771240234375, -2.76123046875, -2.3453369140625, -1.929443359375, -1.5135498046875, -1.09765625, -0.6817626953125, -0.265869140625, 0.1500244140625, 0.56591796875, 0.9818115234375, 1.397705078125, 1.8135986328125, 2.2294921875, 2.6453857421875, 3.061279296875, 3.4771728515625, 3.89306640625, 4.3089599609375, 4.724853515625, 5.1407470703125, 5.556640625, 5.9725341796875, 6.388427734375, 6.8043212890625, 7.22021484375, 7.6361083984375, 8.052001953125, 8.4678955078125, 8.8837890625, 9.2996826171875, 9.715576171875, 10.1314697265625, 10.54736328125, 10.9632568359375, 11.379150390625, 11.7950439453125, 12.2109375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 8.0, 5.0, 4.0, 3.0, 9.0, 11.0, 15.0, 19.0, 13.0, 19.0, 25.0, 37.0, 37.0, 38.0, 72.0, 127.0, 288.0, 1237.0, 212086.0, 2928476.0, 2353.0, 353.0, 162.0, 72.0, 43.0, 38.0, 40.0, 24.0, 19.0, 13.0, 8.0, 14.0, 10.0, 14.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.1875, -55.2236328125, -53.259765625, -51.2958984375, -49.33203125, -47.3681640625, -45.404296875, -43.4404296875, -41.4765625, -39.5126953125, -37.548828125, -35.5849609375, -33.62109375, -31.6572265625, -29.693359375, -27.7294921875, -25.765625, -23.8017578125, -21.837890625, -19.8740234375, -17.91015625, -15.9462890625, -13.982421875, -12.0185546875, -10.0546875, -8.0908203125, -6.126953125, -4.1630859375, -2.19921875, -0.2353515625, 1.728515625, 3.6923828125, 5.65625, 7.6201171875, 9.583984375, 11.5478515625, 13.51171875, 15.4755859375, 17.439453125, 19.4033203125, 21.3671875, 23.3310546875, 25.294921875, 27.2587890625, 29.22265625, 31.1865234375, 33.150390625, 35.1142578125, 37.078125, 39.0419921875, 41.005859375, 42.9697265625, 44.93359375, 46.8974609375, 48.861328125, 50.8251953125, 52.7890625, 54.7529296875, 56.716796875, 58.6806640625, 60.64453125, 62.6083984375, 64.572265625, 66.5361328125, 68.5]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 539.0, 477.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.96717834472656, -116.40142059326172, -101.83566284179688, -87.26991271972656, -72.70415496826172, -58.138397216796875, -43.57264709472656, -29.00688934326172, -14.441131591796875, 0.12462425231933594, 14.690380096435547, 29.256134033203125, 43.82189178466797, 58.38764953613281, 72.95339965820312, 87.51915740966797, 102.08491516113281, 116.65067291259766, 131.2164306640625, 145.7821807861328, 160.34793090820312, 174.9136962890625, 189.4794464111328, 204.04519653320312, 218.6109619140625, 233.1767120361328, 247.7424774169922, 262.3082275390625, 276.8739929199219, 291.43975830078125, 306.0054931640625, 320.5712585449219, 335.13702392578125, 349.7027893066406, 364.2685241699219, 378.83428955078125, 393.4000549316406, 407.9658203125, 422.53155517578125, 437.0973205566406, 451.6630859375, 466.2288513183594, 480.7945861816406, 495.3603515625, 509.9261169433594, 524.4918823242188, 539.0576171875, 553.6233520507812, 568.1890869140625, 582.7548217773438, 597.3206176757812, 611.8863525390625, 626.4520874023438, 641.0178833007812, 655.5836181640625, 670.1493530273438, 684.7151489257812, 699.2808837890625, 713.8466796875, 728.4124145507812, 742.9781494140625, 757.5439453125, 772.1096801757812, 786.6754150390625, 801.2412109375]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 5.0, 7.0, 7.0, 4.0, 9.0, 13.0, 13.0, 14.0, 20.0, 21.0, 39.0, 25.0, 30.0, 35.0, 32.0, 46.0, 45.0, 54.0, 51.0, 31.0, 47.0, 55.0, 42.0, 52.0, 42.0, 43.0, 34.0, 29.0, 32.0, 20.0, 21.0, 15.0, 15.0, 6.0, 7.0, 5.0, 8.0, 10.0, 9.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-48.69575119018555, -47.21363830566406, -45.73152542114258, -44.249412536621094, -42.76729965209961, -41.285186767578125, -39.803077697753906, -38.320960998535156, -36.83885192871094, -35.35673904418945, -33.87462615966797, -32.392513275146484, -30.910400390625, -29.428287506103516, -27.946176528930664, -26.46406364440918, -24.981948852539062, -23.499835968017578, -22.017723083496094, -20.53561019897461, -19.053497314453125, -17.57138442993164, -16.08927345275879, -14.607160568237305, -13.12504768371582, -11.642934799194336, -10.160821914672852, -8.678709983825684, -7.196597099304199, -5.714484214782715, -4.232372283935547, -2.7502593994140625, -1.2681465148925781, 0.21396613121032715, 1.6960787773132324, 3.1781911849975586, 4.660304069519043, 6.142416954040527, 7.624528884887695, 9.10664176940918, 10.588754653930664, 12.070867538452148, 13.552980422973633, 15.0350923538208, 16.51720428466797, 17.999317169189453, 19.481430053710938, 20.963542938232422, 22.445655822753906, 23.92776870727539, 25.409881591796875, 26.89199447631836, 28.374107360839844, 29.856220245361328, 31.33833122253418, 32.82044219970703, 34.30255889892578, 35.784671783447266, 37.26678466796875, 38.748897552490234, 40.23101043701172, 41.7131233215332, 43.19523620605469, 44.677345275878906, 46.15945816040039]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 1.0, 3.0, 6.0, 5.0, 9.0, 5.0, 8.0, 14.0, 11.0, 18.0, 21.0, 19.0, 24.0, 37.0, 25.0, 32.0, 53.0, 50.0, 48.0, 53.0, 63.0, 63.0, 55.0, 49.0, 45.0, 34.0, 34.0, 50.0, 26.0, 32.0, 19.0, 17.0, 14.0, 11.0, 17.0, 9.0, 5.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.59765625, -4.468719482421875, -4.33978271484375, -4.210845947265625, -4.0819091796875, -3.952972412109375, -3.82403564453125, -3.695098876953125, -3.566162109375, -3.437225341796875, -3.30828857421875, -3.179351806640625, -3.0504150390625, -2.921478271484375, -2.79254150390625, -2.663604736328125, -2.53466796875, -2.405731201171875, -2.27679443359375, -2.147857666015625, -2.0189208984375, -1.889984130859375, -1.76104736328125, -1.632110595703125, -1.503173828125, -1.374237060546875, -1.24530029296875, -1.116363525390625, -0.9874267578125, -0.858489990234375, -0.72955322265625, -0.600616455078125, -0.4716796875, -0.342742919921875, -0.21380615234375, -0.084869384765625, 0.0440673828125, 0.173004150390625, 0.30194091796875, 0.430877685546875, 0.559814453125, 0.688751220703125, 0.81768798828125, 0.946624755859375, 1.0755615234375, 1.204498291015625, 1.33343505859375, 1.462371826171875, 1.59130859375, 1.720245361328125, 1.84918212890625, 1.978118896484375, 2.1070556640625, 2.235992431640625, 2.36492919921875, 2.493865966796875, 2.622802734375, 2.751739501953125, 2.88067626953125, 3.009613037109375, 3.1385498046875, 3.267486572265625, 3.39642333984375, 3.525360107421875, 3.654296875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 4.0, 5.0, 8.0, 8.0, 7.0, 15.0, 14.0, 18.0, 20.0, 26.0, 34.0, 54.0, 82.0, 114.0, 199.0, 377.0, 945.0, 2514.0, 7476.0, 26079.0, 200900.0, 3825511.0, 103737.0, 17968.0, 5043.0, 1739.0, 616.0, 281.0, 149.0, 77.0, 73.0, 36.0, 26.0, 26.0, 22.0, 19.0, 16.0, 9.0, 8.0, 10.0, 4.0, 3.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-29.46875, -28.658935546875, -27.84912109375, -27.039306640625, -26.2294921875, -25.419677734375, -24.60986328125, -23.800048828125, -22.990234375, -22.180419921875, -21.37060546875, -20.560791015625, -19.7509765625, -18.941162109375, -18.13134765625, -17.321533203125, -16.51171875, -15.701904296875, -14.89208984375, -14.082275390625, -13.2724609375, -12.462646484375, -11.65283203125, -10.843017578125, -10.033203125, -9.223388671875, -8.41357421875, -7.603759765625, -6.7939453125, -5.984130859375, -5.17431640625, -4.364501953125, -3.5546875, -2.744873046875, -1.93505859375, -1.125244140625, -0.3154296875, 0.494384765625, 1.30419921875, 2.114013671875, 2.923828125, 3.733642578125, 4.54345703125, 5.353271484375, 6.1630859375, 6.972900390625, 7.78271484375, 8.592529296875, 9.40234375, 10.212158203125, 11.02197265625, 11.831787109375, 12.6416015625, 13.451416015625, 14.26123046875, 15.071044921875, 15.880859375, 16.690673828125, 17.50048828125, 18.310302734375, 19.1201171875, 19.929931640625, 20.73974609375, 21.549560546875, 22.359375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 3.0, 10.0, 9.0, 4.0, 5.0, 7.0, 7.0, 6.0, 10.0, 17.0, 28.0, 23.0, 36.0, 44.0, 69.0, 92.0, 138.0, 222.0, 394.0, 616.0, 734.0, 566.0, 326.0, 191.0, 125.0, 103.0, 70.0, 57.0, 34.0, 31.0, 21.0, 15.0, 21.0, 7.0, 7.0, 7.0, 5.0, 2.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.2421875, -9.867919921875, -9.49365234375, -9.119384765625, -8.7451171875, -8.370849609375, -7.99658203125, -7.622314453125, -7.248046875, -6.873779296875, -6.49951171875, -6.125244140625, -5.7509765625, -5.376708984375, -5.00244140625, -4.628173828125, -4.25390625, -3.879638671875, -3.50537109375, -3.131103515625, -2.7568359375, -2.382568359375, -2.00830078125, -1.634033203125, -1.259765625, -0.885498046875, -0.51123046875, -0.136962890625, 0.2373046875, 0.611572265625, 0.98583984375, 1.360107421875, 1.734375, 2.108642578125, 2.48291015625, 2.857177734375, 3.2314453125, 3.605712890625, 3.97998046875, 4.354248046875, 4.728515625, 5.102783203125, 5.47705078125, 5.851318359375, 6.2255859375, 6.599853515625, 6.97412109375, 7.348388671875, 7.72265625, 8.096923828125, 8.47119140625, 8.845458984375, 9.2197265625, 9.593994140625, 9.96826171875, 10.342529296875, 10.716796875, 11.091064453125, 11.46533203125, 11.839599609375, 12.2138671875, 12.588134765625, 12.96240234375, 13.336669921875, 13.7109375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 10.0, 11.0, 19.0, 28.0, 51.0, 98.0, 114.0, 203.0, 363.0, 619.0, 1092.0, 1837.0, 3491.0, 6557.0, 12726.0, 28120.0, 68520.0, 247204.0, 2781544.0, 839604.0, 120062.0, 43419.0, 18980.0, 9255.0, 4580.0, 2482.0, 1387.0, 761.0, 429.0, 264.0, 161.0, 100.0, 59.0, 39.0, 29.0, 19.0, 11.0, 15.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-20.84375, -20.2607421875, -19.677734375, -19.0947265625, -18.51171875, -17.9287109375, -17.345703125, -16.7626953125, -16.1796875, -15.5966796875, -15.013671875, -14.4306640625, -13.84765625, -13.2646484375, -12.681640625, -12.0986328125, -11.515625, -10.9326171875, -10.349609375, -9.7666015625, -9.18359375, -8.6005859375, -8.017578125, -7.4345703125, -6.8515625, -6.2685546875, -5.685546875, -5.1025390625, -4.51953125, -3.9365234375, -3.353515625, -2.7705078125, -2.1875, -1.6044921875, -1.021484375, -0.4384765625, 0.14453125, 0.7275390625, 1.310546875, 1.8935546875, 2.4765625, 3.0595703125, 3.642578125, 4.2255859375, 4.80859375, 5.3916015625, 5.974609375, 6.5576171875, 7.140625, 7.7236328125, 8.306640625, 8.8896484375, 9.47265625, 10.0556640625, 10.638671875, 11.2216796875, 11.8046875, 12.3876953125, 12.970703125, 13.5537109375, 14.13671875, 14.7197265625, 15.302734375, 15.8857421875, 16.46875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 14.0, 18.0, 41.0, 66.0, 125.0, 194.0, 217.0, 129.0, 89.0, 40.0, 32.0, 14.0, 10.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.10537338256836, -45.595149993896484, -43.084922790527344, -40.57469940185547, -38.064476013183594, -35.55425262451172, -33.044029235839844, -30.533802032470703, -28.023578643798828, -25.513355255126953, -23.003129959106445, -20.492904663085938, -17.982681274414062, -15.472456932067871, -12.96223258972168, -10.452007293701172, -7.941783905029297, -5.4315595626831055, -2.921335220336914, -0.41111087799072266, 2.0991134643554688, 4.60933780670166, 7.119562149047852, 9.62978744506836, 12.140010833740234, 14.650235176086426, 17.160459518432617, 19.670684814453125, 22.180908203125, 24.691131591796875, 27.201356887817383, 29.71158218383789, 32.2218017578125, 34.732025146484375, 37.24224853515625, 39.75247573852539, 42.262699127197266, 44.77292251586914, 47.28314971923828, 49.793373107910156, 52.30359649658203, 54.813819885253906, 57.32404327392578, 59.83427047729492, 62.3444938659668, 64.85472106933594, 67.36494445800781, 69.87516784667969, 72.38539123535156, 74.89561462402344, 77.40583801269531, 79.91606140136719, 82.42628479003906, 84.93651580810547, 87.44673919677734, 89.95696258544922, 92.4671859741211, 94.97740936279297, 97.48763275146484, 99.99785614013672, 102.50808715820312, 105.018310546875, 107.52853393554688, 110.03875732421875, 112.54898071289062]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 1.0, 0.0, 3.0, 6.0, 17.0, 15.0, 9.0, 14.0, 20.0, 20.0, 22.0, 20.0, 28.0, 41.0, 31.0, 46.0, 41.0, 51.0, 40.0, 35.0, 43.0, 44.0, 51.0, 40.0, 44.0, 40.0, 28.0, 33.0, 40.0, 34.0, 18.0, 22.0, 13.0, 18.0, 9.0, 11.0, 10.0, 12.0, 8.0, 10.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-41.330196380615234, -40.10775375366211, -38.885311126708984, -37.662872314453125, -36.4404296875, -35.217987060546875, -33.99554443359375, -32.773101806640625, -31.550662994384766, -30.32822036743164, -29.10577964782715, -27.883337020874023, -26.66089630126953, -25.438453674316406, -24.21601104736328, -22.99357032775879, -21.771127700805664, -20.54868507385254, -19.326244354248047, -18.103801727294922, -16.88136100769043, -15.658918380737305, -14.436476707458496, -13.214035034179688, -11.991593360900879, -10.76915168762207, -9.546710014343262, -8.324268341064453, -7.101826190948486, -5.879384517669678, -4.656942367553711, -3.4345006942749023, -2.2120590209960938, -0.9896172285079956, 0.23282456398010254, 1.4552664756774902, 2.677708148956299, 3.9001498222351074, 5.122591972351074, 6.345033645629883, 7.567475318908691, 8.7899169921875, 10.012358665466309, 11.234800338745117, 12.457242965698242, 13.679683685302734, 14.90212631225586, 16.124568939208984, 17.347009658813477, 18.5694522857666, 19.791893005371094, 21.01433563232422, 22.23677635192871, 23.459218978881836, 24.681659698486328, 25.904102325439453, 27.126544952392578, 28.348987579345703, 29.571428298950195, 30.79387092590332, 32.01631164550781, 33.23875427246094, 34.46119689941406, 35.68363952636719, 36.90607833862305]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 6.0, 4.0, 4.0, 3.0, 8.0, 7.0, 10.0, 12.0, 5.0, 12.0, 13.0, 25.0, 25.0, 22.0, 36.0, 24.0, 36.0, 39.0, 51.0, 52.0, 54.0, 55.0, 60.0, 49.0, 51.0, 41.0, 48.0, 25.0, 29.0, 37.0, 32.0, 18.0, 19.0, 24.0, 16.0, 8.0, 6.0, 10.0, 7.0, 3.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.3828125, -4.256591796875, -4.13037109375, -4.004150390625, -3.8779296875, -3.751708984375, -3.62548828125, -3.499267578125, -3.373046875, -3.246826171875, -3.12060546875, -2.994384765625, -2.8681640625, -2.741943359375, -2.61572265625, -2.489501953125, -2.36328125, -2.237060546875, -2.11083984375, -1.984619140625, -1.8583984375, -1.732177734375, -1.60595703125, -1.479736328125, -1.353515625, -1.227294921875, -1.10107421875, -0.974853515625, -0.8486328125, -0.722412109375, -0.59619140625, -0.469970703125, -0.34375, -0.217529296875, -0.09130859375, 0.034912109375, 0.1611328125, 0.287353515625, 0.41357421875, 0.539794921875, 0.666015625, 0.792236328125, 0.91845703125, 1.044677734375, 1.1708984375, 1.297119140625, 1.42333984375, 1.549560546875, 1.67578125, 1.802001953125, 1.92822265625, 2.054443359375, 2.1806640625, 2.306884765625, 2.43310546875, 2.559326171875, 2.685546875, 2.811767578125, 2.93798828125, 3.064208984375, 3.1904296875, 3.316650390625, 3.44287109375, 3.569091796875, 3.6953125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 4.0, 7.0, 9.0, 19.0, 28.0, 34.0, 55.0, 74.0, 142.0, 213.0, 350.0, 507.0, 849.0, 1396.0, 2232.0, 3630.0, 6306.0, 11016.0, 20172.0, 38288.0, 78422.0, 186648.0, 365671.0, 175243.0, 74694.0, 36938.0, 19336.0, 10781.0, 5998.0, 3625.0, 2222.0, 1319.0, 874.0, 486.0, 356.0, 212.0, 138.0, 90.0, 52.0, 42.0, 30.0, 15.0, 14.0, 8.0, 10.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1624755859375, -0.156768798828125, -0.15106201171875, -0.145355224609375, -0.1396484375, -0.133941650390625, -0.12823486328125, -0.122528076171875, -0.1168212890625, -0.111114501953125, -0.10540771484375, -0.099700927734375, -0.093994140625, -0.088287353515625, -0.08258056640625, -0.076873779296875, -0.0711669921875, -0.065460205078125, -0.05975341796875, -0.054046630859375, -0.04833984375, -0.042633056640625, -0.03692626953125, -0.031219482421875, -0.0255126953125, -0.019805908203125, -0.01409912109375, -0.008392333984375, -0.002685546875, 0.003021240234375, 0.00872802734375, 0.014434814453125, 0.0201416015625, 0.025848388671875, 0.03155517578125, 0.037261962890625, 0.04296875, 0.048675537109375, 0.05438232421875, 0.060089111328125, 0.0657958984375, 0.071502685546875, 0.07720947265625, 0.082916259765625, 0.088623046875, 0.094329833984375, 0.10003662109375, 0.105743408203125, 0.1114501953125, 0.117156982421875, 0.12286376953125, 0.128570556640625, 0.13427734375, 0.139984130859375, 0.14569091796875, 0.151397705078125, 0.1571044921875, 0.162811279296875, 0.16851806640625, 0.174224853515625, 0.179931640625, 0.185638427734375, 0.19134521484375, 0.197052001953125, 0.2027587890625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 9.0, 7.0, 10.0, 7.0, 9.0, 9.0, 11.0, 14.0, 12.0, 16.0, 16.0, 20.0, 25.0, 23.0, 21.0, 37.0, 29.0, 37.0, 42.0, 36.0, 44.0, 38.0, 1068.0, 45.0, 32.0, 37.0, 37.0, 36.0, 27.0, 32.0, 33.0, 31.0, 24.0, 25.0, 20.0, 22.0, 19.0, 13.0, 10.0, 5.0, 8.0, 8.0, 6.0, 4.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.453125, -2.379608154296875, -2.30609130859375, -2.232574462890625, -2.1590576171875, -2.085540771484375, -2.01202392578125, -1.938507080078125, -1.864990234375, -1.791473388671875, -1.71795654296875, -1.644439697265625, -1.5709228515625, -1.497406005859375, -1.42388916015625, -1.350372314453125, -1.27685546875, -1.203338623046875, -1.12982177734375, -1.056304931640625, -0.9827880859375, -0.909271240234375, -0.83575439453125, -0.762237548828125, -0.688720703125, -0.615203857421875, -0.54168701171875, -0.468170166015625, -0.3946533203125, -0.321136474609375, -0.24761962890625, -0.174102783203125, -0.1005859375, -0.027069091796875, 0.04644775390625, 0.119964599609375, 0.1934814453125, 0.266998291015625, 0.34051513671875, 0.414031982421875, 0.487548828125, 0.561065673828125, 0.63458251953125, 0.708099365234375, 0.7816162109375, 0.855133056640625, 0.92864990234375, 1.002166748046875, 1.07568359375, 1.149200439453125, 1.22271728515625, 1.296234130859375, 1.3697509765625, 1.443267822265625, 1.51678466796875, 1.590301513671875, 1.663818359375, 1.737335205078125, 1.81085205078125, 1.884368896484375, 1.9578857421875, 2.031402587890625, 2.10491943359375, 2.178436279296875, 2.251953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 5.0, 10.0, 10.0, 12.0, 25.0, 28.0, 48.0, 84.0, 134.0, 180.0, 238.0, 345.0, 437.0, 696.0, 913.0, 1352.0, 1932.0, 2729.0, 4008.0, 5728.0, 8496.0, 12834.0, 19305.0, 29671.0, 46513.0, 74744.0, 122451.0, 1254527.0, 194284.0, 115861.0, 70317.0, 43686.0, 28407.0, 18543.0, 12137.0, 8203.0, 5563.0, 3742.0, 2735.0, 1803.0, 1316.0, 938.0, 641.0, 478.0, 317.0, 222.0, 146.0, 113.0, 84.0, 53.0, 29.0, 22.0, 19.0, 13.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.10076904296875, -0.09761428833007812, -0.09445953369140625, -0.09130477905273438, -0.0881500244140625, -0.08499526977539062, -0.08184051513671875, -0.07868576049804688, -0.075531005859375, -0.07237625122070312, -0.06922149658203125, -0.06606674194335938, -0.0629119873046875, -0.059757232666015625, -0.05660247802734375, -0.053447723388671875, -0.05029296875, -0.047138214111328125, -0.04398345947265625, -0.040828704833984375, -0.0376739501953125, -0.034519195556640625, -0.03136444091796875, -0.028209686279296875, -0.025054931640625, -0.021900177001953125, -0.01874542236328125, -0.015590667724609375, -0.0124359130859375, -0.009281158447265625, -0.00612640380859375, -0.002971649169921875, 0.00018310546875, 0.003337860107421875, 0.00649261474609375, 0.009647369384765625, 0.0128021240234375, 0.015956878662109375, 0.01911163330078125, 0.022266387939453125, 0.025421142578125, 0.028575897216796875, 0.03173065185546875, 0.034885406494140625, 0.0380401611328125, 0.041194915771484375, 0.04434967041015625, 0.047504425048828125, 0.0506591796875, 0.053813934326171875, 0.05696868896484375, 0.060123443603515625, 0.0632781982421875, 0.06643295288085938, 0.06958770751953125, 0.07274246215820312, 0.075897216796875, 0.07905197143554688, 0.08220672607421875, 0.08536148071289062, 0.0885162353515625, 0.09167098999023438, 0.09482574462890625, 0.09798049926757812, 0.10113525390625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 9.0, 20.0, 12.0, 27.0, 30.0, 37.0, 55.0, 57.0, 69.0, 90.0, 91.0, 101.0, 91.0, 79.0, 48.0, 38.0, 31.0, 17.0, 18.0, 11.0, 16.0, 10.0, 6.0, 11.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011271238327026367, -0.00010924879461526871, -0.00010578520596027374, -0.00010232161730527878, -9.885802865028381e-05, -9.539443999528885e-05, -9.193085134029388e-05, -8.846726268529892e-05, -8.500367403030396e-05, -8.154008537530899e-05, -7.807649672031403e-05, -7.461290806531906e-05, -7.11493194103241e-05, -6.768573075532913e-05, -6.422214210033417e-05, -6.07585534453392e-05, -5.729496479034424e-05, -5.3831376135349274e-05, -5.036778748035431e-05, -4.6904198825359344e-05, -4.344061017036438e-05, -3.9977021515369415e-05, -3.651343286037445e-05, -3.3049844205379486e-05, -2.958625555038452e-05, -2.6122666895389557e-05, -2.2659078240394592e-05, -1.9195489585399628e-05, -1.5731900930404663e-05, -1.2268312275409698e-05, -8.804723620414734e-06, -5.341134965419769e-06, -1.8775463104248047e-06, 1.58604234457016e-06, 5.0496309995651245e-06, 8.513219654560089e-06, 1.1976808309555054e-05, 1.544039696455002e-05, 1.8903985619544983e-05, 2.2367574274539948e-05, 2.5831162929534912e-05, 2.9294751584529877e-05, 3.275834023952484e-05, 3.6221928894519806e-05, 3.968551754951477e-05, 4.3149106204509735e-05, 4.66126948595047e-05, 5.0076283514499664e-05, 5.353987216949463e-05, 5.7003460824489594e-05, 6.046704947948456e-05, 6.393063813447952e-05, 6.739422678947449e-05, 7.085781544446945e-05, 7.432140409946442e-05, 7.778499275445938e-05, 8.124858140945435e-05, 8.471217006444931e-05, 8.817575871944427e-05, 9.163934737443924e-05, 9.51029360294342e-05, 9.856652468442917e-05, 0.00010203011333942413, 0.0001054937019944191, 0.00010895729064941406]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 10.0, 5.0, 13.0, 10.0, 16.0, 24.0, 27.0, 30.0, 40.0, 58.0, 92.0, 124.0, 207.0, 456.0, 1816.0, 15602.0, 949518.0, 75321.0, 3650.0, 733.0, 257.0, 149.0, 110.0, 70.0, 44.0, 49.0, 29.0, 24.0, 13.0, 13.0, 11.0, 6.0, 7.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0015802383422851562, -0.0015303939580917358, -0.0014805495738983154, -0.001430705189704895, -0.0013808608055114746, -0.0013310164213180542, -0.0012811720371246338, -0.0012313276529312134, -0.001181483268737793, -0.0011316388845443726, -0.0010817945003509521, -0.0010319501161575317, -0.0009821057319641113, -0.0009322613477706909, -0.0008824169635772705, -0.0008325725793838501, -0.0007827281951904297, -0.0007328838109970093, -0.0006830394268035889, -0.0006331950426101685, -0.000583350658416748, -0.0005335062742233276, -0.0004836618900299072, -0.0004338175058364868, -0.0003839731216430664, -0.000334128737449646, -0.0002842843532562256, -0.00023443996906280518, -0.00018459558486938477, -0.00013475120067596436, -8.490681648254395e-05, -3.5062432289123535e-05, 1.4781951904296875e-05, 6.462633609771729e-05, 0.0001144707202911377, 0.0001643151044845581, 0.00021415948867797852, 0.0002640038728713989, 0.00031384825706481934, 0.00036369264125823975, 0.00041353702545166016, 0.00046338140964508057, 0.000513225793838501, 0.0005630701780319214, 0.0006129145622253418, 0.0006627589464187622, 0.0007126033306121826, 0.000762447714805603, 0.0008122920989990234, 0.0008621364831924438, 0.0009119808673858643, 0.0009618252515792847, 0.001011669635772705, 0.0010615140199661255, 0.001111358404159546, 0.0011612027883529663, 0.0012110471725463867, 0.0012608915567398071, 0.0013107359409332275, 0.001360580325126648, 0.0014104247093200684, 0.0014602690935134888, 0.0015101134777069092, 0.0015599578619003296, 0.00160980224609375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 24.0, 47.0, 221.0, 456.0, 199.0, 52.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002675997093319893, -0.00025982767692767084, -0.00025205567362718284, -0.0002442836412228644, -0.0002365116379223764, -0.00022873962006997317, -0.00022096760221756995, -0.0002131955698132515, -0.0002054235665127635, -0.00019765154866036028, -0.00018987953080795705, -0.00018210751295555383, -0.0001743354951031506, -0.00016656347725074738, -0.00015879145939834416, -0.0001510194269940257, -0.00014324740914162248, -0.00013547539128921926, -0.00012770337343681604, -0.00011993135558441281, -0.00011215933773200959, -0.00010438731987960637, -9.661529475124553e-05, -8.88432768988423e-05, -8.107125904643908e-05, -7.329924119403586e-05, -6.552722334163263e-05, -5.7755201851250604e-05, -4.998318399884738e-05, -4.221116614644416e-05, -3.4439144656062126e-05, -2.6667126803658903e-05, -1.8895123503170907e-05, -1.1123104741272982e-05, -3.351085979375057e-06, 4.42093369201757e-06, 1.2192951544420794e-05, 1.9964969396824017e-05, 2.7736990887206048e-05, 3.550900873960927e-05, 4.3281026592012495e-05, 5.105304444441572e-05, 5.882506229681894e-05, 6.659708742517978e-05, 7.4369105277583e-05, 8.214112312998623e-05, 8.991314098238945e-05, 9.768515883479267e-05, 0.0001054571766871959, 0.00011322919453959912, 0.00012100121239200234, 0.00012877323024440557, 0.0001365452480968088, 0.00014431726594921201, 0.00015208928380161524, 0.0001598613162059337, 0.00016763331950642169, 0.0001754053373588249, 0.00018317735521122813, 0.00019094937306363136, 0.00019872139091603458, 0.0002064934087684378, 0.00021426542662084103, 0.00022203745902515948, 0.0002298094768775627]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 4.0, 11.0, 11.0, 12.0, 12.0, 13.0, 16.0, 15.0, 21.0, 23.0, 23.0, 30.0, 29.0, 32.0, 35.0, 33.0, 36.0, 48.0, 23.0, 47.0, 39.0, 38.0, 30.0, 32.0, 46.0, 38.0, 41.0, 37.0, 30.0, 30.0, 15.0, 25.0, 12.0, 25.0, 8.0, 16.0, 13.0, 5.0, 6.0, 7.0, 7.0, 6.0, 8.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.100799560546875e-05, -3.972742706537247e-05, -3.8446858525276184e-05, -3.71662899851799e-05, -3.588572144508362e-05, -3.4605152904987335e-05, -3.332458436489105e-05, -3.204401582479477e-05, -3.0763447284698486e-05, -2.9482878744602203e-05, -2.820231020450592e-05, -2.6921741664409637e-05, -2.5641173124313354e-05, -2.436060458421707e-05, -2.308003604412079e-05, -2.1799467504024506e-05, -2.0518898963928223e-05, -1.923833042383194e-05, -1.7957761883735657e-05, -1.6677193343639374e-05, -1.539662480354309e-05, -1.4116056263446808e-05, -1.2835487723350525e-05, -1.1554919183254242e-05, -1.0274350643157959e-05, -8.993782103061676e-06, -7.713213562965393e-06, -6.43264502286911e-06, -5.152076482772827e-06, -3.871507942676544e-06, -2.5909394025802612e-06, -1.3103708624839783e-06, -2.9802322387695312e-08, 1.2507662177085876e-06, 2.5313347578048706e-06, 3.8119032979011536e-06, 5.0924718379974365e-06, 6.3730403780937195e-06, 7.653608918190002e-06, 8.934177458286285e-06, 1.0214745998382568e-05, 1.1495314538478851e-05, 1.2775883078575134e-05, 1.4056451618671417e-05, 1.53370201587677e-05, 1.6617588698863983e-05, 1.7898157238960266e-05, 1.917872577905655e-05, 2.0459294319152832e-05, 2.1739862859249115e-05, 2.3020431399345398e-05, 2.430099993944168e-05, 2.5581568479537964e-05, 2.6862137019634247e-05, 2.814270555973053e-05, 2.9423274099826813e-05, 3.0703842639923096e-05, 3.198441118001938e-05, 3.326497972011566e-05, 3.4545548260211945e-05, 3.582611680030823e-05, 3.710668534040451e-05, 3.8387253880500793e-05, 3.9667822420597076e-05, 4.094839096069336e-05]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 6.0, 4.0, 4.0, 3.0, 8.0, 7.0, 10.0, 12.0, 5.0, 12.0, 13.0, 25.0, 25.0, 22.0, 36.0, 24.0, 36.0, 39.0, 51.0, 52.0, 54.0, 55.0, 60.0, 49.0, 51.0, 41.0, 48.0, 25.0, 29.0, 37.0, 32.0, 18.0, 19.0, 24.0, 16.0, 8.0, 6.0, 10.0, 7.0, 3.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.3828125, -4.256591796875, -4.13037109375, -4.004150390625, -3.8779296875, -3.751708984375, -3.62548828125, -3.499267578125, -3.373046875, -3.246826171875, -3.12060546875, -2.994384765625, -2.8681640625, -2.741943359375, -2.61572265625, -2.489501953125, -2.36328125, -2.237060546875, -2.11083984375, -1.984619140625, -1.8583984375, -1.732177734375, -1.60595703125, -1.479736328125, -1.353515625, -1.227294921875, -1.10107421875, -0.974853515625, -0.8486328125, -0.722412109375, -0.59619140625, -0.469970703125, -0.34375, -0.217529296875, -0.09130859375, 0.034912109375, 0.1611328125, 0.287353515625, 0.41357421875, 0.539794921875, 0.666015625, 0.792236328125, 0.91845703125, 1.044677734375, 1.1708984375, 1.297119140625, 1.42333984375, 1.549560546875, 1.67578125, 1.802001953125, 1.92822265625, 2.054443359375, 2.1806640625, 2.306884765625, 2.43310546875, 2.559326171875, 2.685546875, 2.811767578125, 2.93798828125, 3.064208984375, 3.1904296875, 3.316650390625, 3.44287109375, 3.569091796875, 3.6953125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 4.0, 5.0, 4.0, 12.0, 13.0, 12.0, 28.0, 20.0, 34.0, 42.0, 61.0, 100.0, 115.0, 164.0, 268.0, 332.0, 534.0, 762.0, 1148.0, 1829.0, 3289.0, 7155.0, 31120.0, 458420.0, 493645.0, 33083.0, 7391.0, 3415.0, 1945.0, 1131.0, 783.0, 495.0, 348.0, 237.0, 185.0, 104.0, 79.0, 56.0, 46.0, 26.0, 27.0, 16.0, 22.0, 16.0, 9.0, 12.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.93359375, -7.67779541015625, -7.4219970703125, -7.16619873046875, -6.910400390625, -6.65460205078125, -6.3988037109375, -6.14300537109375, -5.88720703125, -5.63140869140625, -5.3756103515625, -5.11981201171875, -4.864013671875, -4.60821533203125, -4.3524169921875, -4.09661865234375, -3.8408203125, -3.58502197265625, -3.3292236328125, -3.07342529296875, -2.817626953125, -2.56182861328125, -2.3060302734375, -2.05023193359375, -1.79443359375, -1.53863525390625, -1.2828369140625, -1.02703857421875, -0.771240234375, -0.51544189453125, -0.2596435546875, -0.00384521484375, 0.251953125, 0.50775146484375, 0.7635498046875, 1.01934814453125, 1.275146484375, 1.53094482421875, 1.7867431640625, 2.04254150390625, 2.29833984375, 2.55413818359375, 2.8099365234375, 3.06573486328125, 3.321533203125, 3.57733154296875, 3.8331298828125, 4.08892822265625, 4.3447265625, 4.60052490234375, 4.8563232421875, 5.11212158203125, 5.367919921875, 5.62371826171875, 5.8795166015625, 6.13531494140625, 6.39111328125, 6.64691162109375, 6.9027099609375, 7.15850830078125, 7.414306640625, 7.67010498046875, 7.9259033203125, 8.18170166015625, 8.4375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 7.0, 5.0, 4.0, 9.0, 8.0, 10.0, 7.0, 18.0, 16.0, 15.0, 24.0, 26.0, 28.0, 26.0, 41.0, 39.0, 48.0, 43.0, 66.0, 94.0, 1776.0, 286.0, 61.0, 47.0, 51.0, 37.0, 24.0, 30.0, 30.0, 26.0, 22.0, 23.0, 23.0, 19.0, 16.0, 13.0, 7.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.078125, -15.58740234375, -15.0966796875, -14.60595703125, -14.115234375, -13.62451171875, -13.1337890625, -12.64306640625, -12.15234375, -11.66162109375, -11.1708984375, -10.68017578125, -10.189453125, -9.69873046875, -9.2080078125, -8.71728515625, -8.2265625, -7.73583984375, -7.2451171875, -6.75439453125, -6.263671875, -5.77294921875, -5.2822265625, -4.79150390625, -4.30078125, -3.81005859375, -3.3193359375, -2.82861328125, -2.337890625, -1.84716796875, -1.3564453125, -0.86572265625, -0.375, 0.11572265625, 0.6064453125, 1.09716796875, 1.587890625, 2.07861328125, 2.5693359375, 3.06005859375, 3.55078125, 4.04150390625, 4.5322265625, 5.02294921875, 5.513671875, 6.00439453125, 6.4951171875, 6.98583984375, 7.4765625, 7.96728515625, 8.4580078125, 8.94873046875, 9.439453125, 9.93017578125, 10.4208984375, 10.91162109375, 11.40234375, 11.89306640625, 12.3837890625, 12.87451171875, 13.365234375, 13.85595703125, 14.3466796875, 14.83740234375, 15.328125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 0.0, 2.0, 3.0, 5.0, 6.0, 5.0, 13.0, 6.0, 13.0, 23.0, 18.0, 24.0, 35.0, 37.0, 44.0, 59.0, 67.0, 132.0, 302.0, 1085.0, 4328.0, 56271.0, 3070332.0, 9604.0, 2109.0, 577.0, 181.0, 95.0, 72.0, 48.0, 46.0, 28.0, 27.0, 24.0, 17.0, 17.0, 5.0, 10.0, 6.0, 9.0, 5.0, 6.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.34375, -32.27685546875, -31.2099609375, -30.14306640625, -29.076171875, -28.00927734375, -26.9423828125, -25.87548828125, -24.80859375, -23.74169921875, -22.6748046875, -21.60791015625, -20.541015625, -19.47412109375, -18.4072265625, -17.34033203125, -16.2734375, -15.20654296875, -14.1396484375, -13.07275390625, -12.005859375, -10.93896484375, -9.8720703125, -8.80517578125, -7.73828125, -6.67138671875, -5.6044921875, -4.53759765625, -3.470703125, -2.40380859375, -1.3369140625, -0.27001953125, 0.796875, 1.86376953125, 2.9306640625, 3.99755859375, 5.064453125, 6.13134765625, 7.1982421875, 8.26513671875, 9.33203125, 10.39892578125, 11.4658203125, 12.53271484375, 13.599609375, 14.66650390625, 15.7333984375, 16.80029296875, 17.8671875, 18.93408203125, 20.0009765625, 21.06787109375, 22.134765625, 23.20166015625, 24.2685546875, 25.33544921875, 26.40234375, 27.46923828125, 28.5361328125, 29.60302734375, 30.669921875, 31.73681640625, 32.8037109375, 33.87060546875, 34.9375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 6.0, 489.0, 519.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.175048828125, -10.110292434692383, -5.045536041259766, 0.019220352172851562, 5.083976745605469, 10.148733139038086, 15.213489532470703, 20.278244018554688, 25.343002319335938, 30.407758712768555, 35.47251510620117, 40.537269592285156, 45.602027893066406, 50.666786193847656, 55.73154067993164, 60.796295166015625, 65.86105346679688, 70.92581176757812, 75.99057006835938, 81.0553207397461, 86.12007904052734, 91.1848373413086, 96.24958801269531, 101.31434631347656, 106.37910461425781, 111.44386291503906, 116.50862121582031, 121.57337188720703, 126.63813018798828, 131.702880859375, 136.76763916015625, 141.8323974609375, 146.89715576171875, 151.9619140625, 157.02667236328125, 162.0914306640625, 167.15618896484375, 172.22093200683594, 177.2856903076172, 182.35044860839844, 187.4152069091797, 192.47996520996094, 197.5447235107422, 202.60948181152344, 207.67422485351562, 212.73898315429688, 217.80374145507812, 222.86849975585938, 227.93325805664062, 232.99801635742188, 238.06277465820312, 243.12753295898438, 248.19229125976562, 253.2570343017578, 258.3218078613281, 263.38653564453125, 268.4512939453125, 273.51605224609375, 278.580810546875, 283.64556884765625, 288.7103271484375, 293.77508544921875, 298.83984375, 303.90460205078125, 308.9693603515625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 10.0, 8.0, 8.0, 7.0, 15.0, 13.0, 15.0, 13.0, 17.0, 21.0, 18.0, 21.0, 24.0, 17.0, 27.0, 27.0, 37.0, 33.0, 33.0, 34.0, 37.0, 37.0, 39.0, 47.0, 38.0, 49.0, 36.0, 43.0, 39.0, 29.0, 27.0, 29.0, 17.0, 19.0, 14.0, 19.0, 20.0, 16.0, 6.0, 11.0, 9.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-47.5921516418457, -46.260528564453125, -44.92890167236328, -43.59727478027344, -42.26565170288086, -40.93402862548828, -39.60240173339844, -38.270774841308594, -36.939151763916016, -35.60752868652344, -34.275901794433594, -32.94427490234375, -31.612651824951172, -30.28102684020996, -28.94940185546875, -27.61777687072754, -26.286151885986328, -24.954526901245117, -23.622901916503906, -22.291276931762695, -20.959651947021484, -19.628026962280273, -18.296401977539062, -16.96477699279785, -15.63315200805664, -14.30152702331543, -12.969902038574219, -11.638277053833008, -10.306652069091797, -8.975027084350586, -7.643402099609375, -6.311777114868164, -4.980155944824219, -3.648530960083008, -2.316905975341797, -0.9852809906005859, 0.346343994140625, 1.677968978881836, 3.009593963623047, 4.341218948364258, 5.672843933105469, 7.00446891784668, 8.33609390258789, 9.667718887329102, 10.999343872070312, 12.330968856811523, 13.662593841552734, 14.994218826293945, 16.325843811035156, 17.657468795776367, 18.989093780517578, 20.32071876525879, 21.65234375, 22.98396873474121, 24.315593719482422, 25.647218704223633, 26.978843688964844, 28.310468673706055, 29.642093658447266, 30.973718643188477, 32.30534362792969, 33.63697052001953, 34.96859359741211, 36.30021667480469, 37.63184356689453]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 7.0, 3.0, 8.0, 14.0, 8.0, 7.0, 10.0, 16.0, 23.0, 25.0, 20.0, 36.0, 28.0, 28.0, 48.0, 45.0, 59.0, 48.0, 53.0, 60.0, 54.0, 46.0, 43.0, 35.0, 37.0, 32.0, 28.0, 36.0, 27.0, 19.0, 22.0, 18.0, 6.0, 9.0, 9.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.56640625, -4.435455322265625, -4.30450439453125, -4.173553466796875, -4.0426025390625, -3.911651611328125, -3.78070068359375, -3.649749755859375, -3.518798828125, -3.387847900390625, -3.25689697265625, -3.125946044921875, -2.9949951171875, -2.864044189453125, -2.73309326171875, -2.602142333984375, -2.47119140625, -2.340240478515625, -2.20928955078125, -2.078338623046875, -1.9473876953125, -1.816436767578125, -1.68548583984375, -1.554534912109375, -1.423583984375, -1.292633056640625, -1.16168212890625, -1.030731201171875, -0.8997802734375, -0.768829345703125, -0.63787841796875, -0.506927490234375, -0.3759765625, -0.245025634765625, -0.11407470703125, 0.016876220703125, 0.1478271484375, 0.278778076171875, 0.40972900390625, 0.540679931640625, 0.671630859375, 0.802581787109375, 0.93353271484375, 1.064483642578125, 1.1954345703125, 1.326385498046875, 1.45733642578125, 1.588287353515625, 1.71923828125, 1.850189208984375, 1.98114013671875, 2.112091064453125, 2.2430419921875, 2.373992919921875, 2.50494384765625, 2.635894775390625, 2.766845703125, 2.897796630859375, 3.02874755859375, 3.159698486328125, 3.2906494140625, 3.421600341796875, 3.55255126953125, 3.683502197265625, 3.814453125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 3.0, 6.0, 10.0, 8.0, 16.0, 12.0, 22.0, 30.0, 56.0, 65.0, 86.0, 174.0, 273.0, 432.0, 810.0, 1479.0, 2947.0, 6022.0, 13750.0, 34379.0, 159989.0, 3333900.0, 553164.0, 52594.0, 18343.0, 7813.0, 3652.0, 1864.0, 990.0, 531.0, 320.0, 208.0, 124.0, 59.0, 46.0, 24.0, 21.0, 15.0, 12.0, 4.0, 4.0, 5.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.671875, -16.191162109375, -15.71044921875, -15.229736328125, -14.7490234375, -14.268310546875, -13.78759765625, -13.306884765625, -12.826171875, -12.345458984375, -11.86474609375, -11.384033203125, -10.9033203125, -10.422607421875, -9.94189453125, -9.461181640625, -8.98046875, -8.499755859375, -8.01904296875, -7.538330078125, -7.0576171875, -6.576904296875, -6.09619140625, -5.615478515625, -5.134765625, -4.654052734375, -4.17333984375, -3.692626953125, -3.2119140625, -2.731201171875, -2.25048828125, -1.769775390625, -1.2890625, -0.808349609375, -0.32763671875, 0.153076171875, 0.6337890625, 1.114501953125, 1.59521484375, 2.075927734375, 2.556640625, 3.037353515625, 3.51806640625, 3.998779296875, 4.4794921875, 4.960205078125, 5.44091796875, 5.921630859375, 6.40234375, 6.883056640625, 7.36376953125, 7.844482421875, 8.3251953125, 8.805908203125, 9.28662109375, 9.767333984375, 10.248046875, 10.728759765625, 11.20947265625, 11.690185546875, 12.1708984375, 12.651611328125, 13.13232421875, 13.613037109375, 14.09375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 5.0, 4.0, 7.0, 9.0, 11.0, 20.0, 13.0, 24.0, 44.0, 48.0, 79.0, 88.0, 130.0, 248.0, 514.0, 796.0, 840.0, 473.0, 224.0, 135.0, 99.0, 55.0, 49.0, 42.0, 34.0, 22.0, 14.0, 8.0, 8.0, 7.0, 6.0, 5.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.7890625, -14.341552734375, -13.89404296875, -13.446533203125, -12.9990234375, -12.551513671875, -12.10400390625, -11.656494140625, -11.208984375, -10.761474609375, -10.31396484375, -9.866455078125, -9.4189453125, -8.971435546875, -8.52392578125, -8.076416015625, -7.62890625, -7.181396484375, -6.73388671875, -6.286376953125, -5.8388671875, -5.391357421875, -4.94384765625, -4.496337890625, -4.048828125, -3.601318359375, -3.15380859375, -2.706298828125, -2.2587890625, -1.811279296875, -1.36376953125, -0.916259765625, -0.46875, -0.021240234375, 0.42626953125, 0.873779296875, 1.3212890625, 1.768798828125, 2.21630859375, 2.663818359375, 3.111328125, 3.558837890625, 4.00634765625, 4.453857421875, 4.9013671875, 5.348876953125, 5.79638671875, 6.243896484375, 6.69140625, 7.138916015625, 7.58642578125, 8.033935546875, 8.4814453125, 8.928955078125, 9.37646484375, 9.823974609375, 10.271484375, 10.718994140625, 11.16650390625, 11.614013671875, 12.0615234375, 12.509033203125, 12.95654296875, 13.404052734375, 13.8515625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 8.0, 8.0, 12.0, 19.0, 31.0, 52.0, 50.0, 92.0, 137.0, 191.0, 308.0, 434.0, 729.0, 1146.0, 1982.0, 3480.0, 6084.0, 11376.0, 22030.0, 45536.0, 114848.0, 672895.0, 2826327.0, 327185.0, 83237.0, 36220.0, 17938.0, 9334.0, 5062.0, 2923.0, 1704.0, 1026.0, 643.0, 432.0, 262.0, 182.0, 111.0, 78.0, 50.0, 38.0, 23.0, 21.0, 12.0, 8.0, 11.0, 0.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.71875, -16.201904296875, -15.68505859375, -15.168212890625, -14.6513671875, -14.134521484375, -13.61767578125, -13.100830078125, -12.583984375, -12.067138671875, -11.55029296875, -11.033447265625, -10.5166015625, -9.999755859375, -9.48291015625, -8.966064453125, -8.44921875, -7.932373046875, -7.41552734375, -6.898681640625, -6.3818359375, -5.864990234375, -5.34814453125, -4.831298828125, -4.314453125, -3.797607421875, -3.28076171875, -2.763916015625, -2.2470703125, -1.730224609375, -1.21337890625, -0.696533203125, -0.1796875, 0.337158203125, 0.85400390625, 1.370849609375, 1.8876953125, 2.404541015625, 2.92138671875, 3.438232421875, 3.955078125, 4.471923828125, 4.98876953125, 5.505615234375, 6.0224609375, 6.539306640625, 7.05615234375, 7.572998046875, 8.08984375, 8.606689453125, 9.12353515625, 9.640380859375, 10.1572265625, 10.674072265625, 11.19091796875, 11.707763671875, 12.224609375, 12.741455078125, 13.25830078125, 13.775146484375, 14.2919921875, 14.808837890625, 15.32568359375, 15.842529296875, 16.359375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 10.0, 11.0, 29.0, 45.0, 89.0, 160.0, 206.0, 180.0, 118.0, 71.0, 33.0, 23.0, 11.0, 12.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.14019012451172, -92.25006866455078, -89.35995483398438, -86.46983337402344, -83.5797119140625, -80.6895980834961, -77.79947662353516, -74.90936279296875, -72.01924133300781, -69.12911987304688, -66.23900604248047, -63.34888458251953, -60.45876693725586, -57.56864929199219, -54.67852783203125, -51.78841018676758, -48.898292541503906, -46.008174896240234, -43.11805725097656, -40.227935791015625, -37.33781814575195, -34.44770050048828, -31.557580947875977, -28.667461395263672, -25.77734375, -22.887226104736328, -19.997106552124023, -17.10698699951172, -14.216869354248047, -11.326750755310059, -8.43663215637207, -5.546512603759766, -2.656402587890625, 0.23371601104736328, 3.1238346099853516, 6.01395320892334, 8.904071807861328, 11.794190406799316, 14.684309005737305, 17.57442855834961, 20.46454620361328, 23.354663848876953, 26.244783401489258, 29.134902954101562, 32.025020599365234, 34.915138244628906, 37.805259704589844, 40.695377349853516, 43.58549499511719, 46.47561264038086, 49.36573028564453, 52.25585174560547, 55.14596939086914, 58.03608703613281, 60.92620849609375, 63.81632614135742, 66.7064437866211, 69.59656524658203, 72.48667907714844, 75.37680053710938, 78.26692199707031, 81.15703582763672, 84.04715728759766, 86.93727111816406, 89.827392578125]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 8.0, 0.0, 7.0, 12.0, 7.0, 2.0, 14.0, 11.0, 16.0, 17.0, 29.0, 27.0, 30.0, 30.0, 38.0, 34.0, 38.0, 30.0, 38.0, 44.0, 37.0, 53.0, 47.0, 44.0, 39.0, 36.0, 45.0, 33.0, 36.0, 33.0, 18.0, 26.0, 16.0, 21.0, 22.0, 15.0, 12.0, 9.0, 8.0, 4.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-41.89741134643555, -40.713348388671875, -39.5292854309082, -38.34522247314453, -37.161155700683594, -35.97709274291992, -34.79302978515625, -33.60896682739258, -32.424903869628906, -31.240840911865234, -30.056777954101562, -28.872713088989258, -27.688650131225586, -26.504587173461914, -25.32052230834961, -24.136459350585938, -22.952396392822266, -21.768333435058594, -20.584270477294922, -19.400205612182617, -18.216142654418945, -17.032079696655273, -15.848015785217285, -14.663951873779297, -13.479888916015625, -12.295825958251953, -11.111762046813965, -9.927698135375977, -8.743635177612305, -7.559571743011475, -6.3755083084106445, -5.191444396972656, -4.007377624511719, -2.8233141899108887, -1.6392507553100586, -0.4551873207092285, 0.7288761138916016, 1.9129395484924316, 3.0970029830932617, 4.28106689453125, 5.465129852294922, 6.649193286895752, 7.833256721496582, 9.01732063293457, 10.201383590698242, 11.385446548461914, 12.569510459899902, 13.75357437133789, 14.937637329101562, 16.121700286865234, 17.305763244628906, 18.48982810974121, 19.673891067504883, 20.857954025268555, 22.04201889038086, 23.22608184814453, 24.410144805908203, 25.594207763671875, 26.778270721435547, 27.96233558654785, 29.146398544311523, 30.330461502075195, 31.5145263671875, 32.69858932495117, 33.882652282714844]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 7.0, 6.0, 9.0, 10.0, 12.0, 12.0, 17.0, 19.0, 23.0, 33.0, 20.0, 33.0, 29.0, 44.0, 45.0, 42.0, 52.0, 58.0, 48.0, 46.0, 63.0, 47.0, 31.0, 43.0, 30.0, 30.0, 26.0, 23.0, 24.0, 21.0, 19.0, 13.0, 10.0, 10.0, 9.0, 3.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-4.74609375, -4.6146240234375, -4.483154296875, -4.3516845703125, -4.22021484375, -4.0887451171875, -3.957275390625, -3.8258056640625, -3.6943359375, -3.5628662109375, -3.431396484375, -3.2999267578125, -3.16845703125, -3.0369873046875, -2.905517578125, -2.7740478515625, -2.642578125, -2.5111083984375, -2.379638671875, -2.2481689453125, -2.11669921875, -1.9852294921875, -1.853759765625, -1.7222900390625, -1.5908203125, -1.4593505859375, -1.327880859375, -1.1964111328125, -1.06494140625, -0.9334716796875, -0.802001953125, -0.6705322265625, -0.5390625, -0.4075927734375, -0.276123046875, -0.1446533203125, -0.01318359375, 0.1182861328125, 0.249755859375, 0.3812255859375, 0.5126953125, 0.6441650390625, 0.775634765625, 0.9071044921875, 1.03857421875, 1.1700439453125, 1.301513671875, 1.4329833984375, 1.564453125, 1.6959228515625, 1.827392578125, 1.9588623046875, 2.09033203125, 2.2218017578125, 2.353271484375, 2.4847412109375, 2.6162109375, 2.7476806640625, 2.879150390625, 3.0106201171875, 3.14208984375, 3.2735595703125, 3.405029296875, 3.5364990234375, 3.66796875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 12.0, 6.0, 9.0, 19.0, 21.0, 36.0, 48.0, 88.0, 115.0, 181.0, 278.0, 426.0, 665.0, 1042.0, 1719.0, 2845.0, 4853.0, 8487.0, 14961.0, 28255.0, 56483.0, 122081.0, 284971.0, 280710.0, 120635.0, 55790.0, 28028.0, 15139.0, 8394.0, 4835.0, 2852.0, 1716.0, 1057.0, 640.0, 395.0, 260.0, 173.0, 120.0, 74.0, 47.0, 27.0, 26.0, 17.0, 9.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2103271484375, -0.20413970947265625, -0.1979522705078125, -0.19176483154296875, -0.185577392578125, -0.17938995361328125, -0.1732025146484375, -0.16701507568359375, -0.16082763671875, -0.15464019775390625, -0.1484527587890625, -0.14226531982421875, -0.136077880859375, -0.12989044189453125, -0.1237030029296875, -0.11751556396484375, -0.111328125, -0.10514068603515625, -0.0989532470703125, -0.09276580810546875, -0.086578369140625, -0.08039093017578125, -0.0742034912109375, -0.06801605224609375, -0.06182861328125, -0.05564117431640625, -0.0494537353515625, -0.04326629638671875, -0.037078857421875, -0.03089141845703125, -0.0247039794921875, -0.01851654052734375, -0.0123291015625, -0.00614166259765625, 4.57763671875e-05, 0.00623321533203125, 0.012420654296875, 0.01860809326171875, 0.0247955322265625, 0.03098297119140625, 0.03717041015625, 0.04335784912109375, 0.0495452880859375, 0.05573272705078125, 0.061920166015625, 0.06810760498046875, 0.0742950439453125, 0.08048248291015625, 0.086669921875, 0.09285736083984375, 0.0990447998046875, 0.10523223876953125, 0.111419677734375, 0.11760711669921875, 0.1237945556640625, 0.12998199462890625, 0.13616943359375, 0.14235687255859375, 0.1485443115234375, 0.15473175048828125, 0.160919189453125, 0.16710662841796875, 0.1732940673828125, 0.17948150634765625, 0.1856689453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 8.0, 17.0, 9.0, 11.0, 15.0, 11.0, 22.0, 27.0, 17.0, 26.0, 24.0, 24.0, 38.0, 30.0, 42.0, 49.0, 33.0, 35.0, 28.0, 1071.0, 30.0, 32.0, 31.0, 25.0, 33.0, 35.0, 29.0, 28.0, 29.0, 24.0, 19.0, 22.0, 22.0, 25.0, 18.0, 8.0, 20.0, 3.0, 9.0, 7.0, 5.0, 8.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.30859375, -2.230865478515625, -2.15313720703125, -2.075408935546875, -1.9976806640625, -1.919952392578125, -1.84222412109375, -1.764495849609375, -1.686767578125, -1.609039306640625, -1.53131103515625, -1.453582763671875, -1.3758544921875, -1.298126220703125, -1.22039794921875, -1.142669677734375, -1.06494140625, -0.987213134765625, -0.90948486328125, -0.831756591796875, -0.7540283203125, -0.676300048828125, -0.59857177734375, -0.520843505859375, -0.443115234375, -0.365386962890625, -0.28765869140625, -0.209930419921875, -0.1322021484375, -0.054473876953125, 0.02325439453125, 0.100982666015625, 0.1787109375, 0.256439208984375, 0.33416748046875, 0.411895751953125, 0.4896240234375, 0.567352294921875, 0.64508056640625, 0.722808837890625, 0.800537109375, 0.878265380859375, 0.95599365234375, 1.033721923828125, 1.1114501953125, 1.189178466796875, 1.26690673828125, 1.344635009765625, 1.42236328125, 1.500091552734375, 1.57781982421875, 1.655548095703125, 1.7332763671875, 1.811004638671875, 1.88873291015625, 1.966461181640625, 2.044189453125, 2.121917724609375, 2.19964599609375, 2.277374267578125, 2.3551025390625, 2.432830810546875, 2.51055908203125, 2.588287353515625, 2.666015625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 6.0, 6.0, 16.0, 19.0, 21.0, 27.0, 32.0, 54.0, 63.0, 78.0, 137.0, 191.0, 241.0, 377.0, 480.0, 692.0, 924.0, 1359.0, 2012.0, 2738.0, 3975.0, 5869.0, 8671.0, 12908.0, 19730.0, 30042.0, 46657.0, 72746.0, 115748.0, 193768.0, 1240412.0, 120654.0, 75301.0, 47728.0, 30886.0, 20275.0, 13407.0, 8949.0, 5957.0, 4244.0, 2898.0, 1949.0, 1368.0, 990.0, 734.0, 518.0, 347.0, 243.0, 200.0, 148.0, 106.0, 82.0, 50.0, 28.0, 29.0, 11.0, 16.0, 15.0, 5.0, 3.0, 2.0, 5.0], "bins": [-0.1065673828125, -0.103240966796875, -0.09991455078125, -0.096588134765625, -0.09326171875, -0.089935302734375, -0.08660888671875, -0.083282470703125, -0.0799560546875, -0.076629638671875, -0.07330322265625, -0.069976806640625, -0.066650390625, -0.063323974609375, -0.05999755859375, -0.056671142578125, -0.0533447265625, -0.050018310546875, -0.04669189453125, -0.043365478515625, -0.0400390625, -0.036712646484375, -0.03338623046875, -0.030059814453125, -0.0267333984375, -0.023406982421875, -0.02008056640625, -0.016754150390625, -0.013427734375, -0.010101318359375, -0.00677490234375, -0.003448486328125, -0.0001220703125, 0.003204345703125, 0.00653076171875, 0.009857177734375, 0.01318359375, 0.016510009765625, 0.01983642578125, 0.023162841796875, 0.0264892578125, 0.029815673828125, 0.03314208984375, 0.036468505859375, 0.039794921875, 0.043121337890625, 0.04644775390625, 0.049774169921875, 0.0531005859375, 0.056427001953125, 0.05975341796875, 0.063079833984375, 0.06640625, 0.069732666015625, 0.07305908203125, 0.076385498046875, 0.0797119140625, 0.083038330078125, 0.08636474609375, 0.089691162109375, 0.093017578125, 0.096343994140625, 0.09967041015625, 0.102996826171875, 0.1063232421875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 6.0, 3.0, 10.0, 9.0, 9.0, 15.0, 12.0, 19.0, 31.0, 31.0, 48.0, 60.0, 67.0, 90.0, 106.0, 110.0, 74.0, 72.0, 59.0, 46.0, 37.0, 26.0, 18.0, 11.0, 8.0, 6.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011920928955078125, -0.00011474266648292542, -0.00011027604341506958, -0.00010580942034721375, -0.00010134279727935791, -9.687617421150208e-05, -9.240955114364624e-05, -8.79429280757904e-05, -8.347630500793457e-05, -7.900968194007874e-05, -7.45430588722229e-05, -7.007643580436707e-05, -6.560981273651123e-05, -6.11431896686554e-05, -5.667656660079956e-05, -5.2209943532943726e-05, -4.774332046508789e-05, -4.3276697397232056e-05, -3.881007432937622e-05, -3.4343451261520386e-05, -2.987682819366455e-05, -2.5410205125808716e-05, -2.094358205795288e-05, -1.6476958990097046e-05, -1.2010335922241211e-05, -7.543712854385376e-06, -3.077089786529541e-06, 1.389533281326294e-06, 5.856156349182129e-06, 1.0322779417037964e-05, 1.4789402484893799e-05, 1.9256025552749634e-05, 2.372264862060547e-05, 2.8189271688461304e-05, 3.265589475631714e-05, 3.7122517824172974e-05, 4.158914089202881e-05, 4.6055763959884644e-05, 5.052238702774048e-05, 5.4989010095596313e-05, 5.945563316345215e-05, 6.392225623130798e-05, 6.838887929916382e-05, 7.285550236701965e-05, 7.732212543487549e-05, 8.178874850273132e-05, 8.625537157058716e-05, 9.072199463844299e-05, 9.518861770629883e-05, 9.965524077415466e-05, 0.0001041218638420105, 0.00010858848690986633, 0.00011305510997772217, 0.000117521733045578, 0.00012198835611343384, 0.00012645497918128967, 0.0001309216022491455, 0.00013538822531700134, 0.00013985484838485718, 0.000144321471452713, 0.00014878809452056885, 0.00015325471758842468, 0.00015772134065628052, 0.00016218796372413635, 0.0001666545867919922]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 0.0, 4.0, 5.0, 12.0, 10.0, 12.0, 8.0, 26.0, 39.0, 46.0, 73.0, 99.0, 139.0, 328.0, 1036.0, 5306.0, 53085.0, 891507.0, 87414.0, 7272.0, 1254.0, 361.0, 165.0, 113.0, 60.0, 57.0, 30.0, 22.0, 25.0, 20.0, 8.0, 6.0, 2.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0020046234130859375, -0.0019482821226119995, -0.0018919408321380615, -0.0018355995416641235, -0.0017792582511901855, -0.0017229169607162476, -0.0016665756702423096, -0.0016102343797683716, -0.0015538930892944336, -0.0014975517988204956, -0.0014412105083465576, -0.0013848692178726196, -0.0013285279273986816, -0.0012721866369247437, -0.0012158453464508057, -0.0011595040559768677, -0.0011031627655029297, -0.0010468214750289917, -0.0009904801845550537, -0.0009341388940811157, -0.0008777976036071777, -0.0008214563131332397, -0.0007651150226593018, -0.0007087737321853638, -0.0006524324417114258, -0.0005960911512374878, -0.0005397498607635498, -0.0004834085702896118, -0.00042706727981567383, -0.00037072598934173584, -0.00031438469886779785, -0.00025804340839385986, -0.00020170211791992188, -0.0001453608274459839, -8.90195369720459e-05, -3.267824649810791e-05, 2.3663043975830078e-05, 8.000433444976807e-05, 0.00013634562492370605, 0.00019268691539764404, 0.00024902820587158203, 0.00030536949634552, 0.000361710786819458, 0.000418052077293396, 0.000474393367767334, 0.000530734658241272, 0.00058707594871521, 0.000643417239189148, 0.0006997585296630859, 0.0007560998201370239, 0.0008124411106109619, 0.0008687824010848999, 0.0009251236915588379, 0.0009814649820327759, 0.0010378062725067139, 0.0010941475629806519, 0.0011504888534545898, 0.0012068301439285278, 0.0012631714344024658, 0.0013195127248764038, 0.0013758540153503418, 0.0014321953058242798, 0.0014885365962982178, 0.0015448778867721558, 0.0016012191772460938]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 11.0, 14.0, 29.0, 71.0, 148.0, 366.0, 213.0, 72.0, 45.0, 15.0, 14.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010348988143960014, -9.455355757381767e-05, -8.56172337080352e-05, -7.668090984225273e-05, -6.774459325242788e-05, -5.88082657486666e-05, -4.987194552086294e-05, -4.093562165508047e-05, -3.1999297789298e-05, -2.306297392351553e-05, -1.4126651876722462e-05, -5.1903298299293965e-06, 3.745994035853073e-06, 1.2682317901635543e-05, 2.1618638129439205e-05, 3.0554961995221674e-05, 3.9491285861004144e-05, 4.8427609726786613e-05, 5.736393359256908e-05, 6.630025745835155e-05, 7.523657404817641e-05, 8.417290518991649e-05, 9.310922177974135e-05, 0.00010204554564552382, 0.00011098186951130629, 0.00011991819337708876, 0.00012885451724287122, 0.00013779083383269608, 0.00014672716497443616, 0.00015566348156426102, 0.00016459979815408587, 0.00017353612929582596, 0.00018247246043756604, 0.0001914087770273909, 0.00020034510816913098, 0.00020928142475895584, 0.00021821775590069592, 0.00022715407249052078, 0.00023609038908034563, 0.0002450267202220857, 0.0002539630513638258, 0.0002628993825055659, 0.0002718356845434755, 0.0002807720156852156, 0.0002897083468269557, 0.00029864467796869576, 0.0003075809800066054, 0.00031651731114834547, 0.00032545364229008555, 0.00033438997343182564, 0.00034332627546973526, 0.00035226260661147535, 0.00036119893775321543, 0.0003701352688949555, 0.00037907157093286514, 0.0003880079020746052, 0.00039694420411251485, 0.00040588053525425494, 0.00041481683729216456, 0.00042375316843390465, 0.00043268949957564473, 0.0004416258307173848, 0.00045056213275529444, 0.0004594984638970345, 0.0004684347950387746]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 0.0, 3.0, 9.0, 13.0, 12.0, 7.0, 11.0, 21.0, 18.0, 17.0, 22.0, 21.0, 28.0, 25.0, 27.0, 34.0, 32.0, 30.0, 29.0, 36.0, 43.0, 46.0, 30.0, 34.0, 38.0, 38.0, 26.0, 28.0, 30.0, 31.0, 32.0, 28.0, 19.0, 36.0, 25.0, 17.0, 15.0, 16.0, 8.0, 16.0, 8.0, 4.0, 4.0, 5.0, 7.0, 4.0, 2.0, 3.0, 5.0, 5.0, 1.0, 3.0], "bins": [-5.5909156799316406e-05, -5.427934229373932e-05, -5.264952778816223e-05, -5.1019713282585144e-05, -4.938989877700806e-05, -4.776008427143097e-05, -4.613026976585388e-05, -4.4500455260276794e-05, -4.287064075469971e-05, -4.124082624912262e-05, -3.961101174354553e-05, -3.7981197237968445e-05, -3.635138273239136e-05, -3.472156822681427e-05, -3.309175372123718e-05, -3.1461939215660095e-05, -2.9832124710083008e-05, -2.820231020450592e-05, -2.6572495698928833e-05, -2.4942681193351746e-05, -2.3312866687774658e-05, -2.168305218219757e-05, -2.0053237676620483e-05, -1.8423423171043396e-05, -1.679360866546631e-05, -1.5163794159889221e-05, -1.3533979654312134e-05, -1.1904165148735046e-05, -1.0274350643157959e-05, -8.644536137580872e-06, -7.014721632003784e-06, -5.384907126426697e-06, -3.7550926208496094e-06, -2.125278115272522e-06, -4.954636096954346e-07, 1.1343508958816528e-06, 2.7641654014587402e-06, 4.393979907035828e-06, 6.023794412612915e-06, 7.653608918190002e-06, 9.28342342376709e-06, 1.0913237929344177e-05, 1.2543052434921265e-05, 1.4172866940498352e-05, 1.580268144607544e-05, 1.7432495951652527e-05, 1.9062310457229614e-05, 2.06921249628067e-05, 2.232193946838379e-05, 2.3951753973960876e-05, 2.5581568479537964e-05, 2.721138298511505e-05, 2.884119749069214e-05, 3.0471011996269226e-05, 3.2100826501846313e-05, 3.37306410074234e-05, 3.536045551300049e-05, 3.6990270018577576e-05, 3.862008452415466e-05, 4.024989902973175e-05, 4.187971353530884e-05, 4.3509528040885925e-05, 4.513934254646301e-05, 4.67691570520401e-05, 4.839897155761719e-05]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 7.0, 6.0, 9.0, 10.0, 12.0, 12.0, 17.0, 19.0, 23.0, 33.0, 20.0, 33.0, 29.0, 44.0, 45.0, 42.0, 52.0, 58.0, 48.0, 46.0, 63.0, 47.0, 31.0, 43.0, 30.0, 30.0, 26.0, 23.0, 24.0, 21.0, 19.0, 13.0, 10.0, 10.0, 9.0, 3.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-4.74609375, -4.6146240234375, -4.483154296875, -4.3516845703125, -4.22021484375, -4.0887451171875, -3.957275390625, -3.8258056640625, -3.6943359375, -3.5628662109375, -3.431396484375, -3.2999267578125, -3.16845703125, -3.0369873046875, -2.905517578125, -2.7740478515625, -2.642578125, -2.5111083984375, -2.379638671875, -2.2481689453125, -2.11669921875, -1.9852294921875, -1.853759765625, -1.7222900390625, -1.5908203125, -1.4593505859375, -1.327880859375, -1.1964111328125, -1.06494140625, -0.9334716796875, -0.802001953125, -0.6705322265625, -0.5390625, -0.4075927734375, -0.276123046875, -0.1446533203125, -0.01318359375, 0.1182861328125, 0.249755859375, 0.3812255859375, 0.5126953125, 0.6441650390625, 0.775634765625, 0.9071044921875, 1.03857421875, 1.1700439453125, 1.301513671875, 1.4329833984375, 1.564453125, 1.6959228515625, 1.827392578125, 1.9588623046875, 2.09033203125, 2.2218017578125, 2.353271484375, 2.4847412109375, 2.6162109375, 2.7476806640625, 2.879150390625, 3.0106201171875, 3.14208984375, 3.2735595703125, 3.405029296875, 3.5364990234375, 3.66796875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 9.0, 5.0, 13.0, 11.0, 22.0, 28.0, 27.0, 50.0, 71.0, 90.0, 134.0, 199.0, 247.0, 362.0, 511.0, 694.0, 1007.0, 1446.0, 1985.0, 2942.0, 5007.0, 12142.0, 64979.0, 645732.0, 262807.0, 27916.0, 7645.0, 3973.0, 2410.0, 1785.0, 1251.0, 854.0, 638.0, 467.0, 306.0, 222.0, 149.0, 114.0, 71.0, 58.0, 57.0, 36.0, 24.0, 20.0, 8.0, 11.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.8203125, -5.63720703125, -5.4541015625, -5.27099609375, -5.087890625, -4.90478515625, -4.7216796875, -4.53857421875, -4.35546875, -4.17236328125, -3.9892578125, -3.80615234375, -3.623046875, -3.43994140625, -3.2568359375, -3.07373046875, -2.890625, -2.70751953125, -2.5244140625, -2.34130859375, -2.158203125, -1.97509765625, -1.7919921875, -1.60888671875, -1.42578125, -1.24267578125, -1.0595703125, -0.87646484375, -0.693359375, -0.51025390625, -0.3271484375, -0.14404296875, 0.0390625, 0.22216796875, 0.4052734375, 0.58837890625, 0.771484375, 0.95458984375, 1.1376953125, 1.32080078125, 1.50390625, 1.68701171875, 1.8701171875, 2.05322265625, 2.236328125, 2.41943359375, 2.6025390625, 2.78564453125, 2.96875, 3.15185546875, 3.3349609375, 3.51806640625, 3.701171875, 3.88427734375, 4.0673828125, 4.25048828125, 4.43359375, 4.61669921875, 4.7998046875, 4.98291015625, 5.166015625, 5.34912109375, 5.5322265625, 5.71533203125, 5.8984375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 8.0, 10.0, 13.0, 10.0, 13.0, 15.0, 15.0, 13.0, 24.0, 27.0, 31.0, 32.0, 32.0, 32.0, 22.0, 34.0, 39.0, 33.0, 56.0, 47.0, 278.0, 1724.0, 96.0, 45.0, 45.0, 47.0, 45.0, 30.0, 30.0, 35.0, 24.0, 19.0, 16.0, 16.0, 16.0, 17.0, 15.0, 3.0, 8.0, 8.0, 8.0, 2.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.21875, -12.795166015625, -12.37158203125, -11.947998046875, -11.5244140625, -11.100830078125, -10.67724609375, -10.253662109375, -9.830078125, -9.406494140625, -8.98291015625, -8.559326171875, -8.1357421875, -7.712158203125, -7.28857421875, -6.864990234375, -6.44140625, -6.017822265625, -5.59423828125, -5.170654296875, -4.7470703125, -4.323486328125, -3.89990234375, -3.476318359375, -3.052734375, -2.629150390625, -2.20556640625, -1.781982421875, -1.3583984375, -0.934814453125, -0.51123046875, -0.087646484375, 0.3359375, 0.759521484375, 1.18310546875, 1.606689453125, 2.0302734375, 2.453857421875, 2.87744140625, 3.301025390625, 3.724609375, 4.148193359375, 4.57177734375, 4.995361328125, 5.4189453125, 5.842529296875, 6.26611328125, 6.689697265625, 7.11328125, 7.536865234375, 7.96044921875, 8.384033203125, 8.8076171875, 9.231201171875, 9.65478515625, 10.078369140625, 10.501953125, 10.925537109375, 11.34912109375, 11.772705078125, 12.1962890625, 12.619873046875, 13.04345703125, 13.467041015625, 13.890625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 3.0, 6.0, 13.0, 10.0, 9.0, 19.0, 25.0, 40.0, 31.0, 50.0, 108.0, 163.0, 268.0, 529.0, 1496.0, 4890.0, 25738.0, 3049823.0, 51751.0, 7089.0, 1996.0, 704.0, 323.0, 189.0, 113.0, 78.0, 55.0, 32.0, 38.0, 21.0, 21.0, 20.0, 18.0, 8.0, 10.0, 9.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.078125, -22.177490234375, -21.27685546875, -20.376220703125, -19.4755859375, -18.574951171875, -17.67431640625, -16.773681640625, -15.873046875, -14.972412109375, -14.07177734375, -13.171142578125, -12.2705078125, -11.369873046875, -10.46923828125, -9.568603515625, -8.66796875, -7.767333984375, -6.86669921875, -5.966064453125, -5.0654296875, -4.164794921875, -3.26416015625, -2.363525390625, -1.462890625, -0.562255859375, 0.33837890625, 1.239013671875, 2.1396484375, 3.040283203125, 3.94091796875, 4.841552734375, 5.7421875, 6.642822265625, 7.54345703125, 8.444091796875, 9.3447265625, 10.245361328125, 11.14599609375, 12.046630859375, 12.947265625, 13.847900390625, 14.74853515625, 15.649169921875, 16.5498046875, 17.450439453125, 18.35107421875, 19.251708984375, 20.15234375, 21.052978515625, 21.95361328125, 22.854248046875, 23.7548828125, 24.655517578125, 25.55615234375, 26.456787109375, 27.357421875, 28.258056640625, 29.15869140625, 30.059326171875, 30.9599609375, 31.860595703125, 32.76123046875, 33.661865234375, 34.5625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 16.0, 169.0, 634.0, 175.0, 18.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-177.4801788330078, -173.7400665283203, -169.9999542236328, -166.25982666015625, -162.51971435546875, -158.77960205078125, -155.03948974609375, -151.29937744140625, -147.5592498779297, -143.8191375732422, -140.0790252685547, -136.33889770507812, -132.59878540039062, -128.85867309570312, -125.11856079101562, -121.3784408569336, -117.63833618164062, -113.89822387695312, -110.1581039428711, -106.4179916381836, -102.67787170410156, -98.93775939941406, -95.19764709472656, -91.45752716064453, -87.7174072265625, -83.977294921875, -80.23717498779297, -76.49706268310547, -72.75694274902344, -69.01683044433594, -65.27671813964844, -61.536598205566406, -57.79648208618164, -54.056365966796875, -50.31624984741211, -46.576133728027344, -42.836021423339844, -39.09590530395508, -35.35578918457031, -31.61567497253418, -27.875558853149414, -24.13544273376465, -20.395328521728516, -16.65521240234375, -12.9150972366333, -9.174982070922852, -5.434865951538086, -1.6947517395019531, 2.0453643798828125, 5.785479545593262, 9.525594711303711, 13.265710830688477, 17.00582504272461, 20.745941162109375, 24.48605728149414, 28.226171493530273, 31.96628761291504, 35.70640182495117, 39.44651794433594, 43.1866340637207, 46.92675018310547, 50.66686248779297, 54.406982421875, 58.1470947265625, 61.887210845947266]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 7.0, 2.0, 3.0, 13.0, 13.0, 5.0, 14.0, 8.0, 16.0, 20.0, 18.0, 33.0, 30.0, 36.0, 23.0, 41.0, 42.0, 42.0, 45.0, 39.0, 42.0, 48.0, 46.0, 43.0, 37.0, 36.0, 39.0, 38.0, 36.0, 32.0, 20.0, 18.0, 16.0, 15.0, 21.0, 11.0, 18.0, 10.0, 10.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.54596710205078, -49.972530364990234, -48.39908981323242, -46.825653076171875, -45.25221633911133, -43.67877960205078, -42.10533905029297, -40.53190231323242, -38.958465576171875, -37.38502883911133, -35.811588287353516, -34.23815155029297, -32.66471481323242, -31.091276168823242, -29.517837524414062, -27.944400787353516, -26.370960235595703, -24.797521591186523, -23.224084854125977, -21.650646209716797, -20.07720947265625, -18.50377082824707, -16.93033218383789, -15.356894493103027, -13.783456802368164, -12.2100191116333, -10.636581420898438, -9.063142776489258, -7.4897050857543945, -5.916267395019531, -4.342828750610352, -2.7693910598754883, -1.195953369140625, 0.3774845600128174, 1.9509224891662598, 3.5243606567382812, 5.0977983474731445, 6.671236038208008, 8.244674682617188, 9.81811237335205, 11.391550064086914, 12.964987754821777, 14.53842544555664, 16.11186408996582, 17.685302734375, 19.258739471435547, 20.832178115844727, 22.405616760253906, 23.979053497314453, 25.552492141723633, 27.12592887878418, 28.69936752319336, 30.272804260253906, 31.846242904663086, 33.419681549072266, 34.99311828613281, 36.566558837890625, 38.13999557495117, 39.713436126708984, 41.28687286376953, 42.86030960083008, 44.433746337890625, 46.00718688964844, 47.580623626708984, 49.15406036376953]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 5.0, 6.0, 5.0, 3.0, 7.0, 6.0, 6.0, 12.0, 12.0, 21.0, 13.0, 10.0, 22.0, 30.0, 23.0, 40.0, 41.0, 36.0, 46.0, 47.0, 39.0, 65.0, 47.0, 47.0, 40.0, 56.0, 48.0, 37.0, 27.0, 29.0, 25.0, 23.0, 18.0, 27.0, 23.0, 8.0, 16.0, 8.0, 8.0, 4.0, 3.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.88671875, -4.7510986328125, -4.615478515625, -4.4798583984375, -4.34423828125, -4.2086181640625, -4.072998046875, -3.9373779296875, -3.8017578125, -3.6661376953125, -3.530517578125, -3.3948974609375, -3.25927734375, -3.1236572265625, -2.988037109375, -2.8524169921875, -2.716796875, -2.5811767578125, -2.445556640625, -2.3099365234375, -2.17431640625, -2.0386962890625, -1.903076171875, -1.7674560546875, -1.6318359375, -1.4962158203125, -1.360595703125, -1.2249755859375, -1.08935546875, -0.9537353515625, -0.818115234375, -0.6824951171875, -0.546875, -0.4112548828125, -0.275634765625, -0.1400146484375, -0.00439453125, 0.1312255859375, 0.266845703125, 0.4024658203125, 0.5380859375, 0.6737060546875, 0.809326171875, 0.9449462890625, 1.08056640625, 1.2161865234375, 1.351806640625, 1.4874267578125, 1.623046875, 1.7586669921875, 1.894287109375, 2.0299072265625, 2.16552734375, 2.3011474609375, 2.436767578125, 2.5723876953125, 2.7080078125, 2.8436279296875, 2.979248046875, 3.1148681640625, 3.25048828125, 3.3861083984375, 3.521728515625, 3.6573486328125, 3.79296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 8.0, 13.0, 18.0, 26.0, 53.0, 55.0, 101.0, 153.0, 236.0, 365.0, 647.0, 1125.0, 2015.0, 3697.0, 6986.0, 15007.0, 36032.0, 185140.0, 3196809.0, 648287.0, 57923.0, 20462.0, 9116.0, 4482.0, 2337.0, 1248.0, 777.0, 456.0, 256.0, 155.0, 96.0, 68.0, 36.0, 31.0, 13.0, 16.0, 9.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1015625, -12.6602783203125, -12.218994140625, -11.7777099609375, -11.33642578125, -10.8951416015625, -10.453857421875, -10.0125732421875, -9.5712890625, -9.1300048828125, -8.688720703125, -8.2474365234375, -7.80615234375, -7.3648681640625, -6.923583984375, -6.4822998046875, -6.041015625, -5.5997314453125, -5.158447265625, -4.7171630859375, -4.27587890625, -3.8345947265625, -3.393310546875, -2.9520263671875, -2.5107421875, -2.0694580078125, -1.628173828125, -1.1868896484375, -0.74560546875, -0.3043212890625, 0.136962890625, 0.5782470703125, 1.01953125, 1.4608154296875, 1.902099609375, 2.3433837890625, 2.78466796875, 3.2259521484375, 3.667236328125, 4.1085205078125, 4.5498046875, 4.9910888671875, 5.432373046875, 5.8736572265625, 6.31494140625, 6.7562255859375, 7.197509765625, 7.6387939453125, 8.080078125, 8.5213623046875, 8.962646484375, 9.4039306640625, 9.84521484375, 10.2864990234375, 10.727783203125, 11.1690673828125, 11.6103515625, 12.0516357421875, 12.492919921875, 12.9342041015625, 13.37548828125, 13.8167724609375, 14.258056640625, 14.6993408203125, 15.140625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 7.0, 5.0, 5.0, 6.0, 17.0, 10.0, 13.0, 21.0, 22.0, 32.0, 37.0, 44.0, 71.0, 101.0, 135.0, 284.0, 455.0, 610.0, 691.0, 482.0, 320.0, 191.0, 131.0, 85.0, 63.0, 46.0, 34.0, 30.0, 20.0, 20.0, 13.0, 17.0, 10.0, 5.0, 7.0, 2.0, 8.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.5078125, -11.1611328125, -10.814453125, -10.4677734375, -10.12109375, -9.7744140625, -9.427734375, -9.0810546875, -8.734375, -8.3876953125, -8.041015625, -7.6943359375, -7.34765625, -7.0009765625, -6.654296875, -6.3076171875, -5.9609375, -5.6142578125, -5.267578125, -4.9208984375, -4.57421875, -4.2275390625, -3.880859375, -3.5341796875, -3.1875, -2.8408203125, -2.494140625, -2.1474609375, -1.80078125, -1.4541015625, -1.107421875, -0.7607421875, -0.4140625, -0.0673828125, 0.279296875, 0.6259765625, 0.97265625, 1.3193359375, 1.666015625, 2.0126953125, 2.359375, 2.7060546875, 3.052734375, 3.3994140625, 3.74609375, 4.0927734375, 4.439453125, 4.7861328125, 5.1328125, 5.4794921875, 5.826171875, 6.1728515625, 6.51953125, 6.8662109375, 7.212890625, 7.5595703125, 7.90625, 8.2529296875, 8.599609375, 8.9462890625, 9.29296875, 9.6396484375, 9.986328125, 10.3330078125, 10.6796875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 11.0, 6.0, 16.0, 13.0, 23.0, 38.0, 50.0, 85.0, 127.0, 254.0, 437.0, 847.0, 1551.0, 2817.0, 5401.0, 11128.0, 25088.0, 65748.0, 307244.0, 3104498.0, 527954.0, 84086.0, 30304.0, 13101.0, 6362.0, 3186.0, 1704.0, 957.0, 496.0, 296.0, 149.0, 115.0, 50.0, 41.0, 33.0, 18.0, 1.0, 13.0, 5.0, 8.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.34375, -17.72412109375, -17.1044921875, -16.48486328125, -15.865234375, -15.24560546875, -14.6259765625, -14.00634765625, -13.38671875, -12.76708984375, -12.1474609375, -11.52783203125, -10.908203125, -10.28857421875, -9.6689453125, -9.04931640625, -8.4296875, -7.81005859375, -7.1904296875, -6.57080078125, -5.951171875, -5.33154296875, -4.7119140625, -4.09228515625, -3.47265625, -2.85302734375, -2.2333984375, -1.61376953125, -0.994140625, -0.37451171875, 0.2451171875, 0.86474609375, 1.484375, 2.10400390625, 2.7236328125, 3.34326171875, 3.962890625, 4.58251953125, 5.2021484375, 5.82177734375, 6.44140625, 7.06103515625, 7.6806640625, 8.30029296875, 8.919921875, 9.53955078125, 10.1591796875, 10.77880859375, 11.3984375, 12.01806640625, 12.6376953125, 13.25732421875, 13.876953125, 14.49658203125, 15.1162109375, 15.73583984375, 16.35546875, 16.97509765625, 17.5947265625, 18.21435546875, 18.833984375, 19.45361328125, 20.0732421875, 20.69287109375, 21.3125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 12.0, 6.0, 17.0, 29.0, 42.0, 47.0, 92.0, 146.0, 166.0, 143.0, 97.0, 71.0, 52.0, 30.0, 25.0, 9.0, 9.0, 4.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.87895202636719, -60.52501678466797, -58.171085357666016, -55.81715393066406, -53.463218688964844, -51.109283447265625, -48.75535202026367, -46.40142059326172, -44.0474853515625, -41.69355010986328, -39.33961868286133, -36.985687255859375, -34.631752014160156, -32.27781677246094, -29.923885345458984, -27.5699520111084, -25.216018676757812, -22.862085342407227, -20.50815200805664, -18.154218673706055, -15.800285339355469, -13.446352005004883, -11.092418670654297, -8.738485336303711, -6.384552001953125, -4.030618667602539, -1.6766853332519531, 0.6772480010986328, 3.0311813354492188, 5.385114669799805, 7.739048004150391, 10.092981338500977, 12.446907043457031, 14.800840377807617, 17.154773712158203, 19.50870704650879, 21.862640380859375, 24.21657371520996, 26.570507049560547, 28.924440383911133, 31.27837371826172, 33.63230895996094, 35.98624038696289, 38.340171813964844, 40.69410705566406, 43.04804229736328, 45.401973724365234, 47.75590515136719, 50.109840393066406, 52.463775634765625, 54.81770706176758, 57.17163848876953, 59.52557373046875, 61.87950897216797, 64.23344421386719, 66.58737182617188, 68.9413070678711, 71.29524230957031, 73.649169921875, 76.00310516357422, 78.35704040527344, 80.71097564697266, 83.06491088867188, 85.41883850097656, 87.77277374267578]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 15.0, 5.0, 7.0, 13.0, 17.0, 13.0, 18.0, 19.0, 21.0, 25.0, 19.0, 34.0, 31.0, 27.0, 32.0, 34.0, 32.0, 36.0, 40.0, 43.0, 38.0, 55.0, 40.0, 43.0, 38.0, 40.0, 33.0, 35.0, 33.0, 22.0, 23.0, 22.0, 22.0, 11.0, 17.0, 12.0, 8.0, 4.0, 4.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.83740234375, -29.712251663208008, -28.587100982666016, -27.461950302124023, -26.33679962158203, -25.21164894104004, -24.086498260498047, -22.961347579956055, -21.836196899414062, -20.71104621887207, -19.585895538330078, -18.460744857788086, -17.335594177246094, -16.2104434967041, -15.08529281616211, -13.960142135620117, -12.834991455078125, -11.709840774536133, -10.58469009399414, -9.459539413452148, -8.334388732910156, -7.209238052368164, -6.084087371826172, -4.95893669128418, -3.8337860107421875, -2.7086353302001953, -1.5834846496582031, -0.45833396911621094, 0.6668167114257812, 1.7919673919677734, 2.9171180725097656, 4.042268753051758, 5.16741943359375, 6.292570114135742, 7.417720794677734, 8.542871475219727, 9.668022155761719, 10.793172836303711, 11.918323516845703, 13.043474197387695, 14.168624877929688, 15.29377555847168, 16.418926239013672, 17.544076919555664, 18.669227600097656, 19.79437828063965, 20.91952896118164, 22.044679641723633, 23.169830322265625, 24.294981002807617, 25.42013168334961, 26.5452823638916, 27.670433044433594, 28.795583724975586, 29.920734405517578, 31.04588508605957, 32.17103576660156, 33.29618835449219, 34.42133712768555, 35.546485900878906, 36.67163848876953, 37.796791076660156, 38.921939849853516, 40.047088623046875, 41.1722412109375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 2.0, 6.0, 6.0, 3.0, 8.0, 11.0, 5.0, 13.0, 13.0, 14.0, 22.0, 16.0, 19.0, 18.0, 46.0, 34.0, 35.0, 37.0, 42.0, 56.0, 54.0, 39.0, 50.0, 50.0, 38.0, 45.0, 26.0, 43.0, 34.0, 35.0, 25.0, 19.0, 26.0, 18.0, 14.0, 17.0, 9.0, 17.0, 10.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5859375, -4.45037841796875, -4.3148193359375, -4.17926025390625, -4.043701171875, -3.90814208984375, -3.7725830078125, -3.63702392578125, -3.50146484375, -3.36590576171875, -3.2303466796875, -3.09478759765625, -2.959228515625, -2.82366943359375, -2.6881103515625, -2.55255126953125, -2.4169921875, -2.28143310546875, -2.1458740234375, -2.01031494140625, -1.874755859375, -1.73919677734375, -1.6036376953125, -1.46807861328125, -1.33251953125, -1.19696044921875, -1.0614013671875, -0.92584228515625, -0.790283203125, -0.65472412109375, -0.5191650390625, -0.38360595703125, -0.248046875, -0.11248779296875, 0.0230712890625, 0.15863037109375, 0.294189453125, 0.42974853515625, 0.5653076171875, 0.70086669921875, 0.83642578125, 0.97198486328125, 1.1075439453125, 1.24310302734375, 1.378662109375, 1.51422119140625, 1.6497802734375, 1.78533935546875, 1.9208984375, 2.05645751953125, 2.1920166015625, 2.32757568359375, 2.463134765625, 2.59869384765625, 2.7342529296875, 2.86981201171875, 3.00537109375, 3.14093017578125, 3.2764892578125, 3.41204833984375, 3.547607421875, 3.68316650390625, 3.8187255859375, 3.95428466796875, 4.08984375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 7.0, 11.0, 23.0, 23.0, 26.0, 44.0, 53.0, 114.0, 152.0, 274.0, 428.0, 565.0, 923.0, 1324.0, 2170.0, 3612.0, 5823.0, 9344.0, 16295.0, 28390.0, 52544.0, 101748.0, 209119.0, 294309.0, 150298.0, 75696.0, 40080.0, 22142.0, 12761.0, 7549.0, 4722.0, 2866.0, 1814.0, 1143.0, 759.0, 482.0, 320.0, 205.0, 131.0, 105.0, 56.0, 41.0, 21.0, 18.0, 12.0, 10.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1751708984375, -0.1695709228515625, -0.163970947265625, -0.1583709716796875, -0.15277099609375, -0.1471710205078125, -0.141571044921875, -0.1359710693359375, -0.13037109375, -0.1247711181640625, -0.119171142578125, -0.1135711669921875, -0.10797119140625, -0.1023712158203125, -0.096771240234375, -0.0911712646484375, -0.0855712890625, -0.0799713134765625, -0.074371337890625, -0.0687713623046875, -0.06317138671875, -0.0575714111328125, -0.051971435546875, -0.0463714599609375, -0.040771484375, -0.0351715087890625, -0.029571533203125, -0.0239715576171875, -0.01837158203125, -0.0127716064453125, -0.007171630859375, -0.0015716552734375, 0.0040283203125, 0.0096282958984375, 0.015228271484375, 0.0208282470703125, 0.02642822265625, 0.0320281982421875, 0.037628173828125, 0.0432281494140625, 0.048828125, 0.0544281005859375, 0.060028076171875, 0.0656280517578125, 0.07122802734375, 0.0768280029296875, 0.082427978515625, 0.0880279541015625, 0.0936279296875, 0.0992279052734375, 0.104827880859375, 0.1104278564453125, 0.11602783203125, 0.1216278076171875, 0.127227783203125, 0.1328277587890625, 0.138427734375, 0.1440277099609375, 0.149627685546875, 0.1552276611328125, 0.16082763671875, 0.1664276123046875, 0.172027587890625, 0.1776275634765625, 0.1832275390625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 4.0, 7.0, 5.0, 8.0, 13.0, 16.0, 13.0, 18.0, 24.0, 19.0, 19.0, 36.0, 28.0, 43.0, 33.0, 40.0, 39.0, 50.0, 46.0, 1062.0, 35.0, 43.0, 36.0, 39.0, 36.0, 36.0, 36.0, 30.0, 26.0, 18.0, 25.0, 20.0, 21.0, 17.0, 19.0, 6.0, 9.0, 12.0, 8.0, 4.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.8984375, -2.807220458984375, -2.71600341796875, -2.624786376953125, -2.5335693359375, -2.442352294921875, -2.35113525390625, -2.259918212890625, -2.168701171875, -2.077484130859375, -1.98626708984375, -1.895050048828125, -1.8038330078125, -1.712615966796875, -1.62139892578125, -1.530181884765625, -1.43896484375, -1.347747802734375, -1.25653076171875, -1.165313720703125, -1.0740966796875, -0.982879638671875, -0.89166259765625, -0.800445556640625, -0.709228515625, -0.618011474609375, -0.52679443359375, -0.435577392578125, -0.3443603515625, -0.253143310546875, -0.16192626953125, -0.070709228515625, 0.0205078125, 0.111724853515625, 0.20294189453125, 0.294158935546875, 0.3853759765625, 0.476593017578125, 0.56781005859375, 0.659027099609375, 0.750244140625, 0.841461181640625, 0.93267822265625, 1.023895263671875, 1.1151123046875, 1.206329345703125, 1.29754638671875, 1.388763427734375, 1.47998046875, 1.571197509765625, 1.66241455078125, 1.753631591796875, 1.8448486328125, 1.936065673828125, 2.02728271484375, 2.118499755859375, 2.209716796875, 2.300933837890625, 2.39215087890625, 2.483367919921875, 2.5745849609375, 2.665802001953125, 2.75701904296875, 2.848236083984375, 2.939453125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 6.0, 8.0, 7.0, 18.0, 28.0, 33.0, 59.0, 55.0, 102.0, 139.0, 199.0, 295.0, 449.0, 598.0, 810.0, 1263.0, 1845.0, 2653.0, 3849.0, 5855.0, 8819.0, 13332.0, 21441.0, 33907.0, 54278.0, 88494.0, 149461.0, 1286932.0, 164573.0, 96258.0, 58556.0, 36134.0, 22880.0, 14950.0, 9478.0, 6346.0, 4096.0, 2818.0, 1946.0, 1236.0, 905.0, 631.0, 420.0, 314.0, 189.0, 162.0, 106.0, 66.0, 48.0, 38.0, 17.0, 14.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.11968994140625, -0.11590003967285156, -0.11211013793945312, -0.10832023620605469, -0.10453033447265625, -0.10074043273925781, -0.09695053100585938, -0.09316062927246094, -0.0893707275390625, -0.08558082580566406, -0.08179092407226562, -0.07800102233886719, -0.07421112060546875, -0.07042121887207031, -0.06663131713867188, -0.06284141540527344, -0.059051513671875, -0.05526161193847656, -0.051471710205078125, -0.04768180847167969, -0.04389190673828125, -0.04010200500488281, -0.036312103271484375, -0.03252220153808594, -0.0287322998046875, -0.024942398071289062, -0.021152496337890625, -0.017362594604492188, -0.01357269287109375, -0.009782791137695312, -0.005992889404296875, -0.0022029876708984375, 0.0015869140625, 0.0053768157958984375, 0.009166717529296875, 0.012956619262695312, 0.01674652099609375, 0.020536422729492188, 0.024326324462890625, 0.028116226196289062, 0.0319061279296875, 0.03569602966308594, 0.039485931396484375, 0.04327583312988281, 0.04706573486328125, 0.05085563659667969, 0.054645538330078125, 0.05843544006347656, 0.062225341796875, 0.06601524353027344, 0.06980514526367188, 0.07359504699707031, 0.07738494873046875, 0.08117485046386719, 0.08496475219726562, 0.08875465393066406, 0.0925445556640625, 0.09633445739746094, 0.10012435913085938, 0.10391426086425781, 0.10770416259765625, 0.11149406433105469, 0.11528396606445312, 0.11907386779785156, 0.12286376953125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 8.0, 8.0, 9.0, 9.0, 17.0, 19.0, 17.0, 22.0, 33.0, 42.0, 48.0, 84.0, 127.0, 142.0, 101.0, 81.0, 37.0, 19.0, 26.0, 19.0, 28.0, 27.0, 15.0, 12.0, 13.0, 4.0, 2.0, 5.0, 5.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018453598022460938, -0.00017823092639446259, -0.0001719258725643158, -0.000165620818734169, -0.00015931576490402222, -0.00015301071107387543, -0.00014670565724372864, -0.00014040060341358185, -0.00013409554958343506, -0.00012779049575328827, -0.00012148544192314148, -0.00011518038809299469, -0.0001088753342628479, -0.00010257028043270111, -9.626522660255432e-05, -8.996017277240753e-05, -8.365511894226074e-05, -7.735006511211395e-05, -7.104501128196716e-05, -6.473995745182037e-05, -5.8434903621673584e-05, -5.2129849791526794e-05, -4.5824795961380005e-05, -3.9519742131233215e-05, -3.3214688301086426e-05, -2.6909634470939636e-05, -2.0604580640792847e-05, -1.4299526810646057e-05, -7.994472980499268e-06, -1.689419150352478e-06, 4.6156346797943115e-06, 1.0920688509941101e-05, 1.722574234008789e-05, 2.353079617023468e-05, 2.983585000038147e-05, 3.614090383052826e-05, 4.244595766067505e-05, 4.875101149082184e-05, 5.505606532096863e-05, 6.136111915111542e-05, 6.766617298126221e-05, 7.3971226811409e-05, 8.027628064155579e-05, 8.658133447170258e-05, 9.288638830184937e-05, 9.919144213199615e-05, 0.00010549649596214294, 0.00011180154979228973, 0.00011810660362243652, 0.0001244116574525833, 0.0001307167112827301, 0.0001370217651128769, 0.00014332681894302368, 0.00014963187277317047, 0.00015593692660331726, 0.00016224198043346405, 0.00016854703426361084, 0.00017485208809375763, 0.00018115714192390442, 0.0001874621957540512, 0.000193767249584198, 0.0002000723034143448, 0.00020637735724449158, 0.00021268241107463837, 0.00021898746490478516]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 9.0, 3.0, 12.0, 12.0, 16.0, 21.0, 27.0, 40.0, 55.0, 62.0, 96.0, 167.0, 286.0, 717.0, 2330.0, 12102.0, 127233.0, 860822.0, 36618.0, 5536.0, 1239.0, 443.0, 245.0, 137.0, 84.0, 63.0, 40.0, 41.0, 28.0, 16.0, 10.0, 9.0, 4.0, 9.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00225067138671875, -0.002180933952331543, -0.002111196517944336, -0.002041459083557129, -0.001971721649169922, -0.0019019842147827148, -0.0018322467803955078, -0.0017625093460083008, -0.0016927719116210938, -0.0016230344772338867, -0.0015532970428466797, -0.0014835596084594727, -0.0014138221740722656, -0.0013440847396850586, -0.0012743473052978516, -0.0012046098709106445, -0.0011348724365234375, -0.0010651350021362305, -0.0009953975677490234, -0.0009256601333618164, -0.0008559226989746094, -0.0007861852645874023, -0.0007164478302001953, -0.0006467103958129883, -0.0005769729614257812, -0.0005072355270385742, -0.0004374980926513672, -0.00036776065826416016, -0.0002980232238769531, -0.0002282857894897461, -0.00015854835510253906, -8.881092071533203e-05, -1.9073486328125e-05, 5.066394805908203e-05, 0.00012040138244628906, 0.0001901388168334961, 0.0002598762512207031, 0.00032961368560791016, 0.0003993511199951172, 0.0004690885543823242, 0.0005388259887695312, 0.0006085634231567383, 0.0006783008575439453, 0.0007480382919311523, 0.0008177757263183594, 0.0008875131607055664, 0.0009572505950927734, 0.0010269880294799805, 0.0010967254638671875, 0.0011664628982543945, 0.0012362003326416016, 0.0013059377670288086, 0.0013756752014160156, 0.0014454126358032227, 0.0015151500701904297, 0.0015848875045776367, 0.0016546249389648438, 0.0017243623733520508, 0.0017940998077392578, 0.0018638372421264648, 0.0019335746765136719, 0.002003312110900879, 0.002073049545288086, 0.002142786979675293, 0.0022125244140625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 11.0, 24.0, 53.0, 91.0, 269.0, 320.0, 123.0, 56.0, 30.0, 15.0, 3.0, 12.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0005585396429523826, -0.0005473850178532302, -0.0005362303927540779, -0.0005250758258625865, -0.0005139212007634342, -0.0005027665756642818, -0.0004916119505651295, -0.0004804573254659772, -0.0004693027294706553, -0.000458148104371503, -0.0004469935083761811, -0.0004358388832770288, -0.00042468425817787647, -0.0004135296621825546, -0.0004023750370834023, -0.0003912204410880804, -0.0003800658159889281, -0.00036891119088977575, -0.0003577565948944539, -0.00034660196979530156, -0.0003354473737999797, -0.00032429274870082736, -0.00031313812360167503, -0.0003019834985025227, -0.00029082890250720084, -0.0002796742774080485, -0.00026851968141272664, -0.0002573650563135743, -0.000246210431214422, -0.00023505583521910012, -0.0002239012101199478, -0.0002127465995727107, -0.00020159201812930405, -0.00019043740758206695, -0.00017928279703482985, -0.00016812817193567753, -0.00015697356138844043, -0.00014581895084120333, -0.000134664325742051, -0.0001235097151948139, -0.00011235510464757681, -0.00010120049410033971, -9.0045876277145e-05, -7.889125845395029e-05, -6.773664790671319e-05, -5.658203372149728e-05, -4.542741953628138e-05, -3.4272801713086665e-05, -2.3118191165849566e-05, -1.1963576980633661e-05, -8.089627954177558e-07, 1.034565138979815e-05, 2.1500265575014055e-05, 3.265487976022996e-05, 4.3809493945445865e-05, 5.496411176864058e-05, 6.611872231587768e-05, 7.727333286311477e-05, 8.842795068630949e-05, 9.95825685095042e-05, 0.0001107371790567413, 0.0001218917896039784, 0.00013304641470313072, 0.00014420102525036782, 0.00015535563579760492]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 9.0, 4.0, 5.0, 7.0, 2.0, 10.0, 4.0, 17.0, 16.0, 20.0, 19.0, 18.0, 22.0, 26.0, 24.0, 27.0, 41.0, 36.0, 35.0, 29.0, 37.0, 38.0, 49.0, 47.0, 35.0, 39.0, 48.0, 44.0, 30.0, 28.0, 37.0, 23.0, 29.0, 25.0, 13.0, 15.0, 14.0, 13.0, 14.0, 11.0, 7.0, 6.0, 10.0, 12.0, 3.0, 0.0, 6.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.362531661987305e-05, -8.097290992736816e-05, -7.832050323486328e-05, -7.56680965423584e-05, -7.301568984985352e-05, -7.036328315734863e-05, -6.771087646484375e-05, -6.505846977233887e-05, -6.240606307983398e-05, -5.97536563873291e-05, -5.710124969482422e-05, -5.4448843002319336e-05, -5.179643630981445e-05, -4.914402961730957e-05, -4.649162292480469e-05, -4.3839216232299805e-05, -4.118680953979492e-05, -3.853440284729004e-05, -3.5881996154785156e-05, -3.3229589462280273e-05, -3.057718276977539e-05, -2.7924776077270508e-05, -2.5272369384765625e-05, -2.2619962692260742e-05, -1.996755599975586e-05, -1.7315149307250977e-05, -1.4662742614746094e-05, -1.2010335922241211e-05, -9.357929229736328e-06, -6.705522537231445e-06, -4.0531158447265625e-06, -1.4007091522216797e-06, 1.2516975402832031e-06, 3.904104232788086e-06, 6.556510925292969e-06, 9.208917617797852e-06, 1.1861324310302734e-05, 1.4513731002807617e-05, 1.71661376953125e-05, 1.9818544387817383e-05, 2.2470951080322266e-05, 2.512335777282715e-05, 2.777576446533203e-05, 3.0428171157836914e-05, 3.30805778503418e-05, 3.573298454284668e-05, 3.838539123535156e-05, 4.1037797927856445e-05, 4.369020462036133e-05, 4.634261131286621e-05, 4.8995018005371094e-05, 5.1647424697875977e-05, 5.429983139038086e-05, 5.695223808288574e-05, 5.9604644775390625e-05, 6.225705146789551e-05, 6.490945816040039e-05, 6.756186485290527e-05, 7.021427154541016e-05, 7.286667823791504e-05, 7.551908493041992e-05, 7.81714916229248e-05, 8.082389831542969e-05, 8.347630500793457e-05, 8.612871170043945e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 2.0, 6.0, 6.0, 3.0, 8.0, 11.0, 5.0, 13.0, 13.0, 14.0, 22.0, 16.0, 19.0, 18.0, 46.0, 34.0, 35.0, 37.0, 42.0, 56.0, 54.0, 39.0, 50.0, 50.0, 38.0, 45.0, 26.0, 43.0, 34.0, 35.0, 25.0, 19.0, 26.0, 18.0, 14.0, 17.0, 9.0, 17.0, 10.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5859375, -4.45037841796875, -4.3148193359375, -4.17926025390625, -4.043701171875, -3.90814208984375, -3.7725830078125, -3.63702392578125, -3.50146484375, -3.36590576171875, -3.2303466796875, -3.09478759765625, -2.959228515625, -2.82366943359375, -2.6881103515625, -2.55255126953125, -2.4169921875, -2.28143310546875, -2.1458740234375, -2.01031494140625, -1.874755859375, -1.73919677734375, -1.6036376953125, -1.46807861328125, -1.33251953125, -1.19696044921875, -1.0614013671875, -0.92584228515625, -0.790283203125, -0.65472412109375, -0.5191650390625, -0.38360595703125, -0.248046875, -0.11248779296875, 0.0230712890625, 0.15863037109375, 0.294189453125, 0.42974853515625, 0.5653076171875, 0.70086669921875, 0.83642578125, 0.97198486328125, 1.1075439453125, 1.24310302734375, 1.378662109375, 1.51422119140625, 1.6497802734375, 1.78533935546875, 1.9208984375, 2.05645751953125, 2.1920166015625, 2.32757568359375, 2.463134765625, 2.59869384765625, 2.7342529296875, 2.86981201171875, 3.00537109375, 3.14093017578125, 3.2764892578125, 3.41204833984375, 3.547607421875, 3.68316650390625, 3.8187255859375, 3.95428466796875, 4.08984375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 8.0, 8.0, 12.0, 20.0, 21.0, 17.0, 28.0, 54.0, 53.0, 72.0, 102.0, 160.0, 244.0, 329.0, 461.0, 683.0, 1026.0, 1480.0, 2482.0, 4390.0, 10225.0, 33441.0, 168995.0, 597317.0, 171182.0, 33781.0, 10193.0, 4495.0, 2454.0, 1518.0, 990.0, 686.0, 453.0, 339.0, 234.0, 148.0, 105.0, 76.0, 79.0, 45.0, 29.0, 36.0, 14.0, 14.0, 15.0, 13.0, 9.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-4.03515625, -3.9110107421875, -3.786865234375, -3.6627197265625, -3.53857421875, -3.4144287109375, -3.290283203125, -3.1661376953125, -3.0419921875, -2.9178466796875, -2.793701171875, -2.6695556640625, -2.54541015625, -2.4212646484375, -2.297119140625, -2.1729736328125, -2.048828125, -1.9246826171875, -1.800537109375, -1.6763916015625, -1.55224609375, -1.4281005859375, -1.303955078125, -1.1798095703125, -1.0556640625, -0.9315185546875, -0.807373046875, -0.6832275390625, -0.55908203125, -0.4349365234375, -0.310791015625, -0.1866455078125, -0.0625, 0.0616455078125, 0.185791015625, 0.3099365234375, 0.43408203125, 0.5582275390625, 0.682373046875, 0.8065185546875, 0.9306640625, 1.0548095703125, 1.178955078125, 1.3031005859375, 1.42724609375, 1.5513916015625, 1.675537109375, 1.7996826171875, 1.923828125, 2.0479736328125, 2.172119140625, 2.2962646484375, 2.42041015625, 2.5445556640625, 2.668701171875, 2.7928466796875, 2.9169921875, 3.0411376953125, 3.165283203125, 3.2894287109375, 3.41357421875, 3.5377197265625, 3.661865234375, 3.7860107421875, 3.91015625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 6.0, 8.0, 7.0, 8.0, 8.0, 13.0, 25.0, 32.0, 32.0, 31.0, 38.0, 42.0, 30.0, 41.0, 42.0, 38.0, 71.0, 401.0, 1672.0, 74.0, 57.0, 49.0, 44.0, 32.0, 37.0, 36.0, 37.0, 29.0, 26.0, 19.0, 16.0, 9.0, 8.0, 9.0, 11.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.265625, -18.71630859375, -18.1669921875, -17.61767578125, -17.068359375, -16.51904296875, -15.9697265625, -15.42041015625, -14.87109375, -14.32177734375, -13.7724609375, -13.22314453125, -12.673828125, -12.12451171875, -11.5751953125, -11.02587890625, -10.4765625, -9.92724609375, -9.3779296875, -8.82861328125, -8.279296875, -7.72998046875, -7.1806640625, -6.63134765625, -6.08203125, -5.53271484375, -4.9833984375, -4.43408203125, -3.884765625, -3.33544921875, -2.7861328125, -2.23681640625, -1.6875, -1.13818359375, -0.5888671875, -0.03955078125, 0.509765625, 1.05908203125, 1.6083984375, 2.15771484375, 2.70703125, 3.25634765625, 3.8056640625, 4.35498046875, 4.904296875, 5.45361328125, 6.0029296875, 6.55224609375, 7.1015625, 7.65087890625, 8.2001953125, 8.74951171875, 9.298828125, 9.84814453125, 10.3974609375, 10.94677734375, 11.49609375, 12.04541015625, 12.5947265625, 13.14404296875, 13.693359375, 14.24267578125, 14.7919921875, 15.34130859375, 15.890625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 5.0, 4.0, 5.0, 9.0, 10.0, 8.0, 10.0, 16.0, 17.0, 37.0, 24.0, 42.0, 55.0, 77.0, 99.0, 175.0, 342.0, 964.0, 5095.0, 283253.0, 2844649.0, 8375.0, 1362.0, 405.0, 228.0, 111.0, 85.0, 50.0, 41.0, 32.0, 38.0, 27.0, 16.0, 10.0, 8.0, 10.0, 6.0, 5.0, 9.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.03125, -24.171630859375, -23.31201171875, -22.452392578125, -21.5927734375, -20.733154296875, -19.87353515625, -19.013916015625, -18.154296875, -17.294677734375, -16.43505859375, -15.575439453125, -14.7158203125, -13.856201171875, -12.99658203125, -12.136962890625, -11.27734375, -10.417724609375, -9.55810546875, -8.698486328125, -7.8388671875, -6.979248046875, -6.11962890625, -5.260009765625, -4.400390625, -3.540771484375, -2.68115234375, -1.821533203125, -0.9619140625, -0.102294921875, 0.75732421875, 1.616943359375, 2.4765625, 3.336181640625, 4.19580078125, 5.055419921875, 5.9150390625, 6.774658203125, 7.63427734375, 8.493896484375, 9.353515625, 10.213134765625, 11.07275390625, 11.932373046875, 12.7919921875, 13.651611328125, 14.51123046875, 15.370849609375, 16.23046875, 17.090087890625, 17.94970703125, 18.809326171875, 19.6689453125, 20.528564453125, 21.38818359375, 22.247802734375, 23.107421875, 23.967041015625, 24.82666015625, 25.686279296875, 26.5458984375, 27.405517578125, 28.26513671875, 29.124755859375, 29.984375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [2.0, 1.0, 78.0, 555.0, 361.0, 21.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.706419944763184, -7.173535346984863, -4.640650749206543, -2.1077661514282227, 0.42511844635009766, 2.958003044128418, 5.490887641906738, 8.023772239685059, 10.556656837463379, 13.0895414352417, 15.62242603302002, 18.155311584472656, 20.688194274902344, 23.221080780029297, 25.753963470458984, 28.286849975585938, 30.819732666015625, 33.35261535644531, 35.885501861572266, 38.41838836669922, 40.951271057128906, 43.484153747558594, 46.01704025268555, 48.5499267578125, 51.08280944824219, 53.615692138671875, 56.14857864379883, 58.68146514892578, 61.21434783935547, 63.747230529785156, 66.28012084960938, 68.81300354003906, 71.34588623046875, 73.87876892089844, 76.41165161132812, 78.94454193115234, 81.47742462158203, 84.01030731201172, 86.54319763183594, 89.07608032226562, 91.60896301269531, 94.141845703125, 96.67472839355469, 99.2076187133789, 101.7405014038086, 104.27338409423828, 106.8062744140625, 109.33915710449219, 111.87203979492188, 114.40492248535156, 116.93780517578125, 119.47069549560547, 122.00357818603516, 124.53646087646484, 127.06935119628906, 129.60223388671875, 132.13511657714844, 134.66799926757812, 137.2008819580078, 139.7337646484375, 142.26666259765625, 144.79954528808594, 147.33242797851562, 149.8653106689453, 152.398193359375]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 13.0, 9.0, 8.0, 10.0, 8.0, 16.0, 22.0, 18.0, 30.0, 29.0, 27.0, 31.0, 40.0, 30.0, 39.0, 42.0, 44.0, 44.0, 47.0, 41.0, 45.0, 61.0, 57.0, 27.0, 32.0, 30.0, 30.0, 25.0, 29.0, 24.0, 12.0, 17.0, 13.0, 13.0, 7.0, 3.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.50505447387695, -48.863956451416016, -47.22285461425781, -45.581756591796875, -43.94065856933594, -42.299560546875, -40.6584587097168, -39.01736068725586, -37.37626266479492, -35.735164642333984, -34.09406280517578, -32.452964782714844, -30.811866760253906, -29.170766830444336, -27.529666900634766, -25.888568878173828, -24.247468948364258, -22.606369018554688, -20.96527099609375, -19.32417106628418, -17.683073043823242, -16.041973114013672, -14.400874137878418, -12.759775161743164, -11.11867618560791, -9.477577209472656, -7.836478233337402, -6.19537878036499, -4.554279804229736, -2.913180351257324, -1.2720813751220703, 0.3690176010131836, 2.0101165771484375, 3.6512155532836914, 5.292314529418945, 6.933413982391357, 8.574512481689453, 10.215612411499023, 11.856711387634277, 13.497810363769531, 15.138909339904785, 16.78000831604004, 18.42110824584961, 20.062206268310547, 21.703306198120117, 23.344406127929688, 24.985504150390625, 26.626602172851562, 28.267702102661133, 29.908802032470703, 31.54990005493164, 33.19099807739258, 34.83209991455078, 36.47319793701172, 38.114295959472656, 39.755393981933594, 41.3964958190918, 43.037593841552734, 44.67869567871094, 46.319793701171875, 47.96089172363281, 49.60198974609375, 51.24309158325195, 52.88418960571289, 54.52528762817383]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 8.0, 9.0, 8.0, 11.0, 13.0, 18.0, 14.0, 20.0, 16.0, 17.0, 34.0, 43.0, 26.0, 42.0, 43.0, 57.0, 41.0, 45.0, 46.0, 50.0, 41.0, 35.0, 45.0, 31.0, 34.0, 38.0, 32.0, 19.0, 22.0, 24.0, 18.0, 17.0, 10.0, 9.0, 13.0, 11.0, 6.0, 5.0, 6.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4609375, -4.32666015625, -4.1923828125, -4.05810546875, -3.923828125, -3.78955078125, -3.6552734375, -3.52099609375, -3.38671875, -3.25244140625, -3.1181640625, -2.98388671875, -2.849609375, -2.71533203125, -2.5810546875, -2.44677734375, -2.3125, -2.17822265625, -2.0439453125, -1.90966796875, -1.775390625, -1.64111328125, -1.5068359375, -1.37255859375, -1.23828125, -1.10400390625, -0.9697265625, -0.83544921875, -0.701171875, -0.56689453125, -0.4326171875, -0.29833984375, -0.1640625, -0.02978515625, 0.1044921875, 0.23876953125, 0.373046875, 0.50732421875, 0.6416015625, 0.77587890625, 0.91015625, 1.04443359375, 1.1787109375, 1.31298828125, 1.447265625, 1.58154296875, 1.7158203125, 1.85009765625, 1.984375, 2.11865234375, 2.2529296875, 2.38720703125, 2.521484375, 2.65576171875, 2.7900390625, 2.92431640625, 3.05859375, 3.19287109375, 3.3271484375, 3.46142578125, 3.595703125, 3.72998046875, 3.8642578125, 3.99853515625, 4.1328125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 7.0, 8.0, 12.0, 20.0, 28.0, 43.0, 46.0, 61.0, 93.0, 110.0, 168.0, 250.0, 362.0, 539.0, 726.0, 1136.0, 1713.0, 2542.0, 4223.0, 7002.0, 12309.0, 23572.0, 61232.0, 477667.0, 2889898.0, 579961.0, 72014.0, 25574.0, 13030.0, 7451.0, 4450.0, 2813.0, 1705.0, 1162.0, 722.0, 522.0, 340.0, 272.0, 145.0, 109.0, 76.0, 47.0, 32.0, 29.0, 21.0, 12.0, 12.0, 8.0, 2.0, 3.0, 1.0, 3.0, 1.0], "bins": [-11.5703125, -11.2447509765625, -10.919189453125, -10.5936279296875, -10.26806640625, -9.9425048828125, -9.616943359375, -9.2913818359375, -8.9658203125, -8.6402587890625, -8.314697265625, -7.9891357421875, -7.66357421875, -7.3380126953125, -7.012451171875, -6.6868896484375, -6.361328125, -6.0357666015625, -5.710205078125, -5.3846435546875, -5.05908203125, -4.7335205078125, -4.407958984375, -4.0823974609375, -3.7568359375, -3.4312744140625, -3.105712890625, -2.7801513671875, -2.45458984375, -2.1290283203125, -1.803466796875, -1.4779052734375, -1.15234375, -0.8267822265625, -0.501220703125, -0.1756591796875, 0.14990234375, 0.4754638671875, 0.801025390625, 1.1265869140625, 1.4521484375, 1.7777099609375, 2.103271484375, 2.4288330078125, 2.75439453125, 3.0799560546875, 3.405517578125, 3.7310791015625, 4.056640625, 4.3822021484375, 4.707763671875, 5.0333251953125, 5.35888671875, 5.6844482421875, 6.010009765625, 6.3355712890625, 6.6611328125, 6.9866943359375, 7.312255859375, 7.6378173828125, 7.96337890625, 8.2889404296875, 8.614501953125, 8.9400634765625, 9.265625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 1.0, 6.0, 8.0, 6.0, 16.0, 14.0, 16.0, 18.0, 11.0, 21.0, 36.0, 34.0, 49.0, 61.0, 73.0, 136.0, 207.0, 350.0, 582.0, 722.0, 563.0, 371.0, 226.0, 134.0, 85.0, 64.0, 50.0, 43.0, 32.0, 31.0, 26.0, 17.0, 13.0, 5.0, 10.0, 4.0, 8.0, 6.0, 7.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.53125, -11.1873779296875, -10.843505859375, -10.4996337890625, -10.15576171875, -9.8118896484375, -9.468017578125, -9.1241455078125, -8.7802734375, -8.4364013671875, -8.092529296875, -7.7486572265625, -7.40478515625, -7.0609130859375, -6.717041015625, -6.3731689453125, -6.029296875, -5.6854248046875, -5.341552734375, -4.9976806640625, -4.65380859375, -4.3099365234375, -3.966064453125, -3.6221923828125, -3.2783203125, -2.9344482421875, -2.590576171875, -2.2467041015625, -1.90283203125, -1.5589599609375, -1.215087890625, -0.8712158203125, -0.52734375, -0.1834716796875, 0.160400390625, 0.5042724609375, 0.84814453125, 1.1920166015625, 1.535888671875, 1.8797607421875, 2.2236328125, 2.5675048828125, 2.911376953125, 3.2552490234375, 3.59912109375, 3.9429931640625, 4.286865234375, 4.6307373046875, 4.974609375, 5.3184814453125, 5.662353515625, 6.0062255859375, 6.35009765625, 6.6939697265625, 7.037841796875, 7.3817138671875, 7.7255859375, 8.0694580078125, 8.413330078125, 8.7572021484375, 9.10107421875, 9.4449462890625, 9.788818359375, 10.1326904296875, 10.4765625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 7.0, 9.0, 13.0, 31.0, 50.0, 86.0, 133.0, 252.0, 456.0, 774.0, 1410.0, 2391.0, 4487.0, 8370.0, 16005.0, 33129.0, 78197.0, 336758.0, 2812588.0, 704921.0, 109840.0, 42362.0, 19953.0, 10102.0, 5363.0, 2895.0, 1592.0, 884.0, 467.0, 329.0, 160.0, 114.0, 54.0, 39.0, 16.0, 20.0, 7.0, 12.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7421875, -12.2454833984375, -11.748779296875, -11.2520751953125, -10.75537109375, -10.2586669921875, -9.761962890625, -9.2652587890625, -8.7685546875, -8.2718505859375, -7.775146484375, -7.2784423828125, -6.78173828125, -6.2850341796875, -5.788330078125, -5.2916259765625, -4.794921875, -4.2982177734375, -3.801513671875, -3.3048095703125, -2.80810546875, -2.3114013671875, -1.814697265625, -1.3179931640625, -0.8212890625, -0.3245849609375, 0.172119140625, 0.6688232421875, 1.16552734375, 1.6622314453125, 2.158935546875, 2.6556396484375, 3.15234375, 3.6490478515625, 4.145751953125, 4.6424560546875, 5.13916015625, 5.6358642578125, 6.132568359375, 6.6292724609375, 7.1259765625, 7.6226806640625, 8.119384765625, 8.6160888671875, 9.11279296875, 9.6094970703125, 10.106201171875, 10.6029052734375, 11.099609375, 11.5963134765625, 12.093017578125, 12.5897216796875, 13.08642578125, 13.5831298828125, 14.079833984375, 14.5765380859375, 15.0732421875, 15.5699462890625, 16.066650390625, 16.5633544921875, 17.06005859375, 17.5567626953125, 18.053466796875, 18.5501708984375, 19.046875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 4.0, 6.0, 11.0, 13.0, 17.0, 21.0, 47.0, 64.0, 92.0, 139.0, 108.0, 133.0, 101.0, 78.0, 60.0, 34.0, 21.0, 20.0, 11.0, 10.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-93.07738494873047, -91.0455093383789, -89.01364135742188, -86.98176574707031, -84.94989776611328, -82.91802215576172, -80.88615417480469, -78.85427856445312, -76.82240295410156, -74.79052734375, -72.75865936279297, -70.7267837524414, -68.69491577148438, -66.66304016113281, -64.63116455078125, -62.59929656982422, -60.56742477416992, -58.535552978515625, -56.50368118286133, -54.47180938720703, -52.43993377685547, -50.40806198120117, -48.376190185546875, -46.34431838989258, -44.31244659423828, -42.280574798583984, -40.24870300292969, -38.216827392578125, -36.18495559692383, -34.15308380126953, -32.121212005615234, -30.089340209960938, -28.05746078491211, -26.025588989257812, -23.993715286254883, -21.961843490600586, -19.929969787597656, -17.89809799194336, -15.866226196289062, -13.83435344696045, -11.802480697631836, -9.770607948303223, -7.738735675811768, -5.7068634033203125, -3.674990653991699, -1.643117904663086, 0.38875389099121094, 2.420626640319824, 4.4524993896484375, 6.484372138977051, 8.516244888305664, 10.548116683959961, 12.579989433288574, 14.611862182617188, 16.643733978271484, 18.67560577392578, 20.70747947692871, 22.739351272583008, 24.771224975585938, 26.803096771240234, 28.83496856689453, 30.86684226989746, 32.898712158203125, 34.93058776855469, 36.962459564208984]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 15.0, 10.0, 6.0, 10.0, 15.0, 12.0, 23.0, 25.0, 24.0, 27.0, 25.0, 31.0, 29.0, 35.0, 44.0, 35.0, 40.0, 41.0, 35.0, 37.0, 46.0, 45.0, 39.0, 33.0, 39.0, 47.0, 35.0, 30.0, 23.0, 21.0, 18.0, 18.0, 17.0, 11.0, 11.0, 14.0, 10.0, 11.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-41.79270935058594, -40.66359329223633, -39.53447341918945, -38.405357360839844, -37.27623748779297, -36.14712142944336, -35.01800537109375, -33.888885498046875, -32.759769439697266, -31.630651473999023, -30.50153350830078, -29.372417449951172, -28.24329948425293, -27.114181518554688, -25.985063552856445, -24.855945587158203, -23.72682762145996, -22.59770965576172, -21.468591690063477, -20.339473724365234, -19.210357666015625, -18.081239700317383, -16.95212173461914, -15.823003768920898, -14.693886756896973, -13.56476879119873, -12.435651779174805, -11.306533813476562, -10.17741584777832, -9.048298835754395, -7.919180870056152, -6.790063381195068, -5.660945892333984, -4.5318284034729, -3.4027106761932373, -2.273592948913574, -1.1444754600524902, -0.01535797119140625, 1.113759994506836, 2.24287748336792, 3.371994972229004, 4.501112461090088, 5.630229949951172, 6.759347915649414, 7.888465404510498, 9.017582893371582, 10.146700859069824, 11.27581787109375, 12.404935836791992, 13.534053802490234, 14.66317081451416, 15.792288780212402, 16.921405792236328, 18.05052375793457, 19.179641723632812, 20.308759689331055, 21.437877655029297, 22.56699562072754, 23.69611358642578, 24.82522964477539, 25.954347610473633, 27.083465576171875, 28.212583541870117, 29.34170150756836, 30.47081756591797]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 4.0, 2.0, 7.0, 5.0, 9.0, 7.0, 23.0, 21.0, 18.0, 12.0, 20.0, 31.0, 29.0, 41.0, 35.0, 44.0, 33.0, 50.0, 50.0, 54.0, 44.0, 45.0, 44.0, 48.0, 43.0, 38.0, 30.0, 37.0, 22.0, 24.0, 16.0, 27.0, 21.0, 15.0, 10.0, 4.0, 8.0, 7.0, 6.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.98828125, -4.8446044921875, -4.700927734375, -4.5572509765625, -4.41357421875, -4.2698974609375, -4.126220703125, -3.9825439453125, -3.8388671875, -3.6951904296875, -3.551513671875, -3.4078369140625, -3.26416015625, -3.1204833984375, -2.976806640625, -2.8331298828125, -2.689453125, -2.5457763671875, -2.402099609375, -2.2584228515625, -2.11474609375, -1.9710693359375, -1.827392578125, -1.6837158203125, -1.5400390625, -1.3963623046875, -1.252685546875, -1.1090087890625, -0.96533203125, -0.8216552734375, -0.677978515625, -0.5343017578125, -0.390625, -0.2469482421875, -0.103271484375, 0.0404052734375, 0.18408203125, 0.3277587890625, 0.471435546875, 0.6151123046875, 0.7587890625, 0.9024658203125, 1.046142578125, 1.1898193359375, 1.33349609375, 1.4771728515625, 1.620849609375, 1.7645263671875, 1.908203125, 2.0518798828125, 2.195556640625, 2.3392333984375, 2.48291015625, 2.6265869140625, 2.770263671875, 2.9139404296875, 3.0576171875, 3.2012939453125, 3.344970703125, 3.4886474609375, 3.63232421875, 3.7760009765625, 3.919677734375, 4.0633544921875, 4.20703125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 3.0, 5.0, 9.0, 18.0, 18.0, 24.0, 47.0, 68.0, 80.0, 119.0, 191.0, 247.0, 445.0, 644.0, 1034.0, 1591.0, 2662.0, 4189.0, 6840.0, 11641.0, 20344.0, 36698.0, 69608.0, 139366.0, 306871.0, 222974.0, 102228.0, 52635.0, 28047.0, 15872.0, 9178.0, 5523.0, 3341.0, 2063.0, 1285.0, 871.0, 586.0, 398.0, 287.0, 150.0, 101.0, 98.0, 51.0, 42.0, 24.0, 10.0, 15.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2137451171875, -0.20741844177246094, -0.20109176635742188, -0.1947650909423828, -0.18843841552734375, -0.1821117401123047, -0.17578506469726562, -0.16945838928222656, -0.1631317138671875, -0.15680503845214844, -0.15047836303710938, -0.1441516876220703, -0.13782501220703125, -0.1314983367919922, -0.12517166137695312, -0.11884498596191406, -0.112518310546875, -0.10619163513183594, -0.09986495971679688, -0.09353828430175781, -0.08721160888671875, -0.08088493347167969, -0.07455825805664062, -0.06823158264160156, -0.0619049072265625, -0.05557823181152344, -0.049251556396484375, -0.04292488098144531, -0.03659820556640625, -0.030271530151367188, -0.023944854736328125, -0.017618179321289062, -0.01129150390625, -0.0049648284912109375, 0.001361846923828125, 0.0076885223388671875, 0.01401519775390625, 0.020341873168945312, 0.026668548583984375, 0.03299522399902344, 0.0393218994140625, 0.04564857482910156, 0.051975250244140625, 0.05830192565917969, 0.06462860107421875, 0.07095527648925781, 0.07728195190429688, 0.08360862731933594, 0.089935302734375, 0.09626197814941406, 0.10258865356445312, 0.10891532897949219, 0.11524200439453125, 0.12156867980957031, 0.12789535522460938, 0.13422203063964844, 0.1405487060546875, 0.14687538146972656, 0.15320205688476562, 0.1595287322998047, 0.16585540771484375, 0.1721820831298828, 0.17850875854492188, 0.18483543395996094, 0.191162109375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 7.0, 0.0, 3.0, 2.0, 9.0, 9.0, 6.0, 18.0, 14.0, 12.0, 24.0, 12.0, 19.0, 14.0, 25.0, 33.0, 37.0, 34.0, 27.0, 38.0, 40.0, 40.0, 42.0, 33.0, 1056.0, 50.0, 31.0, 32.0, 36.0, 23.0, 31.0, 30.0, 24.0, 28.0, 22.0, 22.0, 20.0, 25.0, 19.0, 15.0, 18.0, 10.0, 8.0, 10.0, 8.0, 8.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.39453125, -2.31005859375, -2.2255859375, -2.14111328125, -2.056640625, -1.97216796875, -1.8876953125, -1.80322265625, -1.71875, -1.63427734375, -1.5498046875, -1.46533203125, -1.380859375, -1.29638671875, -1.2119140625, -1.12744140625, -1.04296875, -0.95849609375, -0.8740234375, -0.78955078125, -0.705078125, -0.62060546875, -0.5361328125, -0.45166015625, -0.3671875, -0.28271484375, -0.1982421875, -0.11376953125, -0.029296875, 0.05517578125, 0.1396484375, 0.22412109375, 0.30859375, 0.39306640625, 0.4775390625, 0.56201171875, 0.646484375, 0.73095703125, 0.8154296875, 0.89990234375, 0.984375, 1.06884765625, 1.1533203125, 1.23779296875, 1.322265625, 1.40673828125, 1.4912109375, 1.57568359375, 1.66015625, 1.74462890625, 1.8291015625, 1.91357421875, 1.998046875, 2.08251953125, 2.1669921875, 2.25146484375, 2.3359375, 2.42041015625, 2.5048828125, 2.58935546875, 2.673828125, 2.75830078125, 2.8427734375, 2.92724609375, 3.01171875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 2.0, 6.0, 10.0, 7.0, 15.0, 15.0, 33.0, 54.0, 78.0, 136.0, 178.0, 278.0, 380.0, 547.0, 752.0, 1136.0, 1655.0, 2538.0, 3671.0, 5436.0, 8248.0, 12738.0, 19812.0, 30941.0, 49019.0, 78612.0, 130237.0, 1264701.0, 187489.0, 110952.0, 67545.0, 42326.0, 26635.0, 17440.0, 11213.0, 7199.0, 4963.0, 3279.0, 2157.0, 1471.0, 1039.0, 680.0, 483.0, 332.0, 231.0, 172.0, 99.0, 62.0, 38.0, 35.0, 25.0, 12.0, 9.0, 3.0, 8.0, 4.0, 1.0, 4.0, 0.0, 3.0], "bins": [-0.11883544921875, -0.11510372161865234, -0.11137199401855469, -0.10764026641845703, -0.10390853881835938, -0.10017681121826172, -0.09644508361816406, -0.0927133560180664, -0.08898162841796875, -0.0852499008178711, -0.08151817321777344, -0.07778644561767578, -0.07405471801757812, -0.07032299041748047, -0.06659126281738281, -0.06285953521728516, -0.0591278076171875, -0.055396080017089844, -0.05166435241699219, -0.04793262481689453, -0.044200897216796875, -0.04046916961669922, -0.03673744201660156, -0.033005714416503906, -0.02927398681640625, -0.025542259216308594, -0.021810531616210938, -0.01807880401611328, -0.014347076416015625, -0.010615348815917969, -0.0068836212158203125, -0.0031518936157226562, 0.000579833984375, 0.004311561584472656, 0.008043289184570312, 0.011775016784667969, 0.015506744384765625, 0.01923847198486328, 0.022970199584960938, 0.026701927185058594, 0.03043365478515625, 0.034165382385253906, 0.03789710998535156, 0.04162883758544922, 0.045360565185546875, 0.04909229278564453, 0.05282402038574219, 0.056555747985839844, 0.0602874755859375, 0.06401920318603516, 0.06775093078613281, 0.07148265838623047, 0.07521438598632812, 0.07894611358642578, 0.08267784118652344, 0.0864095687866211, 0.09014129638671875, 0.0938730239868164, 0.09760475158691406, 0.10133647918701172, 0.10506820678710938, 0.10879993438720703, 0.11253166198730469, 0.11626338958740234, 0.1199951171875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 7.0, 8.0, 7.0, 9.0, 5.0, 16.0, 17.0, 21.0, 29.0, 43.0, 50.0, 72.0, 101.0, 123.0, 128.0, 92.0, 61.0, 53.0, 39.0, 27.0, 16.0, 14.0, 10.0, 11.0, 8.0, 3.0, 5.0, 6.0, 3.0, 7.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0002942085266113281, -0.0002866499125957489, -0.0002790912985801697, -0.00027153268456459045, -0.00026397407054901123, -0.000256415456533432, -0.0002488568425178528, -0.00024129822850227356, -0.00023373961448669434, -0.0002261810004711151, -0.0002186223864555359, -0.00021106377243995667, -0.00020350515842437744, -0.00019594654440879822, -0.000188387930393219, -0.00018082931637763977, -0.00017327070236206055, -0.00016571208834648132, -0.0001581534743309021, -0.00015059486031532288, -0.00014303624629974365, -0.00013547763228416443, -0.0001279190182685852, -0.00012036040425300598, -0.00011280179023742676, -0.00010524317622184753, -9.768456220626831e-05, -9.012594819068909e-05, -8.256733417510986e-05, -7.500872015953064e-05, -6.745010614395142e-05, -5.989149212837219e-05, -5.233287811279297e-05, -4.4774264097213745e-05, -3.721565008163452e-05, -2.9657036066055298e-05, -2.2098422050476074e-05, -1.453980803489685e-05, -6.981194019317627e-06, 5.774199962615967e-07, 8.13603401184082e-06, 1.5694648027420044e-05, 2.3253262042999268e-05, 3.081187605857849e-05, 3.8370490074157715e-05, 4.592910408973694e-05, 5.348771810531616e-05, 6.104633212089539e-05, 6.860494613647461e-05, 7.616356015205383e-05, 8.372217416763306e-05, 9.128078818321228e-05, 9.88394021987915e-05, 0.00010639801621437073, 0.00011395663022994995, 0.00012151524424552917, 0.0001290738582611084, 0.00013663247227668762, 0.00014419108629226685, 0.00015174970030784607, 0.0001593083143234253, 0.00016686692833900452, 0.00017442554235458374, 0.00018198415637016296, 0.0001895427703857422]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 7.0, 3.0, 8.0, 5.0, 10.0, 10.0, 11.0, 15.0, 28.0, 41.0, 46.0, 87.0, 178.0, 299.0, 730.0, 2614.0, 25632.0, 927766.0, 84161.0, 4984.0, 1045.0, 356.0, 179.0, 116.0, 67.0, 43.0, 32.0, 22.0, 13.0, 11.0, 14.0, 3.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025768280029296875, -0.0024836957454681396, -0.002390563488006592, -0.002297431230545044, -0.002204298973083496, -0.0021111667156219482, -0.0020180344581604004, -0.0019249022006988525, -0.0018317699432373047, -0.0017386376857757568, -0.001645505428314209, -0.0015523731708526611, -0.0014592409133911133, -0.0013661086559295654, -0.0012729763984680176, -0.0011798441410064697, -0.0010867118835449219, -0.000993579626083374, -0.0009004473686218262, -0.0008073151111602783, -0.0007141828536987305, -0.0006210505962371826, -0.0005279183387756348, -0.0004347860813140869, -0.00034165382385253906, -0.0002485215663909912, -0.00015538930892944336, -6.225705146789551e-05, 3.0875205993652344e-05, 0.0001240074634552002, 0.00021713972091674805, 0.0003102719783782959, 0.00040340423583984375, 0.0004965364933013916, 0.0005896687507629395, 0.0006828010082244873, 0.0007759332656860352, 0.000869065523147583, 0.0009621977806091309, 0.0010553300380706787, 0.0011484622955322266, 0.0012415945529937744, 0.0013347268104553223, 0.0014278590679168701, 0.001520991325378418, 0.0016141235828399658, 0.0017072558403015137, 0.0018003880977630615, 0.0018935203552246094, 0.0019866526126861572, 0.002079784870147705, 0.002172917127609253, 0.0022660493850708008, 0.0023591816425323486, 0.0024523138999938965, 0.0025454461574554443, 0.002638578414916992, 0.00273171067237854, 0.002824842929840088, 0.0029179751873016357, 0.0030111074447631836, 0.0031042397022247314, 0.0031973719596862793, 0.003290504217147827, 0.003383636474609375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 6.0, 19.0, 67.0, 276.0, 450.0, 142.0, 38.0, 9.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016187355504371226, -0.00014212331734597683, -0.0001223730796482414, -0.00010262283467454836, -8.287259697681293e-05, -6.31223592790775e-05, -4.337211430538446e-05, -2.3621876607649028e-05, -3.8716389099135995e-06, 1.5878600606811233e-05, 3.5628840123536065e-05, 5.53790814592503e-05, 7.512931915698573e-05, 9.487955685472116e-05, 0.0001146298018284142, 0.00013438003952614963, 0.00015413027722388506, 0.0001738805149216205, 0.00019363075261935592, 0.00021338099031709135, 0.00023313122801482677, 0.0002528814657125622, 0.00027263170341029763, 0.0002923819702118635, 0.0003121321788057685, 0.0003318824165035039, 0.00035163265420123935, 0.0003713828918989748, 0.0003911331295967102, 0.00041088336729444563, 0.00043063360499218106, 0.00045038387179374695, 0.00047013413859531283, 0.0004898844053968787, 0.0005096346139907837, 0.0005293848807923496, 0.0005491350893862545, 0.0005688853561878204, 0.0005886355647817254, 0.0006083858315832913, 0.0006281360401771963, 0.0006478863069787621, 0.0006676365155726671, 0.000687386782374233, 0.000707136990968138, 0.0007268872577697039, 0.0007466374663636088, 0.0007663877331651747, 0.0007861379999667406, 0.0008058882667683065, 0.0008256384753622115, 0.0008453887421637774, 0.0008651389507576823, 0.0008848892175592482, 0.0009046394261531532, 0.0009243896929547191, 0.000944139901548624, 0.0009638901683501899, 0.0009836404351517558, 0.0010033906437456608, 0.0010231408523395658, 0.0010428910609334707, 0.0010626413859426975, 0.0010823915945366025, 0.0011021418031305075]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 4.0, 7.0, 8.0, 9.0, 12.0, 12.0, 17.0, 14.0, 19.0, 19.0, 27.0, 26.0, 32.0, 52.0, 36.0, 33.0, 42.0, 31.0, 43.0, 51.0, 42.0, 47.0, 38.0, 52.0, 35.0, 34.0, 45.0, 26.0, 26.0, 28.0, 18.0, 17.0, 18.0, 16.0, 14.0, 14.0, 13.0, 9.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.781122207641602e-05, -9.447243064641953e-05, -9.113363921642303e-05, -8.779484778642654e-05, -8.445605635643005e-05, -8.111726492643356e-05, -7.777847349643707e-05, -7.443968206644058e-05, -7.110089063644409e-05, -6.77620992064476e-05, -6.442330777645111e-05, -6.108451634645462e-05, -5.774572491645813e-05, -5.440693348646164e-05, -5.106814205646515e-05, -4.772935062646866e-05, -4.439055919647217e-05, -4.105176776647568e-05, -3.771297633647919e-05, -3.4374184906482697e-05, -3.1035393476486206e-05, -2.7696602046489716e-05, -2.4357810616493225e-05, -2.1019019186496735e-05, -1.7680227756500244e-05, -1.4341436326503754e-05, -1.1002644896507263e-05, -7.663853466510773e-06, -4.325062036514282e-06, -9.862706065177917e-07, 2.3525208234786987e-06, 5.691312253475189e-06, 9.03010368347168e-06, 1.236889511346817e-05, 1.570768654346466e-05, 1.904647797346115e-05, 2.238526940345764e-05, 2.5724060833454132e-05, 2.9062852263450623e-05, 3.240164369344711e-05, 3.5740435123443604e-05, 3.9079226553440094e-05, 4.2418017983436584e-05, 4.5756809413433075e-05, 4.9095600843429565e-05, 5.2434392273426056e-05, 5.5773183703422546e-05, 5.911197513341904e-05, 6.245076656341553e-05, 6.578955799341202e-05, 6.912834942340851e-05, 7.2467140853405e-05, 7.580593228340149e-05, 7.914472371339798e-05, 8.248351514339447e-05, 8.582230657339096e-05, 8.916109800338745e-05, 9.249988943338394e-05, 9.583868086338043e-05, 9.917747229337692e-05, 0.00010251626372337341, 0.0001058550551533699, 0.0001091938465833664, 0.00011253263801336288, 0.00011587142944335938]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 4.0, 2.0, 7.0, 5.0, 9.0, 7.0, 23.0, 21.0, 18.0, 12.0, 20.0, 31.0, 29.0, 41.0, 35.0, 44.0, 33.0, 50.0, 50.0, 54.0, 44.0, 45.0, 44.0, 48.0, 43.0, 38.0, 30.0, 37.0, 22.0, 24.0, 16.0, 27.0, 21.0, 15.0, 10.0, 4.0, 8.0, 7.0, 6.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.98828125, -4.8446044921875, -4.700927734375, -4.5572509765625, -4.41357421875, -4.2698974609375, -4.126220703125, -3.9825439453125, -3.8388671875, -3.6951904296875, -3.551513671875, -3.4078369140625, -3.26416015625, -3.1204833984375, -2.976806640625, -2.8331298828125, -2.689453125, -2.5457763671875, -2.402099609375, -2.2584228515625, -2.11474609375, -1.9710693359375, -1.827392578125, -1.6837158203125, -1.5400390625, -1.3963623046875, -1.252685546875, -1.1090087890625, -0.96533203125, -0.8216552734375, -0.677978515625, -0.5343017578125, -0.390625, -0.2469482421875, -0.103271484375, 0.0404052734375, 0.18408203125, 0.3277587890625, 0.471435546875, 0.6151123046875, 0.7587890625, 0.9024658203125, 1.046142578125, 1.1898193359375, 1.33349609375, 1.4771728515625, 1.620849609375, 1.7645263671875, 1.908203125, 2.0518798828125, 2.195556640625, 2.3392333984375, 2.48291015625, 2.6265869140625, 2.770263671875, 2.9139404296875, 3.0576171875, 3.2012939453125, 3.344970703125, 3.4886474609375, 3.63232421875, 3.7760009765625, 3.919677734375, 4.0633544921875, 4.20703125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 5.0, 9.0, 6.0, 13.0, 17.0, 19.0, 22.0, 38.0, 68.0, 86.0, 114.0, 165.0, 214.0, 289.0, 437.0, 634.0, 830.0, 1219.0, 1826.0, 2722.0, 4598.0, 11805.0, 59921.0, 406844.0, 459695.0, 69979.0, 13049.0, 4990.0, 2812.0, 1863.0, 1228.0, 893.0, 607.0, 395.0, 339.0, 212.0, 159.0, 113.0, 72.0, 63.0, 38.0, 38.0, 24.0, 19.0, 15.0, 11.0, 8.0, 14.0, 4.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.80078125, -4.6461181640625, -4.491455078125, -4.3367919921875, -4.18212890625, -4.0274658203125, -3.872802734375, -3.7181396484375, -3.5634765625, -3.4088134765625, -3.254150390625, -3.0994873046875, -2.94482421875, -2.7901611328125, -2.635498046875, -2.4808349609375, -2.326171875, -2.1715087890625, -2.016845703125, -1.8621826171875, -1.70751953125, -1.5528564453125, -1.398193359375, -1.2435302734375, -1.0888671875, -0.9342041015625, -0.779541015625, -0.6248779296875, -0.47021484375, -0.3155517578125, -0.160888671875, -0.0062255859375, 0.1484375, 0.3031005859375, 0.457763671875, 0.6124267578125, 0.76708984375, 0.9217529296875, 1.076416015625, 1.2310791015625, 1.3857421875, 1.5404052734375, 1.695068359375, 1.8497314453125, 2.00439453125, 2.1590576171875, 2.313720703125, 2.4683837890625, 2.623046875, 2.7777099609375, 2.932373046875, 3.0870361328125, 3.24169921875, 3.3963623046875, 3.551025390625, 3.7056884765625, 3.8603515625, 4.0150146484375, 4.169677734375, 4.3243408203125, 4.47900390625, 4.6336669921875, 4.788330078125, 4.9429931640625, 5.09765625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 5.0, 9.0, 13.0, 17.0, 23.0, 13.0, 18.0, 28.0, 32.0, 38.0, 36.0, 43.0, 58.0, 62.0, 70.0, 96.0, 1735.0, 257.0, 57.0, 63.0, 58.0, 49.0, 48.0, 32.0, 29.0, 24.0, 25.0, 21.0, 20.0, 15.0, 15.0, 4.0, 8.0, 8.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.796875, -16.213134765625, -15.62939453125, -15.045654296875, -14.4619140625, -13.878173828125, -13.29443359375, -12.710693359375, -12.126953125, -11.543212890625, -10.95947265625, -10.375732421875, -9.7919921875, -9.208251953125, -8.62451171875, -8.040771484375, -7.45703125, -6.873291015625, -6.28955078125, -5.705810546875, -5.1220703125, -4.538330078125, -3.95458984375, -3.370849609375, -2.787109375, -2.203369140625, -1.61962890625, -1.035888671875, -0.4521484375, 0.131591796875, 0.71533203125, 1.299072265625, 1.8828125, 2.466552734375, 3.05029296875, 3.634033203125, 4.2177734375, 4.801513671875, 5.38525390625, 5.968994140625, 6.552734375, 7.136474609375, 7.72021484375, 8.303955078125, 8.8876953125, 9.471435546875, 10.05517578125, 10.638916015625, 11.22265625, 11.806396484375, 12.39013671875, 12.973876953125, 13.5576171875, 14.141357421875, 14.72509765625, 15.308837890625, 15.892578125, 16.476318359375, 17.06005859375, 17.643798828125, 18.2275390625, 18.811279296875, 19.39501953125, 19.978759765625, 20.5625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 13.0, 21.0, 25.0, 35.0, 60.0, 101.0, 218.0, 569.0, 1675.0, 15076.0, 3101025.0, 23599.0, 2161.0, 597.0, 240.0, 117.0, 62.0, 50.0, 26.0, 18.0, 9.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.59375, -45.8671875, -44.140625, -42.4140625, -40.6875, -38.9609375, -37.234375, -35.5078125, -33.78125, -32.0546875, -30.328125, -28.6015625, -26.875, -25.1484375, -23.421875, -21.6953125, -19.96875, -18.2421875, -16.515625, -14.7890625, -13.0625, -11.3359375, -9.609375, -7.8828125, -6.15625, -4.4296875, -2.703125, -0.9765625, 0.75, 2.4765625, 4.203125, 5.9296875, 7.65625, 9.3828125, 11.109375, 12.8359375, 14.5625, 16.2890625, 18.015625, 19.7421875, 21.46875, 23.1953125, 24.921875, 26.6484375, 28.375, 30.1015625, 31.828125, 33.5546875, 35.28125, 37.0078125, 38.734375, 40.4609375, 42.1875, 43.9140625, 45.640625, 47.3671875, 49.09375, 50.8203125, 52.546875, 54.2734375, 56.0, 57.7265625, 59.453125, 61.1796875, 62.90625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 16.0, 810.0, 189.0, 2.0, 2.0, 1.0], "bins": [-646.9931640625, -636.1585693359375, -625.3239135742188, -614.4893188476562, -603.6547241210938, -592.820068359375, -581.9854736328125, -571.15087890625, -560.3162841796875, -549.481689453125, -538.6470336914062, -527.8124389648438, -516.9778442382812, -506.1432189941406, -495.30859375, -484.4739990234375, -473.63934326171875, -462.8047180175781, -451.9701232910156, -441.135498046875, -430.3009033203125, -419.4662780761719, -408.63165283203125, -397.79705810546875, -386.9624328613281, -376.1278076171875, -365.293212890625, -354.4585876464844, -343.62396240234375, -332.78936767578125, -321.9547424316406, -311.1201171875, -300.2854919433594, -289.45086669921875, -278.61627197265625, -267.7816467285156, -256.947021484375, -246.1124267578125, -235.27780151367188, -224.4431915283203, -213.60858154296875, -202.7739715576172, -191.93936157226562, -181.104736328125, -170.27012634277344, -159.43551635742188, -148.60089111328125, -137.7662811279297, -126.93167114257812, -116.09706115722656, -105.26244354248047, -94.42782592773438, -83.59321594238281, -72.75860595703125, -61.923988342285156, -51.08937072753906, -40.2547607421875, -29.420146942138672, -18.585533142089844, -7.750919342041016, 3.0836944580078125, 13.91830825805664, 24.75292205810547, 35.58753967285156, 46.422149658203125]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 6.0, 8.0, 3.0, 5.0, 10.0, 11.0, 9.0, 13.0, 16.0, 21.0, 18.0, 19.0, 22.0, 20.0, 22.0, 23.0, 38.0, 32.0, 30.0, 32.0, 37.0, 36.0, 41.0, 32.0, 38.0, 28.0, 39.0, 43.0, 34.0, 25.0, 42.0, 38.0, 25.0, 27.0, 18.0, 22.0, 11.0, 18.0, 10.0, 9.0, 13.0, 11.0, 9.0, 8.0, 4.0, 5.0, 10.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-46.1485595703125, -44.679508209228516, -43.210453033447266, -41.74140167236328, -40.27234649658203, -38.80329513549805, -37.33424377441406, -35.86518859863281, -34.39613342285156, -32.92708206176758, -31.458026885986328, -29.988975524902344, -28.519920349121094, -27.05086898803711, -25.581815719604492, -24.112762451171875, -22.64371109008789, -21.174657821655273, -19.705604553222656, -18.236553192138672, -16.767498016357422, -15.298445701599121, -13.82939338684082, -12.360340118408203, -10.891286849975586, -9.422233581542969, -7.95318078994751, -6.484127998352051, -5.015074729919434, -3.5460214614868164, -2.0769691467285156, -0.6079158782958984, 0.8611335754394531, 2.330186605453491, 3.7992396354675293, 5.268292427062988, 6.7373456954956055, 8.206398963928223, 9.675451278686523, 11.14450454711914, 12.613557815551758, 14.082611083984375, 15.551664352416992, 17.02071762084961, 18.489768981933594, 19.958824157714844, 21.427875518798828, 22.896928787231445, 24.365982055664062, 25.83503532409668, 27.304088592529297, 28.77313995361328, 30.24219512939453, 31.711246490478516, 33.1802978515625, 34.64935302734375, 36.118408203125, 37.587459564208984, 39.056514739990234, 40.52556610107422, 41.99462127685547, 43.46367263793945, 44.93272399902344, 46.40177917480469, 47.87083053588867]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 4.0, 3.0, 7.0, 5.0, 13.0, 18.0, 16.0, 20.0, 22.0, 14.0, 16.0, 38.0, 29.0, 47.0, 52.0, 37.0, 41.0, 54.0, 49.0, 49.0, 41.0, 41.0, 44.0, 44.0, 36.0, 42.0, 28.0, 34.0, 27.0, 27.0, 21.0, 16.0, 12.0, 10.0, 8.0, 5.0, 5.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2734375, -5.11822509765625, -4.9630126953125, -4.80780029296875, -4.652587890625, -4.49737548828125, -4.3421630859375, -4.18695068359375, -4.03173828125, -3.87652587890625, -3.7213134765625, -3.56610107421875, -3.410888671875, -3.25567626953125, -3.1004638671875, -2.94525146484375, -2.7900390625, -2.63482666015625, -2.4796142578125, -2.32440185546875, -2.169189453125, -2.01397705078125, -1.8587646484375, -1.70355224609375, -1.54833984375, -1.39312744140625, -1.2379150390625, -1.08270263671875, -0.927490234375, -0.77227783203125, -0.6170654296875, -0.46185302734375, -0.306640625, -0.15142822265625, 0.0037841796875, 0.15899658203125, 0.314208984375, 0.46942138671875, 0.6246337890625, 0.77984619140625, 0.93505859375, 1.09027099609375, 1.2454833984375, 1.40069580078125, 1.555908203125, 1.71112060546875, 1.8663330078125, 2.02154541015625, 2.1767578125, 2.33197021484375, 2.4871826171875, 2.64239501953125, 2.797607421875, 2.95281982421875, 3.1080322265625, 3.26324462890625, 3.41845703125, 3.57366943359375, 3.7288818359375, 3.88409423828125, 4.039306640625, 4.19451904296875, 4.3497314453125, 4.50494384765625, 4.66015625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 14.0, 15.0, 19.0, 19.0, 41.0, 44.0, 69.0, 136.0, 238.0, 318.0, 564.0, 947.0, 1766.0, 3385.0, 6371.0, 13043.0, 30565.0, 122735.0, 2230547.0, 1626561.0, 102866.0, 28354.0, 12456.0, 6029.0, 3199.0, 1705.0, 988.0, 514.0, 286.0, 198.0, 106.0, 64.0, 37.0, 19.0, 15.0, 10.0, 10.0, 6.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.9453125, -15.513671875, -15.08203125, -14.650390625, -14.21875, -13.787109375, -13.35546875, -12.923828125, -12.4921875, -12.060546875, -11.62890625, -11.197265625, -10.765625, -10.333984375, -9.90234375, -9.470703125, -9.0390625, -8.607421875, -8.17578125, -7.744140625, -7.3125, -6.880859375, -6.44921875, -6.017578125, -5.5859375, -5.154296875, -4.72265625, -4.291015625, -3.859375, -3.427734375, -2.99609375, -2.564453125, -2.1328125, -1.701171875, -1.26953125, -0.837890625, -0.40625, 0.025390625, 0.45703125, 0.888671875, 1.3203125, 1.751953125, 2.18359375, 2.615234375, 3.046875, 3.478515625, 3.91015625, 4.341796875, 4.7734375, 5.205078125, 5.63671875, 6.068359375, 6.5, 6.931640625, 7.36328125, 7.794921875, 8.2265625, 8.658203125, 9.08984375, 9.521484375, 9.953125, 10.384765625, 10.81640625, 11.248046875, 11.6796875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 7.0, 11.0, 13.0, 29.0, 46.0, 41.0, 63.0, 99.0, 170.0, 281.0, 493.0, 838.0, 890.0, 505.0, 209.0, 131.0, 66.0, 45.0, 46.0, 34.0, 18.0, 7.0, 10.0, 6.0, 2.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4609375, -9.9364013671875, -9.411865234375, -8.8873291015625, -8.36279296875, -7.8382568359375, -7.313720703125, -6.7891845703125, -6.2646484375, -5.7401123046875, -5.215576171875, -4.6910400390625, -4.16650390625, -3.6419677734375, -3.117431640625, -2.5928955078125, -2.068359375, -1.5438232421875, -1.019287109375, -0.4947509765625, 0.02978515625, 0.5543212890625, 1.078857421875, 1.6033935546875, 2.1279296875, 2.6524658203125, 3.177001953125, 3.7015380859375, 4.22607421875, 4.7506103515625, 5.275146484375, 5.7996826171875, 6.32421875, 6.8487548828125, 7.373291015625, 7.8978271484375, 8.42236328125, 8.9468994140625, 9.471435546875, 9.9959716796875, 10.5205078125, 11.0450439453125, 11.569580078125, 12.0941162109375, 12.61865234375, 13.1431884765625, 13.667724609375, 14.1922607421875, 14.716796875, 15.2413330078125, 15.765869140625, 16.2904052734375, 16.81494140625, 17.3394775390625, 17.864013671875, 18.3885498046875, 18.9130859375, 19.4376220703125, 19.962158203125, 20.4866943359375, 21.01123046875, 21.5357666015625, 22.060302734375, 22.5848388671875, 23.109375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 7.0, 10.0, 11.0, 11.0, 14.0, 43.0, 47.0, 56.0, 126.0, 230.0, 458.0, 791.0, 1721.0, 3832.0, 8869.0, 23981.0, 72591.0, 428616.0, 3221012.0, 331526.0, 63966.0, 21263.0, 8263.0, 3484.0, 1634.0, 763.0, 423.0, 214.0, 121.0, 66.0, 49.0, 24.0, 21.0, 10.0, 9.0, 11.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-25.703125, -25.03466796875, -24.3662109375, -23.69775390625, -23.029296875, -22.36083984375, -21.6923828125, -21.02392578125, -20.35546875, -19.68701171875, -19.0185546875, -18.35009765625, -17.681640625, -17.01318359375, -16.3447265625, -15.67626953125, -15.0078125, -14.33935546875, -13.6708984375, -13.00244140625, -12.333984375, -11.66552734375, -10.9970703125, -10.32861328125, -9.66015625, -8.99169921875, -8.3232421875, -7.65478515625, -6.986328125, -6.31787109375, -5.6494140625, -4.98095703125, -4.3125, -3.64404296875, -2.9755859375, -2.30712890625, -1.638671875, -0.97021484375, -0.3017578125, 0.36669921875, 1.03515625, 1.70361328125, 2.3720703125, 3.04052734375, 3.708984375, 4.37744140625, 5.0458984375, 5.71435546875, 6.3828125, 7.05126953125, 7.7197265625, 8.38818359375, 9.056640625, 9.72509765625, 10.3935546875, 11.06201171875, 11.73046875, 12.39892578125, 13.0673828125, 13.73583984375, 14.404296875, 15.07275390625, 15.7412109375, 16.40966796875, 17.078125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 12.0, 13.0, 16.0, 62.0, 105.0, 182.0, 252.0, 174.0, 105.0, 41.0, 21.0, 9.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.0196533203125, -138.1363067626953, -134.25296020507812, -130.36962890625, -126.48627471923828, -122.60293579101562, -118.71958923339844, -114.83624267578125, -110.9529037475586, -107.0695571899414, -103.18621826171875, -99.30287170410156, -95.41952514648438, -91.53618621826172, -87.65283966064453, -83.76950073242188, -79.88615417480469, -76.0028076171875, -72.11946868896484, -68.23612213134766, -64.35277557373047, -60.46943664550781, -56.586090087890625, -52.7027473449707, -48.81939697265625, -44.93605422973633, -41.05270767211914, -37.16936492919922, -33.2860221862793, -29.402677536010742, -25.519332885742188, -21.635990142822266, -17.752647399902344, -13.869303703308105, -9.985960006713867, -6.1026153564453125, -2.219271659851074, 1.664072036743164, 5.547416687011719, 9.43075942993164, 13.314104080200195, 17.19744873046875, 21.080791473388672, 24.964136123657227, 28.84748077392578, 32.7308235168457, 36.614166259765625, 40.49751281738281, 44.380855560302734, 48.264198303222656, 52.147544860839844, 56.030887603759766, 59.91423034667969, 63.797576904296875, 67.68092346191406, 71.56426239013672, 75.4476089477539, 79.3309555053711, 83.21429443359375, 87.09764099121094, 90.98098754882812, 94.86432647705078, 98.74767303466797, 102.63101196289062, 106.51435852050781]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 7.0, 10.0, 8.0, 10.0, 24.0, 14.0, 25.0, 21.0, 28.0, 22.0, 35.0, 37.0, 37.0, 46.0, 47.0, 59.0, 48.0, 46.0, 51.0, 53.0, 42.0, 52.0, 43.0, 41.0, 28.0, 32.0, 19.0, 35.0, 20.0, 19.0, 6.0, 9.0, 11.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.46049499511719, -48.06324768066406, -46.66600036621094, -45.26875305175781, -43.87150573730469, -42.47425842285156, -41.07701110839844, -39.67976760864258, -38.28252029418945, -36.88527297973633, -35.4880256652832, -34.09077835083008, -32.69353103637695, -31.29628562927246, -29.899038314819336, -28.501792907714844, -27.104543685913086, -25.70729637145996, -24.310049057006836, -22.912803649902344, -21.51555633544922, -20.118309020996094, -18.72106170654297, -17.323814392089844, -15.926568031311035, -14.52932071685791, -13.132074356079102, -11.734827041625977, -10.337579727172852, -8.940333366394043, -7.543086051940918, -6.145839691162109, -4.748592376708984, -3.3513455390930176, -1.9540984630584717, -0.5568513870239258, 0.840395450592041, 2.237642288208008, 3.634889602661133, 5.032135963439941, 6.429383277893066, 7.826630115509033, 9.223876953125, 10.621124267578125, 12.01837158203125, 13.415617942810059, 14.812865257263184, 16.210111618041992, 17.607358932495117, 19.004606246948242, 20.401853561401367, 21.79909896850586, 23.196346282958984, 24.59359359741211, 25.990840911865234, 27.38808822631836, 28.785335540771484, 30.18258285522461, 31.579830169677734, 32.97707748413086, 34.374324798583984, 35.771568298339844, 37.16881561279297, 38.566062927246094, 39.96331024169922]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 3.0, 5.0, 9.0, 7.0, 6.0, 7.0, 8.0, 16.0, 17.0, 14.0, 10.0, 23.0, 24.0, 39.0, 33.0, 35.0, 32.0, 32.0, 43.0, 46.0, 48.0, 48.0, 37.0, 33.0, 45.0, 43.0, 35.0, 30.0, 35.0, 32.0, 33.0, 33.0, 28.0, 16.0, 17.0, 14.0, 12.0, 11.0, 7.0, 7.0, 4.0, 8.0, 8.0, 5.0, 0.0, 1.0, 3.0, 1.0, 3.0], "bins": [-5.2265625, -5.084686279296875, -4.94281005859375, -4.800933837890625, -4.6590576171875, -4.517181396484375, -4.37530517578125, -4.233428955078125, -4.091552734375, -3.949676513671875, -3.80780029296875, -3.665924072265625, -3.5240478515625, -3.382171630859375, -3.24029541015625, -3.098419189453125, -2.95654296875, -2.814666748046875, -2.67279052734375, -2.530914306640625, -2.3890380859375, -2.247161865234375, -2.10528564453125, -1.963409423828125, -1.821533203125, -1.679656982421875, -1.53778076171875, -1.395904541015625, -1.2540283203125, -1.112152099609375, -0.97027587890625, -0.828399658203125, -0.6865234375, -0.544647216796875, -0.40277099609375, -0.260894775390625, -0.1190185546875, 0.022857666015625, 0.16473388671875, 0.306610107421875, 0.448486328125, 0.590362548828125, 0.73223876953125, 0.874114990234375, 1.0159912109375, 1.157867431640625, 1.29974365234375, 1.441619873046875, 1.58349609375, 1.725372314453125, 1.86724853515625, 2.009124755859375, 2.1510009765625, 2.292877197265625, 2.43475341796875, 2.576629638671875, 2.718505859375, 2.860382080078125, 3.00225830078125, 3.144134521484375, 3.2860107421875, 3.427886962890625, 3.56976318359375, 3.711639404296875, 3.853515625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 9.0, 8.0, 12.0, 14.0, 19.0, 30.0, 40.0, 50.0, 101.0, 136.0, 190.0, 285.0, 433.0, 656.0, 1017.0, 1503.0, 2344.0, 3727.0, 5727.0, 9282.0, 14688.0, 24444.0, 40896.0, 72008.0, 133755.0, 266930.0, 214884.0, 107377.0, 58795.0, 34236.0, 20567.0, 12577.0, 7773.0, 4966.0, 3122.0, 1994.0, 1278.0, 873.0, 573.0, 386.0, 263.0, 179.0, 123.0, 87.0, 57.0, 44.0, 32.0, 17.0, 18.0, 16.0, 5.0, 5.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1832275390625, -0.17728424072265625, -0.1713409423828125, -0.16539764404296875, -0.159454345703125, -0.15351104736328125, -0.1475677490234375, -0.14162445068359375, -0.13568115234375, -0.12973785400390625, -0.1237945556640625, -0.11785125732421875, -0.111907958984375, -0.10596466064453125, -0.1000213623046875, -0.09407806396484375, -0.088134765625, -0.08219146728515625, -0.0762481689453125, -0.07030487060546875, -0.064361572265625, -0.05841827392578125, -0.0524749755859375, -0.04653167724609375, -0.04058837890625, -0.03464508056640625, -0.0287017822265625, -0.02275848388671875, -0.016815185546875, -0.01087188720703125, -0.0049285888671875, 0.00101470947265625, 0.0069580078125, 0.01290130615234375, 0.0188446044921875, 0.02478790283203125, 0.030731201171875, 0.03667449951171875, 0.0426177978515625, 0.04856109619140625, 0.05450439453125, 0.06044769287109375, 0.0663909912109375, 0.07233428955078125, 0.078277587890625, 0.08422088623046875, 0.0901641845703125, 0.09610748291015625, 0.10205078125, 0.10799407958984375, 0.1139373779296875, 0.11988067626953125, 0.125823974609375, 0.13176727294921875, 0.1377105712890625, 0.14365386962890625, 0.14959716796875, 0.15554046630859375, 0.1614837646484375, 0.16742706298828125, 0.173370361328125, 0.17931365966796875, 0.1852569580078125, 0.19120025634765625, 0.1971435546875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 4.0, 4.0, 6.0, 4.0, 9.0, 16.0, 11.0, 17.0, 14.0, 13.0, 27.0, 25.0, 26.0, 31.0, 27.0, 39.0, 36.0, 45.0, 28.0, 45.0, 52.0, 1053.0, 53.0, 39.0, 38.0, 39.0, 35.0, 34.0, 25.0, 27.0, 31.0, 24.0, 16.0, 17.0, 15.0, 17.0, 17.0, 16.0, 9.0, 10.0, 7.0, 4.0, 11.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.09765625, -3.003631591796875, -2.90960693359375, -2.815582275390625, -2.7215576171875, -2.627532958984375, -2.53350830078125, -2.439483642578125, -2.345458984375, -2.251434326171875, -2.15740966796875, -2.063385009765625, -1.9693603515625, -1.875335693359375, -1.78131103515625, -1.687286376953125, -1.59326171875, -1.499237060546875, -1.40521240234375, -1.311187744140625, -1.2171630859375, -1.123138427734375, -1.02911376953125, -0.935089111328125, -0.841064453125, -0.747039794921875, -0.65301513671875, -0.558990478515625, -0.4649658203125, -0.370941162109375, -0.27691650390625, -0.182891845703125, -0.0888671875, 0.005157470703125, 0.09918212890625, 0.193206787109375, 0.2872314453125, 0.381256103515625, 0.47528076171875, 0.569305419921875, 0.663330078125, 0.757354736328125, 0.85137939453125, 0.945404052734375, 1.0394287109375, 1.133453369140625, 1.22747802734375, 1.321502685546875, 1.41552734375, 1.509552001953125, 1.60357666015625, 1.697601318359375, 1.7916259765625, 1.885650634765625, 1.97967529296875, 2.073699951171875, 2.167724609375, 2.261749267578125, 2.35577392578125, 2.449798583984375, 2.5438232421875, 2.637847900390625, 2.73187255859375, 2.825897216796875, 2.919921875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 10.0, 10.0, 17.0, 22.0, 29.0, 39.0, 33.0, 61.0, 67.0, 110.0, 173.0, 226.0, 338.0, 422.0, 589.0, 822.0, 1189.0, 1543.0, 2245.0, 3225.0, 4684.0, 6693.0, 10218.0, 15150.0, 22858.0, 34778.0, 53615.0, 83440.0, 130572.0, 1243267.0, 168573.0, 108663.0, 69560.0, 44566.0, 29465.0, 18924.0, 12711.0, 8697.0, 5850.0, 3990.0, 2738.0, 1966.0, 1388.0, 1029.0, 694.0, 501.0, 372.0, 269.0, 192.0, 155.0, 108.0, 92.0, 52.0, 46.0, 32.0, 25.0, 12.0, 10.0, 8.0, 6.0, 2.0, 4.0], "bins": [-0.1121826171875, -0.10865402221679688, -0.10512542724609375, -0.10159683227539062, -0.0980682373046875, -0.09453964233398438, -0.09101104736328125, -0.08748245239257812, -0.083953857421875, -0.08042526245117188, -0.07689666748046875, -0.07336807250976562, -0.0698394775390625, -0.06631088256835938, -0.06278228759765625, -0.059253692626953125, -0.05572509765625, -0.052196502685546875, -0.04866790771484375, -0.045139312744140625, -0.0416107177734375, -0.038082122802734375, -0.03455352783203125, -0.031024932861328125, -0.027496337890625, -0.023967742919921875, -0.02043914794921875, -0.016910552978515625, -0.0133819580078125, -0.009853363037109375, -0.00632476806640625, -0.002796173095703125, 0.000732421875, 0.004261016845703125, 0.00778961181640625, 0.011318206787109375, 0.0148468017578125, 0.018375396728515625, 0.02190399169921875, 0.025432586669921875, 0.028961181640625, 0.032489776611328125, 0.03601837158203125, 0.039546966552734375, 0.0430755615234375, 0.046604156494140625, 0.05013275146484375, 0.053661346435546875, 0.05718994140625, 0.060718536376953125, 0.06424713134765625, 0.06777572631835938, 0.0713043212890625, 0.07483291625976562, 0.07836151123046875, 0.08189010620117188, 0.085418701171875, 0.08894729614257812, 0.09247589111328125, 0.09600448608398438, 0.0995330810546875, 0.10306167602539062, 0.10659027099609375, 0.11011886596679688, 0.1136474609375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 2.0, 8.0, 10.0, 8.0, 11.0, 24.0, 18.0, 24.0, 24.0, 25.0, 22.0, 37.0, 53.0, 58.0, 55.0, 106.0, 106.0, 85.0, 52.0, 38.0, 37.0, 25.0, 13.0, 32.0, 18.0, 14.0, 15.0, 9.0, 9.0, 9.0, 6.0, 8.0, 3.0, 5.0, 3.0, 1.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0001595020294189453, -0.0001546330749988556, -0.00014976412057876587, -0.00014489516615867615, -0.00014002621173858643, -0.0001351572573184967, -0.00013028830289840698, -0.00012541934847831726, -0.00012055039405822754, -0.00011568143963813782, -0.0001108124852180481, -0.00010594353079795837, -0.00010107457637786865, -9.620562195777893e-05, -9.133666753768921e-05, -8.646771311759949e-05, -8.159875869750977e-05, -7.672980427742004e-05, -7.186084985733032e-05, -6.69918954372406e-05, -6.212294101715088e-05, -5.725398659706116e-05, -5.2385032176971436e-05, -4.7516077756881714e-05, -4.264712333679199e-05, -3.777816891670227e-05, -3.290921449661255e-05, -2.8040260076522827e-05, -2.3171305656433105e-05, -1.8302351236343384e-05, -1.3433396816253662e-05, -8.56444239616394e-06, -3.6954879760742188e-06, 1.173466444015503e-06, 6.042420864105225e-06, 1.0911375284194946e-05, 1.5780329704284668e-05, 2.064928412437439e-05, 2.551823854446411e-05, 3.0387192964553833e-05, 3.5256147384643555e-05, 4.0125101804733276e-05, 4.4994056224823e-05, 4.986301064491272e-05, 5.473196506500244e-05, 5.960091948509216e-05, 6.446987390518188e-05, 6.93388283252716e-05, 7.420778274536133e-05, 7.907673716545105e-05, 8.394569158554077e-05, 8.881464600563049e-05, 9.368360042572021e-05, 9.855255484580994e-05, 0.00010342150926589966, 0.00010829046368598938, 0.0001131594181060791, 0.00011802837252616882, 0.00012289732694625854, 0.00012776628136634827, 0.000132635235786438, 0.0001375041902065277, 0.00014237314462661743, 0.00014724209904670715, 0.00015211105346679688]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 5.0, 5.0, 6.0, 10.0, 10.0, 13.0, 9.0, 21.0, 21.0, 39.0, 37.0, 72.0, 93.0, 200.0, 467.0, 1709.0, 10384.0, 185124.0, 821212.0, 24631.0, 3088.0, 736.0, 253.0, 126.0, 71.0, 58.0, 38.0, 19.0, 22.0, 21.0, 18.0, 4.0, 13.0, 4.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002338409423828125, -0.0022634267807006836, -0.002188444137573242, -0.0021134614944458008, -0.0020384788513183594, -0.001963496208190918, -0.0018885135650634766, -0.0018135309219360352, -0.0017385482788085938, -0.0016635656356811523, -0.001588582992553711, -0.0015136003494262695, -0.0014386177062988281, -0.0013636350631713867, -0.0012886524200439453, -0.001213669776916504, -0.0011386871337890625, -0.001063704490661621, -0.0009887218475341797, -0.0009137392044067383, -0.0008387565612792969, -0.0007637739181518555, -0.0006887912750244141, -0.0006138086318969727, -0.0005388259887695312, -0.00046384334564208984, -0.00038886070251464844, -0.00031387805938720703, -0.00023889541625976562, -0.00016391277313232422, -8.893013000488281e-05, -1.3947486877441406e-05, 6.103515625e-05, 0.0001360177993774414, 0.0002110004425048828, 0.0002859830856323242, 0.0003609657287597656, 0.00043594837188720703, 0.0005109310150146484, 0.0005859136581420898, 0.0006608963012695312, 0.0007358789443969727, 0.0008108615875244141, 0.0008858442306518555, 0.0009608268737792969, 0.0010358095169067383, 0.0011107921600341797, 0.001185774803161621, 0.0012607574462890625, 0.001335740089416504, 0.0014107227325439453, 0.0014857053756713867, 0.0015606880187988281, 0.0016356706619262695, 0.001710653305053711, 0.0017856359481811523, 0.0018606185913085938, 0.0019356012344360352, 0.0020105838775634766, 0.002085566520690918, 0.0021605491638183594, 0.0022355318069458008, 0.002310514450073242, 0.0023854970932006836, 0.002460479736328125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 4.0, 16.0, 24.0, 33.0, 73.0, 112.0, 201.0, 217.0, 141.0, 73.0, 46.0, 24.0, 13.0, 13.0, 8.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011385445395717397, -0.00010680659033823758, -9.975873399525881e-05, -9.271087037632242e-05, -8.566300675738603e-05, -7.861515041440725e-05, -7.156728679547086e-05, -6.451942317653447e-05, -5.747156319557689e-05, -5.042370321461931e-05, -4.337583959568292e-05, -3.6327979614725336e-05, -2.928011781477835e-05, -2.2232256014831364e-05, -1.5184396033873782e-05, -8.136532414937392e-06, -1.0886724339798093e-06, 5.959188911219826e-06, 1.3007050256419461e-05, 2.0054911146871746e-05, 2.7102772946818732e-05, 3.415063474676572e-05, 4.11984947277233e-05, 4.824635834665969e-05, 5.529421832761727e-05, 6.234207830857486e-05, 6.938994192751125e-05, 7.643780554644763e-05, 8.348566188942641e-05, 9.05335255083628e-05, 9.758138912729919e-05, 0.00010462924547027797, 0.00011167711636517197, 0.00011872497998410836, 0.00012577284360304475, 0.00013282069994602352, 0.0001398685562890023, 0.0001469164271838963, 0.00015396428352687508, 0.00016101213986985385, 0.00016806001076474786, 0.00017510786710772663, 0.00018215573800262064, 0.0001892035943455994, 0.0001962514506885782, 0.0002032993215834722, 0.00021034717792645097, 0.00021739504882134497, 0.00022444289061240852, 0.0002314907469553873, 0.0002385386178502813, 0.0002455864741932601, 0.0002526343450881541, 0.0002596821868792176, 0.00026673005777411163, 0.00027377792866900563, 0.00028082579956389964, 0.00028787367045879364, 0.0002949215122498572, 0.0003019693831447512, 0.0003090172540396452, 0.00031606509583070874, 0.00032311296672560275, 0.00033016083762049675, 0.0003372086794115603]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 3.0, 10.0, 13.0, 11.0, 6.0, 18.0, 11.0, 25.0, 17.0, 22.0, 32.0, 21.0, 38.0, 40.0, 28.0, 37.0, 41.0, 49.0, 32.0, 52.0, 53.0, 40.0, 41.0, 35.0, 35.0, 36.0, 33.0, 18.0, 26.0, 28.0, 27.0, 12.0, 24.0, 10.0, 12.0, 10.0, 18.0, 4.0, 8.0, 4.0, 4.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-7.528066635131836e-05, -7.275864481925964e-05, -7.023662328720093e-05, -6.771460175514221e-05, -6.51925802230835e-05, -6.267055869102478e-05, -6.0148537158966064e-05, -5.762651562690735e-05, -5.510449409484863e-05, -5.258247256278992e-05, -5.00604510307312e-05, -4.7538429498672485e-05, -4.501640796661377e-05, -4.2494386434555054e-05, -3.997236490249634e-05, -3.745034337043762e-05, -3.4928321838378906e-05, -3.240630030632019e-05, -2.9884278774261475e-05, -2.736225724220276e-05, -2.4840235710144043e-05, -2.2318214178085327e-05, -1.979619264602661e-05, -1.7274171113967896e-05, -1.475214958190918e-05, -1.2230128049850464e-05, -9.708106517791748e-06, -7.186084985733032e-06, -4.664063453674316e-06, -2.1420419216156006e-06, 3.7997961044311523e-07, 2.902001142501831e-06, 5.424022674560547e-06, 7.946044206619263e-06, 1.0468065738677979e-05, 1.2990087270736694e-05, 1.551210880279541e-05, 1.8034130334854126e-05, 2.0556151866912842e-05, 2.3078173398971558e-05, 2.5600194931030273e-05, 2.812221646308899e-05, 3.0644237995147705e-05, 3.316625952720642e-05, 3.568828105926514e-05, 3.821030259132385e-05, 4.073232412338257e-05, 4.3254345655441284e-05, 4.57763671875e-05, 4.8298388719558716e-05, 5.082041025161743e-05, 5.334243178367615e-05, 5.586445331573486e-05, 5.838647484779358e-05, 6.0908496379852295e-05, 6.343051791191101e-05, 6.595253944396973e-05, 6.847456097602844e-05, 7.099658250808716e-05, 7.351860404014587e-05, 7.604062557220459e-05, 7.85626471042633e-05, 8.108466863632202e-05, 8.360669016838074e-05, 8.612871170043945e-05]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 3.0, 5.0, 9.0, 7.0, 6.0, 7.0, 8.0, 16.0, 17.0, 14.0, 10.0, 23.0, 24.0, 39.0, 33.0, 35.0, 32.0, 32.0, 43.0, 46.0, 48.0, 48.0, 37.0, 33.0, 45.0, 43.0, 35.0, 30.0, 35.0, 32.0, 33.0, 33.0, 28.0, 16.0, 17.0, 14.0, 12.0, 11.0, 7.0, 7.0, 4.0, 8.0, 8.0, 5.0, 0.0, 1.0, 3.0, 1.0, 3.0], "bins": [-5.2265625, -5.084686279296875, -4.94281005859375, -4.800933837890625, -4.6590576171875, -4.517181396484375, -4.37530517578125, -4.233428955078125, -4.091552734375, -3.949676513671875, -3.80780029296875, -3.665924072265625, -3.5240478515625, -3.382171630859375, -3.24029541015625, -3.098419189453125, -2.95654296875, -2.814666748046875, -2.67279052734375, -2.530914306640625, -2.3890380859375, -2.247161865234375, -2.10528564453125, -1.963409423828125, -1.821533203125, -1.679656982421875, -1.53778076171875, -1.395904541015625, -1.2540283203125, -1.112152099609375, -0.97027587890625, -0.828399658203125, -0.6865234375, -0.544647216796875, -0.40277099609375, -0.260894775390625, -0.1190185546875, 0.022857666015625, 0.16473388671875, 0.306610107421875, 0.448486328125, 0.590362548828125, 0.73223876953125, 0.874114990234375, 1.0159912109375, 1.157867431640625, 1.29974365234375, 1.441619873046875, 1.58349609375, 1.725372314453125, 1.86724853515625, 2.009124755859375, 2.1510009765625, 2.292877197265625, 2.43475341796875, 2.576629638671875, 2.718505859375, 2.860382080078125, 3.00225830078125, 3.144134521484375, 3.2860107421875, 3.427886962890625, 3.56976318359375, 3.711639404296875, 3.853515625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 5.0, 3.0, 11.0, 14.0, 18.0, 28.0, 38.0, 37.0, 58.0, 92.0, 128.0, 187.0, 257.0, 402.0, 496.0, 707.0, 1014.0, 1462.0, 2046.0, 2997.0, 4598.0, 7960.0, 16416.0, 48710.0, 229572.0, 569385.0, 104650.0, 27810.0, 11354.0, 6037.0, 3722.0, 2462.0, 1676.0, 1198.0, 877.0, 592.0, 446.0, 306.0, 211.0, 170.0, 114.0, 76.0, 67.0, 38.0, 39.0, 20.0, 16.0, 13.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.5859375, -5.39508056640625, -5.2042236328125, -5.01336669921875, -4.822509765625, -4.63165283203125, -4.4407958984375, -4.24993896484375, -4.05908203125, -3.86822509765625, -3.6773681640625, -3.48651123046875, -3.295654296875, -3.10479736328125, -2.9139404296875, -2.72308349609375, -2.5322265625, -2.34136962890625, -2.1505126953125, -1.95965576171875, -1.768798828125, -1.57794189453125, -1.3870849609375, -1.19622802734375, -1.00537109375, -0.81451416015625, -0.6236572265625, -0.43280029296875, -0.241943359375, -0.05108642578125, 0.1397705078125, 0.33062744140625, 0.521484375, 0.71234130859375, 0.9031982421875, 1.09405517578125, 1.284912109375, 1.47576904296875, 1.6666259765625, 1.85748291015625, 2.04833984375, 2.23919677734375, 2.4300537109375, 2.62091064453125, 2.811767578125, 3.00262451171875, 3.1934814453125, 3.38433837890625, 3.5751953125, 3.76605224609375, 3.9569091796875, 4.14776611328125, 4.338623046875, 4.52947998046875, 4.7203369140625, 4.91119384765625, 5.10205078125, 5.29290771484375, 5.4837646484375, 5.67462158203125, 5.865478515625, 6.05633544921875, 6.2471923828125, 6.43804931640625, 6.62890625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 6.0, 3.0, 7.0, 8.0, 10.0, 12.0, 11.0, 15.0, 19.0, 25.0, 15.0, 19.0, 27.0, 36.0, 17.0, 28.0, 38.0, 38.0, 42.0, 54.0, 109.0, 403.0, 1526.0, 113.0, 59.0, 52.0, 42.0, 39.0, 38.0, 35.0, 26.0, 21.0, 25.0, 25.0, 22.0, 12.0, 7.0, 10.0, 14.0, 6.0, 8.0, 7.0, 6.0, 5.0, 4.0, 0.0, 6.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.8515625, -14.3880615234375, -13.924560546875, -13.4610595703125, -12.99755859375, -12.5340576171875, -12.070556640625, -11.6070556640625, -11.1435546875, -10.6800537109375, -10.216552734375, -9.7530517578125, -9.28955078125, -8.8260498046875, -8.362548828125, -7.8990478515625, -7.435546875, -6.9720458984375, -6.508544921875, -6.0450439453125, -5.58154296875, -5.1180419921875, -4.654541015625, -4.1910400390625, -3.7275390625, -3.2640380859375, -2.800537109375, -2.3370361328125, -1.87353515625, -1.4100341796875, -0.946533203125, -0.4830322265625, -0.01953125, 0.4439697265625, 0.907470703125, 1.3709716796875, 1.83447265625, 2.2979736328125, 2.761474609375, 3.2249755859375, 3.6884765625, 4.1519775390625, 4.615478515625, 5.0789794921875, 5.54248046875, 6.0059814453125, 6.469482421875, 6.9329833984375, 7.396484375, 7.8599853515625, 8.323486328125, 8.7869873046875, 9.25048828125, 9.7139892578125, 10.177490234375, 10.6409912109375, 11.1044921875, 11.5679931640625, 12.031494140625, 12.4949951171875, 12.95849609375, 13.4219970703125, 13.885498046875, 14.3489990234375, 14.8125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 6.0, 8.0, 10.0, 13.0, 7.0, 18.0, 19.0, 17.0, 28.0, 51.0, 75.0, 75.0, 145.0, 245.0, 584.0, 1842.0, 9979.0, 2141678.0, 979225.0, 8748.0, 1647.0, 564.0, 240.0, 136.0, 105.0, 47.0, 54.0, 38.0, 24.0, 19.0, 15.0, 12.0, 9.0, 7.0, 1.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.625, -37.5205078125, -36.416015625, -35.3115234375, -34.20703125, -33.1025390625, -31.998046875, -30.8935546875, -29.7890625, -28.6845703125, -27.580078125, -26.4755859375, -25.37109375, -24.2666015625, -23.162109375, -22.0576171875, -20.953125, -19.8486328125, -18.744140625, -17.6396484375, -16.53515625, -15.4306640625, -14.326171875, -13.2216796875, -12.1171875, -11.0126953125, -9.908203125, -8.8037109375, -7.69921875, -6.5947265625, -5.490234375, -4.3857421875, -3.28125, -2.1767578125, -1.072265625, 0.0322265625, 1.13671875, 2.2412109375, 3.345703125, 4.4501953125, 5.5546875, 6.6591796875, 7.763671875, 8.8681640625, 9.97265625, 11.0771484375, 12.181640625, 13.2861328125, 14.390625, 15.4951171875, 16.599609375, 17.7041015625, 18.80859375, 19.9130859375, 21.017578125, 22.1220703125, 23.2265625, 24.3310546875, 25.435546875, 26.5400390625, 27.64453125, 28.7490234375, 29.853515625, 30.9580078125, 32.0625]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 111.0, 459.0, 369.0, 61.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.85890197753906, -134.0025634765625, -131.14620971679688, -128.28985595703125, -125.43351745605469, -122.5771713256836, -119.7208251953125, -116.8644790649414, -114.00813293457031, -111.15178680419922, -108.29544067382812, -105.43909454345703, -102.58274841308594, -99.72640228271484, -96.87005615234375, -94.01371002197266, -91.15736389160156, -88.30101776123047, -85.44467163085938, -82.58832550048828, -79.73197937011719, -76.8756332397461, -74.019287109375, -71.1629409790039, -68.30659484863281, -65.45024871826172, -62.593902587890625, -59.73755645751953, -56.88121032714844, -54.024864196777344, -51.16851806640625, -48.312171936035156, -45.4558219909668, -42.5994758605957, -39.74312973022461, -36.886783599853516, -34.03043746948242, -31.174091339111328, -28.317745208740234, -25.46139907836914, -22.605052947998047, -19.748706817626953, -16.89236068725586, -14.036014556884766, -11.179668426513672, -8.323322296142578, -5.466976165771484, -2.6106300354003906, 0.24571609497070312, 3.102062225341797, 5.958408355712891, 8.814754486083984, 11.671100616455078, 14.527446746826172, 17.383792877197266, 20.24013900756836, 23.096485137939453, 25.952831268310547, 28.80917739868164, 31.665523529052734, 34.52186965942383, 37.37821578979492, 40.234561920166016, 43.09090805053711, 45.9472541809082]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 2.0, 8.0, 12.0, 10.0, 12.0, 15.0, 22.0, 29.0, 33.0, 25.0, 32.0, 39.0, 44.0, 38.0, 35.0, 43.0, 57.0, 48.0, 39.0, 39.0, 36.0, 39.0, 45.0, 29.0, 40.0, 33.0, 23.0, 22.0, 17.0, 19.0, 26.0, 19.0, 9.0, 8.0, 6.0, 8.0, 7.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.24293899536133, -46.78824996948242, -45.33356475830078, -43.878875732421875, -42.42418670654297, -40.96949768066406, -39.514808654785156, -38.060123443603516, -36.60543441772461, -35.1507453918457, -33.69606018066406, -32.241371154785156, -30.78668212890625, -29.331993103027344, -27.87730598449707, -26.422618865966797, -24.96792984008789, -23.513240814208984, -22.05855369567871, -20.603866577148438, -19.14917755126953, -17.694488525390625, -16.23980140686035, -14.785113334655762, -13.330425262451172, -11.875737190246582, -10.421049118041992, -8.966361045837402, -7.5116729736328125, -6.056984901428223, -4.602296829223633, -3.147608757019043, -1.6929168701171875, -0.23822879791259766, 1.2164592742919922, 2.671147346496582, 4.125835418701172, 5.580523490905762, 7.035211563110352, 8.489899635314941, 9.944587707519531, 11.399275779724121, 12.853963851928711, 14.3086519241333, 15.76333999633789, 17.218029022216797, 18.67271614074707, 20.127403259277344, 21.58209228515625, 23.036781311035156, 24.49146842956543, 25.946155548095703, 27.40084457397461, 28.855533599853516, 30.31022071838379, 31.764907836914062, 33.21959686279297, 34.674285888671875, 36.12897491455078, 37.58366012573242, 39.03834915161133, 40.493038177490234, 41.947723388671875, 43.40241241455078, 44.85710144042969]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 7.0, 8.0, 7.0, 5.0, 10.0, 16.0, 14.0, 14.0, 20.0, 22.0, 30.0, 38.0, 28.0, 36.0, 31.0, 45.0, 44.0, 42.0, 45.0, 46.0, 36.0, 47.0, 39.0, 33.0, 36.0, 38.0, 37.0, 25.0, 38.0, 31.0, 23.0, 17.0, 15.0, 14.0, 13.0, 7.0, 8.0, 8.0, 6.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0], "bins": [-5.5546875, -5.40655517578125, -5.2584228515625, -5.11029052734375, -4.962158203125, -4.81402587890625, -4.6658935546875, -4.51776123046875, -4.36962890625, -4.22149658203125, -4.0733642578125, -3.92523193359375, -3.777099609375, -3.62896728515625, -3.4808349609375, -3.33270263671875, -3.1845703125, -3.03643798828125, -2.8883056640625, -2.74017333984375, -2.592041015625, -2.44390869140625, -2.2957763671875, -2.14764404296875, -1.99951171875, -1.85137939453125, -1.7032470703125, -1.55511474609375, -1.406982421875, -1.25885009765625, -1.1107177734375, -0.96258544921875, -0.814453125, -0.66632080078125, -0.5181884765625, -0.37005615234375, -0.221923828125, -0.07379150390625, 0.0743408203125, 0.22247314453125, 0.37060546875, 0.51873779296875, 0.6668701171875, 0.81500244140625, 0.963134765625, 1.11126708984375, 1.2593994140625, 1.40753173828125, 1.5556640625, 1.70379638671875, 1.8519287109375, 2.00006103515625, 2.148193359375, 2.29632568359375, 2.4444580078125, 2.59259033203125, 2.74072265625, 2.88885498046875, 3.0369873046875, 3.18511962890625, 3.333251953125, 3.48138427734375, 3.6295166015625, 3.77764892578125, 3.92578125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 6.0, 6.0, 10.0, 24.0, 22.0, 39.0, 50.0, 68.0, 74.0, 130.0, 226.0, 252.0, 402.0, 567.0, 845.0, 1317.0, 1963.0, 3028.0, 4859.0, 8149.0, 14453.0, 27759.0, 82219.0, 655214.0, 2616167.0, 623517.0, 86876.0, 29310.0, 14692.0, 8432.0, 4958.0, 2996.0, 1974.0, 1249.0, 813.0, 508.0, 380.0, 228.0, 177.0, 98.0, 73.0, 48.0, 33.0, 29.0, 17.0, 8.0, 7.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.4765625, -10.1728515625, -9.869140625, -9.5654296875, -9.26171875, -8.9580078125, -8.654296875, -8.3505859375, -8.046875, -7.7431640625, -7.439453125, -7.1357421875, -6.83203125, -6.5283203125, -6.224609375, -5.9208984375, -5.6171875, -5.3134765625, -5.009765625, -4.7060546875, -4.40234375, -4.0986328125, -3.794921875, -3.4912109375, -3.1875, -2.8837890625, -2.580078125, -2.2763671875, -1.97265625, -1.6689453125, -1.365234375, -1.0615234375, -0.7578125, -0.4541015625, -0.150390625, 0.1533203125, 0.45703125, 0.7607421875, 1.064453125, 1.3681640625, 1.671875, 1.9755859375, 2.279296875, 2.5830078125, 2.88671875, 3.1904296875, 3.494140625, 3.7978515625, 4.1015625, 4.4052734375, 4.708984375, 5.0126953125, 5.31640625, 5.6201171875, 5.923828125, 6.2275390625, 6.53125, 6.8349609375, 7.138671875, 7.4423828125, 7.74609375, 8.0498046875, 8.353515625, 8.6572265625, 8.9609375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 1.0, 4.0, 7.0, 8.0, 18.0, 10.0, 26.0, 23.0, 34.0, 46.0, 78.0, 122.0, 189.0, 385.0, 674.0, 885.0, 663.0, 364.0, 175.0, 119.0, 57.0, 53.0, 40.0, 29.0, 12.0, 7.0, 8.0, 11.0, 7.0, 4.0, 8.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.15625, -15.673583984375, -15.19091796875, -14.708251953125, -14.2255859375, -13.742919921875, -13.26025390625, -12.777587890625, -12.294921875, -11.812255859375, -11.32958984375, -10.846923828125, -10.3642578125, -9.881591796875, -9.39892578125, -8.916259765625, -8.43359375, -7.950927734375, -7.46826171875, -6.985595703125, -6.5029296875, -6.020263671875, -5.53759765625, -5.054931640625, -4.572265625, -4.089599609375, -3.60693359375, -3.124267578125, -2.6416015625, -2.158935546875, -1.67626953125, -1.193603515625, -0.7109375, -0.228271484375, 0.25439453125, 0.737060546875, 1.2197265625, 1.702392578125, 2.18505859375, 2.667724609375, 3.150390625, 3.633056640625, 4.11572265625, 4.598388671875, 5.0810546875, 5.563720703125, 6.04638671875, 6.529052734375, 7.01171875, 7.494384765625, 7.97705078125, 8.459716796875, 8.9423828125, 9.425048828125, 9.90771484375, 10.390380859375, 10.873046875, 11.355712890625, 11.83837890625, 12.321044921875, 12.8037109375, 13.286376953125, 13.76904296875, 14.251708984375, 14.734375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 8.0, 15.0, 17.0, 37.0, 39.0, 77.0, 96.0, 145.0, 250.0, 373.0, 576.0, 998.0, 1809.0, 3325.0, 6784.0, 14456.0, 34091.0, 104524.0, 947880.0, 2747835.0, 235758.0, 54315.0, 21090.0, 9483.0, 4603.0, 2446.0, 1284.0, 726.0, 427.0, 283.0, 172.0, 118.0, 78.0, 49.0, 36.0, 28.0, 17.0, 12.0, 5.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.63720703125, -16.0869140625, -15.53662109375, -14.986328125, -14.43603515625, -13.8857421875, -13.33544921875, -12.78515625, -12.23486328125, -11.6845703125, -11.13427734375, -10.583984375, -10.03369140625, -9.4833984375, -8.93310546875, -8.3828125, -7.83251953125, -7.2822265625, -6.73193359375, -6.181640625, -5.63134765625, -5.0810546875, -4.53076171875, -3.98046875, -3.43017578125, -2.8798828125, -2.32958984375, -1.779296875, -1.22900390625, -0.6787109375, -0.12841796875, 0.421875, 0.97216796875, 1.5224609375, 2.07275390625, 2.623046875, 3.17333984375, 3.7236328125, 4.27392578125, 4.82421875, 5.37451171875, 5.9248046875, 6.47509765625, 7.025390625, 7.57568359375, 8.1259765625, 8.67626953125, 9.2265625, 9.77685546875, 10.3271484375, 10.87744140625, 11.427734375, 11.97802734375, 12.5283203125, 13.07861328125, 13.62890625, 14.17919921875, 14.7294921875, 15.27978515625, 15.830078125, 16.38037109375, 16.9306640625, 17.48095703125, 18.03125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 13.0, 28.0, 44.0, 73.0, 108.0, 156.0, 153.0, 147.0, 96.0, 71.0, 37.0, 28.0, 13.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.43875885009766, -69.81275177001953, -67.1867446899414, -64.56074523925781, -61.93473815917969, -59.30873107910156, -56.68272399902344, -54.05671691894531, -51.43071365356445, -48.80470657348633, -46.17870330810547, -43.552696228027344, -40.92668914794922, -38.30068588256836, -35.674678802490234, -33.048675537109375, -30.42266845703125, -27.796663284301758, -25.170658111572266, -22.54465103149414, -19.91864585876465, -17.292640686035156, -14.666634559631348, -12.040628433227539, -9.414623260498047, -6.7886176109313965, -4.162611961364746, -1.5366063117980957, 1.0893993377685547, 3.715404510498047, 6.3414106369018555, 8.967416763305664, 11.593429565429688, 14.21943473815918, 16.845439910888672, 19.471446990966797, 22.09745216369629, 24.72345733642578, 27.349464416503906, 29.9754695892334, 32.60147476196289, 35.227481842041016, 37.853485107421875, 40.4794921875, 43.105499267578125, 45.731502532958984, 48.35750961303711, 50.98351287841797, 53.609519958496094, 56.23552703857422, 58.86153030395508, 61.4875373840332, 64.11354064941406, 66.73954772949219, 69.36555480957031, 71.99156188964844, 74.61756896972656, 77.24357604980469, 79.86958312988281, 82.4955825805664, 85.12158966064453, 87.74759674072266, 90.37360382080078, 92.9996109008789, 95.6256103515625]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 16.0, 14.0, 7.0, 15.0, 20.0, 22.0, 22.0, 32.0, 28.0, 48.0, 37.0, 45.0, 42.0, 35.0, 51.0, 48.0, 49.0, 58.0, 55.0, 33.0, 39.0, 26.0, 31.0, 28.0, 29.0, 24.0, 18.0, 11.0, 17.0, 13.0, 14.0, 13.0, 12.0, 12.0, 4.0, 2.0, 4.0, 5.0, 0.0, 1.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.66984939575195, -37.38703918457031, -36.104225158691406, -34.821414947509766, -33.538604736328125, -32.25579071044922, -30.972980499267578, -29.690168380737305, -28.40735626220703, -27.124544143676758, -25.841732025146484, -24.558921813964844, -23.27610969543457, -21.993297576904297, -20.710487365722656, -19.427675247192383, -18.14486312866211, -16.862051010131836, -15.579239845275879, -14.296428680419922, -13.013616561889648, -11.730804443359375, -10.447993278503418, -9.165182113647461, -7.8823699951171875, -6.599558353424072, -5.316746711730957, -4.033935070037842, -2.7511234283447266, -1.4683117866516113, -0.1855001449584961, 1.097311019897461, 2.3801231384277344, 3.6629347801208496, 4.945746421813965, 6.22855806350708, 7.511369705200195, 8.794181823730469, 10.076992988586426, 11.359804153442383, 12.642616271972656, 13.92542839050293, 15.208239555358887, 16.491050720214844, 17.773862838745117, 19.05667495727539, 20.33948516845703, 21.622297286987305, 22.905109405517578, 24.18792152404785, 25.470733642578125, 26.753543853759766, 28.03635597229004, 29.319168090820312, 30.601978302001953, 31.884790420532227, 33.1676025390625, 34.45041275024414, 35.73322677612305, 37.01603698730469, 38.298851013183594, 39.581661224365234, 40.864471435546875, 42.14728546142578, 43.43009567260742]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 3.0, 3.0, 9.0, 8.0, 13.0, 12.0, 18.0, 24.0, 20.0, 21.0, 26.0, 34.0, 33.0, 37.0, 39.0, 45.0, 41.0, 50.0, 56.0, 37.0, 40.0, 39.0, 30.0, 45.0, 45.0, 36.0, 35.0, 23.0, 25.0, 22.0, 20.0, 16.0, 15.0, 18.0, 17.0, 13.0, 8.0, 10.0, 1.0, 0.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.5, -5.34844970703125, -5.1968994140625, -5.04534912109375, -4.893798828125, -4.74224853515625, -4.5906982421875, -4.43914794921875, -4.28759765625, -4.13604736328125, -3.9844970703125, -3.83294677734375, -3.681396484375, -3.52984619140625, -3.3782958984375, -3.22674560546875, -3.0751953125, -2.92364501953125, -2.7720947265625, -2.62054443359375, -2.468994140625, -2.31744384765625, -2.1658935546875, -2.01434326171875, -1.86279296875, -1.71124267578125, -1.5596923828125, -1.40814208984375, -1.256591796875, -1.10504150390625, -0.9534912109375, -0.80194091796875, -0.650390625, -0.49884033203125, -0.3472900390625, -0.19573974609375, -0.044189453125, 0.10736083984375, 0.2589111328125, 0.41046142578125, 0.56201171875, 0.71356201171875, 0.8651123046875, 1.01666259765625, 1.168212890625, 1.31976318359375, 1.4713134765625, 1.62286376953125, 1.7744140625, 1.92596435546875, 2.0775146484375, 2.22906494140625, 2.380615234375, 2.53216552734375, 2.6837158203125, 2.83526611328125, 2.98681640625, 3.13836669921875, 3.2899169921875, 3.44146728515625, 3.593017578125, 3.74456787109375, 3.8961181640625, 4.04766845703125, 4.19921875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 8.0, 7.0, 22.0, 19.0, 39.0, 47.0, 65.0, 111.0, 173.0, 232.0, 389.0, 608.0, 995.0, 1521.0, 2522.0, 4318.0, 7422.0, 12510.0, 22622.0, 40966.0, 79414.0, 170181.0, 338660.0, 182454.0, 84024.0, 43518.0, 23395.0, 13175.0, 7536.0, 4441.0, 2701.0, 1604.0, 1028.0, 644.0, 408.0, 265.0, 160.0, 103.0, 75.0, 61.0, 32.0, 20.0, 21.0, 10.0, 6.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.229736328125, -0.2222137451171875, -0.214691162109375, -0.2071685791015625, -0.19964599609375, -0.1921234130859375, -0.184600830078125, -0.1770782470703125, -0.1695556640625, -0.1620330810546875, -0.154510498046875, -0.1469879150390625, -0.13946533203125, -0.1319427490234375, -0.124420166015625, -0.1168975830078125, -0.109375, -0.1018524169921875, -0.094329833984375, -0.0868072509765625, -0.07928466796875, -0.0717620849609375, -0.064239501953125, -0.0567169189453125, -0.0491943359375, -0.0416717529296875, -0.034149169921875, -0.0266265869140625, -0.01910400390625, -0.0115814208984375, -0.004058837890625, 0.0034637451171875, 0.010986328125, 0.0185089111328125, 0.026031494140625, 0.0335540771484375, 0.04107666015625, 0.0485992431640625, 0.056121826171875, 0.0636444091796875, 0.0711669921875, 0.0786895751953125, 0.086212158203125, 0.0937347412109375, 0.10125732421875, 0.1087799072265625, 0.116302490234375, 0.1238250732421875, 0.13134765625, 0.1388702392578125, 0.146392822265625, 0.1539154052734375, 0.16143798828125, 0.1689605712890625, 0.176483154296875, 0.1840057373046875, 0.1915283203125, 0.1990509033203125, 0.206573486328125, 0.2140960693359375, 0.22161865234375, 0.2291412353515625, 0.236663818359375, 0.2441864013671875, 0.251708984375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 7.0, 3.0, 7.0, 6.0, 7.0, 9.0, 11.0, 13.0, 22.0, 25.0, 29.0, 24.0, 22.0, 30.0, 31.0, 31.0, 41.0, 43.0, 43.0, 43.0, 32.0, 1063.0, 41.0, 46.0, 30.0, 40.0, 22.0, 35.0, 28.0, 35.0, 32.0, 24.0, 26.0, 18.0, 24.0, 9.0, 14.0, 14.0, 8.0, 8.0, 5.0, 4.0, 4.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.580078125, -2.489288330078125, -2.39849853515625, -2.307708740234375, -2.2169189453125, -2.126129150390625, -2.03533935546875, -1.944549560546875, -1.853759765625, -1.762969970703125, -1.67218017578125, -1.581390380859375, -1.4906005859375, -1.399810791015625, -1.30902099609375, -1.218231201171875, -1.12744140625, -1.036651611328125, -0.94586181640625, -0.855072021484375, -0.7642822265625, -0.673492431640625, -0.58270263671875, -0.491912841796875, -0.401123046875, -0.310333251953125, -0.21954345703125, -0.128753662109375, -0.0379638671875, 0.052825927734375, 0.14361572265625, 0.234405517578125, 0.3251953125, 0.415985107421875, 0.50677490234375, 0.597564697265625, 0.6883544921875, 0.779144287109375, 0.86993408203125, 0.960723876953125, 1.051513671875, 1.142303466796875, 1.23309326171875, 1.323883056640625, 1.4146728515625, 1.505462646484375, 1.59625244140625, 1.687042236328125, 1.77783203125, 1.868621826171875, 1.95941162109375, 2.050201416015625, 2.1409912109375, 2.231781005859375, 2.32257080078125, 2.413360595703125, 2.504150390625, 2.594940185546875, 2.68572998046875, 2.776519775390625, 2.8673095703125, 2.958099365234375, 3.04888916015625, 3.139678955078125, 3.23046875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 7.0, 7.0, 5.0, 10.0, 19.0, 18.0, 33.0, 36.0, 50.0, 100.0, 131.0, 179.0, 252.0, 337.0, 518.0, 666.0, 946.0, 1212.0, 1779.0, 2682.0, 3664.0, 5303.0, 7799.0, 11208.0, 16565.0, 24573.0, 37098.0, 56673.0, 88701.0, 140867.0, 1254215.0, 155745.0, 97783.0, 62169.0, 40836.0, 27021.0, 18216.0, 12063.0, 8351.0, 5729.0, 3947.0, 2734.0, 1948.0, 1392.0, 992.0, 730.0, 499.0, 387.0, 238.0, 203.0, 153.0, 81.0, 70.0, 51.0, 31.0, 41.0, 25.0, 15.0, 19.0, 7.0, 7.0, 10.0], "bins": [-0.11602783203125, -0.11246967315673828, -0.10891151428222656, -0.10535335540771484, -0.10179519653320312, -0.0982370376586914, -0.09467887878417969, -0.09112071990966797, -0.08756256103515625, -0.08400440216064453, -0.08044624328613281, -0.0768880844116211, -0.07332992553710938, -0.06977176666259766, -0.06621360778808594, -0.06265544891357422, -0.0590972900390625, -0.05553913116455078, -0.05198097229003906, -0.048422813415527344, -0.044864654541015625, -0.041306495666503906, -0.03774833679199219, -0.03419017791748047, -0.03063201904296875, -0.02707386016845703, -0.023515701293945312, -0.019957542419433594, -0.016399383544921875, -0.012841224670410156, -0.009283065795898438, -0.005724906921386719, -0.002166748046875, 0.0013914108276367188, 0.0049495697021484375, 0.008507728576660156, 0.012065887451171875, 0.015624046325683594, 0.019182205200195312, 0.02274036407470703, 0.02629852294921875, 0.02985668182373047, 0.03341484069824219, 0.036972999572753906, 0.040531158447265625, 0.044089317321777344, 0.04764747619628906, 0.05120563507080078, 0.0547637939453125, 0.05832195281982422, 0.06188011169433594, 0.06543827056884766, 0.06899642944335938, 0.0725545883178711, 0.07611274719238281, 0.07967090606689453, 0.08322906494140625, 0.08678722381591797, 0.09034538269042969, 0.0939035415649414, 0.09746170043945312, 0.10101985931396484, 0.10457801818847656, 0.10813617706298828, 0.1116943359375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 3.0, 6.0, 5.0, 6.0, 4.0, 6.0, 10.0, 11.0, 8.0, 17.0, 11.0, 12.0, 16.0, 26.0, 28.0, 35.0, 57.0, 70.0, 89.0, 106.0, 80.0, 86.0, 59.0, 48.0, 43.0, 29.0, 27.0, 20.0, 13.0, 20.0, 11.0, 5.0, 7.0, 4.0, 8.0, 5.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00020623207092285156, -0.00019990280270576477, -0.00019357353448867798, -0.0001872442662715912, -0.0001809149980545044, -0.0001745857298374176, -0.0001682564616203308, -0.00016192719340324402, -0.00015559792518615723, -0.00014926865696907043, -0.00014293938875198364, -0.00013661012053489685, -0.00013028085231781006, -0.00012395158410072327, -0.00011762231588363647, -0.00011129304766654968, -0.00010496377944946289, -9.86345112323761e-05, -9.23052430152893e-05, -8.597597479820251e-05, -7.964670658111572e-05, -7.331743836402893e-05, -6.698817014694214e-05, -6.065890192985535e-05, -5.4329633712768555e-05, -4.800036549568176e-05, -4.167109727859497e-05, -3.534182906150818e-05, -2.9012560844421387e-05, -2.2683292627334595e-05, -1.6354024410247803e-05, -1.002475619316101e-05, -3.6954879760742188e-06, 2.6337802410125732e-06, 8.963048458099365e-06, 1.5292316675186157e-05, 2.162158489227295e-05, 2.795085310935974e-05, 3.428012132644653e-05, 4.0609389543533325e-05, 4.693865776062012e-05, 5.326792597770691e-05, 5.95971941947937e-05, 6.592646241188049e-05, 7.225573062896729e-05, 7.858499884605408e-05, 8.491426706314087e-05, 9.124353528022766e-05, 9.757280349731445e-05, 0.00010390207171440125, 0.00011023133993148804, 0.00011656060814857483, 0.00012288987636566162, 0.0001292191445827484, 0.0001355484127998352, 0.000141877681016922, 0.0001482069492340088, 0.00015453621745109558, 0.00016086548566818237, 0.00016719475388526917, 0.00017352402210235596, 0.00017985329031944275, 0.00018618255853652954, 0.00019251182675361633, 0.00019884109497070312]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 3.0, 8.0, 6.0, 7.0, 14.0, 11.0, 27.0, 27.0, 34.0, 51.0, 58.0, 104.0, 144.0, 351.0, 1018.0, 4537.0, 36434.0, 851626.0, 140527.0, 10604.0, 1842.0, 517.0, 214.0, 89.0, 67.0, 55.0, 40.0, 20.0, 20.0, 20.0, 17.0, 18.0, 7.0, 7.0, 4.0, 4.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024585723876953125, -0.0023729801177978516, -0.0022873878479003906, -0.0022017955780029297, -0.0021162033081054688, -0.002030611038208008, -0.0019450187683105469, -0.001859426498413086, -0.001773834228515625, -0.001688241958618164, -0.0016026496887207031, -0.0015170574188232422, -0.0014314651489257812, -0.0013458728790283203, -0.0012602806091308594, -0.0011746883392333984, -0.0010890960693359375, -0.0010035037994384766, -0.0009179115295410156, -0.0008323192596435547, -0.0007467269897460938, -0.0006611347198486328, -0.0005755424499511719, -0.0004899501800537109, -0.00040435791015625, -0.00031876564025878906, -0.00023317337036132812, -0.0001475811004638672, -6.198883056640625e-05, 2.3603439331054688e-05, 0.00010919570922851562, 0.00019478797912597656, 0.0002803802490234375, 0.00036597251892089844, 0.0004515647888183594, 0.0005371570587158203, 0.0006227493286132812, 0.0007083415985107422, 0.0007939338684082031, 0.0008795261383056641, 0.000965118408203125, 0.001050710678100586, 0.0011363029479980469, 0.0012218952178955078, 0.0013074874877929688, 0.0013930797576904297, 0.0014786720275878906, 0.0015642642974853516, 0.0016498565673828125, 0.0017354488372802734, 0.0018210411071777344, 0.0019066333770751953, 0.0019922256469726562, 0.002077817916870117, 0.002163410186767578, 0.002249002456665039, 0.0023345947265625, 0.002420186996459961, 0.002505779266357422, 0.002591371536254883, 0.0026769638061523438, 0.0027625560760498047, 0.0028481483459472656, 0.0029337406158447266, 0.0030193328857421875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 9.0, 9.0, 23.0, 37.0, 57.0, 97.0, 151.0, 180.0, 173.0, 104.0, 60.0, 33.0, 29.0, 13.0, 8.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011117279791506007, -0.00010345063492422923, -9.57284719333984e-05, -8.800631621852517e-05, -8.028415322769433e-05, -7.25619902368635e-05, -6.483982724603266e-05, -5.7117664255201817e-05, -4.939550126437098e-05, -4.167333827354014e-05, -3.39511752827093e-05, -2.622901592985727e-05, -1.850685293902643e-05, -1.0784689948195592e-05, -3.06253059534356e-06, 4.659632395487279e-06, 1.2381795386318117e-05, 2.0103958377148956e-05, 2.782611954899039e-05, 3.5548280720831826e-05, 4.3270443711662665e-05, 5.0992606702493504e-05, 5.8714766055345535e-05, 6.643692904617637e-05, 7.415909203700721e-05, 8.188125502783805e-05, 8.960341801866889e-05, 9.732558100949973e-05, 0.00010504774400033057, 0.0001127699069911614, 0.00012049206270603463, 0.00012821421842090786, 0.00013593639596365392, 0.00014365855895448476, 0.0001513807219453156, 0.00015910288493614644, 0.00016682504792697728, 0.00017454721091780812, 0.00018226937390863895, 0.00018999152234755456, 0.00019771369989030063, 0.00020543586288113147, 0.0002131580258719623, 0.00022088018886279315, 0.00022860235185362399, 0.00023632451484445482, 0.00024404667783528566, 0.0002517688262742013, 0.0002594909747131169, 0.0002672131231520325, 0.00027493530069477856, 0.00028265744913369417, 0.00029037962667644024, 0.00029810177511535585, 0.0003058239526581019, 0.0003135461010970175, 0.0003212682786397636, 0.0003289904270786792, 0.00033671260462142527, 0.0003444347530603409, 0.00035215693060308695, 0.00035987907904200256, 0.0003676012565847486, 0.00037532340502366424, 0.0003830455825664103]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 5.0, 8.0, 9.0, 12.0, 10.0, 16.0, 15.0, 12.0, 9.0, 17.0, 19.0, 28.0, 18.0, 28.0, 30.0, 34.0, 31.0, 30.0, 35.0, 43.0, 39.0, 34.0, 39.0, 39.0, 33.0, 31.0, 30.0, 30.0, 42.0, 31.0, 24.0, 28.0, 22.0, 21.0, 13.0, 24.0, 13.0, 17.0, 11.0, 6.0, 8.0, 8.0, 14.0, 7.0, 7.0, 4.0, 2.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-8.422136306762695e-05, -8.152052760124207e-05, -7.881969213485718e-05, -7.611885666847229e-05, -7.34180212020874e-05, -7.071718573570251e-05, -6.801635026931763e-05, -6.531551480293274e-05, -6.261467933654785e-05, -5.9913843870162964e-05, -5.7213008403778076e-05, -5.451217293739319e-05, -5.18113374710083e-05, -4.911050200462341e-05, -4.6409666538238525e-05, -4.370883107185364e-05, -4.100799560546875e-05, -3.830716013908386e-05, -3.5606324672698975e-05, -3.290548920631409e-05, -3.02046537399292e-05, -2.750381827354431e-05, -2.4802982807159424e-05, -2.2102147340774536e-05, -1.940131187438965e-05, -1.670047640800476e-05, -1.3999640941619873e-05, -1.1298805475234985e-05, -8.597970008850098e-06, -5.89713454246521e-06, -3.1962990760803223e-06, -4.954636096954346e-07, 2.205371856689453e-06, 4.906207323074341e-06, 7.6070427894592285e-06, 1.0307878255844116e-05, 1.3008713722229004e-05, 1.570954918861389e-05, 1.841038465499878e-05, 2.1111220121383667e-05, 2.3812055587768555e-05, 2.6512891054153442e-05, 2.921372652053833e-05, 3.191456198692322e-05, 3.4615397453308105e-05, 3.731623291969299e-05, 4.001706838607788e-05, 4.271790385246277e-05, 4.5418739318847656e-05, 4.8119574785232544e-05, 5.082041025161743e-05, 5.352124571800232e-05, 5.622208118438721e-05, 5.8922916650772095e-05, 6.162375211715698e-05, 6.432458758354187e-05, 6.702542304992676e-05, 6.972625851631165e-05, 7.242709398269653e-05, 7.512792944908142e-05, 7.782876491546631e-05, 8.05296003818512e-05, 8.323043584823608e-05, 8.593127131462097e-05, 8.863210678100586e-05]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 3.0, 3.0, 9.0, 8.0, 13.0, 12.0, 18.0, 24.0, 20.0, 21.0, 26.0, 34.0, 33.0, 37.0, 39.0, 45.0, 41.0, 50.0, 56.0, 37.0, 40.0, 39.0, 30.0, 45.0, 45.0, 36.0, 35.0, 23.0, 25.0, 22.0, 20.0, 16.0, 15.0, 18.0, 17.0, 13.0, 8.0, 10.0, 1.0, 0.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.5, -5.34844970703125, -5.1968994140625, -5.04534912109375, -4.893798828125, -4.74224853515625, -4.5906982421875, -4.43914794921875, -4.28759765625, -4.13604736328125, -3.9844970703125, -3.83294677734375, -3.681396484375, -3.52984619140625, -3.3782958984375, -3.22674560546875, -3.0751953125, -2.92364501953125, -2.7720947265625, -2.62054443359375, -2.468994140625, -2.31744384765625, -2.1658935546875, -2.01434326171875, -1.86279296875, -1.71124267578125, -1.5596923828125, -1.40814208984375, -1.256591796875, -1.10504150390625, -0.9534912109375, -0.80194091796875, -0.650390625, -0.49884033203125, -0.3472900390625, -0.19573974609375, -0.044189453125, 0.10736083984375, 0.2589111328125, 0.41046142578125, 0.56201171875, 0.71356201171875, 0.8651123046875, 1.01666259765625, 1.168212890625, 1.31976318359375, 1.4713134765625, 1.62286376953125, 1.7744140625, 1.92596435546875, 2.0775146484375, 2.22906494140625, 2.380615234375, 2.53216552734375, 2.6837158203125, 2.83526611328125, 2.98681640625, 3.13836669921875, 3.2899169921875, 3.44146728515625, 3.593017578125, 3.74456787109375, 3.8961181640625, 4.04766845703125, 4.19921875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 14.0, 7.0, 21.0, 27.0, 33.0, 54.0, 65.0, 101.0, 118.0, 183.0, 270.0, 435.0, 635.0, 958.0, 1493.0, 2309.0, 4046.0, 8348.0, 22472.0, 114273.0, 722021.0, 127106.0, 23632.0, 8685.0, 4359.0, 2453.0, 1471.0, 907.0, 636.0, 448.0, 282.0, 209.0, 158.0, 111.0, 50.0, 65.0, 27.0, 22.0, 23.0, 8.0, 5.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.6749267578125, -8.381103515625, -8.0872802734375, -7.79345703125, -7.4996337890625, -7.205810546875, -6.9119873046875, -6.6181640625, -6.3243408203125, -6.030517578125, -5.7366943359375, -5.44287109375, -5.1490478515625, -4.855224609375, -4.5614013671875, -4.267578125, -3.9737548828125, -3.679931640625, -3.3861083984375, -3.09228515625, -2.7984619140625, -2.504638671875, -2.2108154296875, -1.9169921875, -1.6231689453125, -1.329345703125, -1.0355224609375, -0.74169921875, -0.4478759765625, -0.154052734375, 0.1397705078125, 0.43359375, 0.7274169921875, 1.021240234375, 1.3150634765625, 1.60888671875, 1.9027099609375, 2.196533203125, 2.4903564453125, 2.7841796875, 3.0780029296875, 3.371826171875, 3.6656494140625, 3.95947265625, 4.2532958984375, 4.547119140625, 4.8409423828125, 5.134765625, 5.4285888671875, 5.722412109375, 6.0162353515625, 6.31005859375, 6.6038818359375, 6.897705078125, 7.1915283203125, 7.4853515625, 7.7791748046875, 8.072998046875, 8.3668212890625, 8.66064453125, 8.9544677734375, 9.248291015625, 9.5421142578125, 9.8359375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 10.0, 2.0, 10.0, 11.0, 10.0, 15.0, 24.0, 28.0, 22.0, 37.0, 31.0, 44.0, 45.0, 47.0, 71.0, 105.0, 293.0, 1600.0, 168.0, 86.0, 43.0, 41.0, 46.0, 35.0, 33.0, 31.0, 27.0, 30.0, 20.0, 15.0, 17.0, 16.0, 7.0, 6.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -19.14453125, -18.5703125, -17.99609375, -17.421875, -16.84765625, -16.2734375, -15.69921875, -15.125, -14.55078125, -13.9765625, -13.40234375, -12.828125, -12.25390625, -11.6796875, -11.10546875, -10.53125, -9.95703125, -9.3828125, -8.80859375, -8.234375, -7.66015625, -7.0859375, -6.51171875, -5.9375, -5.36328125, -4.7890625, -4.21484375, -3.640625, -3.06640625, -2.4921875, -1.91796875, -1.34375, -0.76953125, -0.1953125, 0.37890625, 0.953125, 1.52734375, 2.1015625, 2.67578125, 3.25, 3.82421875, 4.3984375, 4.97265625, 5.546875, 6.12109375, 6.6953125, 7.26953125, 7.84375, 8.41796875, 8.9921875, 9.56640625, 10.140625, 10.71484375, 11.2890625, 11.86328125, 12.4375, 13.01171875, 13.5859375, 14.16015625, 14.734375, 15.30859375, 15.8828125, 16.45703125, 17.03125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 11.0, 9.0, 9.0, 22.0, 34.0, 35.0, 37.0, 81.0, 95.0, 203.0, 417.0, 1422.0, 11061.0, 3020396.0, 106573.0, 3826.0, 753.0, 282.0, 151.0, 74.0, 64.0, 45.0, 26.0, 20.0, 14.0, 14.0, 12.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.75, -31.1728515625, -29.595703125, -28.0185546875, -26.44140625, -24.8642578125, -23.287109375, -21.7099609375, -20.1328125, -18.5556640625, -16.978515625, -15.4013671875, -13.82421875, -12.2470703125, -10.669921875, -9.0927734375, -7.515625, -5.9384765625, -4.361328125, -2.7841796875, -1.20703125, 0.3701171875, 1.947265625, 3.5244140625, 5.1015625, 6.6787109375, 8.255859375, 9.8330078125, 11.41015625, 12.9873046875, 14.564453125, 16.1416015625, 17.71875, 19.2958984375, 20.873046875, 22.4501953125, 24.02734375, 25.6044921875, 27.181640625, 28.7587890625, 30.3359375, 31.9130859375, 33.490234375, 35.0673828125, 36.64453125, 38.2216796875, 39.798828125, 41.3759765625, 42.953125, 44.5302734375, 46.107421875, 47.6845703125, 49.26171875, 50.8388671875, 52.416015625, 53.9931640625, 55.5703125, 57.1474609375, 58.724609375, 60.3017578125, 61.87890625, 63.4560546875, 65.033203125, 66.6103515625, 68.1875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 78.0, 305.0, 432.0, 169.0, 23.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.01662254333496, -21.103092193603516, -18.189563751220703, -15.276033401489258, -12.362503051757812, -9.448972702026367, -6.535444259643555, -3.6219139099121094, -0.7083835601806641, 2.205146312713623, 5.11867618560791, 8.032205581665039, 10.945735931396484, 13.85926628112793, 16.772794723510742, 19.686325073242188, 22.599855422973633, 25.513385772705078, 28.42691421508789, 31.340444564819336, 34.25397491455078, 37.167503356933594, 40.081031799316406, 42.994564056396484, 45.90809631347656, 48.821624755859375, 51.73515701293945, 54.648685455322266, 57.562217712402344, 60.475746154785156, 63.38927459716797, 66.30280303955078, 69.21633911132812, 72.12986755371094, 75.04339599609375, 77.95692443847656, 80.8704605102539, 83.78398895263672, 86.69751739501953, 89.61104583740234, 92.52458190917969, 95.4381103515625, 98.35163879394531, 101.26516723632812, 104.17870330810547, 107.09223175048828, 110.0057601928711, 112.9192886352539, 115.83281707763672, 118.74634552001953, 121.65987396240234, 124.57341003417969, 127.4869384765625, 130.4004669189453, 133.31399536132812, 136.22752380371094, 139.14105224609375, 142.05458068847656, 144.96810913085938, 147.8816375732422, 150.795166015625, 153.70870971679688, 156.62222290039062, 159.5357666015625, 162.4492950439453]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 5.0, 11.0, 6.0, 13.0, 13.0, 21.0, 16.0, 17.0, 17.0, 29.0, 23.0, 28.0, 35.0, 37.0, 45.0, 40.0, 29.0, 39.0, 42.0, 32.0, 38.0, 38.0, 35.0, 43.0, 28.0, 42.0, 32.0, 28.0, 22.0, 28.0, 25.0, 24.0, 15.0, 11.0, 9.0, 14.0, 19.0, 8.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 3.0, 5.0, 1.0, 0.0, 1.0], "bins": [-42.793819427490234, -41.54755401611328, -40.301292419433594, -39.05502700805664, -37.80876159667969, -36.5625, -35.31623458862305, -34.069969177246094, -32.823707580566406, -31.577444076538086, -30.331180572509766, -29.084915161132812, -27.838651657104492, -26.592388153076172, -25.34612274169922, -24.0998592376709, -22.853595733642578, -21.607332229614258, -20.361068725585938, -19.114803314208984, -17.868539810180664, -16.622276306152344, -15.376011848449707, -14.12974739074707, -12.88348388671875, -11.63722038269043, -10.390955924987793, -9.144691467285156, -7.898427963256836, -6.652163982391357, -5.405900001525879, -4.159635543823242, -2.9133758544921875, -1.667111873626709, -0.42084789276123047, 0.825416088104248, 2.0716800689697266, 3.317944049835205, 4.564208030700684, 5.81047248840332, 7.056735992431641, 8.302999496459961, 9.549263954162598, 10.795528411865234, 12.041791915893555, 13.288055419921875, 14.534319877624512, 15.780584335327148, 17.02684783935547, 18.27311134338379, 19.51937484741211, 20.765640258789062, 22.011903762817383, 23.258167266845703, 24.504432678222656, 25.750696182250977, 26.996959686279297, 28.243223190307617, 29.489486694335938, 30.73575210571289, 31.98201560974121, 33.22827911376953, 34.474544525146484, 35.72080993652344, 36.967071533203125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 4.0, 10.0, 8.0, 5.0, 20.0, 24.0, 17.0, 21.0, 21.0, 29.0, 26.0, 29.0, 52.0, 51.0, 45.0, 43.0, 50.0, 52.0, 37.0, 31.0, 38.0, 47.0, 56.0, 35.0, 31.0, 23.0, 32.0, 29.0, 14.0, 21.0, 15.0, 14.0, 14.0, 19.0, 10.0, 5.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.67578125, -5.5133056640625, -5.350830078125, -5.1883544921875, -5.02587890625, -4.8634033203125, -4.700927734375, -4.5384521484375, -4.3759765625, -4.2135009765625, -4.051025390625, -3.8885498046875, -3.72607421875, -3.5635986328125, -3.401123046875, -3.2386474609375, -3.076171875, -2.9136962890625, -2.751220703125, -2.5887451171875, -2.42626953125, -2.2637939453125, -2.101318359375, -1.9388427734375, -1.7763671875, -1.6138916015625, -1.451416015625, -1.2889404296875, -1.12646484375, -0.9639892578125, -0.801513671875, -0.6390380859375, -0.4765625, -0.3140869140625, -0.151611328125, 0.0108642578125, 0.17333984375, 0.3358154296875, 0.498291015625, 0.6607666015625, 0.8232421875, 0.9857177734375, 1.148193359375, 1.3106689453125, 1.47314453125, 1.6356201171875, 1.798095703125, 1.9605712890625, 2.123046875, 2.2855224609375, 2.447998046875, 2.6104736328125, 2.77294921875, 2.9354248046875, 3.097900390625, 3.2603759765625, 3.4228515625, 3.5853271484375, 3.747802734375, 3.9102783203125, 4.07275390625, 4.2352294921875, 4.397705078125, 4.5601806640625, 4.72265625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 9.0, 3.0, 10.0, 10.0, 15.0, 20.0, 17.0, 30.0, 45.0, 64.0, 69.0, 123.0, 262.0, 482.0, 1051.0, 2702.0, 8056.0, 29472.0, 382297.0, 3608882.0, 130013.0, 20948.0, 5995.0, 2022.0, 798.0, 346.0, 182.0, 95.0, 67.0, 46.0, 41.0, 25.0, 31.0, 17.0, 14.0, 5.0, 4.0, 6.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.921875, -25.208984375, -24.49609375, -23.783203125, -23.0703125, -22.357421875, -21.64453125, -20.931640625, -20.21875, -19.505859375, -18.79296875, -18.080078125, -17.3671875, -16.654296875, -15.94140625, -15.228515625, -14.515625, -13.802734375, -13.08984375, -12.376953125, -11.6640625, -10.951171875, -10.23828125, -9.525390625, -8.8125, -8.099609375, -7.38671875, -6.673828125, -5.9609375, -5.248046875, -4.53515625, -3.822265625, -3.109375, -2.396484375, -1.68359375, -0.970703125, -0.2578125, 0.455078125, 1.16796875, 1.880859375, 2.59375, 3.306640625, 4.01953125, 4.732421875, 5.4453125, 6.158203125, 6.87109375, 7.583984375, 8.296875, 9.009765625, 9.72265625, 10.435546875, 11.1484375, 11.861328125, 12.57421875, 13.287109375, 14.0, 14.712890625, 15.42578125, 16.138671875, 16.8515625, 17.564453125, 18.27734375, 18.990234375, 19.703125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 10.0, 9.0, 15.0, 22.0, 26.0, 42.0, 71.0, 142.0, 266.0, 559.0, 1058.0, 966.0, 441.0, 199.0, 80.0, 49.0, 46.0, 25.0, 12.0, 13.0, 9.0, 2.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.34375, -26.6734619140625, -26.003173828125, -25.3328857421875, -24.66259765625, -23.9923095703125, -23.322021484375, -22.6517333984375, -21.9814453125, -21.3111572265625, -20.640869140625, -19.9705810546875, -19.30029296875, -18.6300048828125, -17.959716796875, -17.2894287109375, -16.619140625, -15.9488525390625, -15.278564453125, -14.6082763671875, -13.93798828125, -13.2677001953125, -12.597412109375, -11.9271240234375, -11.2568359375, -10.5865478515625, -9.916259765625, -9.2459716796875, -8.57568359375, -7.9053955078125, -7.235107421875, -6.5648193359375, -5.89453125, -5.2242431640625, -4.553955078125, -3.8836669921875, -3.21337890625, -2.5430908203125, -1.872802734375, -1.2025146484375, -0.5322265625, 0.1380615234375, 0.808349609375, 1.4786376953125, 2.14892578125, 2.8192138671875, 3.489501953125, 4.1597900390625, 4.830078125, 5.5003662109375, 6.170654296875, 6.8409423828125, 7.51123046875, 8.1815185546875, 8.851806640625, 9.5220947265625, 10.1923828125, 10.8626708984375, 11.532958984375, 12.2032470703125, 12.87353515625, 13.5438232421875, 14.214111328125, 14.8843994140625, 15.5546875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 15.0, 20.0, 24.0, 52.0, 79.0, 153.0, 438.0, 1930.0, 11649.0, 174196.0, 3930130.0, 66967.0, 6745.0, 1230.0, 355.0, 129.0, 55.0, 50.0, 23.0, 14.0, 8.0, 12.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.96875, -36.27099609375, -34.5732421875, -32.87548828125, -31.177734375, -29.47998046875, -27.7822265625, -26.08447265625, -24.38671875, -22.68896484375, -20.9912109375, -19.29345703125, -17.595703125, -15.89794921875, -14.2001953125, -12.50244140625, -10.8046875, -9.10693359375, -7.4091796875, -5.71142578125, -4.013671875, -2.31591796875, -0.6181640625, 1.07958984375, 2.77734375, 4.47509765625, 6.1728515625, 7.87060546875, 9.568359375, 11.26611328125, 12.9638671875, 14.66162109375, 16.359375, 18.05712890625, 19.7548828125, 21.45263671875, 23.150390625, 24.84814453125, 26.5458984375, 28.24365234375, 29.94140625, 31.63916015625, 33.3369140625, 35.03466796875, 36.732421875, 38.43017578125, 40.1279296875, 41.82568359375, 43.5234375, 45.22119140625, 46.9189453125, 48.61669921875, 50.314453125, 52.01220703125, 53.7099609375, 55.40771484375, 57.10546875, 58.80322265625, 60.5009765625, 62.19873046875, 63.896484375, 65.59423828125, 67.2919921875, 68.98974609375, 70.6875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 6.0, 8.0, 8.0, 8.0, 13.0, 9.0, 22.0, 25.0, 30.0, 43.0, 57.0, 71.0, 90.0, 111.0, 113.0, 90.0, 91.0, 54.0, 41.0, 31.0, 20.0, 15.0, 23.0, 19.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.74475860595703, -42.00543212890625, -40.26610565185547, -38.52677536010742, -36.78744888305664, -35.04812240600586, -33.30879592895508, -31.569467544555664, -29.83013916015625, -28.09081268310547, -26.351484298706055, -24.612157821655273, -22.87282943725586, -21.133502960205078, -19.394176483154297, -17.654848098754883, -15.915521621704102, -14.176194190979004, -12.436866760253906, -10.697540283203125, -8.958211898803711, -7.21888542175293, -5.479557991027832, -3.7402305603027344, -2.0009031295776367, -0.2615758180618286, 1.4777514934539795, 3.217078685760498, 4.956406116485596, 6.695733070373535, 8.435060501098633, 10.17438793182373, 11.913715362548828, 13.653042793273926, 15.392370223999023, 17.131696701049805, 18.87102508544922, 20.6103515625, 22.34967803955078, 24.089006423950195, 25.82833480834961, 27.56766128540039, 29.306989669799805, 31.046316146850586, 32.78564453125, 34.52497100830078, 36.26429748535156, 38.003623962402344, 39.742950439453125, 41.482276916503906, 43.22160339355469, 44.960933685302734, 46.700260162353516, 48.4395866394043, 50.17891311645508, 51.918243408203125, 53.657569885253906, 55.39689636230469, 57.13622283935547, 58.875553131103516, 60.6148796081543, 62.35420608520508, 64.09353637695312, 65.8328628540039, 67.57218933105469]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 3.0, 8.0, 8.0, 5.0, 16.0, 9.0, 11.0, 19.0, 29.0, 18.0, 19.0, 34.0, 31.0, 34.0, 36.0, 36.0, 36.0, 32.0, 49.0, 34.0, 43.0, 50.0, 36.0, 35.0, 43.0, 37.0, 20.0, 34.0, 27.0, 38.0, 16.0, 19.0, 17.0, 19.0, 16.0, 24.0, 13.0, 10.0, 5.0, 8.0, 4.0, 3.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-41.2381706237793, -40.04390335083008, -38.84963607788086, -37.65536880493164, -36.46110534667969, -35.26683807373047, -34.07257080078125, -32.87830352783203, -31.684036254882812, -30.489768981933594, -29.295501708984375, -28.10123634338379, -26.90696907043457, -25.71270179748535, -24.518436431884766, -23.324169158935547, -22.129901885986328, -20.93563461303711, -19.74136734008789, -18.547101974487305, -17.352834701538086, -16.158567428588867, -14.964301109313965, -13.770034790039062, -12.575767517089844, -11.381500244140625, -10.187233924865723, -8.99296760559082, -7.798700332641602, -6.604433536529541, -5.4101667404174805, -4.215900421142578, -3.021636962890625, -1.8273701667785645, -0.6331033706665039, 0.5611634254455566, 1.7554302215576172, 2.9496970176696777, 4.143963813781738, 5.338230133056641, 6.532497406005859, 7.72676420211792, 8.92103099822998, 10.115297317504883, 11.309564590454102, 12.50383186340332, 13.698098182678223, 14.892364501953125, 16.086631774902344, 17.280899047851562, 18.47516632080078, 19.669431686401367, 20.863698959350586, 22.057966232299805, 23.25223159790039, 24.44649887084961, 25.640766143798828, 26.835033416748047, 28.029300689697266, 29.22356605529785, 30.41783332824707, 31.61210060119629, 32.806365966796875, 34.000633239746094, 35.19490051269531]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 6.0, 10.0, 10.0, 10.0, 9.0, 23.0, 18.0, 25.0, 26.0, 24.0, 35.0, 43.0, 45.0, 42.0, 37.0, 42.0, 43.0, 39.0, 34.0, 52.0, 44.0, 37.0, 45.0, 33.0, 42.0, 32.0, 23.0, 21.0, 16.0, 20.0, 28.0, 14.0, 13.0, 13.0, 7.0, 3.0, 12.0, 7.0, 6.0, 4.0, 4.0, 1.0, 3.0], "bins": [-6.1953125, -6.03692626953125, -5.8785400390625, -5.72015380859375, -5.561767578125, -5.40338134765625, -5.2449951171875, -5.08660888671875, -4.92822265625, -4.76983642578125, -4.6114501953125, -4.45306396484375, -4.294677734375, -4.13629150390625, -3.9779052734375, -3.81951904296875, -3.6611328125, -3.50274658203125, -3.3443603515625, -3.18597412109375, -3.027587890625, -2.86920166015625, -2.7108154296875, -2.55242919921875, -2.39404296875, -2.23565673828125, -2.0772705078125, -1.91888427734375, -1.760498046875, -1.60211181640625, -1.4437255859375, -1.28533935546875, -1.126953125, -0.96856689453125, -0.8101806640625, -0.65179443359375, -0.493408203125, -0.33502197265625, -0.1766357421875, -0.01824951171875, 0.14013671875, 0.29852294921875, 0.4569091796875, 0.61529541015625, 0.773681640625, 0.93206787109375, 1.0904541015625, 1.24884033203125, 1.4072265625, 1.56561279296875, 1.7239990234375, 1.88238525390625, 2.040771484375, 2.19915771484375, 2.3575439453125, 2.51593017578125, 2.67431640625, 2.83270263671875, 2.9910888671875, 3.14947509765625, 3.307861328125, 3.46624755859375, 3.6246337890625, 3.78302001953125, 3.94140625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 8.0, 20.0, 24.0, 29.0, 50.0, 71.0, 104.0, 164.0, 254.0, 425.0, 640.0, 1058.0, 1653.0, 2706.0, 4235.0, 6865.0, 11258.0, 19158.0, 32801.0, 59991.0, 116925.0, 242424.0, 266236.0, 128537.0, 65607.0, 35467.0, 20391.0, 11862.0, 7301.0, 4562.0, 2784.0, 1862.0, 1147.0, 672.0, 465.0, 275.0, 189.0, 104.0, 74.0, 34.0, 33.0, 31.0, 20.0, 11.0, 3.0, 8.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.22021484375, -0.212890625, -0.20556640625, -0.1982421875, -0.19091796875, -0.18359375, -0.17626953125, -0.1689453125, -0.16162109375, -0.154296875, -0.14697265625, -0.1396484375, -0.13232421875, -0.125, -0.11767578125, -0.1103515625, -0.10302734375, -0.095703125, -0.08837890625, -0.0810546875, -0.07373046875, -0.06640625, -0.05908203125, -0.0517578125, -0.04443359375, -0.037109375, -0.02978515625, -0.0224609375, -0.01513671875, -0.0078125, -0.00048828125, 0.0068359375, 0.01416015625, 0.021484375, 0.02880859375, 0.0361328125, 0.04345703125, 0.05078125, 0.05810546875, 0.0654296875, 0.07275390625, 0.080078125, 0.08740234375, 0.0947265625, 0.10205078125, 0.109375, 0.11669921875, 0.1240234375, 0.13134765625, 0.138671875, 0.14599609375, 0.1533203125, 0.16064453125, 0.16796875, 0.17529296875, 0.1826171875, 0.18994140625, 0.197265625, 0.20458984375, 0.2119140625, 0.21923828125, 0.2265625, 0.23388671875, 0.2412109375, 0.24853515625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 3.0, 7.0, 8.0, 15.0, 18.0, 16.0, 19.0, 12.0, 26.0, 22.0, 17.0, 31.0, 22.0, 26.0, 40.0, 34.0, 33.0, 34.0, 41.0, 50.0, 1068.0, 56.0, 42.0, 33.0, 33.0, 36.0, 35.0, 27.0, 35.0, 20.0, 25.0, 15.0, 18.0, 23.0, 14.0, 18.0, 15.0, 8.0, 6.0, 5.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.92578125, -2.82659912109375, -2.7274169921875, -2.62823486328125, -2.529052734375, -2.42987060546875, -2.3306884765625, -2.23150634765625, -2.13232421875, -2.03314208984375, -1.9339599609375, -1.83477783203125, -1.735595703125, -1.63641357421875, -1.5372314453125, -1.43804931640625, -1.3388671875, -1.23968505859375, -1.1405029296875, -1.04132080078125, -0.942138671875, -0.84295654296875, -0.7437744140625, -0.64459228515625, -0.54541015625, -0.44622802734375, -0.3470458984375, -0.24786376953125, -0.148681640625, -0.04949951171875, 0.0496826171875, 0.14886474609375, 0.248046875, 0.34722900390625, 0.4464111328125, 0.54559326171875, 0.644775390625, 0.74395751953125, 0.8431396484375, 0.94232177734375, 1.04150390625, 1.14068603515625, 1.2398681640625, 1.33905029296875, 1.438232421875, 1.53741455078125, 1.6365966796875, 1.73577880859375, 1.8349609375, 1.93414306640625, 2.0333251953125, 2.13250732421875, 2.231689453125, 2.33087158203125, 2.4300537109375, 2.52923583984375, 2.62841796875, 2.72760009765625, 2.8267822265625, 2.92596435546875, 3.025146484375, 3.12432861328125, 3.2235107421875, 3.32269287109375, 3.421875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 9.0, 8.0, 7.0, 16.0, 31.0, 47.0, 83.0, 95.0, 140.0, 218.0, 309.0, 451.0, 648.0, 940.0, 1459.0, 2352.0, 3558.0, 5496.0, 8870.0, 14441.0, 23602.0, 40237.0, 69133.0, 119904.0, 219176.0, 1276391.0, 127539.0, 73053.0, 42656.0, 25163.0, 15367.0, 9294.0, 5736.0, 3590.0, 2431.0, 1568.0, 1016.0, 659.0, 433.0, 359.0, 214.0, 137.0, 98.0, 62.0, 40.0, 29.0, 20.0, 14.0, 10.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 0.0, 3.0], "bins": [-0.15234375, -0.14759063720703125, -0.1428375244140625, -0.13808441162109375, -0.133331298828125, -0.12857818603515625, -0.1238250732421875, -0.11907196044921875, -0.11431884765625, -0.10956573486328125, -0.1048126220703125, -0.10005950927734375, -0.095306396484375, -0.09055328369140625, -0.0858001708984375, -0.08104705810546875, -0.0762939453125, -0.07154083251953125, -0.0667877197265625, -0.06203460693359375, -0.057281494140625, -0.05252838134765625, -0.0477752685546875, -0.04302215576171875, -0.03826904296875, -0.03351593017578125, -0.0287628173828125, -0.02400970458984375, -0.019256591796875, -0.01450347900390625, -0.0097503662109375, -0.00499725341796875, -0.000244140625, 0.00450897216796875, 0.0092620849609375, 0.01401519775390625, 0.018768310546875, 0.02352142333984375, 0.0282745361328125, 0.03302764892578125, 0.03778076171875, 0.04253387451171875, 0.0472869873046875, 0.05204010009765625, 0.056793212890625, 0.06154632568359375, 0.0662994384765625, 0.07105255126953125, 0.0758056640625, 0.08055877685546875, 0.0853118896484375, 0.09006500244140625, 0.094818115234375, 0.09957122802734375, 0.1043243408203125, 0.10907745361328125, 0.11383056640625, 0.11858367919921875, 0.1233367919921875, 0.12808990478515625, 0.132843017578125, 0.13759613037109375, 0.1423492431640625, 0.14710235595703125, 0.15185546875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 9.0, 9.0, 4.0, 9.0, 15.0, 14.0, 12.0, 22.0, 17.0, 29.0, 46.0, 72.0, 149.0, 140.0, 125.0, 89.0, 57.0, 29.0, 27.0, 26.0, 7.0, 10.0, 4.0, 9.0, 8.0, 8.0, 6.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00022780895233154297, -0.00022038258612155914, -0.00021295621991157532, -0.0002055298537015915, -0.00019810348749160767, -0.00019067712128162384, -0.00018325075507164001, -0.0001758243888616562, -0.00016839802265167236, -0.00016097165644168854, -0.0001535452902317047, -0.00014611892402172089, -0.00013869255781173706, -0.00013126619160175323, -0.0001238398253917694, -0.00011641345918178558, -0.00010898709297180176, -0.00010156072676181793, -9.41343605518341e-05, -8.670799434185028e-05, -7.928162813186646e-05, -7.185526192188263e-05, -6.44288957118988e-05, -5.700252950191498e-05, -4.957616329193115e-05, -4.214979708194733e-05, -3.47234308719635e-05, -2.7297064661979675e-05, -1.987069845199585e-05, -1.2444332242012024e-05, -5.017966032028198e-06, 2.4084001779556274e-06, 9.834766387939453e-06, 1.726113259792328e-05, 2.4687498807907104e-05, 3.211386501789093e-05, 3.9540231227874756e-05, 4.696659743785858e-05, 5.439296364784241e-05, 6.181932985782623e-05, 6.924569606781006e-05, 7.667206227779388e-05, 8.409842848777771e-05, 9.152479469776154e-05, 9.895116090774536e-05, 0.00010637752711772919, 0.00011380389332771301, 0.00012123025953769684, 0.00012865662574768066, 0.0001360829919576645, 0.00014350935816764832, 0.00015093572437763214, 0.00015836209058761597, 0.0001657884567975998, 0.00017321482300758362, 0.00018064118921756744, 0.00018806755542755127, 0.0001954939216375351, 0.00020292028784751892, 0.00021034665405750275, 0.00021777302026748657, 0.0002251993864774704, 0.00023262575268745422, 0.00024005211889743805, 0.0002474784851074219]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 3.0, 8.0, 6.0, 10.0, 12.0, 19.0, 20.0, 17.0, 24.0, 45.0, 71.0, 107.0, 307.0, 1128.0, 10871.0, 787902.0, 240465.0, 6141.0, 802.0, 206.0, 133.0, 52.0, 47.0, 41.0, 26.0, 12.0, 13.0, 14.0, 8.0, 9.0, 4.0, 3.0, 4.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004001617431640625, -0.0038799643516540527, -0.0037583112716674805, -0.003636658191680908, -0.003515005111694336, -0.0033933520317077637, -0.0032716989517211914, -0.003150045871734619, -0.003028392791748047, -0.0029067397117614746, -0.0027850866317749023, -0.00266343355178833, -0.002541780471801758, -0.0024201273918151855, -0.0022984743118286133, -0.002176821231842041, -0.0020551681518554688, -0.0019335150718688965, -0.0018118619918823242, -0.001690208911895752, -0.0015685558319091797, -0.0014469027519226074, -0.0013252496719360352, -0.0012035965919494629, -0.0010819435119628906, -0.0009602904319763184, -0.0008386373519897461, -0.0007169842720031738, -0.0005953311920166016, -0.0004736781120300293, -0.00035202503204345703, -0.00023037195205688477, -0.0001087188720703125, 1.2934207916259766e-05, 0.00013458728790283203, 0.0002562403678894043, 0.00037789344787597656, 0.0004995465278625488, 0.0006211996078491211, 0.0007428526878356934, 0.0008645057678222656, 0.0009861588478088379, 0.0011078119277954102, 0.0012294650077819824, 0.0013511180877685547, 0.001472771167755127, 0.0015944242477416992, 0.0017160773277282715, 0.0018377304077148438, 0.001959383487701416, 0.0020810365676879883, 0.0022026896476745605, 0.002324342727661133, 0.002445995807647705, 0.0025676488876342773, 0.0026893019676208496, 0.002810955047607422, 0.002932608127593994, 0.0030542612075805664, 0.0031759142875671387, 0.003297567367553711, 0.003419220447540283, 0.0035408735275268555, 0.0036625266075134277, 0.0037841796875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 27.0, 39.0, 98.0, 277.0, 307.0, 150.0, 58.0, 30.0, 11.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002455570502206683, -0.0002312363649252802, -0.00021691566507797688, -0.00020259497978258878, -0.00018827427993528545, -0.00017395359463989735, -0.00015963290934450924, -0.00014531222404912114, -0.0001309915242018178, -0.0001166708316304721, -0.00010235013905912638, -8.802945376373827e-05, -7.370876119239256e-05, -5.938806862104684e-05, -4.506738332565874e-05, -3.074669075431302e-05, -1.6425998182967305e-05, -2.105307430610992e-06, 1.2215383321745321e-05, 2.653607225511223e-05, 4.085676482645795e-05, 5.5177457397803664e-05, 6.949814269319177e-05, 8.381883526453748e-05, 9.81395278358832e-05, 0.00011246022040722892, 0.00012678091297857463, 0.00014110159827396274, 0.00015542228356935084, 0.00016974298341665417, 0.00018406366871204227, 0.0001983843685593456, 0.0002127050538547337, 0.0002270257391501218, 0.00024134643899742514, 0.00025566713884472847, 0.00026998782414011657, 0.0002843085094355047, 0.0002986291947308928, 0.0003129498800262809, 0.00032727059442549944, 0.00034159127972088754, 0.00035591196501627564, 0.0003702326794154942, 0.0003845533647108823, 0.0003988740500062704, 0.0004131947353016585, 0.0004275154205970466, 0.0004418361058924347, 0.0004561567911878228, 0.0004704774764832109, 0.000484798161778599, 0.0004991188761778176, 0.0005134395323693752, 0.0005277602467685938, 0.0005420809611678123, 0.00055640161735937, 0.0005707223317585886, 0.0005850429879501462, 0.0005993637023493648, 0.0006136843585409224, 0.000628005072940141, 0.0006423257291316986, 0.0006566464435309172, 0.0006709671579301357]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 8.0, 7.0, 3.0, 3.0, 15.0, 17.0, 11.0, 12.0, 8.0, 27.0, 15.0, 18.0, 31.0, 29.0, 46.0, 36.0, 35.0, 32.0, 38.0, 53.0, 43.0, 36.0, 39.0, 29.0, 37.0, 31.0, 45.0, 35.0, 28.0, 32.0, 29.0, 21.0, 26.0, 15.0, 15.0, 13.0, 14.0, 7.0, 14.0, 11.0, 8.0, 10.0, 8.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.071826934814453e-05, -8.761603385210037e-05, -8.451379835605621e-05, -8.141156286001205e-05, -7.83093273639679e-05, -7.520709186792374e-05, -7.210485637187958e-05, -6.900262087583542e-05, -6.590038537979126e-05, -6.27981498837471e-05, -5.969591438770294e-05, -5.659367889165878e-05, -5.3491443395614624e-05, -5.0389207899570465e-05, -4.7286972403526306e-05, -4.418473690748215e-05, -4.108250141143799e-05, -3.798026591539383e-05, -3.487803041934967e-05, -3.177579492330551e-05, -2.8673559427261353e-05, -2.5571323931217194e-05, -2.2469088435173035e-05, -1.9366852939128876e-05, -1.6264617443084717e-05, -1.3162381947040558e-05, -1.0060146450996399e-05, -6.95791095495224e-06, -3.855675458908081e-06, -7.534399628639221e-07, 2.348795533180237e-06, 5.451031029224396e-06, 8.553266525268555e-06, 1.1655502021312714e-05, 1.4757737517356873e-05, 1.785997301340103e-05, 2.096220850944519e-05, 2.406444400548935e-05, 2.7166679501533508e-05, 3.0268914997577667e-05, 3.3371150493621826e-05, 3.6473385989665985e-05, 3.9575621485710144e-05, 4.26778569817543e-05, 4.578009247779846e-05, 4.888232797384262e-05, 5.198456346988678e-05, 5.508679896593094e-05, 5.81890344619751e-05, 6.129126995801926e-05, 6.439350545406342e-05, 6.749574095010757e-05, 7.059797644615173e-05, 7.370021194219589e-05, 7.680244743824005e-05, 7.990468293428421e-05, 8.300691843032837e-05, 8.610915392637253e-05, 8.921138942241669e-05, 9.231362491846085e-05, 9.5415860414505e-05, 9.851809591054916e-05, 0.00010162033140659332, 0.00010472256690263748, 0.00010782480239868164]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 6.0, 10.0, 11.0, 9.0, 9.0, 23.0, 18.0, 25.0, 26.0, 24.0, 35.0, 43.0, 45.0, 42.0, 37.0, 42.0, 43.0, 39.0, 34.0, 52.0, 44.0, 37.0, 45.0, 33.0, 42.0, 32.0, 23.0, 21.0, 16.0, 20.0, 28.0, 14.0, 13.0, 13.0, 7.0, 3.0, 12.0, 7.0, 6.0, 4.0, 4.0, 1.0, 3.0], "bins": [-6.1953125, -6.03692626953125, -5.8785400390625, -5.72015380859375, -5.561767578125, -5.40338134765625, -5.2449951171875, -5.08660888671875, -4.92822265625, -4.76983642578125, -4.6114501953125, -4.45306396484375, -4.294677734375, -4.13629150390625, -3.9779052734375, -3.81951904296875, -3.6611328125, -3.50274658203125, -3.3443603515625, -3.18597412109375, -3.027587890625, -2.86920166015625, -2.7108154296875, -2.55242919921875, -2.39404296875, -2.23565673828125, -2.0772705078125, -1.91888427734375, -1.760498046875, -1.60211181640625, -1.4437255859375, -1.28533935546875, -1.126953125, -0.96856689453125, -0.8101806640625, -0.65179443359375, -0.493408203125, -0.33502197265625, -0.1766357421875, -0.01824951171875, 0.14013671875, 0.29852294921875, 0.4569091796875, 0.61529541015625, 0.773681640625, 0.93206787109375, 1.0904541015625, 1.24884033203125, 1.4072265625, 1.56561279296875, 1.7239990234375, 1.88238525390625, 2.040771484375, 2.19915771484375, 2.3575439453125, 2.51593017578125, 2.67431640625, 2.83270263671875, 2.9910888671875, 3.14947509765625, 3.307861328125, 3.46624755859375, 3.6246337890625, 3.78302001953125, 3.94140625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 3.0, 2.0, 5.0, 4.0, 8.0, 11.0, 14.0, 14.0, 33.0, 42.0, 67.0, 73.0, 114.0, 134.0, 209.0, 286.0, 370.0, 507.0, 601.0, 820.0, 1082.0, 1392.0, 1836.0, 2648.0, 4260.0, 7782.0, 18129.0, 54260.0, 233401.0, 524242.0, 129270.0, 35439.0, 12969.0, 5977.0, 3423.0, 2277.0, 1642.0, 1277.0, 925.0, 751.0, 549.0, 449.0, 331.0, 265.0, 185.0, 135.0, 105.0, 66.0, 46.0, 40.0, 23.0, 27.0, 13.0, 15.0, 4.0, 5.0, 7.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.203125, -5.0421142578125, -4.881103515625, -4.7200927734375, -4.55908203125, -4.3980712890625, -4.237060546875, -4.0760498046875, -3.9150390625, -3.7540283203125, -3.593017578125, -3.4320068359375, -3.27099609375, -3.1099853515625, -2.948974609375, -2.7879638671875, -2.626953125, -2.4659423828125, -2.304931640625, -2.1439208984375, -1.98291015625, -1.8218994140625, -1.660888671875, -1.4998779296875, -1.3388671875, -1.1778564453125, -1.016845703125, -0.8558349609375, -0.69482421875, -0.5338134765625, -0.372802734375, -0.2117919921875, -0.05078125, 0.1102294921875, 0.271240234375, 0.4322509765625, 0.59326171875, 0.7542724609375, 0.915283203125, 1.0762939453125, 1.2373046875, 1.3983154296875, 1.559326171875, 1.7203369140625, 1.88134765625, 2.0423583984375, 2.203369140625, 2.3643798828125, 2.525390625, 2.6864013671875, 2.847412109375, 3.0084228515625, 3.16943359375, 3.3304443359375, 3.491455078125, 3.6524658203125, 3.8134765625, 3.9744873046875, 4.135498046875, 4.2965087890625, 4.45751953125, 4.6185302734375, 4.779541015625, 4.9405517578125, 5.1015625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 8.0, 8.0, 10.0, 21.0, 14.0, 19.0, 18.0, 23.0, 26.0, 40.0, 40.0, 55.0, 47.0, 57.0, 72.0, 85.0, 300.0, 1506.0, 168.0, 74.0, 62.0, 43.0, 45.0, 44.0, 33.0, 30.0, 28.0, 35.0, 18.0, 18.0, 12.0, 20.0, 13.0, 13.0, 8.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.82958984375, -15.2685546875, -14.70751953125, -14.146484375, -13.58544921875, -13.0244140625, -12.46337890625, -11.90234375, -11.34130859375, -10.7802734375, -10.21923828125, -9.658203125, -9.09716796875, -8.5361328125, -7.97509765625, -7.4140625, -6.85302734375, -6.2919921875, -5.73095703125, -5.169921875, -4.60888671875, -4.0478515625, -3.48681640625, -2.92578125, -2.36474609375, -1.8037109375, -1.24267578125, -0.681640625, -0.12060546875, 0.4404296875, 1.00146484375, 1.5625, 2.12353515625, 2.6845703125, 3.24560546875, 3.806640625, 4.36767578125, 4.9287109375, 5.48974609375, 6.05078125, 6.61181640625, 7.1728515625, 7.73388671875, 8.294921875, 8.85595703125, 9.4169921875, 9.97802734375, 10.5390625, 11.10009765625, 11.6611328125, 12.22216796875, 12.783203125, 13.34423828125, 13.9052734375, 14.46630859375, 15.02734375, 15.58837890625, 16.1494140625, 16.71044921875, 17.271484375, 17.83251953125, 18.3935546875, 18.95458984375, 19.515625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 7.0, 15.0, 19.0, 38.0, 69.0, 105.0, 223.0, 638.0, 4764.0, 3120020.0, 18358.0, 875.0, 289.0, 135.0, 70.0, 26.0, 21.0, 16.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-130.5, -127.4404296875, -124.380859375, -121.3212890625, -118.26171875, -115.2021484375, -112.142578125, -109.0830078125, -106.0234375, -102.9638671875, -99.904296875, -96.8447265625, -93.78515625, -90.7255859375, -87.666015625, -84.6064453125, -81.546875, -78.4873046875, -75.427734375, -72.3681640625, -69.30859375, -66.2490234375, -63.189453125, -60.1298828125, -57.0703125, -54.0107421875, -50.951171875, -47.8916015625, -44.83203125, -41.7724609375, -38.712890625, -35.6533203125, -32.59375, -29.5341796875, -26.474609375, -23.4150390625, -20.35546875, -17.2958984375, -14.236328125, -11.1767578125, -8.1171875, -5.0576171875, -1.998046875, 1.0615234375, 4.12109375, 7.1806640625, 10.240234375, 13.2998046875, 16.359375, 19.4189453125, 22.478515625, 25.5380859375, 28.59765625, 31.6572265625, 34.716796875, 37.7763671875, 40.8359375, 43.8955078125, 46.955078125, 50.0146484375, 53.07421875, 56.1337890625, 59.193359375, 62.2529296875, 65.3125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 10.0, 115.0, 702.0, 185.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.335866928100586, -19.8385009765625, -14.341134071350098, -8.843767166137695, -3.3464012145996094, 2.1509647369384766, 7.648332595825195, 13.145696640014648, 18.643064498901367, 24.140430450439453, 29.637798309326172, 35.135162353515625, 40.632530212402344, 46.12989807128906, 51.62726593017578, 57.12462615966797, 62.62199401855469, 68.1193618774414, 73.61672973632812, 79.11408996582031, 84.61145782470703, 90.10882568359375, 95.60619354248047, 101.10356140136719, 106.6009292602539, 112.09829711914062, 117.59566497802734, 123.09303283691406, 128.59039306640625, 134.0877685546875, 139.5851287841797, 145.08248901367188, 150.57984924316406, 156.07720947265625, 161.5745849609375, 167.0719451904297, 172.56932067871094, 178.06668090820312, 183.56405639648438, 189.06141662597656, 194.55877685546875, 200.05613708496094, 205.5535125732422, 211.05087280273438, 216.54824829101562, 222.0456085205078, 227.54296875, 233.04034423828125, 238.5377197265625, 244.0350799560547, 249.53245544433594, 255.02981567382812, 260.5271911621094, 266.0245361328125, 271.52191162109375, 277.019287109375, 282.5166320800781, 288.0140075683594, 293.5113525390625, 299.00872802734375, 304.506103515625, 310.00347900390625, 315.5008239746094, 320.9981994628906, 326.4955749511719]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 9.0, 4.0, 8.0, 3.0, 7.0, 14.0, 21.0, 21.0, 18.0, 24.0, 29.0, 38.0, 24.0, 34.0, 45.0, 48.0, 39.0, 39.0, 38.0, 43.0, 39.0, 42.0, 51.0, 30.0, 35.0, 36.0, 36.0, 29.0, 35.0, 36.0, 16.0, 13.0, 23.0, 20.0, 15.0, 11.0, 8.0, 3.0, 8.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-59.065223693847656, -57.421199798583984, -55.77717590332031, -54.133148193359375, -52.4891242980957, -50.84510040283203, -49.20107650756836, -47.55705261230469, -45.91302490234375, -44.26900100708008, -42.624977111816406, -40.98094940185547, -39.3369255065918, -37.692901611328125, -36.04887771606445, -34.40485382080078, -32.76082992553711, -31.116806030273438, -29.472780227661133, -27.82875633239746, -26.184730529785156, -24.540706634521484, -22.896682739257812, -21.25265884399414, -19.608633041381836, -17.964609146118164, -16.32058334350586, -14.676559448242188, -13.0325345993042, -11.388509750366211, -9.744485855102539, -8.10046100616455, -6.456439971923828, -4.81241512298584, -3.1683907508850098, -1.5243663787841797, 0.1196584701538086, 1.7636833190917969, 3.4077072143554688, 5.051732063293457, 6.695756912231445, 8.339781761169434, 9.983806610107422, 11.627830505371094, 13.271855354309082, 14.91588020324707, 16.559904098510742, 18.203929901123047, 19.84795379638672, 21.49197769165039, 23.136003494262695, 24.780027389526367, 26.424053192138672, 28.068077087402344, 29.712100982666016, 31.356124877929688, 33.000152587890625, 34.6441764831543, 36.28820037841797, 37.932228088378906, 39.57625198364258, 41.22027587890625, 42.86429977416992, 44.508323669433594, 46.152347564697266]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 7.0, 14.0, 7.0, 15.0, 20.0, 18.0, 19.0, 29.0, 36.0, 26.0, 32.0, 38.0, 42.0, 49.0, 46.0, 42.0, 36.0, 50.0, 43.0, 35.0, 35.0, 44.0, 32.0, 32.0, 26.0, 34.0, 24.0, 20.0, 18.0, 17.0, 20.0, 17.0, 8.0, 10.0, 13.0, 4.0, 5.0, 7.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.80859375, -5.6475830078125, -5.486572265625, -5.3255615234375, -5.16455078125, -5.0035400390625, -4.842529296875, -4.6815185546875, -4.5205078125, -4.3594970703125, -4.198486328125, -4.0374755859375, -3.87646484375, -3.7154541015625, -3.554443359375, -3.3934326171875, -3.232421875, -3.0714111328125, -2.910400390625, -2.7493896484375, -2.58837890625, -2.4273681640625, -2.266357421875, -2.1053466796875, -1.9443359375, -1.7833251953125, -1.622314453125, -1.4613037109375, -1.30029296875, -1.1392822265625, -0.978271484375, -0.8172607421875, -0.65625, -0.4952392578125, -0.334228515625, -0.1732177734375, -0.01220703125, 0.1488037109375, 0.309814453125, 0.4708251953125, 0.6318359375, 0.7928466796875, 0.953857421875, 1.1148681640625, 1.27587890625, 1.4368896484375, 1.597900390625, 1.7589111328125, 1.919921875, 2.0809326171875, 2.241943359375, 2.4029541015625, 2.56396484375, 2.7249755859375, 2.885986328125, 3.0469970703125, 3.2080078125, 3.3690185546875, 3.530029296875, 3.6910400390625, 3.85205078125, 4.0130615234375, 4.174072265625, 4.3350830078125, 4.49609375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 8.0, 5.0, 12.0, 22.0, 21.0, 31.0, 41.0, 64.0, 80.0, 128.0, 174.0, 247.0, 432.0, 693.0, 1218.0, 1999.0, 3469.0, 6152.0, 12369.0, 28056.0, 128047.0, 1286075.0, 2336097.0, 306298.0, 46138.0, 17010.0, 8497.0, 4519.0, 2632.0, 1504.0, 842.0, 525.0, 288.0, 202.0, 105.0, 84.0, 48.0, 35.0, 38.0, 19.0, 12.0, 14.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.09375, -10.7491455078125, -10.404541015625, -10.0599365234375, -9.71533203125, -9.3707275390625, -9.026123046875, -8.6815185546875, -8.3369140625, -7.9923095703125, -7.647705078125, -7.3031005859375, -6.95849609375, -6.6138916015625, -6.269287109375, -5.9246826171875, -5.580078125, -5.2354736328125, -4.890869140625, -4.5462646484375, -4.20166015625, -3.8570556640625, -3.512451171875, -3.1678466796875, -2.8232421875, -2.4786376953125, -2.134033203125, -1.7894287109375, -1.44482421875, -1.1002197265625, -0.755615234375, -0.4110107421875, -0.06640625, 0.2781982421875, 0.622802734375, 0.9674072265625, 1.31201171875, 1.6566162109375, 2.001220703125, 2.3458251953125, 2.6904296875, 3.0350341796875, 3.379638671875, 3.7242431640625, 4.06884765625, 4.4134521484375, 4.758056640625, 5.1026611328125, 5.447265625, 5.7918701171875, 6.136474609375, 6.4810791015625, 6.82568359375, 7.1702880859375, 7.514892578125, 7.8594970703125, 8.2041015625, 8.5487060546875, 8.893310546875, 9.2379150390625, 9.58251953125, 9.9271240234375, 10.271728515625, 10.6163330078125, 10.9609375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 10.0, 3.0, 5.0, 6.0, 8.0, 16.0, 18.0, 29.0, 25.0, 38.0, 52.0, 86.0, 74.0, 124.0, 211.0, 292.0, 402.0, 605.0, 551.0, 422.0, 325.0, 224.0, 141.0, 107.0, 58.0, 53.0, 29.0, 34.0, 23.0, 26.0, 13.0, 15.0, 6.0, 3.0, 6.0, 9.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8671875, -10.5172119140625, -10.167236328125, -9.8172607421875, -9.46728515625, -9.1173095703125, -8.767333984375, -8.4173583984375, -8.0673828125, -7.7174072265625, -7.367431640625, -7.0174560546875, -6.66748046875, -6.3175048828125, -5.967529296875, -5.6175537109375, -5.267578125, -4.9176025390625, -4.567626953125, -4.2176513671875, -3.86767578125, -3.5177001953125, -3.167724609375, -2.8177490234375, -2.4677734375, -2.1177978515625, -1.767822265625, -1.4178466796875, -1.06787109375, -0.7178955078125, -0.367919921875, -0.0179443359375, 0.33203125, 0.6820068359375, 1.031982421875, 1.3819580078125, 1.73193359375, 2.0819091796875, 2.431884765625, 2.7818603515625, 3.1318359375, 3.4818115234375, 3.831787109375, 4.1817626953125, 4.53173828125, 4.8817138671875, 5.231689453125, 5.5816650390625, 5.931640625, 6.2816162109375, 6.631591796875, 6.9815673828125, 7.33154296875, 7.6815185546875, 8.031494140625, 8.3814697265625, 8.7314453125, 9.0814208984375, 9.431396484375, 9.7813720703125, 10.13134765625, 10.4813232421875, 10.831298828125, 11.1812744140625, 11.53125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 9.0, 10.0, 11.0, 7.0, 19.0, 20.0, 28.0, 50.0, 61.0, 102.0, 234.0, 449.0, 933.0, 1982.0, 4529.0, 12012.0, 37308.0, 175480.0, 2620716.0, 1198573.0, 99832.0, 26223.0, 9008.0, 3499.0, 1518.0, 785.0, 379.0, 185.0, 113.0, 70.0, 37.0, 24.0, 22.0, 12.0, 9.0, 6.0, 5.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-21.609375, -20.9892578125, -20.369140625, -19.7490234375, -19.12890625, -18.5087890625, -17.888671875, -17.2685546875, -16.6484375, -16.0283203125, -15.408203125, -14.7880859375, -14.16796875, -13.5478515625, -12.927734375, -12.3076171875, -11.6875, -11.0673828125, -10.447265625, -9.8271484375, -9.20703125, -8.5869140625, -7.966796875, -7.3466796875, -6.7265625, -6.1064453125, -5.486328125, -4.8662109375, -4.24609375, -3.6259765625, -3.005859375, -2.3857421875, -1.765625, -1.1455078125, -0.525390625, 0.0947265625, 0.71484375, 1.3349609375, 1.955078125, 2.5751953125, 3.1953125, 3.8154296875, 4.435546875, 5.0556640625, 5.67578125, 6.2958984375, 6.916015625, 7.5361328125, 8.15625, 8.7763671875, 9.396484375, 10.0166015625, 10.63671875, 11.2568359375, 11.876953125, 12.4970703125, 13.1171875, 13.7373046875, 14.357421875, 14.9775390625, 15.59765625, 16.2177734375, 16.837890625, 17.4580078125, 18.078125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 17.0, 37.0, 79.0, 143.0, 235.0, 209.0, 136.0, 71.0, 29.0, 23.0, 10.0, 4.0, 2.0, 5.0, 2.0, 1.0], "bins": [-184.7446746826172, -181.25218200683594, -177.7596893310547, -174.26719665527344, -170.7747039794922, -167.28221130371094, -163.7897186279297, -160.2972412109375, -156.80474853515625, -153.312255859375, -149.81976318359375, -146.3272705078125, -142.83477783203125, -139.34228515625, -135.84979248046875, -132.3572998046875, -128.86480712890625, -125.372314453125, -121.87982177734375, -118.3873291015625, -114.89483642578125, -111.40234375, -107.90985870361328, -104.41736602783203, -100.92487335205078, -97.43238067626953, -93.93988800048828, -90.44739532470703, -86.95491027832031, -83.46241760253906, -79.96992492675781, -76.47743225097656, -72.98493957519531, -69.49244689941406, -65.99995422363281, -62.50746536254883, -59.01497268676758, -55.52248001098633, -52.029991149902344, -48.537498474121094, -45.04500198364258, -41.55250930786133, -38.060020446777344, -34.567527770996094, -31.075035095214844, -27.582542419433594, -24.090051651000977, -20.59756088256836, -17.10506820678711, -13.612576484680176, -10.120084762573242, -6.627593040466309, -3.135101318359375, 0.357391357421875, 3.849882125854492, 7.342372894287109, 10.83486557006836, 14.327357292175293, 17.819849014282227, 21.312339782714844, 24.804832458496094, 28.297325134277344, 31.78981590270996, 35.28230667114258, 38.77479934692383]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 9.0, 8.0, 7.0, 13.0, 16.0, 14.0, 12.0, 15.0, 24.0, 24.0, 29.0, 32.0, 33.0, 38.0, 46.0, 32.0, 47.0, 32.0, 49.0, 37.0, 43.0, 31.0, 47.0, 41.0, 28.0, 31.0, 34.0, 18.0, 27.0, 19.0, 22.0, 18.0, 21.0, 23.0, 12.0, 17.0, 8.0, 6.0, 8.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.559051513671875, -36.393348693847656, -35.2276496887207, -34.061946868896484, -32.896244049072266, -31.73054313659668, -30.564842224121094, -29.399139404296875, -28.23343849182129, -27.067737579345703, -25.902034759521484, -24.7363338470459, -23.570632934570312, -22.404930114746094, -21.239229202270508, -20.073528289794922, -18.907825469970703, -17.742124557495117, -16.5764217376709, -15.410720825195312, -14.24501895904541, -13.079317092895508, -11.913616180419922, -10.74791431427002, -9.582212448120117, -8.416510581970215, -7.250809192657471, -6.085107803344727, -4.919405937194824, -3.753704071044922, -2.5880026817321777, -1.4223012924194336, -0.2565956115722656, 0.9091060161590576, 2.074807643890381, 3.240509271621704, 4.406210899353027, 5.57191276550293, 6.737614154815674, 7.903315544128418, 9.06901741027832, 10.234719276428223, 11.400421142578125, 12.566122055053711, 13.731823921203613, 14.897525787353516, 16.0632266998291, 17.228927612304688, 18.394630432128906, 19.560331344604492, 20.72603416442871, 21.891735076904297, 23.057437896728516, 24.2231388092041, 25.388839721679688, 26.554542541503906, 27.720243453979492, 28.885944366455078, 30.051647186279297, 31.217348098754883, 32.38304901123047, 33.54875183105469, 34.714454650878906, 35.88015365600586, 37.04585647583008]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 2.0, 5.0, 9.0, 3.0, 12.0, 12.0, 11.0, 10.0, 19.0, 17.0, 19.0, 22.0, 25.0, 28.0, 31.0, 27.0, 28.0, 34.0, 37.0, 48.0, 40.0, 35.0, 45.0, 49.0, 31.0, 31.0, 45.0, 38.0, 29.0, 27.0, 30.0, 23.0, 28.0, 21.0, 20.0, 17.0, 15.0, 11.0, 5.0, 8.0, 11.0, 4.0, 5.0, 5.0, 5.0, 7.0, 3.0, 4.0, 1.0, 3.0], "bins": [-5.28515625, -5.1380615234375, -4.990966796875, -4.8438720703125, -4.69677734375, -4.5496826171875, -4.402587890625, -4.2554931640625, -4.1083984375, -3.9613037109375, -3.814208984375, -3.6671142578125, -3.52001953125, -3.3729248046875, -3.225830078125, -3.0787353515625, -2.931640625, -2.7845458984375, -2.637451171875, -2.4903564453125, -2.34326171875, -2.1961669921875, -2.049072265625, -1.9019775390625, -1.7548828125, -1.6077880859375, -1.460693359375, -1.3135986328125, -1.16650390625, -1.0194091796875, -0.872314453125, -0.7252197265625, -0.578125, -0.4310302734375, -0.283935546875, -0.1368408203125, 0.01025390625, 0.1573486328125, 0.304443359375, 0.4515380859375, 0.5986328125, 0.7457275390625, 0.892822265625, 1.0399169921875, 1.18701171875, 1.3341064453125, 1.481201171875, 1.6282958984375, 1.775390625, 1.9224853515625, 2.069580078125, 2.2166748046875, 2.36376953125, 2.5108642578125, 2.657958984375, 2.8050537109375, 2.9521484375, 3.0992431640625, 3.246337890625, 3.3934326171875, 3.54052734375, 3.6876220703125, 3.834716796875, 3.9818115234375, 4.12890625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 11.0, 11.0, 15.0, 21.0, 37.0, 42.0, 79.0, 102.0, 169.0, 232.0, 356.0, 526.0, 801.0, 1194.0, 1800.0, 2705.0, 4136.0, 6257.0, 9622.0, 15167.0, 24159.0, 38024.0, 63540.0, 111522.0, 213159.0, 239972.0, 127398.0, 70947.0, 42724.0, 25973.0, 16767.0, 10840.0, 7121.0, 4463.0, 2863.0, 1891.0, 1277.0, 865.0, 556.0, 383.0, 256.0, 176.0, 112.0, 88.0, 51.0, 51.0, 21.0, 25.0, 16.0, 13.0, 7.0, 12.0, 2.0, 3.0], "bins": [-0.2193603515625, -0.21311187744140625, -0.2068634033203125, -0.20061492919921875, -0.194366455078125, -0.18811798095703125, -0.1818695068359375, -0.17562103271484375, -0.16937255859375, -0.16312408447265625, -0.1568756103515625, -0.15062713623046875, -0.144378662109375, -0.13813018798828125, -0.1318817138671875, -0.12563323974609375, -0.119384765625, -0.11313629150390625, -0.1068878173828125, -0.10063934326171875, -0.094390869140625, -0.08814239501953125, -0.0818939208984375, -0.07564544677734375, -0.06939697265625, -0.06314849853515625, -0.0569000244140625, -0.05065155029296875, -0.044403076171875, -0.03815460205078125, -0.0319061279296875, -0.02565765380859375, -0.0194091796875, -0.01316070556640625, -0.0069122314453125, -0.00066375732421875, 0.005584716796875, 0.01183319091796875, 0.0180816650390625, 0.02433013916015625, 0.03057861328125, 0.03682708740234375, 0.0430755615234375, 0.04932403564453125, 0.055572509765625, 0.06182098388671875, 0.0680694580078125, 0.07431793212890625, 0.08056640625, 0.08681488037109375, 0.0930633544921875, 0.09931182861328125, 0.105560302734375, 0.11180877685546875, 0.1180572509765625, 0.12430572509765625, 0.13055419921875, 0.13680267333984375, 0.1430511474609375, 0.14929962158203125, 0.155548095703125, 0.16179656982421875, 0.1680450439453125, 0.17429351806640625, 0.1805419921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 6.0, 8.0, 1.0, 6.0, 6.0, 11.0, 16.0, 24.0, 25.0, 20.0, 23.0, 34.0, 30.0, 33.0, 48.0, 45.0, 35.0, 46.0, 42.0, 1065.0, 39.0, 42.0, 56.0, 56.0, 50.0, 41.0, 31.0, 36.0, 25.0, 24.0, 20.0, 18.0, 10.0, 20.0, 13.0, 4.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 2.0], "bins": [-4.875, -4.754425048828125, -4.63385009765625, -4.513275146484375, -4.3927001953125, -4.272125244140625, -4.15155029296875, -4.030975341796875, -3.910400390625, -3.789825439453125, -3.66925048828125, -3.548675537109375, -3.4281005859375, -3.307525634765625, -3.18695068359375, -3.066375732421875, -2.94580078125, -2.825225830078125, -2.70465087890625, -2.584075927734375, -2.4635009765625, -2.342926025390625, -2.22235107421875, -2.101776123046875, -1.981201171875, -1.860626220703125, -1.74005126953125, -1.619476318359375, -1.4989013671875, -1.378326416015625, -1.25775146484375, -1.137176513671875, -1.0166015625, -0.896026611328125, -0.77545166015625, -0.654876708984375, -0.5343017578125, -0.413726806640625, -0.29315185546875, -0.172576904296875, -0.052001953125, 0.068572998046875, 0.18914794921875, 0.309722900390625, 0.4302978515625, 0.550872802734375, 0.67144775390625, 0.792022705078125, 0.91259765625, 1.033172607421875, 1.15374755859375, 1.274322509765625, 1.3948974609375, 1.515472412109375, 1.63604736328125, 1.756622314453125, 1.877197265625, 1.997772216796875, 2.11834716796875, 2.238922119140625, 2.3594970703125, 2.480072021484375, 2.60064697265625, 2.721221923828125, 2.841796875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 9.0, 4.0, 7.0, 13.0, 17.0, 29.0, 50.0, 78.0, 106.0, 163.0, 234.0, 315.0, 527.0, 783.0, 1087.0, 1690.0, 2607.0, 3915.0, 6134.0, 9869.0, 15997.0, 26937.0, 45851.0, 80982.0, 148291.0, 1298643.0, 196710.0, 107327.0, 59694.0, 34228.0, 20467.0, 12401.0, 7753.0, 4880.0, 3203.0, 2074.0, 1366.0, 872.0, 610.0, 382.0, 297.0, 184.0, 132.0, 88.0, 41.0, 32.0, 19.0, 14.0, 9.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1612548828125, -0.1561737060546875, -0.151092529296875, -0.1460113525390625, -0.14093017578125, -0.1358489990234375, -0.130767822265625, -0.1256866455078125, -0.12060546875, -0.1155242919921875, -0.110443115234375, -0.1053619384765625, -0.10028076171875, -0.0951995849609375, -0.090118408203125, -0.0850372314453125, -0.0799560546875, -0.0748748779296875, -0.069793701171875, -0.0647125244140625, -0.05963134765625, -0.0545501708984375, -0.049468994140625, -0.0443878173828125, -0.039306640625, -0.0342254638671875, -0.029144287109375, -0.0240631103515625, -0.01898193359375, -0.0139007568359375, -0.008819580078125, -0.0037384033203125, 0.0013427734375, 0.0064239501953125, 0.011505126953125, 0.0165863037109375, 0.02166748046875, 0.0267486572265625, 0.031829833984375, 0.0369110107421875, 0.0419921875, 0.0470733642578125, 0.052154541015625, 0.0572357177734375, 0.06231689453125, 0.0673980712890625, 0.072479248046875, 0.0775604248046875, 0.0826416015625, 0.0877227783203125, 0.092803955078125, 0.0978851318359375, 0.10296630859375, 0.1080474853515625, 0.113128662109375, 0.1182098388671875, 0.123291015625, 0.1283721923828125, 0.133453369140625, 0.1385345458984375, 0.14361572265625, 0.1486968994140625, 0.153778076171875, 0.1588592529296875, 0.1639404296875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 5.0, 10.0, 12.0, 25.0, 31.0, 41.0, 51.0, 108.0, 132.0, 167.0, 138.0, 83.0, 59.0, 31.0, 24.0, 18.0, 14.0, 5.0, 6.0, 6.0, 5.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.0002617835998535156, -0.0002547726035118103, -0.000247761607170105, -0.00024075061082839966, -0.00023373961448669434, -0.00022672861814498901, -0.0002197176218032837, -0.00021270662546157837, -0.00020569562911987305, -0.00019868463277816772, -0.0001916736364364624, -0.00018466264009475708, -0.00017765164375305176, -0.00017064064741134644, -0.0001636296510696411, -0.0001566186547279358, -0.00014960765838623047, -0.00014259666204452515, -0.00013558566570281982, -0.0001285746693611145, -0.00012156367301940918, -0.00011455267667770386, -0.00010754168033599854, -0.00010053068399429321, -9.351968765258789e-05, -8.650869131088257e-05, -7.949769496917725e-05, -7.248669862747192e-05, -6.54757022857666e-05, -5.846470594406128e-05, -5.145370960235596e-05, -4.4442713260650635e-05, -3.743171691894531e-05, -3.042072057723999e-05, -2.3409724235534668e-05, -1.6398727893829346e-05, -9.387731552124023e-06, -2.376735210418701e-06, 4.634261131286621e-06, 1.1645257472991943e-05, 1.8656253814697266e-05, 2.5667250156402588e-05, 3.267824649810791e-05, 3.968924283981323e-05, 4.6700239181518555e-05, 5.371123552322388e-05, 6.07222318649292e-05, 6.773322820663452e-05, 7.474422454833984e-05, 8.175522089004517e-05, 8.876621723175049e-05, 9.577721357345581e-05, 0.00010278820991516113, 0.00010979920625686646, 0.00011681020259857178, 0.0001238211989402771, 0.00013083219528198242, 0.00013784319162368774, 0.00014485418796539307, 0.0001518651843070984, 0.0001588761806488037, 0.00016588717699050903, 0.00017289817333221436, 0.00017990916967391968, 0.000186920166015625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 9.0, 7.0, 15.0, 13.0, 18.0, 29.0, 41.0, 55.0, 126.0, 243.0, 1031.0, 24858.0, 996105.0, 24453.0, 971.0, 231.0, 120.0, 52.0, 48.0, 34.0, 19.0, 18.0, 11.0, 7.0, 7.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0031185150146484375, -0.0030008256435394287, -0.00288313627243042, -0.002765446901321411, -0.0026477575302124023, -0.0025300681591033936, -0.0024123787879943848, -0.002294689416885376, -0.002177000045776367, -0.0020593106746673584, -0.0019416213035583496, -0.0018239319324493408, -0.001706242561340332, -0.0015885531902313232, -0.0014708638191223145, -0.0013531744480133057, -0.0012354850769042969, -0.001117795705795288, -0.0010001063346862793, -0.0008824169635772705, -0.0007647275924682617, -0.0006470382213592529, -0.0005293488502502441, -0.00041165947914123535, -0.00029397010803222656, -0.00017628073692321777, -5.8591365814208984e-05, 5.9098005294799805e-05, 0.0001767873764038086, 0.0002944767475128174, 0.00041216611862182617, 0.000529855489730835, 0.0006475448608398438, 0.0007652342319488525, 0.0008829236030578613, 0.0010006129741668701, 0.001118302345275879, 0.0012359917163848877, 0.0013536810874938965, 0.0014713704586029053, 0.001589059829711914, 0.0017067492008209229, 0.0018244385719299316, 0.0019421279430389404, 0.0020598173141479492, 0.002177506685256958, 0.002295196056365967, 0.0024128854274749756, 0.0025305747985839844, 0.002648264169692993, 0.002765953540802002, 0.0028836429119110107, 0.0030013322830200195, 0.0031190216541290283, 0.003236711025238037, 0.003354400396347046, 0.0034720897674560547, 0.0035897791385650635, 0.0037074685096740723, 0.003825157880783081, 0.00394284725189209, 0.004060536623001099, 0.004178225994110107, 0.004295915365219116, 0.004413604736328125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 10.0, 73.0, 585.0, 316.0, 31.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012557857553474605, -9.938875155057758e-05, -7.319892756640911e-05, -4.700910358224064e-05, -2.081927959807217e-05, 5.370544386096299e-06, 3.156036837026477e-05, 5.775019235443324e-05, 8.394001633860171e-05, 0.00011012984032277018, 0.00013631966430693865, 0.00016250948829110712, 0.0001886993122752756, 0.00021488913625944406, 0.00024107896024361253, 0.0002672687987796962, 0.00029345860821194947, 0.0003196484176442027, 0.0003458382561802864, 0.0003720280947163701, 0.00039821790414862335, 0.0004244077135808766, 0.0004505975521169603, 0.000476787390653044, 0.0005029771709814668, 0.0005291670095175505, 0.0005553568480536342, 0.000581546628382057, 0.0006077364669181406, 0.0006339263054542243, 0.0006601160857826471, 0.0006863059243187308, 0.0007124957628548145, 0.0007386856013908982, 0.0007648754399269819, 0.0007910652202554047, 0.0008172550587914884, 0.0008434448973275721, 0.0008696346776559949, 0.0008958245161920786, 0.0009220143547281623, 0.000948204193264246, 0.0009743940318003297, 0.0010005838703364134, 0.0010267735924571753, 0.001052963430993259, 0.0010791532695293427, 0.0011053431080654263, 0.00113153294660151, 0.0011577227851375937, 0.0011839126236736774, 0.0012101024622097611, 0.0012362923007458448, 0.0012624820228666067, 0.0012886718614026904, 0.0013148616999387741, 0.0013410515384748578, 0.0013672413770109415, 0.0013934312155470252, 0.001419621054083109, 0.0014458107762038708, 0.0014720006147399545, 0.0014981904532760382, 0.0015243802918121219, 0.0015505701303482056]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 10.0, 14.0, 11.0, 19.0, 23.0, 26.0, 29.0, 36.0, 35.0, 40.0, 39.0, 32.0, 34.0, 53.0, 47.0, 48.0, 60.0, 42.0, 55.0, 57.0, 46.0, 38.0, 38.0, 41.0, 28.0, 27.0, 14.0, 19.0, 10.0, 10.0, 10.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.906291961669922e-05, -9.575486183166504e-05, -9.244680404663086e-05, -8.913874626159668e-05, -8.58306884765625e-05, -8.252263069152832e-05, -7.921457290649414e-05, -7.590651512145996e-05, -7.259845733642578e-05, -6.92903995513916e-05, -6.598234176635742e-05, -6.267428398132324e-05, -5.936622619628906e-05, -5.605816841125488e-05, -5.27501106262207e-05, -4.9442052841186523e-05, -4.6133995056152344e-05, -4.2825937271118164e-05, -3.9517879486083984e-05, -3.6209821701049805e-05, -3.2901763916015625e-05, -2.9593706130981445e-05, -2.6285648345947266e-05, -2.2977590560913086e-05, -1.9669532775878906e-05, -1.6361474990844727e-05, -1.3053417205810547e-05, -9.745359420776367e-06, -6.4373016357421875e-06, -3.129243850708008e-06, 1.7881393432617188e-07, 3.4868717193603516e-06, 6.794929504394531e-06, 1.0102987289428711e-05, 1.341104507446289e-05, 1.671910285949707e-05, 2.002716064453125e-05, 2.333521842956543e-05, 2.664327621459961e-05, 2.995133399963379e-05, 3.325939178466797e-05, 3.656744956970215e-05, 3.987550735473633e-05, 4.318356513977051e-05, 4.649162292480469e-05, 4.979968070983887e-05, 5.310773849487305e-05, 5.6415796279907227e-05, 5.9723854064941406e-05, 6.303191184997559e-05, 6.633996963500977e-05, 6.964802742004395e-05, 7.295608520507812e-05, 7.62641429901123e-05, 7.957220077514648e-05, 8.288025856018066e-05, 8.618831634521484e-05, 8.949637413024902e-05, 9.28044319152832e-05, 9.611248970031738e-05, 9.942054748535156e-05, 0.00010272860527038574, 0.00010603666305541992, 0.0001093447208404541, 0.00011265277862548828]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 2.0, 5.0, 9.0, 3.0, 12.0, 12.0, 11.0, 10.0, 19.0, 17.0, 19.0, 22.0, 25.0, 28.0, 31.0, 27.0, 28.0, 34.0, 37.0, 48.0, 40.0, 35.0, 45.0, 49.0, 31.0, 31.0, 45.0, 38.0, 29.0, 27.0, 30.0, 23.0, 28.0, 21.0, 20.0, 17.0, 15.0, 11.0, 5.0, 8.0, 11.0, 4.0, 5.0, 5.0, 5.0, 7.0, 3.0, 4.0, 1.0, 3.0], "bins": [-5.28515625, -5.1380615234375, -4.990966796875, -4.8438720703125, -4.69677734375, -4.5496826171875, -4.402587890625, -4.2554931640625, -4.1083984375, -3.9613037109375, -3.814208984375, -3.6671142578125, -3.52001953125, -3.3729248046875, -3.225830078125, -3.0787353515625, -2.931640625, -2.7845458984375, -2.637451171875, -2.4903564453125, -2.34326171875, -2.1961669921875, -2.049072265625, -1.9019775390625, -1.7548828125, -1.6077880859375, -1.460693359375, -1.3135986328125, -1.16650390625, -1.0194091796875, -0.872314453125, -0.7252197265625, -0.578125, -0.4310302734375, -0.283935546875, -0.1368408203125, 0.01025390625, 0.1573486328125, 0.304443359375, 0.4515380859375, 0.5986328125, 0.7457275390625, 0.892822265625, 1.0399169921875, 1.18701171875, 1.3341064453125, 1.481201171875, 1.6282958984375, 1.775390625, 1.9224853515625, 2.069580078125, 2.2166748046875, 2.36376953125, 2.5108642578125, 2.657958984375, 2.8050537109375, 2.9521484375, 3.0992431640625, 3.246337890625, 3.3934326171875, 3.54052734375, 3.6876220703125, 3.834716796875, 3.9818115234375, 4.12890625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 7.0, 3.0, 4.0, 10.0, 9.0, 7.0, 19.0, 15.0, 27.0, 49.0, 61.0, 109.0, 178.0, 347.0, 621.0, 1136.0, 1990.0, 3747.0, 7852.0, 20973.0, 84973.0, 518478.0, 325726.0, 53687.0, 15313.0, 6250.0, 3096.0, 1674.0, 925.0, 495.0, 286.0, 165.0, 120.0, 58.0, 32.0, 43.0, 11.0, 12.0, 11.0, 11.0, 10.0, 13.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.3203125, -9.05291748046875, -8.7855224609375, -8.51812744140625, -8.250732421875, -7.98333740234375, -7.7159423828125, -7.44854736328125, -7.18115234375, -6.91375732421875, -6.6463623046875, -6.37896728515625, -6.111572265625, -5.84417724609375, -5.5767822265625, -5.30938720703125, -5.0419921875, -4.77459716796875, -4.5072021484375, -4.23980712890625, -3.972412109375, -3.70501708984375, -3.4376220703125, -3.17022705078125, -2.90283203125, -2.63543701171875, -2.3680419921875, -2.10064697265625, -1.833251953125, -1.56585693359375, -1.2984619140625, -1.03106689453125, -0.763671875, -0.49627685546875, -0.2288818359375, 0.03851318359375, 0.305908203125, 0.57330322265625, 0.8406982421875, 1.10809326171875, 1.37548828125, 1.64288330078125, 1.9102783203125, 2.17767333984375, 2.445068359375, 2.71246337890625, 2.9798583984375, 3.24725341796875, 3.5146484375, 3.78204345703125, 4.0494384765625, 4.31683349609375, 4.584228515625, 4.85162353515625, 5.1190185546875, 5.38641357421875, 5.65380859375, 5.92120361328125, 6.1885986328125, 6.45599365234375, 6.723388671875, 6.99078369140625, 7.2581787109375, 7.52557373046875, 7.79296875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 5.0, 12.0, 14.0, 13.0, 22.0, 13.0, 18.0, 29.0, 35.0, 37.0, 44.0, 48.0, 63.0, 79.0, 140.0, 390.0, 1444.0, 173.0, 88.0, 54.0, 56.0, 38.0, 34.0, 37.0, 32.0, 28.0, 20.0, 15.0, 12.0, 17.0, 3.0, 5.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-24.890625, -24.236083984375, -23.58154296875, -22.927001953125, -22.2724609375, -21.617919921875, -20.96337890625, -20.308837890625, -19.654296875, -18.999755859375, -18.34521484375, -17.690673828125, -17.0361328125, -16.381591796875, -15.72705078125, -15.072509765625, -14.41796875, -13.763427734375, -13.10888671875, -12.454345703125, -11.7998046875, -11.145263671875, -10.49072265625, -9.836181640625, -9.181640625, -8.527099609375, -7.87255859375, -7.218017578125, -6.5634765625, -5.908935546875, -5.25439453125, -4.599853515625, -3.9453125, -3.290771484375, -2.63623046875, -1.981689453125, -1.3271484375, -0.672607421875, -0.01806640625, 0.636474609375, 1.291015625, 1.945556640625, 2.60009765625, 3.254638671875, 3.9091796875, 4.563720703125, 5.21826171875, 5.872802734375, 6.52734375, 7.181884765625, 7.83642578125, 8.490966796875, 9.1455078125, 9.800048828125, 10.45458984375, 11.109130859375, 11.763671875, 12.418212890625, 13.07275390625, 13.727294921875, 14.3818359375, 15.036376953125, 15.69091796875, 16.345458984375, 17.0]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 9.0, 5.0, 3.0, 4.0, 9.0, 10.0, 7.0, 17.0, 23.0, 31.0, 44.0, 55.0, 59.0, 101.0, 152.0, 224.0, 372.0, 892.0, 6559.0, 1615961.0, 1512765.0, 6454.0, 893.0, 353.0, 198.0, 150.0, 94.0, 64.0, 54.0, 28.0, 35.0, 19.0, 14.0, 13.0, 11.0, 9.0, 8.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.15625, -35.60791015625, -34.0595703125, -32.51123046875, -30.962890625, -29.41455078125, -27.8662109375, -26.31787109375, -24.76953125, -23.22119140625, -21.6728515625, -20.12451171875, -18.576171875, -17.02783203125, -15.4794921875, -13.93115234375, -12.3828125, -10.83447265625, -9.2861328125, -7.73779296875, -6.189453125, -4.64111328125, -3.0927734375, -1.54443359375, 0.00390625, 1.55224609375, 3.1005859375, 4.64892578125, 6.197265625, 7.74560546875, 9.2939453125, 10.84228515625, 12.390625, 13.93896484375, 15.4873046875, 17.03564453125, 18.583984375, 20.13232421875, 21.6806640625, 23.22900390625, 24.77734375, 26.32568359375, 27.8740234375, 29.42236328125, 30.970703125, 32.51904296875, 34.0673828125, 35.61572265625, 37.1640625, 38.71240234375, 40.2607421875, 41.80908203125, 43.357421875, 44.90576171875, 46.4541015625, 48.00244140625, 49.55078125, 51.09912109375, 52.6474609375, 54.19580078125, 55.744140625, 57.29248046875, 58.8408203125, 60.38916015625, 61.9375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 88.0, 734.0, 187.0, 6.0], "bins": [-352.61859130859375, -346.8965759277344, -341.174560546875, -335.4525146484375, -329.7304992675781, -324.00848388671875, -318.2864685058594, -312.564453125, -306.8424072265625, -301.1203918457031, -295.39837646484375, -289.67633056640625, -283.9543151855469, -278.2322998046875, -272.5102844238281, -266.78826904296875, -261.0662536621094, -255.34423828125, -249.62220764160156, -243.9001922607422, -238.17816162109375, -232.45614624023438, -226.734130859375, -221.01210021972656, -215.29006958007812, -209.56805419921875, -203.8460235595703, -198.12400817871094, -192.4019775390625, -186.67996215820312, -180.95794677734375, -175.2359161376953, -169.51390075683594, -163.79188537597656, -158.06985473632812, -152.34783935546875, -146.6258087158203, -140.90379333496094, -135.1817626953125, -129.45974731445312, -123.73772430419922, -118.01570129394531, -112.2936782836914, -106.5716552734375, -100.84963989257812, -95.12761688232422, -89.40559387207031, -83.68357849121094, -77.9615478515625, -72.2395248413086, -66.51750183105469, -60.79548263549805, -55.073463439941406, -49.3514404296875, -43.629417419433594, -37.90739822387695, -32.18537521362305, -26.463354110717773, -20.7413330078125, -15.019309997558594, -9.29728889465332, -3.575267791748047, 2.1467552185058594, 7.8687744140625, 13.59079647064209]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 11.0, 8.0, 23.0, 11.0, 14.0, 17.0, 17.0, 21.0, 34.0, 23.0, 23.0, 34.0, 26.0, 29.0, 44.0, 55.0, 43.0, 38.0, 43.0, 51.0, 45.0, 36.0, 39.0, 37.0, 38.0, 41.0, 41.0, 24.0, 25.0, 22.0, 13.0, 21.0, 18.0, 10.0, 6.0, 6.0, 6.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-52.89966583251953, -51.41289520263672, -49.926124572753906, -48.439353942871094, -46.95258712768555, -45.465816497802734, -43.97904586791992, -42.49227523803711, -41.0055046081543, -39.518733978271484, -38.03196334838867, -36.545196533203125, -35.05842590332031, -33.5716552734375, -32.08488464355469, -30.598114013671875, -29.111345291137695, -27.624574661254883, -26.137805938720703, -24.65103530883789, -23.164264678955078, -21.677494049072266, -20.190725326538086, -18.703954696655273, -17.217185974121094, -15.730416297912598, -14.243645668029785, -12.756875991821289, -11.270105361938477, -9.78333568572998, -8.296566009521484, -6.809795379638672, -5.323024749755859, -3.836254596710205, -2.34948468208313, -0.8627147674560547, 0.6240553855895996, 2.110825538635254, 3.59759521484375, 5.0843658447265625, 6.571135520935059, 8.057905197143555, 9.544675827026367, 11.031445503234863, 12.51821517944336, 14.004985809326172, 15.491755485534668, 16.978527069091797, 18.465295791625977, 19.95206642150879, 21.43883514404297, 22.92560577392578, 24.412376403808594, 25.899147033691406, 27.385915756225586, 28.8726863861084, 30.359455108642578, 31.84622573852539, 33.3329963684082, 34.81976318359375, 36.30653381347656, 37.793304443359375, 39.28007507324219, 40.766845703125, 42.25361633300781]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 6.0, 6.0, 7.0, 7.0, 22.0, 9.0, 8.0, 22.0, 22.0, 12.0, 22.0, 28.0, 31.0, 27.0, 25.0, 26.0, 40.0, 39.0, 51.0, 36.0, 42.0, 48.0, 39.0, 37.0, 35.0, 38.0, 21.0, 32.0, 29.0, 34.0, 27.0, 18.0, 30.0, 15.0, 12.0, 13.0, 12.0, 10.0, 7.0, 7.0, 8.0, 8.0, 4.0, 6.0, 5.0, 1.0, 1.0, 5.0, 3.0], "bins": [-5.55078125, -5.39544677734375, -5.2401123046875, -5.08477783203125, -4.929443359375, -4.77410888671875, -4.6187744140625, -4.46343994140625, -4.30810546875, -4.15277099609375, -3.9974365234375, -3.84210205078125, -3.686767578125, -3.53143310546875, -3.3760986328125, -3.22076416015625, -3.0654296875, -2.91009521484375, -2.7547607421875, -2.59942626953125, -2.444091796875, -2.28875732421875, -2.1334228515625, -1.97808837890625, -1.82275390625, -1.66741943359375, -1.5120849609375, -1.35675048828125, -1.201416015625, -1.04608154296875, -0.8907470703125, -0.73541259765625, -0.580078125, -0.42474365234375, -0.2694091796875, -0.11407470703125, 0.041259765625, 0.19659423828125, 0.3519287109375, 0.50726318359375, 0.66259765625, 0.81793212890625, 0.9732666015625, 1.12860107421875, 1.283935546875, 1.43927001953125, 1.5946044921875, 1.74993896484375, 1.9052734375, 2.06060791015625, 2.2159423828125, 2.37127685546875, 2.526611328125, 2.68194580078125, 2.8372802734375, 2.99261474609375, 3.14794921875, 3.30328369140625, 3.4586181640625, 3.61395263671875, 3.769287109375, 3.92462158203125, 4.0799560546875, 4.23529052734375, 4.390625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 4.0, 5.0, 4.0, 6.0, 6.0, 14.0, 18.0, 23.0, 21.0, 26.0, 39.0, 58.0, 85.0, 186.0, 378.0, 807.0, 1846.0, 4540.0, 12566.0, 49740.0, 1125193.0, 2839130.0, 127165.0, 20221.0, 6907.0, 2847.0, 1156.0, 574.0, 267.0, 139.0, 78.0, 50.0, 33.0, 27.0, 16.0, 21.0, 20.0, 10.0, 6.0, 5.0, 12.0, 7.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-20.765625, -20.175537109375, -19.58544921875, -18.995361328125, -18.4052734375, -17.815185546875, -17.22509765625, -16.635009765625, -16.044921875, -15.454833984375, -14.86474609375, -14.274658203125, -13.6845703125, -13.094482421875, -12.50439453125, -11.914306640625, -11.32421875, -10.734130859375, -10.14404296875, -9.553955078125, -8.9638671875, -8.373779296875, -7.78369140625, -7.193603515625, -6.603515625, -6.013427734375, -5.42333984375, -4.833251953125, -4.2431640625, -3.653076171875, -3.06298828125, -2.472900390625, -1.8828125, -1.292724609375, -0.70263671875, -0.112548828125, 0.4775390625, 1.067626953125, 1.65771484375, 2.247802734375, 2.837890625, 3.427978515625, 4.01806640625, 4.608154296875, 5.1982421875, 5.788330078125, 6.37841796875, 6.968505859375, 7.55859375, 8.148681640625, 8.73876953125, 9.328857421875, 9.9189453125, 10.509033203125, 11.09912109375, 11.689208984375, 12.279296875, 12.869384765625, 13.45947265625, 14.049560546875, 14.6396484375, 15.229736328125, 15.81982421875, 16.409912109375, 17.0]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 11.0, 9.0, 14.0, 11.0, 16.0, 20.0, 26.0, 38.0, 50.0, 73.0, 112.0, 154.0, 225.0, 399.0, 502.0, 616.0, 562.0, 378.0, 259.0, 160.0, 112.0, 75.0, 61.0, 50.0, 38.0, 27.0, 15.0, 10.0, 12.0, 9.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.78125, -12.38916015625, -11.9970703125, -11.60498046875, -11.212890625, -10.82080078125, -10.4287109375, -10.03662109375, -9.64453125, -9.25244140625, -8.8603515625, -8.46826171875, -8.076171875, -7.68408203125, -7.2919921875, -6.89990234375, -6.5078125, -6.11572265625, -5.7236328125, -5.33154296875, -4.939453125, -4.54736328125, -4.1552734375, -3.76318359375, -3.37109375, -2.97900390625, -2.5869140625, -2.19482421875, -1.802734375, -1.41064453125, -1.0185546875, -0.62646484375, -0.234375, 0.15771484375, 0.5498046875, 0.94189453125, 1.333984375, 1.72607421875, 2.1181640625, 2.51025390625, 2.90234375, 3.29443359375, 3.6865234375, 4.07861328125, 4.470703125, 4.86279296875, 5.2548828125, 5.64697265625, 6.0390625, 6.43115234375, 6.8232421875, 7.21533203125, 7.607421875, 7.99951171875, 8.3916015625, 8.78369140625, 9.17578125, 9.56787109375, 9.9599609375, 10.35205078125, 10.744140625, 11.13623046875, 11.5283203125, 11.92041015625, 12.3125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 13.0, 7.0, 6.0, 11.0, 21.0, 27.0, 32.0, 76.0, 139.0, 205.0, 476.0, 1178.0, 3665.0, 13774.0, 77229.0, 2116612.0, 1889613.0, 72433.0, 13200.0, 3394.0, 1127.0, 499.0, 206.0, 129.0, 59.0, 35.0, 31.0, 19.0, 19.0, 13.0, 11.0, 6.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.03125, -25.1630859375, -24.294921875, -23.4267578125, -22.55859375, -21.6904296875, -20.822265625, -19.9541015625, -19.0859375, -18.2177734375, -17.349609375, -16.4814453125, -15.61328125, -14.7451171875, -13.876953125, -13.0087890625, -12.140625, -11.2724609375, -10.404296875, -9.5361328125, -8.66796875, -7.7998046875, -6.931640625, -6.0634765625, -5.1953125, -4.3271484375, -3.458984375, -2.5908203125, -1.72265625, -0.8544921875, 0.013671875, 0.8818359375, 1.75, 2.6181640625, 3.486328125, 4.3544921875, 5.22265625, 6.0908203125, 6.958984375, 7.8271484375, 8.6953125, 9.5634765625, 10.431640625, 11.2998046875, 12.16796875, 13.0361328125, 13.904296875, 14.7724609375, 15.640625, 16.5087890625, 17.376953125, 18.2451171875, 19.11328125, 19.9814453125, 20.849609375, 21.7177734375, 22.5859375, 23.4541015625, 24.322265625, 25.1904296875, 26.05859375, 26.9267578125, 27.794921875, 28.6630859375, 29.53125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 13.0, 24.0, 33.0, 58.0, 103.0, 145.0, 184.0, 171.0, 117.0, 65.0, 36.0, 20.0, 11.0, 4.0, 13.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.35810089111328, -81.84437561035156, -79.33065795898438, -76.81693267822266, -74.30321502685547, -71.78948974609375, -69.27577209472656, -66.76204681396484, -64.24832153320312, -61.73460006713867, -59.22087860107422, -56.7071533203125, -54.19343185424805, -51.679710388183594, -49.16598892211914, -46.65226745605469, -44.138545989990234, -41.62482452392578, -39.11110305786133, -36.597381591796875, -34.083656311035156, -31.569934844970703, -29.05621337890625, -26.542490005493164, -24.02876853942871, -21.515047073364258, -19.001323699951172, -16.48760223388672, -13.97387981414795, -11.46015739440918, -8.946435928344727, -6.432712554931641, -3.9189910888671875, -1.405268907546997, 1.1084532737731934, 3.6221752166748047, 6.135897636413574, 8.649620056152344, 11.163341522216797, 13.677064895629883, 16.190786361694336, 18.70450782775879, 21.218231201171875, 23.731952667236328, 26.24567413330078, 28.759397506713867, 31.27311897277832, 33.786842346191406, 36.30056381225586, 38.81428527832031, 41.328006744384766, 43.84172821044922, 46.35545349121094, 48.86917495727539, 51.382896423339844, 53.89662170410156, 56.41033935546875, 58.9240608215332, 61.437782287597656, 63.951507568359375, 66.46522521972656, 68.97895050048828, 71.49267578125, 74.00639343261719, 76.5201187133789]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 6.0, 11.0, 7.0, 5.0, 12.0, 20.0, 15.0, 20.0, 23.0, 21.0, 21.0, 31.0, 42.0, 37.0, 30.0, 37.0, 28.0, 41.0, 45.0, 37.0, 48.0, 33.0, 43.0, 34.0, 40.0, 39.0, 34.0, 26.0, 27.0, 34.0, 25.0, 28.0, 15.0, 17.0, 14.0, 9.0, 5.0, 11.0, 9.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0], "bins": [-41.67401123046875, -40.541015625, -39.408016204833984, -38.275020599365234, -37.14202117919922, -36.00902557373047, -34.87602615356445, -33.7430305480957, -32.61003112792969, -31.477033615112305, -30.344036102294922, -29.21103858947754, -28.078041076660156, -26.945043563842773, -25.81204605102539, -24.67905044555664, -23.546052932739258, -22.413055419921875, -21.280057907104492, -20.14706039428711, -19.014062881469727, -17.881065368652344, -16.748069763183594, -15.615071296691895, -14.482073783874512, -13.349076271057129, -12.216078758239746, -11.08308219909668, -9.950084686279297, -8.817087173461914, -7.684089660644531, -6.551092147827148, -5.418092727661133, -4.28509521484375, -3.1520979404449463, -2.0191006660461426, -0.8861031532287598, 0.24689435958862305, 1.3798913955688477, 2.5128889083862305, 3.6458864212036133, 4.778883934020996, 5.911881446838379, 7.0448784828186035, 8.177875518798828, 9.310873031616211, 10.443870544433594, 11.576868057250977, 12.70986557006836, 13.842863082885742, 14.975860595703125, 16.108858108520508, 17.24185562133789, 18.374853134155273, 19.507850646972656, 20.640846252441406, 21.773845672607422, 22.906843185424805, 24.039840698242188, 25.17283821105957, 26.305835723876953, 27.438833236694336, 28.57183074951172, 29.70482635498047, 30.83782386779785]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 3.0, 5.0, 6.0, 11.0, 16.0, 6.0, 14.0, 24.0, 18.0, 17.0, 26.0, 22.0, 31.0, 37.0, 31.0, 34.0, 43.0, 28.0, 49.0, 32.0, 35.0, 40.0, 34.0, 48.0, 37.0, 34.0, 33.0, 37.0, 27.0, 33.0, 25.0, 19.0, 20.0, 25.0, 13.0, 9.0, 9.0, 7.0, 12.0, 8.0, 9.0, 0.0, 4.0, 4.0, 7.0, 2.0, 4.0, 3.0, 0.0, 2.0], "bins": [-5.43359375, -5.27667236328125, -5.1197509765625, -4.96282958984375, -4.805908203125, -4.64898681640625, -4.4920654296875, -4.33514404296875, -4.17822265625, -4.02130126953125, -3.8643798828125, -3.70745849609375, -3.550537109375, -3.39361572265625, -3.2366943359375, -3.07977294921875, -2.9228515625, -2.76593017578125, -2.6090087890625, -2.45208740234375, -2.295166015625, -2.13824462890625, -1.9813232421875, -1.82440185546875, -1.66748046875, -1.51055908203125, -1.3536376953125, -1.19671630859375, -1.039794921875, -0.88287353515625, -0.7259521484375, -0.56903076171875, -0.412109375, -0.25518798828125, -0.0982666015625, 0.05865478515625, 0.215576171875, 0.37249755859375, 0.5294189453125, 0.68634033203125, 0.84326171875, 1.00018310546875, 1.1571044921875, 1.31402587890625, 1.470947265625, 1.62786865234375, 1.7847900390625, 1.94171142578125, 2.0986328125, 2.25555419921875, 2.4124755859375, 2.56939697265625, 2.726318359375, 2.88323974609375, 3.0401611328125, 3.19708251953125, 3.35400390625, 3.51092529296875, 3.6678466796875, 3.82476806640625, 3.981689453125, 4.13861083984375, 4.2955322265625, 4.45245361328125, 4.609375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 8.0, 5.0, 13.0, 19.0, 32.0, 29.0, 63.0, 85.0, 113.0, 182.0, 234.0, 405.0, 588.0, 840.0, 1161.0, 1739.0, 2427.0, 3531.0, 5485.0, 8137.0, 12325.0, 19110.0, 31255.0, 51668.0, 91629.0, 172938.0, 259907.0, 163654.0, 86595.0, 49567.0, 29839.0, 18568.0, 11943.0, 8087.0, 5258.0, 3604.0, 2382.0, 1694.0, 1117.0, 743.0, 499.0, 379.0, 201.0, 147.0, 119.0, 79.0, 46.0, 39.0, 23.0, 11.0, 15.0, 10.0, 4.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.213623046875, -0.20637130737304688, -0.19911956787109375, -0.19186782836914062, -0.1846160888671875, -0.17736434936523438, -0.17011260986328125, -0.16286087036132812, -0.155609130859375, -0.14835739135742188, -0.14110565185546875, -0.13385391235351562, -0.1266021728515625, -0.11935043334960938, -0.11209869384765625, -0.10484695434570312, -0.09759521484375, -0.09034347534179688, -0.08309173583984375, -0.07583999633789062, -0.0685882568359375, -0.061336517333984375, -0.05408477783203125, -0.046833038330078125, -0.039581298828125, -0.032329559326171875, -0.02507781982421875, -0.017826080322265625, -0.0105743408203125, -0.003322601318359375, 0.00392913818359375, 0.011180877685546875, 0.0184326171875, 0.025684356689453125, 0.03293609619140625, 0.040187835693359375, 0.0474395751953125, 0.054691314697265625, 0.06194305419921875, 0.06919479370117188, 0.076446533203125, 0.08369827270507812, 0.09095001220703125, 0.09820175170898438, 0.1054534912109375, 0.11270523071289062, 0.11995697021484375, 0.12720870971679688, 0.13446044921875, 0.14171218872070312, 0.14896392822265625, 0.15621566772460938, 0.1634674072265625, 0.17071914672851562, 0.17797088623046875, 0.18522262573242188, 0.192474365234375, 0.19972610473632812, 0.20697784423828125, 0.21422958374023438, 0.2214813232421875, 0.22873306274414062, 0.23598480224609375, 0.24323654174804688, 0.25048828125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 8.0, 13.0, 8.0, 6.0, 10.0, 7.0, 9.0, 21.0, 27.0, 27.0, 28.0, 25.0, 31.0, 36.0, 44.0, 33.0, 41.0, 30.0, 47.0, 39.0, 1053.0, 46.0, 40.0, 35.0, 41.0, 39.0, 35.0, 20.0, 21.0, 21.0, 15.0, 26.0, 23.0, 16.0, 11.0, 14.0, 12.0, 12.0, 8.0, 7.0, 11.0, 4.0, 6.0, 0.0, 5.0, 2.0, 4.0, 5.0, 4.0, 1.0, 3.0], "bins": [-3.345703125, -3.246337890625, -3.14697265625, -3.047607421875, -2.9482421875, -2.848876953125, -2.74951171875, -2.650146484375, -2.55078125, -2.451416015625, -2.35205078125, -2.252685546875, -2.1533203125, -2.053955078125, -1.95458984375, -1.855224609375, -1.755859375, -1.656494140625, -1.55712890625, -1.457763671875, -1.3583984375, -1.259033203125, -1.15966796875, -1.060302734375, -0.9609375, -0.861572265625, -0.76220703125, -0.662841796875, -0.5634765625, -0.464111328125, -0.36474609375, -0.265380859375, -0.166015625, -0.066650390625, 0.03271484375, 0.132080078125, 0.2314453125, 0.330810546875, 0.43017578125, 0.529541015625, 0.62890625, 0.728271484375, 0.82763671875, 0.927001953125, 1.0263671875, 1.125732421875, 1.22509765625, 1.324462890625, 1.423828125, 1.523193359375, 1.62255859375, 1.721923828125, 1.8212890625, 1.920654296875, 2.02001953125, 2.119384765625, 2.21875, 2.318115234375, 2.41748046875, 2.516845703125, 2.6162109375, 2.715576171875, 2.81494140625, 2.914306640625, 3.013671875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 13.0, 21.0, 33.0, 51.0, 69.0, 74.0, 119.0, 142.0, 223.0, 295.0, 405.0, 583.0, 789.0, 1103.0, 1566.0, 2249.0, 3185.0, 4541.0, 6935.0, 10453.0, 15613.0, 24554.0, 39381.0, 63588.0, 104622.0, 174453.0, 1270041.0, 141192.0, 85356.0, 51594.0, 32360.0, 20428.0, 13262.0, 8582.0, 5871.0, 3928.0, 2775.0, 1885.0, 1331.0, 958.0, 692.0, 500.0, 352.0, 275.0, 201.0, 144.0, 96.0, 83.0, 42.0, 40.0, 25.0, 14.0, 17.0, 8.0, 11.0, 4.0, 2.0, 3.0], "bins": [-0.147705078125, -0.14313125610351562, -0.13855743408203125, -0.13398361206054688, -0.1294097900390625, -0.12483596801757812, -0.12026214599609375, -0.11568832397460938, -0.111114501953125, -0.10654067993164062, -0.10196685791015625, -0.09739303588867188, -0.0928192138671875, -0.08824539184570312, -0.08367156982421875, -0.07909774780273438, -0.07452392578125, -0.06995010375976562, -0.06537628173828125, -0.060802459716796875, -0.0562286376953125, -0.051654815673828125, -0.04708099365234375, -0.042507171630859375, -0.037933349609375, -0.033359527587890625, -0.02878570556640625, -0.024211883544921875, -0.0196380615234375, -0.015064239501953125, -0.01049041748046875, -0.005916595458984375, -0.0013427734375, 0.003231048583984375, 0.00780487060546875, 0.012378692626953125, 0.0169525146484375, 0.021526336669921875, 0.02610015869140625, 0.030673980712890625, 0.035247802734375, 0.039821624755859375, 0.04439544677734375, 0.048969268798828125, 0.0535430908203125, 0.058116912841796875, 0.06269073486328125, 0.06726455688476562, 0.07183837890625, 0.07641220092773438, 0.08098602294921875, 0.08555984497070312, 0.0901336669921875, 0.09470748901367188, 0.09928131103515625, 0.10385513305664062, 0.108428955078125, 0.11300277709960938, 0.11757659912109375, 0.12215042114257812, 0.1267242431640625, 0.13129806518554688, 0.13587188720703125, 0.14044570922851562, 0.14501953125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 6.0, 10.0, 7.0, 16.0, 26.0, 27.0, 37.0, 49.0, 51.0, 100.0, 122.0, 133.0, 113.0, 71.0, 51.0, 29.0, 25.0, 19.0, 17.0, 14.0, 16.0, 10.0, 4.0, 9.0, 8.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026345252990722656, -0.000254753977060318, -0.0002460554242134094, -0.00023735687136650085, -0.00022865831851959229, -0.00021995976567268372, -0.00021126121282577515, -0.00020256265997886658, -0.000193864107131958, -0.00018516555428504944, -0.00017646700143814087, -0.0001677684485912323, -0.00015906989574432373, -0.00015037134289741516, -0.0001416727900505066, -0.00013297423720359802, -0.00012427568435668945, -0.00011557713150978088, -0.00010687857866287231, -9.818002581596375e-05, -8.948147296905518e-05, -8.07829201221466e-05, -7.208436727523804e-05, -6.338581442832947e-05, -5.46872615814209e-05, -4.598870873451233e-05, -3.729015588760376e-05, -2.859160304069519e-05, -1.989305019378662e-05, -1.1194497346878052e-05, -2.4959444999694824e-06, 6.202608346939087e-06, 1.4901161193847656e-05, 2.3599714040756226e-05, 3.2298266887664795e-05, 4.0996819734573364e-05, 4.9695372581481934e-05, 5.83939254283905e-05, 6.709247827529907e-05, 7.579103112220764e-05, 8.448958396911621e-05, 9.318813681602478e-05, 0.00010188668966293335, 0.00011058524250984192, 0.00011928379535675049, 0.00012798234820365906, 0.00013668090105056763, 0.0001453794538974762, 0.00015407800674438477, 0.00016277655959129333, 0.0001714751124382019, 0.00018017366528511047, 0.00018887221813201904, 0.0001975707709789276, 0.00020626932382583618, 0.00021496787667274475, 0.00022366642951965332, 0.0002323649823665619, 0.00024106353521347046, 0.00024976208806037903, 0.0002584606409072876, 0.00026715919375419617, 0.00027585774660110474, 0.0002845562994480133, 0.0002932548522949219]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 6.0, 12.0, 11.0, 14.0, 28.0, 21.0, 41.0, 59.0, 75.0, 141.0, 307.0, 1922.0, 137163.0, 902379.0, 5391.0, 460.0, 172.0, 96.0, 66.0, 54.0, 27.0, 29.0, 11.0, 22.0, 6.0, 5.0, 6.0, 8.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00543975830078125, -0.005285024642944336, -0.005130290985107422, -0.004975557327270508, -0.004820823669433594, -0.00466609001159668, -0.004511356353759766, -0.0043566226959228516, -0.0042018890380859375, -0.0040471553802490234, -0.0038924217224121094, -0.0037376880645751953, -0.0035829544067382812, -0.003428220748901367, -0.003273487091064453, -0.003118753433227539, -0.002964019775390625, -0.002809286117553711, -0.002654552459716797, -0.002499818801879883, -0.0023450851440429688, -0.0021903514862060547, -0.0020356178283691406, -0.0018808841705322266, -0.0017261505126953125, -0.0015714168548583984, -0.0014166831970214844, -0.0012619495391845703, -0.0011072158813476562, -0.0009524822235107422, -0.0007977485656738281, -0.0006430149078369141, -0.00048828125, -0.00033354759216308594, -0.00017881393432617188, -2.4080276489257812e-05, 0.00013065338134765625, 0.0002853870391845703, 0.0004401206970214844, 0.0005948543548583984, 0.0007495880126953125, 0.0009043216705322266, 0.0010590553283691406, 0.0012137889862060547, 0.0013685226440429688, 0.0015232563018798828, 0.0016779899597167969, 0.001832723617553711, 0.001987457275390625, 0.002142190933227539, 0.002296924591064453, 0.002451658248901367, 0.0026063919067382812, 0.0027611255645751953, 0.0029158592224121094, 0.0030705928802490234, 0.0032253265380859375, 0.0033800601959228516, 0.0035347938537597656, 0.0036895275115966797, 0.0038442611694335938, 0.003998994827270508, 0.004153728485107422, 0.004308462142944336, 0.00446319580078125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 16.0, 43.0, 99.0, 201.0, 316.0, 187.0, 89.0, 40.0, 12.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00045145832700654864, -0.0004383531922940165, -0.0004252480575814843, -0.0004121429519727826, -0.00039903781726025045, -0.0003859326825477183, -0.0003728275478351861, -0.00035972241312265396, -0.00034661730751395226, -0.0003335121728014201, -0.00032040703808888793, -0.0003073019324801862, -0.00029419679776765406, -0.0002810916630551219, -0.00026798652834258974, -0.0002548813936300576, -0.0002417762589175254, -0.00022867112420499325, -0.00021556600404437631, -0.00020246086933184415, -0.00018935574917122722, -0.00017625061445869505, -0.0001631454797461629, -0.00015004034503363073, -0.0001369352248730138, -0.00012383009016048163, -0.0001107249699998647, -9.761983528733253e-05, -8.451470785075799e-05, -7.140958041418344e-05, -5.8304445701651275e-05, -4.519931826507673e-05, -3.209416172467172e-05, -1.898903246910777e-05, -5.883903213543817e-06, 7.221227861009538e-06, 2.0326355297584087e-05, 3.3431482734158635e-05, 4.65366174466908e-05, 5.9641744883265346e-05, 7.27468723198399e-05, 8.585199975641444e-05, 9.895712719298899e-05, 0.00011206226190552115, 0.00012516739661805332, 0.00013827251677867025, 0.00015137765149120241, 0.00016448277165181935, 0.0001775879063643515, 0.00019069304107688367, 0.0002037981612375006, 0.00021690329595003277, 0.0002300084161106497, 0.00024311355082318187, 0.00025621868553571403, 0.0002693238202482462, 0.0002824289258569479, 0.00029553406056948006, 0.0003086391952820122, 0.00032174430089071393, 0.0003348494356032461, 0.00034795457031577826, 0.0003610597050283104, 0.0003741648397408426, 0.00038726997445337474]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 0.0, 0.0, 3.0, 4.0, 8.0, 6.0, 6.0, 6.0, 10.0, 8.0, 18.0, 12.0, 20.0, 16.0, 26.0, 17.0, 35.0, 24.0, 26.0, 30.0, 31.0, 38.0, 36.0, 32.0, 41.0, 36.0, 34.0, 34.0, 40.0, 31.0, 37.0, 30.0, 27.0, 29.0, 29.0, 18.0, 28.0, 32.0, 26.0, 17.0, 16.0, 16.0, 15.0, 10.0, 5.0, 11.0, 5.0, 5.0, 2.0, 4.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-9.5367431640625e-05, -9.240582585334778e-05, -8.944422006607056e-05, -8.648261427879333e-05, -8.352100849151611e-05, -8.055940270423889e-05, -7.759779691696167e-05, -7.463619112968445e-05, -7.167458534240723e-05, -6.871297955513e-05, -6.575137376785278e-05, -6.278976798057556e-05, -5.982816219329834e-05, -5.686655640602112e-05, -5.3904950618743896e-05, -5.0943344831466675e-05, -4.798173904418945e-05, -4.502013325691223e-05, -4.205852746963501e-05, -3.909692168235779e-05, -3.6135315895080566e-05, -3.3173710107803345e-05, -3.0212104320526123e-05, -2.72504985332489e-05, -2.428889274597168e-05, -2.1327286958694458e-05, -1.8365681171417236e-05, -1.5404075384140015e-05, -1.2442469596862793e-05, -9.480863809585571e-06, -6.51925802230835e-06, -3.557652235031128e-06, -5.960464477539062e-07, 2.3655593395233154e-06, 5.327165126800537e-06, 8.288770914077759e-06, 1.125037670135498e-05, 1.4211982488632202e-05, 1.7173588275909424e-05, 2.0135194063186646e-05, 2.3096799850463867e-05, 2.605840563774109e-05, 2.902001142501831e-05, 3.198161721229553e-05, 3.4943222999572754e-05, 3.7904828786849976e-05, 4.08664345741272e-05, 4.382804036140442e-05, 4.678964614868164e-05, 4.975125193595886e-05, 5.2712857723236084e-05, 5.5674463510513306e-05, 5.863606929779053e-05, 6.159767508506775e-05, 6.455928087234497e-05, 6.752088665962219e-05, 7.048249244689941e-05, 7.344409823417664e-05, 7.640570402145386e-05, 7.936730980873108e-05, 8.23289155960083e-05, 8.529052138328552e-05, 8.825212717056274e-05, 9.121373295783997e-05, 9.417533874511719e-05]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 3.0, 5.0, 6.0, 11.0, 16.0, 6.0, 14.0, 24.0, 18.0, 17.0, 26.0, 22.0, 31.0, 37.0, 31.0, 34.0, 43.0, 28.0, 49.0, 32.0, 35.0, 40.0, 34.0, 48.0, 37.0, 34.0, 33.0, 37.0, 27.0, 33.0, 25.0, 19.0, 20.0, 25.0, 13.0, 9.0, 9.0, 7.0, 12.0, 8.0, 9.0, 0.0, 4.0, 4.0, 7.0, 2.0, 4.0, 3.0, 0.0, 2.0], "bins": [-5.43359375, -5.27667236328125, -5.1197509765625, -4.96282958984375, -4.805908203125, -4.64898681640625, -4.4920654296875, -4.33514404296875, -4.17822265625, -4.02130126953125, -3.8643798828125, -3.70745849609375, -3.550537109375, -3.39361572265625, -3.2366943359375, -3.07977294921875, -2.9228515625, -2.76593017578125, -2.6090087890625, -2.45208740234375, -2.295166015625, -2.13824462890625, -1.9813232421875, -1.82440185546875, -1.66748046875, -1.51055908203125, -1.3536376953125, -1.19671630859375, -1.039794921875, -0.88287353515625, -0.7259521484375, -0.56903076171875, -0.412109375, -0.25518798828125, -0.0982666015625, 0.05865478515625, 0.215576171875, 0.37249755859375, 0.5294189453125, 0.68634033203125, 0.84326171875, 1.00018310546875, 1.1571044921875, 1.31402587890625, 1.470947265625, 1.62786865234375, 1.7847900390625, 1.94171142578125, 2.0986328125, 2.25555419921875, 2.4124755859375, 2.56939697265625, 2.726318359375, 2.88323974609375, 3.0401611328125, 3.19708251953125, 3.35400390625, 3.51092529296875, 3.6678466796875, 3.82476806640625, 3.981689453125, 4.13861083984375, 4.2955322265625, 4.45245361328125, 4.609375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 6.0, 7.0, 13.0, 16.0, 15.0, 32.0, 38.0, 72.0, 112.0, 178.0, 357.0, 645.0, 1195.0, 2636.0, 5807.0, 13843.0, 37781.0, 130268.0, 514531.0, 244439.0, 60692.0, 20409.0, 8318.0, 3592.0, 1657.0, 790.0, 467.0, 222.0, 158.0, 87.0, 43.0, 43.0, 29.0, 12.0, 14.0, 7.0, 7.0, 8.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.4609375, -10.16796875, -9.875, -9.58203125, -9.2890625, -8.99609375, -8.703125, -8.41015625, -8.1171875, -7.82421875, -7.53125, -7.23828125, -6.9453125, -6.65234375, -6.359375, -6.06640625, -5.7734375, -5.48046875, -5.1875, -4.89453125, -4.6015625, -4.30859375, -4.015625, -3.72265625, -3.4296875, -3.13671875, -2.84375, -2.55078125, -2.2578125, -1.96484375, -1.671875, -1.37890625, -1.0859375, -0.79296875, -0.5, -0.20703125, 0.0859375, 0.37890625, 0.671875, 0.96484375, 1.2578125, 1.55078125, 1.84375, 2.13671875, 2.4296875, 2.72265625, 3.015625, 3.30859375, 3.6015625, 3.89453125, 4.1875, 4.48046875, 4.7734375, 5.06640625, 5.359375, 5.65234375, 5.9453125, 6.23828125, 6.53125, 6.82421875, 7.1171875, 7.41015625, 7.703125, 7.99609375, 8.2890625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 9.0, 3.0, 5.0, 6.0, 5.0, 12.0, 17.0, 15.0, 17.0, 24.0, 23.0, 36.0, 38.0, 57.0, 53.0, 61.0, 80.0, 143.0, 1432.0, 391.0, 162.0, 80.0, 59.0, 38.0, 41.0, 38.0, 32.0, 21.0, 25.0, 27.0, 20.0, 25.0, 11.0, 7.0, 8.0, 4.0, 11.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.984375, -21.356201171875, -20.72802734375, -20.099853515625, -19.4716796875, -18.843505859375, -18.21533203125, -17.587158203125, -16.958984375, -16.330810546875, -15.70263671875, -15.074462890625, -14.4462890625, -13.818115234375, -13.18994140625, -12.561767578125, -11.93359375, -11.305419921875, -10.67724609375, -10.049072265625, -9.4208984375, -8.792724609375, -8.16455078125, -7.536376953125, -6.908203125, -6.280029296875, -5.65185546875, -5.023681640625, -4.3955078125, -3.767333984375, -3.13916015625, -2.510986328125, -1.8828125, -1.254638671875, -0.62646484375, 0.001708984375, 0.6298828125, 1.258056640625, 1.88623046875, 2.514404296875, 3.142578125, 3.770751953125, 4.39892578125, 5.027099609375, 5.6552734375, 6.283447265625, 6.91162109375, 7.539794921875, 8.16796875, 8.796142578125, 9.42431640625, 10.052490234375, 10.6806640625, 11.308837890625, 11.93701171875, 12.565185546875, 13.193359375, 13.821533203125, 14.44970703125, 15.077880859375, 15.7060546875, 16.334228515625, 16.96240234375, 17.590576171875, 18.21875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 15.0, 16.0, 18.0, 24.0, 31.0, 49.0, 73.0, 114.0, 146.0, 280.0, 507.0, 1514.0, 11975.0, 2929617.0, 194892.0, 4427.0, 968.0, 421.0, 214.0, 128.0, 73.0, 46.0, 39.0, 31.0, 24.0, 22.0, 12.0, 11.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.6875, -62.7744140625, -60.861328125, -58.9482421875, -57.03515625, -55.1220703125, -53.208984375, -51.2958984375, -49.3828125, -47.4697265625, -45.556640625, -43.6435546875, -41.73046875, -39.8173828125, -37.904296875, -35.9912109375, -34.078125, -32.1650390625, -30.251953125, -28.3388671875, -26.42578125, -24.5126953125, -22.599609375, -20.6865234375, -18.7734375, -16.8603515625, -14.947265625, -13.0341796875, -11.12109375, -9.2080078125, -7.294921875, -5.3818359375, -3.46875, -1.5556640625, 0.357421875, 2.2705078125, 4.18359375, 6.0966796875, 8.009765625, 9.9228515625, 11.8359375, 13.7490234375, 15.662109375, 17.5751953125, 19.48828125, 21.4013671875, 23.314453125, 25.2275390625, 27.140625, 29.0537109375, 30.966796875, 32.8798828125, 34.79296875, 36.7060546875, 38.619140625, 40.5322265625, 42.4453125, 44.3583984375, 46.271484375, 48.1845703125, 50.09765625, 52.0107421875, 53.923828125, 55.8369140625, 57.75]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 56.0, 909.0, 54.0], "bins": [-819.0232543945312, -805.9126586914062, -792.8020629882812, -779.69140625, -766.580810546875, -753.47021484375, -740.359619140625, -727.2490234375, -714.138427734375, -701.02783203125, -687.917236328125, -674.806640625, -661.6959838867188, -648.5853881835938, -635.4747924804688, -622.3641967773438, -609.2535400390625, -596.1429443359375, -583.0323486328125, -569.9217529296875, -556.8110961914062, -543.7005004882812, -530.5899047851562, -517.4793090820312, -504.36871337890625, -491.25811767578125, -478.1474914550781, -465.0368957519531, -451.9263000488281, -438.815673828125, -425.705078125, -412.594482421875, -399.4838562011719, -386.3732604980469, -373.26263427734375, -360.15203857421875, -347.04144287109375, -333.9308166503906, -320.8202209472656, -307.7095947265625, -294.5990295410156, -281.4884338378906, -268.3778076171875, -255.2672119140625, -242.15660095214844, -229.04598999023438, -215.93539428710938, -202.8247833251953, -189.71417236328125, -176.6035614013672, -163.4929656982422, -150.38235473632812, -137.27174377441406, -124.16114044189453, -111.050537109375, -97.93992614746094, -84.82931518554688, -71.71871185302734, -58.60810089111328, -45.49749755859375, -32.38689041137695, -19.276283264160156, -6.165679931640625, 6.9449310302734375, 20.055532455444336]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 8.0, 7.0, 9.0, 13.0, 21.0, 18.0, 21.0, 27.0, 22.0, 21.0, 25.0, 24.0, 34.0, 30.0, 36.0, 30.0, 45.0, 47.0, 36.0, 48.0, 28.0, 45.0, 33.0, 33.0, 47.0, 24.0, 36.0, 28.0, 25.0, 34.0, 17.0, 30.0, 12.0, 13.0, 8.0, 5.0, 12.0, 11.0, 10.0, 6.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.331886291503906, -39.768226623535156, -38.20457077026367, -36.64091110229492, -35.07725524902344, -33.51359558105469, -31.94993782043457, -30.386280059814453, -28.822620391845703, -27.258962631225586, -25.69530487060547, -24.13164520263672, -22.5679874420166, -21.004329681396484, -19.440671920776367, -17.87701416015625, -16.313356399536133, -14.749698638916016, -13.186039924621582, -11.622382164001465, -10.058723449707031, -8.495065689086914, -6.931407928466797, -5.367749214172363, -3.804091453552246, -2.2404332160949707, -0.6767752170562744, 0.8868827819824219, 2.4505410194396973, 4.014199256896973, 5.57785701751709, 7.141515731811523, 8.70517349243164, 10.268831253051758, 11.832489967346191, 13.396147727966309, 14.959806442260742, 16.52346420288086, 18.087121963500977, 19.650779724121094, 21.214439392089844, 22.77809715270996, 24.341754913330078, 25.905414581298828, 27.469072341918945, 29.032730102539062, 30.59638786315918, 32.1600456237793, 33.72370147705078, 35.28736114501953, 36.851016998291016, 38.414676666259766, 39.97833251953125, 41.5419921875, 43.10565185546875, 44.669307708740234, 46.232967376708984, 47.796627044677734, 49.36028289794922, 50.92394256591797, 52.48759841918945, 54.0512580871582, 55.61491394042969, 57.17857360839844, 58.74223327636719]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 6.0, 12.0, 3.0, 12.0, 8.0, 10.0, 18.0, 26.0, 21.0, 16.0, 26.0, 32.0, 35.0, 30.0, 39.0, 35.0, 37.0, 35.0, 42.0, 45.0, 33.0, 33.0, 40.0, 31.0, 41.0, 44.0, 27.0, 34.0, 25.0, 27.0, 24.0, 19.0, 17.0, 20.0, 11.0, 12.0, 11.0, 8.0, 7.0, 9.0, 5.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.6640625, -5.48779296875, -5.3115234375, -5.13525390625, -4.958984375, -4.78271484375, -4.6064453125, -4.43017578125, -4.25390625, -4.07763671875, -3.9013671875, -3.72509765625, -3.548828125, -3.37255859375, -3.1962890625, -3.02001953125, -2.84375, -2.66748046875, -2.4912109375, -2.31494140625, -2.138671875, -1.96240234375, -1.7861328125, -1.60986328125, -1.43359375, -1.25732421875, -1.0810546875, -0.90478515625, -0.728515625, -0.55224609375, -0.3759765625, -0.19970703125, -0.0234375, 0.15283203125, 0.3291015625, 0.50537109375, 0.681640625, 0.85791015625, 1.0341796875, 1.21044921875, 1.38671875, 1.56298828125, 1.7392578125, 1.91552734375, 2.091796875, 2.26806640625, 2.4443359375, 2.62060546875, 2.796875, 2.97314453125, 3.1494140625, 3.32568359375, 3.501953125, 3.67822265625, 3.8544921875, 4.03076171875, 4.20703125, 4.38330078125, 4.5595703125, 4.73583984375, 4.912109375, 5.08837890625, 5.2646484375, 5.44091796875, 5.6171875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 7.0, 8.0, 8.0, 13.0, 17.0, 23.0, 35.0, 40.0, 71.0, 100.0, 129.0, 220.0, 390.0, 723.0, 1413.0, 3109.0, 8342.0, 26932.0, 240383.0, 2953489.0, 885046.0, 51883.0, 13278.0, 4496.0, 1909.0, 950.0, 487.0, 236.0, 169.0, 105.0, 69.0, 49.0, 30.0, 19.0, 17.0, 11.0, 21.0, 6.0, 11.0, 7.0, 7.0, 5.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.046875, -18.481689453125, -17.91650390625, -17.351318359375, -16.7861328125, -16.220947265625, -15.65576171875, -15.090576171875, -14.525390625, -13.960205078125, -13.39501953125, -12.829833984375, -12.2646484375, -11.699462890625, -11.13427734375, -10.569091796875, -10.00390625, -9.438720703125, -8.87353515625, -8.308349609375, -7.7431640625, -7.177978515625, -6.61279296875, -6.047607421875, -5.482421875, -4.917236328125, -4.35205078125, -3.786865234375, -3.2216796875, -2.656494140625, -2.09130859375, -1.526123046875, -0.9609375, -0.395751953125, 0.16943359375, 0.734619140625, 1.2998046875, 1.864990234375, 2.43017578125, 2.995361328125, 3.560546875, 4.125732421875, 4.69091796875, 5.256103515625, 5.8212890625, 6.386474609375, 6.95166015625, 7.516845703125, 8.08203125, 8.647216796875, 9.21240234375, 9.777587890625, 10.3427734375, 10.907958984375, 11.47314453125, 12.038330078125, 12.603515625, 13.168701171875, 13.73388671875, 14.299072265625, 14.8642578125, 15.429443359375, 15.99462890625, 16.559814453125, 17.125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 11.0, 11.0, 19.0, 29.0, 37.0, 50.0, 68.0, 99.0, 191.0, 305.0, 521.0, 736.0, 695.0, 457.0, 323.0, 147.0, 121.0, 69.0, 46.0, 27.0, 28.0, 21.0, 17.0, 12.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.015625, -13.47607421875, -12.9365234375, -12.39697265625, -11.857421875, -11.31787109375, -10.7783203125, -10.23876953125, -9.69921875, -9.15966796875, -8.6201171875, -8.08056640625, -7.541015625, -7.00146484375, -6.4619140625, -5.92236328125, -5.3828125, -4.84326171875, -4.3037109375, -3.76416015625, -3.224609375, -2.68505859375, -2.1455078125, -1.60595703125, -1.06640625, -0.52685546875, 0.0126953125, 0.55224609375, 1.091796875, 1.63134765625, 2.1708984375, 2.71044921875, 3.25, 3.78955078125, 4.3291015625, 4.86865234375, 5.408203125, 5.94775390625, 6.4873046875, 7.02685546875, 7.56640625, 8.10595703125, 8.6455078125, 9.18505859375, 9.724609375, 10.26416015625, 10.8037109375, 11.34326171875, 11.8828125, 12.42236328125, 12.9619140625, 13.50146484375, 14.041015625, 14.58056640625, 15.1201171875, 15.65966796875, 16.19921875, 16.73876953125, 17.2783203125, 17.81787109375, 18.357421875, 18.89697265625, 19.4365234375, 19.97607421875, 20.515625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 6.0, 15.0, 13.0, 26.0, 34.0, 36.0, 64.0, 122.0, 253.0, 667.0, 3677.0, 52307.0, 3961992.0, 166717.0, 6567.0, 1029.0, 350.0, 150.0, 83.0, 42.0, 41.0, 29.0, 15.0, 11.0, 9.0, 1.0, 6.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-69.375, -67.57958984375, -65.7841796875, -63.98876953125, -62.193359375, -60.39794921875, -58.6025390625, -56.80712890625, -55.01171875, -53.21630859375, -51.4208984375, -49.62548828125, -47.830078125, -46.03466796875, -44.2392578125, -42.44384765625, -40.6484375, -38.85302734375, -37.0576171875, -35.26220703125, -33.466796875, -31.67138671875, -29.8759765625, -28.08056640625, -26.28515625, -24.48974609375, -22.6943359375, -20.89892578125, -19.103515625, -17.30810546875, -15.5126953125, -13.71728515625, -11.921875, -10.12646484375, -8.3310546875, -6.53564453125, -4.740234375, -2.94482421875, -1.1494140625, 0.64599609375, 2.44140625, 4.23681640625, 6.0322265625, 7.82763671875, 9.623046875, 11.41845703125, 13.2138671875, 15.00927734375, 16.8046875, 18.60009765625, 20.3955078125, 22.19091796875, 23.986328125, 25.78173828125, 27.5771484375, 29.37255859375, 31.16796875, 32.96337890625, 34.7587890625, 36.55419921875, 38.349609375, 40.14501953125, 41.9404296875, 43.73583984375, 45.53125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 11.0, 25.0, 50.0, 64.0, 141.0, 202.0, 206.0, 149.0, 90.0, 47.0, 9.0, 9.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.82642364501953, -76.34666442871094, -72.86690521240234, -69.38714599609375, -65.90738677978516, -62.42762756347656, -58.947872161865234, -55.46811294555664, -51.98835372924805, -48.50859451293945, -45.02883529663086, -41.54907989501953, -38.06932067871094, -34.589561462402344, -31.10980224609375, -27.630043029785156, -24.150283813476562, -20.67052459716797, -17.190765380859375, -13.711008071899414, -10.23124885559082, -6.751489639282227, -3.2717323303222656, 0.20802688598632812, 3.687786102294922, 7.167544841766357, 10.647303581237793, 14.12706184387207, 17.606821060180664, 21.086580276489258, 24.56633758544922, 28.046096801757812, 31.525863647460938, 35.00562286376953, 38.485382080078125, 41.96514129638672, 45.44490051269531, 48.924659729003906, 52.404415130615234, 55.88417434692383, 59.36393356323242, 62.843692779541016, 66.32344818115234, 69.80320739746094, 73.28296661376953, 76.76272583007812, 80.24248504638672, 83.72224426269531, 87.2020034790039, 90.6817626953125, 94.1615219116211, 97.64128112792969, 101.12104034423828, 104.60079956054688, 108.08055114746094, 111.56031799316406, 115.04006958007812, 118.51982879638672, 121.99958801269531, 125.4793472290039, 128.9591064453125, 132.43885803222656, 135.9186248779297, 139.39837646484375, 142.87814331054688]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 1.0, 2.0, 2.0, 5.0, 9.0, 13.0, 10.0, 11.0, 8.0, 14.0, 17.0, 16.0, 22.0, 29.0, 19.0, 28.0, 23.0, 33.0, 31.0, 45.0, 31.0, 36.0, 39.0, 36.0, 51.0, 35.0, 46.0, 47.0, 24.0, 18.0, 35.0, 25.0, 23.0, 30.0, 23.0, 28.0, 19.0, 17.0, 19.0, 15.0, 12.0, 10.0, 15.0, 9.0, 3.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.98271560668945, -35.75434875488281, -34.525978088378906, -33.297611236572266, -32.069244384765625, -30.84087371826172, -29.612506866455078, -28.384138107299805, -27.15576934814453, -25.927400588989258, -24.699033737182617, -23.470664978027344, -22.24229621887207, -21.013927459716797, -19.785560607910156, -18.557191848754883, -17.328824996948242, -16.10045623779297, -14.872088432312012, -13.643720626831055, -12.415351867675781, -11.186984062194824, -9.958616256713867, -8.730247497558594, -7.501879692077637, -6.2735114097595215, -5.045143127441406, -3.816775321960449, -2.588407039642334, -1.3600387573242188, -0.13167095184326172, 1.0966978073120117, 2.3250656127929688, 3.553433895111084, 4.781802177429199, 6.010169982910156, 7.2385382652282715, 8.466906547546387, 9.695274353027344, 10.923643112182617, 12.152010917663574, 13.380378723144531, 14.608747482299805, 15.837115287780762, 17.06548309326172, 18.293851852416992, 19.522220611572266, 20.750587463378906, 21.97895622253418, 23.207324981689453, 24.435691833496094, 25.664060592651367, 26.89242935180664, 28.12079620361328, 29.349164962768555, 30.577533721923828, 31.80590057373047, 33.03426742553711, 34.262638092041016, 35.491004943847656, 36.7193717956543, 37.9477424621582, 39.176109313964844, 40.40447998046875, 41.63284683227539]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 9.0, 6.0, 17.0, 13.0, 19.0, 17.0, 17.0, 23.0, 25.0, 28.0, 34.0, 31.0, 40.0, 54.0, 55.0, 47.0, 51.0, 52.0, 46.0, 57.0, 32.0, 37.0, 35.0, 41.0, 39.0, 21.0, 27.0, 23.0, 22.0, 15.0, 17.0, 8.0, 3.0, 14.0, 2.0, 7.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.3299560546875, -6.120849609375, -5.9117431640625, -5.70263671875, -5.4935302734375, -5.284423828125, -5.0753173828125, -4.8662109375, -4.6571044921875, -4.447998046875, -4.2388916015625, -4.02978515625, -3.8206787109375, -3.611572265625, -3.4024658203125, -3.193359375, -2.9842529296875, -2.775146484375, -2.5660400390625, -2.35693359375, -2.1478271484375, -1.938720703125, -1.7296142578125, -1.5205078125, -1.3114013671875, -1.102294921875, -0.8931884765625, -0.68408203125, -0.4749755859375, -0.265869140625, -0.0567626953125, 0.15234375, 0.3614501953125, 0.570556640625, 0.7796630859375, 0.98876953125, 1.1978759765625, 1.406982421875, 1.6160888671875, 1.8251953125, 2.0343017578125, 2.243408203125, 2.4525146484375, 2.66162109375, 2.8707275390625, 3.079833984375, 3.2889404296875, 3.498046875, 3.7071533203125, 3.916259765625, 4.1253662109375, 4.33447265625, 4.5435791015625, 4.752685546875, 4.9617919921875, 5.1708984375, 5.3800048828125, 5.589111328125, 5.7982177734375, 6.00732421875, 6.2164306640625, 6.425537109375, 6.6346435546875, 6.84375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 6.0, 10.0, 15.0, 27.0, 27.0, 40.0, 88.0, 139.0, 216.0, 340.0, 556.0, 960.0, 1525.0, 2656.0, 4511.0, 7780.0, 13707.0, 24668.0, 44747.0, 88104.0, 204865.0, 339651.0, 156695.0, 70828.0, 37687.0, 20722.0, 11627.0, 6723.0, 4026.0, 2237.0, 1286.0, 788.0, 513.0, 286.0, 175.0, 105.0, 75.0, 49.0, 34.0, 23.0, 18.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.345703125, -0.3353385925292969, -0.32497406005859375, -0.3146095275878906, -0.3042449951171875, -0.2938804626464844, -0.28351593017578125, -0.2731513977050781, -0.262786865234375, -0.2524223327636719, -0.24205780029296875, -0.23169326782226562, -0.2213287353515625, -0.21096420288085938, -0.20059967041015625, -0.19023513793945312, -0.17987060546875, -0.16950607299804688, -0.15914154052734375, -0.14877700805664062, -0.1384124755859375, -0.12804794311523438, -0.11768341064453125, -0.10731887817382812, -0.096954345703125, -0.08658981323242188, -0.07622528076171875, -0.06586074829101562, -0.0554962158203125, -0.045131683349609375, -0.03476715087890625, -0.024402618408203125, -0.0140380859375, -0.003673553466796875, 0.00669097900390625, 0.017055511474609375, 0.0274200439453125, 0.037784576416015625, 0.04814910888671875, 0.058513641357421875, 0.068878173828125, 0.07924270629882812, 0.08960723876953125, 0.09997177124023438, 0.1103363037109375, 0.12070083618164062, 0.13106536865234375, 0.14142990112304688, 0.15179443359375, 0.16215896606445312, 0.17252349853515625, 0.18288803100585938, 0.1932525634765625, 0.20361709594726562, 0.21398162841796875, 0.22434616088867188, 0.234710693359375, 0.24507522583007812, 0.25543975830078125, 0.2658042907714844, 0.2761688232421875, 0.2865333557128906, 0.29689788818359375, 0.3072624206542969, 0.317626953125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 9.0, 5.0, 4.0, 4.0, 4.0, 17.0, 12.0, 14.0, 18.0, 18.0, 15.0, 23.0, 26.0, 25.0, 30.0, 25.0, 28.0, 27.0, 40.0, 37.0, 44.0, 43.0, 1070.0, 31.0, 36.0, 34.0, 38.0, 39.0, 48.0, 25.0, 30.0, 32.0, 25.0, 28.0, 26.0, 26.0, 11.0, 14.0, 9.0, 9.0, 13.0, 9.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-4.06640625, -3.95172119140625, -3.8370361328125, -3.72235107421875, -3.607666015625, -3.49298095703125, -3.3782958984375, -3.26361083984375, -3.14892578125, -3.03424072265625, -2.9195556640625, -2.80487060546875, -2.690185546875, -2.57550048828125, -2.4608154296875, -2.34613037109375, -2.2314453125, -2.11676025390625, -2.0020751953125, -1.88739013671875, -1.772705078125, -1.65802001953125, -1.5433349609375, -1.42864990234375, -1.31396484375, -1.19927978515625, -1.0845947265625, -0.96990966796875, -0.855224609375, -0.74053955078125, -0.6258544921875, -0.51116943359375, -0.396484375, -0.28179931640625, -0.1671142578125, -0.05242919921875, 0.062255859375, 0.17694091796875, 0.2916259765625, 0.40631103515625, 0.52099609375, 0.63568115234375, 0.7503662109375, 0.86505126953125, 0.979736328125, 1.09442138671875, 1.2091064453125, 1.32379150390625, 1.4384765625, 1.55316162109375, 1.6678466796875, 1.78253173828125, 1.897216796875, 2.01190185546875, 2.1265869140625, 2.24127197265625, 2.35595703125, 2.47064208984375, 2.5853271484375, 2.70001220703125, 2.814697265625, 2.92938232421875, 3.0440673828125, 3.15875244140625, 3.2734375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 6.0, 21.0, 25.0, 42.0, 58.0, 73.0, 109.0, 160.0, 221.0, 360.0, 537.0, 744.0, 1010.0, 1377.0, 2181.0, 3177.0, 4634.0, 6843.0, 10871.0, 16520.0, 25858.0, 41124.0, 66861.0, 109907.0, 182691.0, 1265740.0, 134915.0, 80872.0, 50217.0, 31663.0, 20182.0, 12752.0, 8190.0, 5606.0, 3628.0, 2430.0, 1724.0, 1175.0, 800.0, 528.0, 388.0, 289.0, 214.0, 136.0, 98.0, 52.0, 33.0, 29.0, 18.0, 12.0, 10.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.1632080078125, -0.1581401824951172, -0.15307235717773438, -0.14800453186035156, -0.14293670654296875, -0.13786888122558594, -0.13280105590820312, -0.1277332305908203, -0.1226654052734375, -0.11759757995605469, -0.11252975463867188, -0.10746192932128906, -0.10239410400390625, -0.09732627868652344, -0.09225845336914062, -0.08719062805175781, -0.082122802734375, -0.07705497741699219, -0.07198715209960938, -0.06691932678222656, -0.06185150146484375, -0.05678367614746094, -0.051715850830078125, -0.04664802551269531, -0.0415802001953125, -0.03651237487792969, -0.031444549560546875, -0.026376724243164062, -0.02130889892578125, -0.016241073608398438, -0.011173248291015625, -0.0061054229736328125, -0.00103759765625, 0.0040302276611328125, 0.009098052978515625, 0.014165878295898438, 0.01923370361328125, 0.024301528930664062, 0.029369354248046875, 0.03443717956542969, 0.0395050048828125, 0.04457283020019531, 0.049640655517578125, 0.05470848083496094, 0.05977630615234375, 0.06484413146972656, 0.06991195678710938, 0.07497978210449219, 0.080047607421875, 0.08511543273925781, 0.09018325805664062, 0.09525108337402344, 0.10031890869140625, 0.10538673400878906, 0.11045455932617188, 0.11552238464355469, 0.1205902099609375, 0.1256580352783203, 0.13072586059570312, 0.13579368591308594, 0.14086151123046875, 0.14592933654785156, 0.15099716186523438, 0.1560649871826172, 0.1611328125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 6.0, 7.0, 6.0, 6.0, 11.0, 21.0, 13.0, 34.0, 37.0, 56.0, 89.0, 109.0, 115.0, 124.0, 91.0, 65.0, 44.0, 39.0, 29.0, 15.0, 11.0, 15.0, 13.0, 12.0, 7.0, 5.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002167224884033203, -0.00020942464470863342, -0.00020212680101394653, -0.00019482895731925964, -0.00018753111362457275, -0.00018023326992988586, -0.00017293542623519897, -0.00016563758254051208, -0.0001583397388458252, -0.0001510418951511383, -0.00014374405145645142, -0.00013644620776176453, -0.00012914836406707764, -0.00012185052037239075, -0.00011455267667770386, -0.00010725483298301697, -9.995698928833008e-05, -9.265914559364319e-05, -8.53613018989563e-05, -7.806345820426941e-05, -7.076561450958252e-05, -6.346777081489563e-05, -5.616992712020874e-05, -4.887208342552185e-05, -4.157423973083496e-05, -3.427639603614807e-05, -2.697855234146118e-05, -1.9680708646774292e-05, -1.2382864952087402e-05, -5.085021257400513e-06, 2.212822437286377e-06, 9.510666131973267e-06, 1.6808509826660156e-05, 2.4106353521347046e-05, 3.1404197216033936e-05, 3.8702040910720825e-05, 4.5999884605407715e-05, 5.3297728300094604e-05, 6.0595571994781494e-05, 6.789341568946838e-05, 7.519125938415527e-05, 8.248910307884216e-05, 8.978694677352905e-05, 9.708479046821594e-05, 0.00010438263416290283, 0.00011168047785758972, 0.00011897832155227661, 0.0001262761652469635, 0.0001335740089416504, 0.00014087185263633728, 0.00014816969633102417, 0.00015546754002571106, 0.00016276538372039795, 0.00017006322741508484, 0.00017736107110977173, 0.00018465891480445862, 0.0001919567584991455, 0.0001992546021938324, 0.0002065524458885193, 0.00021385028958320618, 0.00022114813327789307, 0.00022844597697257996, 0.00023574382066726685, 0.00024304166436195374, 0.0002503395080566406]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 9.0, 17.0, 14.0, 17.0, 17.0, 41.0, 43.0, 73.0, 124.0, 264.0, 1170.0, 54006.0, 981968.0, 9695.0, 587.0, 207.0, 113.0, 65.0, 37.0, 22.0, 16.0, 7.0, 7.0, 9.0, 6.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.005214691162109375, -0.005062758922576904, -0.004910826683044434, -0.004758894443511963, -0.004606962203979492, -0.0044550299644470215, -0.004303097724914551, -0.00415116548538208, -0.003999233245849609, -0.0038473010063171387, -0.003695368766784668, -0.0035434365272521973, -0.0033915042877197266, -0.003239572048187256, -0.003087639808654785, -0.0029357075691223145, -0.0027837753295898438, -0.002631843090057373, -0.0024799108505249023, -0.0023279786109924316, -0.002176046371459961, -0.0020241141319274902, -0.0018721818923950195, -0.0017202496528625488, -0.0015683174133300781, -0.0014163851737976074, -0.0012644529342651367, -0.001112520694732666, -0.0009605884552001953, -0.0008086562156677246, -0.0006567239761352539, -0.0005047917366027832, -0.0003528594970703125, -0.0002009272575378418, -4.8995018005371094e-05, 0.00010293722152709961, 0.0002548694610595703, 0.000406801700592041, 0.0005587339401245117, 0.0007106661796569824, 0.0008625984191894531, 0.0010145306587219238, 0.0011664628982543945, 0.0013183951377868652, 0.001470327377319336, 0.0016222596168518066, 0.0017741918563842773, 0.001926124095916748, 0.0020780563354492188, 0.0022299885749816895, 0.00238192081451416, 0.002533853054046631, 0.0026857852935791016, 0.0028377175331115723, 0.002989649772644043, 0.0031415820121765137, 0.0032935142517089844, 0.003445446491241455, 0.0035973787307739258, 0.0037493109703063965, 0.003901243209838867, 0.004053175449371338, 0.004205107688903809, 0.004357039928436279, 0.00450897216796875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 12.0, 38.0, 171.0, 514.0, 223.0, 43.0, 14.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008655885467305779, -0.0008419420919381082, -0.0008182956953532994, -0.0007946492405608296, -0.0007710028439760208, -0.0007473563891835511, -0.0007237099343910813, -0.0007000635378062725, -0.0006764171412214637, -0.0006527706864289939, -0.0006291242898441851, -0.0006054778350517154, -0.0005818314384669065, -0.0005581849836744368, -0.0005345385288819671, -0.0005108921322971582, -0.0004872456775046885, -0.0004635992518160492, -0.00043995282612740993, -0.0004163063713349402, -0.00039265997475013137, -0.00036901351995766163, -0.00034536709426902235, -0.00032172066858038306, -0.0002980742428917438, -0.0002744278172031045, -0.0002507813915144652, -0.0002271349512739107, -0.00020348852558527142, -0.00017984209989663213, -0.00015619565965607762, -0.00013254923396743834, -0.00010890280827879906, -8.525638259015977e-05, -6.160994962556288e-05, -3.796351666096598e-05, -1.4317090972326696e-05, 9.329334716312587e-06, 3.29757749568671e-05, 5.662220064550638e-05, 8.026862633414567e-05, 0.00010391505202278495, 0.00012756147771142423, 0.00015120791795197874, 0.00017485434364061803, 0.0001985007693292573, 0.00022214720956981182, 0.0002457936352584511, 0.0002694400609470904, 0.00029308648663572967, 0.00031673291232436895, 0.0003403793671168387, 0.0003640257637016475, 0.00038767221849411726, 0.00041131864418275654, 0.0004349650698713958, 0.0004586114955600351, 0.0004822579212486744, 0.0005059043760411441, 0.000529550772625953, 0.0005531972274184227, 0.0005768436240032315, 0.0006004900787957013, 0.000624136533588171, 0.0006477829301729798]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 2.0, 7.0, 10.0, 8.0, 8.0, 13.0, 22.0, 14.0, 19.0, 20.0, 29.0, 26.0, 33.0, 30.0, 29.0, 30.0, 36.0, 31.0, 33.0, 38.0, 39.0, 36.0, 39.0, 40.0, 43.0, 30.0, 40.0, 31.0, 35.0, 22.0, 25.0, 21.0, 29.0, 23.0, 15.0, 8.0, 14.0, 18.0, 8.0, 8.0, 8.0, 11.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.308887481689453e-05, -8.052308112382889e-05, -7.795728743076324e-05, -7.53914937376976e-05, -7.282570004463196e-05, -7.025990635156631e-05, -6.769411265850067e-05, -6.512831896543503e-05, -6.256252527236938e-05, -5.999673157930374e-05, -5.74309378862381e-05, -5.4865144193172455e-05, -5.229935050010681e-05, -4.973355680704117e-05, -4.7167763113975525e-05, -4.460196942090988e-05, -4.203617572784424e-05, -3.9470382034778595e-05, -3.690458834171295e-05, -3.433879464864731e-05, -3.1773000955581665e-05, -2.9207207262516022e-05, -2.664141356945038e-05, -2.4075619876384735e-05, -2.1509826183319092e-05, -1.894403249025345e-05, -1.6378238797187805e-05, -1.3812445104122162e-05, -1.1246651411056519e-05, -8.680857717990875e-06, -6.115064024925232e-06, -3.5492703318595886e-06, -9.834766387939453e-07, 1.582317054271698e-06, 4.148110747337341e-06, 6.713904440402985e-06, 9.279698133468628e-06, 1.1845491826534271e-05, 1.4411285519599915e-05, 1.6977079212665558e-05, 1.95428729057312e-05, 2.2108666598796844e-05, 2.4674460291862488e-05, 2.724025398492813e-05, 2.9806047677993774e-05, 3.237184137105942e-05, 3.493763506412506e-05, 3.7503428757190704e-05, 4.006922245025635e-05, 4.263501614332199e-05, 4.5200809836387634e-05, 4.776660352945328e-05, 5.033239722251892e-05, 5.2898190915584564e-05, 5.546398460865021e-05, 5.802977830171585e-05, 6.0595571994781494e-05, 6.316136568784714e-05, 6.572715938091278e-05, 6.829295307397842e-05, 7.085874676704407e-05, 7.342454046010971e-05, 7.599033415317535e-05, 7.8556127846241e-05, 8.112192153930664e-05]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 9.0, 6.0, 17.0, 13.0, 19.0, 17.0, 17.0, 23.0, 25.0, 28.0, 34.0, 31.0, 40.0, 54.0, 55.0, 47.0, 51.0, 52.0, 46.0, 57.0, 32.0, 37.0, 35.0, 41.0, 39.0, 21.0, 27.0, 23.0, 22.0, 15.0, 17.0, 8.0, 3.0, 14.0, 2.0, 7.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.3299560546875, -6.120849609375, -5.9117431640625, -5.70263671875, -5.4935302734375, -5.284423828125, -5.0753173828125, -4.8662109375, -4.6571044921875, -4.447998046875, -4.2388916015625, -4.02978515625, -3.8206787109375, -3.611572265625, -3.4024658203125, -3.193359375, -2.9842529296875, -2.775146484375, -2.5660400390625, -2.35693359375, -2.1478271484375, -1.938720703125, -1.7296142578125, -1.5205078125, -1.3114013671875, -1.102294921875, -0.8931884765625, -0.68408203125, -0.4749755859375, -0.265869140625, -0.0567626953125, 0.15234375, 0.3614501953125, 0.570556640625, 0.7796630859375, 0.98876953125, 1.1978759765625, 1.406982421875, 1.6160888671875, 1.8251953125, 2.0343017578125, 2.243408203125, 2.4525146484375, 2.66162109375, 2.8707275390625, 3.079833984375, 3.2889404296875, 3.498046875, 3.7071533203125, 3.916259765625, 4.1253662109375, 4.33447265625, 4.5435791015625, 4.752685546875, 4.9617919921875, 5.1708984375, 5.3800048828125, 5.589111328125, 5.7982177734375, 6.00732421875, 6.2164306640625, 6.425537109375, 6.6346435546875, 6.84375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 3.0, 8.0, 15.0, 17.0, 29.0, 43.0, 75.0, 84.0, 196.0, 277.0, 526.0, 858.0, 1570.0, 2837.0, 5482.0, 11350.0, 28818.0, 127624.0, 595910.0, 205293.0, 39513.0, 13838.0, 6624.0, 3336.0, 1806.0, 1002.0, 549.0, 322.0, 212.0, 125.0, 67.0, 47.0, 36.0, 19.0, 21.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1875, -9.875244140625, -9.56298828125, -9.250732421875, -8.9384765625, -8.626220703125, -8.31396484375, -8.001708984375, -7.689453125, -7.377197265625, -7.06494140625, -6.752685546875, -6.4404296875, -6.128173828125, -5.81591796875, -5.503662109375, -5.19140625, -4.879150390625, -4.56689453125, -4.254638671875, -3.9423828125, -3.630126953125, -3.31787109375, -3.005615234375, -2.693359375, -2.381103515625, -2.06884765625, -1.756591796875, -1.4443359375, -1.132080078125, -0.81982421875, -0.507568359375, -0.1953125, 0.116943359375, 0.42919921875, 0.741455078125, 1.0537109375, 1.365966796875, 1.67822265625, 1.990478515625, 2.302734375, 2.614990234375, 2.92724609375, 3.239501953125, 3.5517578125, 3.864013671875, 4.17626953125, 4.488525390625, 4.80078125, 5.113037109375, 5.42529296875, 5.737548828125, 6.0498046875, 6.362060546875, 6.67431640625, 6.986572265625, 7.298828125, 7.611083984375, 7.92333984375, 8.235595703125, 8.5478515625, 8.860107421875, 9.17236328125, 9.484619140625, 9.796875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 9.0, 8.0, 10.0, 20.0, 11.0, 12.0, 19.0, 19.0, 30.0, 35.0, 34.0, 30.0, 55.0, 45.0, 40.0, 70.0, 177.0, 1573.0, 294.0, 92.0, 61.0, 40.0, 57.0, 39.0, 43.0, 31.0, 36.0, 25.0, 29.0, 19.0, 18.0, 12.0, 9.0, 9.0, 8.0, 4.0, 7.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.6875, -19.001708984375, -18.31591796875, -17.630126953125, -16.9443359375, -16.258544921875, -15.57275390625, -14.886962890625, -14.201171875, -13.515380859375, -12.82958984375, -12.143798828125, -11.4580078125, -10.772216796875, -10.08642578125, -9.400634765625, -8.71484375, -8.029052734375, -7.34326171875, -6.657470703125, -5.9716796875, -5.285888671875, -4.60009765625, -3.914306640625, -3.228515625, -2.542724609375, -1.85693359375, -1.171142578125, -0.4853515625, 0.200439453125, 0.88623046875, 1.572021484375, 2.2578125, 2.943603515625, 3.62939453125, 4.315185546875, 5.0009765625, 5.686767578125, 6.37255859375, 7.058349609375, 7.744140625, 8.429931640625, 9.11572265625, 9.801513671875, 10.4873046875, 11.173095703125, 11.85888671875, 12.544677734375, 13.23046875, 13.916259765625, 14.60205078125, 15.287841796875, 15.9736328125, 16.659423828125, 17.34521484375, 18.031005859375, 18.716796875, 19.402587890625, 20.08837890625, 20.774169921875, 21.4599609375, 22.145751953125, 22.83154296875, 23.517333984375, 24.203125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 8.0, 5.0, 4.0, 9.0, 13.0, 26.0, 38.0, 60.0, 85.0, 166.0, 331.0, 881.0, 14759.0, 3118041.0, 9884.0, 727.0, 278.0, 159.0, 80.0, 52.0, 30.0, 12.0, 9.0, 7.0, 15.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.375, -114.939453125, -111.50390625, -108.068359375, -104.6328125, -101.197265625, -97.76171875, -94.326171875, -90.890625, -87.455078125, -84.01953125, -80.583984375, -77.1484375, -73.712890625, -70.27734375, -66.841796875, -63.40625, -59.970703125, -56.53515625, -53.099609375, -49.6640625, -46.228515625, -42.79296875, -39.357421875, -35.921875, -32.486328125, -29.05078125, -25.615234375, -22.1796875, -18.744140625, -15.30859375, -11.873046875, -8.4375, -5.001953125, -1.56640625, 1.869140625, 5.3046875, 8.740234375, 12.17578125, 15.611328125, 19.046875, 22.482421875, 25.91796875, 29.353515625, 32.7890625, 36.224609375, 39.66015625, 43.095703125, 46.53125, 49.966796875, 53.40234375, 56.837890625, 60.2734375, 63.708984375, 67.14453125, 70.580078125, 74.015625, 77.451171875, 80.88671875, 84.322265625, 87.7578125, 91.193359375, 94.62890625, 98.064453125, 101.5]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 127.0, 881.0, 10.0], "bins": [-911.3828735351562, -896.7440795898438, -882.105224609375, -867.4664306640625, -852.82763671875, -838.1888427734375, -823.5499877929688, -808.9111938476562, -794.2723999023438, -779.6336059570312, -764.9947509765625, -750.35595703125, -735.7171630859375, -721.078369140625, -706.4395141601562, -691.8007202148438, -677.1619262695312, -662.5231323242188, -647.88427734375, -633.2454833984375, -618.606689453125, -603.9678955078125, -589.3290405273438, -574.6902465820312, -560.0514526367188, -545.4126586914062, -530.7738037109375, -516.135009765625, -501.4962158203125, -486.8573913574219, -472.2185974121094, -457.57977294921875, -442.94091796875, -428.3020935058594, -413.6632995605469, -399.02447509765625, -384.38568115234375, -369.7468566894531, -355.1080627441406, -340.46923828125, -325.8304443359375, -311.1916198730469, -296.5528259277344, -281.91400146484375, -267.27520751953125, -252.63638305664062, -237.99758911132812, -223.3587646484375, -208.719970703125, -194.08116149902344, -179.44235229492188, -164.8035430908203, -150.16473388671875, -135.52590942382812, -120.8871078491211, -106.24829864501953, -91.60948181152344, -76.97067260742188, -62.33186340332031, -47.693050384521484, -33.05424118041992, -18.415428161621094, -3.7766189575195312, 10.862190246582031, 25.500995635986328]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 10.0, 7.0, 6.0, 4.0, 11.0, 5.0, 22.0, 12.0, 18.0, 23.0, 17.0, 16.0, 31.0, 28.0, 40.0, 33.0, 32.0, 28.0, 33.0, 43.0, 43.0, 46.0, 44.0, 49.0, 44.0, 34.0, 42.0, 35.0, 39.0, 33.0, 30.0, 19.0, 28.0, 10.0, 14.0, 17.0, 7.0, 10.0, 8.0, 6.0, 7.0, 9.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.141475677490234, -52.46421813964844, -50.786964416503906, -49.10970687866211, -47.43244934082031, -45.75519561767578, -44.077938079833984, -42.40068054199219, -40.723426818847656, -39.04616928100586, -37.36891555786133, -35.69165802001953, -34.014400482177734, -32.33714294433594, -30.659889221191406, -28.98263168334961, -27.305374145507812, -25.62811851501465, -23.95086097717285, -22.273605346679688, -20.59634780883789, -18.919092178344727, -17.241836547851562, -15.564579963684082, -13.887323379516602, -12.210066795349121, -10.53281021118164, -8.855554580688477, -7.178297996520996, -5.501041412353516, -3.8237857818603516, -2.146529197692871, -0.46927642822265625, 1.2079799175262451, 2.8852362632751465, 4.562492370605469, 6.239748954772949, 7.91700553894043, 9.594261169433594, 11.271517753601074, 12.948774337768555, 14.626030921936035, 16.303287506103516, 17.98054313659668, 19.657798767089844, 21.33505630493164, 23.012311935424805, 24.68956756591797, 26.366825103759766, 28.04408073425293, 29.721338272094727, 31.39859390258789, 33.07585144042969, 34.75310516357422, 36.430362701416016, 38.10762023925781, 39.784873962402344, 41.46213150024414, 43.13938522338867, 44.81664276123047, 46.493900299072266, 48.17115783691406, 49.848411560058594, 51.52566909790039, 53.20292663574219]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 6.0, 7.0, 5.0, 13.0, 12.0, 13.0, 14.0, 14.0, 30.0, 24.0, 29.0, 32.0, 30.0, 44.0, 53.0, 47.0, 46.0, 34.0, 48.0, 45.0, 50.0, 41.0, 40.0, 35.0, 38.0, 31.0, 29.0, 32.0, 25.0, 25.0, 18.0, 18.0, 8.0, 14.0, 11.0, 7.0, 11.0, 3.0, 4.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.5625, -7.3397216796875, -7.116943359375, -6.8941650390625, -6.67138671875, -6.4486083984375, -6.225830078125, -6.0030517578125, -5.7802734375, -5.5574951171875, -5.334716796875, -5.1119384765625, -4.88916015625, -4.6663818359375, -4.443603515625, -4.2208251953125, -3.998046875, -3.7752685546875, -3.552490234375, -3.3297119140625, -3.10693359375, -2.8841552734375, -2.661376953125, -2.4385986328125, -2.2158203125, -1.9930419921875, -1.770263671875, -1.5474853515625, -1.32470703125, -1.1019287109375, -0.879150390625, -0.6563720703125, -0.43359375, -0.2108154296875, 0.011962890625, 0.2347412109375, 0.45751953125, 0.6802978515625, 0.903076171875, 1.1258544921875, 1.3486328125, 1.5714111328125, 1.794189453125, 2.0169677734375, 2.23974609375, 2.4625244140625, 2.685302734375, 2.9080810546875, 3.130859375, 3.3536376953125, 3.576416015625, 3.7991943359375, 4.02197265625, 4.2447509765625, 4.467529296875, 4.6903076171875, 4.9130859375, 5.1358642578125, 5.358642578125, 5.5814208984375, 5.80419921875, 6.0269775390625, 6.249755859375, 6.4725341796875, 6.6953125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 8.0, 18.0, 15.0, 18.0, 25.0, 41.0, 69.0, 85.0, 125.0, 215.0, 271.0, 477.0, 694.0, 1224.0, 2318.0, 4806.0, 13244.0, 65542.0, 842786.0, 2700254.0, 497851.0, 44110.0, 10921.0, 4323.0, 1974.0, 1006.0, 694.0, 366.0, 240.0, 164.0, 130.0, 73.0, 60.0, 35.0, 32.0, 18.0, 11.0, 15.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-15.875, -15.426513671875, -14.97802734375, -14.529541015625, -14.0810546875, -13.632568359375, -13.18408203125, -12.735595703125, -12.287109375, -11.838623046875, -11.39013671875, -10.941650390625, -10.4931640625, -10.044677734375, -9.59619140625, -9.147705078125, -8.69921875, -8.250732421875, -7.80224609375, -7.353759765625, -6.9052734375, -6.456787109375, -6.00830078125, -5.559814453125, -5.111328125, -4.662841796875, -4.21435546875, -3.765869140625, -3.3173828125, -2.868896484375, -2.42041015625, -1.971923828125, -1.5234375, -1.074951171875, -0.62646484375, -0.177978515625, 0.2705078125, 0.718994140625, 1.16748046875, 1.615966796875, 2.064453125, 2.512939453125, 2.96142578125, 3.409912109375, 3.8583984375, 4.306884765625, 4.75537109375, 5.203857421875, 5.65234375, 6.100830078125, 6.54931640625, 6.997802734375, 7.4462890625, 7.894775390625, 8.34326171875, 8.791748046875, 9.240234375, 9.688720703125, 10.13720703125, 10.585693359375, 11.0341796875, 11.482666015625, 11.93115234375, 12.379638671875, 12.828125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 8.0, 9.0, 9.0, 8.0, 24.0, 16.0, 28.0, 42.0, 54.0, 87.0, 95.0, 135.0, 225.0, 396.0, 532.0, 707.0, 554.0, 375.0, 257.0, 147.0, 97.0, 71.0, 51.0, 43.0, 26.0, 24.0, 14.0, 12.0, 3.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.40625, -12.951904296875, -12.49755859375, -12.043212890625, -11.5888671875, -11.134521484375, -10.68017578125, -10.225830078125, -9.771484375, -9.317138671875, -8.86279296875, -8.408447265625, -7.9541015625, -7.499755859375, -7.04541015625, -6.591064453125, -6.13671875, -5.682373046875, -5.22802734375, -4.773681640625, -4.3193359375, -3.864990234375, -3.41064453125, -2.956298828125, -2.501953125, -2.047607421875, -1.59326171875, -1.138916015625, -0.6845703125, -0.230224609375, 0.22412109375, 0.678466796875, 1.1328125, 1.587158203125, 2.04150390625, 2.495849609375, 2.9501953125, 3.404541015625, 3.85888671875, 4.313232421875, 4.767578125, 5.221923828125, 5.67626953125, 6.130615234375, 6.5849609375, 7.039306640625, 7.49365234375, 7.947998046875, 8.40234375, 8.856689453125, 9.31103515625, 9.765380859375, 10.2197265625, 10.674072265625, 11.12841796875, 11.582763671875, 12.037109375, 12.491455078125, 12.94580078125, 13.400146484375, 13.8544921875, 14.308837890625, 14.76318359375, 15.217529296875, 15.671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 5.0, 7.0, 14.0, 24.0, 22.0, 33.0, 61.0, 81.0, 143.0, 236.0, 515.0, 2346.0, 23430.0, 2878115.0, 1270843.0, 15637.0, 1692.0, 469.0, 192.0, 113.0, 95.0, 52.0, 35.0, 29.0, 15.0, 25.0, 9.0, 9.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-54.0, -52.4541015625, -50.908203125, -49.3623046875, -47.81640625, -46.2705078125, -44.724609375, -43.1787109375, -41.6328125, -40.0869140625, -38.541015625, -36.9951171875, -35.44921875, -33.9033203125, -32.357421875, -30.8115234375, -29.265625, -27.7197265625, -26.173828125, -24.6279296875, -23.08203125, -21.5361328125, -19.990234375, -18.4443359375, -16.8984375, -15.3525390625, -13.806640625, -12.2607421875, -10.71484375, -9.1689453125, -7.623046875, -6.0771484375, -4.53125, -2.9853515625, -1.439453125, 0.1064453125, 1.65234375, 3.1982421875, 4.744140625, 6.2900390625, 7.8359375, 9.3818359375, 10.927734375, 12.4736328125, 14.01953125, 15.5654296875, 17.111328125, 18.6572265625, 20.203125, 21.7490234375, 23.294921875, 24.8408203125, 26.38671875, 27.9326171875, 29.478515625, 31.0244140625, 32.5703125, 34.1162109375, 35.662109375, 37.2080078125, 38.75390625, 40.2998046875, 41.845703125, 43.3916015625, 44.9375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 18.0, 36.0, 86.0, 180.0, 208.0, 200.0, 129.0, 85.0, 36.0, 13.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.62261962890625, -160.40814208984375, -157.19366455078125, -153.97918701171875, -150.76470947265625, -147.55023193359375, -144.3357696533203, -141.1212921142578, -137.9068145751953, -134.6923370361328, -131.4778594970703, -128.2633819580078, -125.04891204833984, -121.83443450927734, -118.61995697021484, -115.40548706054688, -112.19100952148438, -108.97653198242188, -105.76205444335938, -102.5475845336914, -99.3331069946289, -96.1186294555664, -92.9041519165039, -89.68968200683594, -86.4751968383789, -83.2607192993164, -80.0462417602539, -76.83177185058594, -73.61729431152344, -70.40281677246094, -67.18833923339844, -63.9738655090332, -60.759395599365234, -57.544918060302734, -54.3304443359375, -51.115966796875, -47.901493072509766, -44.687015533447266, -41.47254180908203, -38.25806427001953, -35.04358673095703, -31.829111099243164, -28.614635467529297, -25.400157928466797, -22.185684204101562, -18.971206665039062, -15.756731033325195, -12.542255401611328, -9.327781677246094, -6.113306045532227, -2.898829936981201, 0.3156461715698242, 3.5301218032836914, 6.744598388671875, 9.959074020385742, 13.17354965209961, 16.388025283813477, 19.602500915527344, 22.81697654724121, 26.031452178955078, 29.245929718017578, 32.46040344238281, 35.67488098144531, 38.88935852050781, 42.10383224487305]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 14.0, 10.0, 8.0, 17.0, 15.0, 18.0, 20.0, 20.0, 24.0, 35.0, 33.0, 26.0, 41.0, 36.0, 30.0, 45.0, 46.0, 41.0, 36.0, 35.0, 42.0, 33.0, 42.0, 30.0, 43.0, 36.0, 42.0, 29.0, 29.0, 16.0, 13.0, 18.0, 9.0, 13.0, 10.0, 6.0, 5.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.07271194458008, -33.81715774536133, -32.56160354614258, -31.306047439575195, -30.050491333007812, -28.794937133789062, -27.539382934570312, -26.28382682800293, -25.028270721435547, -23.772716522216797, -22.517160415649414, -21.261606216430664, -20.00605010986328, -18.75049591064453, -17.49494171142578, -16.2393856048584, -14.983831405639648, -13.728276252746582, -12.472721099853516, -11.217166900634766, -9.961610794067383, -8.706056594848633, -7.450501441955566, -6.1949462890625, -4.939391136169434, -3.683835983276367, -2.42828106880188, -1.1727261543273926, 0.08282899856567383, 1.3383841514587402, 2.5939388275146484, 3.849493980407715, 5.105049133300781, 6.360604286193848, 7.616159439086914, 8.871713638305664, 10.127269744873047, 11.382823944091797, 12.638379096984863, 13.89393424987793, 15.149489402770996, 16.405044555664062, 17.660598754882812, 18.916154861450195, 20.171709060668945, 21.427265167236328, 22.682819366455078, 23.938373565673828, 25.19392967224121, 26.44948387145996, 27.705039978027344, 28.960594177246094, 30.216150283813477, 31.471704483032227, 32.72726058959961, 33.98281478881836, 35.23836898803711, 36.49392318725586, 37.74947738647461, 39.005035400390625, 40.260589599609375, 41.516143798828125, 42.771697998046875, 44.027252197265625, 45.28281021118164]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 8.0, 16.0, 7.0, 11.0, 14.0, 11.0, 20.0, 20.0, 23.0, 32.0, 21.0, 37.0, 44.0, 47.0, 45.0, 52.0, 40.0, 45.0, 33.0, 46.0, 40.0, 35.0, 51.0, 34.0, 33.0, 26.0, 34.0, 23.0, 23.0, 19.0, 12.0, 9.0, 17.0, 16.0, 11.0, 7.0, 9.0, 7.0, 2.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.4852294921875, -6.282958984375, -6.0806884765625, -5.87841796875, -5.6761474609375, -5.473876953125, -5.2716064453125, -5.0693359375, -4.8670654296875, -4.664794921875, -4.4625244140625, -4.26025390625, -4.0579833984375, -3.855712890625, -3.6534423828125, -3.451171875, -3.2489013671875, -3.046630859375, -2.8443603515625, -2.64208984375, -2.4398193359375, -2.237548828125, -2.0352783203125, -1.8330078125, -1.6307373046875, -1.428466796875, -1.2261962890625, -1.02392578125, -0.8216552734375, -0.619384765625, -0.4171142578125, -0.21484375, -0.0125732421875, 0.189697265625, 0.3919677734375, 0.59423828125, 0.7965087890625, 0.998779296875, 1.2010498046875, 1.4033203125, 1.6055908203125, 1.807861328125, 2.0101318359375, 2.21240234375, 2.4146728515625, 2.616943359375, 2.8192138671875, 3.021484375, 3.2237548828125, 3.426025390625, 3.6282958984375, 3.83056640625, 4.0328369140625, 4.235107421875, 4.4373779296875, 4.6396484375, 4.8419189453125, 5.044189453125, 5.2464599609375, 5.44873046875, 5.6510009765625, 5.853271484375, 6.0555419921875, 6.2578125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 4.0, 7.0, 13.0, 10.0, 14.0, 38.0, 47.0, 59.0, 88.0, 115.0, 151.0, 204.0, 332.0, 451.0, 640.0, 924.0, 1257.0, 1881.0, 2681.0, 4020.0, 5983.0, 8657.0, 12933.0, 19853.0, 31616.0, 52753.0, 93197.0, 177639.0, 266353.0, 153158.0, 81764.0, 47400.0, 29122.0, 18149.0, 12003.0, 7743.0, 5172.0, 3653.0, 2533.0, 1762.0, 1196.0, 867.0, 643.0, 442.0, 300.0, 232.0, 164.0, 98.0, 74.0, 59.0, 32.0, 30.0, 16.0, 14.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.2529296875, -0.244873046875, -0.23681640625, -0.228759765625, -0.220703125, -0.212646484375, -0.20458984375, -0.196533203125, -0.1884765625, -0.180419921875, -0.17236328125, -0.164306640625, -0.15625, -0.148193359375, -0.14013671875, -0.132080078125, -0.1240234375, -0.115966796875, -0.10791015625, -0.099853515625, -0.091796875, -0.083740234375, -0.07568359375, -0.067626953125, -0.0595703125, -0.051513671875, -0.04345703125, -0.035400390625, -0.02734375, -0.019287109375, -0.01123046875, -0.003173828125, 0.0048828125, 0.012939453125, 0.02099609375, 0.029052734375, 0.037109375, 0.045166015625, 0.05322265625, 0.061279296875, 0.0693359375, 0.077392578125, 0.08544921875, 0.093505859375, 0.1015625, 0.109619140625, 0.11767578125, 0.125732421875, 0.1337890625, 0.141845703125, 0.14990234375, 0.157958984375, 0.166015625, 0.174072265625, 0.18212890625, 0.190185546875, 0.1982421875, 0.206298828125, 0.21435546875, 0.222412109375, 0.23046875, 0.238525390625, 0.24658203125, 0.254638671875, 0.2626953125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 9.0, 4.0, 8.0, 7.0, 13.0, 10.0, 10.0, 13.0, 25.0, 25.0, 21.0, 30.0, 36.0, 42.0, 38.0, 38.0, 50.0, 45.0, 35.0, 1057.0, 54.0, 49.0, 44.0, 42.0, 38.0, 31.0, 33.0, 41.0, 27.0, 22.0, 22.0, 12.0, 11.0, 16.0, 20.0, 13.0, 14.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.07720947265625, -3.9473876953125, -3.81756591796875, -3.687744140625, -3.55792236328125, -3.4281005859375, -3.29827880859375, -3.16845703125, -3.03863525390625, -2.9088134765625, -2.77899169921875, -2.649169921875, -2.51934814453125, -2.3895263671875, -2.25970458984375, -2.1298828125, -2.00006103515625, -1.8702392578125, -1.74041748046875, -1.610595703125, -1.48077392578125, -1.3509521484375, -1.22113037109375, -1.09130859375, -0.96148681640625, -0.8316650390625, -0.70184326171875, -0.572021484375, -0.44219970703125, -0.3123779296875, -0.18255615234375, -0.052734375, 0.07708740234375, 0.2069091796875, 0.33673095703125, 0.466552734375, 0.59637451171875, 0.7261962890625, 0.85601806640625, 0.98583984375, 1.11566162109375, 1.2454833984375, 1.37530517578125, 1.505126953125, 1.63494873046875, 1.7647705078125, 1.89459228515625, 2.0244140625, 2.15423583984375, 2.2840576171875, 2.41387939453125, 2.543701171875, 2.67352294921875, 2.8033447265625, 2.93316650390625, 3.06298828125, 3.19281005859375, 3.3226318359375, 3.45245361328125, 3.582275390625, 3.71209716796875, 3.8419189453125, 3.97174072265625, 4.1015625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 10.0, 27.0, 31.0, 58.0, 66.0, 111.0, 133.0, 212.0, 336.0, 493.0, 716.0, 1076.0, 1640.0, 2488.0, 3794.0, 5936.0, 9315.0, 14942.0, 24893.0, 41446.0, 72332.0, 133492.0, 1293290.0, 216159.0, 114863.0, 63230.0, 36825.0, 21618.0, 13533.0, 8380.0, 5392.0, 3522.0, 2174.0, 1506.0, 1015.0, 700.0, 466.0, 299.0, 186.0, 147.0, 90.0, 64.0, 39.0, 27.0, 21.0, 7.0, 11.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.198486328125, -0.1922607421875, -0.18603515625, -0.1798095703125, -0.173583984375, -0.1673583984375, -0.1611328125, -0.1549072265625, -0.148681640625, -0.1424560546875, -0.13623046875, -0.1300048828125, -0.123779296875, -0.1175537109375, -0.111328125, -0.1051025390625, -0.098876953125, -0.0926513671875, -0.08642578125, -0.0802001953125, -0.073974609375, -0.0677490234375, -0.0615234375, -0.0552978515625, -0.049072265625, -0.0428466796875, -0.03662109375, -0.0303955078125, -0.024169921875, -0.0179443359375, -0.01171875, -0.0054931640625, 0.000732421875, 0.0069580078125, 0.01318359375, 0.0194091796875, 0.025634765625, 0.0318603515625, 0.0380859375, 0.0443115234375, 0.050537109375, 0.0567626953125, 0.06298828125, 0.0692138671875, 0.075439453125, 0.0816650390625, 0.087890625, 0.0941162109375, 0.100341796875, 0.1065673828125, 0.11279296875, 0.1190185546875, 0.125244140625, 0.1314697265625, 0.1376953125, 0.1439208984375, 0.150146484375, 0.1563720703125, 0.16259765625, 0.1688232421875, 0.175048828125, 0.1812744140625, 0.1875, 0.1937255859375, 0.199951171875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 6.0, 2.0, 11.0, 9.0, 14.0, 16.0, 15.0, 14.0, 23.0, 23.0, 30.0, 39.0, 53.0, 88.0, 81.0, 85.0, 119.0, 83.0, 62.0, 36.0, 44.0, 25.0, 17.0, 12.0, 4.0, 14.0, 10.0, 9.0, 3.0, 4.0, 3.0, 4.0, 2.0, 6.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.0001875162124633789, -0.0001815836876630783, -0.0001756511628627777, -0.0001697186380624771, -0.00016378611326217651, -0.00015785358846187592, -0.00015192106366157532, -0.00014598853886127472, -0.00014005601406097412, -0.00013412348926067352, -0.00012819096446037292, -0.00012225843966007233, -0.00011632591485977173, -0.00011039339005947113, -0.00010446086525917053, -9.852834045886993e-05, -9.259581565856934e-05, -8.666329085826874e-05, -8.073076605796814e-05, -7.479824125766754e-05, -6.886571645736694e-05, -6.293319165706635e-05, -5.700066685676575e-05, -5.106814205646515e-05, -4.513561725616455e-05, -3.920309245586395e-05, -3.3270567655563354e-05, -2.7338042855262756e-05, -2.1405518054962158e-05, -1.547299325466156e-05, -9.540468454360962e-06, -3.6079436540603638e-06, 2.3245811462402344e-06, 8.257105946540833e-06, 1.418963074684143e-05, 2.012215554714203e-05, 2.6054680347442627e-05, 3.1987205147743225e-05, 3.791972994804382e-05, 4.385225474834442e-05, 4.978477954864502e-05, 5.571730434894562e-05, 6.164982914924622e-05, 6.758235394954681e-05, 7.351487874984741e-05, 7.944740355014801e-05, 8.537992835044861e-05, 9.13124531507492e-05, 9.72449779510498e-05, 0.0001031775027513504, 0.000109110027551651, 0.0001150425523519516, 0.0001209750771522522, 0.0001269076019525528, 0.0001328401267528534, 0.000138772651553154, 0.0001447051763534546, 0.0001506377011537552, 0.00015657022595405579, 0.00016250275075435638, 0.00016843527555465698, 0.00017436780035495758, 0.00018030032515525818, 0.00018623284995555878, 0.00019216537475585938]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 6.0, 3.0, 4.0, 3.0, 9.0, 12.0, 4.0, 7.0, 12.0, 10.0, 12.0, 16.0, 26.0, 24.0, 24.0, 29.0, 53.0, 86.0, 141.0, 275.0, 787.0, 4570.0, 58321.0, 945719.0, 33783.0, 3268.0, 635.0, 225.0, 118.0, 82.0, 51.0, 40.0, 39.0, 23.0, 17.0, 20.0, 22.0, 12.0, 15.0, 16.0, 6.0, 7.0, 1.0, 3.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.003570556640625, -0.0034637153148651123, -0.0033568739891052246, -0.003250032663345337, -0.0031431913375854492, -0.0030363500118255615, -0.002929508686065674, -0.002822667360305786, -0.0027158260345458984, -0.0026089847087860107, -0.002502143383026123, -0.0023953020572662354, -0.0022884607315063477, -0.00218161940574646, -0.0020747780799865723, -0.0019679367542266846, -0.0018610954284667969, -0.0017542541027069092, -0.0016474127769470215, -0.0015405714511871338, -0.001433730125427246, -0.0013268887996673584, -0.0012200474739074707, -0.001113206148147583, -0.0010063648223876953, -0.0008995234966278076, -0.0007926821708679199, -0.0006858408451080322, -0.0005789995193481445, -0.00047215819358825684, -0.00036531686782836914, -0.00025847554206848145, -0.00015163421630859375, -4.4792890548706055e-05, 6.204843521118164e-05, 0.00016888976097106934, 0.00027573108673095703, 0.0003825724124908447, 0.0004894137382507324, 0.0005962550640106201, 0.0007030963897705078, 0.0008099377155303955, 0.0009167790412902832, 0.001023620367050171, 0.0011304616928100586, 0.0012373030185699463, 0.001344144344329834, 0.0014509856700897217, 0.0015578269958496094, 0.001664668321609497, 0.0017715096473693848, 0.0018783509731292725, 0.00198519229888916, 0.002092033624649048, 0.0021988749504089355, 0.0023057162761688232, 0.002412557601928711, 0.0025193989276885986, 0.0026262402534484863, 0.002733081579208374, 0.0028399229049682617, 0.0029467642307281494, 0.003053605556488037, 0.003160446882247925, 0.0032672882080078125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 50.0, 301.0, 532.0, 103.0, 18.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004028836265206337, -0.0003723732952494174, -0.0003418629930820316, -0.00031135266181081533, -0.0002808423596434295, -0.00025033202837221324, -0.0002198217116529122, -0.00018931139493361115, -0.0001588010782143101, -0.00012829076149500906, -9.778044477570802e-05, -6.727012078044936e-05, -3.6759804061148316e-05, -6.2494800658896565e-06, 2.426083665341139e-05, 5.477115337271243e-05, 8.528147009201348e-05, 0.00011579178681131452, 0.00014630210353061557, 0.00017681243480183184, 0.00020732273696921766, 0.00023783306824043393, 0.00026834337040781975, 0.000298853701679036, 0.0003293640329502523, 0.00035987436422146857, 0.0003903846663888544, 0.00042089499766007066, 0.0004514052998274565, 0.00048191563109867275, 0.000512425962369889, 0.0005429362645372748, 0.0005734465667046607, 0.0006039568688720465, 0.0006344672292470932, 0.000664977531414479, 0.0006954878335818648, 0.0007259981939569116, 0.0007565084961242974, 0.0007870187982916832, 0.000817529100459069, 0.0008480394026264548, 0.0008785497630015016, 0.0009090600651688874, 0.0009395703673362732, 0.0009700807277113199, 0.0010005909716710448, 0.0010311013320460916, 0.0010616116924211383, 0.001092122052796185, 0.00112263229675591, 0.0011531426571309566, 0.0011836530175060034, 0.0012141632614657283, 0.001244673621840775, 0.0012751838658005, 0.0013056942261755466, 0.0013362045865505934, 0.0013667148305103183, 0.001397225190885365, 0.0014277355512604117, 0.0014582457952201366, 0.0014887561555951834, 0.00151926651597023, 0.001549776759929955]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 9.0, 2.0, 6.0, 11.0, 14.0, 14.0, 21.0, 22.0, 31.0, 31.0, 23.0, 42.0, 29.0, 37.0, 38.0, 36.0, 37.0, 40.0, 57.0, 45.0, 40.0, 40.0, 45.0, 43.0, 30.0, 28.0, 40.0, 30.0, 22.0, 26.0, 18.0, 20.0, 21.0, 8.0, 10.0, 8.0, 11.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00011587142944335938, -0.0001124255359172821, -0.00010897964239120483, -0.00010553374886512756, -0.00010208785533905029, -9.864196181297302e-05, -9.519606828689575e-05, -9.175017476081848e-05, -8.830428123474121e-05, -8.485838770866394e-05, -8.141249418258667e-05, -7.79666006565094e-05, -7.452070713043213e-05, -7.107481360435486e-05, -6.762892007827759e-05, -6.418302655220032e-05, -6.073713302612305e-05, -5.7291239500045776e-05, -5.3845345973968506e-05, -5.0399452447891235e-05, -4.6953558921813965e-05, -4.3507665395736694e-05, -4.0061771869659424e-05, -3.661587834358215e-05, -3.316998481750488e-05, -2.9724091291427612e-05, -2.6278197765350342e-05, -2.283230423927307e-05, -1.93864107131958e-05, -1.594051718711853e-05, -1.249462366104126e-05, -9.04873013496399e-06, -5.602836608886719e-06, -2.1569430828094482e-06, 1.2889504432678223e-06, 4.734843969345093e-06, 8.180737495422363e-06, 1.1626631021499634e-05, 1.5072524547576904e-05, 1.8518418073654175e-05, 2.1964311599731445e-05, 2.5410205125808716e-05, 2.8856098651885986e-05, 3.230199217796326e-05, 3.574788570404053e-05, 3.91937792301178e-05, 4.263967275619507e-05, 4.608556628227234e-05, 4.953145980834961e-05, 5.297735333442688e-05, 5.642324686050415e-05, 5.986914038658142e-05, 6.331503391265869e-05, 6.676092743873596e-05, 7.020682096481323e-05, 7.36527144908905e-05, 7.709860801696777e-05, 8.054450154304504e-05, 8.399039506912231e-05, 8.743628859519958e-05, 9.088218212127686e-05, 9.432807564735413e-05, 9.77739691734314e-05, 0.00010121986269950867, 0.00010466575622558594]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 8.0, 16.0, 7.0, 11.0, 14.0, 11.0, 20.0, 20.0, 23.0, 32.0, 21.0, 37.0, 44.0, 47.0, 45.0, 52.0, 40.0, 45.0, 33.0, 46.0, 40.0, 35.0, 51.0, 34.0, 33.0, 26.0, 34.0, 23.0, 23.0, 19.0, 12.0, 9.0, 17.0, 16.0, 11.0, 7.0, 9.0, 7.0, 2.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.4852294921875, -6.282958984375, -6.0806884765625, -5.87841796875, -5.6761474609375, -5.473876953125, -5.2716064453125, -5.0693359375, -4.8670654296875, -4.664794921875, -4.4625244140625, -4.26025390625, -4.0579833984375, -3.855712890625, -3.6534423828125, -3.451171875, -3.2489013671875, -3.046630859375, -2.8443603515625, -2.64208984375, -2.4398193359375, -2.237548828125, -2.0352783203125, -1.8330078125, -1.6307373046875, -1.428466796875, -1.2261962890625, -1.02392578125, -0.8216552734375, -0.619384765625, -0.4171142578125, -0.21484375, -0.0125732421875, 0.189697265625, 0.3919677734375, 0.59423828125, 0.7965087890625, 0.998779296875, 1.2010498046875, 1.4033203125, 1.6055908203125, 1.807861328125, 2.0101318359375, 2.21240234375, 2.4146728515625, 2.616943359375, 2.8192138671875, 3.021484375, 3.2237548828125, 3.426025390625, 3.6282958984375, 3.83056640625, 4.0328369140625, 4.235107421875, 4.4373779296875, 4.6396484375, 4.8419189453125, 5.044189453125, 5.2464599609375, 5.44873046875, 5.6510009765625, 5.853271484375, 6.0555419921875, 6.2578125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 9.0, 12.0, 18.0, 19.0, 27.0, 32.0, 55.0, 81.0, 94.0, 140.0, 180.0, 260.0, 353.0, 519.0, 721.0, 1028.0, 1620.0, 2571.0, 4441.0, 8581.0, 20786.0, 63486.0, 220317.0, 472582.0, 166261.0, 49214.0, 16902.0, 7312.0, 3798.0, 2314.0, 1495.0, 953.0, 678.0, 490.0, 326.0, 232.0, 167.0, 132.0, 105.0, 71.0, 49.0, 40.0, 22.0, 24.0, 9.0, 15.0, 10.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.80078125, -6.59710693359375, -6.3934326171875, -6.18975830078125, -5.986083984375, -5.78240966796875, -5.5787353515625, -5.37506103515625, -5.17138671875, -4.96771240234375, -4.7640380859375, -4.56036376953125, -4.356689453125, -4.15301513671875, -3.9493408203125, -3.74566650390625, -3.5419921875, -3.33831787109375, -3.1346435546875, -2.93096923828125, -2.727294921875, -2.52362060546875, -2.3199462890625, -2.11627197265625, -1.91259765625, -1.70892333984375, -1.5052490234375, -1.30157470703125, -1.097900390625, -0.89422607421875, -0.6905517578125, -0.48687744140625, -0.283203125, -0.07952880859375, 0.1241455078125, 0.32781982421875, 0.531494140625, 0.73516845703125, 0.9388427734375, 1.14251708984375, 1.34619140625, 1.54986572265625, 1.7535400390625, 1.95721435546875, 2.160888671875, 2.36456298828125, 2.5682373046875, 2.77191162109375, 2.9755859375, 3.17926025390625, 3.3829345703125, 3.58660888671875, 3.790283203125, 3.99395751953125, 4.1976318359375, 4.40130615234375, 4.60498046875, 4.80865478515625, 5.0123291015625, 5.21600341796875, 5.419677734375, 5.62335205078125, 5.8270263671875, 6.03070068359375, 6.234375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 4.0, 4.0, 6.0, 9.0, 6.0, 14.0, 11.0, 12.0, 18.0, 28.0, 28.0, 24.0, 21.0, 38.0, 38.0, 44.0, 44.0, 51.0, 75.0, 232.0, 1540.0, 281.0, 75.0, 47.0, 45.0, 48.0, 39.0, 37.0, 32.0, 33.0, 23.0, 16.0, 26.0, 22.0, 19.0, 13.0, 14.0, 4.0, 5.0, 2.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.5, -19.851318359375, -19.20263671875, -18.553955078125, -17.9052734375, -17.256591796875, -16.60791015625, -15.959228515625, -15.310546875, -14.661865234375, -14.01318359375, -13.364501953125, -12.7158203125, -12.067138671875, -11.41845703125, -10.769775390625, -10.12109375, -9.472412109375, -8.82373046875, -8.175048828125, -7.5263671875, -6.877685546875, -6.22900390625, -5.580322265625, -4.931640625, -4.282958984375, -3.63427734375, -2.985595703125, -2.3369140625, -1.688232421875, -1.03955078125, -0.390869140625, 0.2578125, 0.906494140625, 1.55517578125, 2.203857421875, 2.8525390625, 3.501220703125, 4.14990234375, 4.798583984375, 5.447265625, 6.095947265625, 6.74462890625, 7.393310546875, 8.0419921875, 8.690673828125, 9.33935546875, 9.988037109375, 10.63671875, 11.285400390625, 11.93408203125, 12.582763671875, 13.2314453125, 13.880126953125, 14.52880859375, 15.177490234375, 15.826171875, 16.474853515625, 17.12353515625, 17.772216796875, 18.4208984375, 19.069580078125, 19.71826171875, 20.366943359375, 21.015625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 5.0, 10.0, 13.0, 21.0, 27.0, 40.0, 78.0, 116.0, 188.0, 392.0, 1198.0, 60445.0, 3079378.0, 2694.0, 502.0, 234.0, 127.0, 95.0, 56.0, 33.0, 23.0, 14.0, 16.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.1875, -105.197265625, -102.20703125, -99.216796875, -96.2265625, -93.236328125, -90.24609375, -87.255859375, -84.265625, -81.275390625, -78.28515625, -75.294921875, -72.3046875, -69.314453125, -66.32421875, -63.333984375, -60.34375, -57.353515625, -54.36328125, -51.373046875, -48.3828125, -45.392578125, -42.40234375, -39.412109375, -36.421875, -33.431640625, -30.44140625, -27.451171875, -24.4609375, -21.470703125, -18.48046875, -15.490234375, -12.5, -9.509765625, -6.51953125, -3.529296875, -0.5390625, 2.451171875, 5.44140625, 8.431640625, 11.421875, 14.412109375, 17.40234375, 20.392578125, 23.3828125, 26.373046875, 29.36328125, 32.353515625, 35.34375, 38.333984375, 41.32421875, 44.314453125, 47.3046875, 50.294921875, 53.28515625, 56.275390625, 59.265625, 62.255859375, 65.24609375, 68.236328125, 71.2265625, 74.216796875, 77.20703125, 80.197265625, 83.1875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 20.0, 283.0, 590.0, 109.0, 16.0, 0.0, 1.0, 0.0, 1.0], "bins": [-237.1805419921875, -233.03941345214844, -228.89828491210938, -224.75714111328125, -220.6160125732422, -216.47488403320312, -212.33375549316406, -208.192626953125, -204.05148315429688, -199.9103546142578, -195.76922607421875, -191.62808227539062, -187.48695373535156, -183.3458251953125, -179.20469665527344, -175.06356811523438, -170.9224395751953, -166.78131103515625, -162.6401824951172, -158.49903869628906, -154.35791015625, -150.21678161621094, -146.07565307617188, -141.9345245361328, -137.79339599609375, -133.6522674560547, -129.51113891601562, -125.37000274658203, -121.22886657714844, -117.08773803710938, -112.94660949707031, -108.80548095703125, -104.66434478759766, -100.5232162475586, -96.382080078125, -92.24095153808594, -88.09982299804688, -83.95868682861328, -79.81755828857422, -75.67642211914062, -71.53529357910156, -67.3941650390625, -63.253028869628906, -59.111900329589844, -54.970767974853516, -50.82963562011719, -46.688507080078125, -42.5473747253418, -38.40624237060547, -34.26511001586914, -30.123979568481445, -25.98284912109375, -21.841716766357422, -17.700584411621094, -13.559453964233398, -9.418323516845703, -5.277189254760742, -1.1360578536987305, 3.0050735473632812, 7.146204948425293, 11.287336349487305, 15.428468704223633, 19.569599151611328, 23.710729598999023, 27.85186195373535]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 8.0, 16.0, 10.0, 14.0, 11.0, 14.0, 26.0, 23.0, 12.0, 29.0, 25.0, 38.0, 32.0, 36.0, 27.0, 41.0, 35.0, 39.0, 47.0, 37.0, 42.0, 38.0, 41.0, 55.0, 38.0, 42.0, 26.0, 28.0, 34.0, 13.0, 33.0, 18.0, 15.0, 13.0, 7.0, 10.0, 7.0, 3.0, 4.0, 6.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0], "bins": [-61.30418395996094, -59.64155578613281, -57.97892761230469, -56.3162956237793, -54.65366744995117, -52.99103927612305, -51.328407287597656, -49.66577911376953, -48.003150939941406, -46.34052276611328, -44.677894592285156, -43.015262603759766, -41.35263442993164, -39.690006256103516, -38.027374267578125, -36.36474609375, -34.702117919921875, -33.03948974609375, -31.376859664916992, -29.714229583740234, -28.05160140991211, -26.388973236083984, -24.726343154907227, -23.06371307373047, -21.401084899902344, -19.73845672607422, -18.07582664489746, -16.413196563720703, -14.750568389892578, -13.087939262390137, -11.425310134887695, -9.762681007385254, -8.100048065185547, -6.4374189376831055, -4.774789810180664, -3.1121606826782227, -1.4495315551757812, 0.21309757232666016, 1.8757266998291016, 3.538355827331543, 5.200984954833984, 6.863614082336426, 8.526243209838867, 10.188872337341309, 11.85150146484375, 13.514130592346191, 15.176759719848633, 16.83938980102539, 18.502017974853516, 20.16464614868164, 21.8272762298584, 23.489906311035156, 25.15253448486328, 26.815162658691406, 28.477792739868164, 30.140422821044922, 31.803050994873047, 33.46567916870117, 35.12831115722656, 36.79093933105469, 38.45356750488281, 40.11619567871094, 41.77882385253906, 43.44145584106445, 45.10408401489258]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 9.0, 13.0, 10.0, 12.0, 12.0, 12.0, 12.0, 22.0, 27.0, 26.0, 30.0, 40.0, 40.0, 45.0, 42.0, 53.0, 45.0, 39.0, 46.0, 44.0, 45.0, 37.0, 47.0, 35.0, 30.0, 41.0, 35.0, 23.0, 21.0, 19.0, 14.0, 13.0, 13.0, 10.0, 15.0, 7.0, 8.0, 2.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68359375, -7.45257568359375, -7.2215576171875, -6.99053955078125, -6.759521484375, -6.52850341796875, -6.2974853515625, -6.06646728515625, -5.83544921875, -5.60443115234375, -5.3734130859375, -5.14239501953125, -4.911376953125, -4.68035888671875, -4.4493408203125, -4.21832275390625, -3.9873046875, -3.75628662109375, -3.5252685546875, -3.29425048828125, -3.063232421875, -2.83221435546875, -2.6011962890625, -2.37017822265625, -2.13916015625, -1.90814208984375, -1.6771240234375, -1.44610595703125, -1.215087890625, -0.98406982421875, -0.7530517578125, -0.52203369140625, -0.291015625, -0.05999755859375, 0.1710205078125, 0.40203857421875, 0.633056640625, 0.86407470703125, 1.0950927734375, 1.32611083984375, 1.55712890625, 1.78814697265625, 2.0191650390625, 2.25018310546875, 2.481201171875, 2.71221923828125, 2.9432373046875, 3.17425537109375, 3.4052734375, 3.63629150390625, 3.8673095703125, 4.09832763671875, 4.329345703125, 4.56036376953125, 4.7913818359375, 5.02239990234375, 5.25341796875, 5.48443603515625, 5.7154541015625, 5.94647216796875, 6.177490234375, 6.40850830078125, 6.6395263671875, 6.87054443359375, 7.1015625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 6.0, 8.0, 8.0, 11.0, 15.0, 20.0, 29.0, 36.0, 50.0, 69.0, 92.0, 128.0, 195.0, 284.0, 473.0, 910.0, 1955.0, 4862.0, 14553.0, 100522.0, 1443921.0, 2358644.0, 232494.0, 23075.0, 6581.0, 2550.0, 1141.0, 582.0, 379.0, 198.0, 128.0, 96.0, 72.0, 48.0, 34.0, 25.0, 20.0, 22.0, 18.0, 8.0, 11.0, 6.0, 2.0, 0.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.4375, -15.9561767578125, -15.474853515625, -14.9935302734375, -14.51220703125, -14.0308837890625, -13.549560546875, -13.0682373046875, -12.5869140625, -12.1055908203125, -11.624267578125, -11.1429443359375, -10.66162109375, -10.1802978515625, -9.698974609375, -9.2176513671875, -8.736328125, -8.2550048828125, -7.773681640625, -7.2923583984375, -6.81103515625, -6.3297119140625, -5.848388671875, -5.3670654296875, -4.8857421875, -4.4044189453125, -3.923095703125, -3.4417724609375, -2.96044921875, -2.4791259765625, -1.997802734375, -1.5164794921875, -1.03515625, -0.5538330078125, -0.072509765625, 0.4088134765625, 0.89013671875, 1.3714599609375, 1.852783203125, 2.3341064453125, 2.8154296875, 3.2967529296875, 3.778076171875, 4.2593994140625, 4.74072265625, 5.2220458984375, 5.703369140625, 6.1846923828125, 6.666015625, 7.1473388671875, 7.628662109375, 8.1099853515625, 8.59130859375, 9.0726318359375, 9.553955078125, 10.0352783203125, 10.5166015625, 10.9979248046875, 11.479248046875, 11.9605712890625, 12.44189453125, 12.9232177734375, 13.404541015625, 13.8858642578125, 14.3671875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 9.0, 11.0, 13.0, 15.0, 24.0, 24.0, 37.0, 44.0, 71.0, 67.0, 108.0, 171.0, 220.0, 334.0, 478.0, 557.0, 551.0, 441.0, 252.0, 162.0, 114.0, 93.0, 62.0, 57.0, 33.0, 21.0, 17.0, 12.0, 10.0, 10.0, 11.0, 4.0, 2.0, 8.0, 2.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.109375, -11.7142333984375, -11.319091796875, -10.9239501953125, -10.52880859375, -10.1336669921875, -9.738525390625, -9.3433837890625, -8.9482421875, -8.5531005859375, -8.157958984375, -7.7628173828125, -7.36767578125, -6.9725341796875, -6.577392578125, -6.1822509765625, -5.787109375, -5.3919677734375, -4.996826171875, -4.6016845703125, -4.20654296875, -3.8114013671875, -3.416259765625, -3.0211181640625, -2.6259765625, -2.2308349609375, -1.835693359375, -1.4405517578125, -1.04541015625, -0.6502685546875, -0.255126953125, 0.1400146484375, 0.53515625, 0.9302978515625, 1.325439453125, 1.7205810546875, 2.11572265625, 2.5108642578125, 2.906005859375, 3.3011474609375, 3.6962890625, 4.0914306640625, 4.486572265625, 4.8817138671875, 5.27685546875, 5.6719970703125, 6.067138671875, 6.4622802734375, 6.857421875, 7.2525634765625, 7.647705078125, 8.0428466796875, 8.43798828125, 8.8331298828125, 9.228271484375, 9.6234130859375, 10.0185546875, 10.4136962890625, 10.808837890625, 11.2039794921875, 11.59912109375, 11.9942626953125, 12.389404296875, 12.7845458984375, 13.1796875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 4.0, 3.0, 5.0, 6.0, 6.0, 13.0, 11.0, 13.0, 20.0, 22.0, 31.0, 64.0, 69.0, 93.0, 144.0, 259.0, 687.0, 4842.0, 183604.0, 3968652.0, 32396.0, 2142.0, 462.0, 236.0, 124.0, 90.0, 69.0, 53.0, 33.0, 27.0, 24.0, 13.0, 15.0, 9.0, 10.0, 9.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-59.28125, -57.44677734375, -55.6123046875, -53.77783203125, -51.943359375, -50.10888671875, -48.2744140625, -46.43994140625, -44.60546875, -42.77099609375, -40.9365234375, -39.10205078125, -37.267578125, -35.43310546875, -33.5986328125, -31.76416015625, -29.9296875, -28.09521484375, -26.2607421875, -24.42626953125, -22.591796875, -20.75732421875, -18.9228515625, -17.08837890625, -15.25390625, -13.41943359375, -11.5849609375, -9.75048828125, -7.916015625, -6.08154296875, -4.2470703125, -2.41259765625, -0.578125, 1.25634765625, 3.0908203125, 4.92529296875, 6.759765625, 8.59423828125, 10.4287109375, 12.26318359375, 14.09765625, 15.93212890625, 17.7666015625, 19.60107421875, 21.435546875, 23.27001953125, 25.1044921875, 26.93896484375, 28.7734375, 30.60791015625, 32.4423828125, 34.27685546875, 36.111328125, 37.94580078125, 39.7802734375, 41.61474609375, 43.44921875, 45.28369140625, 47.1181640625, 48.95263671875, 50.787109375, 52.62158203125, 54.4560546875, 56.29052734375, 58.125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 18.0, 47.0, 236.0, 465.0, 191.0, 48.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-340.7276306152344, -334.5817565917969, -328.43585205078125, -322.28997802734375, -316.1440734863281, -309.9981994628906, -303.8523254394531, -297.7064208984375, -291.560546875, -285.4146728515625, -279.2687683105469, -273.1228942871094, -266.97698974609375, -260.83111572265625, -254.6852264404297, -248.53933715820312, -242.39346313476562, -236.24757385253906, -230.1016845703125, -223.955810546875, -217.80992126464844, -211.66403198242188, -205.5181427001953, -199.37225341796875, -193.2263641357422, -187.08047485351562, -180.93458557128906, -174.78871154785156, -168.642822265625, -162.49693298339844, -156.35104370117188, -150.20516967773438, -144.05926513671875, -137.9133758544922, -131.76748657226562, -125.6216049194336, -119.47572326660156, -113.329833984375, -107.18394470214844, -101.0380630493164, -94.89218139648438, -88.74629211425781, -82.60041046142578, -76.45452117919922, -70.30863952636719, -64.16275024414062, -58.01686477661133, -51.87097930908203, -45.725093841552734, -39.57920837402344, -33.43332290649414, -27.28743553161621, -21.141550064086914, -14.995664596557617, -8.849777221679688, -2.7038917541503906, 3.4419937133789062, 9.587879180908203, 15.733765602111816, 21.87965202331543, 28.025537490844727, 34.171424865722656, 40.31731033325195, 46.46319580078125, 52.60908126831055]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 3.0, 7.0, 8.0, 8.0, 11.0, 15.0, 20.0, 25.0, 23.0, 25.0, 24.0, 27.0, 39.0, 33.0, 37.0, 49.0, 33.0, 45.0, 41.0, 45.0, 55.0, 43.0, 43.0, 46.0, 34.0, 32.0, 40.0, 25.0, 32.0, 20.0, 20.0, 11.0, 20.0, 14.0, 9.0, 7.0, 5.0, 10.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.86748123168945, -48.42293930053711, -46.9783935546875, -45.533851623535156, -44.08930969238281, -42.64476776123047, -41.20022201538086, -39.755680084228516, -38.311134338378906, -36.86659240722656, -35.42204666137695, -33.97750473022461, -32.532962799072266, -31.08841896057129, -29.643875122070312, -28.19933319091797, -26.754791259765625, -25.31024742126465, -23.865705490112305, -22.421161651611328, -20.976619720458984, -19.532075881958008, -18.08753204345703, -16.642990112304688, -15.198446273803711, -13.75390338897705, -12.30936050415039, -10.864816665649414, -9.420273780822754, -7.975730895996094, -6.531187057495117, -5.086644172668457, -3.6421051025390625, -2.1975619792938232, -0.753018856048584, 0.6915245056152344, 2.1360673904418945, 3.5806102752685547, 5.025154113769531, 6.469696998596191, 7.914239883422852, 9.358782768249512, 10.803325653076172, 12.247869491577148, 13.692412376403809, 15.136955261230469, 16.581499099731445, 18.026042938232422, 19.470584869384766, 20.915128707885742, 22.359670639038086, 23.804214477539062, 25.248756408691406, 26.693300247192383, 28.13784408569336, 29.582386016845703, 31.02692985534668, 32.471473693847656, 33.916015625, 35.360557556152344, 36.80510330200195, 38.2496452331543, 39.694190979003906, 41.13873291015625, 42.583274841308594]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 4.0, 4.0, 2.0, 8.0, 5.0, 11.0, 9.0, 13.0, 14.0, 24.0, 20.0, 28.0, 26.0, 28.0, 28.0, 49.0, 46.0, 41.0, 39.0, 59.0, 47.0, 46.0, 45.0, 40.0, 45.0, 33.0, 41.0, 38.0, 29.0, 32.0, 26.0, 21.0, 19.0, 20.0, 15.0, 8.0, 20.0, 9.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.2308349609375, -7.012451171875, -6.7940673828125, -6.57568359375, -6.3572998046875, -6.138916015625, -5.9205322265625, -5.7021484375, -5.4837646484375, -5.265380859375, -5.0469970703125, -4.82861328125, -4.6102294921875, -4.391845703125, -4.1734619140625, -3.955078125, -3.7366943359375, -3.518310546875, -3.2999267578125, -3.08154296875, -2.8631591796875, -2.644775390625, -2.4263916015625, -2.2080078125, -1.9896240234375, -1.771240234375, -1.5528564453125, -1.33447265625, -1.1160888671875, -0.897705078125, -0.6793212890625, -0.4609375, -0.2425537109375, -0.024169921875, 0.1942138671875, 0.41259765625, 0.6309814453125, 0.849365234375, 1.0677490234375, 1.2861328125, 1.5045166015625, 1.722900390625, 1.9412841796875, 2.15966796875, 2.3780517578125, 2.596435546875, 2.8148193359375, 3.033203125, 3.2515869140625, 3.469970703125, 3.6883544921875, 3.90673828125, 4.1251220703125, 4.343505859375, 4.5618896484375, 4.7802734375, 4.9986572265625, 5.217041015625, 5.4354248046875, 5.65380859375, 5.8721923828125, 6.090576171875, 6.3089599609375, 6.52734375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 17.0, 26.0, 26.0, 60.0, 78.0, 110.0, 168.0, 230.0, 302.0, 492.0, 727.0, 1129.0, 1649.0, 2479.0, 3806.0, 5837.0, 9091.0, 14947.0, 25042.0, 44702.0, 85542.0, 173083.0, 307265.0, 174944.0, 85521.0, 44635.0, 25243.0, 14911.0, 9268.0, 5838.0, 3811.0, 2568.0, 1632.0, 1080.0, 793.0, 472.0, 326.0, 233.0, 153.0, 103.0, 81.0, 46.0, 22.0, 26.0, 15.0, 7.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.322509765625, -0.3125877380371094, -0.30266571044921875, -0.2927436828613281, -0.2828216552734375, -0.2728996276855469, -0.26297760009765625, -0.2530555725097656, -0.243133544921875, -0.23321151733398438, -0.22328948974609375, -0.21336746215820312, -0.2034454345703125, -0.19352340698242188, -0.18360137939453125, -0.17367935180664062, -0.16375732421875, -0.15383529663085938, -0.14391326904296875, -0.13399124145507812, -0.1240692138671875, -0.11414718627929688, -0.10422515869140625, -0.09430313110351562, -0.084381103515625, -0.07445907592773438, -0.06453704833984375, -0.054615020751953125, -0.0446929931640625, -0.034770965576171875, -0.02484893798828125, -0.014926910400390625, -0.0050048828125, 0.004917144775390625, 0.01483917236328125, 0.024761199951171875, 0.0346832275390625, 0.044605255126953125, 0.05452728271484375, 0.06444931030273438, 0.074371337890625, 0.08429336547851562, 0.09421539306640625, 0.10413742065429688, 0.1140594482421875, 0.12398147583007812, 0.13390350341796875, 0.14382553100585938, 0.15374755859375, 0.16366958618164062, 0.17359161376953125, 0.18351364135742188, 0.1934356689453125, 0.20335769653320312, 0.21327972412109375, 0.22320175170898438, 0.233123779296875, 0.24304580688476562, 0.25296783447265625, 0.2628898620605469, 0.2728118896484375, 0.2827339172363281, 0.29265594482421875, 0.3025779724121094, 0.3125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 1.0, 1.0, 9.0, 12.0, 12.0, 20.0, 13.0, 10.0, 17.0, 22.0, 25.0, 29.0, 25.0, 26.0, 34.0, 32.0, 55.0, 38.0, 38.0, 41.0, 1061.0, 30.0, 52.0, 40.0, 36.0, 45.0, 44.0, 32.0, 33.0, 32.0, 27.0, 26.0, 20.0, 19.0, 15.0, 9.0, 7.0, 16.0, 5.0, 6.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.1292724609375, -3.996826171875, -3.8643798828125, -3.73193359375, -3.5994873046875, -3.467041015625, -3.3345947265625, -3.2021484375, -3.0697021484375, -2.937255859375, -2.8048095703125, -2.67236328125, -2.5399169921875, -2.407470703125, -2.2750244140625, -2.142578125, -2.0101318359375, -1.877685546875, -1.7452392578125, -1.61279296875, -1.4803466796875, -1.347900390625, -1.2154541015625, -1.0830078125, -0.9505615234375, -0.818115234375, -0.6856689453125, -0.55322265625, -0.4207763671875, -0.288330078125, -0.1558837890625, -0.0234375, 0.1090087890625, 0.241455078125, 0.3739013671875, 0.50634765625, 0.6387939453125, 0.771240234375, 0.9036865234375, 1.0361328125, 1.1685791015625, 1.301025390625, 1.4334716796875, 1.56591796875, 1.6983642578125, 1.830810546875, 1.9632568359375, 2.095703125, 2.2281494140625, 2.360595703125, 2.4930419921875, 2.62548828125, 2.7579345703125, 2.890380859375, 3.0228271484375, 3.1552734375, 3.2877197265625, 3.420166015625, 3.5526123046875, 3.68505859375, 3.8175048828125, 3.949951171875, 4.0823974609375, 4.21484375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 7.0, 3.0, 9.0, 10.0, 15.0, 31.0, 46.0, 49.0, 101.0, 110.0, 154.0, 202.0, 305.0, 397.0, 599.0, 832.0, 1152.0, 1615.0, 2255.0, 3186.0, 4572.0, 6679.0, 9756.0, 14368.0, 22057.0, 34122.0, 53373.0, 86476.0, 142469.0, 1267709.0, 166447.0, 100575.0, 60982.0, 38603.0, 25166.0, 16594.0, 10874.0, 7511.0, 5220.0, 3568.0, 2533.0, 1855.0, 1308.0, 938.0, 675.0, 472.0, 361.0, 227.0, 150.0, 132.0, 77.0, 72.0, 50.0, 39.0, 20.0, 16.0, 9.0, 4.0, 7.0, 3.0, 3.0], "bins": [-0.174072265625, -0.16874122619628906, -0.16341018676757812, -0.1580791473388672, -0.15274810791015625, -0.1474170684814453, -0.14208602905273438, -0.13675498962402344, -0.1314239501953125, -0.12609291076660156, -0.12076187133789062, -0.11543083190917969, -0.11009979248046875, -0.10476875305175781, -0.09943771362304688, -0.09410667419433594, -0.088775634765625, -0.08344459533691406, -0.07811355590820312, -0.07278251647949219, -0.06745147705078125, -0.06212043762207031, -0.056789398193359375, -0.05145835876464844, -0.0461273193359375, -0.04079627990722656, -0.035465240478515625, -0.030134201049804688, -0.02480316162109375, -0.019472122192382812, -0.014141082763671875, -0.008810043334960938, -0.00347900390625, 0.0018520355224609375, 0.007183074951171875, 0.012514114379882812, 0.01784515380859375, 0.023176193237304688, 0.028507232666015625, 0.03383827209472656, 0.0391693115234375, 0.04450035095214844, 0.049831390380859375, 0.05516242980957031, 0.06049346923828125, 0.06582450866699219, 0.07115554809570312, 0.07648658752441406, 0.081817626953125, 0.08714866638183594, 0.09247970581054688, 0.09781074523925781, 0.10314178466796875, 0.10847282409667969, 0.11380386352539062, 0.11913490295410156, 0.1244659423828125, 0.12979698181152344, 0.13512802124023438, 0.1404590606689453, 0.14579010009765625, 0.1511211395263672, 0.15645217895507812, 0.16178321838378906, 0.1671142578125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 10.0, 11.0, 9.0, 16.0, 14.0, 15.0, 11.0, 15.0, 31.0, 25.0, 46.0, 55.0, 52.0, 67.0, 67.0, 66.0, 84.0, 63.0, 59.0, 62.0, 31.0, 20.0, 24.0, 19.0, 13.0, 13.0, 15.0, 8.0, 7.0, 14.0, 9.0, 5.0, 10.0, 3.0, 4.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0003161430358886719, -0.00030638277530670166, -0.00029662251472473145, -0.00028686225414276123, -0.000277101993560791, -0.0002673417329788208, -0.0002575814723968506, -0.00024782121181488037, -0.00023806095123291016, -0.00022830069065093994, -0.00021854043006896973, -0.0002087801694869995, -0.0001990199089050293, -0.00018925964832305908, -0.00017949938774108887, -0.00016973912715911865, -0.00015997886657714844, -0.00015021860599517822, -0.000140458345413208, -0.0001306980848312378, -0.00012093782424926758, -0.00011117756366729736, -0.00010141730308532715, -9.165704250335693e-05, -8.189678192138672e-05, -7.21365213394165e-05, -6.237626075744629e-05, -5.2616000175476074e-05, -4.285573959350586e-05, -3.3095479011535645e-05, -2.333521842956543e-05, -1.3574957847595215e-05, -3.814697265625e-06, 5.945563316345215e-06, 1.570582389831543e-05, 2.5466084480285645e-05, 3.522634506225586e-05, 4.4986605644226074e-05, 5.474686622619629e-05, 6.45071268081665e-05, 7.426738739013672e-05, 8.402764797210693e-05, 9.378790855407715e-05, 0.00010354816913604736, 0.00011330842971801758, 0.0001230686902999878, 0.000132828950881958, 0.00014258921146392822, 0.00015234947204589844, 0.00016210973262786865, 0.00017186999320983887, 0.00018163025379180908, 0.0001913905143737793, 0.0002011507749557495, 0.00021091103553771973, 0.00022067129611968994, 0.00023043155670166016, 0.00024019181728363037, 0.0002499520778656006, 0.0002597123384475708, 0.000269472599029541, 0.00027923285961151123, 0.00028899312019348145, 0.00029875338077545166, 0.0003085136413574219]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 7.0, 8.0, 9.0, 11.0, 15.0, 17.0, 16.0, 19.0, 38.0, 33.0, 46.0, 57.0, 85.0, 111.0, 193.0, 484.0, 3201.0, 213018.0, 824054.0, 5769.0, 604.0, 226.0, 137.0, 70.0, 78.0, 56.0, 36.0, 33.0, 20.0, 25.0, 14.0, 17.0, 5.0, 8.0, 6.0, 8.0, 9.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00635528564453125, -0.006157279014587402, -0.005959272384643555, -0.005761265754699707, -0.005563259124755859, -0.005365252494812012, -0.005167245864868164, -0.004969239234924316, -0.004771232604980469, -0.004573225975036621, -0.0043752193450927734, -0.004177212715148926, -0.003979206085205078, -0.0037811994552612305, -0.003583192825317383, -0.003385186195373535, -0.0031871795654296875, -0.00298917293548584, -0.002791166305541992, -0.0025931596755981445, -0.002395153045654297, -0.0021971464157104492, -0.0019991397857666016, -0.001801133155822754, -0.0016031265258789062, -0.0014051198959350586, -0.001207113265991211, -0.0010091066360473633, -0.0008111000061035156, -0.000613093376159668, -0.0004150867462158203, -0.00021708011627197266, -1.9073486328125e-05, 0.00017893314361572266, 0.0003769397735595703, 0.000574946403503418, 0.0007729530334472656, 0.0009709596633911133, 0.001168966293334961, 0.0013669729232788086, 0.0015649795532226562, 0.001762986183166504, 0.0019609928131103516, 0.0021589994430541992, 0.002357006072998047, 0.0025550127029418945, 0.002753019332885742, 0.00295102596282959, 0.0031490325927734375, 0.003347039222717285, 0.003545045852661133, 0.0037430524826049805, 0.003941059112548828, 0.004139065742492676, 0.0043370723724365234, 0.004535079002380371, 0.004733085632324219, 0.004931092262268066, 0.005129098892211914, 0.005327105522155762, 0.005525112152099609, 0.005723118782043457, 0.005921125411987305, 0.006119132041931152, 0.006317138671875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 14.0, 963.0, 39.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00035580756957642734, -0.00021655917225871235, -7.731077494099736e-05, 6.193763692863286e-05, 0.00020118601969443262, 0.0003404344024602324, 0.00047968284343369305, 0.0006189312553033233, 0.0007581795798614621, 0.0008974279626272619, 0.0010366763453930616, 0.0011759247863665223, 0.001315173227339983, 0.0014544215518981218, 0.0015936699928715825, 0.0017329184338450432, 0.001872166758403182, 0.002011415082961321, 0.0021506636403501034, 0.0022899119649082422, 0.002429160289466381, 0.0025684088468551636, 0.0027076571714133024, 0.0028469054959714413, 0.0029861540533602238, 0.0031254023779183626, 0.003264650935307145, 0.003403899259865284, 0.003543147584423423, 0.0036823959089815617, 0.003821644466370344, 0.003960893023759127, 0.004100141581147909, 0.004239390138536692, 0.004378638230264187, 0.004517886787652969, 0.004657135345041752, 0.004796383436769247, 0.0049356319941580296, 0.005074880551546812, 0.005214128643274307, 0.00535337720066309, 0.005492625292390585, 0.0056318738497793674, 0.00577112240716815, 0.005910370498895645, 0.006049619056284428, 0.00618886761367321, 0.006328116171061993, 0.006467364728450775, 0.00660661282017827, 0.006745861377567053, 0.006885109934955835, 0.0070243580266833305, 0.007163606584072113, 0.0073028551414608955, 0.007442103233188391, 0.007581351790577173, 0.007720599882304668, 0.007859848439693451, 0.007999096997082233, 0.008138345554471016, 0.008277593180537224, 0.008416841737926006, 0.008556090295314789]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 9.0, 1.0, 9.0, 11.0, 25.0, 16.0, 34.0, 45.0, 56.0, 59.0, 69.0, 51.0, 65.0, 61.0, 69.0, 69.0, 68.0, 67.0, 50.0, 44.0, 34.0, 27.0, 14.0, 22.0, 9.0, 9.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00045931339263916016, -0.00044902414083480835, -0.00043873488903045654, -0.00042844563722610474, -0.00041815638542175293, -0.0004078671336174011, -0.0003975778818130493, -0.0003872886300086975, -0.0003769993782043457, -0.0003667101263999939, -0.0003564208745956421, -0.0003461316227912903, -0.0003358423709869385, -0.00032555311918258667, -0.00031526386737823486, -0.00030497461557388306, -0.00029468536376953125, -0.00028439611196517944, -0.00027410686016082764, -0.00026381760835647583, -0.000253528356552124, -0.00024323910474777222, -0.0002329498529434204, -0.0002226606011390686, -0.0002123713493347168, -0.000202082097530365, -0.00019179284572601318, -0.00018150359392166138, -0.00017121434211730957, -0.00016092509031295776, -0.00015063583850860596, -0.00014034658670425415, -0.00013005733489990234, -0.00011976808309555054, -0.00010947883129119873, -9.918957948684692e-05, -8.890032768249512e-05, -7.861107587814331e-05, -6.83218240737915e-05, -5.80325722694397e-05, -4.774332046508789e-05, -3.7454068660736084e-05, -2.7164816856384277e-05, -1.687556505203247e-05, -6.586313247680664e-06, 3.7029385566711426e-06, 1.399219036102295e-05, 2.4281442165374756e-05, 3.457069396972656e-05, 4.485994577407837e-05, 5.5149197578430176e-05, 6.543844938278198e-05, 7.572770118713379e-05, 8.60169529914856e-05, 9.63062047958374e-05, 0.00010659545660018921, 0.00011688470840454102, 0.00012717396020889282, 0.00013746321201324463, 0.00014775246381759644, 0.00015804171562194824, 0.00016833096742630005, 0.00017862021923065186, 0.00018890947103500366, 0.00019919872283935547]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 4.0, 4.0, 2.0, 8.0, 5.0, 11.0, 9.0, 13.0, 14.0, 24.0, 20.0, 28.0, 26.0, 28.0, 28.0, 49.0, 46.0, 41.0, 39.0, 59.0, 47.0, 46.0, 45.0, 40.0, 45.0, 33.0, 40.0, 39.0, 29.0, 32.0, 26.0, 21.0, 19.0, 20.0, 15.0, 8.0, 20.0, 9.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.2308349609375, -7.012451171875, -6.7940673828125, -6.57568359375, -6.3572998046875, -6.138916015625, -5.9205322265625, -5.7021484375, -5.4837646484375, -5.265380859375, -5.0469970703125, -4.82861328125, -4.6102294921875, -4.391845703125, -4.1734619140625, -3.955078125, -3.7366943359375, -3.518310546875, -3.2999267578125, -3.08154296875, -2.8631591796875, -2.644775390625, -2.4263916015625, -2.2080078125, -1.9896240234375, -1.771240234375, -1.5528564453125, -1.33447265625, -1.1160888671875, -0.897705078125, -0.6793212890625, -0.4609375, -0.2425537109375, -0.024169921875, 0.1942138671875, 0.41259765625, 0.6309814453125, 0.849365234375, 1.0677490234375, 1.2861328125, 1.5045166015625, 1.722900390625, 1.9412841796875, 2.15966796875, 2.3780517578125, 2.596435546875, 2.8148193359375, 3.033203125, 3.2515869140625, 3.469970703125, 3.6883544921875, 3.90673828125, 4.1251220703125, 4.343505859375, 4.5618896484375, 4.7802734375, 4.9986572265625, 5.217041015625, 5.4354248046875, 5.65380859375, 5.8721923828125, 6.090576171875, 6.3089599609375, 6.52734375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 7.0, 10.0, 13.0, 20.0, 32.0, 38.0, 60.0, 65.0, 138.0, 178.0, 280.0, 452.0, 712.0, 1145.0, 1970.0, 3531.0, 6509.0, 13157.0, 29261.0, 74564.0, 241758.0, 440463.0, 143041.0, 49195.0, 20531.0, 9720.0, 4927.0, 2680.0, 1517.0, 937.0, 531.0, 373.0, 230.0, 158.0, 119.0, 68.0, 47.0, 44.0, 21.0, 19.0, 10.0, 10.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.3515625, -6.15484619140625, -5.9581298828125, -5.76141357421875, -5.564697265625, -5.36798095703125, -5.1712646484375, -4.97454833984375, -4.77783203125, -4.58111572265625, -4.3843994140625, -4.18768310546875, -3.990966796875, -3.79425048828125, -3.5975341796875, -3.40081787109375, -3.2041015625, -3.00738525390625, -2.8106689453125, -2.61395263671875, -2.417236328125, -2.22052001953125, -2.0238037109375, -1.82708740234375, -1.63037109375, -1.43365478515625, -1.2369384765625, -1.04022216796875, -0.843505859375, -0.64678955078125, -0.4500732421875, -0.25335693359375, -0.056640625, 0.14007568359375, 0.3367919921875, 0.53350830078125, 0.730224609375, 0.92694091796875, 1.1236572265625, 1.32037353515625, 1.51708984375, 1.71380615234375, 1.9105224609375, 2.10723876953125, 2.303955078125, 2.50067138671875, 2.6973876953125, 2.89410400390625, 3.0908203125, 3.28753662109375, 3.4842529296875, 3.68096923828125, 3.877685546875, 4.07440185546875, 4.2711181640625, 4.46783447265625, 4.66455078125, 4.86126708984375, 5.0579833984375, 5.25469970703125, 5.451416015625, 5.64813232421875, 5.8448486328125, 6.04156494140625, 6.23828125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 4.0, 1.0, 4.0, 6.0, 8.0, 8.0, 9.0, 11.0, 13.0, 23.0, 20.0, 20.0, 30.0, 26.0, 28.0, 43.0, 45.0, 45.0, 55.0, 82.0, 210.0, 1576.0, 252.0, 97.0, 58.0, 42.0, 42.0, 39.0, 40.0, 39.0, 31.0, 28.0, 23.0, 21.0, 17.0, 12.0, 5.0, 1.0, 9.0, 9.0, 7.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.125, -18.454833984375, -17.78466796875, -17.114501953125, -16.4443359375, -15.774169921875, -15.10400390625, -14.433837890625, -13.763671875, -13.093505859375, -12.42333984375, -11.753173828125, -11.0830078125, -10.412841796875, -9.74267578125, -9.072509765625, -8.40234375, -7.732177734375, -7.06201171875, -6.391845703125, -5.7216796875, -5.051513671875, -4.38134765625, -3.711181640625, -3.041015625, -2.370849609375, -1.70068359375, -1.030517578125, -0.3603515625, 0.309814453125, 0.97998046875, 1.650146484375, 2.3203125, 2.990478515625, 3.66064453125, 4.330810546875, 5.0009765625, 5.671142578125, 6.34130859375, 7.011474609375, 7.681640625, 8.351806640625, 9.02197265625, 9.692138671875, 10.3623046875, 11.032470703125, 11.70263671875, 12.372802734375, 13.04296875, 13.713134765625, 14.38330078125, 15.053466796875, 15.7236328125, 16.393798828125, 17.06396484375, 17.734130859375, 18.404296875, 19.074462890625, 19.74462890625, 20.414794921875, 21.0849609375, 21.755126953125, 22.42529296875, 23.095458984375, 23.765625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 1.0, 2.0, 5.0, 12.0, 8.0, 10.0, 11.0, 17.0, 21.0, 30.0, 52.0, 49.0, 75.0, 86.0, 104.0, 180.0, 207.0, 335.0, 687.0, 3803.0, 718440.0, 2413963.0, 5637.0, 801.0, 304.0, 213.0, 166.0, 123.0, 64.0, 67.0, 48.0, 39.0, 37.0, 26.0, 17.0, 9.0, 14.0, 8.0, 8.0, 4.0, 4.0, 4.0, 10.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-54.5625, -53.00634765625, -51.4501953125, -49.89404296875, -48.337890625, -46.78173828125, -45.2255859375, -43.66943359375, -42.11328125, -40.55712890625, -39.0009765625, -37.44482421875, -35.888671875, -34.33251953125, -32.7763671875, -31.22021484375, -29.6640625, -28.10791015625, -26.5517578125, -24.99560546875, -23.439453125, -21.88330078125, -20.3271484375, -18.77099609375, -17.21484375, -15.65869140625, -14.1025390625, -12.54638671875, -10.990234375, -9.43408203125, -7.8779296875, -6.32177734375, -4.765625, -3.20947265625, -1.6533203125, -0.09716796875, 1.458984375, 3.01513671875, 4.5712890625, 6.12744140625, 7.68359375, 9.23974609375, 10.7958984375, 12.35205078125, 13.908203125, 15.46435546875, 17.0205078125, 18.57666015625, 20.1328125, 21.68896484375, 23.2451171875, 24.80126953125, 26.357421875, 27.91357421875, 29.4697265625, 31.02587890625, 32.58203125, 34.13818359375, 35.6943359375, 37.25048828125, 38.806640625, 40.36279296875, 41.9189453125, 43.47509765625, 45.03125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 117.0, 520.0, 324.0, 45.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.345001220703125, -42.9844856262207, -39.62397384643555, -36.263458251953125, -32.90294647216797, -29.542430877685547, -26.181915283203125, -22.821401596069336, -19.460887908935547, -16.100374221801758, -12.739859580993652, -9.379344940185547, -6.018831253051758, -2.6583175659179688, 0.7021980285644531, 4.062711715698242, 7.423225402832031, 10.78373908996582, 14.144253730773926, 17.50476837158203, 20.86528205871582, 24.22579574584961, 27.58631134033203, 30.94682502746582, 34.30733871459961, 37.66785430908203, 41.02836608886719, 44.38888168334961, 47.74939727783203, 51.10990905761719, 54.47042465209961, 57.83094024658203, 61.19145202636719, 64.55196380615234, 67.91248321533203, 71.27299499511719, 74.63350677490234, 77.9940185546875, 81.35453796386719, 84.71504974365234, 88.0755615234375, 91.43607330322266, 94.79659271240234, 98.1571044921875, 101.51761627197266, 104.87812805175781, 108.2386474609375, 111.59915924072266, 114.95967864990234, 118.3201904296875, 121.68070983886719, 125.04122161865234, 128.4017333984375, 131.7622528076172, 135.12277221679688, 138.4832763671875, 141.8437957763672, 145.20431518554688, 148.5648193359375, 151.9253387451172, 155.28585815429688, 158.6463623046875, 162.0068817138672, 165.36740112304688, 168.7279052734375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 10.0, 11.0, 6.0, 7.0, 9.0, 19.0, 14.0, 11.0, 20.0, 23.0, 30.0, 29.0, 19.0, 31.0, 29.0, 38.0, 38.0, 45.0, 42.0, 45.0, 48.0, 34.0, 36.0, 38.0, 34.0, 39.0, 37.0, 29.0, 26.0, 35.0, 27.0, 16.0, 11.0, 22.0, 16.0, 11.0, 15.0, 6.0, 6.0, 9.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-52.46171569824219, -50.881256103515625, -49.30079650878906, -47.7203369140625, -46.13987731933594, -44.55941390991211, -42.97895431518555, -41.398494720458984, -39.81803512573242, -38.23757553100586, -36.6571159362793, -35.076656341552734, -33.496192932128906, -31.915735244750977, -30.33527374267578, -28.75481414794922, -27.174354553222656, -25.593894958496094, -24.01343536376953, -22.432973861694336, -20.852514266967773, -19.27205467224121, -17.691593170166016, -16.111133575439453, -14.53067398071289, -12.950214385986328, -11.36975383758545, -9.78929328918457, -8.208833694458008, -6.628373622894287, -5.047913551330566, -3.4674530029296875, -1.886993408203125, -0.3065333366394043, 1.2739267349243164, 2.854386806488037, 4.434846878051758, 6.0153069496154785, 7.595767021179199, 9.176227569580078, 10.75668716430664, 12.337146759033203, 13.917607307434082, 15.498067855834961, 17.078527450561523, 18.658987045288086, 20.23944854736328, 21.819908142089844, 23.400367736816406, 24.98082733154297, 26.56128692626953, 28.141748428344727, 29.72220802307129, 31.30266761779785, 32.88312911987305, 34.46358871459961, 36.04404830932617, 37.624507904052734, 39.2049674987793, 40.78542709350586, 42.36589050292969, 43.94635009765625, 45.52680969238281, 47.107269287109375, 48.68772888183594]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 7.0, 0.0, 6.0, 5.0, 7.0, 15.0, 10.0, 12.0, 16.0, 16.0, 22.0, 23.0, 31.0, 22.0, 30.0, 41.0, 43.0, 36.0, 35.0, 50.0, 50.0, 56.0, 41.0, 52.0, 30.0, 23.0, 34.0, 38.0, 36.0, 31.0, 26.0, 33.0, 19.0, 17.0, 14.0, 10.0, 19.0, 9.0, 12.0, 5.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.38671875, -7.17340087890625, -6.9600830078125, -6.74676513671875, -6.533447265625, -6.32012939453125, -6.1068115234375, -5.89349365234375, -5.68017578125, -5.46685791015625, -5.2535400390625, -5.04022216796875, -4.826904296875, -4.61358642578125, -4.4002685546875, -4.18695068359375, -3.9736328125, -3.76031494140625, -3.5469970703125, -3.33367919921875, -3.120361328125, -2.90704345703125, -2.6937255859375, -2.48040771484375, -2.26708984375, -2.05377197265625, -1.8404541015625, -1.62713623046875, -1.413818359375, -1.20050048828125, -0.9871826171875, -0.77386474609375, -0.560546875, -0.34722900390625, -0.1339111328125, 0.07940673828125, 0.292724609375, 0.50604248046875, 0.7193603515625, 0.93267822265625, 1.14599609375, 1.35931396484375, 1.5726318359375, 1.78594970703125, 1.999267578125, 2.21258544921875, 2.4259033203125, 2.63922119140625, 2.8525390625, 3.06585693359375, 3.2791748046875, 3.49249267578125, 3.705810546875, 3.91912841796875, 4.1324462890625, 4.34576416015625, 4.55908203125, 4.77239990234375, 4.9857177734375, 5.19903564453125, 5.412353515625, 5.62567138671875, 5.8389892578125, 6.05230712890625, 6.265625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 5.0, 7.0, 1.0, 10.0, 7.0, 7.0, 12.0, 8.0, 27.0, 27.0, 33.0, 47.0, 59.0, 96.0, 134.0, 254.0, 414.0, 801.0, 1851.0, 4839.0, 19209.0, 287128.0, 3087101.0, 745288.0, 35075.0, 6999.0, 2483.0, 981.0, 530.0, 280.0, 167.0, 121.0, 68.0, 51.0, 29.0, 32.0, 23.0, 16.0, 8.0, 16.0, 9.0, 10.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-20.375, -19.786865234375, -19.19873046875, -18.610595703125, -18.0224609375, -17.434326171875, -16.84619140625, -16.258056640625, -15.669921875, -15.081787109375, -14.49365234375, -13.905517578125, -13.3173828125, -12.729248046875, -12.14111328125, -11.552978515625, -10.96484375, -10.376708984375, -9.78857421875, -9.200439453125, -8.6123046875, -8.024169921875, -7.43603515625, -6.847900390625, -6.259765625, -5.671630859375, -5.08349609375, -4.495361328125, -3.9072265625, -3.319091796875, -2.73095703125, -2.142822265625, -1.5546875, -0.966552734375, -0.37841796875, 0.209716796875, 0.7978515625, 1.385986328125, 1.97412109375, 2.562255859375, 3.150390625, 3.738525390625, 4.32666015625, 4.914794921875, 5.5029296875, 6.091064453125, 6.67919921875, 7.267333984375, 7.85546875, 8.443603515625, 9.03173828125, 9.619873046875, 10.2080078125, 10.796142578125, 11.38427734375, 11.972412109375, 12.560546875, 13.148681640625, 13.73681640625, 14.324951171875, 14.9130859375, 15.501220703125, 16.08935546875, 16.677490234375, 17.265625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 7.0, 13.0, 14.0, 25.0, 29.0, 36.0, 50.0, 82.0, 122.0, 191.0, 284.0, 500.0, 677.0, 650.0, 542.0, 328.0, 162.0, 107.0, 71.0, 57.0, 41.0, 19.0, 13.0, 15.0, 7.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.6875, -18.2086181640625, -17.729736328125, -17.2508544921875, -16.77197265625, -16.2930908203125, -15.814208984375, -15.3353271484375, -14.8564453125, -14.3775634765625, -13.898681640625, -13.4197998046875, -12.94091796875, -12.4620361328125, -11.983154296875, -11.5042724609375, -11.025390625, -10.5465087890625, -10.067626953125, -9.5887451171875, -9.10986328125, -8.6309814453125, -8.152099609375, -7.6732177734375, -7.1943359375, -6.7154541015625, -6.236572265625, -5.7576904296875, -5.27880859375, -4.7999267578125, -4.321044921875, -3.8421630859375, -3.36328125, -2.8843994140625, -2.405517578125, -1.9266357421875, -1.44775390625, -0.9688720703125, -0.489990234375, -0.0111083984375, 0.4677734375, 0.9466552734375, 1.425537109375, 1.9044189453125, 2.38330078125, 2.8621826171875, 3.341064453125, 3.8199462890625, 4.298828125, 4.7777099609375, 5.256591796875, 5.7354736328125, 6.21435546875, 6.6932373046875, 7.172119140625, 7.6510009765625, 8.1298828125, 8.6087646484375, 9.087646484375, 9.5665283203125, 10.04541015625, 10.5242919921875, 11.003173828125, 11.4820556640625, 11.9609375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 5.0, 4.0, 3.0, 7.0, 10.0, 14.0, 10.0, 26.0, 21.0, 59.0, 68.0, 130.0, 200.0, 536.0, 3089.0, 315759.0, 3863527.0, 9167.0, 882.0, 299.0, 170.0, 97.0, 64.0, 33.0, 30.0, 32.0, 12.0, 13.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.40625, -55.12646484375, -52.8466796875, -50.56689453125, -48.287109375, -46.00732421875, -43.7275390625, -41.44775390625, -39.16796875, -36.88818359375, -34.6083984375, -32.32861328125, -30.048828125, -27.76904296875, -25.4892578125, -23.20947265625, -20.9296875, -18.64990234375, -16.3701171875, -14.09033203125, -11.810546875, -9.53076171875, -7.2509765625, -4.97119140625, -2.69140625, -0.41162109375, 1.8681640625, 4.14794921875, 6.427734375, 8.70751953125, 10.9873046875, 13.26708984375, 15.546875, 17.82666015625, 20.1064453125, 22.38623046875, 24.666015625, 26.94580078125, 29.2255859375, 31.50537109375, 33.78515625, 36.06494140625, 38.3447265625, 40.62451171875, 42.904296875, 45.18408203125, 47.4638671875, 49.74365234375, 52.0234375, 54.30322265625, 56.5830078125, 58.86279296875, 61.142578125, 63.42236328125, 65.7021484375, 67.98193359375, 70.26171875, 72.54150390625, 74.8212890625, 77.10107421875, 79.380859375, 81.66064453125, 83.9404296875, 86.22021484375, 88.5]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 15.0, 28.0, 80.0, 157.0, 280.0, 275.0, 121.0, 44.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.33062744140625, -188.61984252929688, -184.90904235839844, -181.19825744628906, -177.48745727539062, -173.77667236328125, -170.0658721923828, -166.35508728027344, -162.644287109375, -158.93350219726562, -155.2227020263672, -151.5119171142578, -147.80111694335938, -144.09033203125, -140.37953186035156, -136.6687469482422, -132.9579620361328, -129.24717712402344, -125.536376953125, -121.8255844116211, -118.11479187011719, -114.40400695800781, -110.69320678710938, -106.982421875, -103.27162170410156, -99.56082916259766, -95.85003662109375, -92.13924407958984, -88.42845153808594, -84.71766662597656, -81.00686645507812, -77.29608154296875, -73.58528137207031, -69.8744888305664, -66.1636962890625, -62.452903747558594, -58.74211502075195, -55.03132247924805, -51.32052993774414, -47.6097412109375, -43.898948669433594, -40.18815612792969, -36.47736358642578, -32.766571044921875, -29.055782318115234, -25.344989776611328, -21.634197235107422, -17.92340660095215, -14.212615966796875, -10.501824378967285, -6.791032314300537, -3.080240249633789, 0.6305513381958008, 4.341342926025391, 8.052135467529297, 11.76292610168457, 15.473718643188477, 19.184511184692383, 22.895301818847656, 26.606094360351562, 30.31688690185547, 34.027679443359375, 37.73847198486328, 41.44926071166992, 45.16005325317383]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 3.0, 14.0, 7.0, 10.0, 8.0, 14.0, 8.0, 12.0, 25.0, 29.0, 28.0, 19.0, 27.0, 32.0, 34.0, 32.0, 35.0, 46.0, 45.0, 55.0, 49.0, 40.0, 45.0, 52.0, 40.0, 26.0, 40.0, 35.0, 24.0, 19.0, 26.0, 18.0, 16.0, 9.0, 19.0, 15.0, 10.0, 8.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.25641632080078, -43.02717590332031, -41.79793930053711, -40.56869888305664, -39.33946228027344, -38.11022186279297, -36.8809814453125, -35.6517448425293, -34.42250442504883, -33.19326400756836, -31.964027404785156, -30.734786987304688, -29.50554847717285, -28.276309967041016, -27.04707145690918, -25.817832946777344, -24.588594436645508, -23.359355926513672, -22.130117416381836, -20.90087890625, -19.67163848876953, -18.442399978637695, -17.21316146850586, -15.983922004699707, -14.754683494567871, -13.525444984436035, -12.296205520629883, -11.066967010498047, -9.837728500366211, -8.608489036560059, -7.379250526428223, -6.15001106262207, -4.920772552490234, -3.6915335655212402, -2.462294816970825, -1.2330560684204102, -0.0038170814514160156, 1.2254219055175781, 2.454660415649414, 3.6838998794555664, 4.913138389587402, 6.1423773765563965, 7.371616363525391, 8.600854873657227, 9.830093383789062, 11.059332847595215, 12.28857135772705, 13.517810821533203, 14.747049331665039, 15.976287841796875, 17.20552635192871, 18.434764862060547, 19.664005279541016, 20.89324378967285, 22.122482299804688, 23.351722717285156, 24.58095932006836, 25.810197830200195, 27.03943634033203, 28.2686767578125, 29.497915267944336, 30.727153778076172, 31.956392288208008, 33.185630798339844, 34.41487121582031]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 4.0, 9.0, 11.0, 11.0, 12.0, 16.0, 18.0, 17.0, 30.0, 22.0, 18.0, 27.0, 43.0, 38.0, 35.0, 39.0, 46.0, 40.0, 46.0, 36.0, 47.0, 44.0, 37.0, 31.0, 45.0, 28.0, 35.0, 28.0, 21.0, 29.0, 18.0, 21.0, 15.0, 13.0, 12.0, 10.0, 14.0, 7.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.546875, -6.34478759765625, -6.1427001953125, -5.94061279296875, -5.738525390625, -5.53643798828125, -5.3343505859375, -5.13226318359375, -4.93017578125, -4.72808837890625, -4.5260009765625, -4.32391357421875, -4.121826171875, -3.91973876953125, -3.7176513671875, -3.51556396484375, -3.3134765625, -3.11138916015625, -2.9093017578125, -2.70721435546875, -2.505126953125, -2.30303955078125, -2.1009521484375, -1.89886474609375, -1.69677734375, -1.49468994140625, -1.2926025390625, -1.09051513671875, -0.888427734375, -0.68634033203125, -0.4842529296875, -0.28216552734375, -0.080078125, 0.12200927734375, 0.3240966796875, 0.52618408203125, 0.728271484375, 0.93035888671875, 1.1324462890625, 1.33453369140625, 1.53662109375, 1.73870849609375, 1.9407958984375, 2.14288330078125, 2.344970703125, 2.54705810546875, 2.7491455078125, 2.95123291015625, 3.1533203125, 3.35540771484375, 3.5574951171875, 3.75958251953125, 3.961669921875, 4.16375732421875, 4.3658447265625, 4.56793212890625, 4.77001953125, 4.97210693359375, 5.1741943359375, 5.37628173828125, 5.578369140625, 5.78045654296875, 5.9825439453125, 6.18463134765625, 6.38671875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 8.0, 7.0, 8.0, 27.0, 27.0, 56.0, 54.0, 78.0, 150.0, 188.0, 264.0, 446.0, 627.0, 978.0, 1390.0, 2111.0, 2992.0, 4606.0, 6934.0, 10357.0, 16059.0, 25309.0, 40384.0, 67371.0, 118673.0, 232063.0, 225701.0, 115107.0, 65868.0, 39655.0, 24694.0, 15749.0, 10135.0, 6759.0, 4370.0, 3048.0, 2099.0, 1388.0, 906.0, 662.0, 388.0, 280.0, 210.0, 118.0, 94.0, 60.0, 38.0, 12.0, 13.0, 23.0, 9.0, 2.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.258544921875, -0.2501983642578125, -0.241851806640625, -0.2335052490234375, -0.22515869140625, -0.2168121337890625, -0.208465576171875, -0.2001190185546875, -0.1917724609375, -0.1834259033203125, -0.175079345703125, -0.1667327880859375, -0.15838623046875, -0.1500396728515625, -0.141693115234375, -0.1333465576171875, -0.125, -0.1166534423828125, -0.108306884765625, -0.0999603271484375, -0.09161376953125, -0.0832672119140625, -0.074920654296875, -0.0665740966796875, -0.0582275390625, -0.0498809814453125, -0.041534423828125, -0.0331878662109375, -0.02484130859375, -0.0164947509765625, -0.008148193359375, 0.0001983642578125, 0.008544921875, 0.0168914794921875, 0.025238037109375, 0.0335845947265625, 0.04193115234375, 0.0502777099609375, 0.058624267578125, 0.0669708251953125, 0.0753173828125, 0.0836639404296875, 0.092010498046875, 0.1003570556640625, 0.10870361328125, 0.1170501708984375, 0.125396728515625, 0.1337432861328125, 0.14208984375, 0.1504364013671875, 0.158782958984375, 0.1671295166015625, 0.17547607421875, 0.1838226318359375, 0.192169189453125, 0.2005157470703125, 0.2088623046875, 0.2172088623046875, 0.225555419921875, 0.2339019775390625, 0.24224853515625, 0.2505950927734375, 0.258941650390625, 0.2672882080078125, 0.275634765625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 13.0, 8.0, 15.0, 8.0, 15.0, 11.0, 9.0, 21.0, 22.0, 27.0, 22.0, 32.0, 37.0, 31.0, 43.0, 38.0, 45.0, 34.0, 38.0, 1070.0, 32.0, 33.0, 45.0, 36.0, 39.0, 42.0, 30.0, 38.0, 30.0, 35.0, 22.0, 14.0, 19.0, 13.0, 11.0, 13.0, 11.0, 5.0, 8.0, 3.0, 4.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.880859375, -3.749542236328125, -3.61822509765625, -3.486907958984375, -3.3555908203125, -3.224273681640625, -3.09295654296875, -2.961639404296875, -2.830322265625, -2.699005126953125, -2.56768798828125, -2.436370849609375, -2.3050537109375, -2.173736572265625, -2.04241943359375, -1.911102294921875, -1.77978515625, -1.648468017578125, -1.51715087890625, -1.385833740234375, -1.2545166015625, -1.123199462890625, -0.99188232421875, -0.860565185546875, -0.729248046875, -0.597930908203125, -0.46661376953125, -0.335296630859375, -0.2039794921875, -0.072662353515625, 0.05865478515625, 0.189971923828125, 0.3212890625, 0.452606201171875, 0.58392333984375, 0.715240478515625, 0.8465576171875, 0.977874755859375, 1.10919189453125, 1.240509033203125, 1.371826171875, 1.503143310546875, 1.63446044921875, 1.765777587890625, 1.8970947265625, 2.028411865234375, 2.15972900390625, 2.291046142578125, 2.42236328125, 2.553680419921875, 2.68499755859375, 2.816314697265625, 2.9476318359375, 3.078948974609375, 3.21026611328125, 3.341583251953125, 3.472900390625, 3.604217529296875, 3.73553466796875, 3.866851806640625, 3.9981689453125, 4.129486083984375, 4.26080322265625, 4.392120361328125, 4.5234375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 5.0, 17.0, 15.0, 31.0, 37.0, 40.0, 74.0, 108.0, 165.0, 227.0, 314.0, 406.0, 619.0, 874.0, 1296.0, 1896.0, 2665.0, 3941.0, 5839.0, 8934.0, 13638.0, 21314.0, 33515.0, 55443.0, 93210.0, 161362.0, 1290687.0, 158965.0, 91432.0, 54719.0, 33577.0, 21188.0, 13518.0, 8781.0, 5663.0, 3953.0, 2632.0, 1795.0, 1238.0, 866.0, 609.0, 450.0, 297.0, 234.0, 164.0, 109.0, 89.0, 54.0, 34.0, 28.0, 23.0, 10.0, 14.0, 5.0, 9.0, 4.0, 2.0, 2.0], "bins": [-0.19091796875, -0.1850414276123047, -0.17916488647460938, -0.17328834533691406, -0.16741180419921875, -0.16153526306152344, -0.15565872192382812, -0.1497821807861328, -0.1439056396484375, -0.1380290985107422, -0.13215255737304688, -0.12627601623535156, -0.12039947509765625, -0.11452293395996094, -0.10864639282226562, -0.10276985168457031, -0.096893310546875, -0.09101676940917969, -0.08514022827148438, -0.07926368713378906, -0.07338714599609375, -0.06751060485839844, -0.061634063720703125, -0.05575752258300781, -0.0498809814453125, -0.04400444030761719, -0.038127899169921875, -0.03225135803222656, -0.02637481689453125, -0.020498275756835938, -0.014621734619140625, -0.008745193481445312, -0.00286865234375, 0.0030078887939453125, 0.008884429931640625, 0.014760971069335938, 0.02063751220703125, 0.026514053344726562, 0.032390594482421875, 0.03826713562011719, 0.0441436767578125, 0.05002021789550781, 0.055896759033203125, 0.06177330017089844, 0.06764984130859375, 0.07352638244628906, 0.07940292358398438, 0.08527946472167969, 0.091156005859375, 0.09703254699707031, 0.10290908813476562, 0.10878562927246094, 0.11466217041015625, 0.12053871154785156, 0.12641525268554688, 0.1322917938232422, 0.1381683349609375, 0.1440448760986328, 0.14992141723632812, 0.15579795837402344, 0.16167449951171875, 0.16755104064941406, 0.17342758178710938, 0.1793041229248047, 0.1851806640625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 6.0, 9.0, 11.0, 10.0, 13.0, 18.0, 25.0, 28.0, 34.0, 37.0, 35.0, 79.0, 108.0, 140.0, 112.0, 83.0, 52.0, 41.0, 30.0, 22.0, 16.0, 17.0, 10.0, 16.0, 6.0, 7.0, 7.0, 4.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003261566162109375, -0.00031606853008270264, -0.0003059804439544678, -0.0002958923578262329, -0.00028580427169799805, -0.0002757161855697632, -0.0002656280994415283, -0.00025554001331329346, -0.0002454519271850586, -0.00023536384105682373, -0.00022527575492858887, -0.000215187668800354, -0.00020509958267211914, -0.00019501149654388428, -0.00018492341041564941, -0.00017483532428741455, -0.0001647472381591797, -0.00015465915203094482, -0.00014457106590270996, -0.0001344829797744751, -0.00012439489364624023, -0.00011430680751800537, -0.00010421872138977051, -9.413063526153564e-05, -8.404254913330078e-05, -7.395446300506592e-05, -6.386637687683105e-05, -5.377829074859619e-05, -4.369020462036133e-05, -3.3602118492126465e-05, -2.35140323638916e-05, -1.3425946235656738e-05, -3.337860107421875e-06, 6.750226020812988e-06, 1.683831214904785e-05, 2.6926398277282715e-05, 3.701448440551758e-05, 4.710257053375244e-05, 5.7190656661987305e-05, 6.727874279022217e-05, 7.736682891845703e-05, 8.74549150466919e-05, 9.754300117492676e-05, 0.00010763108730316162, 0.00011771917343139648, 0.00012780725955963135, 0.0001378953456878662, 0.00014798343181610107, 0.00015807151794433594, 0.0001681596040725708, 0.00017824769020080566, 0.00018833577632904053, 0.0001984238624572754, 0.00020851194858551025, 0.00021860003471374512, 0.00022868812084197998, 0.00023877620697021484, 0.0002488642930984497, 0.00025895237922668457, 0.00026904046535491943, 0.0002791285514831543, 0.00028921663761138916, 0.000299304723739624, 0.0003093928098678589, 0.00031948089599609375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 9.0, 6.0, 14.0, 9.0, 12.0, 20.0, 25.0, 35.0, 35.0, 62.0, 99.0, 131.0, 249.0, 679.0, 16097.0, 1023624.0, 6272.0, 509.0, 195.0, 119.0, 90.0, 67.0, 47.0, 31.0, 24.0, 17.0, 16.0, 9.0, 9.0, 12.0, 7.0, 2.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006137847900390625, -0.0059424638748168945, -0.005747079849243164, -0.005551695823669434, -0.005356311798095703, -0.005160927772521973, -0.004965543746948242, -0.004770159721374512, -0.004574775695800781, -0.004379391670227051, -0.00418400764465332, -0.00398862361907959, -0.0037932395935058594, -0.003597855567932129, -0.0034024715423583984, -0.003207087516784668, -0.0030117034912109375, -0.002816319465637207, -0.0026209354400634766, -0.002425551414489746, -0.0022301673889160156, -0.002034783363342285, -0.0018393993377685547, -0.0016440153121948242, -0.0014486312866210938, -0.0012532472610473633, -0.0010578632354736328, -0.0008624792098999023, -0.0006670951843261719, -0.0004717111587524414, -0.00027632713317871094, -8.094310760498047e-05, 0.00011444091796875, 0.00030982494354248047, 0.0005052089691162109, 0.0007005929946899414, 0.0008959770202636719, 0.0010913610458374023, 0.0012867450714111328, 0.0014821290969848633, 0.0016775131225585938, 0.0018728971481323242, 0.0020682811737060547, 0.002263665199279785, 0.0024590492248535156, 0.002654433250427246, 0.0028498172760009766, 0.003045201301574707, 0.0032405853271484375, 0.003435969352722168, 0.0036313533782958984, 0.003826737403869629, 0.004022121429443359, 0.00421750545501709, 0.00441288948059082, 0.004608273506164551, 0.004803657531738281, 0.004999041557312012, 0.005194425582885742, 0.005389809608459473, 0.005585193634033203, 0.005780577659606934, 0.005975961685180664, 0.0061713457107543945, 0.006366729736328125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 201.0, 762.0, 42.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000331379531417042, -0.00028601803933270276, -0.00024065653269644827, -0.00019529502606019378, -0.00014993353397585452, -0.00010457204189151525, -5.921052070334554e-05, -1.3849028619006276e-05, 3.1512463465332985e-05, 7.687396282562986e-05, 0.00012223546218592674, 0.00016759696882218122, 0.00021295846090652049, 0.00025831995299085975, 0.00030368147417902946, 0.0003490429662633687, 0.000394404458347708, 0.00043976595043204725, 0.0004851274425163865, 0.0005304889637045562, 0.0005758504848927259, 0.0006212119478732347, 0.0006665734690614045, 0.0007119349902495742, 0.000757296453230083, 0.0008026579744182527, 0.0008480194373987615, 0.0008933809585869312, 0.00093874242156744, 0.0009841038845479488, 0.0010294654639437795, 0.0010748269269242883, 0.001120188506320119, 0.0011655499693006277, 0.0012109115486964583, 0.0012562730116769671, 0.001301634474657476, 0.0013469960540533066, 0.0013923575170338154, 0.0014377189800143242, 0.001483080442994833, 0.0015284419059753418, 0.0015738034853711724, 0.0016191649483516812, 0.00166452641133219, 0.0017098879907280207, 0.0017552494537085295, 0.0018006109166890383, 0.001845972496084869, 0.0018913339590653777, 0.0019366955384612083, 0.001982057001441717, 0.002027418464422226, 0.0020727799274027348, 0.0021181413903832436, 0.002163503086194396, 0.002208864549174905, 0.0022542260121554136, 0.0022995874751359224, 0.002344949170947075, 0.0023903106339275837, 0.0024356720969080925, 0.0024810335598886013, 0.00252639502286911, 0.002571756485849619]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 3.0, 3.0, 8.0, 5.0, 9.0, 10.0, 13.0, 14.0, 15.0, 24.0, 15.0, 26.0, 24.0, 30.0, 36.0, 32.0, 29.0, 39.0, 45.0, 41.0, 38.0, 37.0, 54.0, 33.0, 50.0, 38.0, 41.0, 47.0, 37.0, 37.0, 28.0, 23.0, 19.0, 11.0, 18.0, 16.0, 18.0, 5.0, 4.0, 11.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00016635656356811523, -0.0001615956425666809, -0.00015683472156524658, -0.00015207380056381226, -0.00014731287956237793, -0.0001425519585609436, -0.00013779103755950928, -0.00013303011655807495, -0.00012826919555664062, -0.0001235082745552063, -0.00011874735355377197, -0.00011398643255233765, -0.00010922551155090332, -0.000104464590549469, -9.970366954803467e-05, -9.494274854660034e-05, -9.018182754516602e-05, -8.542090654373169e-05, -8.065998554229736e-05, -7.589906454086304e-05, -7.113814353942871e-05, -6.637722253799438e-05, -6.161630153656006e-05, -5.685538053512573e-05, -5.2094459533691406e-05, -4.733353853225708e-05, -4.2572617530822754e-05, -3.781169652938843e-05, -3.30507755279541e-05, -2.8289854526519775e-05, -2.352893352508545e-05, -1.8768012523651123e-05, -1.4007091522216797e-05, -9.24617052078247e-06, -4.4852495193481445e-06, 2.7567148208618164e-07, 5.036592483520508e-06, 9.797513484954834e-06, 1.455843448638916e-05, 1.9319355487823486e-05, 2.4080276489257812e-05, 2.884119749069214e-05, 3.3602118492126465e-05, 3.836303949356079e-05, 4.312396049499512e-05, 4.788488149642944e-05, 5.264580249786377e-05, 5.7406723499298096e-05, 6.216764450073242e-05, 6.692856550216675e-05, 7.168948650360107e-05, 7.64504075050354e-05, 8.121132850646973e-05, 8.597224950790405e-05, 9.073317050933838e-05, 9.54940915107727e-05, 0.00010025501251220703, 0.00010501593351364136, 0.00010977685451507568, 0.00011453777551651001, 0.00011929869651794434, 0.00012405961751937866, 0.000128820538520813, 0.00013358145952224731, 0.00013834238052368164]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 4.0, 9.0, 11.0, 11.0, 12.0, 16.0, 18.0, 17.0, 30.0, 22.0, 18.0, 27.0, 43.0, 38.0, 35.0, 39.0, 46.0, 40.0, 46.0, 36.0, 47.0, 44.0, 37.0, 31.0, 45.0, 28.0, 35.0, 28.0, 21.0, 29.0, 18.0, 21.0, 15.0, 13.0, 12.0, 10.0, 14.0, 7.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.546875, -6.34478759765625, -6.1427001953125, -5.94061279296875, -5.738525390625, -5.53643798828125, -5.3343505859375, -5.13226318359375, -4.93017578125, -4.72808837890625, -4.5260009765625, -4.32391357421875, -4.121826171875, -3.91973876953125, -3.7176513671875, -3.51556396484375, -3.3134765625, -3.11138916015625, -2.9093017578125, -2.70721435546875, -2.505126953125, -2.30303955078125, -2.1009521484375, -1.89886474609375, -1.69677734375, -1.49468994140625, -1.2926025390625, -1.09051513671875, -0.888427734375, -0.68634033203125, -0.4842529296875, -0.28216552734375, -0.080078125, 0.12200927734375, 0.3240966796875, 0.52618408203125, 0.728271484375, 0.93035888671875, 1.1324462890625, 1.33453369140625, 1.53662109375, 1.73870849609375, 1.9407958984375, 2.14288330078125, 2.344970703125, 2.54705810546875, 2.7491455078125, 2.95123291015625, 3.1533203125, 3.35540771484375, 3.5574951171875, 3.75958251953125, 3.961669921875, 4.16375732421875, 4.3658447265625, 4.56793212890625, 4.77001953125, 4.97210693359375, 5.1741943359375, 5.37628173828125, 5.578369140625, 5.78045654296875, 5.9825439453125, 6.18463134765625, 6.38671875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 5.0, 22.0, 12.0, 31.0, 24.0, 48.0, 63.0, 83.0, 92.0, 162.0, 231.0, 373.0, 507.0, 893.0, 1557.0, 2876.0, 5482.0, 11961.0, 29042.0, 80595.0, 236563.0, 430414.0, 155295.0, 53545.0, 20083.0, 8813.0, 4151.0, 2202.0, 1230.0, 723.0, 456.0, 298.0, 206.0, 150.0, 86.0, 81.0, 45.0, 47.0, 29.0, 17.0, 22.0, 11.0, 8.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-6.81640625, -6.60540771484375, -6.3944091796875, -6.18341064453125, -5.972412109375, -5.76141357421875, -5.5504150390625, -5.33941650390625, -5.12841796875, -4.91741943359375, -4.7064208984375, -4.49542236328125, -4.284423828125, -4.07342529296875, -3.8624267578125, -3.65142822265625, -3.4404296875, -3.22943115234375, -3.0184326171875, -2.80743408203125, -2.596435546875, -2.38543701171875, -2.1744384765625, -1.96343994140625, -1.75244140625, -1.54144287109375, -1.3304443359375, -1.11944580078125, -0.908447265625, -0.69744873046875, -0.4864501953125, -0.27545166015625, -0.064453125, 0.14654541015625, 0.3575439453125, 0.56854248046875, 0.779541015625, 0.99053955078125, 1.2015380859375, 1.41253662109375, 1.62353515625, 1.83453369140625, 2.0455322265625, 2.25653076171875, 2.467529296875, 2.67852783203125, 2.8895263671875, 3.10052490234375, 3.3115234375, 3.52252197265625, 3.7335205078125, 3.94451904296875, 4.155517578125, 4.36651611328125, 4.5775146484375, 4.78851318359375, 4.99951171875, 5.21051025390625, 5.4215087890625, 5.63250732421875, 5.843505859375, 6.05450439453125, 6.2655029296875, 6.47650146484375, 6.6875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 6.0, 4.0, 3.0, 3.0, 9.0, 14.0, 4.0, 12.0, 8.0, 20.0, 19.0, 25.0, 24.0, 30.0, 22.0, 28.0, 28.0, 29.0, 37.0, 66.0, 86.0, 179.0, 1512.0, 308.0, 107.0, 69.0, 44.0, 37.0, 37.0, 40.0, 43.0, 22.0, 33.0, 29.0, 23.0, 15.0, 14.0, 9.0, 12.0, 9.0, 15.0, 6.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.28125, -17.739013671875, -17.19677734375, -16.654541015625, -16.1123046875, -15.570068359375, -15.02783203125, -14.485595703125, -13.943359375, -13.401123046875, -12.85888671875, -12.316650390625, -11.7744140625, -11.232177734375, -10.68994140625, -10.147705078125, -9.60546875, -9.063232421875, -8.52099609375, -7.978759765625, -7.4365234375, -6.894287109375, -6.35205078125, -5.809814453125, -5.267578125, -4.725341796875, -4.18310546875, -3.640869140625, -3.0986328125, -2.556396484375, -2.01416015625, -1.471923828125, -0.9296875, -0.387451171875, 0.15478515625, 0.697021484375, 1.2392578125, 1.781494140625, 2.32373046875, 2.865966796875, 3.408203125, 3.950439453125, 4.49267578125, 5.034912109375, 5.5771484375, 6.119384765625, 6.66162109375, 7.203857421875, 7.74609375, 8.288330078125, 8.83056640625, 9.372802734375, 9.9150390625, 10.457275390625, 10.99951171875, 11.541748046875, 12.083984375, 12.626220703125, 13.16845703125, 13.710693359375, 14.2529296875, 14.795166015625, 15.33740234375, 15.879638671875, 16.421875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 5.0, 5.0, 6.0, 14.0, 12.0, 12.0, 16.0, 25.0, 36.0, 29.0, 48.0, 62.0, 78.0, 105.0, 135.0, 237.0, 432.0, 915.0, 3873.0, 322805.0, 2806583.0, 7814.0, 1111.0, 425.0, 250.0, 175.0, 132.0, 89.0, 73.0, 42.0, 42.0, 28.0, 21.0, 16.0, 13.0, 10.0, 11.0, 8.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.75, -43.26513671875, -41.7802734375, -40.29541015625, -38.810546875, -37.32568359375, -35.8408203125, -34.35595703125, -32.87109375, -31.38623046875, -29.9013671875, -28.41650390625, -26.931640625, -25.44677734375, -23.9619140625, -22.47705078125, -20.9921875, -19.50732421875, -18.0224609375, -16.53759765625, -15.052734375, -13.56787109375, -12.0830078125, -10.59814453125, -9.11328125, -7.62841796875, -6.1435546875, -4.65869140625, -3.173828125, -1.68896484375, -0.2041015625, 1.28076171875, 2.765625, 4.25048828125, 5.7353515625, 7.22021484375, 8.705078125, 10.18994140625, 11.6748046875, 13.15966796875, 14.64453125, 16.12939453125, 17.6142578125, 19.09912109375, 20.583984375, 22.06884765625, 23.5537109375, 25.03857421875, 26.5234375, 28.00830078125, 29.4931640625, 30.97802734375, 32.462890625, 33.94775390625, 35.4326171875, 36.91748046875, 38.40234375, 39.88720703125, 41.3720703125, 42.85693359375, 44.341796875, 45.82666015625, 47.3115234375, 48.79638671875, 50.28125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 111.0, 524.0, 345.0, 33.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-204.02435302734375, -200.29823303222656, -196.57211303710938, -192.84597778320312, -189.11985778808594, -185.39373779296875, -181.66761779785156, -177.94149780273438, -174.21536254882812, -170.48924255371094, -166.76312255859375, -163.0369873046875, -159.3108673095703, -155.58474731445312, -151.85862731933594, -148.13250732421875, -144.40638732910156, -140.68026733398438, -136.9541473388672, -133.22801208496094, -129.50189208984375, -125.77577209472656, -122.04965209960938, -118.32352447509766, -114.59739685058594, -110.87127685546875, -107.14514923095703, -103.41902923583984, -99.69290161132812, -95.96678161621094, -92.24066162109375, -88.51453399658203, -84.78840637207031, -81.06228637695312, -77.3361587524414, -73.61003875732422, -69.8839111328125, -66.15779113769531, -62.43166732788086, -58.705543518066406, -54.97942352294922, -51.253299713134766, -47.52717590332031, -43.801055908203125, -40.07493209838867, -36.34880828857422, -32.622684478759766, -28.896562576293945, -25.170440673828125, -21.444316864013672, -17.71819496154785, -13.992071151733398, -10.265948295593262, -6.539825439453125, -2.813701629638672, 0.9124202728271484, 4.638544082641602, 8.364666938781738, 12.090789794921875, 15.816913604736328, 19.54303741455078, 23.2691593170166, 26.995283126831055, 30.721405029296875, 34.44752883911133]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 6.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 6.0, 12.0, 18.0, 17.0, 21.0, 16.0, 25.0, 23.0, 19.0, 25.0, 32.0, 26.0, 33.0, 44.0, 37.0, 42.0, 44.0, 52.0, 45.0, 40.0, 33.0, 35.0, 21.0, 36.0, 41.0, 45.0, 34.0, 26.0, 29.0, 17.0, 15.0, 16.0, 15.0, 8.0, 10.0, 9.0, 5.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.30317687988281, -39.91122055053711, -38.51926803588867, -37.12731170654297, -35.735355377197266, -34.34339904785156, -32.951446533203125, -31.559490203857422, -30.16753578186035, -28.77558135986328, -27.383625030517578, -25.991670608520508, -24.599716186523438, -23.207759857177734, -21.815805435180664, -20.423851013183594, -19.03189468383789, -17.63994026184082, -16.247983932495117, -14.856029510498047, -13.46407413482666, -12.072118759155273, -10.680164337158203, -9.288208961486816, -7.89625358581543, -6.504298210144043, -5.1123433113098145, -3.720388412475586, -2.328433036804199, -0.9364776611328125, 0.4554767608642578, 1.8474321365356445, 3.239391326904297, 4.631346702575684, 6.023301601409912, 7.415256500244141, 8.807211875915527, 10.199167251586914, 11.591121673583984, 12.983077049255371, 14.375032424926758, 15.766987800598145, 17.15894317626953, 18.5508975982666, 19.942852020263672, 21.334808349609375, 22.726762771606445, 24.118717193603516, 25.51067352294922, 26.90262794494629, 28.294584274291992, 29.686538696289062, 31.078495025634766, 32.47045135498047, 33.862403869628906, 35.25436019897461, 36.64631652832031, 38.038272857666016, 39.43022537231445, 40.822181701660156, 42.21413803100586, 43.60609436035156, 44.998046875, 46.3900032043457, 47.78195571899414]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 7.0, 4.0, 9.0, 10.0, 12.0, 15.0, 22.0, 22.0, 22.0, 20.0, 19.0, 23.0, 24.0, 46.0, 34.0, 42.0, 54.0, 46.0, 34.0, 44.0, 42.0, 41.0, 43.0, 30.0, 45.0, 33.0, 26.0, 32.0, 37.0, 28.0, 16.0, 19.0, 16.0, 14.0, 15.0, 8.0, 8.0, 10.0, 11.0, 10.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.0, -6.7862548828125, -6.572509765625, -6.3587646484375, -6.14501953125, -5.9312744140625, -5.717529296875, -5.5037841796875, -5.2900390625, -5.0762939453125, -4.862548828125, -4.6488037109375, -4.43505859375, -4.2213134765625, -4.007568359375, -3.7938232421875, -3.580078125, -3.3663330078125, -3.152587890625, -2.9388427734375, -2.72509765625, -2.5113525390625, -2.297607421875, -2.0838623046875, -1.8701171875, -1.6563720703125, -1.442626953125, -1.2288818359375, -1.01513671875, -0.8013916015625, -0.587646484375, -0.3739013671875, -0.16015625, 0.0535888671875, 0.267333984375, 0.4810791015625, 0.69482421875, 0.9085693359375, 1.122314453125, 1.3360595703125, 1.5498046875, 1.7635498046875, 1.977294921875, 2.1910400390625, 2.40478515625, 2.6185302734375, 2.832275390625, 3.0460205078125, 3.259765625, 3.4735107421875, 3.687255859375, 3.9010009765625, 4.11474609375, 4.3284912109375, 4.542236328125, 4.7559814453125, 4.9697265625, 5.1834716796875, 5.397216796875, 5.6109619140625, 5.82470703125, 6.0384521484375, 6.252197265625, 6.4659423828125, 6.6796875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 2.0, 11.0, 10.0, 8.0, 10.0, 14.0, 18.0, 19.0, 35.0, 33.0, 54.0, 66.0, 80.0, 162.0, 336.0, 866.0, 2372.0, 9401.0, 96906.0, 2905599.0, 1138901.0, 31322.0, 5229.0, 1524.0, 554.0, 270.0, 139.0, 78.0, 58.0, 39.0, 35.0, 16.0, 21.0, 16.0, 14.0, 11.0, 15.0, 5.0, 11.0, 6.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.453125, -22.759521484375, -22.06591796875, -21.372314453125, -20.6787109375, -19.985107421875, -19.29150390625, -18.597900390625, -17.904296875, -17.210693359375, -16.51708984375, -15.823486328125, -15.1298828125, -14.436279296875, -13.74267578125, -13.049072265625, -12.35546875, -11.661865234375, -10.96826171875, -10.274658203125, -9.5810546875, -8.887451171875, -8.19384765625, -7.500244140625, -6.806640625, -6.113037109375, -5.41943359375, -4.725830078125, -4.0322265625, -3.338623046875, -2.64501953125, -1.951416015625, -1.2578125, -0.564208984375, 0.12939453125, 0.822998046875, 1.5166015625, 2.210205078125, 2.90380859375, 3.597412109375, 4.291015625, 4.984619140625, 5.67822265625, 6.371826171875, 7.0654296875, 7.759033203125, 8.45263671875, 9.146240234375, 9.83984375, 10.533447265625, 11.22705078125, 11.920654296875, 12.6142578125, 13.307861328125, 14.00146484375, 14.695068359375, 15.388671875, 16.082275390625, 16.77587890625, 17.469482421875, 18.1630859375, 18.856689453125, 19.55029296875, 20.243896484375, 20.9375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 7.0, 2.0, 2.0, 8.0, 10.0, 19.0, 17.0, 20.0, 38.0, 37.0, 46.0, 59.0, 76.0, 142.0, 204.0, 297.0, 418.0, 519.0, 530.0, 485.0, 352.0, 232.0, 158.0, 110.0, 72.0, 48.0, 28.0, 20.0, 22.0, 17.0, 17.0, 15.0, 11.0, 8.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2109375, -11.8538818359375, -11.496826171875, -11.1397705078125, -10.78271484375, -10.4256591796875, -10.068603515625, -9.7115478515625, -9.3544921875, -8.9974365234375, -8.640380859375, -8.2833251953125, -7.92626953125, -7.5692138671875, -7.212158203125, -6.8551025390625, -6.498046875, -6.1409912109375, -5.783935546875, -5.4268798828125, -5.06982421875, -4.7127685546875, -4.355712890625, -3.9986572265625, -3.6416015625, -3.2845458984375, -2.927490234375, -2.5704345703125, -2.21337890625, -1.8563232421875, -1.499267578125, -1.1422119140625, -0.78515625, -0.4281005859375, -0.071044921875, 0.2860107421875, 0.64306640625, 1.0001220703125, 1.357177734375, 1.7142333984375, 2.0712890625, 2.4283447265625, 2.785400390625, 3.1424560546875, 3.49951171875, 3.8565673828125, 4.213623046875, 4.5706787109375, 4.927734375, 5.2847900390625, 5.641845703125, 5.9989013671875, 6.35595703125, 6.7130126953125, 7.070068359375, 7.4271240234375, 7.7841796875, 8.1412353515625, 8.498291015625, 8.8553466796875, 9.21240234375, 9.5694580078125, 9.926513671875, 10.2835693359375, 10.640625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 9.0, 3.0, 5.0, 9.0, 12.0, 9.0, 20.0, 19.0, 17.0, 20.0, 24.0, 55.0, 58.0, 94.0, 164.0, 254.0, 505.0, 2381.0, 78636.0, 4068334.0, 40659.0, 1782.0, 466.0, 234.0, 151.0, 83.0, 60.0, 45.0, 43.0, 30.0, 25.0, 14.0, 18.0, 17.0, 6.0, 2.0, 2.0, 7.0, 4.0, 0.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.875, -53.9765625, -52.078125, -50.1796875, -48.28125, -46.3828125, -44.484375, -42.5859375, -40.6875, -38.7890625, -36.890625, -34.9921875, -33.09375, -31.1953125, -29.296875, -27.3984375, -25.5, -23.6015625, -21.703125, -19.8046875, -17.90625, -16.0078125, -14.109375, -12.2109375, -10.3125, -8.4140625, -6.515625, -4.6171875, -2.71875, -0.8203125, 1.078125, 2.9765625, 4.875, 6.7734375, 8.671875, 10.5703125, 12.46875, 14.3671875, 16.265625, 18.1640625, 20.0625, 21.9609375, 23.859375, 25.7578125, 27.65625, 29.5546875, 31.453125, 33.3515625, 35.25, 37.1484375, 39.046875, 40.9453125, 42.84375, 44.7421875, 46.640625, 48.5390625, 50.4375, 52.3359375, 54.234375, 56.1328125, 58.03125, 59.9296875, 61.828125, 63.7265625, 65.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 17.0, 97.0, 297.0, 399.0, 160.0, 34.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.88795471191406, -38.234310150146484, -33.580665588378906, -28.927021026611328, -24.27337646484375, -19.619731903076172, -14.966087341308594, -10.312442779541016, -5.6587982177734375, -1.0051536560058594, 3.6484909057617188, 8.302135467529297, 12.955780029296875, 17.609424591064453, 22.26306915283203, 26.91671371459961, 31.570358276367188, 36.224002838134766, 40.877647399902344, 45.53129196166992, 50.1849365234375, 54.83858108520508, 59.492225646972656, 64.1458740234375, 68.79951477050781, 73.45315551757812, 78.10680389404297, 82.76045227050781, 87.41409301757812, 92.06773376464844, 96.72138214111328, 101.37503051757812, 106.02867126464844, 110.68231201171875, 115.3359603881836, 119.98960876464844, 124.64324951171875, 129.29689025878906, 133.95053100585938, 138.60418701171875, 143.25782775878906, 147.91146850585938, 152.56512451171875, 157.21876525878906, 161.87240600585938, 166.5260467529297, 171.1796875, 175.83334350585938, 180.4869842529297, 185.140625, 189.79428100585938, 194.4479217529297, 199.1015625, 203.7552032470703, 208.40884399414062, 213.0625, 217.7161407470703, 222.36978149414062, 227.0234375, 231.6770782470703, 236.33071899414062, 240.98435974121094, 245.63800048828125, 250.29165649414062, 254.94529724121094]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 9.0, 6.0, 8.0, 8.0, 15.0, 14.0, 21.0, 19.0, 23.0, 29.0, 30.0, 29.0, 31.0, 49.0, 29.0, 32.0, 44.0, 46.0, 41.0, 42.0, 41.0, 35.0, 45.0, 34.0, 33.0, 34.0, 30.0, 28.0, 26.0, 22.0, 18.0, 13.0, 18.0, 16.0, 15.0, 7.0, 12.0, 5.0, 7.0, 10.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-33.48048782348633, -32.41051483154297, -31.34054183959961, -30.27056884765625, -29.20059585571289, -28.13062286376953, -27.060651779174805, -25.990678787231445, -24.920705795288086, -23.850732803344727, -22.780759811401367, -21.710786819458008, -20.64081573486328, -19.570842742919922, -18.500869750976562, -17.430896759033203, -16.360923767089844, -15.290950775146484, -14.220977783203125, -13.151005744934082, -12.081032752990723, -11.011059761047363, -9.94108772277832, -8.871114730834961, -7.801141738891602, -6.731168746948242, -5.661196231842041, -4.59122371673584, -3.5212507247924805, -2.451277732849121, -1.38130521774292, -0.31133270263671875, 0.758636474609375, 1.8286092281341553, 2.8985819816589355, 3.968554735183716, 5.038527488708496, 6.1085004806518555, 7.178472995758057, 8.248445510864258, 9.318418502807617, 10.388391494750977, 11.458364486694336, 12.528336524963379, 13.598309516906738, 14.668282508850098, 15.73825454711914, 16.8082275390625, 17.87820053100586, 18.94817352294922, 20.018146514892578, 21.088119506835938, 22.158092498779297, 23.228065490722656, 24.298036575317383, 25.368009567260742, 26.4379825592041, 27.50795555114746, 28.57792854309082, 29.64790153503418, 30.717872619628906, 31.787845611572266, 32.857818603515625, 33.927791595458984, 34.997764587402344]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 8.0, 4.0, 14.0, 12.0, 12.0, 20.0, 13.0, 23.0, 19.0, 18.0, 22.0, 37.0, 21.0, 33.0, 27.0, 41.0, 43.0, 47.0, 53.0, 35.0, 46.0, 36.0, 39.0, 36.0, 32.0, 22.0, 25.0, 39.0, 36.0, 26.0, 24.0, 24.0, 9.0, 15.0, 11.0, 15.0, 14.0, 7.0, 8.0, 8.0, 4.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9296875, -5.73681640625, -5.5439453125, -5.35107421875, -5.158203125, -4.96533203125, -4.7724609375, -4.57958984375, -4.38671875, -4.19384765625, -4.0009765625, -3.80810546875, -3.615234375, -3.42236328125, -3.2294921875, -3.03662109375, -2.84375, -2.65087890625, -2.4580078125, -2.26513671875, -2.072265625, -1.87939453125, -1.6865234375, -1.49365234375, -1.30078125, -1.10791015625, -0.9150390625, -0.72216796875, -0.529296875, -0.33642578125, -0.1435546875, 0.04931640625, 0.2421875, 0.43505859375, 0.6279296875, 0.82080078125, 1.013671875, 1.20654296875, 1.3994140625, 1.59228515625, 1.78515625, 1.97802734375, 2.1708984375, 2.36376953125, 2.556640625, 2.74951171875, 2.9423828125, 3.13525390625, 3.328125, 3.52099609375, 3.7138671875, 3.90673828125, 4.099609375, 4.29248046875, 4.4853515625, 4.67822265625, 4.87109375, 5.06396484375, 5.2568359375, 5.44970703125, 5.642578125, 5.83544921875, 6.0283203125, 6.22119140625, 6.4140625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 2.0, 3.0, 5.0, 10.0, 6.0, 25.0, 18.0, 30.0, 44.0, 76.0, 105.0, 149.0, 211.0, 322.0, 462.0, 711.0, 869.0, 1333.0, 1890.0, 2655.0, 3837.0, 5356.0, 7714.0, 11215.0, 15740.0, 22848.0, 34712.0, 54040.0, 91650.0, 171407.0, 250851.0, 144417.0, 78467.0, 47596.0, 31069.0, 20973.0, 14189.0, 9968.0, 7011.0, 4901.0, 3401.0, 2486.0, 1766.0, 1216.0, 877.0, 627.0, 420.0, 284.0, 202.0, 141.0, 94.0, 56.0, 42.0, 30.0, 20.0, 8.0, 9.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.271240234375, -0.2631111145019531, -0.25498199462890625, -0.24685287475585938, -0.2387237548828125, -0.23059463500976562, -0.22246551513671875, -0.21433639526367188, -0.206207275390625, -0.19807815551757812, -0.18994903564453125, -0.18181991577148438, -0.1736907958984375, -0.16556167602539062, -0.15743255615234375, -0.14930343627929688, -0.14117431640625, -0.13304519653320312, -0.12491607666015625, -0.11678695678710938, -0.1086578369140625, -0.10052871704101562, -0.09239959716796875, -0.08427047729492188, -0.076141357421875, -0.06801223754882812, -0.05988311767578125, -0.051753997802734375, -0.0436248779296875, -0.035495758056640625, -0.02736663818359375, -0.019237518310546875, -0.0111083984375, -0.002979278564453125, 0.00514984130859375, 0.013278961181640625, 0.0214080810546875, 0.029537200927734375, 0.03766632080078125, 0.045795440673828125, 0.053924560546875, 0.062053680419921875, 0.07018280029296875, 0.07831192016601562, 0.0864410400390625, 0.09457015991210938, 0.10269927978515625, 0.11082839965820312, 0.11895751953125, 0.12708663940429688, 0.13521575927734375, 0.14334487915039062, 0.1514739990234375, 0.15960311889648438, 0.16773223876953125, 0.17586135864257812, 0.183990478515625, 0.19211959838867188, 0.20024871826171875, 0.20837783813476562, 0.2165069580078125, 0.22463607788085938, 0.23276519775390625, 0.24089431762695312, 0.2490234375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 9.0, 9.0, 12.0, 20.0, 11.0, 12.0, 21.0, 27.0, 21.0, 26.0, 34.0, 42.0, 39.0, 32.0, 37.0, 42.0, 52.0, 36.0, 1071.0, 44.0, 49.0, 49.0, 33.0, 57.0, 26.0, 32.0, 26.0, 27.0, 20.0, 16.0, 19.0, 10.0, 14.0, 8.0, 8.0, 8.0, 6.0, 7.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.36328125, -4.2230224609375, -4.082763671875, -3.9425048828125, -3.80224609375, -3.6619873046875, -3.521728515625, -3.3814697265625, -3.2412109375, -3.1009521484375, -2.960693359375, -2.8204345703125, -2.68017578125, -2.5399169921875, -2.399658203125, -2.2593994140625, -2.119140625, -1.9788818359375, -1.838623046875, -1.6983642578125, -1.55810546875, -1.4178466796875, -1.277587890625, -1.1373291015625, -0.9970703125, -0.8568115234375, -0.716552734375, -0.5762939453125, -0.43603515625, -0.2957763671875, -0.155517578125, -0.0152587890625, 0.125, 0.2652587890625, 0.405517578125, 0.5457763671875, 0.68603515625, 0.8262939453125, 0.966552734375, 1.1068115234375, 1.2470703125, 1.3873291015625, 1.527587890625, 1.6678466796875, 1.80810546875, 1.9483642578125, 2.088623046875, 2.2288818359375, 2.369140625, 2.5093994140625, 2.649658203125, 2.7899169921875, 2.93017578125, 3.0704345703125, 3.210693359375, 3.3509521484375, 3.4912109375, 3.6314697265625, 3.771728515625, 3.9119873046875, 4.05224609375, 4.1925048828125, 4.332763671875, 4.4730224609375, 4.61328125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 11.0, 12.0, 17.0, 34.0, 47.0, 79.0, 106.0, 163.0, 209.0, 299.0, 439.0, 680.0, 939.0, 1345.0, 1942.0, 2970.0, 4371.0, 6571.0, 9849.0, 15448.0, 24789.0, 40028.0, 65291.0, 113333.0, 208472.0, 1279433.0, 127252.0, 72797.0, 43475.0, 27261.0, 16775.0, 10925.0, 7041.0, 4811.0, 3128.0, 2102.0, 1475.0, 998.0, 698.0, 443.0, 354.0, 236.0, 151.0, 105.0, 68.0, 49.0, 32.0, 27.0, 20.0, 10.0, 8.0, 7.0, 5.0, 2.0, 3.0, 0.0, 3.0], "bins": [-0.203369140625, -0.19703292846679688, -0.19069671630859375, -0.18436050415039062, -0.1780242919921875, -0.17168807983398438, -0.16535186767578125, -0.15901565551757812, -0.152679443359375, -0.14634323120117188, -0.14000701904296875, -0.13367080688476562, -0.1273345947265625, -0.12099838256835938, -0.11466217041015625, -0.10832595825195312, -0.10198974609375, -0.09565353393554688, -0.08931732177734375, -0.08298110961914062, -0.0766448974609375, -0.07030868530273438, -0.06397247314453125, -0.057636260986328125, -0.051300048828125, -0.044963836669921875, -0.03862762451171875, -0.032291412353515625, -0.0259552001953125, -0.019618988037109375, -0.01328277587890625, -0.006946563720703125, -0.0006103515625, 0.005725860595703125, 0.01206207275390625, 0.018398284912109375, 0.0247344970703125, 0.031070709228515625, 0.03740692138671875, 0.043743133544921875, 0.050079345703125, 0.056415557861328125, 0.06275177001953125, 0.06908798217773438, 0.0754241943359375, 0.08176040649414062, 0.08809661865234375, 0.09443283081054688, 0.10076904296875, 0.10710525512695312, 0.11344146728515625, 0.11977767944335938, 0.1261138916015625, 0.13245010375976562, 0.13878631591796875, 0.14512252807617188, 0.151458740234375, 0.15779495239257812, 0.16413116455078125, 0.17046737670898438, 0.1768035888671875, 0.18313980102539062, 0.18947601318359375, 0.19581222534179688, 0.2021484375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 19.0, 16.0, 31.0, 46.0, 68.0, 106.0, 174.0, 191.0, 114.0, 71.0, 48.0, 38.0, 21.0, 16.0, 6.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024962425231933594, -0.00023877620697021484, -0.00022792816162109375, -0.00021708011627197266, -0.00020623207092285156, -0.00019538402557373047, -0.00018453598022460938, -0.00017368793487548828, -0.0001628398895263672, -0.0001519918441772461, -0.000141143798828125, -0.0001302957534790039, -0.00011944770812988281, -0.00010859966278076172, -9.775161743164062e-05, -8.690357208251953e-05, -7.605552673339844e-05, -6.520748138427734e-05, -5.435943603515625e-05, -4.3511390686035156e-05, -3.266334533691406e-05, -2.181529998779297e-05, -1.0967254638671875e-05, -1.1920928955078125e-07, 1.0728836059570312e-05, 2.1576881408691406e-05, 3.24249267578125e-05, 4.3272972106933594e-05, 5.412101745605469e-05, 6.496906280517578e-05, 7.581710815429688e-05, 8.666515350341797e-05, 9.751319885253906e-05, 0.00010836124420166016, 0.00011920928955078125, 0.00013005733489990234, 0.00014090538024902344, 0.00015175342559814453, 0.00016260147094726562, 0.00017344951629638672, 0.0001842975616455078, 0.0001951456069946289, 0.00020599365234375, 0.0002168416976928711, 0.0002276897430419922, 0.00023853778839111328, 0.0002493858337402344, 0.00026023387908935547, 0.00027108192443847656, 0.00028192996978759766, 0.00029277801513671875, 0.00030362606048583984, 0.00031447410583496094, 0.00032532215118408203, 0.0003361701965332031, 0.0003470182418823242, 0.0003578662872314453, 0.0003687143325805664, 0.0003795623779296875, 0.0003904104232788086, 0.0004012584686279297, 0.0004121065139770508, 0.0004229545593261719, 0.00043380260467529297, 0.00044465065002441406]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 8.0, 13.0, 12.0, 10.0, 27.0, 41.0, 80.0, 118.0, 355.0, 1662.0, 568968.0, 475003.0, 1593.0, 351.0, 136.0, 67.0, 31.0, 27.0, 12.0, 10.0, 7.0, 7.0, 3.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00909423828125, -0.008872389793395996, -0.008650541305541992, -0.008428692817687988, -0.008206844329833984, -0.00798499584197998, -0.0077631473541259766, -0.007541298866271973, -0.007319450378417969, -0.007097601890563965, -0.006875753402709961, -0.006653904914855957, -0.006432056427001953, -0.006210207939147949, -0.005988359451293945, -0.005766510963439941, -0.0055446624755859375, -0.005322813987731934, -0.00510096549987793, -0.004879117012023926, -0.004657268524169922, -0.004435420036315918, -0.004213571548461914, -0.00399172306060791, -0.0037698745727539062, -0.0035480260848999023, -0.0033261775970458984, -0.0031043291091918945, -0.0028824806213378906, -0.0026606321334838867, -0.002438783645629883, -0.002216935157775879, -0.001995086669921875, -0.001773238182067871, -0.0015513896942138672, -0.0013295412063598633, -0.0011076927185058594, -0.0008858442306518555, -0.0006639957427978516, -0.00044214725494384766, -0.00022029876708984375, 1.5497207641601562e-06, 0.00022339820861816406, 0.00044524669647216797, 0.0006670951843261719, 0.0008889436721801758, 0.0011107921600341797, 0.0013326406478881836, 0.0015544891357421875, 0.0017763376235961914, 0.0019981861114501953, 0.0022200345993041992, 0.002441883087158203, 0.002663731575012207, 0.002885580062866211, 0.003107428550720215, 0.0033292770385742188, 0.0035511255264282227, 0.0037729740142822266, 0.0039948225021362305, 0.004216670989990234, 0.004438519477844238, 0.004660367965698242, 0.004882216453552246, 0.00510406494140625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 16.0, 12.0, 37.0, 87.0, 168.0, 243.0, 216.0, 116.0, 60.0, 32.0, 11.0, 3.0, 3.0, 5.0], "bins": [-0.0006774240173399448, -0.0006652597221545875, -0.0006530954269692302, -0.0006409311899915338, -0.0006287668948061764, -0.0006166025996208191, -0.0006044383044354618, -0.0005922740092501044, -0.000580109772272408, -0.0005679454770870507, -0.0005557811819016933, -0.0005436169449239969, -0.0005314526497386396, -0.0005192883545532823, -0.0005071240593679249, -0.0004949597641825676, -0.00048279546899721026, -0.00047063117381185293, -0.00045846690773032606, -0.0004463026125449687, -0.00043413834646344185, -0.0004219740512780845, -0.0004098097560927272, -0.0003976454900112003, -0.00038548122392967343, -0.0003733169287443161, -0.0003611526626627892, -0.0003489883674774319, -0.000336824101395905, -0.0003246598062105477, -0.00031249551102519035, -0.0003003312449436635, -0.00028816694975830615, -0.0002760026545729488, -0.00026383838849142194, -0.0002516740933060646, -0.0002395098126726225, -0.0002273455320391804, -0.0002151812514057383, -0.0002030169707722962, -0.00019085267558693886, -0.00017868839495349675, -0.00016652411432005465, -0.00015435981913469732, -0.00014219553850125521, -0.0001300312578678131, -0.000117866977234371, -0.00010570268932497129, -9.35384159674868e-05, -8.13741353340447e-05, -6.920984742464498e-05, -5.704556679120287e-05, -4.488128251978196e-05, -3.271699824836105e-05, -2.0552717614918947e-05, -8.38842970551923e-06, 3.7758509279228747e-06, 1.5940135199343786e-05, 2.8104417651775293e-05, 4.02687001042068e-05, 5.243298437562771e-05, 6.459726864704862e-05, 7.676154928049073e-05, 8.892583718989044e-05, 0.00010109011782333255]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 4.0, 6.0, 7.0, 8.0, 15.0, 12.0, 13.0, 17.0, 24.0, 36.0, 23.0, 30.0, 38.0, 31.0, 35.0, 35.0, 43.0, 34.0, 40.0, 42.0, 48.0, 54.0, 38.0, 40.0, 48.0, 38.0, 36.0, 31.0, 28.0, 20.0, 27.0, 17.0, 17.0, 10.0, 12.0, 11.0, 6.0, 6.0, 4.0, 2.0, 2.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001068115234375, -0.00010351184755563736, -0.00010021217167377472, -9.691249579191208e-05, -9.361281991004944e-05, -9.03131440281868e-05, -8.701346814632416e-05, -8.371379226446152e-05, -8.041411638259888e-05, -7.711444050073624e-05, -7.38147646188736e-05, -7.051508873701096e-05, -6.721541285514832e-05, -6.391573697328568e-05, -6.0616061091423035e-05, -5.7316385209560394e-05, -5.4016709327697754e-05, -5.0717033445835114e-05, -4.741735756397247e-05, -4.411768168210983e-05, -4.081800580024719e-05, -3.751832991838455e-05, -3.421865403652191e-05, -3.091897815465927e-05, -2.761930227279663e-05, -2.431962639093399e-05, -2.101995050907135e-05, -1.772027462720871e-05, -1.442059874534607e-05, -1.1120922863483429e-05, -7.821246981620789e-06, -4.521571099758148e-06, -1.2218952178955078e-06, 2.0777806639671326e-06, 5.377456545829773e-06, 8.677132427692413e-06, 1.1976808309555054e-05, 1.5276484191417694e-05, 1.8576160073280334e-05, 2.1875835955142975e-05, 2.5175511837005615e-05, 2.8475187718868256e-05, 3.1774863600730896e-05, 3.5074539482593536e-05, 3.837421536445618e-05, 4.167389124631882e-05, 4.497356712818146e-05, 4.82732430100441e-05, 5.157291889190674e-05, 5.487259477376938e-05, 5.817227065563202e-05, 6.147194653749466e-05, 6.47716224193573e-05, 6.807129830121994e-05, 7.137097418308258e-05, 7.467065006494522e-05, 7.797032594680786e-05, 8.12700018286705e-05, 8.456967771053314e-05, 8.786935359239578e-05, 9.116902947425842e-05, 9.446870535612106e-05, 9.77683812379837e-05, 0.00010106805711984634, 0.00010436773300170898]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 8.0, 4.0, 14.0, 12.0, 12.0, 20.0, 13.0, 23.0, 19.0, 18.0, 22.0, 37.0, 21.0, 33.0, 27.0, 41.0, 43.0, 47.0, 53.0, 35.0, 46.0, 36.0, 39.0, 36.0, 32.0, 22.0, 25.0, 39.0, 36.0, 26.0, 24.0, 24.0, 9.0, 15.0, 11.0, 15.0, 14.0, 7.0, 8.0, 8.0, 4.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9296875, -5.73681640625, -5.5439453125, -5.35107421875, -5.158203125, -4.96533203125, -4.7724609375, -4.57958984375, -4.38671875, -4.19384765625, -4.0009765625, -3.80810546875, -3.615234375, -3.42236328125, -3.2294921875, -3.03662109375, -2.84375, -2.65087890625, -2.4580078125, -2.26513671875, -2.072265625, -1.87939453125, -1.6865234375, -1.49365234375, -1.30078125, -1.10791015625, -0.9150390625, -0.72216796875, -0.529296875, -0.33642578125, -0.1435546875, 0.04931640625, 0.2421875, 0.43505859375, 0.6279296875, 0.82080078125, 1.013671875, 1.20654296875, 1.3994140625, 1.59228515625, 1.78515625, 1.97802734375, 2.1708984375, 2.36376953125, 2.556640625, 2.74951171875, 2.9423828125, 3.13525390625, 3.328125, 3.52099609375, 3.7138671875, 3.90673828125, 4.099609375, 4.29248046875, 4.4853515625, 4.67822265625, 4.87109375, 5.06396484375, 5.2568359375, 5.44970703125, 5.642578125, 5.83544921875, 6.0283203125, 6.22119140625, 6.4140625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 6.0, 11.0, 15.0, 6.0, 19.0, 19.0, 28.0, 33.0, 44.0, 49.0, 90.0, 113.0, 145.0, 295.0, 486.0, 1061.0, 2248.0, 6058.0, 22651.0, 133918.0, 702383.0, 143688.0, 24202.0, 6207.0, 2252.0, 1073.0, 537.0, 303.0, 164.0, 119.0, 89.0, 56.0, 43.0, 24.0, 26.0, 16.0, 19.0, 14.0, 8.0, 10.0, 7.0, 1.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.7421875, -11.36962890625, -10.9970703125, -10.62451171875, -10.251953125, -9.87939453125, -9.5068359375, -9.13427734375, -8.76171875, -8.38916015625, -8.0166015625, -7.64404296875, -7.271484375, -6.89892578125, -6.5263671875, -6.15380859375, -5.78125, -5.40869140625, -5.0361328125, -4.66357421875, -4.291015625, -3.91845703125, -3.5458984375, -3.17333984375, -2.80078125, -2.42822265625, -2.0556640625, -1.68310546875, -1.310546875, -0.93798828125, -0.5654296875, -0.19287109375, 0.1796875, 0.55224609375, 0.9248046875, 1.29736328125, 1.669921875, 2.04248046875, 2.4150390625, 2.78759765625, 3.16015625, 3.53271484375, 3.9052734375, 4.27783203125, 4.650390625, 5.02294921875, 5.3955078125, 5.76806640625, 6.140625, 6.51318359375, 6.8857421875, 7.25830078125, 7.630859375, 8.00341796875, 8.3759765625, 8.74853515625, 9.12109375, 9.49365234375, 9.8662109375, 10.23876953125, 10.611328125, 10.98388671875, 11.3564453125, 11.72900390625, 12.1015625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 2.0, 6.0, 5.0, 13.0, 13.0, 10.0, 13.0, 16.0, 14.0, 21.0, 42.0, 27.0, 26.0, 24.0, 29.0, 49.0, 46.0, 48.0, 106.0, 185.0, 1531.0, 243.0, 99.0, 73.0, 54.0, 39.0, 36.0, 45.0, 30.0, 28.0, 23.0, 26.0, 19.0, 20.0, 11.0, 15.0, 13.0, 9.0, 4.0, 14.0, 5.0, 2.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.0625, -17.510498046875, -16.95849609375, -16.406494140625, -15.8544921875, -15.302490234375, -14.75048828125, -14.198486328125, -13.646484375, -13.094482421875, -12.54248046875, -11.990478515625, -11.4384765625, -10.886474609375, -10.33447265625, -9.782470703125, -9.23046875, -8.678466796875, -8.12646484375, -7.574462890625, -7.0224609375, -6.470458984375, -5.91845703125, -5.366455078125, -4.814453125, -4.262451171875, -3.71044921875, -3.158447265625, -2.6064453125, -2.054443359375, -1.50244140625, -0.950439453125, -0.3984375, 0.153564453125, 0.70556640625, 1.257568359375, 1.8095703125, 2.361572265625, 2.91357421875, 3.465576171875, 4.017578125, 4.569580078125, 5.12158203125, 5.673583984375, 6.2255859375, 6.777587890625, 7.32958984375, 7.881591796875, 8.43359375, 8.985595703125, 9.53759765625, 10.089599609375, 10.6416015625, 11.193603515625, 11.74560546875, 12.297607421875, 12.849609375, 13.401611328125, 13.95361328125, 14.505615234375, 15.0576171875, 15.609619140625, 16.16162109375, 16.713623046875, 17.265625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 8.0, 8.0, 17.0, 15.0, 18.0, 25.0, 26.0, 26.0, 39.0, 34.0, 62.0, 84.0, 86.0, 137.0, 314.0, 621.0, 2213.0, 74032.0, 3054895.0, 10563.0, 1242.0, 458.0, 242.0, 135.0, 75.0, 64.0, 44.0, 43.0, 43.0, 26.0, 15.0, 19.0, 8.0, 13.0, 11.0, 12.0, 6.0, 5.0, 8.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.0625, -48.41064453125, -46.7587890625, -45.10693359375, -43.455078125, -41.80322265625, -40.1513671875, -38.49951171875, -36.84765625, -35.19580078125, -33.5439453125, -31.89208984375, -30.240234375, -28.58837890625, -26.9365234375, -25.28466796875, -23.6328125, -21.98095703125, -20.3291015625, -18.67724609375, -17.025390625, -15.37353515625, -13.7216796875, -12.06982421875, -10.41796875, -8.76611328125, -7.1142578125, -5.46240234375, -3.810546875, -2.15869140625, -0.5068359375, 1.14501953125, 2.796875, 4.44873046875, 6.1005859375, 7.75244140625, 9.404296875, 11.05615234375, 12.7080078125, 14.35986328125, 16.01171875, 17.66357421875, 19.3154296875, 20.96728515625, 22.619140625, 24.27099609375, 25.9228515625, 27.57470703125, 29.2265625, 30.87841796875, 32.5302734375, 34.18212890625, 35.833984375, 37.48583984375, 39.1376953125, 40.78955078125, 42.44140625, 44.09326171875, 45.7451171875, 47.39697265625, 49.048828125, 50.70068359375, 52.3525390625, 54.00439453125, 55.65625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 15.0, 40.0, 96.0, 201.0, 288.0, 210.0, 116.0, 31.0, 19.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.84120559692383, -32.39612579345703, -30.951047897338867, -29.505970001220703, -28.060890197753906, -26.615812301635742, -25.170734405517578, -23.72565460205078, -22.280576705932617, -20.835498809814453, -19.390419006347656, -17.945341110229492, -16.500263214111328, -15.055183410644531, -13.610105514526367, -12.165026664733887, -10.719947814941406, -9.274868965148926, -7.8297905921936035, -6.384712219238281, -4.939633369445801, -3.4945545196533203, -2.0494766235351562, -0.6043977737426758, 0.8406810760498047, 2.285759687423706, 3.7308382987976074, 5.17591667175293, 6.62099552154541, 8.06607437133789, 9.511152267456055, 10.956231117248535, 12.40130615234375, 13.84638500213623, 15.291463851928711, 16.736541748046875, 18.181621551513672, 19.626699447631836, 21.07177734375, 22.516857147216797, 23.96193504333496, 25.407012939453125, 26.852092742919922, 28.297170639038086, 29.74224853515625, 31.187328338623047, 32.632408142089844, 34.077484130859375, 35.52256393432617, 36.96764373779297, 38.4127197265625, 39.8577995300293, 41.302879333496094, 42.747955322265625, 44.19303512573242, 45.63811492919922, 47.08319091796875, 48.52827072143555, 49.97334671020508, 51.418426513671875, 52.86350631713867, 54.30858612060547, 55.753662109375, 57.1987419128418, 58.643821716308594]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 6.0, 8.0, 8.0, 15.0, 15.0, 17.0, 23.0, 18.0, 21.0, 36.0, 27.0, 27.0, 28.0, 37.0, 34.0, 42.0, 50.0, 49.0, 42.0, 43.0, 47.0, 29.0, 44.0, 39.0, 28.0, 34.0, 30.0, 32.0, 39.0, 16.0, 17.0, 14.0, 19.0, 7.0, 7.0, 6.0, 10.0, 6.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.48288345336914, -47.91722106933594, -46.35155487060547, -44.785892486572266, -43.22023010253906, -41.654563903808594, -40.08890151977539, -38.52323913574219, -36.95757293701172, -35.391910552978516, -33.82624435424805, -32.260581970214844, -30.694917678833008, -29.129253387451172, -27.56359100341797, -25.997926712036133, -24.432262420654297, -22.86659812927246, -21.300933837890625, -19.735271453857422, -18.169607162475586, -16.60394287109375, -15.03827953338623, -13.472616195678711, -11.906951904296875, -10.341287612915039, -8.77562427520752, -7.209960460662842, -5.644296646118164, -4.078632831573486, -2.5129690170288086, -0.9473056793212891, 0.6183547973632812, 2.184018611907959, 3.7496824264526367, 5.3153462409973145, 6.881010055541992, 8.446674346923828, 10.012337684631348, 11.578001022338867, 13.143665313720703, 14.709329605102539, 16.274993896484375, 17.840656280517578, 19.406320571899414, 20.97198486328125, 22.537647247314453, 24.10331153869629, 25.668975830078125, 27.23464012145996, 28.800304412841797, 30.365966796875, 31.931631088256836, 33.49729537963867, 35.062957763671875, 36.628623962402344, 38.19428634643555, 39.75994873046875, 41.32561492919922, 42.89127731323242, 44.456939697265625, 46.022605895996094, 47.5882682800293, 49.1539306640625, 50.71959686279297]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 9.0, 8.0, 10.0, 6.0, 9.0, 16.0, 20.0, 12.0, 24.0, 12.0, 16.0, 26.0, 30.0, 31.0, 34.0, 31.0, 33.0, 42.0, 43.0, 33.0, 50.0, 48.0, 37.0, 53.0, 25.0, 26.0, 37.0, 22.0, 30.0, 30.0, 34.0, 28.0, 16.0, 19.0, 17.0, 16.0, 14.0, 9.0, 11.0, 13.0, 3.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.57421875, -6.36981201171875, -6.1654052734375, -5.96099853515625, -5.756591796875, -5.55218505859375, -5.3477783203125, -5.14337158203125, -4.93896484375, -4.73455810546875, -4.5301513671875, -4.32574462890625, -4.121337890625, -3.91693115234375, -3.7125244140625, -3.50811767578125, -3.3037109375, -3.09930419921875, -2.8948974609375, -2.69049072265625, -2.486083984375, -2.28167724609375, -2.0772705078125, -1.87286376953125, -1.66845703125, -1.46405029296875, -1.2596435546875, -1.05523681640625, -0.850830078125, -0.64642333984375, -0.4420166015625, -0.23760986328125, -0.033203125, 0.17120361328125, 0.3756103515625, 0.58001708984375, 0.784423828125, 0.98883056640625, 1.1932373046875, 1.39764404296875, 1.60205078125, 1.80645751953125, 2.0108642578125, 2.21527099609375, 2.419677734375, 2.62408447265625, 2.8284912109375, 3.03289794921875, 3.2373046875, 3.44171142578125, 3.6461181640625, 3.85052490234375, 4.054931640625, 4.25933837890625, 4.4637451171875, 4.66815185546875, 4.87255859375, 5.07696533203125, 5.2813720703125, 5.48577880859375, 5.690185546875, 5.89459228515625, 6.0989990234375, 6.30340576171875, 6.5078125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 4.0, 3.0, 7.0, 9.0, 17.0, 20.0, 36.0, 38.0, 62.0, 90.0, 136.0, 202.0, 246.0, 355.0, 575.0, 1016.0, 1834.0, 3374.0, 7121.0, 18088.0, 68283.0, 336425.0, 1239735.0, 1704808.0, 629566.0, 131729.0, 29604.0, 10282.0, 4614.0, 2423.0, 1317.0, 755.0, 483.0, 295.0, 211.0, 140.0, 111.0, 94.0, 49.0, 37.0, 26.0, 14.0, 18.0, 8.0, 14.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.78125, -9.50347900390625, -9.2257080078125, -8.94793701171875, -8.670166015625, -8.39239501953125, -8.1146240234375, -7.83685302734375, -7.55908203125, -7.28131103515625, -7.0035400390625, -6.72576904296875, -6.447998046875, -6.17022705078125, -5.8924560546875, -5.61468505859375, -5.3369140625, -5.05914306640625, -4.7813720703125, -4.50360107421875, -4.225830078125, -3.94805908203125, -3.6702880859375, -3.39251708984375, -3.11474609375, -2.83697509765625, -2.5592041015625, -2.28143310546875, -2.003662109375, -1.72589111328125, -1.4481201171875, -1.17034912109375, -0.892578125, -0.61480712890625, -0.3370361328125, -0.05926513671875, 0.218505859375, 0.49627685546875, 0.7740478515625, 1.05181884765625, 1.32958984375, 1.60736083984375, 1.8851318359375, 2.16290283203125, 2.440673828125, 2.71844482421875, 2.9962158203125, 3.27398681640625, 3.5517578125, 3.82952880859375, 4.1072998046875, 4.38507080078125, 4.662841796875, 4.94061279296875, 5.2183837890625, 5.49615478515625, 5.77392578125, 6.05169677734375, 6.3294677734375, 6.60723876953125, 6.885009765625, 7.16278076171875, 7.4405517578125, 7.71832275390625, 7.99609375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 7.0, 6.0, 8.0, 10.0, 15.0, 15.0, 18.0, 17.0, 31.0, 27.0, 49.0, 45.0, 68.0, 95.0, 122.0, 172.0, 254.0, 348.0, 373.0, 501.0, 441.0, 341.0, 285.0, 193.0, 146.0, 118.0, 73.0, 62.0, 43.0, 28.0, 28.0, 32.0, 24.0, 19.0, 15.0, 8.0, 5.0, 4.0, 10.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0], "bins": [-11.1796875, -10.8673095703125, -10.554931640625, -10.2425537109375, -9.93017578125, -9.6177978515625, -9.305419921875, -8.9930419921875, -8.6806640625, -8.3682861328125, -8.055908203125, -7.7435302734375, -7.43115234375, -7.1187744140625, -6.806396484375, -6.4940185546875, -6.181640625, -5.8692626953125, -5.556884765625, -5.2445068359375, -4.93212890625, -4.6197509765625, -4.307373046875, -3.9949951171875, -3.6826171875, -3.3702392578125, -3.057861328125, -2.7454833984375, -2.43310546875, -2.1207275390625, -1.808349609375, -1.4959716796875, -1.18359375, -0.8712158203125, -0.558837890625, -0.2464599609375, 0.06591796875, 0.3782958984375, 0.690673828125, 1.0030517578125, 1.3154296875, 1.6278076171875, 1.940185546875, 2.2525634765625, 2.56494140625, 2.8773193359375, 3.189697265625, 3.5020751953125, 3.814453125, 4.1268310546875, 4.439208984375, 4.7515869140625, 5.06396484375, 5.3763427734375, 5.688720703125, 6.0010986328125, 6.3134765625, 6.6258544921875, 6.938232421875, 7.2506103515625, 7.56298828125, 7.8753662109375, 8.187744140625, 8.5001220703125, 8.8125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 0.0, 4.0, 3.0, 1.0, 4.0, 11.0, 4.0, 7.0, 8.0, 19.0, 13.0, 26.0, 30.0, 35.0, 38.0, 47.0, 76.0, 130.0, 188.0, 255.0, 512.0, 1245.0, 5342.0, 70054.0, 3714986.0, 384466.0, 12720.0, 2170.0, 748.0, 410.0, 225.0, 137.0, 91.0, 61.0, 48.0, 40.0, 27.0, 24.0, 11.0, 18.0, 15.0, 5.0, 11.0, 8.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.9375, -31.7900390625, -30.642578125, -29.4951171875, -28.34765625, -27.2001953125, -26.052734375, -24.9052734375, -23.7578125, -22.6103515625, -21.462890625, -20.3154296875, -19.16796875, -18.0205078125, -16.873046875, -15.7255859375, -14.578125, -13.4306640625, -12.283203125, -11.1357421875, -9.98828125, -8.8408203125, -7.693359375, -6.5458984375, -5.3984375, -4.2509765625, -3.103515625, -1.9560546875, -0.80859375, 0.3388671875, 1.486328125, 2.6337890625, 3.78125, 4.9287109375, 6.076171875, 7.2236328125, 8.37109375, 9.5185546875, 10.666015625, 11.8134765625, 12.9609375, 14.1083984375, 15.255859375, 16.4033203125, 17.55078125, 18.6982421875, 19.845703125, 20.9931640625, 22.140625, 23.2880859375, 24.435546875, 25.5830078125, 26.73046875, 27.8779296875, 29.025390625, 30.1728515625, 31.3203125, 32.4677734375, 33.615234375, 34.7626953125, 35.91015625, 37.0576171875, 38.205078125, 39.3525390625, 40.5]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 17.0, 23.0, 73.0, 171.0, 218.0, 226.0, 140.0, 82.0, 40.0, 11.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.88778305053711, -42.240169525146484, -39.592552185058594, -36.94493865966797, -34.297325134277344, -31.649709701538086, -29.002094268798828, -26.354480743408203, -23.706865310668945, -21.059249877929688, -18.411636352539062, -15.764020919799805, -13.116406440734863, -10.468791961669922, -7.821176528930664, -5.173563003540039, -2.5259475708007812, 0.12166714668273926, 2.7692818641662598, 5.416896820068359, 8.0645112991333, 10.712125778198242, 13.3597412109375, 16.007354736328125, 18.654970169067383, 21.30258560180664, 23.950199127197266, 26.597814559936523, 29.24542999267578, 31.893043518066406, 34.54065704345703, 37.188270568847656, 39.83589172363281, 42.48350524902344, 45.13112258911133, 47.77873611450195, 50.42634963989258, 53.07396697998047, 55.721580505371094, 58.36919403076172, 61.016807556152344, 63.66442108154297, 66.3120346069336, 68.95965576171875, 71.60726928710938, 74.2548828125, 76.90249633789062, 79.55010986328125, 82.19772338867188, 84.8453369140625, 87.49295043945312, 90.14056396484375, 92.7881851196289, 95.43579864501953, 98.08341217041016, 100.73102569580078, 103.37864685058594, 106.02626037597656, 108.67387390136719, 111.32148742675781, 113.96910858154297, 116.6167221069336, 119.26433563232422, 121.91194915771484, 124.55956268310547]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 5.0, 5.0, 8.0, 7.0, 7.0, 12.0, 21.0, 21.0, 18.0, 21.0, 22.0, 26.0, 40.0, 35.0, 34.0, 39.0, 48.0, 48.0, 52.0, 33.0, 42.0, 51.0, 39.0, 47.0, 41.0, 29.0, 33.0, 27.0, 30.0, 23.0, 19.0, 13.0, 13.0, 21.0, 7.0, 19.0, 13.0, 7.0, 10.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-43.8133659362793, -42.58719253540039, -41.36101531982422, -40.13484191894531, -38.908668518066406, -37.682491302490234, -36.45631790161133, -35.230140686035156, -34.00396728515625, -32.777793884277344, -31.551616668701172, -30.325443267822266, -29.099267959594727, -27.873092651367188, -26.64691925048828, -25.420743942260742, -24.194568634033203, -22.968393325805664, -21.742218017578125, -20.51604461669922, -19.28986930847168, -18.06369400024414, -16.837520599365234, -15.611345291137695, -14.385169982910156, -13.158994674682617, -11.932820320129395, -10.706645965576172, -9.480470657348633, -8.254295349121094, -7.028120994567871, -5.801946640014648, -4.575767517089844, -3.349592685699463, -2.123417854309082, -0.8972430229187012, 0.3289318084716797, 1.5551066398620605, 2.7812814712524414, 4.007455825805664, 5.233631134033203, 6.459805965423584, 7.685980796813965, 8.912155151367188, 10.138330459594727, 11.364505767822266, 12.590680122375488, 13.816854476928711, 15.04302978515625, 16.26920509338379, 17.495380401611328, 18.721553802490234, 19.947729110717773, 21.173904418945312, 22.40007781982422, 23.626253128051758, 24.852428436279297, 26.078603744506836, 27.304779052734375, 28.53095245361328, 29.75712776184082, 30.98330307006836, 32.209476470947266, 33.43565368652344, 34.661827087402344]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 6.0, 4.0, 4.0, 5.0, 3.0, 8.0, 13.0, 6.0, 13.0, 12.0, 17.0, 15.0, 13.0, 19.0, 22.0, 34.0, 20.0, 34.0, 32.0, 37.0, 29.0, 35.0, 34.0, 41.0, 37.0, 45.0, 30.0, 37.0, 27.0, 34.0, 39.0, 36.0, 35.0, 26.0, 23.0, 22.0, 18.0, 15.0, 25.0, 13.0, 16.0, 12.0, 14.0, 7.0, 8.0, 6.0, 10.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.40625, -5.22894287109375, -5.0516357421875, -4.87432861328125, -4.697021484375, -4.51971435546875, -4.3424072265625, -4.16510009765625, -3.98779296875, -3.81048583984375, -3.6331787109375, -3.45587158203125, -3.278564453125, -3.10125732421875, -2.9239501953125, -2.74664306640625, -2.5693359375, -2.39202880859375, -2.2147216796875, -2.03741455078125, -1.860107421875, -1.68280029296875, -1.5054931640625, -1.32818603515625, -1.15087890625, -0.97357177734375, -0.7962646484375, -0.61895751953125, -0.441650390625, -0.26434326171875, -0.0870361328125, 0.09027099609375, 0.267578125, 0.44488525390625, 0.6221923828125, 0.79949951171875, 0.976806640625, 1.15411376953125, 1.3314208984375, 1.50872802734375, 1.68603515625, 1.86334228515625, 2.0406494140625, 2.21795654296875, 2.395263671875, 2.57257080078125, 2.7498779296875, 2.92718505859375, 3.1044921875, 3.28179931640625, 3.4591064453125, 3.63641357421875, 3.813720703125, 3.99102783203125, 4.1683349609375, 4.34564208984375, 4.52294921875, 4.70025634765625, 4.8775634765625, 5.05487060546875, 5.232177734375, 5.40948486328125, 5.5867919921875, 5.76409912109375, 5.94140625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 6.0, 9.0, 12.0, 33.0, 49.0, 85.0, 86.0, 164.0, 226.0, 353.0, 587.0, 868.0, 1218.0, 2111.0, 3129.0, 5006.0, 8183.0, 12913.0, 21867.0, 38254.0, 69455.0, 136670.0, 295442.0, 218328.0, 102582.0, 54157.0, 30415.0, 17526.0, 10533.0, 6599.0, 4212.0, 2526.0, 1730.0, 1136.0, 687.0, 447.0, 308.0, 225.0, 146.0, 74.0, 58.0, 44.0, 30.0, 20.0, 21.0, 9.0, 8.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.3330078125, -0.3231544494628906, -0.31330108642578125, -0.3034477233886719, -0.2935943603515625, -0.2837409973144531, -0.27388763427734375, -0.2640342712402344, -0.254180908203125, -0.24432754516601562, -0.23447418212890625, -0.22462081909179688, -0.2147674560546875, -0.20491409301757812, -0.19506072998046875, -0.18520736694335938, -0.17535400390625, -0.16550064086914062, -0.15564727783203125, -0.14579391479492188, -0.1359405517578125, -0.12608718872070312, -0.11623382568359375, -0.10638046264648438, -0.096527099609375, -0.08667373657226562, -0.07682037353515625, -0.06696701049804688, -0.0571136474609375, -0.047260284423828125, -0.03740692138671875, -0.027553558349609375, -0.0177001953125, -0.007846832275390625, 0.00200653076171875, 0.011859893798828125, 0.0217132568359375, 0.031566619873046875, 0.04141998291015625, 0.051273345947265625, 0.061126708984375, 0.07098007202148438, 0.08083343505859375, 0.09068679809570312, 0.1005401611328125, 0.11039352416992188, 0.12024688720703125, 0.13010025024414062, 0.13995361328125, 0.14980697631835938, 0.15966033935546875, 0.16951370239257812, 0.1793670654296875, 0.18922042846679688, 0.19907379150390625, 0.20892715454101562, 0.218780517578125, 0.22863388061523438, 0.23848724365234375, 0.24834060668945312, 0.2581939697265625, 0.2680473327636719, 0.27790069580078125, 0.2877540588378906, 0.297607421875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 1.0, 3.0, 3.0, 7.0, 6.0, 8.0, 4.0, 10.0, 9.0, 5.0, 12.0, 16.0, 12.0, 8.0, 21.0, 20.0, 18.0, 24.0, 22.0, 30.0, 20.0, 39.0, 20.0, 39.0, 28.0, 31.0, 39.0, 1058.0, 33.0, 23.0, 37.0, 38.0, 27.0, 35.0, 29.0, 36.0, 24.0, 29.0, 27.0, 17.0, 24.0, 23.0, 22.0, 12.0, 12.0, 13.0, 8.0, 7.0, 12.0, 11.0, 10.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-3.685546875, -3.579833984375, -3.47412109375, -3.368408203125, -3.2626953125, -3.156982421875, -3.05126953125, -2.945556640625, -2.83984375, -2.734130859375, -2.62841796875, -2.522705078125, -2.4169921875, -2.311279296875, -2.20556640625, -2.099853515625, -1.994140625, -1.888427734375, -1.78271484375, -1.677001953125, -1.5712890625, -1.465576171875, -1.35986328125, -1.254150390625, -1.1484375, -1.042724609375, -0.93701171875, -0.831298828125, -0.7255859375, -0.619873046875, -0.51416015625, -0.408447265625, -0.302734375, -0.197021484375, -0.09130859375, 0.014404296875, 0.1201171875, 0.225830078125, 0.33154296875, 0.437255859375, 0.54296875, 0.648681640625, 0.75439453125, 0.860107421875, 0.9658203125, 1.071533203125, 1.17724609375, 1.282958984375, 1.388671875, 1.494384765625, 1.60009765625, 1.705810546875, 1.8115234375, 1.917236328125, 2.02294921875, 2.128662109375, 2.234375, 2.340087890625, 2.44580078125, 2.551513671875, 2.6572265625, 2.762939453125, 2.86865234375, 2.974365234375, 3.080078125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [7.0, 7.0, 14.0, 17.0, 23.0, 34.0, 28.0, 47.0, 66.0, 81.0, 123.0, 182.0, 272.0, 356.0, 501.0, 612.0, 893.0, 1107.0, 1570.0, 2169.0, 2903.0, 4188.0, 5687.0, 7902.0, 11348.0, 16307.0, 23831.0, 35077.0, 53301.0, 84798.0, 137819.0, 1250855.0, 161791.0, 99567.0, 62448.0, 40494.0, 26914.0, 18570.0, 12682.0, 9019.0, 6425.0, 4626.0, 3386.0, 2415.0, 1802.0, 1293.0, 976.0, 700.0, 536.0, 376.0, 294.0, 187.0, 164.0, 117.0, 70.0, 52.0, 45.0, 28.0, 16.0, 12.0, 8.0, 6.0, 4.0, 4.0], "bins": [-0.15869140625, -0.15368080139160156, -0.14867019653320312, -0.1436595916748047, -0.13864898681640625, -0.1336383819580078, -0.12862777709960938, -0.12361717224121094, -0.1186065673828125, -0.11359596252441406, -0.10858535766601562, -0.10357475280761719, -0.09856414794921875, -0.09355354309082031, -0.08854293823242188, -0.08353233337402344, -0.078521728515625, -0.07351112365722656, -0.06850051879882812, -0.06348991394042969, -0.05847930908203125, -0.05346870422363281, -0.048458099365234375, -0.04344749450683594, -0.0384368896484375, -0.03342628479003906, -0.028415679931640625, -0.023405075073242188, -0.01839447021484375, -0.013383865356445312, -0.008373260498046875, -0.0033626556396484375, 0.00164794921875, 0.0066585540771484375, 0.011669158935546875, 0.016679763793945312, 0.02169036865234375, 0.026700973510742188, 0.031711578369140625, 0.03672218322753906, 0.0417327880859375, 0.04674339294433594, 0.051753997802734375, 0.05676460266113281, 0.06177520751953125, 0.06678581237792969, 0.07179641723632812, 0.07680702209472656, 0.081817626953125, 0.08682823181152344, 0.09183883666992188, 0.09684944152832031, 0.10186004638671875, 0.10687065124511719, 0.11188125610351562, 0.11689186096191406, 0.1219024658203125, 0.12691307067871094, 0.13192367553710938, 0.1369342803955078, 0.14194488525390625, 0.1469554901123047, 0.15196609497070312, 0.15697669982910156, 0.1619873046875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 10.0, 3.0, 4.0, 1.0, 10.0, 5.0, 9.0, 4.0, 12.0, 20.0, 21.0, 39.0, 54.0, 95.0, 122.0, 139.0, 155.0, 97.0, 48.0, 45.0, 21.0, 23.0, 8.0, 14.0, 18.0, 6.0, 9.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00030350685119628906, -0.00029393285512924194, -0.0002843588590621948, -0.0002747848629951477, -0.0002652108669281006, -0.00025563687086105347, -0.00024606287479400635, -0.00023648887872695923, -0.0002269148826599121, -0.000217340886592865, -0.00020776689052581787, -0.00019819289445877075, -0.00018861889839172363, -0.00017904490232467651, -0.0001694709062576294, -0.00015989691019058228, -0.00015032291412353516, -0.00014074891805648804, -0.00013117492198944092, -0.0001216009259223938, -0.00011202692985534668, -0.00010245293378829956, -9.287893772125244e-05, -8.330494165420532e-05, -7.37309455871582e-05, -6.415694952011108e-05, -5.4582953453063965e-05, -4.5008957386016846e-05, -3.5434961318969727e-05, -2.5860965251922607e-05, -1.6286969184875488e-05, -6.712973117828369e-06, 2.86102294921875e-06, 1.2435019016265869e-05, 2.2009015083312988e-05, 3.158301115036011e-05, 4.1157007217407227e-05, 5.0731003284454346e-05, 6.0304999351501465e-05, 6.987899541854858e-05, 7.94529914855957e-05, 8.902698755264282e-05, 9.860098361968994e-05, 0.00010817497968673706, 0.00011774897575378418, 0.0001273229718208313, 0.00013689696788787842, 0.00014647096395492554, 0.00015604496002197266, 0.00016561895608901978, 0.0001751929521560669, 0.00018476694822311401, 0.00019434094429016113, 0.00020391494035720825, 0.00021348893642425537, 0.0002230629324913025, 0.0002326369285583496, 0.00024221092462539673, 0.00025178492069244385, 0.00026135891675949097, 0.0002709329128265381, 0.0002805069088935852, 0.0002900809049606323, 0.00029965490102767944, 0.00030922889709472656]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 13.0, 10.0, 19.0, 22.0, 27.0, 54.0, 77.0, 120.0, 234.0, 723.0, 10962.0, 1028055.0, 7004.0, 634.0, 248.0, 110.0, 60.0, 54.0, 24.0, 18.0, 20.0, 8.0, 15.0, 2.0, 7.0, 4.0, 5.0, 7.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006572723388671875, -0.006370186805725098, -0.00616765022277832, -0.005965113639831543, -0.005762577056884766, -0.005560040473937988, -0.005357503890991211, -0.005154967308044434, -0.004952430725097656, -0.004749894142150879, -0.0045473575592041016, -0.004344820976257324, -0.004142284393310547, -0.0039397478103637695, -0.003737211227416992, -0.003534674644470215, -0.0033321380615234375, -0.00312960147857666, -0.002927064895629883, -0.0027245283126831055, -0.002521991729736328, -0.0023194551467895508, -0.0021169185638427734, -0.001914381980895996, -0.0017118453979492188, -0.0015093088150024414, -0.001306772232055664, -0.0011042356491088867, -0.0009016990661621094, -0.000699162483215332, -0.0004966259002685547, -0.00029408931732177734, -9.1552734375e-05, 0.00011098384857177734, 0.0003135204315185547, 0.000516057014465332, 0.0007185935974121094, 0.0009211301803588867, 0.001123666763305664, 0.0013262033462524414, 0.0015287399291992188, 0.001731276512145996, 0.0019338130950927734, 0.0021363496780395508, 0.002338886260986328, 0.0025414228439331055, 0.002743959426879883, 0.00294649600982666, 0.0031490325927734375, 0.003351569175720215, 0.003554105758666992, 0.0037566423416137695, 0.003959178924560547, 0.004161715507507324, 0.0043642520904541016, 0.004566788673400879, 0.004769325256347656, 0.004971861839294434, 0.005174398422241211, 0.005376935005187988, 0.005579471588134766, 0.005782008171081543, 0.00598454475402832, 0.006187081336975098, 0.006389617919921875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 176.0, 809.0, 30.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013096180919092149, -7.412311970256269e-05, -1.7284430214203894e-05, 3.95542592741549e-05, 9.63929487625137e-05, 0.00015323162369895726, 0.0002100703277392313, 0.0002669090172275901, 0.00032374769216403365, 0.0003805863671004772, 0.00043742507114075124, 0.0004942637751810253, 0.0005511024501174688, 0.0006079411250539124, 0.000664779799990356, 0.0007216185331344604, 0.000778457208070904, 0.0008352958830073476, 0.0008921346161514521, 0.0009489732910878956, 0.0010058119660243392, 0.0010626506991684437, 0.0011194893158972263, 0.0011763280490413308, 0.0012331667821854353, 0.0012900055153295398, 0.0013468441320583224, 0.001403682865202427, 0.0014605214819312096, 0.001517360215075314, 0.0015741989482194185, 0.0016310375649482012, 0.0016878761816769838, 0.0017447149148210883, 0.001801553531549871, 0.0018583922646939754, 0.001915230881422758, 0.0019720694981515408, 0.002028908347710967, 0.0020857469644397497, 0.002142585813999176, 0.0021994244307279587, 0.002256263280287385, 0.0023131018970161676, 0.0023699405137449503, 0.0024267793633043766, 0.0024836179800331593, 0.002540456596761942, 0.0025972952134907246, 0.0026541338302195072, 0.0027109726797789335, 0.002767811296507716, 0.002824649913236499, 0.002881488762795925, 0.002938327379524708, 0.0029951659962534904, 0.003052004612982273, 0.0031088432297110558, 0.003165682079270482, 0.0032225206959992647, 0.0032793593127280474, 0.0033361981622874737, 0.0033930367790162563, 0.003449875395745039, 0.0035067142453044653]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 4.0, 4.0, 8.0, 7.0, 8.0, 19.0, 17.0, 22.0, 26.0, 34.0, 28.0, 44.0, 45.0, 44.0, 40.0, 48.0, 42.0, 58.0, 43.0, 54.0, 50.0, 40.0, 44.0, 44.0, 36.0, 34.0, 28.0, 29.0, 19.0, 18.0, 16.0, 16.0, 13.0, 8.0, 0.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0001665949821472168, -0.00016227364540100098, -0.00015795230865478516, -0.00015363097190856934, -0.00014930963516235352, -0.0001449882984161377, -0.00014066696166992188, -0.00013634562492370605, -0.00013202428817749023, -0.00012770295143127441, -0.0001233816146850586, -0.00011906027793884277, -0.00011473894119262695, -0.00011041760444641113, -0.00010609626770019531, -0.00010177493095397949, -9.745359420776367e-05, -9.313225746154785e-05, -8.881092071533203e-05, -8.448958396911621e-05, -8.016824722290039e-05, -7.584691047668457e-05, -7.152557373046875e-05, -6.720423698425293e-05, -6.288290023803711e-05, -5.856156349182129e-05, -5.424022674560547e-05, -4.991888999938965e-05, -4.559755325317383e-05, -4.127621650695801e-05, -3.695487976074219e-05, -3.263354301452637e-05, -2.8312206268310547e-05, -2.3990869522094727e-05, -1.9669532775878906e-05, -1.5348196029663086e-05, -1.1026859283447266e-05, -6.705522537231445e-06, -2.384185791015625e-06, 1.9371509552001953e-06, 6.258487701416016e-06, 1.0579824447631836e-05, 1.4901161193847656e-05, 1.9222497940063477e-05, 2.3543834686279297e-05, 2.7865171432495117e-05, 3.218650817871094e-05, 3.650784492492676e-05, 4.082918167114258e-05, 4.51505184173584e-05, 4.947185516357422e-05, 5.379319190979004e-05, 5.811452865600586e-05, 6.243586540222168e-05, 6.67572021484375e-05, 7.107853889465332e-05, 7.539987564086914e-05, 7.972121238708496e-05, 8.404254913330078e-05, 8.83638858795166e-05, 9.268522262573242e-05, 9.700655937194824e-05, 0.00010132789611816406, 0.00010564923286437988, 0.0001099705696105957]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 6.0, 4.0, 4.0, 5.0, 3.0, 8.0, 13.0, 6.0, 13.0, 12.0, 17.0, 15.0, 13.0, 19.0, 22.0, 34.0, 20.0, 34.0, 32.0, 37.0, 29.0, 35.0, 34.0, 41.0, 37.0, 45.0, 30.0, 37.0, 27.0, 34.0, 38.0, 37.0, 35.0, 26.0, 23.0, 22.0, 18.0, 15.0, 25.0, 13.0, 16.0, 12.0, 14.0, 7.0, 8.0, 6.0, 10.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.40625, -5.22894287109375, -5.0516357421875, -4.87432861328125, -4.697021484375, -4.51971435546875, -4.3424072265625, -4.16510009765625, -3.98779296875, -3.81048583984375, -3.6331787109375, -3.45587158203125, -3.278564453125, -3.10125732421875, -2.9239501953125, -2.74664306640625, -2.5693359375, -2.39202880859375, -2.2147216796875, -2.03741455078125, -1.860107421875, -1.68280029296875, -1.5054931640625, -1.32818603515625, -1.15087890625, -0.97357177734375, -0.7962646484375, -0.61895751953125, -0.441650390625, -0.26434326171875, -0.0870361328125, 0.09027099609375, 0.267578125, 0.44488525390625, 0.6221923828125, 0.79949951171875, 0.976806640625, 1.15411376953125, 1.3314208984375, 1.50872802734375, 1.68603515625, 1.86334228515625, 2.0406494140625, 2.21795654296875, 2.395263671875, 2.57257080078125, 2.7498779296875, 2.92718505859375, 3.1044921875, 3.28179931640625, 3.4591064453125, 3.63641357421875, 3.813720703125, 3.99102783203125, 4.1683349609375, 4.34564208984375, 4.52294921875, 4.70025634765625, 4.8775634765625, 5.05487060546875, 5.232177734375, 5.40948486328125, 5.5867919921875, 5.76409912109375, 5.94140625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 3.0, 7.0, 8.0, 8.0, 17.0, 22.0, 29.0, 44.0, 54.0, 72.0, 98.0, 146.0, 283.0, 407.0, 715.0, 1380.0, 2661.0, 4745.0, 9418.0, 18887.0, 39266.0, 88066.0, 228736.0, 368858.0, 158495.0, 65807.0, 30121.0, 14416.0, 7253.0, 3723.0, 2047.0, 1116.0, 553.0, 368.0, 213.0, 138.0, 124.0, 71.0, 48.0, 28.0, 25.0, 15.0, 12.0, 15.0, 11.0, 2.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-5.95703125, -5.76055908203125, -5.5640869140625, -5.36761474609375, -5.171142578125, -4.97467041015625, -4.7781982421875, -4.58172607421875, -4.38525390625, -4.18878173828125, -3.9923095703125, -3.79583740234375, -3.599365234375, -3.40289306640625, -3.2064208984375, -3.00994873046875, -2.8134765625, -2.61700439453125, -2.4205322265625, -2.22406005859375, -2.027587890625, -1.83111572265625, -1.6346435546875, -1.43817138671875, -1.24169921875, -1.04522705078125, -0.8487548828125, -0.65228271484375, -0.455810546875, -0.25933837890625, -0.0628662109375, 0.13360595703125, 0.330078125, 0.52655029296875, 0.7230224609375, 0.91949462890625, 1.115966796875, 1.31243896484375, 1.5089111328125, 1.70538330078125, 1.90185546875, 2.09832763671875, 2.2947998046875, 2.49127197265625, 2.687744140625, 2.88421630859375, 3.0806884765625, 3.27716064453125, 3.4736328125, 3.67010498046875, 3.8665771484375, 4.06304931640625, 4.259521484375, 4.45599365234375, 4.6524658203125, 4.84893798828125, 5.04541015625, 5.24188232421875, 5.4383544921875, 5.63482666015625, 5.831298828125, 6.02777099609375, 6.2242431640625, 6.42071533203125, 6.6171875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 4.0, 12.0, 5.0, 18.0, 15.0, 19.0, 23.0, 24.0, 36.0, 45.0, 37.0, 37.0, 48.0, 73.0, 87.0, 166.0, 1486.0, 317.0, 110.0, 77.0, 49.0, 49.0, 33.0, 35.0, 34.0, 36.0, 31.0, 21.0, 30.0, 15.0, 10.0, 13.0, 9.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-20.75, -20.1533203125, -19.556640625, -18.9599609375, -18.36328125, -17.7666015625, -17.169921875, -16.5732421875, -15.9765625, -15.3798828125, -14.783203125, -14.1865234375, -13.58984375, -12.9931640625, -12.396484375, -11.7998046875, -11.203125, -10.6064453125, -10.009765625, -9.4130859375, -8.81640625, -8.2197265625, -7.623046875, -7.0263671875, -6.4296875, -5.8330078125, -5.236328125, -4.6396484375, -4.04296875, -3.4462890625, -2.849609375, -2.2529296875, -1.65625, -1.0595703125, -0.462890625, 0.1337890625, 0.73046875, 1.3271484375, 1.923828125, 2.5205078125, 3.1171875, 3.7138671875, 4.310546875, 4.9072265625, 5.50390625, 6.1005859375, 6.697265625, 7.2939453125, 7.890625, 8.4873046875, 9.083984375, 9.6806640625, 10.27734375, 10.8740234375, 11.470703125, 12.0673828125, 12.6640625, 13.2607421875, 13.857421875, 14.4541015625, 15.05078125, 15.6474609375, 16.244140625, 16.8408203125, 17.4375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 1.0, 5.0, 9.0, 8.0, 16.0, 14.0, 23.0, 27.0, 30.0, 45.0, 52.0, 78.0, 122.0, 139.0, 206.0, 367.0, 896.0, 5832.0, 312002.0, 2801132.0, 21786.0, 1581.0, 470.0, 256.0, 172.0, 116.0, 75.0, 56.0, 51.0, 38.0, 28.0, 18.0, 8.0, 15.0, 5.0, 5.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.34375, -39.19775390625, -38.0517578125, -36.90576171875, -35.759765625, -34.61376953125, -33.4677734375, -32.32177734375, -31.17578125, -30.02978515625, -28.8837890625, -27.73779296875, -26.591796875, -25.44580078125, -24.2998046875, -23.15380859375, -22.0078125, -20.86181640625, -19.7158203125, -18.56982421875, -17.423828125, -16.27783203125, -15.1318359375, -13.98583984375, -12.83984375, -11.69384765625, -10.5478515625, -9.40185546875, -8.255859375, -7.10986328125, -5.9638671875, -4.81787109375, -3.671875, -2.52587890625, -1.3798828125, -0.23388671875, 0.912109375, 2.05810546875, 3.2041015625, 4.35009765625, 5.49609375, 6.64208984375, 7.7880859375, 8.93408203125, 10.080078125, 11.22607421875, 12.3720703125, 13.51806640625, 14.6640625, 15.81005859375, 16.9560546875, 18.10205078125, 19.248046875, 20.39404296875, 21.5400390625, 22.68603515625, 23.83203125, 24.97802734375, 26.1240234375, 27.27001953125, 28.416015625, 29.56201171875, 30.7080078125, 31.85400390625, 33.0]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 257.0, 737.0, 25.0], "bins": [-478.84661865234375, -471.14825439453125, -463.4499206542969, -455.7515563964844, -448.05322265625, -440.3548583984375, -432.656494140625, -424.9581604003906, -417.2597961425781, -409.5614318847656, -401.86309814453125, -394.16473388671875, -386.4664001464844, -378.7680358886719, -371.0697021484375, -363.371337890625, -355.6729736328125, -347.974609375, -340.2762756347656, -332.5779113769531, -324.87957763671875, -317.18121337890625, -309.48284912109375, -301.7845153808594, -294.086181640625, -286.3878173828125, -278.6894836425781, -270.9911193847656, -263.29278564453125, -255.59442138671875, -247.8960723876953, -240.19772338867188, -232.49935913085938, -224.80101013183594, -217.1026611328125, -209.404296875, -201.70594787597656, -194.00759887695312, -186.3092498779297, -178.61090087890625, -170.91253662109375, -163.2141876220703, -155.51583862304688, -147.81747436523438, -140.11912536621094, -132.4207763671875, -124.72242736816406, -117.02407836914062, -109.32572937011719, -101.62738037109375, -93.92902374267578, -86.23067474365234, -78.53231811523438, -70.83396911621094, -63.1356201171875, -55.4372673034668, -47.738914489746094, -40.04056167602539, -32.34220886230469, -24.64385986328125, -16.945507049560547, -9.247154235839844, -1.5488052368164062, 6.149547576904297, 13.847900390625]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 5.0, 7.0, 7.0, 6.0, 18.0, 13.0, 11.0, 16.0, 20.0, 19.0, 26.0, 23.0, 20.0, 32.0, 35.0, 32.0, 43.0, 55.0, 36.0, 30.0, 42.0, 56.0, 42.0, 39.0, 29.0, 37.0, 41.0, 30.0, 27.0, 37.0, 23.0, 21.0, 21.0, 15.0, 13.0, 11.0, 11.0, 9.0, 11.0, 5.0, 3.0, 4.0, 7.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-42.76203536987305, -41.372535705566406, -39.98303985595703, -38.593544006347656, -37.204044342041016, -35.814544677734375, -34.425048828125, -33.035552978515625, -31.646053314208984, -30.256555557250977, -28.86705780029297, -27.47756004333496, -26.088062286376953, -24.698564529418945, -23.309066772460938, -21.91956901550293, -20.530071258544922, -19.140573501586914, -17.751075744628906, -16.3615779876709, -14.97208023071289, -13.582582473754883, -12.193084716796875, -10.803586959838867, -9.41408920288086, -8.024591445922852, -6.635093688964844, -5.245595932006836, -3.856098175048828, -2.4666004180908203, -1.0771026611328125, 0.3123950958251953, 1.7018966674804688, 3.0913944244384766, 4.480892181396484, 5.870389938354492, 7.2598876953125, 8.649385452270508, 10.038883209228516, 11.428380966186523, 12.817878723144531, 14.207376480102539, 15.596874237060547, 16.986371994018555, 18.375869750976562, 19.76536750793457, 21.154865264892578, 22.544363021850586, 23.933860778808594, 25.3233585357666, 26.71285629272461, 28.102354049682617, 29.491851806640625, 30.881349563598633, 32.27084732055664, 33.66034698486328, 35.049842834472656, 36.43933868408203, 37.82883834838867, 39.21833801269531, 40.60783386230469, 41.99732971191406, 43.3868293762207, 44.776329040527344, 46.16582489013672]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 3.0, 17.0, 15.0, 12.0, 15.0, 18.0, 15.0, 19.0, 16.0, 31.0, 24.0, 31.0, 31.0, 31.0, 31.0, 37.0, 42.0, 39.0, 41.0, 43.0, 33.0, 33.0, 38.0, 40.0, 29.0, 33.0, 38.0, 32.0, 30.0, 18.0, 19.0, 16.0, 22.0, 25.0, 9.0, 12.0, 12.0, 7.0, 10.0, 6.0, 2.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.69921875, -5.506103515625, -5.31298828125, -5.119873046875, -4.9267578125, -4.733642578125, -4.54052734375, -4.347412109375, -4.154296875, -3.961181640625, -3.76806640625, -3.574951171875, -3.3818359375, -3.188720703125, -2.99560546875, -2.802490234375, -2.609375, -2.416259765625, -2.22314453125, -2.030029296875, -1.8369140625, -1.643798828125, -1.45068359375, -1.257568359375, -1.064453125, -0.871337890625, -0.67822265625, -0.485107421875, -0.2919921875, -0.098876953125, 0.09423828125, 0.287353515625, 0.48046875, 0.673583984375, 0.86669921875, 1.059814453125, 1.2529296875, 1.446044921875, 1.63916015625, 1.832275390625, 2.025390625, 2.218505859375, 2.41162109375, 2.604736328125, 2.7978515625, 2.990966796875, 3.18408203125, 3.377197265625, 3.5703125, 3.763427734375, 3.95654296875, 4.149658203125, 4.3427734375, 4.535888671875, 4.72900390625, 4.922119140625, 5.115234375, 5.308349609375, 5.50146484375, 5.694580078125, 5.8876953125, 6.080810546875, 6.27392578125, 6.467041015625, 6.66015625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 6.0, 5.0, 12.0, 16.0, 12.0, 19.0, 19.0, 18.0, 31.0, 30.0, 50.0, 55.0, 111.0, 206.0, 408.0, 1025.0, 2956.0, 13624.0, 209392.0, 3180894.0, 748721.0, 28928.0, 4808.0, 1534.0, 617.0, 300.0, 163.0, 80.0, 43.0, 35.0, 31.0, 25.0, 14.0, 16.0, 10.0, 8.0, 15.0, 5.0, 5.0, 9.0, 8.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.1875, -18.581787109375, -17.97607421875, -17.370361328125, -16.7646484375, -16.158935546875, -15.55322265625, -14.947509765625, -14.341796875, -13.736083984375, -13.13037109375, -12.524658203125, -11.9189453125, -11.313232421875, -10.70751953125, -10.101806640625, -9.49609375, -8.890380859375, -8.28466796875, -7.678955078125, -7.0732421875, -6.467529296875, -5.86181640625, -5.256103515625, -4.650390625, -4.044677734375, -3.43896484375, -2.833251953125, -2.2275390625, -1.621826171875, -1.01611328125, -0.410400390625, 0.1953125, 0.801025390625, 1.40673828125, 2.012451171875, 2.6181640625, 3.223876953125, 3.82958984375, 4.435302734375, 5.041015625, 5.646728515625, 6.25244140625, 6.858154296875, 7.4638671875, 8.069580078125, 8.67529296875, 9.281005859375, 9.88671875, 10.492431640625, 11.09814453125, 11.703857421875, 12.3095703125, 12.915283203125, 13.52099609375, 14.126708984375, 14.732421875, 15.338134765625, 15.94384765625, 16.549560546875, 17.1552734375, 17.760986328125, 18.36669921875, 18.972412109375, 19.578125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 12.0, 2.0, 5.0, 8.0, 14.0, 17.0, 31.0, 26.0, 42.0, 57.0, 62.0, 75.0, 124.0, 184.0, 284.0, 392.0, 496.0, 570.0, 462.0, 331.0, 265.0, 163.0, 100.0, 70.0, 63.0, 40.0, 45.0, 23.0, 20.0, 11.0, 13.0, 11.0, 9.0, 9.0, 9.0, 1.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.046875, -8.7279052734375, -8.408935546875, -8.0899658203125, -7.77099609375, -7.4520263671875, -7.133056640625, -6.8140869140625, -6.4951171875, -6.1761474609375, -5.857177734375, -5.5382080078125, -5.21923828125, -4.9002685546875, -4.581298828125, -4.2623291015625, -3.943359375, -3.6243896484375, -3.305419921875, -2.9864501953125, -2.66748046875, -2.3485107421875, -2.029541015625, -1.7105712890625, -1.3916015625, -1.0726318359375, -0.753662109375, -0.4346923828125, -0.11572265625, 0.2032470703125, 0.522216796875, 0.8411865234375, 1.16015625, 1.4791259765625, 1.798095703125, 2.1170654296875, 2.43603515625, 2.7550048828125, 3.073974609375, 3.3929443359375, 3.7119140625, 4.0308837890625, 4.349853515625, 4.6688232421875, 4.98779296875, 5.3067626953125, 5.625732421875, 5.9447021484375, 6.263671875, 6.5826416015625, 6.901611328125, 7.2205810546875, 7.53955078125, 7.8585205078125, 8.177490234375, 8.4964599609375, 8.8154296875, 9.1343994140625, 9.453369140625, 9.7723388671875, 10.09130859375, 10.4102783203125, 10.729248046875, 11.0482177734375, 11.3671875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 7.0, 6.0, 8.0, 7.0, 12.0, 17.0, 13.0, 20.0, 21.0, 34.0, 50.0, 47.0, 81.0, 116.0, 156.0, 262.0, 520.0, 1660.0, 9640.0, 169759.0, 3871619.0, 128818.0, 8443.0, 1514.0, 560.0, 276.0, 164.0, 107.0, 93.0, 65.0, 48.0, 45.0, 26.0, 14.0, 10.0, 4.0, 8.0, 11.0, 5.0, 4.0, 8.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-40.625, -39.4794921875, -38.333984375, -37.1884765625, -36.04296875, -34.8974609375, -33.751953125, -32.6064453125, -31.4609375, -30.3154296875, -29.169921875, -28.0244140625, -26.87890625, -25.7333984375, -24.587890625, -23.4423828125, -22.296875, -21.1513671875, -20.005859375, -18.8603515625, -17.71484375, -16.5693359375, -15.423828125, -14.2783203125, -13.1328125, -11.9873046875, -10.841796875, -9.6962890625, -8.55078125, -7.4052734375, -6.259765625, -5.1142578125, -3.96875, -2.8232421875, -1.677734375, -0.5322265625, 0.61328125, 1.7587890625, 2.904296875, 4.0498046875, 5.1953125, 6.3408203125, 7.486328125, 8.6318359375, 9.77734375, 10.9228515625, 12.068359375, 13.2138671875, 14.359375, 15.5048828125, 16.650390625, 17.7958984375, 18.94140625, 20.0869140625, 21.232421875, 22.3779296875, 23.5234375, 24.6689453125, 25.814453125, 26.9599609375, 28.10546875, 29.2509765625, 30.396484375, 31.5419921875, 32.6875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 18.0, 276.0, 553.0, 155.0, 15.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.67435455322266, -101.0995101928711, -94.52466583251953, -87.9498291015625, -81.37498474121094, -74.80014038085938, -68.22529602050781, -61.65045166015625, -55.07560729980469, -48.500762939453125, -41.92591857910156, -35.351078033447266, -28.776233673095703, -22.20138931274414, -15.626548767089844, -9.051704406738281, -2.4768600463867188, 4.097983360290527, 10.672826766967773, 17.247669219970703, 23.822513580322266, 30.397357940673828, 36.972198486328125, 43.54704284667969, 50.12188720703125, 56.69673156738281, 63.271575927734375, 69.84642028808594, 76.4212646484375, 82.99610900878906, 89.5709457397461, 96.14579010009766, 102.72064208984375, 109.29548645019531, 115.87033081054688, 122.44517517089844, 129.02001953125, 135.59486389160156, 142.16970825195312, 148.74453735351562, 155.31939697265625, 161.8942413330078, 168.46908569335938, 175.04393005371094, 181.6187744140625, 188.19361877441406, 194.76846313476562, 201.34329223632812, 207.9181365966797, 214.49298095703125, 221.0678253173828, 227.64266967773438, 234.21751403808594, 240.7923583984375, 247.3671875, 253.94204711914062, 260.5168762207031, 267.0917053222656, 273.66656494140625, 280.24139404296875, 286.8162536621094, 293.3910827636719, 299.9659423828125, 306.540771484375, 313.1156311035156]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 9.0, 11.0, 5.0, 10.0, 11.0, 16.0, 15.0, 16.0, 22.0, 21.0, 21.0, 36.0, 26.0, 51.0, 27.0, 34.0, 35.0, 30.0, 35.0, 41.0, 40.0, 40.0, 45.0, 40.0, 52.0, 36.0, 34.0, 29.0, 24.0, 27.0, 27.0, 14.0, 22.0, 14.0, 26.0, 12.0, 11.0, 10.0, 5.0, 9.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-36.977989196777344, -35.93315505981445, -34.88832092285156, -33.843482971191406, -32.798648834228516, -31.753814697265625, -30.708980560302734, -29.664146423339844, -28.61931037902832, -27.57447624206543, -26.529640197753906, -25.484806060791016, -24.439971923828125, -23.3951358795166, -22.35030174255371, -21.305465698242188, -20.260631561279297, -19.215797424316406, -18.170961380004883, -17.126127243041992, -16.08129119873047, -15.036457061767578, -13.991622924804688, -12.94678783416748, -11.901952743530273, -10.857117652893066, -9.81228256225586, -8.767448425292969, -7.722613334655762, -6.677778244018555, -5.632943630218506, -4.588109016418457, -3.543275833129883, -2.498440980911255, -1.453606128692627, -0.408771276473999, 0.6360635757446289, 1.680898666381836, 2.7257332801818848, 3.7705678939819336, 4.815402984619141, 5.860238075256348, 6.9050726890563965, 7.949907302856445, 8.994742393493652, 10.03957748413086, 11.08441162109375, 12.129246711730957, 13.174081802368164, 14.218916893005371, 15.263751983642578, 16.30858612060547, 17.35342025756836, 18.398256301879883, 19.443090438842773, 20.487926483154297, 21.532760620117188, 22.577594757080078, 23.6224308013916, 24.667264938354492, 25.712100982666016, 26.756935119628906, 27.801769256591797, 28.846603393554688, 29.89143943786621]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 8.0, 5.0, 12.0, 12.0, 30.0, 26.0, 29.0, 35.0, 32.0, 38.0, 37.0, 41.0, 55.0, 62.0, 61.0, 40.0, 45.0, 53.0, 70.0, 47.0, 38.0, 35.0, 29.0, 28.0, 23.0, 28.0, 24.0, 11.0, 13.0, 6.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.671875, -9.4132080078125, -9.154541015625, -8.8958740234375, -8.63720703125, -8.3785400390625, -8.119873046875, -7.8612060546875, -7.6025390625, -7.3438720703125, -7.085205078125, -6.8265380859375, -6.56787109375, -6.3092041015625, -6.050537109375, -5.7918701171875, -5.533203125, -5.2745361328125, -5.015869140625, -4.7572021484375, -4.49853515625, -4.2398681640625, -3.981201171875, -3.7225341796875, -3.4638671875, -3.2052001953125, -2.946533203125, -2.6878662109375, -2.42919921875, -2.1705322265625, -1.911865234375, -1.6531982421875, -1.39453125, -1.1358642578125, -0.877197265625, -0.6185302734375, -0.35986328125, -0.1011962890625, 0.157470703125, 0.4161376953125, 0.6748046875, 0.9334716796875, 1.192138671875, 1.4508056640625, 1.70947265625, 1.9681396484375, 2.226806640625, 2.4854736328125, 2.744140625, 3.0028076171875, 3.261474609375, 3.5201416015625, 3.77880859375, 4.0374755859375, 4.296142578125, 4.5548095703125, 4.8134765625, 5.0721435546875, 5.330810546875, 5.5894775390625, 5.84814453125, 6.1068115234375, 6.365478515625, 6.6241455078125, 6.8828125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 8.0, 13.0, 12.0, 16.0, 32.0, 41.0, 71.0, 107.0, 167.0, 297.0, 466.0, 766.0, 1244.0, 2195.0, 3899.0, 7108.0, 12478.0, 23348.0, 44054.0, 90613.0, 220050.0, 351102.0, 149046.0, 66795.0, 33864.0, 17873.0, 9837.0, 5339.0, 3144.0, 1867.0, 1050.0, 621.0, 395.0, 228.0, 149.0, 76.0, 53.0, 44.0, 25.0, 19.0, 10.0, 8.0, 6.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3857421875, -0.3737983703613281, -0.36185455322265625, -0.3499107360839844, -0.3379669189453125, -0.3260231018066406, -0.31407928466796875, -0.3021354675292969, -0.290191650390625, -0.2782478332519531, -0.26630401611328125, -0.2543601989746094, -0.2424163818359375, -0.23047256469726562, -0.21852874755859375, -0.20658493041992188, -0.19464111328125, -0.18269729614257812, -0.17075347900390625, -0.15880966186523438, -0.1468658447265625, -0.13492202758789062, -0.12297821044921875, -0.11103439331054688, -0.099090576171875, -0.08714675903320312, -0.07520294189453125, -0.06325912475585938, -0.0513153076171875, -0.039371490478515625, -0.02742767333984375, -0.015483856201171875, -0.0035400390625, 0.008403778076171875, 0.02034759521484375, 0.032291412353515625, 0.0442352294921875, 0.056179046630859375, 0.06812286376953125, 0.08006668090820312, 0.092010498046875, 0.10395431518554688, 0.11589813232421875, 0.12784194946289062, 0.1397857666015625, 0.15172958374023438, 0.16367340087890625, 0.17561721801757812, 0.18756103515625, 0.19950485229492188, 0.21144866943359375, 0.22339248657226562, 0.2353363037109375, 0.24728012084960938, 0.25922393798828125, 0.2711677551269531, 0.283111572265625, 0.2950553894042969, 0.30699920654296875, 0.3189430236816406, 0.3308868408203125, 0.3428306579589844, 0.35477447509765625, 0.3667182922363281, 0.378662109375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 9.0, 15.0, 13.0, 18.0, 19.0, 30.0, 26.0, 35.0, 25.0, 28.0, 39.0, 44.0, 40.0, 43.0, 43.0, 41.0, 1077.0, 44.0, 48.0, 43.0, 29.0, 39.0, 48.0, 36.0, 30.0, 32.0, 23.0, 16.0, 13.0, 16.0, 13.0, 9.0, 4.0, 6.0, 7.0, 8.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.813079833984375, -3.66717529296875, -3.521270751953125, -3.3753662109375, -3.229461669921875, -3.08355712890625, -2.937652587890625, -2.791748046875, -2.645843505859375, -2.49993896484375, -2.354034423828125, -2.2081298828125, -2.062225341796875, -1.91632080078125, -1.770416259765625, -1.62451171875, -1.478607177734375, -1.33270263671875, -1.186798095703125, -1.0408935546875, -0.894989013671875, -0.74908447265625, -0.603179931640625, -0.457275390625, -0.311370849609375, -0.16546630859375, -0.019561767578125, 0.1263427734375, 0.272247314453125, 0.41815185546875, 0.564056396484375, 0.7099609375, 0.855865478515625, 1.00177001953125, 1.147674560546875, 1.2935791015625, 1.439483642578125, 1.58538818359375, 1.731292724609375, 1.877197265625, 2.023101806640625, 2.16900634765625, 2.314910888671875, 2.4608154296875, 2.606719970703125, 2.75262451171875, 2.898529052734375, 3.04443359375, 3.190338134765625, 3.33624267578125, 3.482147216796875, 3.6280517578125, 3.773956298828125, 3.91986083984375, 4.065765380859375, 4.211669921875, 4.357574462890625, 4.50347900390625, 4.649383544921875, 4.7952880859375, 4.941192626953125, 5.08709716796875, 5.233001708984375, 5.37890625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 11.0, 16.0, 18.0, 41.0, 62.0, 104.0, 151.0, 252.0, 342.0, 540.0, 870.0, 1298.0, 1950.0, 3113.0, 4732.0, 7664.0, 12241.0, 20008.0, 34014.0, 58725.0, 107812.0, 209151.0, 1314363.0, 138802.0, 74045.0, 42241.0, 24648.0, 14790.0, 9021.0, 5775.0, 3664.0, 2367.0, 1438.0, 991.0, 620.0, 447.0, 270.0, 208.0, 107.0, 61.0, 48.0, 28.0, 29.0, 19.0, 10.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.2293701171875, -0.2222461700439453, -0.21512222290039062, -0.20799827575683594, -0.20087432861328125, -0.19375038146972656, -0.18662643432617188, -0.1795024871826172, -0.1723785400390625, -0.1652545928955078, -0.15813064575195312, -0.15100669860839844, -0.14388275146484375, -0.13675880432128906, -0.12963485717773438, -0.12251091003417969, -0.115386962890625, -0.10826301574707031, -0.10113906860351562, -0.09401512145996094, -0.08689117431640625, -0.07976722717285156, -0.07264328002929688, -0.06551933288574219, -0.0583953857421875, -0.05127143859863281, -0.044147491455078125, -0.03702354431152344, -0.02989959716796875, -0.022775650024414062, -0.015651702880859375, -0.008527755737304688, -0.00140380859375, 0.0057201385498046875, 0.012844085693359375, 0.019968032836914062, 0.02709197998046875, 0.03421592712402344, 0.041339874267578125, 0.04846382141113281, 0.0555877685546875, 0.06271171569824219, 0.06983566284179688, 0.07695960998535156, 0.08408355712890625, 0.09120750427246094, 0.09833145141601562, 0.10545539855957031, 0.112579345703125, 0.11970329284667969, 0.12682723999023438, 0.13395118713378906, 0.14107513427734375, 0.14819908142089844, 0.15532302856445312, 0.1624469757080078, 0.1695709228515625, 0.1766948699951172, 0.18381881713867188, 0.19094276428222656, 0.19806671142578125, 0.20519065856933594, 0.21231460571289062, 0.2194385528564453, 0.2265625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 9.0, 10.0, 13.0, 8.0, 8.0, 18.0, 26.0, 33.0, 34.0, 44.0, 47.0, 65.0, 56.0, 59.0, 82.0, 75.0, 61.0, 58.0, 53.0, 50.0, 33.0, 34.0, 21.0, 15.0, 22.0, 7.0, 10.0, 11.0, 6.0, 4.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003516674041748047, -0.00034119561314582825, -0.0003307238221168518, -0.00032025203108787537, -0.0003097802400588989, -0.0002993084490299225, -0.00028883665800094604, -0.0002783648669719696, -0.00026789307594299316, -0.0002574212849140167, -0.0002469494938850403, -0.00023647770285606384, -0.0002260059118270874, -0.00021553412079811096, -0.00020506232976913452, -0.00019459053874015808, -0.00018411874771118164, -0.0001736469566822052, -0.00016317516565322876, -0.00015270337462425232, -0.00014223158359527588, -0.00013175979256629944, -0.000121288001537323, -0.00011081621050834656, -0.00010034441947937012, -8.987262845039368e-05, -7.940083742141724e-05, -6.89290463924408e-05, -5.8457255363464355e-05, -4.7985464334487915e-05, -3.7513673305511475e-05, -2.7041882276535034e-05, -1.6570091247558594e-05, -6.098300218582153e-06, 4.373490810394287e-06, 1.4845281839370728e-05, 2.5317072868347168e-05, 3.578886389732361e-05, 4.626065492630005e-05, 5.673244595527649e-05, 6.720423698425293e-05, 7.767602801322937e-05, 8.814781904220581e-05, 9.861961007118225e-05, 0.00010909140110015869, 0.00011956319212913513, 0.00013003498315811157, 0.000140506774187088, 0.00015097856521606445, 0.0001614503562450409, 0.00017192214727401733, 0.00018239393830299377, 0.00019286572933197021, 0.00020333752036094666, 0.0002138093113899231, 0.00022428110241889954, 0.00023475289344787598, 0.0002452246844768524, 0.00025569647550582886, 0.0002661682665348053, 0.00027664005756378174, 0.0002871118485927582, 0.0002975836396217346, 0.00030805543065071106, 0.0003185272216796875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 4.0, 5.0, 2.0, 5.0, 7.0, 8.0, 14.0, 15.0, 20.0, 24.0, 27.0, 46.0, 42.0, 74.0, 123.0, 169.0, 324.0, 867.0, 20678.0, 1019646.0, 5108.0, 570.0, 242.0, 159.0, 101.0, 65.0, 56.0, 43.0, 28.0, 15.0, 6.0, 11.0, 14.0, 10.0, 5.0, 8.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00695037841796875, -0.006721436977386475, -0.006492495536804199, -0.006263554096221924, -0.0060346126556396484, -0.005805671215057373, -0.005576729774475098, -0.005347788333892822, -0.005118846893310547, -0.0048899054527282715, -0.004660964012145996, -0.004432022571563721, -0.004203081130981445, -0.00397413969039917, -0.0037451982498168945, -0.003516256809234619, -0.0032873153686523438, -0.0030583739280700684, -0.002829432487487793, -0.0026004910469055176, -0.002371549606323242, -0.002142608165740967, -0.0019136667251586914, -0.001684725284576416, -0.0014557838439941406, -0.0012268424034118652, -0.0009979009628295898, -0.0007689595222473145, -0.0005400180816650391, -0.00031107664108276367, -8.213520050048828e-05, 0.0001468062400817871, 0.0003757476806640625, 0.0006046891212463379, 0.0008336305618286133, 0.0010625720024108887, 0.001291513442993164, 0.0015204548835754395, 0.0017493963241577148, 0.0019783377647399902, 0.0022072792053222656, 0.002436220645904541, 0.0026651620864868164, 0.002894103527069092, 0.003123044967651367, 0.0033519864082336426, 0.003580927848815918, 0.0038098692893981934, 0.004038810729980469, 0.004267752170562744, 0.0044966936111450195, 0.004725635051727295, 0.00495457649230957, 0.005183517932891846, 0.005412459373474121, 0.0056414008140563965, 0.005870342254638672, 0.006099283695220947, 0.006328225135803223, 0.006557166576385498, 0.0067861080169677734, 0.007015049457550049, 0.007243990898132324, 0.0074729323387146, 0.007701873779296875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 796.0, 220.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020801069331355393, -9.725535346660763e-05, 1.3499986380338669e-05, 0.0001242553407792002, 0.00023501066607423127, 0.00034576599136926234, 0.0004565213748719543, 0.0005672767292708158, 0.0006780320545658469, 0.000788787379860878, 0.0008995427051559091, 0.0010102980304509401, 0.001121053472161293, 0.0012318086810410023, 0.0013425641227513552, 0.0014533194480463862, 0.0015640747733414173, 0.0016748300986364484, 0.0017855854239314795, 0.0018963408656418324, 0.0020070960745215416, 0.0021178515162318945, 0.0022286069579422474, 0.0023393621668219566, 0.002450117375701666, 0.0025608728174120188, 0.002671628026291728, 0.002782383468002081, 0.00289313867688179, 0.003003894118592143, 0.003114649560302496, 0.003225404769182205, 0.0033361599780619144, 0.0034469154197722673, 0.0035576706286519766, 0.0036684260703623295, 0.0037791812792420387, 0.0038899367209523916, 0.0040006921626627445, 0.004111447371542454, 0.004222202580422163, 0.004332957789301872, 0.004443713463842869, 0.004554468672722578, 0.004665223881602287, 0.0047759790904819965, 0.004886734765022993, 0.004997489973902702, 0.005108245648443699, 0.005219000857323408, 0.005329756531864405, 0.005440511740744114, 0.005551266949623823, 0.005662022158503532, 0.005772777833044529, 0.005883533041924238, 0.0059942882508039474, 0.006105043459683657, 0.006215799134224653, 0.0063265543431043625, 0.006437309551984072, 0.006548064760863781, 0.0066588204354047775, 0.006769575644284487, 0.006880330853164196]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 3.0, 2.0, 7.0, 10.0, 14.0, 16.0, 17.0, 24.0, 29.0, 23.0, 44.0, 36.0, 38.0, 44.0, 56.0, 48.0, 49.0, 70.0, 60.0, 55.0, 53.0, 47.0, 33.0, 33.0, 39.0, 31.0, 26.0, 21.0, 22.0, 12.0, 19.0, 9.0, 6.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.00030040740966796875, -0.0002930592745542526, -0.0002857111394405365, -0.0002783630043268204, -0.00027101486921310425, -0.0002636667340993881, -0.000256318598985672, -0.00024897046387195587, -0.00024162232875823975, -0.00023427419364452362, -0.0002269260585308075, -0.00021957792341709137, -0.00021222978830337524, -0.00020488165318965912, -0.000197533518075943, -0.00019018538296222687, -0.00018283724784851074, -0.00017548911273479462, -0.0001681409776210785, -0.00016079284250736237, -0.00015344470739364624, -0.00014609657227993011, -0.000138748437166214, -0.00013140030205249786, -0.00012405216693878174, -0.00011670403182506561, -0.00010935589671134949, -0.00010200776159763336, -9.465962648391724e-05, -8.731149137020111e-05, -7.996335625648499e-05, -7.261522114276886e-05, -6.526708602905273e-05, -5.791895091533661e-05, -5.0570815801620483e-05, -4.322268068790436e-05, -3.587454557418823e-05, -2.8526410460472107e-05, -2.117827534675598e-05, -1.3830140233039856e-05, -6.4820051193237305e-06, 8.66129994392395e-07, 8.21426510810852e-06, 1.5562400221824646e-05, 2.291053533554077e-05, 3.0258670449256897e-05, 3.760680556297302e-05, 4.495494067668915e-05, 5.2303075790405273e-05, 5.96512109041214e-05, 6.699934601783752e-05, 7.434748113155365e-05, 8.169561624526978e-05, 8.90437513589859e-05, 9.639188647270203e-05, 0.00010374002158641815, 0.00011108815670013428, 0.0001184362918138504, 0.00012578442692756653, 0.00013313256204128265, 0.00014048069715499878, 0.0001478288322687149, 0.00015517696738243103, 0.00016252510249614716, 0.00016987323760986328]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 8.0, 5.0, 12.0, 12.0, 30.0, 26.0, 29.0, 35.0, 32.0, 38.0, 37.0, 41.0, 55.0, 62.0, 61.0, 40.0, 45.0, 53.0, 70.0, 47.0, 38.0, 35.0, 29.0, 28.0, 23.0, 28.0, 24.0, 11.0, 13.0, 6.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.671875, -9.4132080078125, -9.154541015625, -8.8958740234375, -8.63720703125, -8.3785400390625, -8.119873046875, -7.8612060546875, -7.6025390625, -7.3438720703125, -7.085205078125, -6.8265380859375, -6.56787109375, -6.3092041015625, -6.050537109375, -5.7918701171875, -5.533203125, -5.2745361328125, -5.015869140625, -4.7572021484375, -4.49853515625, -4.2398681640625, -3.981201171875, -3.7225341796875, -3.4638671875, -3.2052001953125, -2.946533203125, -2.6878662109375, -2.42919921875, -2.1705322265625, -1.911865234375, -1.6531982421875, -1.39453125, -1.1358642578125, -0.877197265625, -0.6185302734375, -0.35986328125, -0.1011962890625, 0.157470703125, 0.4161376953125, 0.6748046875, 0.9334716796875, 1.192138671875, 1.4508056640625, 1.70947265625, 1.9681396484375, 2.226806640625, 2.4854736328125, 2.744140625, 3.0028076171875, 3.261474609375, 3.5201416015625, 3.77880859375, 4.0374755859375, 4.296142578125, 4.5548095703125, 4.8134765625, 5.0721435546875, 5.330810546875, 5.5894775390625, 5.84814453125, 6.1068115234375, 6.365478515625, 6.6241455078125, 6.8828125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 10.0, 11.0, 22.0, 34.0, 51.0, 78.0, 107.0, 171.0, 311.0, 519.0, 956.0, 2042.0, 4615.0, 14015.0, 82677.0, 816673.0, 101197.0, 15533.0, 4961.0, 2095.0, 1099.0, 554.0, 336.0, 182.0, 96.0, 70.0, 54.0, 31.0, 14.0, 15.0, 7.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.921875, -18.3740234375, -17.826171875, -17.2783203125, -16.73046875, -16.1826171875, -15.634765625, -15.0869140625, -14.5390625, -13.9912109375, -13.443359375, -12.8955078125, -12.34765625, -11.7998046875, -11.251953125, -10.7041015625, -10.15625, -9.6083984375, -9.060546875, -8.5126953125, -7.96484375, -7.4169921875, -6.869140625, -6.3212890625, -5.7734375, -5.2255859375, -4.677734375, -4.1298828125, -3.58203125, -3.0341796875, -2.486328125, -1.9384765625, -1.390625, -0.8427734375, -0.294921875, 0.2529296875, 0.80078125, 1.3486328125, 1.896484375, 2.4443359375, 2.9921875, 3.5400390625, 4.087890625, 4.6357421875, 5.18359375, 5.7314453125, 6.279296875, 6.8271484375, 7.375, 7.9228515625, 8.470703125, 9.0185546875, 9.56640625, 10.1142578125, 10.662109375, 11.2099609375, 11.7578125, 12.3056640625, 12.853515625, 13.4013671875, 13.94921875, 14.4970703125, 15.044921875, 15.5927734375, 16.140625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 5.0, 3.0, 3.0, 4.0, 4.0, 12.0, 12.0, 10.0, 15.0, 25.0, 12.0, 21.0, 16.0, 31.0, 25.0, 29.0, 32.0, 41.0, 38.0, 51.0, 63.0, 121.0, 273.0, 1468.0, 201.0, 84.0, 72.0, 37.0, 38.0, 43.0, 33.0, 40.0, 26.0, 22.0, 23.0, 14.0, 17.0, 14.0, 13.0, 10.0, 8.0, 6.0, 8.0, 6.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-17.4375, -16.943603515625, -16.44970703125, -15.955810546875, -15.4619140625, -14.968017578125, -14.47412109375, -13.980224609375, -13.486328125, -12.992431640625, -12.49853515625, -12.004638671875, -11.5107421875, -11.016845703125, -10.52294921875, -10.029052734375, -9.53515625, -9.041259765625, -8.54736328125, -8.053466796875, -7.5595703125, -7.065673828125, -6.57177734375, -6.077880859375, -5.583984375, -5.090087890625, -4.59619140625, -4.102294921875, -3.6083984375, -3.114501953125, -2.62060546875, -2.126708984375, -1.6328125, -1.138916015625, -0.64501953125, -0.151123046875, 0.3427734375, 0.836669921875, 1.33056640625, 1.824462890625, 2.318359375, 2.812255859375, 3.30615234375, 3.800048828125, 4.2939453125, 4.787841796875, 5.28173828125, 5.775634765625, 6.26953125, 6.763427734375, 7.25732421875, 7.751220703125, 8.2451171875, 8.739013671875, 9.23291015625, 9.726806640625, 10.220703125, 10.714599609375, 11.20849609375, 11.702392578125, 12.1962890625, 12.690185546875, 13.18408203125, 13.677978515625, 14.171875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 9.0, 11.0, 15.0, 16.0, 25.0, 29.0, 34.0, 41.0, 65.0, 107.0, 133.0, 294.0, 896.0, 10446.0, 3063431.0, 67284.0, 1860.0, 432.0, 186.0, 113.0, 73.0, 49.0, 40.0, 36.0, 25.0, 23.0, 9.0, 7.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.1875, -50.4306640625, -48.673828125, -46.9169921875, -45.16015625, -43.4033203125, -41.646484375, -39.8896484375, -38.1328125, -36.3759765625, -34.619140625, -32.8623046875, -31.10546875, -29.3486328125, -27.591796875, -25.8349609375, -24.078125, -22.3212890625, -20.564453125, -18.8076171875, -17.05078125, -15.2939453125, -13.537109375, -11.7802734375, -10.0234375, -8.2666015625, -6.509765625, -4.7529296875, -2.99609375, -1.2392578125, 0.517578125, 2.2744140625, 4.03125, 5.7880859375, 7.544921875, 9.3017578125, 11.05859375, 12.8154296875, 14.572265625, 16.3291015625, 18.0859375, 19.8427734375, 21.599609375, 23.3564453125, 25.11328125, 26.8701171875, 28.626953125, 30.3837890625, 32.140625, 33.8974609375, 35.654296875, 37.4111328125, 39.16796875, 40.9248046875, 42.681640625, 44.4384765625, 46.1953125, 47.9521484375, 49.708984375, 51.4658203125, 53.22265625, 54.9794921875, 56.736328125, 58.4931640625, 60.25]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 165.0, 641.0, 191.0, 12.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.22120666503906, -87.34039306640625, -83.45957946777344, -79.5787582397461, -75.69794464111328, -71.81713104248047, -67.93631744384766, -64.05549621582031, -60.1746826171875, -56.29386901855469, -52.41305160522461, -48.5322380065918, -44.65142059326172, -40.770606994628906, -36.889793395996094, -33.008975982666016, -29.128162384033203, -25.247346878051758, -21.366531372070312, -17.4857177734375, -13.604901313781738, -9.72408676147461, -5.843271255493164, -1.9624557495117188, 1.9183597564697266, 5.799175262451172, 9.679990768432617, 13.560805320739746, 17.441619873046875, 21.32243537902832, 25.203250885009766, 29.08406639099121, 32.964881896972656, 36.84569549560547, 40.72651290893555, 44.60732650756836, 48.48814392089844, 52.36895751953125, 56.24977111816406, 60.13058853149414, 64.01140594482422, 67.89221954345703, 71.77303314208984, 75.65385437011719, 79.53466796875, 83.41548156738281, 87.29629516601562, 91.17710876464844, 95.05792236328125, 98.93873596191406, 102.81954956054688, 106.70037078857422, 110.58118438720703, 114.46199798583984, 118.34281158447266, 122.2236328125, 126.10444641113281, 129.98526000976562, 133.86607360839844, 137.74688720703125, 141.62770080566406, 145.50851440429688, 149.38934326171875, 153.27015686035156, 157.15097045898438]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 7.0, 9.0, 4.0, 8.0, 8.0, 8.0, 16.0, 15.0, 11.0, 14.0, 22.0, 24.0, 22.0, 27.0, 31.0, 36.0, 33.0, 40.0, 34.0, 32.0, 45.0, 39.0, 41.0, 53.0, 43.0, 42.0, 43.0, 30.0, 40.0, 36.0, 26.0, 26.0, 26.0, 20.0, 20.0, 19.0, 9.0, 6.0, 7.0, 8.0, 6.0, 6.0, 6.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.70075607299805, -41.321895599365234, -39.94303512573242, -38.564178466796875, -37.18531799316406, -35.80645751953125, -34.42759704589844, -33.048736572265625, -31.669878005981445, -30.291017532348633, -28.912158966064453, -27.53329849243164, -26.154438018798828, -24.77557945251465, -23.396718978881836, -22.017860412597656, -20.638999938964844, -19.26013946533203, -17.88128089904785, -16.50242042541504, -15.123560905456543, -13.744701385498047, -12.365840911865234, -10.986981391906738, -9.608121871948242, -8.229262351989746, -6.850402355194092, -5.4715423583984375, -4.092682838439941, -2.7138233184814453, -1.3349628448486328, 0.04389667510986328, 1.422760009765625, 2.8016197681427, 4.180479526519775, 5.55933952331543, 6.938199043273926, 8.317058563232422, 9.695919036865234, 11.07477855682373, 12.453638076782227, 13.832497596740723, 15.211357116699219, 16.59021759033203, 17.969078063964844, 19.347936630249023, 20.726797103881836, 22.105655670166016, 23.484516143798828, 24.86337661743164, 26.24223518371582, 27.621095657348633, 28.999954223632812, 30.378814697265625, 31.757675170898438, 33.13653564453125, 34.51539611816406, 35.894256591796875, 37.27311706542969, 38.6519775390625, 40.03083419799805, 41.40969467163086, 42.78855514526367, 44.167415618896484, 45.54627227783203]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 0.0, 6.0, 14.0, 5.0, 12.0, 11.0, 31.0, 23.0, 23.0, 27.0, 35.0, 36.0, 46.0, 44.0, 47.0, 52.0, 39.0, 53.0, 62.0, 52.0, 41.0, 42.0, 45.0, 41.0, 39.0, 26.0, 34.0, 25.0, 23.0, 10.0, 12.0, 10.0, 9.0, 13.0, 4.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-9.9296875, -9.6739501953125, -9.418212890625, -9.1624755859375, -8.90673828125, -8.6510009765625, -8.395263671875, -8.1395263671875, -7.8837890625, -7.6280517578125, -7.372314453125, -7.1165771484375, -6.86083984375, -6.6051025390625, -6.349365234375, -6.0936279296875, -5.837890625, -5.5821533203125, -5.326416015625, -5.0706787109375, -4.81494140625, -4.5592041015625, -4.303466796875, -4.0477294921875, -3.7919921875, -3.5362548828125, -3.280517578125, -3.0247802734375, -2.76904296875, -2.5133056640625, -2.257568359375, -2.0018310546875, -1.74609375, -1.4903564453125, -1.234619140625, -0.9788818359375, -0.72314453125, -0.4674072265625, -0.211669921875, 0.0440673828125, 0.2998046875, 0.5555419921875, 0.811279296875, 1.0670166015625, 1.32275390625, 1.5784912109375, 1.834228515625, 2.0899658203125, 2.345703125, 2.6014404296875, 2.857177734375, 3.1129150390625, 3.36865234375, 3.6243896484375, 3.880126953125, 4.1358642578125, 4.3916015625, 4.6473388671875, 4.903076171875, 5.1588134765625, 5.41455078125, 5.6702880859375, 5.926025390625, 6.1817626953125, 6.4375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 8.0, 9.0, 15.0, 15.0, 28.0, 32.0, 55.0, 65.0, 89.0, 162.0, 265.0, 567.0, 1202.0, 3521.0, 15535.0, 231300.0, 2960020.0, 930848.0, 40300.0, 6629.0, 1903.0, 758.0, 373.0, 221.0, 110.0, 75.0, 42.0, 37.0, 25.0, 13.0, 12.0, 13.0, 9.0, 9.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.984375, -20.427978515625, -19.87158203125, -19.315185546875, -18.7587890625, -18.202392578125, -17.64599609375, -17.089599609375, -16.533203125, -15.976806640625, -15.42041015625, -14.864013671875, -14.3076171875, -13.751220703125, -13.19482421875, -12.638427734375, -12.08203125, -11.525634765625, -10.96923828125, -10.412841796875, -9.8564453125, -9.300048828125, -8.74365234375, -8.187255859375, -7.630859375, -7.074462890625, -6.51806640625, -5.961669921875, -5.4052734375, -4.848876953125, -4.29248046875, -3.736083984375, -3.1796875, -2.623291015625, -2.06689453125, -1.510498046875, -0.9541015625, -0.397705078125, 0.15869140625, 0.715087890625, 1.271484375, 1.827880859375, 2.38427734375, 2.940673828125, 3.4970703125, 4.053466796875, 4.60986328125, 5.166259765625, 5.72265625, 6.279052734375, 6.83544921875, 7.391845703125, 7.9482421875, 8.504638671875, 9.06103515625, 9.617431640625, 10.173828125, 10.730224609375, 11.28662109375, 11.843017578125, 12.3994140625, 12.955810546875, 13.51220703125, 14.068603515625, 14.625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 7.0, 5.0, 2.0, 3.0, 9.0, 18.0, 16.0, 20.0, 26.0, 36.0, 53.0, 67.0, 93.0, 136.0, 198.0, 323.0, 477.0, 553.0, 553.0, 444.0, 330.0, 213.0, 157.0, 97.0, 53.0, 46.0, 36.0, 25.0, 11.0, 13.0, 11.0, 9.0, 12.0, 3.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.015625, -10.69189453125, -10.3681640625, -10.04443359375, -9.720703125, -9.39697265625, -9.0732421875, -8.74951171875, -8.42578125, -8.10205078125, -7.7783203125, -7.45458984375, -7.130859375, -6.80712890625, -6.4833984375, -6.15966796875, -5.8359375, -5.51220703125, -5.1884765625, -4.86474609375, -4.541015625, -4.21728515625, -3.8935546875, -3.56982421875, -3.24609375, -2.92236328125, -2.5986328125, -2.27490234375, -1.951171875, -1.62744140625, -1.3037109375, -0.97998046875, -0.65625, -0.33251953125, -0.0087890625, 0.31494140625, 0.638671875, 0.96240234375, 1.2861328125, 1.60986328125, 1.93359375, 2.25732421875, 2.5810546875, 2.90478515625, 3.228515625, 3.55224609375, 3.8759765625, 4.19970703125, 4.5234375, 4.84716796875, 5.1708984375, 5.49462890625, 5.818359375, 6.14208984375, 6.4658203125, 6.78955078125, 7.11328125, 7.43701171875, 7.7607421875, 8.08447265625, 8.408203125, 8.73193359375, 9.0556640625, 9.37939453125, 9.703125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 3.0, 3.0, 15.0, 18.0, 15.0, 23.0, 26.0, 52.0, 68.0, 91.0, 158.0, 218.0, 415.0, 880.0, 2593.0, 12131.0, 131558.0, 3616194.0, 401799.0, 21501.0, 3915.0, 1201.0, 514.0, 287.0, 163.0, 126.0, 80.0, 54.0, 56.0, 27.0, 27.0, 22.0, 9.0, 6.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.125, -24.277587890625, -23.43017578125, -22.582763671875, -21.7353515625, -20.887939453125, -20.04052734375, -19.193115234375, -18.345703125, -17.498291015625, -16.65087890625, -15.803466796875, -14.9560546875, -14.108642578125, -13.26123046875, -12.413818359375, -11.56640625, -10.718994140625, -9.87158203125, -9.024169921875, -8.1767578125, -7.329345703125, -6.48193359375, -5.634521484375, -4.787109375, -3.939697265625, -3.09228515625, -2.244873046875, -1.3974609375, -0.550048828125, 0.29736328125, 1.144775390625, 1.9921875, 2.839599609375, 3.68701171875, 4.534423828125, 5.3818359375, 6.229248046875, 7.07666015625, 7.924072265625, 8.771484375, 9.618896484375, 10.46630859375, 11.313720703125, 12.1611328125, 13.008544921875, 13.85595703125, 14.703369140625, 15.55078125, 16.398193359375, 17.24560546875, 18.093017578125, 18.9404296875, 19.787841796875, 20.63525390625, 21.482666015625, 22.330078125, 23.177490234375, 24.02490234375, 24.872314453125, 25.7197265625, 26.567138671875, 27.41455078125, 28.261962890625, 29.109375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 17.0, 76.0, 197.0, 322.0, 247.0, 102.0, 33.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.93488121032715, -28.945446014404297, -25.956010818481445, -22.966575622558594, -19.97713851928711, -16.98770523071289, -13.998268127441406, -11.008832931518555, -8.019397735595703, -5.029962539672852, -2.040526866912842, 0.948908805847168, 3.9383440017700195, 6.927779197692871, 9.917215347290039, 12.90665054321289, 15.896085739135742, 18.885520935058594, 21.874956130981445, 24.864391326904297, 27.85382843017578, 30.84326171875, 33.832698822021484, 36.82213592529297, 39.81156921386719, 42.80100631713867, 45.79043960571289, 48.779876708984375, 51.769309997558594, 54.75874710083008, 57.74818420410156, 60.73761749267578, 63.72705841064453, 66.71649169921875, 69.7059326171875, 72.69536590576172, 75.68479919433594, 78.67423248291016, 81.6636734008789, 84.65310668945312, 87.64253997802734, 90.63197326660156, 93.62141418457031, 96.61084747314453, 99.60028076171875, 102.58971405029297, 105.57915496826172, 108.56858825683594, 111.55802917480469, 114.5474624633789, 117.53690338134766, 120.52633666992188, 123.5157699584961, 126.50520324707031, 129.49464416503906, 132.48406982421875, 135.4735107421875, 138.46295166015625, 141.45237731933594, 144.4418182373047, 147.43125915527344, 150.42068481445312, 153.41012573242188, 156.39956665039062, 159.3889923095703]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 6.0, 10.0, 8.0, 17.0, 15.0, 15.0, 26.0, 26.0, 24.0, 24.0, 23.0, 30.0, 29.0, 31.0, 37.0, 38.0, 40.0, 34.0, 41.0, 29.0, 41.0, 33.0, 44.0, 36.0, 29.0, 42.0, 21.0, 41.0, 27.0, 30.0, 20.0, 22.0, 12.0, 17.0, 10.0, 8.0, 9.0, 11.0, 8.0, 4.0, 7.0, 4.0, 1.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.238014221191406, -24.36113739013672, -23.48426055908203, -22.60738182067871, -21.730504989624023, -20.853628158569336, -19.976749420166016, -19.099872589111328, -18.22299575805664, -17.346118927001953, -16.469242095947266, -15.592363357543945, -14.715486526489258, -13.83860969543457, -12.961731910705566, -12.084854125976562, -11.207977294921875, -10.331100463867188, -9.454222679138184, -8.57734489440918, -7.700468063354492, -6.8235907554626465, -5.946713447570801, -5.069836139678955, -4.192958831787109, -3.3160815238952637, -2.439204216003418, -1.5623269081115723, -0.6854496002197266, 0.19142770767211914, 1.0683050155639648, 1.9451823234558105, 2.8220577239990234, 3.698935031890869, 4.575812339782715, 5.4526896476745605, 6.329566955566406, 7.206444263458252, 8.083321571350098, 8.960199356079102, 9.837076187133789, 10.713953018188477, 11.59083080291748, 12.467708587646484, 13.344585418701172, 14.22146224975586, 15.098340034484863, 15.975217819213867, 16.852094650268555, 17.728971481323242, 18.605850219726562, 19.48272705078125, 20.359603881835938, 21.236480712890625, 22.113357543945312, 22.990236282348633, 23.86711311340332, 24.743989944458008, 25.620868682861328, 26.497745513916016, 27.374622344970703, 28.25149917602539, 29.128376007080078, 30.0052547454834, 30.882131576538086]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 5.0, 7.0, 5.0, 8.0, 10.0, 17.0, 20.0, 14.0, 19.0, 17.0, 30.0, 26.0, 22.0, 26.0, 29.0, 42.0, 30.0, 46.0, 40.0, 52.0, 35.0, 38.0, 29.0, 34.0, 34.0, 38.0, 31.0, 40.0, 28.0, 24.0, 31.0, 21.0, 19.0, 19.0, 14.0, 14.0, 10.0, 12.0, 9.0, 12.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.84375, -5.65521240234375, -5.4666748046875, -5.27813720703125, -5.089599609375, -4.90106201171875, -4.7125244140625, -4.52398681640625, -4.33544921875, -4.14691162109375, -3.9583740234375, -3.76983642578125, -3.581298828125, -3.39276123046875, -3.2042236328125, -3.01568603515625, -2.8271484375, -2.63861083984375, -2.4500732421875, -2.26153564453125, -2.072998046875, -1.88446044921875, -1.6959228515625, -1.50738525390625, -1.31884765625, -1.13031005859375, -0.9417724609375, -0.75323486328125, -0.564697265625, -0.37615966796875, -0.1876220703125, 0.00091552734375, 0.189453125, 0.37799072265625, 0.5665283203125, 0.75506591796875, 0.943603515625, 1.13214111328125, 1.3206787109375, 1.50921630859375, 1.69775390625, 1.88629150390625, 2.0748291015625, 2.26336669921875, 2.451904296875, 2.64044189453125, 2.8289794921875, 3.01751708984375, 3.2060546875, 3.39459228515625, 3.5831298828125, 3.77166748046875, 3.960205078125, 4.14874267578125, 4.3372802734375, 4.52581787109375, 4.71435546875, 4.90289306640625, 5.0914306640625, 5.27996826171875, 5.468505859375, 5.65704345703125, 5.8455810546875, 6.03411865234375, 6.22265625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 9.0, 15.0, 14.0, 30.0, 42.0, 75.0, 135.0, 177.0, 248.0, 407.0, 579.0, 1011.0, 1480.0, 2231.0, 3385.0, 5242.0, 8063.0, 13327.0, 22180.0, 37596.0, 69155.0, 143328.0, 303455.0, 214169.0, 97224.0, 50420.0, 28531.0, 16940.0, 10431.0, 6532.0, 4226.0, 2714.0, 1849.0, 1170.0, 734.0, 493.0, 310.0, 224.0, 146.0, 90.0, 57.0, 36.0, 19.0, 19.0, 7.0, 7.0, 6.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.302978515625, -0.2924385070800781, -0.28189849853515625, -0.2713584899902344, -0.2608184814453125, -0.2502784729003906, -0.23973846435546875, -0.22919845581054688, -0.218658447265625, -0.20811843872070312, -0.19757843017578125, -0.18703842163085938, -0.1764984130859375, -0.16595840454101562, -0.15541839599609375, -0.14487838745117188, -0.13433837890625, -0.12379837036132812, -0.11325836181640625, -0.10271835327148438, -0.0921783447265625, -0.08163833618164062, -0.07109832763671875, -0.060558319091796875, -0.050018310546875, -0.039478302001953125, -0.02893829345703125, -0.018398284912109375, -0.0078582763671875, 0.002681732177734375, 0.01322174072265625, 0.023761749267578125, 0.0343017578125, 0.044841766357421875, 0.05538177490234375, 0.06592178344726562, 0.0764617919921875, 0.08700180053710938, 0.09754180908203125, 0.10808181762695312, 0.118621826171875, 0.12916183471679688, 0.13970184326171875, 0.15024185180664062, 0.1607818603515625, 0.17132186889648438, 0.18186187744140625, 0.19240188598632812, 0.20294189453125, 0.21348190307617188, 0.22402191162109375, 0.23456192016601562, 0.2451019287109375, 0.2556419372558594, 0.26618194580078125, 0.2767219543457031, 0.287261962890625, 0.2978019714355469, 0.30834197998046875, 0.3188819885253906, 0.3294219970703125, 0.3399620056152344, 0.35050201416015625, 0.3610420227050781, 0.37158203125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 7.0, 3.0, 9.0, 8.0, 12.0, 8.0, 15.0, 22.0, 18.0, 18.0, 24.0, 22.0, 22.0, 37.0, 38.0, 38.0, 43.0, 30.0, 56.0, 47.0, 1060.0, 52.0, 42.0, 35.0, 37.0, 39.0, 38.0, 28.0, 37.0, 31.0, 25.0, 16.0, 22.0, 18.0, 17.0, 7.0, 10.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.51953125, -4.3863525390625, -4.253173828125, -4.1199951171875, -3.98681640625, -3.8536376953125, -3.720458984375, -3.5872802734375, -3.4541015625, -3.3209228515625, -3.187744140625, -3.0545654296875, -2.92138671875, -2.7882080078125, -2.655029296875, -2.5218505859375, -2.388671875, -2.2554931640625, -2.122314453125, -1.9891357421875, -1.85595703125, -1.7227783203125, -1.589599609375, -1.4564208984375, -1.3232421875, -1.1900634765625, -1.056884765625, -0.9237060546875, -0.79052734375, -0.6573486328125, -0.524169921875, -0.3909912109375, -0.2578125, -0.1246337890625, 0.008544921875, 0.1417236328125, 0.27490234375, 0.4080810546875, 0.541259765625, 0.6744384765625, 0.8076171875, 0.9407958984375, 1.073974609375, 1.2071533203125, 1.34033203125, 1.4735107421875, 1.606689453125, 1.7398681640625, 1.873046875, 2.0062255859375, 2.139404296875, 2.2725830078125, 2.40576171875, 2.5389404296875, 2.672119140625, 2.8052978515625, 2.9384765625, 3.0716552734375, 3.204833984375, 3.3380126953125, 3.47119140625, 3.6043701171875, 3.737548828125, 3.8707275390625, 4.00390625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 4.0, 6.0, 22.0, 25.0, 29.0, 32.0, 40.0, 80.0, 104.0, 155.0, 176.0, 271.0, 349.0, 444.0, 639.0, 899.0, 1279.0, 1740.0, 2401.0, 3596.0, 5064.0, 7300.0, 10776.0, 16064.0, 25047.0, 39144.0, 62357.0, 102925.0, 181339.0, 1275706.0, 136549.0, 79553.0, 49312.0, 30865.0, 20138.0, 13349.0, 8818.0, 6169.0, 4164.0, 2912.0, 2052.0, 1455.0, 983.0, 773.0, 586.0, 418.0, 302.0, 207.0, 128.0, 99.0, 87.0, 59.0, 35.0, 35.0, 27.0, 17.0, 11.0, 10.0, 9.0, 3.0, 3.0], "bins": [-0.1895751953125, -0.18369674682617188, -0.17781829833984375, -0.17193984985351562, -0.1660614013671875, -0.16018295288085938, -0.15430450439453125, -0.14842605590820312, -0.142547607421875, -0.13666915893554688, -0.13079071044921875, -0.12491226196289062, -0.1190338134765625, -0.11315536499023438, -0.10727691650390625, -0.10139846801757812, -0.09552001953125, -0.08964157104492188, -0.08376312255859375, -0.07788467407226562, -0.0720062255859375, -0.06612777709960938, -0.06024932861328125, -0.054370880126953125, -0.048492431640625, -0.042613983154296875, -0.03673553466796875, -0.030857086181640625, -0.0249786376953125, -0.019100189208984375, -0.01322174072265625, -0.007343292236328125, -0.00146484375, 0.004413604736328125, 0.01029205322265625, 0.016170501708984375, 0.0220489501953125, 0.027927398681640625, 0.03380584716796875, 0.039684295654296875, 0.045562744140625, 0.051441192626953125, 0.05731964111328125, 0.06319808959960938, 0.0690765380859375, 0.07495498657226562, 0.08083343505859375, 0.08671188354492188, 0.09259033203125, 0.09846878051757812, 0.10434722900390625, 0.11022567749023438, 0.1161041259765625, 0.12198257446289062, 0.12786102294921875, 0.13373947143554688, 0.139617919921875, 0.14549636840820312, 0.15137481689453125, 0.15725326538085938, 0.1631317138671875, 0.16901016235351562, 0.17488861083984375, 0.18076705932617188, 0.1866455078125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 10.0, 6.0, 13.0, 20.0, 23.0, 23.0, 38.0, 40.0, 63.0, 60.0, 77.0, 110.0, 86.0, 86.0, 57.0, 50.0, 53.0, 46.0, 29.0, 24.0, 17.0, 19.0, 11.0, 7.0, 3.0, 7.0, 4.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016629695892333984, -0.00016037747263908386, -0.00015445798635482788, -0.0001485385000705719, -0.00014261901378631592, -0.00013669952750205994, -0.00013078004121780396, -0.00012486055493354797, -0.00011894106864929199, -0.00011302158236503601, -0.00010710209608078003, -0.00010118260979652405, -9.526312351226807e-05, -8.934363722801208e-05, -8.34241509437561e-05, -7.750466465950012e-05, -7.158517837524414e-05, -6.566569209098816e-05, -5.974620580673218e-05, -5.3826719522476196e-05, -4.7907233238220215e-05, -4.1987746953964233e-05, -3.606826066970825e-05, -3.014877438545227e-05, -2.422928810119629e-05, -1.8309801816940308e-05, -1.2390315532684326e-05, -6.470829248428345e-06, -5.513429641723633e-07, 5.368143320083618e-06, 1.12876296043396e-05, 1.720711588859558e-05, 2.3126602172851562e-05, 2.9046088457107544e-05, 3.4965574741363525e-05, 4.088506102561951e-05, 4.680454730987549e-05, 5.272403359413147e-05, 5.864351987838745e-05, 6.456300616264343e-05, 7.048249244689941e-05, 7.64019787311554e-05, 8.232146501541138e-05, 8.824095129966736e-05, 9.416043758392334e-05, 0.00010007992386817932, 0.0001059994101524353, 0.00011191889643669128, 0.00011783838272094727, 0.00012375786900520325, 0.00012967735528945923, 0.0001355968415737152, 0.0001415163278579712, 0.00014743581414222717, 0.00015335530042648315, 0.00015927478671073914, 0.00016519427299499512, 0.0001711137592792511, 0.00017703324556350708, 0.00018295273184776306, 0.00018887221813201904, 0.00019479170441627502, 0.000200711190700531, 0.000206630676984787, 0.00021255016326904297]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 7.0, 4.0, 9.0, 9.0, 20.0, 18.0, 21.0, 24.0, 30.0, 35.0, 57.0, 105.0, 172.0, 303.0, 527.0, 2102.0, 132420.0, 904750.0, 6270.0, 790.0, 323.0, 189.0, 110.0, 85.0, 49.0, 25.0, 30.0, 19.0, 7.0, 13.0, 7.0, 11.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.004146575927734375, -0.004031956195831299, -0.003917336463928223, -0.0038027167320251465, -0.0036880970001220703, -0.003573477268218994, -0.003458857536315918, -0.003344237804412842, -0.0032296180725097656, -0.0031149983406066895, -0.0030003786087036133, -0.002885758876800537, -0.002771139144897461, -0.0026565194129943848, -0.0025418996810913086, -0.0024272799491882324, -0.0023126602172851562, -0.00219804048538208, -0.002083420753479004, -0.0019688010215759277, -0.0018541812896728516, -0.0017395615577697754, -0.0016249418258666992, -0.001510322093963623, -0.0013957023620605469, -0.0012810826301574707, -0.0011664628982543945, -0.0010518431663513184, -0.0009372234344482422, -0.000822603702545166, -0.0007079839706420898, -0.0005933642387390137, -0.0004787445068359375, -0.00036412477493286133, -0.00024950504302978516, -0.00013488531112670898, -2.0265579223632812e-05, 9.435415267944336e-05, 0.00020897388458251953, 0.0003235936164855957, 0.0004382133483886719, 0.000552833080291748, 0.0006674528121948242, 0.0007820725440979004, 0.0008966922760009766, 0.0010113120079040527, 0.001125931739807129, 0.001240551471710205, 0.0013551712036132812, 0.0014697909355163574, 0.0015844106674194336, 0.0016990303993225098, 0.001813650131225586, 0.0019282698631286621, 0.0020428895950317383, 0.0021575093269348145, 0.0022721290588378906, 0.002386748790740967, 0.002501368522644043, 0.002615988254547119, 0.0027306079864501953, 0.0028452277183532715, 0.0029598474502563477, 0.003074467182159424, 0.0031890869140625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 9.0, 43.0, 124.0, 290.0, 307.0, 157.0, 59.0, 14.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003818266559392214, -0.0003699302324093878, -0.00035803383798338473, -0.0003461374144535512, -0.0003342409909237176, -0.0003223445964977145, -0.00031044817296788096, -0.0002985517494380474, -0.00028665532590821385, -0.0002747589023783803, -0.0002628625079523772, -0.00025096608442254364, -0.0002390696608927101, -0.00022717325191479176, -0.00021527684293687344, -0.00020338041940703988, -0.00019148402498103678, -0.00017958761600311846, -0.0001676911924732849, -0.00015579478349536657, -0.00014389835996553302, -0.0001320019509876147, -0.00012010554200969636, -0.00010820912575582042, -9.631270950194448e-05, -8.441629324806854e-05, -7.25198769941926e-05, -6.0623468016274273e-05, -4.872705176239833e-05, -3.683063550852239e-05, -2.4934226530604064e-05, -1.3037810276728123e-05, -1.1413649190217257e-06, 1.0755049515864812e-05, 2.265146395075135e-05, 3.454787656664848e-05, 4.6444292820524424e-05, 5.8340709074400365e-05, 7.023711805231869e-05, 8.213353430619463e-05, 9.402995056007057e-05, 0.00010592636681394652, 0.00011782278306782246, 0.00012971919204574078, 0.0001416156010236591, 0.00015351202455349267, 0.000165408433531411, 0.00017730484250932932, 0.00018920126603916287, 0.0002010976750170812, 0.00021299409854691476, 0.00022489050752483308, 0.00023678693105466664, 0.00024868332548066974, 0.0002605797490105033, 0.00027247617254033685, 0.0002843725960701704, 0.00029626901960000396, 0.00030816541402600706, 0.0003200618375558406, 0.00033195826108567417, 0.00034385465551167727, 0.0003557510790415108, 0.0003676475025713444, 0.0003795438969973475]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 8.0, 12.0, 8.0, 16.0, 16.0, 19.0, 15.0, 22.0, 26.0, 27.0, 26.0, 46.0, 34.0, 29.0, 30.0, 44.0, 38.0, 45.0, 50.0, 34.0, 54.0, 27.0, 40.0, 34.0, 21.0, 35.0, 34.0, 37.0, 21.0, 31.0, 18.0, 14.0, 11.0, 16.0, 13.0, 8.0, 8.0, 8.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.450580596923828e-05, -7.209181785583496e-05, -6.967782974243164e-05, -6.726384162902832e-05, -6.4849853515625e-05, -6.243586540222168e-05, -6.002187728881836e-05, -5.760788917541504e-05, -5.519390106201172e-05, -5.27799129486084e-05, -5.036592483520508e-05, -4.795193672180176e-05, -4.553794860839844e-05, -4.312396049499512e-05, -4.07099723815918e-05, -3.8295984268188477e-05, -3.5881996154785156e-05, -3.3468008041381836e-05, -3.1054019927978516e-05, -2.8640031814575195e-05, -2.6226043701171875e-05, -2.3812055587768555e-05, -2.1398067474365234e-05, -1.8984079360961914e-05, -1.6570091247558594e-05, -1.4156103134155273e-05, -1.1742115020751953e-05, -9.328126907348633e-06, -6.9141387939453125e-06, -4.500150680541992e-06, -2.086162567138672e-06, 3.2782554626464844e-07, 2.7418136596679688e-06, 5.155801773071289e-06, 7.569789886474609e-06, 9.98377799987793e-06, 1.239776611328125e-05, 1.481175422668457e-05, 1.722574234008789e-05, 1.963973045349121e-05, 2.205371856689453e-05, 2.446770668029785e-05, 2.6881694793701172e-05, 2.9295682907104492e-05, 3.170967102050781e-05, 3.412365913391113e-05, 3.653764724731445e-05, 3.8951635360717773e-05, 4.1365623474121094e-05, 4.3779611587524414e-05, 4.6193599700927734e-05, 4.8607587814331055e-05, 5.1021575927734375e-05, 5.3435564041137695e-05, 5.5849552154541016e-05, 5.8263540267944336e-05, 6.0677528381347656e-05, 6.309151649475098e-05, 6.55055046081543e-05, 6.791949272155762e-05, 7.033348083496094e-05, 7.274746894836426e-05, 7.516145706176758e-05, 7.75754451751709e-05, 7.998943328857422e-05]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 5.0, 7.0, 5.0, 8.0, 10.0, 17.0, 20.0, 14.0, 19.0, 17.0, 30.0, 26.0, 22.0, 26.0, 29.0, 42.0, 30.0, 46.0, 40.0, 52.0, 35.0, 38.0, 29.0, 34.0, 34.0, 38.0, 31.0, 40.0, 28.0, 24.0, 31.0, 21.0, 19.0, 19.0, 14.0, 14.0, 10.0, 12.0, 9.0, 12.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.84375, -5.65521240234375, -5.4666748046875, -5.27813720703125, -5.089599609375, -4.90106201171875, -4.7125244140625, -4.52398681640625, -4.33544921875, -4.14691162109375, -3.9583740234375, -3.76983642578125, -3.581298828125, -3.39276123046875, -3.2042236328125, -3.01568603515625, -2.8271484375, -2.63861083984375, -2.4500732421875, -2.26153564453125, -2.072998046875, -1.88446044921875, -1.6959228515625, -1.50738525390625, -1.31884765625, -1.13031005859375, -0.9417724609375, -0.75323486328125, -0.564697265625, -0.37615966796875, -0.1876220703125, 0.00091552734375, 0.189453125, 0.37799072265625, 0.5665283203125, 0.75506591796875, 0.943603515625, 1.13214111328125, 1.3206787109375, 1.50921630859375, 1.69775390625, 1.88629150390625, 2.0748291015625, 2.26336669921875, 2.451904296875, 2.64044189453125, 2.8289794921875, 3.01751708984375, 3.2060546875, 3.39459228515625, 3.5831298828125, 3.77166748046875, 3.960205078125, 4.14874267578125, 4.3372802734375, 4.52581787109375, 4.71435546875, 4.90289306640625, 5.0914306640625, 5.27996826171875, 5.468505859375, 5.65704345703125, 5.8455810546875, 6.03411865234375, 6.22265625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 4.0, 4.0, 6.0, 10.0, 10.0, 17.0, 14.0, 11.0, 28.0, 35.0, 47.0, 77.0, 81.0, 87.0, 132.0, 199.0, 203.0, 312.0, 431.0, 747.0, 1473.0, 3521.0, 10122.0, 32845.0, 216667.0, 690389.0, 63908.0, 16595.0, 5537.0, 2086.0, 959.0, 555.0, 357.0, 257.0, 170.0, 152.0, 118.0, 90.0, 78.0, 45.0, 44.0, 35.0, 19.0, 20.0, 15.0, 11.0, 11.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.4140625, -13.952392578125, -13.49072265625, -13.029052734375, -12.5673828125, -12.105712890625, -11.64404296875, -11.182373046875, -10.720703125, -10.259033203125, -9.79736328125, -9.335693359375, -8.8740234375, -8.412353515625, -7.95068359375, -7.489013671875, -7.02734375, -6.565673828125, -6.10400390625, -5.642333984375, -5.1806640625, -4.718994140625, -4.25732421875, -3.795654296875, -3.333984375, -2.872314453125, -2.41064453125, -1.948974609375, -1.4873046875, -1.025634765625, -0.56396484375, -0.102294921875, 0.359375, 0.821044921875, 1.28271484375, 1.744384765625, 2.2060546875, 2.667724609375, 3.12939453125, 3.591064453125, 4.052734375, 4.514404296875, 4.97607421875, 5.437744140625, 5.8994140625, 6.361083984375, 6.82275390625, 7.284423828125, 7.74609375, 8.207763671875, 8.66943359375, 9.131103515625, 9.5927734375, 10.054443359375, 10.51611328125, 10.977783203125, 11.439453125, 11.901123046875, 12.36279296875, 12.824462890625, 13.2861328125, 13.747802734375, 14.20947265625, 14.671142578125, 15.1328125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 5.0, 10.0, 6.0, 17.0, 21.0, 12.0, 30.0, 27.0, 28.0, 39.0, 43.0, 38.0, 48.0, 58.0, 70.0, 135.0, 347.0, 1502.0, 136.0, 83.0, 60.0, 40.0, 48.0, 39.0, 29.0, 25.0, 32.0, 23.0, 19.0, 10.0, 11.0, 4.0, 14.0, 10.0, 5.0, 8.0, 5.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.4375, -17.863037109375, -17.28857421875, -16.714111328125, -16.1396484375, -15.565185546875, -14.99072265625, -14.416259765625, -13.841796875, -13.267333984375, -12.69287109375, -12.118408203125, -11.5439453125, -10.969482421875, -10.39501953125, -9.820556640625, -9.24609375, -8.671630859375, -8.09716796875, -7.522705078125, -6.9482421875, -6.373779296875, -5.79931640625, -5.224853515625, -4.650390625, -4.075927734375, -3.50146484375, -2.927001953125, -2.3525390625, -1.778076171875, -1.20361328125, -0.629150390625, -0.0546875, 0.519775390625, 1.09423828125, 1.668701171875, 2.2431640625, 2.817626953125, 3.39208984375, 3.966552734375, 4.541015625, 5.115478515625, 5.68994140625, 6.264404296875, 6.8388671875, 7.413330078125, 7.98779296875, 8.562255859375, 9.13671875, 9.711181640625, 10.28564453125, 10.860107421875, 11.4345703125, 12.009033203125, 12.58349609375, 13.157958984375, 13.732421875, 14.306884765625, 14.88134765625, 15.455810546875, 16.0302734375, 16.604736328125, 17.17919921875, 17.753662109375, 18.328125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 9.0, 8.0, 7.0, 14.0, 21.0, 6.0, 9.0, 18.0, 28.0, 33.0, 40.0, 45.0, 51.0, 79.0, 146.0, 234.0, 592.0, 2202.0, 24798.0, 3049652.0, 62907.0, 3203.0, 757.0, 280.0, 128.0, 97.0, 70.0, 55.0, 40.0, 38.0, 35.0, 21.0, 23.0, 9.0, 16.0, 12.0, 2.0, 3.0, 6.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-46.71875, -45.24072265625, -43.7626953125, -42.28466796875, -40.806640625, -39.32861328125, -37.8505859375, -36.37255859375, -34.89453125, -33.41650390625, -31.9384765625, -30.46044921875, -28.982421875, -27.50439453125, -26.0263671875, -24.54833984375, -23.0703125, -21.59228515625, -20.1142578125, -18.63623046875, -17.158203125, -15.68017578125, -14.2021484375, -12.72412109375, -11.24609375, -9.76806640625, -8.2900390625, -6.81201171875, -5.333984375, -3.85595703125, -2.3779296875, -0.89990234375, 0.578125, 2.05615234375, 3.5341796875, 5.01220703125, 6.490234375, 7.96826171875, 9.4462890625, 10.92431640625, 12.40234375, 13.88037109375, 15.3583984375, 16.83642578125, 18.314453125, 19.79248046875, 21.2705078125, 22.74853515625, 24.2265625, 25.70458984375, 27.1826171875, 28.66064453125, 30.138671875, 31.61669921875, 33.0947265625, 34.57275390625, 36.05078125, 37.52880859375, 39.0068359375, 40.48486328125, 41.962890625, 43.44091796875, 44.9189453125, 46.39697265625, 47.875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 18.0, 93.0, 266.0, 357.0, 181.0, 76.0, 16.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.84257125854492, -34.94148635864258, -33.040401458740234, -31.13931655883789, -29.238231658935547, -27.337146759033203, -25.436059951782227, -23.534975051879883, -21.63389015197754, -19.732805252075195, -17.83172035217285, -15.930634498596191, -14.029549598693848, -12.128464698791504, -10.227378845214844, -8.3262939453125, -6.425209045410156, -4.5241241455078125, -2.6230387687683105, -0.7219533920288086, 1.1791315078735352, 3.080216407775879, 4.981302261352539, 6.882387161254883, 8.783472061157227, 10.68455696105957, 12.585641860961914, 14.486727714538574, 16.387813568115234, 18.288898468017578, 20.189983367919922, 22.091068267822266, 23.992156982421875, 25.89324188232422, 27.794326782226562, 29.695411682128906, 31.59649658203125, 33.497581481933594, 35.39866638183594, 37.29975128173828, 39.200836181640625, 41.10192108154297, 43.00300598144531, 44.904090881347656, 46.80517578125, 48.706260681152344, 50.60734558105469, 52.50843048095703, 54.40951919555664, 56.310604095458984, 58.21168899536133, 60.11277389526367, 62.013858795166016, 63.91494369506836, 65.81603240966797, 67.71711730957031, 69.61820220947266, 71.519287109375, 73.42037200927734, 75.32145690917969, 77.22254180908203, 79.12362670898438, 81.02471160888672, 82.92579650878906, 84.8268814086914]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 4.0, 4.0, 6.0, 9.0, 9.0, 14.0, 12.0, 15.0, 19.0, 18.0, 31.0, 35.0, 30.0, 33.0, 28.0, 26.0, 35.0, 47.0, 45.0, 40.0, 60.0, 37.0, 36.0, 44.0, 43.0, 30.0, 34.0, 39.0, 37.0, 25.0, 28.0, 21.0, 17.0, 21.0, 11.0, 5.0, 17.0, 8.0, 8.0, 4.0, 5.0, 0.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-47.06272506713867, -45.744659423828125, -44.42658996582031, -43.108524322509766, -41.79045486450195, -40.472389221191406, -39.154319763183594, -37.83625411987305, -36.5181884765625, -35.20012283325195, -33.88205337524414, -32.563987731933594, -31.24591827392578, -29.927852630615234, -28.609785079956055, -27.291717529296875, -25.973648071289062, -24.655580520629883, -23.337512969970703, -22.019445419311523, -20.701377868652344, -19.383312225341797, -18.065244674682617, -16.747177124023438, -15.429109573364258, -14.111042022705078, -12.792974472045898, -11.474907875061035, -10.156840324401855, -8.838772773742676, -7.520705699920654, -6.202638626098633, -4.884574890136719, -3.566507577896118, -2.2484402656555176, -0.930372953414917, 0.3876943588256836, 1.7057619094848633, 3.0238289833068848, 4.341896057128906, 5.659963607788086, 6.978031158447266, 8.296098709106445, 9.614165306091309, 10.932232856750488, 12.250300407409668, 13.568367004394531, 14.886434555053711, 16.20450210571289, 17.52256965637207, 18.84063720703125, 20.15870475769043, 21.47677230834961, 22.794837951660156, 24.112905502319336, 25.430973052978516, 26.749040603637695, 28.067108154296875, 29.385175704956055, 30.703243255615234, 32.02130889892578, 33.339378356933594, 34.65744400024414, 35.97550964355469, 37.2935791015625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 8.0, 8.0, 4.0, 11.0, 14.0, 10.0, 18.0, 22.0, 17.0, 19.0, 24.0, 38.0, 21.0, 34.0, 32.0, 44.0, 29.0, 47.0, 34.0, 38.0, 38.0, 46.0, 51.0, 31.0, 30.0, 34.0, 32.0, 32.0, 25.0, 26.0, 25.0, 32.0, 21.0, 19.0, 14.0, 11.0, 8.0, 7.0, 10.0, 5.0, 3.0, 4.0, 5.0, 2.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.66015625, -5.4608154296875, -5.261474609375, -5.0621337890625, -4.86279296875, -4.6634521484375, -4.464111328125, -4.2647705078125, -4.0654296875, -3.8660888671875, -3.666748046875, -3.4674072265625, -3.26806640625, -3.0687255859375, -2.869384765625, -2.6700439453125, -2.470703125, -2.2713623046875, -2.072021484375, -1.8726806640625, -1.67333984375, -1.4739990234375, -1.274658203125, -1.0753173828125, -0.8759765625, -0.6766357421875, -0.477294921875, -0.2779541015625, -0.07861328125, 0.1207275390625, 0.320068359375, 0.5194091796875, 0.71875, 0.9180908203125, 1.117431640625, 1.3167724609375, 1.51611328125, 1.7154541015625, 1.914794921875, 2.1141357421875, 2.3134765625, 2.5128173828125, 2.712158203125, 2.9114990234375, 3.11083984375, 3.3101806640625, 3.509521484375, 3.7088623046875, 3.908203125, 4.1075439453125, 4.306884765625, 4.5062255859375, 4.70556640625, 4.9049072265625, 5.104248046875, 5.3035888671875, 5.5029296875, 5.7022705078125, 5.901611328125, 6.1009521484375, 6.30029296875, 6.4996337890625, 6.698974609375, 6.8983154296875, 7.09765625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 3.0, 17.0, 10.0, 15.0, 38.0, 42.0, 53.0, 69.0, 114.0, 132.0, 210.0, 297.0, 509.0, 948.0, 1623.0, 3432.0, 8155.0, 30882.0, 199027.0, 1352154.0, 2096572.0, 422061.0, 55816.0, 12366.0, 4674.0, 2142.0, 1102.0, 651.0, 379.0, 229.0, 153.0, 100.0, 95.0, 39.0, 45.0, 29.0, 21.0, 19.0, 13.0, 8.0, 10.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.7265625, -10.382568359375, -10.03857421875, -9.694580078125, -9.3505859375, -9.006591796875, -8.66259765625, -8.318603515625, -7.974609375, -7.630615234375, -7.28662109375, -6.942626953125, -6.5986328125, -6.254638671875, -5.91064453125, -5.566650390625, -5.22265625, -4.878662109375, -4.53466796875, -4.190673828125, -3.8466796875, -3.502685546875, -3.15869140625, -2.814697265625, -2.470703125, -2.126708984375, -1.78271484375, -1.438720703125, -1.0947265625, -0.750732421875, -0.40673828125, -0.062744140625, 0.28125, 0.625244140625, 0.96923828125, 1.313232421875, 1.6572265625, 2.001220703125, 2.34521484375, 2.689208984375, 3.033203125, 3.377197265625, 3.72119140625, 4.065185546875, 4.4091796875, 4.753173828125, 5.09716796875, 5.441162109375, 5.78515625, 6.129150390625, 6.47314453125, 6.817138671875, 7.1611328125, 7.505126953125, 7.84912109375, 8.193115234375, 8.537109375, 8.881103515625, 9.22509765625, 9.569091796875, 9.9130859375, 10.257080078125, 10.60107421875, 10.945068359375, 11.2890625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 3.0, 8.0, 12.0, 17.0, 8.0, 24.0, 23.0, 43.0, 44.0, 50.0, 104.0, 155.0, 198.0, 281.0, 415.0, 512.0, 549.0, 492.0, 352.0, 224.0, 154.0, 116.0, 73.0, 50.0, 50.0, 27.0, 19.0, 8.0, 14.0, 18.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6953125, -9.384521484375, -9.07373046875, -8.762939453125, -8.4521484375, -8.141357421875, -7.83056640625, -7.519775390625, -7.208984375, -6.898193359375, -6.58740234375, -6.276611328125, -5.9658203125, -5.655029296875, -5.34423828125, -5.033447265625, -4.72265625, -4.411865234375, -4.10107421875, -3.790283203125, -3.4794921875, -3.168701171875, -2.85791015625, -2.547119140625, -2.236328125, -1.925537109375, -1.61474609375, -1.303955078125, -0.9931640625, -0.682373046875, -0.37158203125, -0.060791015625, 0.25, 0.560791015625, 0.87158203125, 1.182373046875, 1.4931640625, 1.803955078125, 2.11474609375, 2.425537109375, 2.736328125, 3.047119140625, 3.35791015625, 3.668701171875, 3.9794921875, 4.290283203125, 4.60107421875, 4.911865234375, 5.22265625, 5.533447265625, 5.84423828125, 6.155029296875, 6.4658203125, 6.776611328125, 7.08740234375, 7.398193359375, 7.708984375, 8.019775390625, 8.33056640625, 8.641357421875, 8.9521484375, 9.262939453125, 9.57373046875, 9.884521484375, 10.1953125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 10.0, 14.0, 24.0, 25.0, 27.0, 42.0, 61.0, 118.0, 167.0, 281.0, 618.0, 1569.0, 6320.0, 58548.0, 2953365.0, 1135582.0, 30646.0, 4320.0, 1211.0, 532.0, 280.0, 168.0, 104.0, 64.0, 57.0, 32.0, 17.0, 21.0, 12.0, 14.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.71875, -27.81787109375, -26.9169921875, -26.01611328125, -25.115234375, -24.21435546875, -23.3134765625, -22.41259765625, -21.51171875, -20.61083984375, -19.7099609375, -18.80908203125, -17.908203125, -17.00732421875, -16.1064453125, -15.20556640625, -14.3046875, -13.40380859375, -12.5029296875, -11.60205078125, -10.701171875, -9.80029296875, -8.8994140625, -7.99853515625, -7.09765625, -6.19677734375, -5.2958984375, -4.39501953125, -3.494140625, -2.59326171875, -1.6923828125, -0.79150390625, 0.109375, 1.01025390625, 1.9111328125, 2.81201171875, 3.712890625, 4.61376953125, 5.5146484375, 6.41552734375, 7.31640625, 8.21728515625, 9.1181640625, 10.01904296875, 10.919921875, 11.82080078125, 12.7216796875, 13.62255859375, 14.5234375, 15.42431640625, 16.3251953125, 17.22607421875, 18.126953125, 19.02783203125, 19.9287109375, 20.82958984375, 21.73046875, 22.63134765625, 23.5322265625, 24.43310546875, 25.333984375, 26.23486328125, 27.1357421875, 28.03662109375, 28.9375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 42.0, 240.0, 436.0, 247.0, 36.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.63336181640625, -74.14485931396484, -69.65635681152344, -65.1678466796875, -60.679344177246094, -56.19084167480469, -51.702335357666016, -47.213829040527344, -42.72532653808594, -38.23682403564453, -33.74831771850586, -29.25981330871582, -24.77130889892578, -20.282804489135742, -15.794300079345703, -11.305795669555664, -6.817291259765625, -2.328786849975586, 2.159717559814453, 6.648221969604492, 11.136726379394531, 15.62523078918457, 20.11373519897461, 24.60223960876465, 29.090744018554688, 33.579246520996094, 38.067752838134766, 42.55625915527344, 47.044761657714844, 51.53326416015625, 56.02177047729492, 60.510276794433594, 64.99876403808594, 69.48726654052734, 73.97576904296875, 78.46427917480469, 82.9527816772461, 87.4412841796875, 91.92979431152344, 96.41829681396484, 100.90679931640625, 105.39530181884766, 109.88380432128906, 114.372314453125, 118.8608169555664, 123.34931945800781, 127.83782958984375, 132.32632446289062, 136.81483459472656, 141.3033447265625, 145.79183959960938, 150.2803497314453, 154.76885986328125, 159.25735473632812, 163.74586486816406, 168.23435974121094, 172.72286987304688, 177.2113800048828, 181.6998748779297, 186.18838500976562, 190.6768798828125, 195.16539001464844, 199.65390014648438, 204.14239501953125, 208.6309051513672]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 8.0, 9.0, 7.0, 10.0, 20.0, 17.0, 27.0, 29.0, 29.0, 17.0, 25.0, 24.0, 42.0, 50.0, 35.0, 49.0, 41.0, 43.0, 45.0, 37.0, 50.0, 36.0, 37.0, 44.0, 31.0, 31.0, 21.0, 26.0, 29.0, 19.0, 19.0, 12.0, 14.0, 11.0, 6.0, 7.0, 16.0, 6.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-34.675350189208984, -33.692710876464844, -32.71007537841797, -31.727436065673828, -30.744796752929688, -29.76215934753418, -28.779521942138672, -27.79688262939453, -26.814245223999023, -25.831607818603516, -24.848968505859375, -23.866331100463867, -22.88369369506836, -21.90105438232422, -20.91841697692871, -19.935779571533203, -18.953140258789062, -17.970502853393555, -16.987863540649414, -16.005226135253906, -15.022587776184082, -14.039949417114258, -13.05731201171875, -12.074673652648926, -11.092035293579102, -10.109396934509277, -9.126758575439453, -8.144121170043945, -7.161482810974121, -6.178844451904297, -5.196206569671631, -4.213568687438965, -3.2309322357177734, -2.2482941150665283, -1.2656559944152832, -0.2830178737640381, 0.699620246887207, 1.6822586059570312, 2.6648964881896973, 3.6475343704223633, 4.6301727294921875, 5.612811088562012, 6.595448970794678, 7.578086853027344, 8.560725212097168, 9.543363571166992, 10.5260009765625, 11.508639335632324, 12.491277694702148, 13.473916053771973, 14.456554412841797, 15.439191818237305, 16.421829223632812, 17.404468536376953, 18.38710594177246, 19.36974334716797, 20.35238265991211, 21.335020065307617, 22.317659378051758, 23.300296783447266, 24.282936096191406, 25.265573501586914, 26.248210906982422, 27.230850219726562, 28.21348762512207]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 1.0, 7.0, 8.0, 13.0, 9.0, 14.0, 15.0, 18.0, 16.0, 17.0, 26.0, 26.0, 22.0, 29.0, 36.0, 41.0, 35.0, 43.0, 52.0, 37.0, 43.0, 34.0, 48.0, 36.0, 47.0, 38.0, 32.0, 37.0, 32.0, 21.0, 22.0, 17.0, 14.0, 24.0, 13.0, 16.0, 12.0, 8.0, 7.0, 3.0, 7.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.05859375, -5.8546142578125, -5.650634765625, -5.4466552734375, -5.24267578125, -5.0386962890625, -4.834716796875, -4.6307373046875, -4.4267578125, -4.2227783203125, -4.018798828125, -3.8148193359375, -3.61083984375, -3.4068603515625, -3.202880859375, -2.9989013671875, -2.794921875, -2.5909423828125, -2.386962890625, -2.1829833984375, -1.97900390625, -1.7750244140625, -1.571044921875, -1.3670654296875, -1.1630859375, -0.9591064453125, -0.755126953125, -0.5511474609375, -0.34716796875, -0.1431884765625, 0.060791015625, 0.2647705078125, 0.46875, 0.6727294921875, 0.876708984375, 1.0806884765625, 1.28466796875, 1.4886474609375, 1.692626953125, 1.8966064453125, 2.1005859375, 2.3045654296875, 2.508544921875, 2.7125244140625, 2.91650390625, 3.1204833984375, 3.324462890625, 3.5284423828125, 3.732421875, 3.9364013671875, 4.140380859375, 4.3443603515625, 4.54833984375, 4.7523193359375, 4.956298828125, 5.1602783203125, 5.3642578125, 5.5682373046875, 5.772216796875, 5.9761962890625, 6.18017578125, 6.3841552734375, 6.588134765625, 6.7921142578125, 6.99609375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 12.0, 9.0, 15.0, 19.0, 36.0, 43.0, 77.0, 113.0, 171.0, 294.0, 445.0, 739.0, 1135.0, 1911.0, 3259.0, 5631.0, 9732.0, 17207.0, 30775.0, 56782.0, 113389.0, 258475.0, 285659.0, 123748.0, 61829.0, 33259.0, 18618.0, 10440.0, 5883.0, 3438.0, 2063.0, 1284.0, 756.0, 484.0, 288.0, 175.0, 108.0, 76.0, 63.0, 39.0, 31.0, 15.0, 17.0, 6.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.35546875, -0.344024658203125, -0.33258056640625, -0.321136474609375, -0.3096923828125, -0.298248291015625, -0.28680419921875, -0.275360107421875, -0.263916015625, -0.252471923828125, -0.24102783203125, -0.229583740234375, -0.2181396484375, -0.206695556640625, -0.19525146484375, -0.183807373046875, -0.17236328125, -0.160919189453125, -0.14947509765625, -0.138031005859375, -0.1265869140625, -0.115142822265625, -0.10369873046875, -0.092254638671875, -0.080810546875, -0.069366455078125, -0.05792236328125, -0.046478271484375, -0.0350341796875, -0.023590087890625, -0.01214599609375, -0.000701904296875, 0.0107421875, 0.022186279296875, 0.03363037109375, 0.045074462890625, 0.0565185546875, 0.067962646484375, 0.07940673828125, 0.090850830078125, 0.102294921875, 0.113739013671875, 0.12518310546875, 0.136627197265625, 0.1480712890625, 0.159515380859375, 0.17095947265625, 0.182403564453125, 0.19384765625, 0.205291748046875, 0.21673583984375, 0.228179931640625, 0.2396240234375, 0.251068115234375, 0.26251220703125, 0.273956298828125, 0.285400390625, 0.296844482421875, 0.30828857421875, 0.319732666015625, 0.3311767578125, 0.342620849609375, 0.35406494140625, 0.365509033203125, 0.376953125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 5.0, 3.0, 3.0, 3.0, 9.0, 8.0, 5.0, 18.0, 13.0, 6.0, 13.0, 19.0, 25.0, 22.0, 24.0, 21.0, 35.0, 30.0, 35.0, 42.0, 22.0, 31.0, 38.0, 44.0, 35.0, 1066.0, 39.0, 31.0, 44.0, 31.0, 23.0, 42.0, 33.0, 37.0, 18.0, 21.0, 19.0, 21.0, 13.0, 16.0, 11.0, 14.0, 11.0, 9.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0], "bins": [-3.974609375, -3.850677490234375, -3.72674560546875, -3.602813720703125, -3.4788818359375, -3.354949951171875, -3.23101806640625, -3.107086181640625, -2.983154296875, -2.859222412109375, -2.73529052734375, -2.611358642578125, -2.4874267578125, -2.363494873046875, -2.23956298828125, -2.115631103515625, -1.99169921875, -1.867767333984375, -1.74383544921875, -1.619903564453125, -1.4959716796875, -1.372039794921875, -1.24810791015625, -1.124176025390625, -1.000244140625, -0.876312255859375, -0.75238037109375, -0.628448486328125, -0.5045166015625, -0.380584716796875, -0.25665283203125, -0.132720947265625, -0.0087890625, 0.115142822265625, 0.23907470703125, 0.363006591796875, 0.4869384765625, 0.610870361328125, 0.73480224609375, 0.858734130859375, 0.982666015625, 1.106597900390625, 1.23052978515625, 1.354461669921875, 1.4783935546875, 1.602325439453125, 1.72625732421875, 1.850189208984375, 1.97412109375, 2.098052978515625, 2.22198486328125, 2.345916748046875, 2.4698486328125, 2.593780517578125, 2.71771240234375, 2.841644287109375, 2.965576171875, 3.089508056640625, 3.21343994140625, 3.337371826171875, 3.4613037109375, 3.585235595703125, 3.70916748046875, 3.833099365234375, 3.95703125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 12.0, 9.0, 23.0, 28.0, 55.0, 52.0, 83.0, 99.0, 135.0, 207.0, 343.0, 514.0, 664.0, 951.0, 1376.0, 2080.0, 3185.0, 4587.0, 6982.0, 11056.0, 16971.0, 27667.0, 45905.0, 77461.0, 135318.0, 1292015.0, 196389.0, 108482.0, 62532.0, 37726.0, 22690.0, 14345.0, 9189.0, 5954.0, 3859.0, 2555.0, 1764.0, 1228.0, 771.0, 567.0, 370.0, 276.0, 190.0, 156.0, 91.0, 60.0, 45.0, 37.0, 18.0, 18.0, 13.0, 13.0, 8.0, 5.0, 6.0, 3.0, 3.0], "bins": [-0.219970703125, -0.21326446533203125, -0.2065582275390625, -0.19985198974609375, -0.193145751953125, -0.18643951416015625, -0.1797332763671875, -0.17302703857421875, -0.16632080078125, -0.15961456298828125, -0.1529083251953125, -0.14620208740234375, -0.139495849609375, -0.13278961181640625, -0.1260833740234375, -0.11937713623046875, -0.1126708984375, -0.10596466064453125, -0.0992584228515625, -0.09255218505859375, -0.085845947265625, -0.07913970947265625, -0.0724334716796875, -0.06572723388671875, -0.05902099609375, -0.05231475830078125, -0.0456085205078125, -0.03890228271484375, -0.032196044921875, -0.02548980712890625, -0.0187835693359375, -0.01207733154296875, -0.00537109375, 0.00133514404296875, 0.0080413818359375, 0.01474761962890625, 0.021453857421875, 0.02816009521484375, 0.0348663330078125, 0.04157257080078125, 0.04827880859375, 0.05498504638671875, 0.0616912841796875, 0.06839752197265625, 0.075103759765625, 0.08180999755859375, 0.0885162353515625, 0.09522247314453125, 0.1019287109375, 0.10863494873046875, 0.1153411865234375, 0.12204742431640625, 0.128753662109375, 0.13545989990234375, 0.1421661376953125, 0.14887237548828125, 0.15557861328125, 0.16228485107421875, 0.1689910888671875, 0.17569732666015625, 0.182403564453125, 0.18910980224609375, 0.1958160400390625, 0.20252227783203125, 0.209228515625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 4.0, 11.0, 9.0, 15.0, 21.0, 17.0, 18.0, 21.0, 29.0, 32.0, 39.0, 48.0, 63.0, 91.0, 97.0, 90.0, 67.0, 52.0, 62.0, 40.0, 26.0, 21.0, 13.0, 19.0, 14.0, 18.0, 10.0, 8.0, 9.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.00022935867309570312, -0.00022295117378234863, -0.00021654367446899414, -0.00021013617515563965, -0.00020372867584228516, -0.00019732117652893066, -0.00019091367721557617, -0.00018450617790222168, -0.0001780986785888672, -0.0001716911792755127, -0.0001652836799621582, -0.0001588761806488037, -0.00015246868133544922, -0.00014606118202209473, -0.00013965368270874023, -0.00013324618339538574, -0.00012683868408203125, -0.00012043118476867676, -0.00011402368545532227, -0.00010761618614196777, -0.00010120868682861328, -9.480118751525879e-05, -8.83936882019043e-05, -8.19861888885498e-05, -7.557868957519531e-05, -6.917119026184082e-05, -6.276369094848633e-05, -5.6356191635131836e-05, -4.9948692321777344e-05, -4.354119300842285e-05, -3.713369369506836e-05, -3.072619438171387e-05, -2.4318695068359375e-05, -1.7911195755004883e-05, -1.150369644165039e-05, -5.0961971282958984e-06, 1.3113021850585938e-06, 7.718801498413086e-06, 1.4126300811767578e-05, 2.053380012512207e-05, 2.6941299438476562e-05, 3.3348798751831055e-05, 3.975629806518555e-05, 4.616379737854004e-05, 5.257129669189453e-05, 5.8978796005249023e-05, 6.538629531860352e-05, 7.179379463195801e-05, 7.82012939453125e-05, 8.460879325866699e-05, 9.101629257202148e-05, 9.742379188537598e-05, 0.00010383129119873047, 0.00011023879051208496, 0.00011664628982543945, 0.00012305378913879395, 0.00012946128845214844, 0.00013586878776550293, 0.00014227628707885742, 0.00014868378639221191, 0.0001550912857055664, 0.0001614987850189209, 0.0001679062843322754, 0.00017431378364562988, 0.00018072128295898438]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 6.0, 4.0, 8.0, 10.0, 8.0, 10.0, 17.0, 25.0, 39.0, 39.0, 43.0, 67.0, 103.0, 153.0, 291.0, 714.0, 4782.0, 944448.0, 94874.0, 1709.0, 457.0, 215.0, 141.0, 81.0, 71.0, 44.0, 46.0, 26.0, 31.0, 25.0, 16.0, 11.0, 5.0, 6.0, 5.0, 5.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0043182373046875, -0.00418245792388916, -0.00404667854309082, -0.0039108991622924805, -0.0037751197814941406, -0.0036393404006958008, -0.003503561019897461, -0.003367781639099121, -0.0032320022583007812, -0.0030962228775024414, -0.0029604434967041016, -0.0028246641159057617, -0.002688884735107422, -0.002553105354309082, -0.002417325973510742, -0.0022815465927124023, -0.0021457672119140625, -0.0020099878311157227, -0.0018742084503173828, -0.001738429069519043, -0.0016026496887207031, -0.0014668703079223633, -0.0013310909271240234, -0.0011953115463256836, -0.0010595321655273438, -0.0009237527847290039, -0.0007879734039306641, -0.0006521940231323242, -0.0005164146423339844, -0.00038063526153564453, -0.0002448558807373047, -0.00010907649993896484, 2.6702880859375e-05, 0.00016248226165771484, 0.0002982616424560547, 0.00043404102325439453, 0.0005698204040527344, 0.0007055997848510742, 0.0008413791656494141, 0.000977158546447754, 0.0011129379272460938, 0.0012487173080444336, 0.0013844966888427734, 0.0015202760696411133, 0.0016560554504394531, 0.001791834831237793, 0.0019276142120361328, 0.0020633935928344727, 0.0021991729736328125, 0.0023349523544311523, 0.002470731735229492, 0.002606511116027832, 0.002742290496826172, 0.0028780698776245117, 0.0030138492584228516, 0.0031496286392211914, 0.0032854080200195312, 0.003421187400817871, 0.003556966781616211, 0.0036927461624145508, 0.0038285255432128906, 0.0039643049240112305, 0.00410008430480957, 0.00423586368560791, 0.00437164306640625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 19.0, 62.0, 261.0, 376.0, 215.0, 62.0, 10.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002169082290492952, -0.00020182506705168635, -0.0001867419050540775, -0.00017165874305646867, -0.00015657558105885983, -0.00014149240450933576, -0.00012640925706364214, -0.00011132608779007569, -9.624292579246685e-05, -8.115976379485801e-05, -6.607660179724917e-05, -5.099343616166152e-05, -3.591027416405268e-05, -2.0827108528465033e-05, -5.743946530856192e-06, 9.339215466752648e-06, 2.442237746436149e-05, 3.950553946197033e-05, 5.458870145957917e-05, 6.967186345718801e-05, 8.475502545479685e-05, 9.98381947283633e-05, 0.00011492135672597215, 0.00013000451144762337, 0.00014508768799714744, 0.00016017084999475628, 0.00017525401199236512, 0.00019033717398997396, 0.0002054203359875828, 0.00022050351253710687, 0.00023558665998280048, 0.00025066983653232455, 0.00026575298397801816, 0.00028083616052754223, 0.00029591930797323585, 0.0003110024845227599, 0.0003260856319684535, 0.0003411688085179776, 0.0003562519559636712, 0.0003713351325131953, 0.0003864182799588889, 0.00040150145650841296, 0.00041658460395410657, 0.00043166778050363064, 0.00044675092794932425, 0.0004618341044988483, 0.00047691725194454193, 0.000492000428494066, 0.0005070836050435901, 0.0005221667815931141, 0.0005372499581426382, 0.0005523330764845014, 0.0005674162530340254, 0.0005824994295835495, 0.0005975826061330736, 0.0006126657244749367, 0.0006277489010244608, 0.0006428320775739849, 0.0006579152541235089, 0.0006729983724653721, 0.0006880815490148962, 0.0007031647255644202, 0.0007182479021139443, 0.0007333310204558074, 0.0007484141970053315]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 6.0, 4.0, 7.0, 2.0, 5.0, 12.0, 13.0, 16.0, 18.0, 16.0, 15.0, 25.0, 21.0, 27.0, 22.0, 30.0, 36.0, 35.0, 38.0, 55.0, 55.0, 47.0, 47.0, 46.0, 38.0, 42.0, 40.0, 31.0, 35.0, 35.0, 24.0, 24.0, 23.0, 20.0, 19.0, 15.0, 11.0, 9.0, 8.0, 8.0, 6.0, 1.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00011020898818969727, -0.00010703317821025848, -0.0001038573682308197, -0.00010068155825138092, -9.750574827194214e-05, -9.432993829250336e-05, -9.115412831306458e-05, -8.79783183336258e-05, -8.480250835418701e-05, -8.162669837474823e-05, -7.845088839530945e-05, -7.527507841587067e-05, -7.209926843643188e-05, -6.89234584569931e-05, -6.574764847755432e-05, -6.257183849811554e-05, -5.939602851867676e-05, -5.6220218539237976e-05, -5.3044408559799194e-05, -4.986859858036041e-05, -4.669278860092163e-05, -4.351697862148285e-05, -4.034116864204407e-05, -3.7165358662605286e-05, -3.3989548683166504e-05, -3.081373870372772e-05, -2.763792872428894e-05, -2.446211874485016e-05, -2.1286308765411377e-05, -1.8110498785972595e-05, -1.4934688806533813e-05, -1.1758878827095032e-05, -8.58306884765625e-06, -5.407258868217468e-06, -2.2314488887786865e-06, 9.443610906600952e-07, 4.120171070098877e-06, 7.295981049537659e-06, 1.047179102897644e-05, 1.3647601008415222e-05, 1.6823410987854004e-05, 1.9999220967292786e-05, 2.3175030946731567e-05, 2.635084092617035e-05, 2.952665090560913e-05, 3.270246088504791e-05, 3.5878270864486694e-05, 3.9054080843925476e-05, 4.222989082336426e-05, 4.540570080280304e-05, 4.858151078224182e-05, 5.17573207616806e-05, 5.4933130741119385e-05, 5.8108940720558167e-05, 6.128475069999695e-05, 6.446056067943573e-05, 6.763637065887451e-05, 7.08121806383133e-05, 7.398799061775208e-05, 7.716380059719086e-05, 8.033961057662964e-05, 8.351542055606842e-05, 8.66912305355072e-05, 8.986704051494598e-05, 9.304285049438477e-05]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 1.0, 7.0, 8.0, 13.0, 9.0, 14.0, 15.0, 18.0, 16.0, 17.0, 26.0, 26.0, 22.0, 29.0, 36.0, 41.0, 36.0, 42.0, 52.0, 37.0, 43.0, 34.0, 48.0, 36.0, 47.0, 38.0, 32.0, 37.0, 32.0, 21.0, 22.0, 17.0, 14.0, 24.0, 13.0, 16.0, 12.0, 8.0, 7.0, 3.0, 7.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.05859375, -5.8546142578125, -5.650634765625, -5.4466552734375, -5.24267578125, -5.0386962890625, -4.834716796875, -4.6307373046875, -4.4267578125, -4.2227783203125, -4.018798828125, -3.8148193359375, -3.61083984375, -3.4068603515625, -3.202880859375, -2.9989013671875, -2.794921875, -2.5909423828125, -2.386962890625, -2.1829833984375, -1.97900390625, -1.7750244140625, -1.571044921875, -1.3670654296875, -1.1630859375, -0.9591064453125, -0.755126953125, -0.5511474609375, -0.34716796875, -0.1431884765625, 0.060791015625, 0.2647705078125, 0.46875, 0.6727294921875, 0.876708984375, 1.0806884765625, 1.28466796875, 1.4886474609375, 1.692626953125, 1.8966064453125, 2.1005859375, 2.3045654296875, 2.508544921875, 2.7125244140625, 2.91650390625, 3.1204833984375, 3.324462890625, 3.5284423828125, 3.732421875, 3.9364013671875, 4.140380859375, 4.3443603515625, 4.54833984375, 4.7523193359375, 4.956298828125, 5.1602783203125, 5.3642578125, 5.5682373046875, 5.772216796875, 5.9761962890625, 6.18017578125, 6.3841552734375, 6.588134765625, 6.7921142578125, 6.99609375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 3.0, 7.0, 6.0, 5.0, 10.0, 22.0, 24.0, 22.0, 39.0, 63.0, 83.0, 99.0, 153.0, 188.0, 294.0, 427.0, 647.0, 1077.0, 1788.0, 3308.0, 6428.0, 12836.0, 27325.0, 62595.0, 159004.0, 382407.0, 231709.0, 86157.0, 36889.0, 16574.0, 8294.0, 4136.0, 2243.0, 1335.0, 761.0, 486.0, 326.0, 225.0, 164.0, 114.0, 72.0, 56.0, 36.0, 30.0, 26.0, 20.0, 18.0, 8.0, 6.0, 8.0, 4.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.546875, -7.2926025390625, -7.038330078125, -6.7840576171875, -6.52978515625, -6.2755126953125, -6.021240234375, -5.7669677734375, -5.5126953125, -5.2584228515625, -5.004150390625, -4.7498779296875, -4.49560546875, -4.2413330078125, -3.987060546875, -3.7327880859375, -3.478515625, -3.2242431640625, -2.969970703125, -2.7156982421875, -2.46142578125, -2.2071533203125, -1.952880859375, -1.6986083984375, -1.4443359375, -1.1900634765625, -0.935791015625, -0.6815185546875, -0.42724609375, -0.1729736328125, 0.081298828125, 0.3355712890625, 0.58984375, 0.8441162109375, 1.098388671875, 1.3526611328125, 1.60693359375, 1.8612060546875, 2.115478515625, 2.3697509765625, 2.6240234375, 2.8782958984375, 3.132568359375, 3.3868408203125, 3.64111328125, 3.8953857421875, 4.149658203125, 4.4039306640625, 4.658203125, 4.9124755859375, 5.166748046875, 5.4210205078125, 5.67529296875, 5.9295654296875, 6.183837890625, 6.4381103515625, 6.6923828125, 6.9466552734375, 7.200927734375, 7.4552001953125, 7.70947265625, 7.9637451171875, 8.218017578125, 8.4722900390625, 8.7265625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 6.0, 6.0, 4.0, 6.0, 12.0, 16.0, 18.0, 19.0, 22.0, 35.0, 26.0, 46.0, 36.0, 50.0, 50.0, 65.0, 74.0, 179.0, 1438.0, 352.0, 163.0, 68.0, 52.0, 43.0, 35.0, 32.0, 25.0, 21.0, 35.0, 27.0, 13.0, 16.0, 12.0, 7.0, 10.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-19.875, -19.30419921875, -18.7333984375, -18.16259765625, -17.591796875, -17.02099609375, -16.4501953125, -15.87939453125, -15.30859375, -14.73779296875, -14.1669921875, -13.59619140625, -13.025390625, -12.45458984375, -11.8837890625, -11.31298828125, -10.7421875, -10.17138671875, -9.6005859375, -9.02978515625, -8.458984375, -7.88818359375, -7.3173828125, -6.74658203125, -6.17578125, -5.60498046875, -5.0341796875, -4.46337890625, -3.892578125, -3.32177734375, -2.7509765625, -2.18017578125, -1.609375, -1.03857421875, -0.4677734375, 0.10302734375, 0.673828125, 1.24462890625, 1.8154296875, 2.38623046875, 2.95703125, 3.52783203125, 4.0986328125, 4.66943359375, 5.240234375, 5.81103515625, 6.3818359375, 6.95263671875, 7.5234375, 8.09423828125, 8.6650390625, 9.23583984375, 9.806640625, 10.37744140625, 10.9482421875, 11.51904296875, 12.08984375, 12.66064453125, 13.2314453125, 13.80224609375, 14.373046875, 14.94384765625, 15.5146484375, 16.08544921875, 16.65625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 5.0, 4.0, 9.0, 8.0, 17.0, 16.0, 32.0, 46.0, 41.0, 74.0, 109.0, 175.0, 289.0, 523.0, 1373.0, 12487.0, 553706.0, 2542521.0, 30320.0, 2305.0, 641.0, 369.0, 199.0, 160.0, 71.0, 61.0, 26.0, 26.0, 24.0, 17.0, 14.0, 7.0, 6.0, 5.0, 2.0, 2.0, 8.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.59375, -25.64892578125, -24.7041015625, -23.75927734375, -22.814453125, -21.86962890625, -20.9248046875, -19.97998046875, -19.03515625, -18.09033203125, -17.1455078125, -16.20068359375, -15.255859375, -14.31103515625, -13.3662109375, -12.42138671875, -11.4765625, -10.53173828125, -9.5869140625, -8.64208984375, -7.697265625, -6.75244140625, -5.8076171875, -4.86279296875, -3.91796875, -2.97314453125, -2.0283203125, -1.08349609375, -0.138671875, 0.80615234375, 1.7509765625, 2.69580078125, 3.640625, 4.58544921875, 5.5302734375, 6.47509765625, 7.419921875, 8.36474609375, 9.3095703125, 10.25439453125, 11.19921875, 12.14404296875, 13.0888671875, 14.03369140625, 14.978515625, 15.92333984375, 16.8681640625, 17.81298828125, 18.7578125, 19.70263671875, 20.6474609375, 21.59228515625, 22.537109375, 23.48193359375, 24.4267578125, 25.37158203125, 26.31640625, 27.26123046875, 28.2060546875, 29.15087890625, 30.095703125, 31.04052734375, 31.9853515625, 32.93017578125, 33.875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 10.0, 768.0, 238.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-362.8045959472656, -353.2045593261719, -343.6045227050781, -334.0044860839844, -324.4044494628906, -314.804443359375, -305.20440673828125, -295.6043701171875, -286.00433349609375, -276.404296875, -266.80426025390625, -257.2042236328125, -247.6042022705078, -238.00416564941406, -228.4041290283203, -218.80410766601562, -209.2040557861328, -199.60401916503906, -190.0039825439453, -180.40396118164062, -170.80392456054688, -161.20388793945312, -151.60385131835938, -142.00381469726562, -132.40377807617188, -122.80374145507812, -113.2037124633789, -103.60367584228516, -94.00364685058594, -84.40361022949219, -74.80357360839844, -65.20354461669922, -55.60353088378906, -46.00349807739258, -36.403465270996094, -26.803428649902344, -17.20339584350586, -7.603363037109375, 1.996673583984375, 11.596702575683594, 21.196739196777344, 30.796772003173828, 40.39680480957031, 49.99684143066406, 59.59687423706055, 69.19690704345703, 78.79694366455078, 88.39697265625, 97.99700927734375, 107.5970458984375, 117.19707489013672, 126.79711151123047, 136.3971405029297, 145.99717712402344, 155.5972137451172, 165.19723510742188, 174.79727172851562, 184.39730834960938, 193.99734497070312, 203.59738159179688, 213.19740295410156, 222.7974395751953, 232.39747619628906, 241.99749755859375, 251.59754943847656]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 1.0, 7.0, 7.0, 8.0, 4.0, 9.0, 8.0, 14.0, 18.0, 12.0, 28.0, 17.0, 26.0, 26.0, 25.0, 29.0, 32.0, 35.0, 46.0, 32.0, 41.0, 49.0, 43.0, 38.0, 39.0, 37.0, 34.0, 29.0, 30.0, 26.0, 35.0, 34.0, 34.0, 18.0, 18.0, 17.0, 14.0, 12.0, 14.0, 7.0, 14.0, 11.0, 4.0, 4.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0], "bins": [-35.90821838378906, -34.79539489746094, -33.68257141113281, -32.56974792480469, -31.456926345825195, -30.34410285949707, -29.231281280517578, -28.118457794189453, -27.005634307861328, -25.892810821533203, -24.779987335205078, -23.667165756225586, -22.55434226989746, -21.441518783569336, -20.328697204589844, -19.21587371826172, -18.103050231933594, -16.99022674560547, -15.87740421295166, -14.764581680297852, -13.651758193969727, -12.538934707641602, -11.426112174987793, -10.313289642333984, -9.20046615600586, -8.087642669677734, -6.974820137023926, -5.861997127532959, -4.749174118041992, -3.6363511085510254, -2.5235280990600586, -1.4107050895690918, -0.297882080078125, 0.8149409294128418, 1.9277639389038086, 3.0405869483947754, 4.153409957885742, 5.266232967376709, 6.379055976867676, 7.491878986358643, 8.60470199584961, 9.717525482177734, 10.830348014831543, 11.943170547485352, 13.055994033813477, 14.168817520141602, 15.28164005279541, 16.39446258544922, 17.507286071777344, 18.62010955810547, 19.732933044433594, 20.845754623413086, 21.95857810974121, 23.071401596069336, 24.184223175048828, 25.297046661376953, 26.409870147705078, 27.522693634033203, 28.635517120361328, 29.74833869934082, 30.861162185668945, 31.97398567199707, 33.08680725097656, 34.19963073730469, 35.31245422363281]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 2.0, 3.0, 4.0, 4.0, 7.0, 5.0, 17.0, 13.0, 15.0, 13.0, 13.0, 20.0, 19.0, 26.0, 25.0, 29.0, 36.0, 31.0, 38.0, 43.0, 46.0, 43.0, 38.0, 42.0, 47.0, 50.0, 33.0, 43.0, 36.0, 37.0, 29.0, 27.0, 20.0, 15.0, 22.0, 9.0, 24.0, 19.0, 10.0, 13.0, 8.0, 4.0, 6.0, 4.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1171875, -5.9072265625, -5.697265625, -5.4873046875, -5.27734375, -5.0673828125, -4.857421875, -4.6474609375, -4.4375, -4.2275390625, -4.017578125, -3.8076171875, -3.59765625, -3.3876953125, -3.177734375, -2.9677734375, -2.7578125, -2.5478515625, -2.337890625, -2.1279296875, -1.91796875, -1.7080078125, -1.498046875, -1.2880859375, -1.078125, -0.8681640625, -0.658203125, -0.4482421875, -0.23828125, -0.0283203125, 0.181640625, 0.3916015625, 0.6015625, 0.8115234375, 1.021484375, 1.2314453125, 1.44140625, 1.6513671875, 1.861328125, 2.0712890625, 2.28125, 2.4912109375, 2.701171875, 2.9111328125, 3.12109375, 3.3310546875, 3.541015625, 3.7509765625, 3.9609375, 4.1708984375, 4.380859375, 4.5908203125, 4.80078125, 5.0107421875, 5.220703125, 5.4306640625, 5.640625, 5.8505859375, 6.060546875, 6.2705078125, 6.48046875, 6.6904296875, 6.900390625, 7.1103515625, 7.3203125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 8.0, 7.0, 7.0, 10.0, 19.0, 18.0, 29.0, 34.0, 54.0, 68.0, 75.0, 121.0, 174.0, 284.0, 384.0, 644.0, 1080.0, 1883.0, 3429.0, 7264.0, 19712.0, 77012.0, 370679.0, 1434643.0, 1660833.0, 477064.0, 98234.0, 23270.0, 8293.0, 3799.0, 2024.0, 1105.0, 658.0, 416.0, 285.0, 189.0, 143.0, 95.0, 60.0, 40.0, 42.0, 28.0, 14.0, 21.0, 14.0, 5.0, 9.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.703125, -8.44775390625, -8.1923828125, -7.93701171875, -7.681640625, -7.42626953125, -7.1708984375, -6.91552734375, -6.66015625, -6.40478515625, -6.1494140625, -5.89404296875, -5.638671875, -5.38330078125, -5.1279296875, -4.87255859375, -4.6171875, -4.36181640625, -4.1064453125, -3.85107421875, -3.595703125, -3.34033203125, -3.0849609375, -2.82958984375, -2.57421875, -2.31884765625, -2.0634765625, -1.80810546875, -1.552734375, -1.29736328125, -1.0419921875, -0.78662109375, -0.53125, -0.27587890625, -0.0205078125, 0.23486328125, 0.490234375, 0.74560546875, 1.0009765625, 1.25634765625, 1.51171875, 1.76708984375, 2.0224609375, 2.27783203125, 2.533203125, 2.78857421875, 3.0439453125, 3.29931640625, 3.5546875, 3.81005859375, 4.0654296875, 4.32080078125, 4.576171875, 4.83154296875, 5.0869140625, 5.34228515625, 5.59765625, 5.85302734375, 6.1083984375, 6.36376953125, 6.619140625, 6.87451171875, 7.1298828125, 7.38525390625, 7.640625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 4.0, 7.0, 9.0, 17.0, 22.0, 17.0, 18.0, 61.0, 56.0, 69.0, 135.0, 223.0, 314.0, 557.0, 727.0, 651.0, 407.0, 259.0, 188.0, 95.0, 72.0, 36.0, 21.0, 25.0, 18.0, 11.0, 13.0, 9.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.65625, -10.3087158203125, -9.961181640625, -9.6136474609375, -9.26611328125, -8.9185791015625, -8.571044921875, -8.2235107421875, -7.8759765625, -7.5284423828125, -7.180908203125, -6.8333740234375, -6.48583984375, -6.1383056640625, -5.790771484375, -5.4432373046875, -5.095703125, -4.7481689453125, -4.400634765625, -4.0531005859375, -3.70556640625, -3.3580322265625, -3.010498046875, -2.6629638671875, -2.3154296875, -1.9678955078125, -1.620361328125, -1.2728271484375, -0.92529296875, -0.5777587890625, -0.230224609375, 0.1173095703125, 0.46484375, 0.8123779296875, 1.159912109375, 1.5074462890625, 1.85498046875, 2.2025146484375, 2.550048828125, 2.8975830078125, 3.2451171875, 3.5926513671875, 3.940185546875, 4.2877197265625, 4.63525390625, 4.9827880859375, 5.330322265625, 5.6778564453125, 6.025390625, 6.3729248046875, 6.720458984375, 7.0679931640625, 7.41552734375, 7.7630615234375, 8.110595703125, 8.4581298828125, 8.8056640625, 9.1531982421875, 9.500732421875, 9.8482666015625, 10.19580078125, 10.5433349609375, 10.890869140625, 11.2384033203125, 11.5859375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 3.0, 9.0, 16.0, 35.0, 41.0, 42.0, 79.0, 120.0, 212.0, 311.0, 710.0, 1500.0, 3634.0, 11162.0, 43019.0, 333421.0, 3208993.0, 515509.0, 54512.0, 13068.0, 4342.0, 1670.0, 771.0, 409.0, 246.0, 151.0, 100.0, 58.0, 34.0, 29.0, 16.0, 16.0, 11.0, 9.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.578125, -17.0545654296875, -16.531005859375, -16.0074462890625, -15.48388671875, -14.9603271484375, -14.436767578125, -13.9132080078125, -13.3896484375, -12.8660888671875, -12.342529296875, -11.8189697265625, -11.29541015625, -10.7718505859375, -10.248291015625, -9.7247314453125, -9.201171875, -8.6776123046875, -8.154052734375, -7.6304931640625, -7.10693359375, -6.5833740234375, -6.059814453125, -5.5362548828125, -5.0126953125, -4.4891357421875, -3.965576171875, -3.4420166015625, -2.91845703125, -2.3948974609375, -1.871337890625, -1.3477783203125, -0.82421875, -0.3006591796875, 0.222900390625, 0.7464599609375, 1.27001953125, 1.7935791015625, 2.317138671875, 2.8406982421875, 3.3642578125, 3.8878173828125, 4.411376953125, 4.9349365234375, 5.45849609375, 5.9820556640625, 6.505615234375, 7.0291748046875, 7.552734375, 8.0762939453125, 8.599853515625, 9.1234130859375, 9.64697265625, 10.1705322265625, 10.694091796875, 11.2176513671875, 11.7412109375, 12.2647705078125, 12.788330078125, 13.3118896484375, 13.83544921875, 14.3590087890625, 14.882568359375, 15.4061279296875, 15.9296875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 11.0, 37.0, 107.0, 266.0, 276.0, 185.0, 87.0, 30.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.15627670288086, -19.474689483642578, -16.793102264404297, -14.111513137817383, -11.429925918579102, -8.74833869934082, -6.066749572753906, -3.385162353515625, -0.7035751342773438, 1.9780125617980957, 4.659600257873535, 7.341188430786133, 10.022775650024414, 12.704362869262695, 15.38595199584961, 18.06753921508789, 20.749126434326172, 23.430713653564453, 26.112300872802734, 28.79388999938965, 31.47547721862793, 34.157066345214844, 36.838653564453125, 39.520240783691406, 42.20182800292969, 44.88341522216797, 47.56500244140625, 50.24658966064453, 52.92817687988281, 55.609764099121094, 58.29135513305664, 60.97294235229492, 63.65452575683594, 66.33611297607422, 69.0177001953125, 71.69928741455078, 74.38087463378906, 77.06246185302734, 79.74404907226562, 82.42564392089844, 85.10722351074219, 87.78881072998047, 90.47039794921875, 93.15198516845703, 95.83357238769531, 98.5151596069336, 101.19674682617188, 103.87834167480469, 106.55992889404297, 109.24151611328125, 111.92310333251953, 114.60469055175781, 117.2862777709961, 119.96786499023438, 122.64945983886719, 125.33103942871094, 128.01263427734375, 130.69422912597656, 133.3758087158203, 136.05740356445312, 138.73898315429688, 141.4205780029297, 144.10215759277344, 146.78375244140625, 149.46533203125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 7.0, 7.0, 9.0, 10.0, 5.0, 12.0, 5.0, 16.0, 6.0, 24.0, 21.0, 32.0, 22.0, 32.0, 27.0, 28.0, 29.0, 36.0, 34.0, 52.0, 40.0, 32.0, 38.0, 48.0, 47.0, 39.0, 51.0, 31.0, 33.0, 32.0, 37.0, 33.0, 22.0, 12.0, 22.0, 15.0, 12.0, 9.0, 9.0, 8.0, 3.0, 7.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-31.46980857849121, -30.543197631835938, -29.61658477783203, -28.689973831176758, -27.76336097717285, -26.836750030517578, -25.910137176513672, -24.9835262298584, -24.056915283203125, -23.13030433654785, -22.203691482543945, -21.277080535888672, -20.350467681884766, -19.423856735229492, -18.49724578857422, -17.570632934570312, -16.644020080566406, -15.717408180236816, -14.790796279907227, -13.864185333251953, -12.937572479248047, -12.010961532592773, -11.084349632263184, -10.157737731933594, -9.231125831604004, -8.304513931274414, -7.377902030944824, -6.451290607452393, -5.524678707122803, -4.598066806793213, -3.6714553833007812, -2.7448434829711914, -1.8182296752929688, -0.8916178941726685, 0.034993886947631836, 0.9616055488586426, 1.8882174491882324, 2.8148293495178223, 3.741440773010254, 4.668052673339844, 5.594664573669434, 6.521276473999023, 7.447888374328613, 8.374500274658203, 9.301111221313477, 10.227724075317383, 11.154335021972656, 12.080946922302246, 13.007558822631836, 13.934170722961426, 14.860782623291016, 15.787393569946289, 16.714006423950195, 17.64061737060547, 18.567230224609375, 19.49384117126465, 20.420452117919922, 21.347063064575195, 22.2736759185791, 23.200286865234375, 24.12689971923828, 25.053510665893555, 25.980121612548828, 26.906734466552734, 27.83334732055664]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 5.0, 3.0, 8.0, 5.0, 7.0, 9.0, 8.0, 9.0, 12.0, 18.0, 21.0, 23.0, 28.0, 33.0, 23.0, 40.0, 33.0, 39.0, 36.0, 52.0, 39.0, 38.0, 42.0, 57.0, 33.0, 36.0, 31.0, 32.0, 29.0, 28.0, 29.0, 34.0, 19.0, 20.0, 19.0, 15.0, 18.0, 10.0, 8.0, 10.0, 10.0, 10.0, 5.0, 5.0, 1.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.61328125, -6.40802001953125, -6.2027587890625, -5.99749755859375, -5.792236328125, -5.58697509765625, -5.3817138671875, -5.17645263671875, -4.97119140625, -4.76593017578125, -4.5606689453125, -4.35540771484375, -4.150146484375, -3.94488525390625, -3.7396240234375, -3.53436279296875, -3.3291015625, -3.12384033203125, -2.9185791015625, -2.71331787109375, -2.508056640625, -2.30279541015625, -2.0975341796875, -1.89227294921875, -1.68701171875, -1.48175048828125, -1.2764892578125, -1.07122802734375, -0.865966796875, -0.66070556640625, -0.4554443359375, -0.25018310546875, -0.044921875, 0.16033935546875, 0.3656005859375, 0.57086181640625, 0.776123046875, 0.98138427734375, 1.1866455078125, 1.39190673828125, 1.59716796875, 1.80242919921875, 2.0076904296875, 2.21295166015625, 2.418212890625, 2.62347412109375, 2.8287353515625, 3.03399658203125, 3.2392578125, 3.44451904296875, 3.6497802734375, 3.85504150390625, 4.060302734375, 4.26556396484375, 4.4708251953125, 4.67608642578125, 4.88134765625, 5.08660888671875, 5.2918701171875, 5.49713134765625, 5.702392578125, 5.90765380859375, 6.1129150390625, 6.31817626953125, 6.5234375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 12.0, 12.0, 18.0, 42.0, 65.0, 92.0, 161.0, 251.0, 357.0, 580.0, 895.0, 1178.0, 1956.0, 3026.0, 4539.0, 7349.0, 11501.0, 18434.0, 30857.0, 53748.0, 98229.0, 196597.0, 284532.0, 147429.0, 76829.0, 42438.0, 25047.0, 15401.0, 9587.0, 6129.0, 3891.0, 2480.0, 1702.0, 1106.0, 777.0, 463.0, 277.0, 223.0, 130.0, 73.0, 44.0, 29.0, 22.0, 18.0, 9.0, 3.0, 1.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.30306243896484375, -0.2933807373046875, -0.28369903564453125, -0.274017333984375, -0.26433563232421875, -0.2546539306640625, -0.24497222900390625, -0.23529052734375, -0.22560882568359375, -0.2159271240234375, -0.20624542236328125, -0.196563720703125, -0.18688201904296875, -0.1772003173828125, -0.16751861572265625, -0.1578369140625, -0.14815521240234375, -0.1384735107421875, -0.12879180908203125, -0.119110107421875, -0.10942840576171875, -0.0997467041015625, -0.09006500244140625, -0.08038330078125, -0.07070159912109375, -0.0610198974609375, -0.05133819580078125, -0.041656494140625, -0.03197479248046875, -0.0222930908203125, -0.01261138916015625, -0.0029296875, 0.00675201416015625, 0.0164337158203125, 0.02611541748046875, 0.035797119140625, 0.04547882080078125, 0.0551605224609375, 0.06484222412109375, 0.07452392578125, 0.08420562744140625, 0.0938873291015625, 0.10356903076171875, 0.113250732421875, 0.12293243408203125, 0.1326141357421875, 0.14229583740234375, 0.1519775390625, 0.16165924072265625, 0.1713409423828125, 0.18102264404296875, 0.190704345703125, 0.20038604736328125, 0.2100677490234375, 0.21974945068359375, 0.22943115234375, 0.23911285400390625, 0.2487945556640625, 0.25847625732421875, 0.268157958984375, 0.27783966064453125, 0.2875213623046875, 0.29720306396484375, 0.306884765625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 4.0, 5.0, 8.0, 10.0, 8.0, 11.0, 5.0, 21.0, 18.0, 30.0, 31.0, 30.0, 31.0, 37.0, 49.0, 44.0, 63.0, 55.0, 1058.0, 44.0, 49.0, 46.0, 46.0, 45.0, 35.0, 28.0, 37.0, 27.0, 32.0, 20.0, 21.0, 20.0, 8.0, 10.0, 9.0, 9.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.53515625, -5.37103271484375, -5.2069091796875, -5.04278564453125, -4.878662109375, -4.71453857421875, -4.5504150390625, -4.38629150390625, -4.22216796875, -4.05804443359375, -3.8939208984375, -3.72979736328125, -3.565673828125, -3.40155029296875, -3.2374267578125, -3.07330322265625, -2.9091796875, -2.74505615234375, -2.5809326171875, -2.41680908203125, -2.252685546875, -2.08856201171875, -1.9244384765625, -1.76031494140625, -1.59619140625, -1.43206787109375, -1.2679443359375, -1.10382080078125, -0.939697265625, -0.77557373046875, -0.6114501953125, -0.44732666015625, -0.283203125, -0.11907958984375, 0.0450439453125, 0.20916748046875, 0.373291015625, 0.53741455078125, 0.7015380859375, 0.86566162109375, 1.02978515625, 1.19390869140625, 1.3580322265625, 1.52215576171875, 1.686279296875, 1.85040283203125, 2.0145263671875, 2.17864990234375, 2.3427734375, 2.50689697265625, 2.6710205078125, 2.83514404296875, 2.999267578125, 3.16339111328125, 3.3275146484375, 3.49163818359375, 3.65576171875, 3.81988525390625, 3.9840087890625, 4.14813232421875, 4.312255859375, 4.47637939453125, 4.6405029296875, 4.80462646484375, 4.96875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 16.0, 9.0, 25.0, 22.0, 29.0, 35.0, 49.0, 76.0, 73.0, 133.0, 186.0, 243.0, 324.0, 492.0, 654.0, 879.0, 1226.0, 1667.0, 2456.0, 3574.0, 4955.0, 7081.0, 10610.0, 15706.0, 23857.0, 36767.0, 58570.0, 97580.0, 169920.0, 1281235.0, 144426.0, 84053.0, 50971.0, 32588.0, 20965.0, 13941.0, 9440.0, 6619.0, 4530.0, 3150.0, 2239.0, 1613.0, 1129.0, 817.0, 580.0, 458.0, 360.0, 238.0, 162.0, 110.0, 78.0, 67.0, 37.0, 35.0, 23.0, 27.0, 14.0, 12.0, 10.0, 1.0, 3.0], "bins": [-0.1976318359375, -0.19152450561523438, -0.18541717529296875, -0.17930984497070312, -0.1732025146484375, -0.16709518432617188, -0.16098785400390625, -0.15488052368164062, -0.148773193359375, -0.14266586303710938, -0.13655853271484375, -0.13045120239257812, -0.1243438720703125, -0.11823654174804688, -0.11212921142578125, -0.10602188110351562, -0.09991455078125, -0.09380722045898438, -0.08769989013671875, -0.08159255981445312, -0.0754852294921875, -0.06937789916992188, -0.06327056884765625, -0.057163238525390625, -0.051055908203125, -0.044948577880859375, -0.03884124755859375, -0.032733917236328125, -0.0266265869140625, -0.020519256591796875, -0.01441192626953125, -0.008304595947265625, -0.002197265625, 0.003910064697265625, 0.01001739501953125, 0.016124725341796875, 0.0222320556640625, 0.028339385986328125, 0.03444671630859375, 0.040554046630859375, 0.046661376953125, 0.052768707275390625, 0.05887603759765625, 0.06498336791992188, 0.0710906982421875, 0.07719802856445312, 0.08330535888671875, 0.08941268920898438, 0.09552001953125, 0.10162734985351562, 0.10773468017578125, 0.11384201049804688, 0.1199493408203125, 0.12605667114257812, 0.13216400146484375, 0.13827133178710938, 0.144378662109375, 0.15048599243164062, 0.15659332275390625, 0.16270065307617188, 0.1688079833984375, 0.17491531372070312, 0.18102264404296875, 0.18712997436523438, 0.1932373046875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 11.0, 9.0, 11.0, 10.0, 15.0, 15.0, 31.0, 39.0, 58.0, 57.0, 90.0, 83.0, 109.0, 81.0, 70.0, 58.0, 41.0, 45.0, 34.0, 19.0, 21.0, 15.0, 13.0, 16.0, 5.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.0004286766052246094, -0.00041804462671279907, -0.00040741264820098877, -0.00039678066968917847, -0.00038614869117736816, -0.00037551671266555786, -0.00036488473415374756, -0.00035425275564193726, -0.00034362077713012695, -0.00033298879861831665, -0.00032235682010650635, -0.00031172484159469604, -0.00030109286308288574, -0.00029046088457107544, -0.00027982890605926514, -0.00026919692754745483, -0.00025856494903564453, -0.00024793297052383423, -0.00023730099201202393, -0.00022666901350021362, -0.00021603703498840332, -0.00020540505647659302, -0.00019477307796478271, -0.0001841410994529724, -0.0001735091209411621, -0.0001628771424293518, -0.0001522451639175415, -0.0001416131854057312, -0.0001309812068939209, -0.0001203492283821106, -0.00010971724987030029, -9.908527135848999e-05, -8.845329284667969e-05, -7.782131433486938e-05, -6.718933582305908e-05, -5.655735731124878e-05, -4.5925378799438477e-05, -3.5293400287628174e-05, -2.466142177581787e-05, -1.4029443264007568e-05, -3.3974647521972656e-06, 7.234513759613037e-06, 1.786649227142334e-05, 2.8498470783233643e-05, 3.9130449295043945e-05, 4.976242780685425e-05, 6.039440631866455e-05, 7.102638483047485e-05, 8.165836334228516e-05, 9.229034185409546e-05, 0.00010292232036590576, 0.00011355429887771606, 0.00012418627738952637, 0.00013481825590133667, 0.00014545023441314697, 0.00015608221292495728, 0.00016671419143676758, 0.00017734616994857788, 0.00018797814846038818, 0.00019861012697219849, 0.0002092421054840088, 0.0002198740839958191, 0.0002305060625076294, 0.0002411380410194397, 0.00025177001953125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 4.0, 6.0, 8.0, 10.0, 16.0, 14.0, 22.0, 22.0, 32.0, 49.0, 62.0, 88.0, 146.0, 176.0, 359.0, 706.0, 5878.0, 1024920.0, 14185.0, 805.0, 369.0, 229.0, 146.0, 89.0, 38.0, 39.0, 25.0, 21.0, 26.0, 17.0, 13.0, 9.0, 11.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004779815673828125, -0.0045771002769470215, -0.004374384880065918, -0.0041716694831848145, -0.003968954086303711, -0.0037662386894226074, -0.003563523292541504, -0.0033608078956604004, -0.003158092498779297, -0.0029553771018981934, -0.00275266170501709, -0.0025499463081359863, -0.002347230911254883, -0.0021445155143737793, -0.0019418001174926758, -0.0017390847206115723, -0.0015363693237304688, -0.0013336539268493652, -0.0011309385299682617, -0.0009282231330871582, -0.0007255077362060547, -0.0005227923393249512, -0.00032007694244384766, -0.00011736154556274414, 8.535385131835938e-05, 0.0002880692481994629, 0.0004907846450805664, 0.0006935000419616699, 0.0008962154388427734, 0.001098930835723877, 0.0013016462326049805, 0.001504361629486084, 0.0017070770263671875, 0.001909792423248291, 0.0021125078201293945, 0.002315223217010498, 0.0025179386138916016, 0.002720654010772705, 0.0029233694076538086, 0.003126084804534912, 0.0033288002014160156, 0.003531515598297119, 0.0037342309951782227, 0.003936946392059326, 0.00413966178894043, 0.004342377185821533, 0.004545092582702637, 0.00474780797958374, 0.004950523376464844, 0.005153238773345947, 0.005355954170227051, 0.005558669567108154, 0.005761384963989258, 0.005964100360870361, 0.006166815757751465, 0.006369531154632568, 0.006572246551513672, 0.006774961948394775, 0.006977677345275879, 0.007180392742156982, 0.007383108139038086, 0.0075858235359191895, 0.007788538932800293, 0.007991254329681396, 0.0081939697265625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 15.0, 90.0, 472.0, 358.0, 63.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013327023480087519, -0.0013069864362478256, -0.0012812705244868994, -0.0012555544963106513, -0.001229838584549725, -0.0012041226727887988, -0.0011784066446125507, -0.0011526907328516245, -0.0011269748210906982, -0.001101258909329772, -0.0010755429975688457, -0.0010498269693925977, -0.0010241110576316714, -0.0009983951458707452, -0.000972679175902158, -0.0009469632059335709, -0.0009212472941726446, -0.0008955313824117184, -0.0008698154124431312, -0.000844099442474544, -0.0008183835307136178, -0.0007926676189526916, -0.0007669516489841044, -0.0007412356790155172, -0.000715519767254591, -0.0006898038554936647, -0.0006640878855250776, -0.0006383719155564904, -0.0006126560037955642, -0.0005869400920346379, -0.0005612241220660508, -0.0005355081520974636, -0.0005097922403365374, -0.00048407629947178066, -0.00045836035860702395, -0.00043264441774226725, -0.00040692847687751055, -0.00038121253601275384, -0.00035549659514799714, -0.00032978065428324044, -0.0003040646843146533, -0.0002783487434498966, -0.00025263280258513987, -0.00022691686172038317, -0.00020120092085562646, -0.00017548497999086976, -0.00014976903912611306, -0.00012405309826135635, -9.833715739659965e-05, -7.262121653184295e-05, -4.6905275667086244e-05, -2.118933480232954e-05, 4.526606062427163e-06, 3.0242546927183867e-05, 5.595848779194057e-05, 8.167442865669727e-05, 0.00010739036952145398, 0.00013310631038621068, 0.00015882225125096738, 0.0001845381921157241, 0.0002102541329804808, 0.0002359700738452375, 0.0002616860147099942, 0.0002874019555747509, 0.0003131178964395076]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 7.0, 13.0, 14.0, 8.0, 14.0, 10.0, 21.0, 21.0, 21.0, 25.0, 33.0, 29.0, 38.0, 33.0, 47.0, 44.0, 34.0, 37.0, 35.0, 50.0, 33.0, 31.0, 33.0, 34.0, 39.0, 36.0, 39.0, 29.0, 22.0, 33.0, 23.0, 23.0, 16.0, 14.0, 9.0, 5.0, 10.0, 8.0, 10.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00014925003051757812, -0.0001447303220629692, -0.0001402106136083603, -0.00013569090515375137, -0.00013117119669914246, -0.00012665148824453354, -0.00012213177978992462, -0.0001176120713353157, -0.00011309236288070679, -0.00010857265442609787, -0.00010405294597148895, -9.953323751688004e-05, -9.501352906227112e-05, -9.04938206076622e-05, -8.597411215305328e-05, -8.145440369844437e-05, -7.693469524383545e-05, -7.241498678922653e-05, -6.789527833461761e-05, -6.33755698800087e-05, -5.885586142539978e-05, -5.433615297079086e-05, -4.9816444516181946e-05, -4.529673606157303e-05, -4.077702760696411e-05, -3.6257319152355194e-05, -3.173761069774628e-05, -2.721790224313736e-05, -2.2698193788528442e-05, -1.8178485333919525e-05, -1.3658776879310608e-05, -9.13906842470169e-06, -4.6193599700927734e-06, -9.96515154838562e-08, 4.420056939125061e-06, 8.939765393733978e-06, 1.3459473848342896e-05, 1.7979182302951813e-05, 2.249889075756073e-05, 2.7018599212169647e-05, 3.1538307666778564e-05, 3.605801612138748e-05, 4.05777245759964e-05, 4.5097433030605316e-05, 4.9617141485214233e-05, 5.413684993982315e-05, 5.865655839443207e-05, 6.317626684904099e-05, 6.76959753036499e-05, 7.221568375825882e-05, 7.673539221286774e-05, 8.125510066747665e-05, 8.577480912208557e-05, 9.029451757669449e-05, 9.48142260313034e-05, 9.933393448591232e-05, 0.00010385364294052124, 0.00010837335139513016, 0.00011289305984973907, 0.00011741276830434799, 0.00012193247675895691, 0.00012645218521356583, 0.00013097189366817474, 0.00013549160212278366, 0.00014001131057739258]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 5.0, 3.0, 8.0, 5.0, 7.0, 9.0, 8.0, 9.0, 12.0, 18.0, 21.0, 23.0, 28.0, 33.0, 23.0, 40.0, 33.0, 39.0, 36.0, 52.0, 39.0, 38.0, 42.0, 57.0, 33.0, 36.0, 31.0, 32.0, 29.0, 28.0, 29.0, 34.0, 19.0, 20.0, 19.0, 15.0, 18.0, 10.0, 8.0, 10.0, 10.0, 10.0, 5.0, 5.0, 1.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.61328125, -6.40802001953125, -6.2027587890625, -5.99749755859375, -5.792236328125, -5.58697509765625, -5.3817138671875, -5.17645263671875, -4.97119140625, -4.76593017578125, -4.5606689453125, -4.35540771484375, -4.150146484375, -3.94488525390625, -3.7396240234375, -3.53436279296875, -3.3291015625, -3.12384033203125, -2.9185791015625, -2.71331787109375, -2.508056640625, -2.30279541015625, -2.0975341796875, -1.89227294921875, -1.68701171875, -1.48175048828125, -1.2764892578125, -1.07122802734375, -0.865966796875, -0.66070556640625, -0.4554443359375, -0.25018310546875, -0.044921875, 0.16033935546875, 0.3656005859375, 0.57086181640625, 0.776123046875, 0.98138427734375, 1.1866455078125, 1.39190673828125, 1.59716796875, 1.80242919921875, 2.0076904296875, 2.21295166015625, 2.418212890625, 2.62347412109375, 2.8287353515625, 3.03399658203125, 3.2392578125, 3.44451904296875, 3.6497802734375, 3.85504150390625, 4.060302734375, 4.26556396484375, 4.4708251953125, 4.67608642578125, 4.88134765625, 5.08660888671875, 5.2918701171875, 5.49713134765625, 5.702392578125, 5.90765380859375, 6.1129150390625, 6.31817626953125, 6.5234375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 10.0, 12.0, 20.0, 23.0, 29.0, 34.0, 45.0, 65.0, 85.0, 140.0, 161.0, 247.0, 369.0, 581.0, 962.0, 1657.0, 3050.0, 6055.0, 13413.0, 33891.0, 96368.0, 270738.0, 379119.0, 151718.0, 52094.0, 19640.0, 8421.0, 4090.0, 2122.0, 1167.0, 706.0, 467.0, 295.0, 218.0, 157.0, 110.0, 64.0, 54.0, 39.0, 27.0, 24.0, 12.0, 17.0, 11.0, 7.0, 3.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.6796875, -8.401611328125, -8.12353515625, -7.845458984375, -7.5673828125, -7.289306640625, -7.01123046875, -6.733154296875, -6.455078125, -6.177001953125, -5.89892578125, -5.620849609375, -5.3427734375, -5.064697265625, -4.78662109375, -4.508544921875, -4.23046875, -3.952392578125, -3.67431640625, -3.396240234375, -3.1181640625, -2.840087890625, -2.56201171875, -2.283935546875, -2.005859375, -1.727783203125, -1.44970703125, -1.171630859375, -0.8935546875, -0.615478515625, -0.33740234375, -0.059326171875, 0.21875, 0.496826171875, 0.77490234375, 1.052978515625, 1.3310546875, 1.609130859375, 1.88720703125, 2.165283203125, 2.443359375, 2.721435546875, 2.99951171875, 3.277587890625, 3.5556640625, 3.833740234375, 4.11181640625, 4.389892578125, 4.66796875, 4.946044921875, 5.22412109375, 5.502197265625, 5.7802734375, 6.058349609375, 6.33642578125, 6.614501953125, 6.892578125, 7.170654296875, 7.44873046875, 7.726806640625, 8.0048828125, 8.282958984375, 8.56103515625, 8.839111328125, 9.1171875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 10.0, 6.0, 8.0, 10.0, 11.0, 15.0, 20.0, 23.0, 21.0, 29.0, 36.0, 39.0, 47.0, 52.0, 62.0, 89.0, 194.0, 1377.0, 374.0, 167.0, 91.0, 49.0, 63.0, 51.0, 57.0, 31.0, 32.0, 26.0, 17.0, 11.0, 7.0, 8.0, 3.0, 4.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.796875, -16.19677734375, -15.5966796875, -14.99658203125, -14.396484375, -13.79638671875, -13.1962890625, -12.59619140625, -11.99609375, -11.39599609375, -10.7958984375, -10.19580078125, -9.595703125, -8.99560546875, -8.3955078125, -7.79541015625, -7.1953125, -6.59521484375, -5.9951171875, -5.39501953125, -4.794921875, -4.19482421875, -3.5947265625, -2.99462890625, -2.39453125, -1.79443359375, -1.1943359375, -0.59423828125, 0.005859375, 0.60595703125, 1.2060546875, 1.80615234375, 2.40625, 3.00634765625, 3.6064453125, 4.20654296875, 4.806640625, 5.40673828125, 6.0068359375, 6.60693359375, 7.20703125, 7.80712890625, 8.4072265625, 9.00732421875, 9.607421875, 10.20751953125, 10.8076171875, 11.40771484375, 12.0078125, 12.60791015625, 13.2080078125, 13.80810546875, 14.408203125, 15.00830078125, 15.6083984375, 16.20849609375, 16.80859375, 17.40869140625, 18.0087890625, 18.60888671875, 19.208984375, 19.80908203125, 20.4091796875, 21.00927734375, 21.609375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 9.0, 5.0, 17.0, 9.0, 19.0, 24.0, 26.0, 49.0, 60.0, 90.0, 135.0, 187.0, 298.0, 514.0, 1081.0, 5032.0, 143675.0, 2925395.0, 63500.0, 3221.0, 927.0, 461.0, 278.0, 207.0, 125.0, 98.0, 63.0, 36.0, 38.0, 30.0, 22.0, 14.0, 14.0, 6.0, 4.0, 7.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.109375, -25.190185546875, -24.27099609375, -23.351806640625, -22.4326171875, -21.513427734375, -20.59423828125, -19.675048828125, -18.755859375, -17.836669921875, -16.91748046875, -15.998291015625, -15.0791015625, -14.159912109375, -13.24072265625, -12.321533203125, -11.40234375, -10.483154296875, -9.56396484375, -8.644775390625, -7.7255859375, -6.806396484375, -5.88720703125, -4.968017578125, -4.048828125, -3.129638671875, -2.21044921875, -1.291259765625, -0.3720703125, 0.547119140625, 1.46630859375, 2.385498046875, 3.3046875, 4.223876953125, 5.14306640625, 6.062255859375, 6.9814453125, 7.900634765625, 8.81982421875, 9.739013671875, 10.658203125, 11.577392578125, 12.49658203125, 13.415771484375, 14.3349609375, 15.254150390625, 16.17333984375, 17.092529296875, 18.01171875, 18.930908203125, 19.85009765625, 20.769287109375, 21.6884765625, 22.607666015625, 23.52685546875, 24.446044921875, 25.365234375, 26.284423828125, 27.20361328125, 28.122802734375, 29.0419921875, 29.961181640625, 30.88037109375, 31.799560546875, 32.71875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 915.0, 104.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-437.2157897949219, -422.03289794921875, -406.8500061035156, -391.6671142578125, -376.4842224121094, -361.30133056640625, -346.1184387207031, -330.935546875, -315.7526550292969, -300.56976318359375, -285.3868713378906, -270.2039794921875, -255.02108764648438, -239.83819580078125, -224.65530395507812, -209.472412109375, -194.28952026367188, -179.10662841796875, -163.92373657226562, -148.7408447265625, -133.55795288085938, -118.37506103515625, -103.19216918945312, -88.00927734375, -72.82638549804688, -57.64349365234375, -42.460601806640625, -27.2777099609375, -12.094818115234375, 3.08807373046875, 18.270965576171875, 33.453857421875, 48.63671875, 63.819610595703125, 79.00250244140625, 94.18539428710938, 109.3682861328125, 124.55117797851562, 139.73406982421875, 154.91696166992188, 170.099853515625, 185.28274536132812, 200.46563720703125, 215.64852905273438, 230.8314208984375, 246.01431274414062, 261.19720458984375, 276.3800964355469, 291.56298828125, 306.7458801269531, 321.92877197265625, 337.1116638183594, 352.2945556640625, 367.4774475097656, 382.66033935546875, 397.8432312011719, 413.026123046875, 428.2090148925781, 443.39190673828125, 458.5747985839844, 473.7576904296875, 488.9405822753906, 504.12347412109375, 519.306396484375, 534.4892578125]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 11.0, 8.0, 15.0, 9.0, 6.0, 22.0, 21.0, 21.0, 39.0, 32.0, 33.0, 48.0, 28.0, 39.0, 47.0, 30.0, 48.0, 44.0, 54.0, 45.0, 44.0, 34.0, 34.0, 36.0, 43.0, 32.0, 26.0, 24.0, 22.0, 18.0, 13.0, 9.0, 17.0, 12.0, 12.0, 5.0, 6.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-47.79768753051758, -46.52851486206055, -45.259342193603516, -43.990169525146484, -42.72099685668945, -41.45182800292969, -40.182655334472656, -38.913482666015625, -37.644309997558594, -36.37513732910156, -35.10596466064453, -33.8367919921875, -32.56761932373047, -31.29844856262207, -30.02927589416504, -28.76010513305664, -27.490930557250977, -26.221757888793945, -24.952585220336914, -23.683414459228516, -22.414241790771484, -21.145069122314453, -19.875896453857422, -18.60672378540039, -17.33755111694336, -16.068378448486328, -14.799206733703613, -13.530034065246582, -12.260862350463867, -10.991689682006836, -9.722517013549805, -8.45334529876709, -7.184173583984375, -5.915001392364502, -4.645829200744629, -3.3766565322875977, -2.1074843406677246, -0.8383121490478516, 0.4308605194091797, 1.7000322341918945, 2.969204902648926, 4.238377094268799, 5.507549285888672, 6.776721954345703, 8.045894622802734, 9.31506633758545, 10.58423900604248, 11.853410720825195, 13.122583389282227, 14.391756057739258, 15.660927772521973, 16.930099487304688, 18.19927215576172, 19.46844482421875, 20.73761749267578, 22.006790161132812, 23.275962829589844, 24.545135498046875, 25.814308166503906, 27.083480834960938, 28.352651596069336, 29.621824264526367, 30.8909969329834, 32.1601676940918, 33.42934036254883]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 4.0, 3.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 5.0, 12.0, 13.0, 10.0, 12.0, 18.0, 22.0, 26.0, 30.0, 39.0, 31.0, 29.0, 32.0, 38.0, 37.0, 24.0, 46.0, 35.0, 33.0, 42.0, 29.0, 39.0, 33.0, 27.0, 27.0, 27.0, 32.0, 25.0, 27.0, 26.0, 26.0, 16.0, 15.0, 13.0, 11.0, 11.0, 8.0, 5.0, 8.0, 3.0, 5.0, 8.0, 5.0, 1.0, 4.0, 4.0, 1.0, 3.0], "bins": [-6.42578125, -6.23797607421875, -6.0501708984375, -5.86236572265625, -5.674560546875, -5.48675537109375, -5.2989501953125, -5.11114501953125, -4.92333984375, -4.73553466796875, -4.5477294921875, -4.35992431640625, -4.172119140625, -3.98431396484375, -3.7965087890625, -3.60870361328125, -3.4208984375, -3.23309326171875, -3.0452880859375, -2.85748291015625, -2.669677734375, -2.48187255859375, -2.2940673828125, -2.10626220703125, -1.91845703125, -1.73065185546875, -1.5428466796875, -1.35504150390625, -1.167236328125, -0.97943115234375, -0.7916259765625, -0.60382080078125, -0.416015625, -0.22821044921875, -0.0404052734375, 0.14739990234375, 0.335205078125, 0.52301025390625, 0.7108154296875, 0.89862060546875, 1.08642578125, 1.27423095703125, 1.4620361328125, 1.64984130859375, 1.837646484375, 2.02545166015625, 2.2132568359375, 2.40106201171875, 2.5888671875, 2.77667236328125, 2.9644775390625, 3.15228271484375, 3.340087890625, 3.52789306640625, 3.7156982421875, 3.90350341796875, 4.09130859375, 4.27911376953125, 4.4669189453125, 4.65472412109375, 4.842529296875, 5.03033447265625, 5.2181396484375, 5.40594482421875, 5.59375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 0.0, 2.0, 4.0, 3.0, 11.0, 13.0, 22.0, 14.0, 24.0, 22.0, 20.0, 33.0, 48.0, 59.0, 60.0, 94.0, 116.0, 164.0, 224.0, 327.0, 459.0, 1894.0, 47737.0, 4122540.0, 17479.0, 1274.0, 417.0, 302.0, 216.0, 156.0, 121.0, 91.0, 63.0, 43.0, 41.0, 36.0, 33.0, 22.0, 21.0, 16.0, 10.0, 13.0, 8.0, 9.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.0, -62.02490234375, -60.0498046875, -58.07470703125, -56.099609375, -54.12451171875, -52.1494140625, -50.17431640625, -48.19921875, -46.22412109375, -44.2490234375, -42.27392578125, -40.298828125, -38.32373046875, -36.3486328125, -34.37353515625, -32.3984375, -30.42333984375, -28.4482421875, -26.47314453125, -24.498046875, -22.52294921875, -20.5478515625, -18.57275390625, -16.59765625, -14.62255859375, -12.6474609375, -10.67236328125, -8.697265625, -6.72216796875, -4.7470703125, -2.77197265625, -0.796875, 1.17822265625, 3.1533203125, 5.12841796875, 7.103515625, 9.07861328125, 11.0537109375, 13.02880859375, 15.00390625, 16.97900390625, 18.9541015625, 20.92919921875, 22.904296875, 24.87939453125, 26.8544921875, 28.82958984375, 30.8046875, 32.77978515625, 34.7548828125, 36.72998046875, 38.705078125, 40.68017578125, 42.6552734375, 44.63037109375, 46.60546875, 48.58056640625, 50.5556640625, 52.53076171875, 54.505859375, 56.48095703125, 58.4560546875, 60.43115234375, 62.40625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 6.0, 3.0, 4.0, 5.0, 8.0, 9.0, 7.0, 7.0, 12.0, 11.0, 14.0, 19.0, 21.0, 38.0, 47.0, 51.0, 68.0, 98.0, 149.0, 232.0, 352.0, 494.0, 565.0, 549.0, 395.0, 257.0, 187.0, 114.0, 74.0, 71.0, 40.0, 29.0, 30.0, 24.0, 17.0, 20.0, 15.0, 7.0, 7.0, 8.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.28125, -10.98138427734375, -10.6815185546875, -10.38165283203125, -10.081787109375, -9.78192138671875, -9.4820556640625, -9.18218994140625, -8.88232421875, -8.58245849609375, -8.2825927734375, -7.98272705078125, -7.682861328125, -7.38299560546875, -7.0831298828125, -6.78326416015625, -6.4833984375, -6.18353271484375, -5.8836669921875, -5.58380126953125, -5.283935546875, -4.98406982421875, -4.6842041015625, -4.38433837890625, -4.08447265625, -3.78460693359375, -3.4847412109375, -3.18487548828125, -2.885009765625, -2.58514404296875, -2.2852783203125, -1.98541259765625, -1.685546875, -1.38568115234375, -1.0858154296875, -0.78594970703125, -0.486083984375, -0.18621826171875, 0.1136474609375, 0.41351318359375, 0.71337890625, 1.01324462890625, 1.3131103515625, 1.61297607421875, 1.912841796875, 2.21270751953125, 2.5125732421875, 2.81243896484375, 3.1123046875, 3.41217041015625, 3.7120361328125, 4.01190185546875, 4.311767578125, 4.61163330078125, 4.9114990234375, 5.21136474609375, 5.51123046875, 5.81109619140625, 6.1109619140625, 6.41082763671875, 6.710693359375, 7.01055908203125, 7.3104248046875, 7.61029052734375, 7.91015625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 12.0, 10.0, 16.0, 25.0, 22.0, 41.0, 57.0, 98.0, 284.0, 1011.0, 7152.0, 221403.0, 3916352.0, 43917.0, 2894.0, 516.0, 164.0, 96.0, 56.0, 42.0, 27.0, 24.0, 20.0, 11.0, 14.0, 3.0, 6.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.46875, -35.98828125, -34.5078125, -33.02734375, -31.546875, -30.06640625, -28.5859375, -27.10546875, -25.625, -24.14453125, -22.6640625, -21.18359375, -19.703125, -18.22265625, -16.7421875, -15.26171875, -13.78125, -12.30078125, -10.8203125, -9.33984375, -7.859375, -6.37890625, -4.8984375, -3.41796875, -1.9375, -0.45703125, 1.0234375, 2.50390625, 3.984375, 5.46484375, 6.9453125, 8.42578125, 9.90625, 11.38671875, 12.8671875, 14.34765625, 15.828125, 17.30859375, 18.7890625, 20.26953125, 21.75, 23.23046875, 24.7109375, 26.19140625, 27.671875, 29.15234375, 30.6328125, 32.11328125, 33.59375, 35.07421875, 36.5546875, 38.03515625, 39.515625, 40.99609375, 42.4765625, 43.95703125, 45.4375, 46.91796875, 48.3984375, 49.87890625, 51.359375, 52.83984375, 54.3203125, 55.80078125, 57.28125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 9.0, 25.0, 111.0, 258.0, 328.0, 197.0, 63.0, 16.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.01484680175781, -89.48133850097656, -85.94783782958984, -82.4143295288086, -78.88082885742188, -75.34732055664062, -71.81381225585938, -68.28031158447266, -64.74681091308594, -61.21330642700195, -57.67980194091797, -54.14629364013672, -50.61279296875, -47.07928466796875, -43.545780181884766, -40.01227569580078, -36.47876739501953, -32.94526290893555, -29.411758422851562, -25.878252029418945, -22.34474754333496, -18.811243057250977, -15.27773666381836, -11.744232177734375, -8.21072769165039, -4.677222728729248, -1.1437177658081055, 2.3897876739501953, 5.92329216003418, 9.456796646118164, 12.990303039550781, 16.523807525634766, 20.05731201171875, 23.590816497802734, 27.12432098388672, 30.657827377319336, 34.19132995605469, 37.72483825683594, 41.25834274291992, 44.791847229003906, 48.32535171508789, 51.858856201171875, 55.39236068725586, 58.925865173339844, 62.459373474121094, 65.99287414550781, 69.52638244628906, 73.05989074707031, 76.59339141845703, 80.12689971923828, 83.660400390625, 87.19390869140625, 90.72740936279297, 94.26091766357422, 97.79441833496094, 101.32792663574219, 104.86143493652344, 108.39494323730469, 111.9284439086914, 115.46195220947266, 118.99545288085938, 122.52896118164062, 126.06246948242188, 129.59597778320312, 133.1294708251953]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 4.0, 5.0, 5.0, 12.0, 16.0, 18.0, 12.0, 22.0, 11.0, 37.0, 39.0, 30.0, 46.0, 51.0, 45.0, 51.0, 55.0, 50.0, 50.0, 46.0, 48.0, 41.0, 46.0, 44.0, 25.0, 37.0, 31.0, 23.0, 17.0, 17.0, 10.0, 13.0, 11.0, 7.0, 5.0, 2.0, 2.0, 8.0, 3.0, 1.0, 3.0, 3.0, 3.0], "bins": [-45.58680725097656, -44.40829849243164, -43.22978973388672, -42.0512809753418, -40.872772216796875, -39.69426727294922, -38.5157585144043, -37.337249755859375, -36.15874099731445, -34.98023223876953, -33.80172348022461, -32.62321472167969, -31.4447078704834, -30.266199111938477, -29.087692260742188, -27.909183502197266, -26.730674743652344, -25.552165985107422, -24.3736572265625, -23.19515037536621, -22.01664161682129, -20.838132858276367, -19.659626007080078, -18.481117248535156, -17.302608489990234, -16.124099731445312, -14.945591926574707, -13.767084121704102, -12.58857536315918, -11.410066604614258, -10.231558799743652, -9.053050994873047, -7.874546051025391, -6.696037769317627, -5.517529487609863, -4.3390212059021, -3.160512924194336, -1.9820046424865723, -0.8034963607788086, 0.3750114440917969, 1.5535202026367188, 2.7320284843444824, 3.910536766052246, 5.08904504776001, 6.267553329467773, 7.446061611175537, 8.6245698928833, 9.803077697753906, 10.981586456298828, 12.16009521484375, 13.338603019714355, 14.517110824584961, 15.695619583129883, 16.874128341674805, 18.052635192871094, 19.231143951416016, 20.409652709960938, 21.58816146850586, 22.76667022705078, 23.94517707824707, 25.123685836791992, 26.302194595336914, 27.480701446533203, 28.659210205078125, 29.837718963623047]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 3.0, 2.0, 6.0, 7.0, 5.0, 15.0, 17.0, 17.0, 17.0, 25.0, 25.0, 27.0, 34.0, 24.0, 37.0, 45.0, 37.0, 42.0, 62.0, 48.0, 36.0, 30.0, 44.0, 46.0, 38.0, 38.0, 34.0, 33.0, 25.0, 27.0, 30.0, 17.0, 24.0, 15.0, 8.0, 16.0, 9.0, 9.0, 7.0, 2.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3515625, -7.1251220703125, -6.898681640625, -6.6722412109375, -6.44580078125, -6.2193603515625, -5.992919921875, -5.7664794921875, -5.5400390625, -5.3135986328125, -5.087158203125, -4.8607177734375, -4.63427734375, -4.4078369140625, -4.181396484375, -3.9549560546875, -3.728515625, -3.5020751953125, -3.275634765625, -3.0491943359375, -2.82275390625, -2.5963134765625, -2.369873046875, -2.1434326171875, -1.9169921875, -1.6905517578125, -1.464111328125, -1.2376708984375, -1.01123046875, -0.7847900390625, -0.558349609375, -0.3319091796875, -0.10546875, 0.1209716796875, 0.347412109375, 0.5738525390625, 0.80029296875, 1.0267333984375, 1.253173828125, 1.4796142578125, 1.7060546875, 1.9324951171875, 2.158935546875, 2.3853759765625, 2.61181640625, 2.8382568359375, 3.064697265625, 3.2911376953125, 3.517578125, 3.7440185546875, 3.970458984375, 4.1968994140625, 4.42333984375, 4.6497802734375, 4.876220703125, 5.1026611328125, 5.3291015625, 5.5555419921875, 5.781982421875, 6.0084228515625, 6.23486328125, 6.4613037109375, 6.687744140625, 6.9141845703125, 7.140625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 16.0, 12.0, 20.0, 45.0, 71.0, 103.0, 167.0, 267.0, 413.0, 742.0, 1181.0, 1842.0, 3172.0, 5289.0, 9030.0, 15720.0, 27608.0, 52424.0, 108969.0, 247205.0, 303896.0, 131809.0, 62713.0, 32477.0, 18010.0, 10241.0, 5990.0, 3566.0, 2148.0, 1335.0, 778.0, 489.0, 298.0, 166.0, 110.0, 70.0, 54.0, 34.0, 18.0, 17.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368896484375, -0.3570442199707031, -0.34519195556640625, -0.3333396911621094, -0.3214874267578125, -0.3096351623535156, -0.29778289794921875, -0.2859306335449219, -0.274078369140625, -0.2622261047363281, -0.25037384033203125, -0.23852157592773438, -0.2266693115234375, -0.21481704711914062, -0.20296478271484375, -0.19111251831054688, -0.17926025390625, -0.16740798950195312, -0.15555572509765625, -0.14370346069335938, -0.1318511962890625, -0.11999893188476562, -0.10814666748046875, -0.09629440307617188, -0.084442138671875, -0.07258987426757812, -0.06073760986328125, -0.048885345458984375, -0.0370330810546875, -0.025180816650390625, -0.01332855224609375, -0.001476287841796875, 0.0103759765625, 0.022228240966796875, 0.03408050537109375, 0.045932769775390625, 0.0577850341796875, 0.06963729858398438, 0.08148956298828125, 0.09334182739257812, 0.105194091796875, 0.11704635620117188, 0.12889862060546875, 0.14075088500976562, 0.1526031494140625, 0.16445541381835938, 0.17630767822265625, 0.18815994262695312, 0.20001220703125, 0.21186447143554688, 0.22371673583984375, 0.23556900024414062, 0.2474212646484375, 0.2592735290527344, 0.27112579345703125, 0.2829780578613281, 0.294830322265625, 0.3066825866699219, 0.31853485107421875, 0.3303871154785156, 0.3422393798828125, 0.3540916442871094, 0.36594390869140625, 0.3777961730957031, 0.3896484375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 7.0, 11.0, 12.0, 18.0, 12.0, 19.0, 16.0, 30.0, 25.0, 25.0, 38.0, 29.0, 33.0, 46.0, 32.0, 37.0, 53.0, 1059.0, 35.0, 40.0, 38.0, 40.0, 39.0, 35.0, 29.0, 19.0, 26.0, 24.0, 20.0, 26.0, 18.0, 19.0, 15.0, 13.0, 13.0, 15.0, 10.0, 7.0, 7.0, 1.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.150390625, -4.01953125, -3.888671875, -3.7578125, -3.626953125, -3.49609375, -3.365234375, -3.234375, -3.103515625, -2.97265625, -2.841796875, -2.7109375, -2.580078125, -2.44921875, -2.318359375, -2.1875, -2.056640625, -1.92578125, -1.794921875, -1.6640625, -1.533203125, -1.40234375, -1.271484375, -1.140625, -1.009765625, -0.87890625, -0.748046875, -0.6171875, -0.486328125, -0.35546875, -0.224609375, -0.09375, 0.037109375, 0.16796875, 0.298828125, 0.4296875, 0.560546875, 0.69140625, 0.822265625, 0.953125, 1.083984375, 1.21484375, 1.345703125, 1.4765625, 1.607421875, 1.73828125, 1.869140625, 2.0, 2.130859375, 2.26171875, 2.392578125, 2.5234375, 2.654296875, 2.78515625, 2.916015625, 3.046875, 3.177734375, 3.30859375, 3.439453125, 3.5703125, 3.701171875, 3.83203125, 3.962890625, 4.09375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 10.0, 15.0, 18.0, 30.0, 36.0, 55.0, 83.0, 116.0, 168.0, 237.0, 338.0, 480.0, 692.0, 997.0, 1491.0, 2174.0, 3024.0, 4617.0, 7161.0, 10724.0, 16889.0, 26563.0, 43106.0, 70313.0, 121128.0, 1269629.0, 217216.0, 117080.0, 67680.0, 41148.0, 25819.0, 16144.0, 10572.0, 6864.0, 4661.0, 3089.0, 2069.0, 1451.0, 975.0, 728.0, 469.0, 326.0, 223.0, 163.0, 106.0, 90.0, 52.0, 36.0, 19.0, 21.0, 11.0, 12.0, 7.0, 6.0, 4.0, 4.0, 3.0], "bins": [-0.2186279296875, -0.21199607849121094, -0.20536422729492188, -0.1987323760986328, -0.19210052490234375, -0.1854686737060547, -0.17883682250976562, -0.17220497131347656, -0.1655731201171875, -0.15894126892089844, -0.15230941772460938, -0.1456775665283203, -0.13904571533203125, -0.1324138641357422, -0.12578201293945312, -0.11915016174316406, -0.112518310546875, -0.10588645935058594, -0.09925460815429688, -0.09262275695800781, -0.08599090576171875, -0.07935905456542969, -0.07272720336914062, -0.06609535217285156, -0.0594635009765625, -0.05283164978027344, -0.046199798583984375, -0.03956794738769531, -0.03293609619140625, -0.026304244995117188, -0.019672393798828125, -0.013040542602539062, -0.00640869140625, 0.0002231597900390625, 0.006855010986328125, 0.013486862182617188, 0.02011871337890625, 0.026750564575195312, 0.033382415771484375, 0.04001426696777344, 0.0466461181640625, 0.05327796936035156, 0.059909820556640625, 0.06654167175292969, 0.07317352294921875, 0.07980537414550781, 0.08643722534179688, 0.09306907653808594, 0.099700927734375, 0.10633277893066406, 0.11296463012695312, 0.11959648132324219, 0.12622833251953125, 0.1328601837158203, 0.13949203491210938, 0.14612388610839844, 0.1527557373046875, 0.15938758850097656, 0.16601943969726562, 0.1726512908935547, 0.17928314208984375, 0.1859149932861328, 0.19254684448242188, 0.19917869567871094, 0.205810546875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 8.0, 15.0, 19.0, 39.0, 56.0, 91.0, 115.0, 156.0, 140.0, 112.0, 79.0, 56.0, 33.0, 19.0, 12.0, 11.0, 2.0, 7.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036978721618652344, -0.0003594718873500824, -0.00034915655851364136, -0.0003388412296772003, -0.0003285259008407593, -0.00031821057200431824, -0.0003078952431678772, -0.00029757991433143616, -0.0002872645854949951, -0.0002769492566585541, -0.00026663392782211304, -0.000256318598985672, -0.00024600327014923096, -0.00023568794131278992, -0.00022537261247634888, -0.00021505728363990784, -0.0002047419548034668, -0.00019442662596702576, -0.00018411129713058472, -0.00017379596829414368, -0.00016348063945770264, -0.0001531653106212616, -0.00014284998178482056, -0.00013253465294837952, -0.00012221932411193848, -0.00011190399527549744, -0.0001015886664390564, -9.127333760261536e-05, -8.095800876617432e-05, -7.064267992973328e-05, -6.0327351093292236e-05, -5.0012022256851196e-05, -3.9696693420410156e-05, -2.9381364583969116e-05, -1.9066035747528076e-05, -8.750706911087036e-06, 1.564621925354004e-06, 1.1879950761795044e-05, 2.2195279598236084e-05, 3.2510608434677124e-05, 4.2825937271118164e-05, 5.3141266107559204e-05, 6.345659494400024e-05, 7.377192378044128e-05, 8.408725261688232e-05, 9.440258145332336e-05, 0.0001047179102897644, 0.00011503323912620544, 0.00012534856796264648, 0.00013566389679908752, 0.00014597922563552856, 0.0001562945544719696, 0.00016660988330841064, 0.00017692521214485168, 0.00018724054098129272, 0.00019755586981773376, 0.0002078711986541748, 0.00021818652749061584, 0.00022850185632705688, 0.00023881718516349792, 0.00024913251399993896, 0.00025944784283638, 0.00026976317167282104, 0.0002800785005092621, 0.0002903938293457031]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 9.0, 2.0, 4.0, 10.0, 16.0, 14.0, 30.0, 31.0, 59.0, 86.0, 167.0, 371.0, 949.0, 120268.0, 924132.0, 1533.0, 401.0, 182.0, 96.0, 60.0, 30.0, 22.0, 15.0, 10.0, 6.0, 9.0, 6.0, 3.0, 11.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005306243896484375, -0.005117475986480713, -0.004928708076477051, -0.004739940166473389, -0.0045511722564697266, -0.0043624043464660645, -0.004173636436462402, -0.00398486852645874, -0.003796100616455078, -0.003607332706451416, -0.003418564796447754, -0.003229796886444092, -0.0030410289764404297, -0.0028522610664367676, -0.0026634931564331055, -0.0024747252464294434, -0.0022859573364257812, -0.002097189426422119, -0.001908421516418457, -0.001719653606414795, -0.0015308856964111328, -0.0013421177864074707, -0.0011533498764038086, -0.0009645819664001465, -0.0007758140563964844, -0.0005870461463928223, -0.00039827823638916016, -0.00020951032638549805, -2.0742416381835938e-05, 0.00016802549362182617, 0.0003567934036254883, 0.0005455613136291504, 0.0007343292236328125, 0.0009230971336364746, 0.0011118650436401367, 0.0013006329536437988, 0.001489400863647461, 0.001678168773651123, 0.0018669366836547852, 0.0020557045936584473, 0.0022444725036621094, 0.0024332404136657715, 0.0026220083236694336, 0.0028107762336730957, 0.002999544143676758, 0.00318831205368042, 0.003377079963684082, 0.003565847873687744, 0.0037546157836914062, 0.003943383693695068, 0.0041321516036987305, 0.004320919513702393, 0.004509687423706055, 0.004698455333709717, 0.004887223243713379, 0.005075991153717041, 0.005264759063720703, 0.005453526973724365, 0.005642294883728027, 0.0058310627937316895, 0.0060198307037353516, 0.006208598613739014, 0.006397366523742676, 0.006586134433746338, 0.00677490234375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 9.0, 18.0, 22.0, 33.0, 54.0, 76.0, 113.0, 128.0, 144.0, 112.0, 93.0, 70.0, 49.0, 26.0, 17.0, 13.0, 11.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00020413870515767485, -0.0001996419596252963, -0.00019514521409291774, -0.00019064845400862396, -0.0001861517084762454, -0.00018165496294386685, -0.0001771582174114883, -0.00017266147187910974, -0.00016816472634673119, -0.00016366798081435263, -0.00015917123528197408, -0.0001546744751976803, -0.00015017772966530174, -0.00014568098413292319, -0.00014118423860054463, -0.00013668749306816608, -0.0001321907329838723, -0.00012769398745149374, -0.00012319724191911519, -0.00011870048911077902, -0.00011420373630244285, -0.0001097069907700643, -0.00010521024523768574, -0.00010071349970530719, -9.621674689697102e-05, -9.172000136459246e-05, -8.72232485562563e-05, -8.272650302387774e-05, -7.822975749149919e-05, -7.373300468316302e-05, -6.923625915078446e-05, -6.47395063424483e-05, -6.024277536198497e-05, -5.574602619162761e-05, -5.1249277021270245e-05, -4.675253148889169e-05, -4.225578231853433e-05, -3.775903314817697e-05, -3.3262287615798414e-05, -2.8765538445441052e-05, -2.426878927508369e-05, -1.977204010472633e-05, -1.527529275335837e-05, -1.0778544492495712e-05, -6.281796231633052e-06, -1.7850470612756908e-06, 2.711700290092267e-06, 7.208447641460225e-06, 1.1705196811817586e-05, 1.6201945982174948e-05, 2.0698693333542906e-05, 2.5195440684910864e-05, 2.9692189855268225e-05, 3.4188939025625587e-05, 3.868568455800414e-05, 4.31824337283615e-05, 4.7679182898718864e-05, 5.2175932069076225e-05, 5.6672681239433587e-05, 6.116942677181214e-05, 6.56661723041907e-05, 7.016292511252686e-05, 7.465967064490542e-05, 7.915642345324159e-05, 8.365316898562014e-05]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 3.0, 6.0, 9.0, 9.0, 9.0, 14.0, 15.0, 12.0, 10.0, 22.0, 22.0, 32.0, 31.0, 30.0, 31.0, 30.0, 39.0, 40.0, 35.0, 32.0, 29.0, 37.0, 34.0, 33.0, 44.0, 39.0, 35.0, 33.0, 32.0, 29.0, 31.0, 27.0, 27.0, 20.0, 17.0, 16.0, 17.0, 8.0, 12.0, 9.0, 8.0, 12.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.161233901977539e-05, -8.865073323249817e-05, -8.568912744522095e-05, -8.272752165794373e-05, -7.97659158706665e-05, -7.680431008338928e-05, -7.384270429611206e-05, -7.088109850883484e-05, -6.791949272155762e-05, -6.49578869342804e-05, -6.199628114700317e-05, -5.903467535972595e-05, -5.607306957244873e-05, -5.311146378517151e-05, -5.014985799789429e-05, -4.7188252210617065e-05, -4.4226646423339844e-05, -4.126504063606262e-05, -3.83034348487854e-05, -3.534182906150818e-05, -3.238022327423096e-05, -2.9418617486953735e-05, -2.6457011699676514e-05, -2.3495405912399292e-05, -2.053380012512207e-05, -1.757219433784485e-05, -1.4610588550567627e-05, -1.1648982763290405e-05, -8.687376976013184e-06, -5.725771188735962e-06, -2.7641654014587402e-06, 1.9744038581848145e-07, 3.159046173095703e-06, 6.120651960372925e-06, 9.082257747650146e-06, 1.2043863534927368e-05, 1.500546932220459e-05, 1.796707510948181e-05, 2.0928680896759033e-05, 2.3890286684036255e-05, 2.6851892471313477e-05, 2.9813498258590698e-05, 3.277510404586792e-05, 3.573670983314514e-05, 3.869831562042236e-05, 4.1659921407699585e-05, 4.462152719497681e-05, 4.758313298225403e-05, 5.054473876953125e-05, 5.350634455680847e-05, 5.646795034408569e-05, 5.9429556131362915e-05, 6.239116191864014e-05, 6.535276770591736e-05, 6.831437349319458e-05, 7.12759792804718e-05, 7.423758506774902e-05, 7.719919085502625e-05, 8.016079664230347e-05, 8.312240242958069e-05, 8.608400821685791e-05, 8.904561400413513e-05, 9.200721979141235e-05, 9.496882557868958e-05, 9.79304313659668e-05]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 3.0, 2.0, 6.0, 7.0, 5.0, 15.0, 17.0, 17.0, 17.0, 25.0, 25.0, 27.0, 34.0, 24.0, 37.0, 45.0, 37.0, 42.0, 62.0, 48.0, 36.0, 30.0, 44.0, 46.0, 38.0, 38.0, 34.0, 33.0, 25.0, 27.0, 30.0, 17.0, 24.0, 15.0, 8.0, 16.0, 9.0, 9.0, 7.0, 2.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3515625, -7.1251220703125, -6.898681640625, -6.6722412109375, -6.44580078125, -6.2193603515625, -5.992919921875, -5.7664794921875, -5.5400390625, -5.3135986328125, -5.087158203125, -4.8607177734375, -4.63427734375, -4.4078369140625, -4.181396484375, -3.9549560546875, -3.728515625, -3.5020751953125, -3.275634765625, -3.0491943359375, -2.82275390625, -2.5963134765625, -2.369873046875, -2.1434326171875, -1.9169921875, -1.6905517578125, -1.464111328125, -1.2376708984375, -1.01123046875, -0.7847900390625, -0.558349609375, -0.3319091796875, -0.10546875, 0.1209716796875, 0.347412109375, 0.5738525390625, 0.80029296875, 1.0267333984375, 1.253173828125, 1.4796142578125, 1.7060546875, 1.9324951171875, 2.158935546875, 2.3853759765625, 2.61181640625, 2.8382568359375, 3.064697265625, 3.2911376953125, 3.517578125, 3.7440185546875, 3.970458984375, 4.1968994140625, 4.42333984375, 4.6497802734375, 4.876220703125, 5.1026611328125, 5.3291015625, 5.5555419921875, 5.781982421875, 6.0084228515625, 6.23486328125, 6.4613037109375, 6.687744140625, 6.9141845703125, 7.140625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 5.0, 4.0, 9.0, 12.0, 15.0, 24.0, 17.0, 39.0, 41.0, 81.0, 114.0, 152.0, 209.0, 293.0, 400.0, 632.0, 881.0, 1436.0, 3082.0, 9379.0, 45160.0, 280564.0, 552357.0, 121644.0, 20951.0, 5372.0, 2087.0, 1135.0, 765.0, 508.0, 340.0, 230.0, 156.0, 140.0, 94.0, 59.0, 50.0, 34.0, 17.0, 21.0, 17.0, 6.0, 10.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9453125, -14.482177734375, -14.01904296875, -13.555908203125, -13.0927734375, -12.629638671875, -12.16650390625, -11.703369140625, -11.240234375, -10.777099609375, -10.31396484375, -9.850830078125, -9.3876953125, -8.924560546875, -8.46142578125, -7.998291015625, -7.53515625, -7.072021484375, -6.60888671875, -6.145751953125, -5.6826171875, -5.219482421875, -4.75634765625, -4.293212890625, -3.830078125, -3.366943359375, -2.90380859375, -2.440673828125, -1.9775390625, -1.514404296875, -1.05126953125, -0.588134765625, -0.125, 0.338134765625, 0.80126953125, 1.264404296875, 1.7275390625, 2.190673828125, 2.65380859375, 3.116943359375, 3.580078125, 4.043212890625, 4.50634765625, 4.969482421875, 5.4326171875, 5.895751953125, 6.35888671875, 6.822021484375, 7.28515625, 7.748291015625, 8.21142578125, 8.674560546875, 9.1376953125, 9.600830078125, 10.06396484375, 10.527099609375, 10.990234375, 11.453369140625, 11.91650390625, 12.379638671875, 12.8427734375, 13.305908203125, 13.76904296875, 14.232177734375, 14.6953125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 0.0, 7.0, 5.0, 10.0, 11.0, 12.0, 7.0, 17.0, 23.0, 32.0, 25.0, 34.0, 35.0, 64.0, 54.0, 72.0, 147.0, 313.0, 1469.0, 220.0, 104.0, 64.0, 53.0, 52.0, 28.0, 34.0, 34.0, 20.0, 23.0, 13.0, 13.0, 10.0, 13.0, 7.0, 8.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.90625, -16.348876953125, -15.79150390625, -15.234130859375, -14.6767578125, -14.119384765625, -13.56201171875, -13.004638671875, -12.447265625, -11.889892578125, -11.33251953125, -10.775146484375, -10.2177734375, -9.660400390625, -9.10302734375, -8.545654296875, -7.98828125, -7.430908203125, -6.87353515625, -6.316162109375, -5.7587890625, -5.201416015625, -4.64404296875, -4.086669921875, -3.529296875, -2.971923828125, -2.41455078125, -1.857177734375, -1.2998046875, -0.742431640625, -0.18505859375, 0.372314453125, 0.9296875, 1.487060546875, 2.04443359375, 2.601806640625, 3.1591796875, 3.716552734375, 4.27392578125, 4.831298828125, 5.388671875, 5.946044921875, 6.50341796875, 7.060791015625, 7.6181640625, 8.175537109375, 8.73291015625, 9.290283203125, 9.84765625, 10.405029296875, 10.96240234375, 11.519775390625, 12.0771484375, 12.634521484375, 13.19189453125, 13.749267578125, 14.306640625, 14.864013671875, 15.42138671875, 15.978759765625, 16.5361328125, 17.093505859375, 17.65087890625, 18.208251953125, 18.765625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 4.0, 7.0, 8.0, 20.0, 15.0, 15.0, 20.0, 41.0, 47.0, 77.0, 120.0, 203.0, 368.0, 687.0, 1953.0, 2818998.0, 319889.0, 1678.0, 681.0, 362.0, 191.0, 90.0, 72.0, 41.0, 29.0, 18.0, 14.0, 15.0, 7.0, 10.0, 11.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-82.3125, -79.8125, -77.3125, -74.8125, -72.3125, -69.8125, -67.3125, -64.8125, -62.3125, -59.8125, -57.3125, -54.8125, -52.3125, -49.8125, -47.3125, -44.8125, -42.3125, -39.8125, -37.3125, -34.8125, -32.3125, -29.8125, -27.3125, -24.8125, -22.3125, -19.8125, -17.3125, -14.8125, -12.3125, -9.8125, -7.3125, -4.8125, -2.3125, 0.1875, 2.6875, 5.1875, 7.6875, 10.1875, 12.6875, 15.1875, 17.6875, 20.1875, 22.6875, 25.1875, 27.6875, 30.1875, 32.6875, 35.1875, 37.6875, 40.1875, 42.6875, 45.1875, 47.6875, 50.1875, 52.6875, 55.1875, 57.6875, 60.1875, 62.6875, 65.1875, 67.6875, 70.1875, 72.6875, 75.1875, 77.6875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 177.0, 634.0, 186.0, 10.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.6464385986328, -137.5465850830078, -131.44671630859375, -125.34686279296875, -119.24700164794922, -113.14714050292969, -107.04728698730469, -100.94742584228516, -94.84756469726562, -88.7477035522461, -82.64784240722656, -76.54798889160156, -70.44812774658203, -64.3482666015625, -58.248409271240234, -52.14855194091797, -46.04869079589844, -39.948829650878906, -33.84897232055664, -27.749113082885742, -21.649253845214844, -15.549394607543945, -9.449535369873047, -3.3496780395507812, 2.75018310546875, 8.850042343139648, 14.949901580810547, 21.049760818481445, 27.149620056152344, 33.249481201171875, 39.34933853149414, 45.449195861816406, 51.54905700683594, 57.64891815185547, 63.748775482177734, 69.8486328125, 75.94849395751953, 82.04835510253906, 88.14820861816406, 94.2480697631836, 100.34793090820312, 106.44779205322266, 112.54765319824219, 118.64750671386719, 124.74736785888672, 130.84722900390625, 136.94708251953125, 143.04693603515625, 149.1468048095703, 155.2466583251953, 161.34652709960938, 167.44638061523438, 173.54623413085938, 179.64610290527344, 185.74595642089844, 191.8458251953125, 197.9456787109375, 204.0455322265625, 210.14540100097656, 216.24525451660156, 222.34512329101562, 228.44497680664062, 234.54483032226562, 240.64468383789062, 246.7445526123047]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 6.0, 11.0, 9.0, 6.0, 6.0, 10.0, 9.0, 9.0, 17.0, 19.0, 19.0, 25.0, 26.0, 26.0, 36.0, 34.0, 36.0, 33.0, 32.0, 47.0, 41.0, 44.0, 47.0, 45.0, 49.0, 39.0, 36.0, 26.0, 31.0, 24.0, 35.0, 20.0, 23.0, 19.0, 12.0, 13.0, 19.0, 9.0, 10.0, 6.0, 1.0, 10.0, 5.0, 6.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-47.49513244628906, -46.16862869262695, -44.842124938964844, -43.515625, -42.18912124633789, -40.86261749267578, -39.53611373901367, -38.20960998535156, -36.88310623168945, -35.556602478027344, -34.230098724365234, -32.903594970703125, -31.57709312438965, -30.250591278076172, -28.924087524414062, -27.597583770751953, -26.271081924438477, -24.944578170776367, -23.61807632446289, -22.29157257080078, -20.965068817138672, -19.638565063476562, -18.312063217163086, -16.985559463500977, -15.659056663513184, -14.33255386352539, -13.006050109863281, -11.679547309875488, -10.353044509887695, -9.026540756225586, -7.700037956237793, -6.373534202575684, -5.047031402587891, -3.7205281257629395, -2.3940250873565674, -1.0675220489501953, 0.25898122787475586, 1.585484504699707, 2.9119873046875, 4.238491058349609, 5.564993858337402, 6.8914971351623535, 8.218000411987305, 9.544503211975098, 10.87100601196289, 12.197509765625, 13.524012565612793, 14.850516319274902, 16.177019119262695, 17.503522872924805, 18.83002471923828, 20.15652847290039, 21.4830322265625, 22.80953598022461, 24.136037826538086, 25.462541580200195, 26.789043426513672, 28.11554718017578, 29.442049026489258, 30.768552780151367, 32.095054626464844, 33.42155838012695, 34.74806213378906, 36.07456588745117, 37.40106964111328]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 9.0, 6.0, 10.0, 9.0, 14.0, 12.0, 12.0, 21.0, 23.0, 35.0, 25.0, 33.0, 28.0, 26.0, 37.0, 39.0, 34.0, 56.0, 34.0, 42.0, 40.0, 40.0, 43.0, 39.0, 38.0, 35.0, 29.0, 34.0, 37.0, 15.0, 23.0, 24.0, 18.0, 10.0, 16.0, 6.0, 5.0, 6.0, 7.0, 8.0, 4.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5234375, -6.30291748046875, -6.0823974609375, -5.86187744140625, -5.641357421875, -5.42083740234375, -5.2003173828125, -4.97979736328125, -4.75927734375, -4.53875732421875, -4.3182373046875, -4.09771728515625, -3.877197265625, -3.65667724609375, -3.4361572265625, -3.21563720703125, -2.9951171875, -2.77459716796875, -2.5540771484375, -2.33355712890625, -2.113037109375, -1.89251708984375, -1.6719970703125, -1.45147705078125, -1.23095703125, -1.01043701171875, -0.7899169921875, -0.56939697265625, -0.348876953125, -0.12835693359375, 0.0921630859375, 0.31268310546875, 0.533203125, 0.75372314453125, 0.9742431640625, 1.19476318359375, 1.415283203125, 1.63580322265625, 1.8563232421875, 2.07684326171875, 2.29736328125, 2.51788330078125, 2.7384033203125, 2.95892333984375, 3.179443359375, 3.39996337890625, 3.6204833984375, 3.84100341796875, 4.0615234375, 4.28204345703125, 4.5025634765625, 4.72308349609375, 4.943603515625, 5.16412353515625, 5.3846435546875, 5.60516357421875, 5.82568359375, 6.04620361328125, 6.2667236328125, 6.48724365234375, 6.707763671875, 6.92828369140625, 7.1488037109375, 7.36932373046875, 7.58984375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 5.0, 7.0, 11.0, 11.0, 18.0, 26.0, 30.0, 76.0, 68.0, 138.0, 148.0, 197.0, 309.0, 438.0, 639.0, 1006.0, 1665.0, 3426.0, 8617.0, 29884.0, 195266.0, 1706759.0, 1959980.0, 233557.0, 33713.0, 9515.0, 3662.0, 1873.0, 1081.0, 669.0, 410.0, 313.0, 243.0, 160.0, 96.0, 81.0, 57.0, 42.0, 27.0, 19.0, 14.0, 7.0, 8.0, 1.0, 7.0, 5.0, 2.0], "bins": [-18.453125, -17.98046875, -17.5078125, -17.03515625, -16.5625, -16.08984375, -15.6171875, -15.14453125, -14.671875, -14.19921875, -13.7265625, -13.25390625, -12.78125, -12.30859375, -11.8359375, -11.36328125, -10.890625, -10.41796875, -9.9453125, -9.47265625, -9.0, -8.52734375, -8.0546875, -7.58203125, -7.109375, -6.63671875, -6.1640625, -5.69140625, -5.21875, -4.74609375, -4.2734375, -3.80078125, -3.328125, -2.85546875, -2.3828125, -1.91015625, -1.4375, -0.96484375, -0.4921875, -0.01953125, 0.453125, 0.92578125, 1.3984375, 1.87109375, 2.34375, 2.81640625, 3.2890625, 3.76171875, 4.234375, 4.70703125, 5.1796875, 5.65234375, 6.125, 6.59765625, 7.0703125, 7.54296875, 8.015625, 8.48828125, 8.9609375, 9.43359375, 9.90625, 10.37890625, 10.8515625, 11.32421875, 11.796875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 15.0, 11.0, 25.0, 31.0, 50.0, 69.0, 79.0, 133.0, 205.0, 347.0, 636.0, 836.0, 601.0, 338.0, 220.0, 150.0, 107.0, 73.0, 54.0, 27.0, 28.0, 17.0, 10.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8359375, -9.2735595703125, -8.711181640625, -8.1488037109375, -7.58642578125, -7.0240478515625, -6.461669921875, -5.8992919921875, -5.3369140625, -4.7745361328125, -4.212158203125, -3.6497802734375, -3.08740234375, -2.5250244140625, -1.962646484375, -1.4002685546875, -0.837890625, -0.2755126953125, 0.286865234375, 0.8492431640625, 1.41162109375, 1.9739990234375, 2.536376953125, 3.0987548828125, 3.6611328125, 4.2235107421875, 4.785888671875, 5.3482666015625, 5.91064453125, 6.4730224609375, 7.035400390625, 7.5977783203125, 8.16015625, 8.7225341796875, 9.284912109375, 9.8472900390625, 10.40966796875, 10.9720458984375, 11.534423828125, 12.0968017578125, 12.6591796875, 13.2215576171875, 13.783935546875, 14.3463134765625, 14.90869140625, 15.4710693359375, 16.033447265625, 16.5958251953125, 17.158203125, 17.7205810546875, 18.282958984375, 18.8453369140625, 19.40771484375, 19.9700927734375, 20.532470703125, 21.0948486328125, 21.6572265625, 22.2196044921875, 22.781982421875, 23.3443603515625, 23.90673828125, 24.4691162109375, 25.031494140625, 25.5938720703125, 26.15625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 9.0, 9.0, 16.0, 17.0, 24.0, 23.0, 47.0, 95.0, 114.0, 231.0, 523.0, 1222.0, 4202.0, 25103.0, 384727.0, 3580564.0, 176849.0, 15691.0, 2938.0, 948.0, 406.0, 202.0, 107.0, 78.0, 46.0, 30.0, 14.0, 11.0, 9.0, 11.0, 7.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.203125, -28.241943359375, -27.28076171875, -26.319580078125, -25.3583984375, -24.397216796875, -23.43603515625, -22.474853515625, -21.513671875, -20.552490234375, -19.59130859375, -18.630126953125, -17.6689453125, -16.707763671875, -15.74658203125, -14.785400390625, -13.82421875, -12.863037109375, -11.90185546875, -10.940673828125, -9.9794921875, -9.018310546875, -8.05712890625, -7.095947265625, -6.134765625, -5.173583984375, -4.21240234375, -3.251220703125, -2.2900390625, -1.328857421875, -0.36767578125, 0.593505859375, 1.5546875, 2.515869140625, 3.47705078125, 4.438232421875, 5.3994140625, 6.360595703125, 7.32177734375, 8.282958984375, 9.244140625, 10.205322265625, 11.16650390625, 12.127685546875, 13.0888671875, 14.050048828125, 15.01123046875, 15.972412109375, 16.93359375, 17.894775390625, 18.85595703125, 19.817138671875, 20.7783203125, 21.739501953125, 22.70068359375, 23.661865234375, 24.623046875, 25.584228515625, 26.54541015625, 27.506591796875, 28.4677734375, 29.428955078125, 30.39013671875, 31.351318359375, 32.3125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 56.0, 821.0, 135.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-681.2179565429688, -663.0795288085938, -644.9411010742188, -626.8026733398438, -608.6642456054688, -590.5258178710938, -572.3873901367188, -554.2490234375, -536.110595703125, -517.97216796875, -499.833740234375, -481.6953125, -463.556884765625, -445.41845703125, -427.2800598144531, -409.1416320800781, -391.003173828125, -372.86474609375, -354.726318359375, -336.587890625, -318.449462890625, -300.31103515625, -282.1726379394531, -264.0342102050781, -245.89578247070312, -227.75735473632812, -209.61892700195312, -191.4805145263672, -173.3420867919922, -155.2036590576172, -137.06524658203125, -118.92681884765625, -100.78842163085938, -82.64999389648438, -64.5115737915039, -46.37314987182617, -28.234725952148438, -10.096298217773438, 8.042121887207031, 26.1805419921875, 44.3189697265625, 62.457393646240234, 80.59581756591797, 98.73423767089844, 116.87266540527344, 135.01109313964844, 153.14950561523438, 171.28793334960938, 189.42636108398438, 207.56478881835938, 225.70321655273438, 243.8416290283203, 261.98004150390625, 280.11846923828125, 298.25689697265625, 316.39532470703125, 334.53375244140625, 352.67218017578125, 370.81060791015625, 388.94903564453125, 407.08746337890625, 425.22589111328125, 443.3642883300781, 461.5027160644531, 479.6411437988281]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 10.0, 13.0, 12.0, 16.0, 12.0, 23.0, 14.0, 23.0, 18.0, 29.0, 35.0, 35.0, 38.0, 34.0, 40.0, 44.0, 49.0, 48.0, 38.0, 46.0, 44.0, 44.0, 42.0, 42.0, 29.0, 28.0, 26.0, 30.0, 17.0, 21.0, 15.0, 14.0, 13.0, 17.0, 4.0, 8.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.875518798828125, -46.12812042236328, -44.38072204589844, -42.633323669433594, -40.88592529296875, -39.138526916503906, -37.39112854003906, -35.64373016357422, -33.896331787109375, -32.14893341064453, -30.401535034179688, -28.654136657714844, -26.90673828125, -25.159339904785156, -23.411941528320312, -21.66454315185547, -19.917144775390625, -18.16974639892578, -16.422348022460938, -14.674949645996094, -12.92755126953125, -11.180152893066406, -9.432754516601562, -7.685356140136719, -5.937957763671875, -4.190559387207031, -2.4431610107421875, -0.6957626342773438, 1.0516357421875, 2.7990341186523438, 4.5464324951171875, 6.293830871582031, 8.041229248046875, 9.788627624511719, 11.536026000976562, 13.283424377441406, 15.03082275390625, 16.778221130371094, 18.525619506835938, 20.27301788330078, 22.020416259765625, 23.76781463623047, 25.515213012695312, 27.262611389160156, 29.010009765625, 30.757408142089844, 32.50480651855469, 34.25220489501953, 35.999603271484375, 37.74700164794922, 39.49440002441406, 41.241798400878906, 42.98919677734375, 44.736595153808594, 46.48399353027344, 48.23139190673828, 49.978790283203125, 51.72618865966797, 53.47358703613281, 55.220985412597656, 56.9683837890625, 58.715782165527344, 60.46318054199219, 62.21057891845703, 63.957977294921875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 4.0, 2.0, 5.0, 2.0, 3.0, 5.0, 8.0, 14.0, 24.0, 20.0, 22.0, 28.0, 27.0, 29.0, 35.0, 35.0, 53.0, 40.0, 31.0, 59.0, 48.0, 58.0, 37.0, 40.0, 31.0, 56.0, 34.0, 51.0, 28.0, 30.0, 25.0, 19.0, 23.0, 14.0, 19.0, 5.0, 6.0, 9.0, 5.0, 1.0, 7.0, 9.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0390625, -6.8204345703125, -6.601806640625, -6.3831787109375, -6.16455078125, -5.9459228515625, -5.727294921875, -5.5086669921875, -5.2900390625, -5.0714111328125, -4.852783203125, -4.6341552734375, -4.41552734375, -4.1968994140625, -3.978271484375, -3.7596435546875, -3.541015625, -3.3223876953125, -3.103759765625, -2.8851318359375, -2.66650390625, -2.4478759765625, -2.229248046875, -2.0106201171875, -1.7919921875, -1.5733642578125, -1.354736328125, -1.1361083984375, -0.91748046875, -0.6988525390625, -0.480224609375, -0.2615966796875, -0.04296875, 0.1756591796875, 0.394287109375, 0.6129150390625, 0.83154296875, 1.0501708984375, 1.268798828125, 1.4874267578125, 1.7060546875, 1.9246826171875, 2.143310546875, 2.3619384765625, 2.58056640625, 2.7991943359375, 3.017822265625, 3.2364501953125, 3.455078125, 3.6737060546875, 3.892333984375, 4.1109619140625, 4.32958984375, 4.5482177734375, 4.766845703125, 4.9854736328125, 5.2041015625, 5.4227294921875, 5.641357421875, 5.8599853515625, 6.07861328125, 6.2972412109375, 6.515869140625, 6.7344970703125, 6.953125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 26.0, 22.0, 37.0, 69.0, 84.0, 112.0, 192.0, 238.0, 403.0, 525.0, 845.0, 1150.0, 1829.0, 2803.0, 4170.0, 6552.0, 10267.0, 16707.0, 28188.0, 48480.0, 90425.0, 185873.0, 310203.0, 153485.0, 77248.0, 42682.0, 24531.0, 14969.0, 9338.0, 5829.0, 3784.0, 2472.0, 1607.0, 1082.0, 744.0, 503.0, 341.0, 204.0, 195.0, 93.0, 83.0, 38.0, 40.0, 18.0, 15.0, 13.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.291748046875, -0.28273773193359375, -0.2737274169921875, -0.26471710205078125, -0.255706787109375, -0.24669647216796875, -0.2376861572265625, -0.22867584228515625, -0.21966552734375, -0.21065521240234375, -0.2016448974609375, -0.19263458251953125, -0.183624267578125, -0.17461395263671875, -0.1656036376953125, -0.15659332275390625, -0.1475830078125, -0.13857269287109375, -0.1295623779296875, -0.12055206298828125, -0.111541748046875, -0.10253143310546875, -0.0935211181640625, -0.08451080322265625, -0.07550048828125, -0.06649017333984375, -0.0574798583984375, -0.04846954345703125, -0.039459228515625, -0.03044891357421875, -0.0214385986328125, -0.01242828369140625, -0.00341796875, 0.00559234619140625, 0.0146026611328125, 0.02361297607421875, 0.032623291015625, 0.04163360595703125, 0.0506439208984375, 0.05965423583984375, 0.06866455078125, 0.07767486572265625, 0.0866851806640625, 0.09569549560546875, 0.104705810546875, 0.11371612548828125, 0.1227264404296875, 0.13173675537109375, 0.1407470703125, 0.14975738525390625, 0.1587677001953125, 0.16777801513671875, 0.176788330078125, 0.18579864501953125, 0.1948089599609375, 0.20381927490234375, 0.21282958984375, 0.22183990478515625, 0.2308502197265625, 0.23986053466796875, 0.248870849609375, 0.25788116455078125, 0.2668914794921875, 0.27590179443359375, 0.284912109375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 4.0, 8.0, 8.0, 7.0, 9.0, 21.0, 25.0, 22.0, 23.0, 20.0, 30.0, 26.0, 33.0, 32.0, 35.0, 39.0, 44.0, 43.0, 48.0, 1070.0, 37.0, 38.0, 41.0, 40.0, 35.0, 29.0, 36.0, 26.0, 30.0, 23.0, 15.0, 16.0, 17.0, 18.0, 13.0, 13.0, 3.0, 5.0, 6.0, 4.0, 9.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.4296875, -4.29766845703125, -4.1656494140625, -4.03363037109375, -3.901611328125, -3.76959228515625, -3.6375732421875, -3.50555419921875, -3.37353515625, -3.24151611328125, -3.1094970703125, -2.97747802734375, -2.845458984375, -2.71343994140625, -2.5814208984375, -2.44940185546875, -2.3173828125, -2.18536376953125, -2.0533447265625, -1.92132568359375, -1.789306640625, -1.65728759765625, -1.5252685546875, -1.39324951171875, -1.26123046875, -1.12921142578125, -0.9971923828125, -0.86517333984375, -0.733154296875, -0.60113525390625, -0.4691162109375, -0.33709716796875, -0.205078125, -0.07305908203125, 0.0589599609375, 0.19097900390625, 0.322998046875, 0.45501708984375, 0.5870361328125, 0.71905517578125, 0.85107421875, 0.98309326171875, 1.1151123046875, 1.24713134765625, 1.379150390625, 1.51116943359375, 1.6431884765625, 1.77520751953125, 1.9072265625, 2.03924560546875, 2.1712646484375, 2.30328369140625, 2.435302734375, 2.56732177734375, 2.6993408203125, 2.83135986328125, 2.96337890625, 3.09539794921875, 3.2274169921875, 3.35943603515625, 3.491455078125, 3.62347412109375, 3.7554931640625, 3.88751220703125, 4.01953125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 4.0, 3.0, 13.0, 30.0, 34.0, 59.0, 100.0, 130.0, 167.0, 231.0, 382.0, 503.0, 743.0, 988.0, 1511.0, 2276.0, 3170.0, 4605.0, 7087.0, 10905.0, 16619.0, 26677.0, 43204.0, 71334.0, 124210.0, 1281843.0, 212140.0, 112676.0, 65409.0, 39698.0, 24215.0, 15533.0, 9782.0, 6648.0, 4418.0, 2981.0, 2011.0, 1531.0, 1014.0, 672.0, 457.0, 345.0, 265.0, 167.0, 127.0, 79.0, 40.0, 38.0, 18.0, 21.0, 7.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2044677734375, -0.1980609893798828, -0.19165420532226562, -0.18524742126464844, -0.17884063720703125, -0.17243385314941406, -0.16602706909179688, -0.1596202850341797, -0.1532135009765625, -0.1468067169189453, -0.14039993286132812, -0.13399314880371094, -0.12758636474609375, -0.12117958068847656, -0.11477279663085938, -0.10836601257324219, -0.101959228515625, -0.09555244445800781, -0.08914566040039062, -0.08273887634277344, -0.07633209228515625, -0.06992530822753906, -0.06351852416992188, -0.05711174011230469, -0.0507049560546875, -0.04429817199707031, -0.037891387939453125, -0.03148460388183594, -0.02507781982421875, -0.018671035766601562, -0.012264251708984375, -0.0058574676513671875, 0.00054931640625, 0.0069561004638671875, 0.013362884521484375, 0.019769668579101562, 0.02617645263671875, 0.03258323669433594, 0.038990020751953125, 0.04539680480957031, 0.0518035888671875, 0.05821037292480469, 0.06461715698242188, 0.07102394104003906, 0.07743072509765625, 0.08383750915527344, 0.09024429321289062, 0.09665107727050781, 0.103057861328125, 0.10946464538574219, 0.11587142944335938, 0.12227821350097656, 0.12868499755859375, 0.13509178161621094, 0.14149856567382812, 0.1479053497314453, 0.1543121337890625, 0.1607189178466797, 0.16712570190429688, 0.17353248596191406, 0.17993927001953125, 0.18634605407714844, 0.19275283813476562, 0.1991596221923828, 0.20556640625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 1.0, 6.0, 4.0, 0.0, 8.0, 6.0, 5.0, 7.0, 5.0, 11.0, 10.0, 11.0, 19.0, 14.0, 20.0, 29.0, 30.0, 47.0, 78.0, 168.0, 148.0, 94.0, 60.0, 43.0, 38.0, 28.0, 27.0, 14.0, 12.0, 9.0, 11.0, 6.0, 4.0, 4.0, 6.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.00025463104248046875, -0.0002467148005962372, -0.00023879855871200562, -0.00023088231682777405, -0.00022296607494354248, -0.0002150498330593109, -0.00020713359117507935, -0.00019921734929084778, -0.0001913011074066162, -0.00018338486552238464, -0.00017546862363815308, -0.0001675523817539215, -0.00015963613986968994, -0.00015171989798545837, -0.0001438036561012268, -0.00013588741421699524, -0.00012797117233276367, -0.0001200549304485321, -0.00011213868856430054, -0.00010422244668006897, -9.63062047958374e-05, -8.838996291160583e-05, -8.047372102737427e-05, -7.25574791431427e-05, -6.464123725891113e-05, -5.6724995374679565e-05, -4.8808753490448e-05, -4.089251160621643e-05, -3.297626972198486e-05, -2.5060027837753296e-05, -1.714378595352173e-05, -9.227544069290161e-06, -1.3113021850585938e-06, 6.604939699172974e-06, 1.4521181583404541e-05, 2.243742346763611e-05, 3.0353665351867676e-05, 3.826990723609924e-05, 4.618614912033081e-05, 5.410239100456238e-05, 6.201863288879395e-05, 6.993487477302551e-05, 7.785111665725708e-05, 8.576735854148865e-05, 9.368360042572021e-05, 0.00010159984230995178, 0.00010951608419418335, 0.00011743232607841492, 0.00012534856796264648, 0.00013326480984687805, 0.00014118105173110962, 0.0001490972936153412, 0.00015701353549957275, 0.00016492977738380432, 0.0001728460192680359, 0.00018076226115226746, 0.00018867850303649902, 0.0001965947449207306, 0.00020451098680496216, 0.00021242722868919373, 0.0002203434705734253, 0.00022825971245765686, 0.00023617595434188843, 0.00024409219622612, 0.00025200843811035156]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 10.0, 7.0, 10.0, 8.0, 16.0, 20.0, 23.0, 29.0, 29.0, 39.0, 76.0, 90.0, 171.0, 262.0, 540.0, 3356.0, 982615.0, 59155.0, 1029.0, 386.0, 174.0, 138.0, 82.0, 51.0, 49.0, 32.0, 23.0, 22.0, 18.0, 14.0, 10.0, 7.0, 7.0, 8.0, 17.0, 7.0, 5.0, 6.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00449371337890625, -0.004352271556854248, -0.004210829734802246, -0.004069387912750244, -0.003927946090698242, -0.0037865042686462402, -0.0036450624465942383, -0.0035036206245422363, -0.0033621788024902344, -0.0032207369804382324, -0.0030792951583862305, -0.0029378533363342285, -0.0027964115142822266, -0.0026549696922302246, -0.0025135278701782227, -0.0023720860481262207, -0.0022306442260742188, -0.002089202404022217, -0.0019477605819702148, -0.0018063187599182129, -0.001664876937866211, -0.001523435115814209, -0.001381993293762207, -0.001240551471710205, -0.0010991096496582031, -0.0009576678276062012, -0.0008162260055541992, -0.0006747841835021973, -0.0005333423614501953, -0.00039190053939819336, -0.0002504587173461914, -0.00010901689529418945, 3.24249267578125e-05, 0.00017386674880981445, 0.0003153085708618164, 0.00045675039291381836, 0.0005981922149658203, 0.0007396340370178223, 0.0008810758590698242, 0.0010225176811218262, 0.0011639595031738281, 0.00130540132522583, 0.001446843147277832, 0.001588284969329834, 0.001729726791381836, 0.0018711686134338379, 0.00201261043548584, 0.002154052257537842, 0.0022954940795898438, 0.0024369359016418457, 0.0025783777236938477, 0.0027198195457458496, 0.0028612613677978516, 0.0030027031898498535, 0.0031441450119018555, 0.0032855868339538574, 0.0034270286560058594, 0.0035684704780578613, 0.0037099123001098633, 0.0038513541221618652, 0.003992795944213867, 0.004134237766265869, 0.004275679588317871, 0.004417121410369873, 0.004558563232421875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 23.0, 461.0, 495.0, 31.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002590591611806303, -0.00023027369752526283, -0.00020148824842181057, -0.00017270278476644307, -0.0001439173356629908, -0.00011513187200762331, -8.634640835225582e-05, -5.7560959248803556e-05, -2.8775495593436062e-05, 9.962604963220656e-09, 2.8795420803362504e-05, 5.758088082075119e-05, 8.636633720016107e-05, 0.00011515179357957095, 0.00014393725723493844, 0.0001727227063383907, 0.0002015081699937582, 0.0002302936336491257, 0.0002590790973044932, 0.0002878645318560302, 0.0003166499955113977, 0.0003454354591667652, 0.0003742209228221327, 0.0004030063864775002, 0.00043179182102903724, 0.00046057728468440473, 0.0004893627483397722, 0.0005181481828913093, 0.0005469336756505072, 0.0005757191102020442, 0.0006045046029612422, 0.0006332900375127792, 0.0006620755302719772, 0.0006908609648235142, 0.0007196464575827122, 0.0007484318921342492, 0.0007772173848934472, 0.0008060028194449842, 0.0008347883122041821, 0.0008635737467557192, 0.0008923591813072562, 0.0009211446158587933, 0.0009499301086179912, 0.0009787156013771892, 0.0010075010359287262, 0.0010362864704802632, 0.0010650719050318003, 0.0010938573395833373, 0.0011226428905501962, 0.0011514283251017332, 0.0011802137596532702, 0.0012089993106201291, 0.0012377847451716661, 0.0012665701797232032, 0.0012953556142747402, 0.0013241410488262773, 0.0013529264833778143, 0.0013817119179293513, 0.0014104973524808884, 0.0014392829034477472, 0.0014680683379992843, 0.0014968537725508213, 0.0015256392071023583, 0.0015544246416538954, 0.0015832101926207542]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 9.0, 7.0, 10.0, 17.0, 14.0, 19.0, 25.0, 15.0, 25.0, 25.0, 29.0, 37.0, 36.0, 29.0, 41.0, 49.0, 41.0, 30.0, 42.0, 47.0, 45.0, 37.0, 38.0, 31.0, 34.0, 33.0, 31.0, 33.0, 22.0, 20.0, 18.0, 25.0, 19.0, 11.0, 11.0, 12.0, 3.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0001271367073059082, -0.00012324098497629166, -0.00011934526264667511, -0.00011544954031705856, -0.00011155381798744202, -0.00010765809565782547, -0.00010376237332820892, -9.986665099859238e-05, -9.597092866897583e-05, -9.207520633935928e-05, -8.817948400974274e-05, -8.428376168012619e-05, -8.038803935050964e-05, -7.64923170208931e-05, -7.259659469127655e-05, -6.870087236166e-05, -6.480515003204346e-05, -6.090942770242691e-05, -5.7013705372810364e-05, -5.311798304319382e-05, -4.922226071357727e-05, -4.5326538383960724e-05, -4.143081605434418e-05, -3.753509372472763e-05, -3.3639371395111084e-05, -2.9743649065494537e-05, -2.584792673587799e-05, -2.1952204406261444e-05, -1.8056482076644897e-05, -1.416075974702835e-05, -1.0265037417411804e-05, -6.3693150877952576e-06, -2.473592758178711e-06, 1.4221295714378357e-06, 5.317851901054382e-06, 9.213574230670929e-06, 1.3109296560287476e-05, 1.7005018889904022e-05, 2.090074121952057e-05, 2.4796463549137115e-05, 2.8692185878753662e-05, 3.258790820837021e-05, 3.6483630537986755e-05, 4.03793528676033e-05, 4.427507519721985e-05, 4.8170797526836395e-05, 5.206651985645294e-05, 5.596224218606949e-05, 5.9857964515686035e-05, 6.375368684530258e-05, 6.764940917491913e-05, 7.154513150453568e-05, 7.544085383415222e-05, 7.933657616376877e-05, 8.323229849338531e-05, 8.712802082300186e-05, 9.102374315261841e-05, 9.491946548223495e-05, 9.88151878118515e-05, 0.00010271091014146805, 0.0001066066324710846, 0.00011050235480070114, 0.00011439807713031769, 0.00011829379945993423, 0.00012218952178955078]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 4.0, 2.0, 5.0, 2.0, 3.0, 5.0, 8.0, 14.0, 24.0, 20.0, 22.0, 28.0, 27.0, 29.0, 35.0, 35.0, 53.0, 40.0, 31.0, 59.0, 47.0, 59.0, 37.0, 40.0, 31.0, 56.0, 34.0, 51.0, 28.0, 30.0, 25.0, 19.0, 23.0, 14.0, 19.0, 5.0, 6.0, 9.0, 5.0, 1.0, 7.0, 9.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0390625, -6.8204345703125, -6.601806640625, -6.3831787109375, -6.16455078125, -5.9459228515625, -5.727294921875, -5.5086669921875, -5.2900390625, -5.0714111328125, -4.852783203125, -4.6341552734375, -4.41552734375, -4.1968994140625, -3.978271484375, -3.7596435546875, -3.541015625, -3.3223876953125, -3.103759765625, -2.8851318359375, -2.66650390625, -2.4478759765625, -2.229248046875, -2.0106201171875, -1.7919921875, -1.5733642578125, -1.354736328125, -1.1361083984375, -0.91748046875, -0.6988525390625, -0.480224609375, -0.2615966796875, -0.04296875, 0.1756591796875, 0.394287109375, 0.6129150390625, 0.83154296875, 1.0501708984375, 1.268798828125, 1.4874267578125, 1.7060546875, 1.9246826171875, 2.143310546875, 2.3619384765625, 2.58056640625, 2.7991943359375, 3.017822265625, 3.2364501953125, 3.455078125, 3.6737060546875, 3.892333984375, 4.1109619140625, 4.32958984375, 4.5482177734375, 4.766845703125, 4.9854736328125, 5.2041015625, 5.4227294921875, 5.641357421875, 5.8599853515625, 6.07861328125, 6.2972412109375, 6.515869140625, 6.7344970703125, 6.953125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 6.0, 9.0, 10.0, 23.0, 23.0, 37.0, 49.0, 49.0, 77.0, 101.0, 155.0, 250.0, 312.0, 460.0, 691.0, 1175.0, 2081.0, 4041.0, 9836.0, 38024.0, 420594.0, 506787.0, 43125.0, 10761.0, 4207.0, 2044.0, 1212.0, 766.0, 488.0, 331.0, 256.0, 176.0, 112.0, 79.0, 61.0, 42.0, 32.0, 23.0, 9.0, 9.0, 7.0, 8.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.421875, -18.833984375, -18.24609375, -17.658203125, -17.0703125, -16.482421875, -15.89453125, -15.306640625, -14.71875, -14.130859375, -13.54296875, -12.955078125, -12.3671875, -11.779296875, -11.19140625, -10.603515625, -10.015625, -9.427734375, -8.83984375, -8.251953125, -7.6640625, -7.076171875, -6.48828125, -5.900390625, -5.3125, -4.724609375, -4.13671875, -3.548828125, -2.9609375, -2.373046875, -1.78515625, -1.197265625, -0.609375, -0.021484375, 0.56640625, 1.154296875, 1.7421875, 2.330078125, 2.91796875, 3.505859375, 4.09375, 4.681640625, 5.26953125, 5.857421875, 6.4453125, 7.033203125, 7.62109375, 8.208984375, 8.796875, 9.384765625, 9.97265625, 10.560546875, 11.1484375, 11.736328125, 12.32421875, 12.912109375, 13.5, 14.087890625, 14.67578125, 15.263671875, 15.8515625, 16.439453125, 17.02734375, 17.615234375, 18.203125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 0.0, 3.0, 4.0, 11.0, 6.0, 11.0, 11.0, 24.0, 13.0, 16.0, 28.0, 23.0, 27.0, 32.0, 42.0, 47.0, 72.0, 101.0, 268.0, 1521.0, 252.0, 104.0, 74.0, 58.0, 50.0, 40.0, 30.0, 26.0, 25.0, 25.0, 14.0, 15.0, 15.0, 13.0, 11.0, 9.0, 1.0, 3.0, 8.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0], "bins": [-18.828125, -18.325439453125, -17.82275390625, -17.320068359375, -16.8173828125, -16.314697265625, -15.81201171875, -15.309326171875, -14.806640625, -14.303955078125, -13.80126953125, -13.298583984375, -12.7958984375, -12.293212890625, -11.79052734375, -11.287841796875, -10.78515625, -10.282470703125, -9.77978515625, -9.277099609375, -8.7744140625, -8.271728515625, -7.76904296875, -7.266357421875, -6.763671875, -6.260986328125, -5.75830078125, -5.255615234375, -4.7529296875, -4.250244140625, -3.74755859375, -3.244873046875, -2.7421875, -2.239501953125, -1.73681640625, -1.234130859375, -0.7314453125, -0.228759765625, 0.27392578125, 0.776611328125, 1.279296875, 1.781982421875, 2.28466796875, 2.787353515625, 3.2900390625, 3.792724609375, 4.29541015625, 4.798095703125, 5.30078125, 5.803466796875, 6.30615234375, 6.808837890625, 7.3115234375, 7.814208984375, 8.31689453125, 8.819580078125, 9.322265625, 9.824951171875, 10.32763671875, 10.830322265625, 11.3330078125, 11.835693359375, 12.33837890625, 12.841064453125, 13.34375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 10.0, 8.0, 14.0, 9.0, 16.0, 20.0, 22.0, 35.0, 56.0, 68.0, 94.0, 173.0, 269.0, 458.0, 887.0, 2457.0, 1548124.0, 1588433.0, 2486.0, 860.0, 444.0, 249.0, 158.0, 90.0, 67.0, 55.0, 28.0, 23.0, 22.0, 17.0, 7.0, 13.0, 6.0, 7.0, 7.0, 2.0, 6.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.4375, -46.6435546875, -44.849609375, -43.0556640625, -41.26171875, -39.4677734375, -37.673828125, -35.8798828125, -34.0859375, -32.2919921875, -30.498046875, -28.7041015625, -26.91015625, -25.1162109375, -23.322265625, -21.5283203125, -19.734375, -17.9404296875, -16.146484375, -14.3525390625, -12.55859375, -10.7646484375, -8.970703125, -7.1767578125, -5.3828125, -3.5888671875, -1.794921875, -0.0009765625, 1.79296875, 3.5869140625, 5.380859375, 7.1748046875, 8.96875, 10.7626953125, 12.556640625, 14.3505859375, 16.14453125, 17.9384765625, 19.732421875, 21.5263671875, 23.3203125, 25.1142578125, 26.908203125, 28.7021484375, 30.49609375, 32.2900390625, 34.083984375, 35.8779296875, 37.671875, 39.4658203125, 41.259765625, 43.0537109375, 44.84765625, 46.6416015625, 48.435546875, 50.2294921875, 52.0234375, 53.8173828125, 55.611328125, 57.4052734375, 59.19921875, 60.9931640625, 62.787109375, 64.5810546875, 66.375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 18.0, 120.0, 349.0, 339.0, 143.0, 31.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.62673950195312, -137.43357849121094, -134.24041748046875, -131.04725646972656, -127.85409545898438, -124.66093444824219, -121.4677734375, -118.27461242675781, -115.08145141601562, -111.88829040527344, -108.69512939453125, -105.50196838378906, -102.30880737304688, -99.11564636230469, -95.9224853515625, -92.72932434082031, -89.5361557006836, -86.3429946899414, -83.14983367919922, -79.95667266845703, -76.76351165771484, -73.57035064697266, -70.37718200683594, -67.18402099609375, -63.99086380004883, -60.79770278930664, -57.60454177856445, -54.411376953125, -51.21821594238281, -48.025054931640625, -44.83189392089844, -41.63873291015625, -38.4455680847168, -35.25240707397461, -32.05924606323242, -28.8660831451416, -25.672922134399414, -22.479761123657227, -19.286598205566406, -16.09343719482422, -12.900276184082031, -9.707115173339844, -6.51395320892334, -3.320791244506836, -0.12763023376464844, 3.065530776977539, 6.258693695068359, 9.451854705810547, 12.645015716552734, 15.838176727294922, 19.03133773803711, 22.22450065612793, 25.417661666870117, 28.610822677612305, 31.803985595703125, 34.99714660644531, 38.1903076171875, 41.38346862792969, 44.576629638671875, 47.76979064941406, 50.96295166015625, 54.15611267089844, 57.34927749633789, 60.54243850708008, 63.735599517822266]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 11.0, 10.0, 6.0, 14.0, 11.0, 17.0, 16.0, 16.0, 24.0, 29.0, 27.0, 24.0, 32.0, 34.0, 35.0, 36.0, 36.0, 45.0, 37.0, 43.0, 38.0, 34.0, 38.0, 25.0, 39.0, 28.0, 44.0, 19.0, 30.0, 24.0, 23.0, 25.0, 19.0, 16.0, 19.0, 14.0, 14.0, 10.0, 5.0, 5.0, 6.0, 3.0, 8.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-42.93523406982422, -41.71271896362305, -40.490203857421875, -39.26769256591797, -38.0451774597168, -36.822662353515625, -35.60014724731445, -34.37763214111328, -33.15511703491211, -31.932601928710938, -30.7100887298584, -29.487573623657227, -28.265058517456055, -27.042545318603516, -25.820030212402344, -24.597515106201172, -23.375001907348633, -22.15248680114746, -20.929973602294922, -19.70745849609375, -18.484943389892578, -17.262428283691406, -16.039915084838867, -14.817399978637695, -13.59488582611084, -12.372371673583984, -11.149856567382812, -9.927342414855957, -8.704828262329102, -7.48231315612793, -6.259799003601074, -5.037283897399902, -3.814769744873047, -2.592255115509033, -1.3697407245635986, -0.14722633361816406, 1.0752882957458496, 2.2978029251098633, 3.5203170776367188, 4.742832183837891, 5.965346336364746, 7.18786096572876, 8.410375595092773, 9.632889747619629, 10.855403900146484, 12.077919006347656, 13.300433158874512, 14.522948265075684, 15.745462417602539, 16.96797752380371, 18.19049072265625, 19.413005828857422, 20.635520935058594, 21.858036041259766, 23.080549240112305, 24.303064346313477, 25.525577545166016, 26.748092651367188, 27.970605850219727, 29.1931209564209, 30.41563606262207, 31.63814926147461, 32.86066436767578, 34.08317947387695, 35.305694580078125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 3.0, 11.0, 8.0, 8.0, 9.0, 8.0, 16.0, 18.0, 24.0, 22.0, 28.0, 32.0, 27.0, 25.0, 35.0, 32.0, 39.0, 46.0, 46.0, 54.0, 48.0, 40.0, 47.0, 39.0, 30.0, 38.0, 28.0, 32.0, 33.0, 23.0, 23.0, 17.0, 24.0, 21.0, 9.0, 9.0, 10.0, 11.0, 7.0, 5.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.68359375, -6.4759521484375, -6.268310546875, -6.0606689453125, -5.85302734375, -5.6453857421875, -5.437744140625, -5.2301025390625, -5.0224609375, -4.8148193359375, -4.607177734375, -4.3995361328125, -4.19189453125, -3.9842529296875, -3.776611328125, -3.5689697265625, -3.361328125, -3.1536865234375, -2.946044921875, -2.7384033203125, -2.53076171875, -2.3231201171875, -2.115478515625, -1.9078369140625, -1.7001953125, -1.4925537109375, -1.284912109375, -1.0772705078125, -0.86962890625, -0.6619873046875, -0.454345703125, -0.2467041015625, -0.0390625, 0.1685791015625, 0.376220703125, 0.5838623046875, 0.79150390625, 0.9991455078125, 1.206787109375, 1.4144287109375, 1.6220703125, 1.8297119140625, 2.037353515625, 2.2449951171875, 2.45263671875, 2.6602783203125, 2.867919921875, 3.0755615234375, 3.283203125, 3.4908447265625, 3.698486328125, 3.9061279296875, 4.11376953125, 4.3214111328125, 4.529052734375, 4.7366943359375, 4.9443359375, 5.1519775390625, 5.359619140625, 5.5672607421875, 5.77490234375, 5.9825439453125, 6.190185546875, 6.3978271484375, 6.60546875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 6.0, 19.0, 27.0, 28.0, 38.0, 55.0, 67.0, 110.0, 122.0, 172.0, 227.0, 305.0, 453.0, 598.0, 906.0, 1319.0, 2127.0, 3967.0, 8239.0, 20419.0, 70801.0, 460040.0, 2265999.0, 1140421.0, 159300.0, 33431.0, 11763.0, 5222.0, 2781.0, 1643.0, 1068.0, 758.0, 501.0, 356.0, 259.0, 199.0, 146.0, 112.0, 66.0, 54.0, 39.0, 35.0, 20.0, 18.0, 14.0, 6.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-14.1484375, -13.7410888671875, -13.333740234375, -12.9263916015625, -12.51904296875, -12.1116943359375, -11.704345703125, -11.2969970703125, -10.8896484375, -10.4822998046875, -10.074951171875, -9.6676025390625, -9.26025390625, -8.8529052734375, -8.445556640625, -8.0382080078125, -7.630859375, -7.2235107421875, -6.816162109375, -6.4088134765625, -6.00146484375, -5.5941162109375, -5.186767578125, -4.7794189453125, -4.3720703125, -3.9647216796875, -3.557373046875, -3.1500244140625, -2.74267578125, -2.3353271484375, -1.927978515625, -1.5206298828125, -1.11328125, -0.7059326171875, -0.298583984375, 0.1087646484375, 0.51611328125, 0.9234619140625, 1.330810546875, 1.7381591796875, 2.1455078125, 2.5528564453125, 2.960205078125, 3.3675537109375, 3.77490234375, 4.1822509765625, 4.589599609375, 4.9969482421875, 5.404296875, 5.8116455078125, 6.218994140625, 6.6263427734375, 7.03369140625, 7.4410400390625, 7.848388671875, 8.2557373046875, 8.6630859375, 9.0704345703125, 9.477783203125, 9.8851318359375, 10.29248046875, 10.6998291015625, 11.107177734375, 11.5145263671875, 11.921875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 11.0, 12.0, 26.0, 47.0, 70.0, 138.0, 244.0, 432.0, 835.0, 972.0, 571.0, 301.0, 168.0, 107.0, 63.0, 41.0, 21.0, 10.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2890625, -12.5938720703125, -11.898681640625, -11.2034912109375, -10.50830078125, -9.8131103515625, -9.117919921875, -8.4227294921875, -7.7275390625, -7.0323486328125, -6.337158203125, -5.6419677734375, -4.94677734375, -4.2515869140625, -3.556396484375, -2.8612060546875, -2.166015625, -1.4708251953125, -0.775634765625, -0.0804443359375, 0.61474609375, 1.3099365234375, 2.005126953125, 2.7003173828125, 3.3955078125, 4.0906982421875, 4.785888671875, 5.4810791015625, 6.17626953125, 6.8714599609375, 7.566650390625, 8.2618408203125, 8.95703125, 9.6522216796875, 10.347412109375, 11.0426025390625, 11.73779296875, 12.4329833984375, 13.128173828125, 13.8233642578125, 14.5185546875, 15.2137451171875, 15.908935546875, 16.6041259765625, 17.29931640625, 17.9945068359375, 18.689697265625, 19.3848876953125, 20.080078125, 20.7752685546875, 21.470458984375, 22.1656494140625, 22.86083984375, 23.5560302734375, 24.251220703125, 24.9464111328125, 25.6416015625, 26.3367919921875, 27.031982421875, 27.7271728515625, 28.42236328125, 29.1175537109375, 29.812744140625, 30.5079345703125, 31.203125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 11.0, 9.0, 10.0, 20.0, 38.0, 59.0, 84.0, 137.0, 241.0, 398.0, 946.0, 3363.0, 31919.0, 3158954.0, 978333.0, 15929.0, 2291.0, 705.0, 319.0, 171.0, 101.0, 73.0, 46.0, 37.0, 21.0, 17.0, 18.0, 7.0, 6.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-41.71875, -40.55615234375, -39.3935546875, -38.23095703125, -37.068359375, -35.90576171875, -34.7431640625, -33.58056640625, -32.41796875, -31.25537109375, -30.0927734375, -28.93017578125, -27.767578125, -26.60498046875, -25.4423828125, -24.27978515625, -23.1171875, -21.95458984375, -20.7919921875, -19.62939453125, -18.466796875, -17.30419921875, -16.1416015625, -14.97900390625, -13.81640625, -12.65380859375, -11.4912109375, -10.32861328125, -9.166015625, -8.00341796875, -6.8408203125, -5.67822265625, -4.515625, -3.35302734375, -2.1904296875, -1.02783203125, 0.134765625, 1.29736328125, 2.4599609375, 3.62255859375, 4.78515625, 5.94775390625, 7.1103515625, 8.27294921875, 9.435546875, 10.59814453125, 11.7607421875, 12.92333984375, 14.0859375, 15.24853515625, 16.4111328125, 17.57373046875, 18.736328125, 19.89892578125, 21.0615234375, 22.22412109375, 23.38671875, 24.54931640625, 25.7119140625, 26.87451171875, 28.037109375, 29.19970703125, 30.3623046875, 31.52490234375, 32.6875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 15.0, 65.0, 301.0, 462.0, 134.0, 32.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.3144760131836, -60.042022705078125, -52.76956558227539, -45.497108459472656, -38.22465515136719, -30.95220184326172, -23.679744720458984, -16.40728759765625, -9.134834289550781, -1.8623790740966797, 5.410076141357422, 12.682531356811523, 19.954986572265625, 27.227439880371094, 34.49989700317383, 41.77235412597656, 49.04480743408203, 56.3172607421875, 63.589717864990234, 70.86217498779297, 78.13462829589844, 85.4070816040039, 92.67953491210938, 99.95199584960938, 107.22444915771484, 114.49690246582031, 121.76936340332031, 129.04180908203125, 136.31427001953125, 143.58673095703125, 150.8591766357422, 158.1316375732422, 165.40408325195312, 172.67654418945312, 179.94898986816406, 187.22145080566406, 194.493896484375, 201.766357421875, 209.038818359375, 216.311279296875, 223.58372497558594, 230.85618591308594, 238.12863159179688, 245.40109252929688, 252.67355346679688, 259.94598388671875, 267.21844482421875, 274.49090576171875, 281.76336669921875, 289.03582763671875, 296.30828857421875, 303.5807189941406, 310.8531799316406, 318.1256408691406, 325.3981018066406, 332.6705627441406, 339.9429931640625, 347.2154541015625, 354.4879150390625, 361.7603454589844, 369.0328063964844, 376.3052673339844, 383.5777282714844, 390.8501892089844, 398.1226501464844]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 9.0, 7.0, 9.0, 9.0, 10.0, 12.0, 16.0, 20.0, 15.0, 16.0, 21.0, 24.0, 34.0, 30.0, 40.0, 33.0, 37.0, 36.0, 42.0, 46.0, 27.0, 38.0, 49.0, 26.0, 41.0, 36.0, 38.0, 35.0, 28.0, 24.0, 29.0, 17.0, 21.0, 25.0, 17.0, 19.0, 14.0, 13.0, 8.0, 5.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.9328727722168, -44.4693717956543, -43.0058708190918, -41.5423698425293, -40.0788688659668, -38.6153678894043, -37.1518669128418, -35.6883659362793, -34.2248649597168, -32.7613639831543, -31.297863006591797, -29.834362030029297, -28.370861053466797, -26.907360076904297, -25.443859100341797, -23.980358123779297, -22.516857147216797, -21.053356170654297, -19.589855194091797, -18.126354217529297, -16.662853240966797, -15.199352264404297, -13.735851287841797, -12.272350311279297, -10.808849334716797, -9.345348358154297, -7.881847381591797, -6.418346405029297, -4.954845428466797, -3.491344451904297, -2.027843475341797, -0.5643424987792969, 0.8991584777832031, 2.362659454345703, 3.826160430908203, 5.289661407470703, 6.753162384033203, 8.216663360595703, 9.680164337158203, 11.143665313720703, 12.607166290283203, 14.070667266845703, 15.534168243408203, 16.997669219970703, 18.461170196533203, 19.924671173095703, 21.388172149658203, 22.851673126220703, 24.315174102783203, 25.778675079345703, 27.242176055908203, 28.705677032470703, 30.169178009033203, 31.632678985595703, 33.0961799621582, 34.5596809387207, 36.0231819152832, 37.4866828918457, 38.9501838684082, 40.4136848449707, 41.8771858215332, 43.3406867980957, 44.8041877746582, 46.2676887512207, 47.7311897277832]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 7.0, 2.0, 11.0, 11.0, 10.0, 11.0, 21.0, 25.0, 28.0, 32.0, 25.0, 44.0, 33.0, 36.0, 49.0, 40.0, 43.0, 50.0, 37.0, 56.0, 43.0, 45.0, 37.0, 30.0, 34.0, 35.0, 35.0, 32.0, 17.0, 17.0, 22.0, 14.0, 10.0, 8.0, 13.0, 10.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.671875, -6.4588623046875, -6.245849609375, -6.0328369140625, -5.81982421875, -5.6068115234375, -5.393798828125, -5.1807861328125, -4.9677734375, -4.7547607421875, -4.541748046875, -4.3287353515625, -4.11572265625, -3.9027099609375, -3.689697265625, -3.4766845703125, -3.263671875, -3.0506591796875, -2.837646484375, -2.6246337890625, -2.41162109375, -2.1986083984375, -1.985595703125, -1.7725830078125, -1.5595703125, -1.3465576171875, -1.133544921875, -0.9205322265625, -0.70751953125, -0.4945068359375, -0.281494140625, -0.0684814453125, 0.14453125, 0.3575439453125, 0.570556640625, 0.7835693359375, 0.99658203125, 1.2095947265625, 1.422607421875, 1.6356201171875, 1.8486328125, 2.0616455078125, 2.274658203125, 2.4876708984375, 2.70068359375, 2.9136962890625, 3.126708984375, 3.3397216796875, 3.552734375, 3.7657470703125, 3.978759765625, 4.1917724609375, 4.40478515625, 4.6177978515625, 4.830810546875, 5.0438232421875, 5.2568359375, 5.4698486328125, 5.682861328125, 5.8958740234375, 6.10888671875, 6.3218994140625, 6.534912109375, 6.7479248046875, 6.9609375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 3.0, 4.0, 3.0, 10.0, 19.0, 15.0, 24.0, 38.0, 65.0, 107.0, 121.0, 182.0, 256.0, 376.0, 563.0, 764.0, 1043.0, 1620.0, 2294.0, 3536.0, 5205.0, 7867.0, 11968.0, 18461.0, 28973.0, 47850.0, 83073.0, 162082.0, 291845.0, 164310.0, 83983.0, 47676.0, 29343.0, 18661.0, 12088.0, 7967.0, 5206.0, 3422.0, 2331.0, 1600.0, 1105.0, 762.0, 484.0, 382.0, 249.0, 194.0, 121.0, 98.0, 72.0, 37.0, 34.0, 24.0, 16.0, 18.0, 10.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.25732421875, -0.24915695190429688, -0.24098968505859375, -0.23282241821289062, -0.2246551513671875, -0.21648788452148438, -0.20832061767578125, -0.20015335083007812, -0.191986083984375, -0.18381881713867188, -0.17565155029296875, -0.16748428344726562, -0.1593170166015625, -0.15114974975585938, -0.14298248291015625, -0.13481521606445312, -0.12664794921875, -0.11848068237304688, -0.11031341552734375, -0.10214614868164062, -0.0939788818359375, -0.08581161499023438, -0.07764434814453125, -0.06947708129882812, -0.061309814453125, -0.053142547607421875, -0.04497528076171875, -0.036808013916015625, -0.0286407470703125, -0.020473480224609375, -0.01230621337890625, -0.004138946533203125, 0.0040283203125, 0.012195587158203125, 0.02036285400390625, 0.028530120849609375, 0.0366973876953125, 0.044864654541015625, 0.05303192138671875, 0.061199188232421875, 0.069366455078125, 0.07753372192382812, 0.08570098876953125, 0.09386825561523438, 0.1020355224609375, 0.11020278930664062, 0.11837005615234375, 0.12653732299804688, 0.13470458984375, 0.14287185668945312, 0.15103912353515625, 0.15920639038085938, 0.1673736572265625, 0.17554092407226562, 0.18370819091796875, 0.19187545776367188, 0.200042724609375, 0.20820999145507812, 0.21637725830078125, 0.22454452514648438, 0.2327117919921875, 0.24087905883789062, 0.24904632568359375, 0.2572135925292969, 0.265380859375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 3.0, 10.0, 11.0, 8.0, 17.0, 15.0, 19.0, 27.0, 21.0, 20.0, 20.0, 35.0, 35.0, 30.0, 29.0, 43.0, 37.0, 31.0, 35.0, 1071.0, 45.0, 31.0, 50.0, 39.0, 37.0, 39.0, 46.0, 37.0, 22.0, 17.0, 25.0, 21.0, 17.0, 9.0, 19.0, 13.0, 13.0, 5.0, 9.0, 0.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.09375, -4.95831298828125, -4.8228759765625, -4.68743896484375, -4.552001953125, -4.41656494140625, -4.2811279296875, -4.14569091796875, -4.01025390625, -3.87481689453125, -3.7393798828125, -3.60394287109375, -3.468505859375, -3.33306884765625, -3.1976318359375, -3.06219482421875, -2.9267578125, -2.79132080078125, -2.6558837890625, -2.52044677734375, -2.385009765625, -2.24957275390625, -2.1141357421875, -1.97869873046875, -1.84326171875, -1.70782470703125, -1.5723876953125, -1.43695068359375, -1.301513671875, -1.16607666015625, -1.0306396484375, -0.89520263671875, -0.759765625, -0.62432861328125, -0.4888916015625, -0.35345458984375, -0.218017578125, -0.08258056640625, 0.0528564453125, 0.18829345703125, 0.32373046875, 0.45916748046875, 0.5946044921875, 0.73004150390625, 0.865478515625, 1.00091552734375, 1.1363525390625, 1.27178955078125, 1.4072265625, 1.54266357421875, 1.6781005859375, 1.81353759765625, 1.948974609375, 2.08441162109375, 2.2198486328125, 2.35528564453125, 2.49072265625, 2.62615966796875, 2.7615966796875, 2.89703369140625, 3.032470703125, 3.16790771484375, 3.3033447265625, 3.43878173828125, 3.57421875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 13.0, 17.0, 25.0, 47.0, 57.0, 94.0, 130.0, 168.0, 260.0, 374.0, 536.0, 728.0, 1137.0, 1600.0, 2368.0, 3525.0, 5225.0, 7946.0, 12026.0, 18849.0, 30319.0, 48888.0, 82873.0, 149090.0, 1317241.0, 171968.0, 92922.0, 54981.0, 33350.0, 20686.0, 13363.0, 8633.0, 5790.0, 3798.0, 2501.0, 1695.0, 1235.0, 831.0, 606.0, 401.0, 265.0, 179.0, 120.0, 86.0, 57.0, 48.0, 32.0, 24.0, 9.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2105712890625, -0.20390892028808594, -0.19724655151367188, -0.1905841827392578, -0.18392181396484375, -0.1772594451904297, -0.17059707641601562, -0.16393470764160156, -0.1572723388671875, -0.15060997009277344, -0.14394760131835938, -0.1372852325439453, -0.13062286376953125, -0.12396049499511719, -0.11729812622070312, -0.11063575744628906, -0.103973388671875, -0.09731101989746094, -0.09064865112304688, -0.08398628234863281, -0.07732391357421875, -0.07066154479980469, -0.06399917602539062, -0.05733680725097656, -0.0506744384765625, -0.04401206970214844, -0.037349700927734375, -0.030687332153320312, -0.02402496337890625, -0.017362594604492188, -0.010700225830078125, -0.0040378570556640625, 0.00262451171875, 0.009286880493164062, 0.015949249267578125, 0.022611618041992188, 0.02927398681640625, 0.03593635559082031, 0.042598724365234375, 0.04926109313964844, 0.0559234619140625, 0.06258583068847656, 0.06924819946289062, 0.07591056823730469, 0.08257293701171875, 0.08923530578613281, 0.09589767456054688, 0.10256004333496094, 0.109222412109375, 0.11588478088378906, 0.12254714965820312, 0.1292095184326172, 0.13587188720703125, 0.1425342559814453, 0.14919662475585938, 0.15585899353027344, 0.1625213623046875, 0.16918373107910156, 0.17584609985351562, 0.1825084686279297, 0.18917083740234375, 0.1958332061767578, 0.20249557495117188, 0.20915794372558594, 0.2158203125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 6.0, 7.0, 12.0, 17.0, 10.0, 14.0, 27.0, 20.0, 25.0, 36.0, 25.0, 42.0, 53.0, 57.0, 58.0, 61.0, 68.0, 64.0, 61.0, 51.0, 43.0, 33.0, 32.0, 34.0, 19.0, 19.0, 21.0, 16.0, 15.0, 8.0, 9.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011307001113891602, -0.0001094769686460495, -0.00010588392615318298, -0.00010229088366031647, -9.869784116744995e-05, -9.510479867458344e-05, -9.151175618171692e-05, -8.79187136888504e-05, -8.432567119598389e-05, -8.073262870311737e-05, -7.713958621025085e-05, -7.354654371738434e-05, -6.995350122451782e-05, -6.63604587316513e-05, -6.276741623878479e-05, -5.9174373745918274e-05, -5.558133125305176e-05, -5.198828876018524e-05, -4.8395246267318726e-05, -4.480220377445221e-05, -4.120916128158569e-05, -3.761611878871918e-05, -3.402307629585266e-05, -3.0430033802986145e-05, -2.683699131011963e-05, -2.3243948817253113e-05, -1.9650906324386597e-05, -1.605786383152008e-05, -1.2464821338653564e-05, -8.871778845787048e-06, -5.278736352920532e-06, -1.6856938600540161e-06, 1.9073486328125e-06, 5.500391125679016e-06, 9.093433618545532e-06, 1.2686476111412048e-05, 1.6279518604278564e-05, 1.987256109714508e-05, 2.3465603590011597e-05, 2.7058646082878113e-05, 3.065168857574463e-05, 3.4244731068611145e-05, 3.783777356147766e-05, 4.143081605434418e-05, 4.502385854721069e-05, 4.861690104007721e-05, 5.2209943532943726e-05, 5.580298602581024e-05, 5.939602851867676e-05, 6.298907101154327e-05, 6.658211350440979e-05, 7.01751559972763e-05, 7.376819849014282e-05, 7.736124098300934e-05, 8.095428347587585e-05, 8.454732596874237e-05, 8.814036846160889e-05, 9.17334109544754e-05, 9.532645344734192e-05, 9.891949594020844e-05, 0.00010251253843307495, 0.00010610558092594147, 0.00010969862341880798, 0.0001132916659116745, 0.00011688470840454102]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 3.0, 5.0, 10.0, 2.0, 6.0, 7.0, 14.0, 13.0, 22.0, 27.0, 39.0, 33.0, 54.0, 67.0, 75.0, 115.0, 152.0, 215.0, 334.0, 640.0, 2475.0, 81453.0, 945710.0, 14522.0, 1217.0, 410.0, 252.0, 173.0, 110.0, 100.0, 67.0, 53.0, 37.0, 36.0, 22.0, 19.0, 18.0, 7.0, 11.0, 7.0, 3.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.002300262451171875, -0.002235099673271179, -0.0021699368953704834, -0.0021047741174697876, -0.002039611339569092, -0.001974448561668396, -0.0019092857837677002, -0.0018441230058670044, -0.0017789602279663086, -0.0017137974500656128, -0.001648634672164917, -0.0015834718942642212, -0.0015183091163635254, -0.0014531463384628296, -0.0013879835605621338, -0.001322820782661438, -0.0012576580047607422, -0.0011924952268600464, -0.0011273324489593506, -0.0010621696710586548, -0.000997006893157959, -0.0009318441152572632, -0.0008666813373565674, -0.0008015185594558716, -0.0007363557815551758, -0.00067119300365448, -0.0006060302257537842, -0.0005408674478530884, -0.0004757046699523926, -0.0004105418920516968, -0.000345379114151001, -0.0002802163362503052, -0.00021505355834960938, -0.00014989078044891357, -8.472800254821777e-05, -1.9565224647521973e-05, 4.559755325317383e-05, 0.00011076033115386963, 0.00017592310905456543, 0.00024108588695526123, 0.00030624866485595703, 0.00037141144275665283, 0.00043657422065734863, 0.0005017369985580444, 0.0005668997764587402, 0.000632062554359436, 0.0006972253322601318, 0.0007623881101608276, 0.0008275508880615234, 0.0008927136659622192, 0.000957876443862915, 0.0010230392217636108, 0.0010882019996643066, 0.0011533647775650024, 0.0012185275554656982, 0.001283690333366394, 0.0013488531112670898, 0.0014140158891677856, 0.0014791786670684814, 0.0015443414449691772, 0.001609504222869873, 0.0016746670007705688, 0.0017398297786712646, 0.0018049925565719604, 0.0018701553344726562]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 12.0, 28.0, 71.0, 158.0, 243.0, 292.0, 122.0, 56.0, 23.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.687364707933739e-05, -4.00920762331225e-05, -3.33105017489288e-05, -2.6528929083724506e-05, -1.9747356418520212e-05, -1.2965785572305322e-05, -6.184211088111624e-06, 5.973633960820735e-07, 7.378934242296964e-06, 1.4160506907501258e-05, 2.0942079572705552e-05, 2.7723652237909846e-05, 3.450522490311414e-05, 4.128679574932903e-05, 4.806837023352273e-05, 5.4849944717716426e-05, 6.163151556393132e-05, 6.84130864101462e-05, 7.519466453231871e-05, 8.19762353785336e-05, 8.875780622474849e-05, 9.553937707096338e-05, 0.00010232094791717827, 0.00010910252603935078, 0.00011588409688556567, 0.00012266567500773817, 0.00012944724585395306, 0.00013622881670016795, 0.00014301038754638284, 0.00014979195839259773, 0.00015657352923881263, 0.00016335511463694274, 0.00017013668548315763, 0.00017691825632937253, 0.00018369982717558742, 0.0001904813980218023, 0.0001972629688680172, 0.0002040445397142321, 0.0002108261251123622, 0.0002176076959585771, 0.000224389266804792, 0.00023117083765100688, 0.00023795240849722177, 0.0002447339938953519, 0.0002515155647415668, 0.00025829713558778167, 0.00026507870643399656, 0.00027186027728021145, 0.00027864184812642634, 0.00028542341897264123, 0.0002922049898188561, 0.000298986560665071, 0.0003057681315112859, 0.0003125497023575008, 0.0003193312732037157, 0.00032611284404993057, 0.0003328944439999759, 0.0003396760148461908, 0.0003464575856924057, 0.0003532391565386206, 0.0003600207273848355, 0.00036680229823105037, 0.00037358386907726526, 0.0003803654690273106, 0.00038714701076969504]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 2.0, 7.0, 6.0, 11.0, 13.0, 17.0, 17.0, 23.0, 17.0, 27.0, 25.0, 31.0, 27.0, 39.0, 28.0, 37.0, 37.0, 36.0, 43.0, 46.0, 37.0, 32.0, 54.0, 36.0, 42.0, 29.0, 40.0, 28.0, 27.0, 23.0, 23.0, 24.0, 21.0, 16.0, 16.0, 11.0, 20.0, 13.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.878376007080078e-05, -6.683450192213058e-05, -6.488524377346039e-05, -6.293598562479019e-05, -6.0986727476119995e-05, -5.90374693274498e-05, -5.70882111787796e-05, -5.5138953030109406e-05, -5.318969488143921e-05, -5.124043673276901e-05, -4.9291178584098816e-05, -4.734192043542862e-05, -4.539266228675842e-05, -4.3443404138088226e-05, -4.149414598941803e-05, -3.954488784074783e-05, -3.759562969207764e-05, -3.564637154340744e-05, -3.3697113394737244e-05, -3.174785524606705e-05, -2.979859709739685e-05, -2.7849338948726654e-05, -2.5900080800056458e-05, -2.395082265138626e-05, -2.2001564502716064e-05, -2.0052306354045868e-05, -1.810304820537567e-05, -1.6153790056705475e-05, -1.4204531908035278e-05, -1.2255273759365082e-05, -1.0306015610694885e-05, -8.356757462024689e-06, -6.407499313354492e-06, -4.458241164684296e-06, -2.508983016014099e-06, -5.597248673439026e-07, 1.389533281326294e-06, 3.3387914299964905e-06, 5.288049578666687e-06, 7.2373077273368835e-06, 9.18656587600708e-06, 1.1135824024677277e-05, 1.3085082173347473e-05, 1.503434032201767e-05, 1.6983598470687866e-05, 1.8932856619358063e-05, 2.088211476802826e-05, 2.2831372916698456e-05, 2.4780631065368652e-05, 2.672988921403885e-05, 2.8679147362709045e-05, 3.062840551137924e-05, 3.257766366004944e-05, 3.4526921808719635e-05, 3.647617995738983e-05, 3.842543810606003e-05, 4.0374696254730225e-05, 4.232395440340042e-05, 4.427321255207062e-05, 4.6222470700740814e-05, 4.817172884941101e-05, 5.012098699808121e-05, 5.2070245146751404e-05, 5.40195032954216e-05, 5.59687614440918e-05]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 7.0, 2.0, 11.0, 11.0, 10.0, 11.0, 21.0, 25.0, 28.0, 32.0, 25.0, 44.0, 33.0, 36.0, 49.0, 40.0, 43.0, 50.0, 37.0, 56.0, 43.0, 45.0, 37.0, 30.0, 34.0, 35.0, 35.0, 32.0, 17.0, 17.0, 22.0, 14.0, 10.0, 8.0, 13.0, 10.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.671875, -6.4588623046875, -6.245849609375, -6.0328369140625, -5.81982421875, -5.6068115234375, -5.393798828125, -5.1807861328125, -4.9677734375, -4.7547607421875, -4.541748046875, -4.3287353515625, -4.11572265625, -3.9027099609375, -3.689697265625, -3.4766845703125, -3.263671875, -3.0506591796875, -2.837646484375, -2.6246337890625, -2.41162109375, -2.1986083984375, -1.985595703125, -1.7725830078125, -1.5595703125, -1.3465576171875, -1.133544921875, -0.9205322265625, -0.70751953125, -0.4945068359375, -0.281494140625, -0.0684814453125, 0.14453125, 0.3575439453125, 0.570556640625, 0.7835693359375, 0.99658203125, 1.2095947265625, 1.422607421875, 1.6356201171875, 1.8486328125, 2.0616455078125, 2.274658203125, 2.4876708984375, 2.70068359375, 2.9136962890625, 3.126708984375, 3.3397216796875, 3.552734375, 3.7657470703125, 3.978759765625, 4.1917724609375, 4.40478515625, 4.6177978515625, 4.830810546875, 5.0438232421875, 5.2568359375, 5.4698486328125, 5.682861328125, 5.8958740234375, 6.10888671875, 6.3218994140625, 6.534912109375, 6.7479248046875, 6.9609375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 11.0, 10.0, 11.0, 21.0, 24.0, 40.0, 37.0, 52.0, 87.0, 133.0, 156.0, 235.0, 338.0, 506.0, 854.0, 1213.0, 2265.0, 4172.0, 9086.0, 23327.0, 84663.0, 468341.0, 353237.0, 63608.0, 19376.0, 7592.0, 3656.0, 2006.0, 1215.0, 707.0, 468.0, 309.0, 209.0, 161.0, 104.0, 81.0, 68.0, 40.0, 33.0, 19.0, 16.0, 16.0, 9.0, 10.0, 8.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.4296875, -11.0474853515625, -10.665283203125, -10.2830810546875, -9.90087890625, -9.5186767578125, -9.136474609375, -8.7542724609375, -8.3720703125, -7.9898681640625, -7.607666015625, -7.2254638671875, -6.84326171875, -6.4610595703125, -6.078857421875, -5.6966552734375, -5.314453125, -4.9322509765625, -4.550048828125, -4.1678466796875, -3.78564453125, -3.4034423828125, -3.021240234375, -2.6390380859375, -2.2568359375, -1.8746337890625, -1.492431640625, -1.1102294921875, -0.72802734375, -0.3458251953125, 0.036376953125, 0.4185791015625, 0.80078125, 1.1829833984375, 1.565185546875, 1.9473876953125, 2.32958984375, 2.7117919921875, 3.093994140625, 3.4761962890625, 3.8583984375, 4.2406005859375, 4.622802734375, 5.0050048828125, 5.38720703125, 5.7694091796875, 6.151611328125, 6.5338134765625, 6.916015625, 7.2982177734375, 7.680419921875, 8.0626220703125, 8.44482421875, 8.8270263671875, 9.209228515625, 9.5914306640625, 9.9736328125, 10.3558349609375, 10.738037109375, 11.1202392578125, 11.50244140625, 11.8846435546875, 12.266845703125, 12.6490478515625, 13.03125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 7.0, 11.0, 17.0, 16.0, 24.0, 24.0, 43.0, 51.0, 47.0, 54.0, 83.0, 152.0, 289.0, 1504.0, 210.0, 123.0, 83.0, 48.0, 40.0, 41.0, 37.0, 29.0, 25.0, 17.0, 10.0, 15.0, 5.0, 4.0, 7.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.84375, -23.12744140625, -22.4111328125, -21.69482421875, -20.978515625, -20.26220703125, -19.5458984375, -18.82958984375, -18.11328125, -17.39697265625, -16.6806640625, -15.96435546875, -15.248046875, -14.53173828125, -13.8154296875, -13.09912109375, -12.3828125, -11.66650390625, -10.9501953125, -10.23388671875, -9.517578125, -8.80126953125, -8.0849609375, -7.36865234375, -6.65234375, -5.93603515625, -5.2197265625, -4.50341796875, -3.787109375, -3.07080078125, -2.3544921875, -1.63818359375, -0.921875, -0.20556640625, 0.5107421875, 1.22705078125, 1.943359375, 2.65966796875, 3.3759765625, 4.09228515625, 4.80859375, 5.52490234375, 6.2412109375, 6.95751953125, 7.673828125, 8.39013671875, 9.1064453125, 9.82275390625, 10.5390625, 11.25537109375, 11.9716796875, 12.68798828125, 13.404296875, 14.12060546875, 14.8369140625, 15.55322265625, 16.26953125, 16.98583984375, 17.7021484375, 18.41845703125, 19.134765625, 19.85107421875, 20.5673828125, 21.28369140625, 22.0]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 2.0, 5.0, 8.0, 15.0, 13.0, 20.0, 18.0, 45.0, 59.0, 100.0, 173.0, 344.0, 940.0, 3480.0, 37244.0, 3042283.0, 54866.0, 4238.0, 989.0, 361.0, 191.0, 104.0, 55.0, 39.0, 29.0, 27.0, 12.0, 10.0, 10.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-51.75, -50.05615234375, -48.3623046875, -46.66845703125, -44.974609375, -43.28076171875, -41.5869140625, -39.89306640625, -38.19921875, -36.50537109375, -34.8115234375, -33.11767578125, -31.423828125, -29.72998046875, -28.0361328125, -26.34228515625, -24.6484375, -22.95458984375, -21.2607421875, -19.56689453125, -17.873046875, -16.17919921875, -14.4853515625, -12.79150390625, -11.09765625, -9.40380859375, -7.7099609375, -6.01611328125, -4.322265625, -2.62841796875, -0.9345703125, 0.75927734375, 2.453125, 4.14697265625, 5.8408203125, 7.53466796875, 9.228515625, 10.92236328125, 12.6162109375, 14.31005859375, 16.00390625, 17.69775390625, 19.3916015625, 21.08544921875, 22.779296875, 24.47314453125, 26.1669921875, 27.86083984375, 29.5546875, 31.24853515625, 32.9423828125, 34.63623046875, 36.330078125, 38.02392578125, 39.7177734375, 41.41162109375, 43.10546875, 44.79931640625, 46.4931640625, 48.18701171875, 49.880859375, 51.57470703125, 53.2685546875, 54.96240234375, 56.65625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 13.0, 73.0, 478.0, 381.0, 45.0, 13.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-419.5840148925781, -410.0306701660156, -400.477294921875, -390.9239501953125, -381.3705749511719, -371.8172302246094, -362.26385498046875, -352.71051025390625, -343.15716552734375, -333.60382080078125, -324.0504455566406, -314.4971008300781, -304.9437255859375, -295.390380859375, -285.8370056152344, -276.2836608886719, -266.73028564453125, -257.17694091796875, -247.62356567382812, -238.07020568847656, -228.516845703125, -218.9635009765625, -209.41014099121094, -199.85678100585938, -190.3034210205078, -180.75006103515625, -171.1967010498047, -161.64334106445312, -152.08999633789062, -142.53662109375, -132.9832763671875, -123.42991638183594, -113.87657165527344, -104.32321166992188, -94.76985168457031, -85.21649932861328, -75.66313934326172, -66.10977935791016, -56.55642318725586, -47.00306701660156, -37.44970703125, -27.89634895324707, -18.34299087524414, -8.789632797241211, 0.7637252807617188, 10.317085266113281, 19.870441436767578, 29.423797607421875, 38.97715759277344, 48.530517578125, 58.0838737487793, 67.6372299194336, 77.19058990478516, 86.74394989013672, 96.29730224609375, 105.85066223144531, 115.40402221679688, 124.95738220214844, 134.5107421875, 144.06410217285156, 153.61746215820312, 163.17080688476562, 172.7241668701172, 182.27752685546875, 191.8308868408203]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 7.0, 9.0, 8.0, 9.0, 9.0, 12.0, 7.0, 23.0, 21.0, 19.0, 24.0, 31.0, 39.0, 31.0, 28.0, 37.0, 41.0, 43.0, 30.0, 31.0, 37.0, 37.0, 29.0, 43.0, 46.0, 36.0, 34.0, 32.0, 45.0, 30.0, 29.0, 21.0, 7.0, 23.0, 16.0, 12.0, 11.0, 8.0, 11.0, 6.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-39.6685676574707, -38.464664459228516, -37.26076126098633, -36.05685806274414, -34.85295486450195, -33.649051666259766, -32.44514846801758, -31.241247177124023, -30.037343978881836, -28.83344078063965, -27.62953758239746, -26.425634384155273, -25.22173309326172, -24.01782989501953, -22.813926696777344, -21.610023498535156, -20.40612030029297, -19.20221710205078, -17.998313903808594, -16.794410705566406, -15.590508460998535, -14.386605262756348, -13.182703018188477, -11.978799819946289, -10.774896621704102, -9.570993423461914, -8.367090225219727, -7.1631879806518555, -5.959284782409668, -4.7553815841674805, -3.551478862762451, -2.347576141357422, -1.1436729431152344, 0.06023001670837402, 1.2641329765319824, 2.468035936355591, 3.671938896179199, 4.875842094421387, 6.079744815826416, 7.283647537231445, 8.487550735473633, 9.69145393371582, 10.895357131958008, 12.099259376525879, 13.303162574768066, 14.507065773010254, 15.710968017578125, 16.914871215820312, 18.1187744140625, 19.322677612304688, 20.526580810546875, 21.730484008789062, 22.93438720703125, 24.138290405273438, 25.342191696166992, 26.54609489440918, 27.749998092651367, 28.953901290893555, 30.157804489135742, 31.36170768737793, 32.565608978271484, 33.76951217651367, 34.97341537475586, 36.17731857299805, 37.381221771240234]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 8.0, 10.0, 6.0, 16.0, 14.0, 15.0, 19.0, 29.0, 18.0, 21.0, 21.0, 34.0, 31.0, 34.0, 36.0, 41.0, 58.0, 47.0, 39.0, 38.0, 38.0, 42.0, 45.0, 34.0, 36.0, 31.0, 25.0, 26.0, 29.0, 18.0, 24.0, 19.0, 20.0, 14.0, 10.0, 8.0, 10.0, 7.0, 7.0, 4.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.2109375, -6.971923828125, -6.73291015625, -6.493896484375, -6.2548828125, -6.015869140625, -5.77685546875, -5.537841796875, -5.298828125, -5.059814453125, -4.82080078125, -4.581787109375, -4.3427734375, -4.103759765625, -3.86474609375, -3.625732421875, -3.38671875, -3.147705078125, -2.90869140625, -2.669677734375, -2.4306640625, -2.191650390625, -1.95263671875, -1.713623046875, -1.474609375, -1.235595703125, -0.99658203125, -0.757568359375, -0.5185546875, -0.279541015625, -0.04052734375, 0.198486328125, 0.4375, 0.676513671875, 0.91552734375, 1.154541015625, 1.3935546875, 1.632568359375, 1.87158203125, 2.110595703125, 2.349609375, 2.588623046875, 2.82763671875, 3.066650390625, 3.3056640625, 3.544677734375, 3.78369140625, 4.022705078125, 4.26171875, 4.500732421875, 4.73974609375, 4.978759765625, 5.2177734375, 5.456787109375, 5.69580078125, 5.934814453125, 6.173828125, 6.412841796875, 6.65185546875, 6.890869140625, 7.1298828125, 7.368896484375, 7.60791015625, 7.846923828125, 8.0859375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 5.0, 11.0, 21.0, 21.0, 24.0, 34.0, 53.0, 75.0, 117.0, 137.0, 192.0, 255.0, 349.0, 538.0, 937.0, 1953.0, 4646.0, 14872.0, 78215.0, 2272957.0, 1737448.0, 59731.0, 12775.0, 4381.0, 1874.0, 907.0, 518.0, 344.0, 244.0, 183.0, 107.0, 84.0, 70.0, 49.0, 35.0, 27.0, 24.0, 20.0, 7.0, 9.0, 10.0, 6.0, 7.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.90625, -26.87060546875, -25.8349609375, -24.79931640625, -23.763671875, -22.72802734375, -21.6923828125, -20.65673828125, -19.62109375, -18.58544921875, -17.5498046875, -16.51416015625, -15.478515625, -14.44287109375, -13.4072265625, -12.37158203125, -11.3359375, -10.30029296875, -9.2646484375, -8.22900390625, -7.193359375, -6.15771484375, -5.1220703125, -4.08642578125, -3.05078125, -2.01513671875, -0.9794921875, 0.05615234375, 1.091796875, 2.12744140625, 3.1630859375, 4.19873046875, 5.234375, 6.27001953125, 7.3056640625, 8.34130859375, 9.376953125, 10.41259765625, 11.4482421875, 12.48388671875, 13.51953125, 14.55517578125, 15.5908203125, 16.62646484375, 17.662109375, 18.69775390625, 19.7333984375, 20.76904296875, 21.8046875, 22.84033203125, 23.8759765625, 24.91162109375, 25.947265625, 26.98291015625, 28.0185546875, 29.05419921875, 30.08984375, 31.12548828125, 32.1611328125, 33.19677734375, 34.232421875, 35.26806640625, 36.3037109375, 37.33935546875, 38.375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 7.0, 15.0, 17.0, 26.0, 39.0, 66.0, 98.0, 178.0, 348.0, 608.0, 858.0, 753.0, 445.0, 238.0, 156.0, 70.0, 52.0, 28.0, 28.0, 15.0, 4.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-28.171875, -27.5126953125, -26.853515625, -26.1943359375, -25.53515625, -24.8759765625, -24.216796875, -23.5576171875, -22.8984375, -22.2392578125, -21.580078125, -20.9208984375, -20.26171875, -19.6025390625, -18.943359375, -18.2841796875, -17.625, -16.9658203125, -16.306640625, -15.6474609375, -14.98828125, -14.3291015625, -13.669921875, -13.0107421875, -12.3515625, -11.6923828125, -11.033203125, -10.3740234375, -9.71484375, -9.0556640625, -8.396484375, -7.7373046875, -7.078125, -6.4189453125, -5.759765625, -5.1005859375, -4.44140625, -3.7822265625, -3.123046875, -2.4638671875, -1.8046875, -1.1455078125, -0.486328125, 0.1728515625, 0.83203125, 1.4912109375, 2.150390625, 2.8095703125, 3.46875, 4.1279296875, 4.787109375, 5.4462890625, 6.10546875, 6.7646484375, 7.423828125, 8.0830078125, 8.7421875, 9.4013671875, 10.060546875, 10.7197265625, 11.37890625, 12.0380859375, 12.697265625, 13.3564453125, 14.015625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 5.0, 0.0, 2.0, 6.0, 4.0, 9.0, 9.0, 11.0, 9.0, 16.0, 15.0, 27.0, 33.0, 47.0, 63.0, 67.0, 79.0, 119.0, 195.0, 294.0, 489.0, 1024.0, 2788.0, 8131.0, 29659.0, 156763.0, 2441680.0, 1414089.0, 105472.0, 22456.0, 6329.0, 2221.0, 912.0, 480.0, 239.0, 135.0, 127.0, 67.0, 46.0, 36.0, 28.0, 27.0, 22.0, 10.0, 18.0, 12.0, 6.0, 3.0, 7.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.828125, -18.21875, -17.609375, -17.0, -16.390625, -15.78125, -15.171875, -14.5625, -13.953125, -13.34375, -12.734375, -12.125, -11.515625, -10.90625, -10.296875, -9.6875, -9.078125, -8.46875, -7.859375, -7.25, -6.640625, -6.03125, -5.421875, -4.8125, -4.203125, -3.59375, -2.984375, -2.375, -1.765625, -1.15625, -0.546875, 0.0625, 0.671875, 1.28125, 1.890625, 2.5, 3.109375, 3.71875, 4.328125, 4.9375, 5.546875, 6.15625, 6.765625, 7.375, 7.984375, 8.59375, 9.203125, 9.8125, 10.421875, 11.03125, 11.640625, 12.25, 12.859375, 13.46875, 14.078125, 14.6875, 15.296875, 15.90625, 16.515625, 17.125, 17.734375, 18.34375, 18.953125, 19.5625, 20.171875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 3.0, 6.0, 9.0, 13.0, 13.0, 16.0, 26.0, 34.0, 26.0, 53.0, 67.0, 76.0, 79.0, 89.0, 80.0, 73.0, 71.0, 49.0, 39.0, 47.0, 28.0, 20.0, 17.0, 13.0, 14.0, 12.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-91.79130554199219, -89.21698760986328, -86.64266204833984, -84.06834411621094, -81.4940185546875, -78.9197006225586, -76.34538269042969, -73.77105712890625, -71.19673919677734, -68.62242126464844, -66.048095703125, -63.473777770996094, -60.89945602416992, -58.32513427734375, -55.75081253051758, -53.176490783691406, -50.602169036865234, -48.02784729003906, -45.45352554321289, -42.87920379638672, -40.30488586425781, -37.73056411743164, -35.15624237060547, -32.58192443847656, -30.007600784301758, -27.433279037475586, -24.858959197998047, -22.284637451171875, -19.710315704345703, -17.135995864868164, -14.561674118041992, -11.987354278564453, -9.413032531738281, -6.838711738586426, -4.264390468597412, -1.6900691986083984, 0.884251594543457, 3.4585723876953125, 6.032894134521484, 8.607213973999023, 11.181535720825195, 13.75585651397705, 16.330177307128906, 18.904499053955078, 21.47882080078125, 24.05314064025879, 26.62746238708496, 29.2017822265625, 31.776103973388672, 34.350425720214844, 36.924747467041016, 39.49906921386719, 42.073387145996094, 44.647708892822266, 47.22203063964844, 49.796348571777344, 52.37067413330078, 54.94499588012695, 57.519317626953125, 60.09363555908203, 62.6679573059082, 65.24227905273438, 67.81660461425781, 70.39092254638672, 72.96524047851562]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 9.0, 6.0, 11.0, 12.0, 18.0, 22.0, 29.0, 22.0, 36.0, 37.0, 49.0, 42.0, 54.0, 53.0, 71.0, 62.0, 61.0, 61.0, 49.0, 44.0, 33.0, 40.0, 29.0, 28.0, 23.0, 20.0, 12.0, 13.0, 11.0, 7.0, 8.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.92576599121094, -67.708984375, -65.49220275878906, -63.27542495727539, -61.05864715576172, -58.84186553955078, -56.625083923339844, -54.40830612182617, -52.1915283203125, -49.97474670410156, -47.75796890258789, -45.54118728637695, -43.32440948486328, -41.107627868652344, -38.890846252441406, -36.674068450927734, -34.4572868347168, -32.24050521850586, -30.023727416992188, -27.80694580078125, -25.590167999267578, -23.37338638305664, -21.156606674194336, -18.93982696533203, -16.723047256469727, -14.506267547607422, -12.289487838745117, -10.072707176208496, -7.855927467346191, -5.639147758483887, -3.4223670959472656, -1.205587387084961, 1.0111923217773438, 3.2279722690582275, 5.444752216339111, 7.661532402038574, 9.878312110900879, 12.095091819763184, 14.311872482299805, 16.52865219116211, 18.745431900024414, 20.96221160888672, 23.178991317749023, 25.395771026611328, 27.612552642822266, 29.829330444335938, 32.046112060546875, 34.26289367675781, 36.479671478271484, 38.69645309448242, 40.913230895996094, 43.13001251220703, 45.3467903137207, 47.56357192993164, 49.78034973144531, 51.99713134765625, 54.21391296386719, 56.430694580078125, 58.6474723815918, 60.864253997802734, 63.081031799316406, 65.29781341552734, 67.51459503173828, 69.73136901855469, 71.94815063476562]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 7.0, 4.0, 8.0, 11.0, 12.0, 8.0, 11.0, 14.0, 16.0, 25.0, 40.0, 28.0, 32.0, 42.0, 33.0, 32.0, 41.0, 40.0, 27.0, 43.0, 38.0, 32.0, 56.0, 36.0, 36.0, 48.0, 27.0, 35.0, 36.0, 20.0, 25.0, 23.0, 13.0, 20.0, 12.0, 16.0, 7.0, 7.0, 11.0, 4.0, 4.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-96.0, -93.115234375, -90.23046875, -87.345703125, -84.4609375, -81.576171875, -78.69140625, -75.806640625, -72.921875, -70.037109375, -67.15234375, -64.267578125, -61.3828125, -58.498046875, -55.61328125, -52.728515625, -49.84375, -46.958984375, -44.07421875, -41.189453125, -38.3046875, -35.419921875, -32.53515625, -29.650390625, -26.765625, -23.880859375, -20.99609375, -18.111328125, -15.2265625, -12.341796875, -9.45703125, -6.572265625, -3.6875, -0.802734375, 2.08203125, 4.966796875, 7.8515625, 10.736328125, 13.62109375, 16.505859375, 19.390625, 22.275390625, 25.16015625, 28.044921875, 30.9296875, 33.814453125, 36.69921875, 39.583984375, 42.46875, 45.353515625, 48.23828125, 51.123046875, 54.0078125, 56.892578125, 59.77734375, 62.662109375, 65.546875, 68.431640625, 71.31640625, 74.201171875, 77.0859375, 79.970703125, 82.85546875, 85.740234375, 88.625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 7.0, 6.0, 11.0, 18.0, 19.0, 42.0, 51.0, 84.0, 129.0, 193.0, 271.0, 457.0, 654.0, 943.0, 1435.0, 2162.0, 3188.0, 4928.0, 7651.0, 11372.0, 17390.0, 27254.0, 42984.0, 68931.0, 111789.0, 191741.0, 214021.0, 127683.0, 77426.0, 48398.0, 30406.0, 19762.0, 12552.0, 8386.0, 5444.0, 3663.0, 2400.0, 1595.0, 1008.0, 713.0, 471.0, 302.0, 213.0, 148.0, 86.0, 58.0, 41.0, 25.0, 13.0, 17.0, 10.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.1953125, -3.085601806640625, -2.97589111328125, -2.866180419921875, -2.7564697265625, -2.646759033203125, -2.53704833984375, -2.427337646484375, -2.317626953125, -2.207916259765625, -2.09820556640625, -1.988494873046875, -1.8787841796875, -1.769073486328125, -1.65936279296875, -1.549652099609375, -1.43994140625, -1.330230712890625, -1.22052001953125, -1.110809326171875, -1.0010986328125, -0.891387939453125, -0.78167724609375, -0.671966552734375, -0.562255859375, -0.452545166015625, -0.34283447265625, -0.233123779296875, -0.1234130859375, -0.013702392578125, 0.09600830078125, 0.205718994140625, 0.3154296875, 0.425140380859375, 0.53485107421875, 0.644561767578125, 0.7542724609375, 0.863983154296875, 0.97369384765625, 1.083404541015625, 1.193115234375, 1.302825927734375, 1.41253662109375, 1.522247314453125, 1.6319580078125, 1.741668701171875, 1.85137939453125, 1.961090087890625, 2.07080078125, 2.180511474609375, 2.29022216796875, 2.399932861328125, 2.5096435546875, 2.619354248046875, 2.72906494140625, 2.838775634765625, 2.948486328125, 3.058197021484375, 3.16790771484375, 3.277618408203125, 3.3873291015625, 3.497039794921875, 3.60675048828125, 3.716461181640625, 3.826171875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 5.0, 9.0, 14.0, 10.0, 16.0, 22.0, 12.0, 17.0, 15.0, 21.0, 29.0, 29.0, 37.0, 36.0, 28.0, 46.0, 33.0, 53.0, 46.0, 1061.0, 33.0, 46.0, 33.0, 41.0, 30.0, 22.0, 39.0, 36.0, 26.0, 23.0, 19.0, 17.0, 15.0, 12.0, 12.0, 14.0, 16.0, 6.0, 12.0, 8.0, 8.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-59.5625, -57.74853515625, -55.9345703125, -54.12060546875, -52.306640625, -50.49267578125, -48.6787109375, -46.86474609375, -45.05078125, -43.23681640625, -41.4228515625, -39.60888671875, -37.794921875, -35.98095703125, -34.1669921875, -32.35302734375, -30.5390625, -28.72509765625, -26.9111328125, -25.09716796875, -23.283203125, -21.46923828125, -19.6552734375, -17.84130859375, -16.02734375, -14.21337890625, -12.3994140625, -10.58544921875, -8.771484375, -6.95751953125, -5.1435546875, -3.32958984375, -1.515625, 0.29833984375, 2.1123046875, 3.92626953125, 5.740234375, 7.55419921875, 9.3681640625, 11.18212890625, 12.99609375, 14.81005859375, 16.6240234375, 18.43798828125, 20.251953125, 22.06591796875, 23.8798828125, 25.69384765625, 27.5078125, 29.32177734375, 31.1357421875, 32.94970703125, 34.763671875, 36.57763671875, 38.3916015625, 40.20556640625, 42.01953125, 43.83349609375, 45.6474609375, 47.46142578125, 49.275390625, 51.08935546875, 52.9033203125, 54.71728515625, 56.53125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 8.0, 12.0, 11.0, 22.0, 16.0, 22.0, 44.0, 74.0, 108.0, 186.0, 248.0, 326.0, 510.0, 771.0, 1062.0, 1602.0, 2297.0, 3635.0, 5236.0, 8196.0, 12743.0, 20532.0, 32601.0, 53416.0, 91772.0, 167776.0, 1303029.0, 161899.0, 88895.0, 52049.0, 32056.0, 19699.0, 12411.0, 7892.0, 5273.0, 3549.0, 2313.0, 1623.0, 1016.0, 701.0, 477.0, 321.0, 231.0, 161.0, 94.0, 76.0, 40.0, 27.0, 33.0, 15.0, 5.0, 5.0, 5.0, 6.0, 4.0, 4.0, 1.0, 3.0], "bins": [-3.01953125, -2.926544189453125, -2.83355712890625, -2.740570068359375, -2.6475830078125, -2.554595947265625, -2.46160888671875, -2.368621826171875, -2.275634765625, -2.182647705078125, -2.08966064453125, -1.996673583984375, -1.9036865234375, -1.810699462890625, -1.71771240234375, -1.624725341796875, -1.53173828125, -1.438751220703125, -1.34576416015625, -1.252777099609375, -1.1597900390625, -1.066802978515625, -0.97381591796875, -0.880828857421875, -0.787841796875, -0.694854736328125, -0.60186767578125, -0.508880615234375, -0.4158935546875, -0.322906494140625, -0.22991943359375, -0.136932373046875, -0.0439453125, 0.049041748046875, 0.14202880859375, 0.235015869140625, 0.3280029296875, 0.420989990234375, 0.51397705078125, 0.606964111328125, 0.699951171875, 0.792938232421875, 0.88592529296875, 0.978912353515625, 1.0718994140625, 1.164886474609375, 1.25787353515625, 1.350860595703125, 1.44384765625, 1.536834716796875, 1.62982177734375, 1.722808837890625, 1.8157958984375, 1.908782958984375, 2.00177001953125, 2.094757080078125, 2.187744140625, 2.280731201171875, 2.37371826171875, 2.466705322265625, 2.5596923828125, 2.652679443359375, 2.74566650390625, 2.838653564453125, 2.931640625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 7.0, 6.0, 6.0, 7.0, 20.0, 23.0, 13.0, 30.0, 49.0, 106.0, 143.0, 154.0, 123.0, 93.0, 66.0, 36.0, 30.0, 15.0, 12.0, 11.0, 7.0, 6.0, 4.0, 3.0, 6.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.006519317626953125, -0.0063405632972717285, -0.006161808967590332, -0.0059830546379089355, -0.005804300308227539, -0.005625545978546143, -0.005446791648864746, -0.00526803731918335, -0.005089282989501953, -0.004910528659820557, -0.00473177433013916, -0.004553020000457764, -0.004374265670776367, -0.004195511341094971, -0.004016757011413574, -0.0038380026817321777, -0.0036592483520507812, -0.0034804940223693848, -0.0033017396926879883, -0.003122985363006592, -0.0029442310333251953, -0.002765476703643799, -0.0025867223739624023, -0.002407968044281006, -0.0022292137145996094, -0.002050459384918213, -0.0018717050552368164, -0.00169295072555542, -0.0015141963958740234, -0.001335442066192627, -0.0011566877365112305, -0.000977933406829834, -0.0007991790771484375, -0.000620424747467041, -0.00044167041778564453, -0.00026291608810424805, -8.416175842285156e-05, 9.459257125854492e-05, 0.0002733469009399414, 0.0004521012306213379, 0.0006308555603027344, 0.0008096098899841309, 0.0009883642196655273, 0.0011671185493469238, 0.0013458728790283203, 0.0015246272087097168, 0.0017033815383911133, 0.0018821358680725098, 0.0020608901977539062, 0.0022396445274353027, 0.0024183988571166992, 0.0025971531867980957, 0.002775907516479492, 0.0029546618461608887, 0.003133416175842285, 0.0033121705055236816, 0.003490924835205078, 0.0036696791648864746, 0.003848433494567871, 0.004027187824249268, 0.004205942153930664, 0.0043846964836120605, 0.004563450813293457, 0.0047422051429748535, 0.00492095947265625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 2.0, 9.0, 8.0, 9.0, 7.0, 18.0, 18.0, 25.0, 38.0, 61.0, 113.0, 205.0, 403.0, 701.0, 1365.0, 2567.0, 5839.0, 14286.0, 41111.0, 159506.0, 614819.0, 144649.0, 38488.0, 13421.0, 5472.0, 2536.0, 1287.0, 699.0, 371.0, 195.0, 102.0, 64.0, 40.0, 27.0, 20.0, 13.0, 9.0, 8.0, 10.0, 8.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.02276611328125, -0.02196645736694336, -0.02116680145263672, -0.020367145538330078, -0.019567489624023438, -0.018767833709716797, -0.017968177795410156, -0.017168521881103516, -0.016368865966796875, -0.015569210052490234, -0.014769554138183594, -0.013969898223876953, -0.013170242309570312, -0.012370586395263672, -0.011570930480957031, -0.01077127456665039, -0.00997161865234375, -0.00917196273803711, -0.008372306823730469, -0.007572650909423828, -0.0067729949951171875, -0.005973339080810547, -0.005173683166503906, -0.004374027252197266, -0.003574371337890625, -0.0027747154235839844, -0.0019750595092773438, -0.0011754035949707031, -0.0003757476806640625, 0.0004239082336425781, 0.0012235641479492188, 0.0020232200622558594, 0.0028228759765625, 0.0036225318908691406, 0.004422187805175781, 0.005221843719482422, 0.0060214996337890625, 0.006821155548095703, 0.007620811462402344, 0.008420467376708984, 0.009220123291015625, 0.010019779205322266, 0.010819435119628906, 0.011619091033935547, 0.012418746948242188, 0.013218402862548828, 0.014018058776855469, 0.01481771469116211, 0.01561737060546875, 0.01641702651977539, 0.01721668243408203, 0.018016338348388672, 0.018815994262695312, 0.019615650177001953, 0.020415306091308594, 0.021214962005615234, 0.022014617919921875, 0.022814273834228516, 0.023613929748535156, 0.024413585662841797, 0.025213241577148438, 0.026012897491455078, 0.02681255340576172, 0.02761220932006836, 0.028411865234375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 2.0, 16.0, 25.0, 23.0, 34.0, 52.0, 64.0, 103.0, 119.0, 117.0, 127.0, 83.0, 52.0, 60.0, 42.0, 12.0, 21.0, 12.0, 11.0, 8.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.006828643381595612, -0.0066714719869196415, -0.006514300592243671, -0.006357129197567701, -0.006199957802891731, -0.006042786408215761, -0.005885615013539791, -0.005728443618863821, -0.005571272224187851, -0.005414100829511881, -0.005256929434835911, -0.005099758040159941, -0.004942586645483971, -0.0047854152508080006, -0.0046282438561320305, -0.00447107246145606, -0.00431390106678009, -0.00415672967210412, -0.00399955827742815, -0.00384238688275218, -0.00368521548807621, -0.00352804409340024, -0.00337087269872427, -0.0032137013040483, -0.0030565294437110424, -0.0028993580490350723, -0.0027421866543591022, -0.002585015259683132, -0.002427843865007162, -0.002270672470331192, -0.002113501075655222, -0.001956329680979252, -0.0017991585191339254, -0.0016419871244579554, -0.0014848157297819853, -0.0013276443351060152, -0.0011704729404300451, -0.001013301545754075, -0.0008561300346627831, -0.0006989586399868131, -0.000541787245310843, -0.0003846158506348729, -0.00022744442685507238, -7.027300307527184e-05, 8.689839160069823e-05, 0.0002440697862766683, 0.0004012412391602993, 0.0005584126338362694, 0.0007155840285122395, 0.0008727554231882095, 0.0010299268178641796, 0.0011870982125401497, 0.0013442696072161198, 0.0015014410018920898, 0.0016586125129833817, 0.0018157839076593518, 0.00197295518592, 0.00213012658059597, 0.0022872979752719402, 0.0024444693699479103, 0.0026016407646238804, 0.0027588121592998505, 0.0029159835539758205, 0.0030731549486517906, 0.0032303265761584044]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 2.0, 2.0, 3.0, 6.0, 5.0, 7.0, 8.0, 13.0, 18.0, 10.0, 10.0, 14.0, 23.0, 21.0, 31.0, 31.0, 39.0, 34.0, 27.0, 36.0, 31.0, 36.0, 35.0, 45.0, 29.0, 28.0, 45.0, 37.0, 37.0, 29.0, 44.0, 34.0, 20.0, 30.0, 25.0, 27.0, 24.0, 16.0, 13.0, 16.0, 9.0, 9.0, 10.0, 5.0, 7.0, 5.0, 6.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.0022095441818237305, -0.0021430132910609245, -0.0020764824002981186, -0.0020099515095353127, -0.0019434206187725067, -0.0018768897280097008, -0.0018103588372468948, -0.001743827946484089, -0.001677297055721283, -0.001610766164958477, -0.001544235274195671, -0.0014777043834328651, -0.0014111734926700592, -0.0013446426019072533, -0.0012781117111444473, -0.0012115808203816414, -0.0011450499296188354, -0.0010785190388560295, -0.0010119881480932236, -0.0009454572573304176, -0.0008789263665676117, -0.0008123954758048058, -0.0007458645850419998, -0.0006793336942791939, -0.0006128028035163879, -0.000546271912753582, -0.00047974102199077606, -0.0004132101312279701, -0.0003466792404651642, -0.00028014834970235825, -0.0002136174589395523, -0.00014708656817674637, -8.055567741394043e-05, -1.4024786651134491e-05, 5.250610411167145e-05, 0.00011903699487447739, 0.00018556788563728333, 0.00025209877640008926, 0.0003186296671628952, 0.00038516055792570114, 0.0004516914486885071, 0.000518222339451313, 0.000584753230214119, 0.0006512841209769249, 0.0007178150117397308, 0.0007843459025025368, 0.0008508767932653427, 0.0009174076840281487, 0.0009839385747909546, 0.0010504694655537605, 0.0011170003563165665, 0.0011835312470793724, 0.0012500621378421783, 0.0013165930286049843, 0.0013831239193677902, 0.0014496548101305962, 0.001516185700893402, 0.001582716591656208, 0.001649247482419014, 0.00171577837318182, 0.0017823092639446259, 0.0018488401547074318, 0.0019153710454702377, 0.0019819019362330437, 0.0020484328269958496]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 7.0, 4.0, 8.0, 11.0, 12.0, 8.0, 11.0, 14.0, 16.0, 25.0, 40.0, 28.0, 32.0, 42.0, 33.0, 32.0, 41.0, 40.0, 27.0, 43.0, 38.0, 33.0, 55.0, 36.0, 36.0, 47.0, 28.0, 35.0, 36.0, 20.0, 25.0, 23.0, 13.0, 20.0, 12.0, 16.0, 6.0, 8.0, 11.0, 4.0, 4.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-96.0, -93.115234375, -90.23046875, -87.345703125, -84.4609375, -81.576171875, -78.69140625, -75.806640625, -72.921875, -70.037109375, -67.15234375, -64.267578125, -61.3828125, -58.498046875, -55.61328125, -52.728515625, -49.84375, -46.958984375, -44.07421875, -41.189453125, -38.3046875, -35.419921875, -32.53515625, -29.650390625, -26.765625, -23.880859375, -20.99609375, -18.111328125, -15.2265625, -12.341796875, -9.45703125, -6.572265625, -3.6875, -0.802734375, 2.08203125, 4.966796875, 7.8515625, 10.736328125, 13.62109375, 16.505859375, 19.390625, 22.275390625, 25.16015625, 28.044921875, 30.9296875, 33.814453125, 36.69921875, 39.583984375, 42.46875, 45.353515625, 48.23828125, 51.123046875, 54.0078125, 56.892578125, 59.77734375, 62.662109375, 65.546875, 68.431640625, 71.31640625, 74.201171875, 77.0859375, 79.970703125, 82.85546875, 85.740234375, 88.625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 8.0, 11.0, 12.0, 13.0, 21.0, 20.0, 35.0, 42.0, 57.0, 65.0, 85.0, 127.0, 168.0, 230.0, 398.0, 647.0, 1310.0, 2845.0, 6721.0, 18497.0, 61082.0, 236245.0, 480986.0, 168851.0, 44986.0, 14346.0, 5551.0, 2267.0, 1150.0, 604.0, 368.0, 180.0, 135.0, 97.0, 84.0, 68.0, 47.0, 43.0, 30.0, 24.0, 21.0, 18.0, 14.0, 11.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-14.5546875, -14.11865234375, -13.6826171875, -13.24658203125, -12.810546875, -12.37451171875, -11.9384765625, -11.50244140625, -11.06640625, -10.63037109375, -10.1943359375, -9.75830078125, -9.322265625, -8.88623046875, -8.4501953125, -8.01416015625, -7.578125, -7.14208984375, -6.7060546875, -6.27001953125, -5.833984375, -5.39794921875, -4.9619140625, -4.52587890625, -4.08984375, -3.65380859375, -3.2177734375, -2.78173828125, -2.345703125, -1.90966796875, -1.4736328125, -1.03759765625, -0.6015625, -0.16552734375, 0.2705078125, 0.70654296875, 1.142578125, 1.57861328125, 2.0146484375, 2.45068359375, 2.88671875, 3.32275390625, 3.7587890625, 4.19482421875, 4.630859375, 5.06689453125, 5.5029296875, 5.93896484375, 6.375, 6.81103515625, 7.2470703125, 7.68310546875, 8.119140625, 8.55517578125, 8.9912109375, 9.42724609375, 9.86328125, 10.29931640625, 10.7353515625, 11.17138671875, 11.607421875, 12.04345703125, 12.4794921875, 12.91552734375, 13.3515625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 8.0, 13.0, 13.0, 14.0, 25.0, 27.0, 44.0, 51.0, 47.0, 57.0, 68.0, 67.0, 2074.0, 107.0, 58.0, 62.0, 61.0, 68.0, 37.0, 34.0, 30.0, 18.0, 18.0, 8.0, 14.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-233.625, -227.267578125, -220.91015625, -214.552734375, -208.1953125, -201.837890625, -195.48046875, -189.123046875, -182.765625, -176.408203125, -170.05078125, -163.693359375, -157.3359375, -150.978515625, -144.62109375, -138.263671875, -131.90625, -125.548828125, -119.19140625, -112.833984375, -106.4765625, -100.119140625, -93.76171875, -87.404296875, -81.046875, -74.689453125, -68.33203125, -61.974609375, -55.6171875, -49.259765625, -42.90234375, -36.544921875, -30.1875, -23.830078125, -17.47265625, -11.115234375, -4.7578125, 1.599609375, 7.95703125, 14.314453125, 20.671875, 27.029296875, 33.38671875, 39.744140625, 46.1015625, 52.458984375, 58.81640625, 65.173828125, 71.53125, 77.888671875, 84.24609375, 90.603515625, 96.9609375, 103.318359375, 109.67578125, 116.033203125, 122.390625, 128.748046875, 135.10546875, 141.462890625, 147.8203125, 154.177734375, 160.53515625, 166.892578125, 173.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 9.0, 7.0, 4.0, 18.0, 19.0, 41.0, 43.0, 63.0, 85.0, 131.0, 211.0, 355.0, 554.0, 1019.0, 2384.0, 8939.0, 78084.0, 2868548.0, 165138.0, 14049.0, 2969.0, 1252.0, 643.0, 385.0, 238.0, 144.0, 95.0, 72.0, 43.0, 38.0, 32.0, 21.0, 13.0, 10.0, 8.0, 5.0, 5.0, 8.0, 5.0, 3.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.234375, -25.284912109375, -24.33544921875, -23.385986328125, -22.4365234375, -21.487060546875, -20.53759765625, -19.588134765625, -18.638671875, -17.689208984375, -16.73974609375, -15.790283203125, -14.8408203125, -13.891357421875, -12.94189453125, -11.992431640625, -11.04296875, -10.093505859375, -9.14404296875, -8.194580078125, -7.2451171875, -6.295654296875, -5.34619140625, -4.396728515625, -3.447265625, -2.497802734375, -1.54833984375, -0.598876953125, 0.3505859375, 1.300048828125, 2.24951171875, 3.198974609375, 4.1484375, 5.097900390625, 6.04736328125, 6.996826171875, 7.9462890625, 8.895751953125, 9.84521484375, 10.794677734375, 11.744140625, 12.693603515625, 13.64306640625, 14.592529296875, 15.5419921875, 16.491455078125, 17.44091796875, 18.390380859375, 19.33984375, 20.289306640625, 21.23876953125, 22.188232421875, 23.1376953125, 24.087158203125, 25.03662109375, 25.986083984375, 26.935546875, 27.885009765625, 28.83447265625, 29.783935546875, 30.7333984375, 31.682861328125, 32.63232421875, 33.581787109375, 34.53125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 12.0, 17.0, 44.0, 101.0, 260.0, 282.0, 159.0, 52.0, 21.0, 16.0, 8.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-219.9298553466797, -207.06796264648438, -194.20608520507812, -181.34420776367188, -168.48231506347656, -155.62042236328125, -142.758544921875, -129.89666748046875, -117.03477478027344, -104.17288970947266, -91.31100463867188, -78.4491195678711, -65.58723449707031, -52.72534942626953, -39.86346435546875, -27.00157928466797, -14.139694213867188, -1.2778091430664062, 11.584075927734375, 24.445960998535156, 37.30784606933594, 50.16973114013672, 63.0316162109375, 75.89350128173828, 88.75538635253906, 101.61727142333984, 114.47915649414062, 127.3410415649414, 140.2029266357422, 153.0648193359375, 165.92669677734375, 178.78857421875, 191.65045166015625, 204.5123291015625, 217.3742218017578, 230.23611450195312, 243.09799194335938, 255.95986938476562, 268.82177734375, 281.68365478515625, 294.5455322265625, 307.40740966796875, 320.269287109375, 333.1311950683594, 345.9930725097656, 358.8549499511719, 371.71685791015625, 384.5787353515625, 397.44061279296875, 410.302490234375, 423.16436767578125, 436.0262756347656, 448.8881530761719, 461.7500305175781, 474.6119384765625, 487.47381591796875, 500.335693359375, 513.1975708007812, 526.0594482421875, 538.9213256835938, 551.783203125, 564.6451416015625, 577.5070190429688, 590.368896484375, 603.2307739257812]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 5.0, 8.0, 10.0, 18.0, 19.0, 18.0, 8.0, 34.0, 27.0, 36.0, 45.0, 37.0, 50.0, 48.0, 54.0, 74.0, 51.0, 51.0, 50.0, 41.0, 35.0, 35.0, 27.0, 30.0, 40.0, 23.0, 22.0, 14.0, 10.0, 15.0, 14.0, 10.0, 9.0, 5.0, 7.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.44200134277344, -202.90267944335938, -196.3633575439453, -189.82403564453125, -183.28469848632812, -176.74537658691406, -170.2060546875, -163.66673278808594, -157.12741088867188, -150.5880889892578, -144.04876708984375, -137.50942993164062, -130.97010803222656, -124.4307861328125, -117.89146423339844, -111.35214233398438, -104.81281280517578, -98.27349090576172, -91.73416137695312, -85.19483947753906, -78.655517578125, -72.11619567871094, -65.57686614990234, -59.03754425048828, -52.49821853637695, -45.958892822265625, -39.41957092285156, -32.880245208740234, -26.34092140197754, -19.801597595214844, -13.262271881103516, -6.722949981689453, -0.183624267578125, 6.3557000160217285, 12.895024299621582, 19.434349060058594, 25.97367286682129, 32.512996673583984, 39.05232238769531, 45.591644287109375, 52.1309700012207, 58.67029571533203, 65.2096176147461, 71.74894714355469, 78.28826904296875, 84.82759094238281, 91.36691284179688, 97.90623474121094, 104.44556427001953, 110.9848861694336, 117.52421569824219, 124.06353759765625, 130.6028594970703, 137.14218139648438, 143.6815185546875, 150.2208251953125, 156.76016235351562, 163.2994842529297, 169.83880615234375, 176.37814331054688, 182.91746520996094, 189.456787109375, 195.99610900878906, 202.53543090820312, 209.0747528076172]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 9.0, 17.0, 21.0, 27.0, 37.0, 60.0, 81.0, 96.0, 154.0, 156.0, 223.0, 358.0, 920.0, 3063.0, 18819.0, 1019169.0, 3162.0, 864.0, 385.0, 252.0, 173.0, 121.0, 107.0, 74.0, 51.0, 48.0, 32.0, 15.0, 23.0, 11.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.69109344482422, -59.22428512573242, -56.757476806640625, -54.29066848754883, -51.82386016845703, -49.357051849365234, -46.89024353027344, -44.42343521118164, -41.956626892089844, -39.48981857299805, -37.02301025390625, -34.55620193481445, -32.089393615722656, -29.62258529663086, -27.155776977539062, -24.688968658447266, -22.22216033935547, -19.755352020263672, -17.288543701171875, -14.821735382080078, -12.354927062988281, -9.888118743896484, -7.4213104248046875, -4.954502105712891, -2.4876937866210938, -0.020885467529296875, 2.4459228515625, 4.912731170654297, 7.379539489746094, 9.84634780883789, 12.313156127929688, 14.779964447021484, 17.246780395507812, 19.71358871459961, 22.180397033691406, 24.647205352783203, 27.114013671875, 29.580821990966797, 32.047630310058594, 34.51443862915039, 36.98124694824219, 39.448055267333984, 41.91486358642578, 44.38167190551758, 46.848480224609375, 49.31528854370117, 51.78209686279297, 54.248905181884766, 56.71571350097656, 59.18252182006836, 61.649330139160156, 64.11613464355469, 66.58294677734375, 69.04975891113281, 71.51656341552734, 73.98336791992188, 76.45018005371094, 78.9169921875, 81.38379669189453, 83.85060119628906, 86.31741333007812, 88.78422546386719, 91.25102996826172, 93.71783447265625, 96.18464660644531]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 3.0, 12.0, 12.0, 23.0, 44.0, 75.0, 98.0, 264.0, 51461152.0, 1280.0, 87.0, 48.0, 13.0, 12.0, 14.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1333.872802734375, -1262.6396484375, -1191.4066162109375, -1120.1734619140625, -1048.9404296875, -977.707275390625, -906.47412109375, -835.2410278320312, -764.0079345703125, -692.7748413085938, -621.541748046875, -550.30859375, -479.07550048828125, -407.8424072265625, -336.6092834472656, -265.37615966796875, -194.14306640625, -122.90995788574219, -51.676849365234375, 19.556259155273438, 90.78936767578125, 162.0224609375, 233.25558471679688, 304.48870849609375, 375.7218017578125, 446.95489501953125, 518.18798828125, 589.421142578125, 660.6542358398438, 731.8873291015625, 803.1204833984375, 874.3535766601562, 945.5869140625, 1016.8200073242188, 1088.0531005859375, 1159.2862548828125, 1230.519287109375, 1301.75244140625, 1372.985595703125, 1444.21875, 1515.4517822265625, 1586.6849365234375, 1657.91796875, 1729.151123046875, 1800.38427734375, 1871.6173095703125, 1942.8504638671875, 2014.08349609375, 2085.316650390625, 2156.5498046875, 2227.782958984375, 2299.015869140625, 2370.2490234375, 2441.482177734375, 2512.71533203125, 2583.948486328125, 2655.181640625, 2726.414794921875, 2797.64794921875, 2868.880859375, 2940.114013671875, 3011.34716796875, 3082.580322265625, 3153.8134765625, 3225.04638671875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [5.0, 2.0, 9.0, 17.0, 13.0, 28.0, 45.0, 87.0, 130.0, 171.0, 287.0, 404.0, 513.0, 792.0, 1142.0, 1736.0, 2455.0, 3389.0, 4951.0, 7019.0, 10164.0, 13943.0, 19905.0, 28626.0, 42515.0, 61402.0, 90923.0, 136972.0, 212281.0, 339661.0, 753858.0, 3516213.0, 365068.0, 226110.0, 146436.0, 96844.0, 65054.0, 43158.0, 29787.0, 20764.0, 14106.0, 10249.0, 7402.0, 5136.0, 3564.0, 2483.0, 1731.0, 1351.0, 875.0, 566.0, 368.0, 241.0, 176.0, 106.0, 76.0, 54.0, 28.0, 24.0, 21.0, 7.0, 3.0, 2.0, 4.0, 4.0], "bins": [-0.84765625, -0.82037353515625, -0.7930908203125, -0.76580810546875, -0.738525390625, -0.71124267578125, -0.6839599609375, -0.65667724609375, -0.62939453125, -0.60211181640625, -0.5748291015625, -0.54754638671875, -0.520263671875, -0.49298095703125, -0.4656982421875, -0.43841552734375, -0.4111328125, -0.38385009765625, -0.3565673828125, -0.32928466796875, -0.302001953125, -0.27471923828125, -0.2474365234375, -0.22015380859375, -0.19287109375, -0.16558837890625, -0.1383056640625, -0.11102294921875, -0.083740234375, -0.05645751953125, -0.0291748046875, -0.00189208984375, 0.025390625, 0.05267333984375, 0.0799560546875, 0.10723876953125, 0.134521484375, 0.16180419921875, 0.1890869140625, 0.21636962890625, 0.24365234375, 0.27093505859375, 0.2982177734375, 0.32550048828125, 0.352783203125, 0.38006591796875, 0.4073486328125, 0.43463134765625, 0.4619140625, 0.48919677734375, 0.5164794921875, 0.54376220703125, 0.571044921875, 0.59832763671875, 0.6256103515625, 0.65289306640625, 0.68017578125, 0.70745849609375, 0.7347412109375, 0.76202392578125, 0.789306640625, 0.81658935546875, 0.8438720703125, 0.87115478515625, 0.8984375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 6.0, 8.0, 6.0, 8.0, 8.0, 9.0, 16.0, 13.0, 24.0, 21.0, 25.0, 30.0, 29.0, 31.0, 38.0, 26.0, 35.0, 43.0, 44.0, 39.0, 1050.0, 59.0, 38.0, 45.0, 34.0, 34.0, 43.0, 27.0, 30.0, 27.0, 28.0, 26.0, 24.0, 14.0, 15.0, 10.0, 10.0, 10.0, 9.0, 1.0, 9.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-21.296875, -20.601806640625, -19.90673828125, -19.211669921875, -18.5166015625, -17.821533203125, -17.12646484375, -16.431396484375, -15.736328125, -15.041259765625, -14.34619140625, -13.651123046875, -12.9560546875, -12.260986328125, -11.56591796875, -10.870849609375, -10.17578125, -9.480712890625, -8.78564453125, -8.090576171875, -7.3955078125, -6.700439453125, -6.00537109375, -5.310302734375, -4.615234375, -3.920166015625, -3.22509765625, -2.530029296875, -1.8349609375, -1.139892578125, -0.44482421875, 0.250244140625, 0.9453125, 1.640380859375, 2.33544921875, 3.030517578125, 3.7255859375, 4.420654296875, 5.11572265625, 5.810791015625, 6.505859375, 7.200927734375, 7.89599609375, 8.591064453125, 9.2861328125, 9.981201171875, 10.67626953125, 11.371337890625, 12.06640625, 12.761474609375, 13.45654296875, 14.151611328125, 14.8466796875, 15.541748046875, 16.23681640625, 16.931884765625, 17.626953125, 18.322021484375, 19.01708984375, 19.712158203125, 20.4072265625, 21.102294921875, 21.79736328125, 22.492431640625, 23.1875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [7.0, 16.0, 16.0, 20.0, 29.0, 38.0, 68.0, 103.0, 137.0, 211.0, 264.0, 437.0, 676.0, 804.0, 1109.0, 1705.0, 2428.0, 3487.0, 5093.0, 7185.0, 10734.0, 14955.0, 21819.0, 31267.0, 45911.0, 66778.0, 98442.0, 147554.0, 223210.0, 337975.0, 768068.0, 3425171.0, 356987.0, 233995.0, 155807.0, 103673.0, 69706.0, 47731.0, 33269.0, 22777.0, 15642.0, 10829.0, 7406.0, 5422.0, 3779.0, 2746.0, 1847.0, 1249.0, 875.0, 642.0, 382.0, 301.0, 194.0, 145.0, 98.0, 93.0, 45.0, 43.0, 15.0, 9.0, 13.0, 10.0, 6.0, 3.0], "bins": [-0.66552734375, -0.64410400390625, -0.6226806640625, -0.60125732421875, -0.579833984375, -0.55841064453125, -0.5369873046875, -0.51556396484375, -0.494140625, -0.47271728515625, -0.4512939453125, -0.42987060546875, -0.408447265625, -0.38702392578125, -0.3656005859375, -0.34417724609375, -0.32275390625, -0.30133056640625, -0.2799072265625, -0.25848388671875, -0.237060546875, -0.21563720703125, -0.1942138671875, -0.17279052734375, -0.1513671875, -0.12994384765625, -0.1085205078125, -0.08709716796875, -0.065673828125, -0.04425048828125, -0.0228271484375, -0.00140380859375, 0.02001953125, 0.04144287109375, 0.0628662109375, 0.08428955078125, 0.105712890625, 0.12713623046875, 0.1485595703125, 0.16998291015625, 0.19140625, 0.21282958984375, 0.2342529296875, 0.25567626953125, 0.277099609375, 0.29852294921875, 0.3199462890625, 0.34136962890625, 0.36279296875, 0.38421630859375, 0.4056396484375, 0.42706298828125, 0.448486328125, 0.46990966796875, 0.4913330078125, 0.51275634765625, 0.5341796875, 0.55560302734375, 0.5770263671875, 0.59844970703125, 0.619873046875, 0.64129638671875, 0.6627197265625, 0.68414306640625, 0.70556640625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 10.0, 13.0, 9.0, 17.0, 10.0, 20.0, 11.0, 21.0, 23.0, 19.0, 28.0, 26.0, 36.0, 38.0, 38.0, 42.0, 34.0, 25.0, 43.0, 1054.0, 34.0, 32.0, 51.0, 41.0, 29.0, 39.0, 26.0, 31.0, 32.0, 23.0, 24.0, 25.0, 9.0, 17.0, 10.0, 17.0, 12.0, 14.0, 9.0, 5.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.671875, -16.157470703125, -15.64306640625, -15.128662109375, -14.6142578125, -14.099853515625, -13.58544921875, -13.071044921875, -12.556640625, -12.042236328125, -11.52783203125, -11.013427734375, -10.4990234375, -9.984619140625, -9.47021484375, -8.955810546875, -8.44140625, -7.927001953125, -7.41259765625, -6.898193359375, -6.3837890625, -5.869384765625, -5.35498046875, -4.840576171875, -4.326171875, -3.811767578125, -3.29736328125, -2.782958984375, -2.2685546875, -1.754150390625, -1.23974609375, -0.725341796875, -0.2109375, 0.303466796875, 0.81787109375, 1.332275390625, 1.8466796875, 2.361083984375, 2.87548828125, 3.389892578125, 3.904296875, 4.418701171875, 4.93310546875, 5.447509765625, 5.9619140625, 6.476318359375, 6.99072265625, 7.505126953125, 8.01953125, 8.533935546875, 9.04833984375, 9.562744140625, 10.0771484375, 10.591552734375, 11.10595703125, 11.620361328125, 12.134765625, 12.649169921875, 13.16357421875, 13.677978515625, 14.1923828125, 14.706787109375, 15.22119140625, 15.735595703125, 16.25]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 5.0, 2.0, 6.0, 2.0, 5.0, 5.0, 17.0, 20.0, 14.0, 23.0, 15.0, 41.0, 47.0, 75.0, 99.0, 97.0, 134.0, 204.0, 203.0, 307.0, 413.0, 631.0, 947.0, 1550.0, 2538.0, 4273.0, 8225.0, 16822.0, 37119.0, 101221.0, 5776834.0, 215639.0, 68114.0, 26859.0, 12834.0, 6280.0, 3679.0, 1961.0, 1203.0, 834.0, 548.0, 371.0, 271.0, 244.0, 171.0, 86.0, 100.0, 54.0, 64.0, 51.0, 33.0, 42.0, 47.0, 21.0, 10.0, 10.0, 6.0, 7.0, 7.0, 3.0, 3.0], "bins": [-2.728515625, -2.6478271484375, -2.567138671875, -2.4864501953125, -2.40576171875, -2.3250732421875, -2.244384765625, -2.1636962890625, -2.0830078125, -2.0023193359375, -1.921630859375, -1.8409423828125, -1.76025390625, -1.6795654296875, -1.598876953125, -1.5181884765625, -1.4375, -1.3568115234375, -1.276123046875, -1.1954345703125, -1.11474609375, -1.0340576171875, -0.953369140625, -0.8726806640625, -0.7919921875, -0.7113037109375, -0.630615234375, -0.5499267578125, -0.46923828125, -0.3885498046875, -0.307861328125, -0.2271728515625, -0.146484375, -0.0657958984375, 0.014892578125, 0.0955810546875, 0.17626953125, 0.2569580078125, 0.337646484375, 0.4183349609375, 0.4990234375, 0.5797119140625, 0.660400390625, 0.7410888671875, 0.82177734375, 0.9024658203125, 0.983154296875, 1.0638427734375, 1.14453125, 1.2252197265625, 1.305908203125, 1.3865966796875, 1.46728515625, 1.5479736328125, 1.628662109375, 1.7093505859375, 1.7900390625, 1.8707275390625, 1.951416015625, 2.0321044921875, 2.11279296875, 2.1934814453125, 2.274169921875, 2.3548583984375, 2.435546875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 6.0, 6.0, 10.0, 4.0, 16.0, 22.0, 14.0, 15.0, 21.0, 22.0, 17.0, 27.0, 24.0, 31.0, 31.0, 40.0, 38.0, 36.0, 28.0, 33.0, 445.0, 649.0, 27.0, 41.0, 30.0, 35.0, 37.0, 33.0, 33.0, 30.0, 22.0, 21.0, 13.0, 15.0, 19.0, 18.0, 21.0, 19.0, 13.0, 13.0, 6.0, 4.0, 7.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-11.8046875, -11.43603515625, -11.0673828125, -10.69873046875, -10.330078125, -9.96142578125, -9.5927734375, -9.22412109375, -8.85546875, -8.48681640625, -8.1181640625, -7.74951171875, -7.380859375, -7.01220703125, -6.6435546875, -6.27490234375, -5.90625, -5.53759765625, -5.1689453125, -4.80029296875, -4.431640625, -4.06298828125, -3.6943359375, -3.32568359375, -2.95703125, -2.58837890625, -2.2197265625, -1.85107421875, -1.482421875, -1.11376953125, -0.7451171875, -0.37646484375, -0.0078125, 0.36083984375, 0.7294921875, 1.09814453125, 1.466796875, 1.83544921875, 2.2041015625, 2.57275390625, 2.94140625, 3.31005859375, 3.6787109375, 4.04736328125, 4.416015625, 4.78466796875, 5.1533203125, 5.52197265625, 5.890625, 6.25927734375, 6.6279296875, 6.99658203125, 7.365234375, 7.73388671875, 8.1025390625, 8.47119140625, 8.83984375, 9.20849609375, 9.5771484375, 9.94580078125, 10.314453125, 10.68310546875, 11.0517578125, 11.42041015625, 11.7890625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 9.0, 7.0, 31.0, 61.0, 147.0, 468.0, 173.0, 63.0, 20.0, 14.0, 7.0, 5.0, 4.0, 1.0], "bins": [-115.35600280761719, -113.27873992919922, -111.20148468017578, -109.12422180175781, -107.04696655273438, -104.9697036743164, -102.89244842529297, -100.815185546875, -98.73793029785156, -96.6606674194336, -94.58341217041016, -92.50614929199219, -90.42889404296875, -88.35163116455078, -86.27437591552734, -84.19711303710938, -82.11985778808594, -80.04259490966797, -77.96533966064453, -75.88807678222656, -73.81082153320312, -71.73355865478516, -69.65630340576172, -67.57904052734375, -65.50177764892578, -63.42451858520508, -61.347259521484375, -59.27000045776367, -57.19274139404297, -55.115482330322266, -53.03822326660156, -50.960960388183594, -48.88370895385742, -46.80644989013672, -44.729190826416016, -42.65193176269531, -40.57467269897461, -38.497413635253906, -36.42015075683594, -34.3428955078125, -32.26563262939453, -30.188373565673828, -28.111114501953125, -26.033855438232422, -23.95659637451172, -21.879337310791016, -19.80207633972168, -17.724817276000977, -15.647560119628906, -13.570301055908203, -11.4930419921875, -9.41578197479248, -7.338522911071777, -5.261263847351074, -3.1840038299560547, -1.1067447662353516, 0.9705142974853516, 3.047773599624634, 5.125032901763916, 7.202292442321777, 9.27955150604248, 11.356810569763184, 13.434070587158203, 15.511329650878906, 17.58858871459961]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 8.0, 10.0, 9.0, 17.0, 8.0, 21.0, 20.0, 24.0, 25.0, 31.0, 23.0, 30.0, 28.0, 48.0, 34.0, 35.0, 39.0, 45.0, 37.0, 46.0, 44.0, 27.0, 41.0, 50.0, 26.0, 34.0, 34.0, 33.0, 24.0, 28.0, 13.0, 16.0, 13.0, 18.0, 11.0, 7.0, 8.0, 8.0, 4.0, 1.0, 5.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.787487030029297, -25.029155731201172, -24.270824432373047, -23.512493133544922, -22.754161834716797, -21.995830535888672, -21.237499237060547, -20.479167938232422, -19.720836639404297, -18.962505340576172, -18.204174041748047, -17.445842742919922, -16.687511444091797, -15.929180145263672, -15.170848846435547, -14.412517547607422, -13.65418529510498, -12.895853996276855, -12.13752269744873, -11.379191398620605, -10.62086009979248, -9.862528800964355, -9.104196548461914, -8.345865249633789, -7.587534427642822, -6.829203128814697, -6.070871829986572, -5.312540054321289, -4.554208755493164, -3.795877695083618, -3.037546157836914, -2.279214859008789, -1.520883560180664, -0.7625522017478943, -0.004220843315124512, 0.75411057472229, 1.512441873550415, 2.27077317237854, 3.029104709625244, 3.787436008453369, 4.545767307281494, 5.304098606109619, 6.062429904937744, 6.820761680603027, 7.579092979431152, 8.337424278259277, 9.095755577087402, 9.854086875915527, 10.612418174743652, 11.370749473571777, 12.129080772399902, 12.887412071228027, 13.645743370056152, 14.404074668884277, 15.162406921386719, 15.920738220214844, 16.67906951904297, 17.437400817871094, 18.19573211669922, 18.954063415527344, 19.71239471435547, 20.470726013183594, 21.22905731201172, 21.987388610839844, 22.74571990966797]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 9.0, 13.0, 15.0, 19.0, 20.0, 23.0, 43.0, 57.0, 70.0, 87.0, 140.0, 240.0, 391.0, 576.0, 964.0, 1828.0, 3782.0, 18009.0, 4025695.0, 129534.0, 7183.0, 2289.0, 1217.0, 665.0, 413.0, 285.0, 178.0, 143.0, 93.0, 62.0, 55.0, 33.0, 30.0, 26.0, 28.0, 16.0, 9.0, 11.0, 7.0, 8.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.289794921875, -0.28006744384765625, -0.2703399658203125, -0.26061248779296875, -0.250885009765625, -0.24115753173828125, -0.2314300537109375, -0.22170257568359375, -0.21197509765625, -0.20224761962890625, -0.1925201416015625, -0.18279266357421875, -0.173065185546875, -0.16333770751953125, -0.1536102294921875, -0.14388275146484375, -0.1341552734375, -0.12442779541015625, -0.1147003173828125, -0.10497283935546875, -0.095245361328125, -0.08551788330078125, -0.0757904052734375, -0.06606292724609375, -0.05633544921875, -0.04660797119140625, -0.0368804931640625, -0.02715301513671875, -0.017425537109375, -0.00769805908203125, 0.0020294189453125, 0.01175689697265625, 0.021484375, 0.03121185302734375, 0.0409393310546875, 0.05066680908203125, 0.060394287109375, 0.07012176513671875, 0.0798492431640625, 0.08957672119140625, 0.09930419921875, 0.10903167724609375, 0.1187591552734375, 0.12848663330078125, 0.138214111328125, 0.14794158935546875, 0.1576690673828125, 0.16739654541015625, 0.1771240234375, 0.18685150146484375, 0.1965789794921875, 0.20630645751953125, 0.216033935546875, 0.22576141357421875, 0.2354888916015625, 0.24521636962890625, 0.25494384765625, 0.26467132568359375, 0.2743988037109375, 0.28412628173828125, 0.293853759765625, 0.30358123779296875, 0.3133087158203125, 0.32303619384765625, 0.332763671875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 8.0, 5.0, 5.0, 6.0, 13.0, 10.0, 10.0, 12.0, 13.0, 22.0, 782.0, 26.0, 15.0, 14.0, 12.0, 9.0, 5.0, 3.0, 5.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09613037109375, -0.09288215637207031, -0.08963394165039062, -0.08638572692871094, -0.08313751220703125, -0.07988929748535156, -0.07664108276367188, -0.07339286804199219, -0.0701446533203125, -0.06689643859863281, -0.06364822387695312, -0.06040000915527344, -0.05715179443359375, -0.05390357971191406, -0.050655364990234375, -0.04740715026855469, -0.044158935546875, -0.04091072082519531, -0.037662506103515625, -0.03441429138183594, -0.03116607666015625, -0.027917861938476562, -0.024669647216796875, -0.021421432495117188, -0.0181732177734375, -0.014925003051757812, -0.011676788330078125, -0.008428573608398438, -0.00518035888671875, -0.0019321441650390625, 0.001316070556640625, 0.0045642852783203125, 0.0078125, 0.011060714721679688, 0.014308929443359375, 0.017557144165039062, 0.02080535888671875, 0.024053573608398438, 0.027301788330078125, 0.030550003051757812, 0.0337982177734375, 0.03704643249511719, 0.040294647216796875, 0.04354286193847656, 0.04679107666015625, 0.05003929138183594, 0.053287506103515625, 0.05653572082519531, 0.059783935546875, 0.06303215026855469, 0.06628036499023438, 0.06952857971191406, 0.07277679443359375, 0.07602500915527344, 0.07927322387695312, 0.08252143859863281, 0.0857696533203125, 0.08901786804199219, 0.09226608276367188, 0.09551429748535156, 0.09876251220703125, 0.10201072692871094, 0.10525894165039062, 0.10850715637207031, 0.11175537109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 8.0, 4.0, 3.0, 3.0, 16.0, 16.0, 16.0, 38.0, 46.0, 73.0, 120.0, 180.0, 235.0, 373.0, 567.0, 828.0, 1441.0, 2416.0, 4057.0, 7212.0, 14375.0, 33102.0, 132246.0, 3650657.0, 261356.0, 45835.0, 18258.0, 8897.0, 4712.0, 2707.0, 1643.0, 961.0, 636.0, 403.0, 261.0, 185.0, 140.0, 81.0, 59.0, 27.0, 32.0, 27.0, 9.0, 9.0, 12.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.22607421875, -0.219146728515625, -0.21221923828125, -0.205291748046875, -0.1983642578125, -0.191436767578125, -0.18450927734375, -0.177581787109375, -0.170654296875, -0.163726806640625, -0.15679931640625, -0.149871826171875, -0.1429443359375, -0.136016845703125, -0.12908935546875, -0.122161865234375, -0.115234375, -0.108306884765625, -0.10137939453125, -0.094451904296875, -0.0875244140625, -0.080596923828125, -0.07366943359375, -0.066741943359375, -0.059814453125, -0.052886962890625, -0.04595947265625, -0.039031982421875, -0.0321044921875, -0.025177001953125, -0.01824951171875, -0.011322021484375, -0.00439453125, 0.002532958984375, 0.00946044921875, 0.016387939453125, 0.0233154296875, 0.030242919921875, 0.03717041015625, 0.044097900390625, 0.051025390625, 0.057952880859375, 0.06488037109375, 0.071807861328125, 0.0787353515625, 0.085662841796875, 0.09259033203125, 0.099517822265625, 0.1064453125, 0.113372802734375, 0.12030029296875, 0.127227783203125, 0.1341552734375, 0.141082763671875, 0.14801025390625, 0.154937744140625, 0.161865234375, 0.168792724609375, 0.17572021484375, 0.182647705078125, 0.1895751953125, 0.196502685546875, 0.20343017578125, 0.210357666015625, 0.21728515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 8.0, 11.0, 10.0, 10.0, 15.0, 13.0, 22.0, 29.0, 47.0, 73.0, 195.0, 751.0, 1956.0, 514.0, 149.0, 74.0, 35.0, 35.0, 20.0, 21.0, 18.0, 20.0, 8.0, 8.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1275634765625, -0.12290191650390625, -0.1182403564453125, -0.11357879638671875, -0.108917236328125, -0.10425567626953125, -0.0995941162109375, -0.09493255615234375, -0.09027099609375, -0.08560943603515625, -0.0809478759765625, -0.07628631591796875, -0.071624755859375, -0.06696319580078125, -0.0623016357421875, -0.05764007568359375, -0.052978515625, -0.04831695556640625, -0.0436553955078125, -0.03899383544921875, -0.034332275390625, -0.02967071533203125, -0.0250091552734375, -0.02034759521484375, -0.01568603515625, -0.01102447509765625, -0.0063629150390625, -0.00170135498046875, 0.002960205078125, 0.00762176513671875, 0.0122833251953125, 0.01694488525390625, 0.0216064453125, 0.02626800537109375, 0.0309295654296875, 0.03559112548828125, 0.040252685546875, 0.04491424560546875, 0.0495758056640625, 0.05423736572265625, 0.05889892578125, 0.06356048583984375, 0.0682220458984375, 0.07288360595703125, 0.077545166015625, 0.08220672607421875, 0.0868682861328125, 0.09152984619140625, 0.09619140625, 0.10085296630859375, 0.1055145263671875, 0.11017608642578125, 0.114837646484375, 0.11949920654296875, 0.1241607666015625, 0.12882232666015625, 0.13348388671875, 0.13814544677734375, 0.1428070068359375, 0.14746856689453125, 0.152130126953125, 0.15679168701171875, 0.1614532470703125, 0.16611480712890625, 0.1707763671875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 8.0, 5.0, 19.0, 43.0, 149.0, 480.0, 193.0, 54.0, 26.0, 16.0, 8.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7148686647415161, -0.6844812035560608, -0.6540937423706055, -0.6237062215805054, -0.59331876039505, -0.5629312992095947, -0.5325438380241394, -0.5021563768386841, -0.47176891565322876, -0.44138145446777344, -0.4109939634799957, -0.3806065022945404, -0.3502190411090851, -0.3198315501213074, -0.28944408893585205, -0.25905662775039673, -0.22866913676261902, -0.1982816606760025, -0.16789419949054718, -0.13750672340393066, -0.10711925476789474, -0.07673178613185883, -0.04634431004524231, -0.015956848859786987, 0.014430627226829529, 0.04481809586286545, 0.07520556449890137, 0.10559304058551788, 0.1359805166721344, 0.16636797785758972, 0.19675545394420624, 0.22714291512966156, 0.2575303912162781, 0.2879178524017334, 0.3183053433895111, 0.34869280457496643, 0.37908026576042175, 0.40946775674819946, 0.4398552179336548, 0.4702426791191101, 0.5006301403045654, 0.5310176014900208, 0.5614050626754761, 0.5917925834655762, 0.6221800446510315, 0.6525675058364868, 0.6829549670219421, 0.7133424282073975, 0.7437299489974976, 0.7741174101829529, 0.8045048713684082, 0.8348923921585083, 0.8652798533439636, 0.895667314529419, 0.9260547757148743, 0.9564422369003296, 0.9868296980857849, 1.0172171592712402, 1.0476046800613403, 1.0779920816421509, 1.108379602432251, 1.1387670040130615, 1.1691545248031616, 1.1995420455932617, 1.2299294471740723]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 8.0, 19.0, 23.0, 15.0, 32.0, 43.0, 51.0, 43.0, 54.0, 50.0, 54.0, 71.0, 61.0, 66.0, 54.0, 51.0, 53.0, 46.0, 42.0, 28.0, 21.0, 21.0, 15.0, 18.0, 17.0, 5.0, 8.0, 8.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53624027967453, -0.5210390686988831, -0.5058379173278809, -0.4906367063522339, -0.4754355251789093, -0.4602343440055847, -0.44503316283226013, -0.42983198165893555, -0.4146307706832886, -0.399429589509964, -0.3842284083366394, -0.36902719736099243, -0.35382601618766785, -0.33862483501434326, -0.3234236538410187, -0.3082224726676941, -0.2930212616920471, -0.27782008051872253, -0.26261889934539795, -0.24741770327091217, -0.2322165071964264, -0.2170153260231018, -0.20181414484977722, -0.18661294877529144, -0.17141178250312805, -0.15621060132980347, -0.1410094052553177, -0.1258082240819931, -0.11060702800750732, -0.09540584683418274, -0.08020465821027756, -0.06500346958637238, -0.0498022735118866, -0.034601084887981415, -0.019399898126721382, -0.0041987113654613495, 0.011002477258443832, 0.026203662157058716, 0.0414048507809639, 0.05660603940486908, 0.07180722802877426, 0.08700841665267944, 0.10220960527658463, 0.11741079390048981, 0.1326119750738144, 0.14781317114830017, 0.16301435232162476, 0.17821553349494934, 0.19341672956943512, 0.2086179107427597, 0.22381910681724548, 0.23902028799057007, 0.25422146916389465, 0.26942265033721924, 0.2846238613128662, 0.2998250424861908, 0.3150262236595154, 0.33022740483283997, 0.34542858600616455, 0.3606297969818115, 0.3758309781551361, 0.3910321593284607, 0.4062333405017853, 0.42143452167510986, 0.43663573265075684]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 1.0, 8.0, 8.0, 8.0, 13.0, 21.0, 29.0, 33.0, 62.0, 86.0, 96.0, 147.0, 184.0, 280.0, 419.0, 635.0, 979.0, 1560.0, 2650.0, 4553.0, 8565.0, 18704.0, 56461.0, 892865.0, 31630.0, 12860.0, 6220.0, 3574.0, 2017.0, 1229.0, 855.0, 565.0, 368.0, 297.0, 172.0, 122.0, 82.0, 59.0, 59.0, 16.0, 18.0, 16.0, 12.0, 10.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43994140625, -0.42671966552734375, -0.4134979248046875, -0.40027618408203125, -0.387054443359375, -0.37383270263671875, -0.3606109619140625, -0.34738922119140625, -0.33416748046875, -0.32094573974609375, -0.3077239990234375, -0.29450225830078125, -0.281280517578125, -0.26805877685546875, -0.2548370361328125, -0.24161529541015625, -0.2283935546875, -0.21517181396484375, -0.2019500732421875, -0.18872833251953125, -0.175506591796875, -0.16228485107421875, -0.1490631103515625, -0.13584136962890625, -0.12261962890625, -0.10939788818359375, -0.0961761474609375, -0.08295440673828125, -0.069732666015625, -0.05651092529296875, -0.0432891845703125, -0.03006744384765625, -0.016845703125, -0.00362396240234375, 0.0095977783203125, 0.02281951904296875, 0.036041259765625, 0.04926300048828125, 0.0624847412109375, 0.07570648193359375, 0.08892822265625, 0.10214996337890625, 0.1153717041015625, 0.12859344482421875, 0.141815185546875, 0.15503692626953125, 0.1682586669921875, 0.18148040771484375, 0.1947021484375, 0.20792388916015625, 0.2211456298828125, 0.23436737060546875, 0.247589111328125, 0.26081085205078125, 0.2740325927734375, 0.28725433349609375, 0.30047607421875, 0.31369781494140625, 0.3269195556640625, 0.34014129638671875, 0.353363037109375, 0.36658477783203125, 0.3798065185546875, 0.39302825927734375, 0.40625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 6.0, 6.0, 8.0, 6.0, 5.0, 4.0, 17.0, 9.0, 12.0, 14.0, 15.0, 136.0, 670.0, 18.0, 16.0, 14.0, 9.0, 6.0, 5.0, 3.0, 6.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09716796875, -0.09394454956054688, -0.09072113037109375, -0.08749771118164062, -0.0842742919921875, -0.08105087280273438, -0.07782745361328125, -0.07460403442382812, -0.071380615234375, -0.06815719604492188, -0.06493377685546875, -0.061710357666015625, -0.0584869384765625, -0.055263519287109375, -0.05204010009765625, -0.048816680908203125, -0.04559326171875, -0.042369842529296875, -0.03914642333984375, -0.035923004150390625, -0.0326995849609375, -0.029476165771484375, -0.02625274658203125, -0.023029327392578125, -0.019805908203125, -0.016582489013671875, -0.01335906982421875, -0.010135650634765625, -0.0069122314453125, -0.003688812255859375, -0.00046539306640625, 0.002758026123046875, 0.0059814453125, 0.009204864501953125, 0.01242828369140625, 0.015651702880859375, 0.0188751220703125, 0.022098541259765625, 0.02532196044921875, 0.028545379638671875, 0.031768798828125, 0.034992218017578125, 0.03821563720703125, 0.041439056396484375, 0.0446624755859375, 0.047885894775390625, 0.05110931396484375, 0.054332733154296875, 0.05755615234375, 0.060779571533203125, 0.06400299072265625, 0.06722640991210938, 0.0704498291015625, 0.07367324829101562, 0.07689666748046875, 0.08012008666992188, 0.083343505859375, 0.08656692504882812, 0.08979034423828125, 0.09301376342773438, 0.0962371826171875, 0.09946060180664062, 0.10268402099609375, 0.10590744018554688, 0.109130859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 3.0, 3.0, 7.0, 9.0, 0.0, 10.0, 10.0, 12.0, 22.0, 34.0, 38.0, 55.0, 72.0, 100.0, 105.0, 194.0, 230.0, 380.0, 593.0, 1056.0, 1684.0, 2872.0, 4867.0, 8357.0, 15084.0, 27625.0, 52570.0, 109260.0, 274659.0, 307122.0, 117993.0, 56140.0, 29485.0, 15894.0, 9018.0, 5090.0, 3022.0, 1813.0, 1088.0, 622.0, 427.0, 281.0, 147.0, 135.0, 96.0, 72.0, 55.0, 51.0, 21.0, 20.0, 19.0, 4.0, 8.0, 12.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0], "bins": [-0.2015380859375, -0.19504737854003906, -0.18855667114257812, -0.1820659637451172, -0.17557525634765625, -0.1690845489501953, -0.16259384155273438, -0.15610313415527344, -0.1496124267578125, -0.14312171936035156, -0.13663101196289062, -0.1301403045654297, -0.12364959716796875, -0.11715888977050781, -0.11066818237304688, -0.10417747497558594, -0.097686767578125, -0.09119606018066406, -0.08470535278320312, -0.07821464538574219, -0.07172393798828125, -0.06523323059082031, -0.058742523193359375, -0.05225181579589844, -0.0457611083984375, -0.03927040100097656, -0.032779693603515625, -0.026288986206054688, -0.01979827880859375, -0.013307571411132812, -0.006816864013671875, -0.0003261566162109375, 0.00616455078125, 0.012655258178710938, 0.019145965576171875, 0.025636672973632812, 0.03212738037109375, 0.03861808776855469, 0.045108795166015625, 0.05159950256347656, 0.0580902099609375, 0.06458091735839844, 0.07107162475585938, 0.07756233215332031, 0.08405303955078125, 0.09054374694824219, 0.09703445434570312, 0.10352516174316406, 0.110015869140625, 0.11650657653808594, 0.12299728393554688, 0.1294879913330078, 0.13597869873046875, 0.1424694061279297, 0.14896011352539062, 0.15545082092285156, 0.1619415283203125, 0.16843223571777344, 0.17492294311523438, 0.1814136505126953, 0.18790435791015625, 0.1943950653076172, 0.20088577270507812, 0.20737648010253906, 0.2138671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 8.0, 10.0, 9.0, 9.0, 15.0, 18.0, 13.0, 17.0, 17.0, 19.0, 24.0, 35.0, 26.0, 34.0, 39.0, 31.0, 37.0, 30.0, 33.0, 37.0, 36.0, 40.0, 37.0, 38.0, 47.0, 28.0, 34.0, 30.0, 30.0, 35.0, 20.0, 21.0, 21.0, 16.0, 15.0, 12.0, 11.0, 17.0, 15.0, 12.0, 4.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.291748046875, -0.2823486328125, -0.27294921875, -0.2635498046875, -0.254150390625, -0.2447509765625, -0.2353515625, -0.2259521484375, -0.216552734375, -0.2071533203125, -0.19775390625, -0.1883544921875, -0.178955078125, -0.1695556640625, -0.16015625, -0.1507568359375, -0.141357421875, -0.1319580078125, -0.12255859375, -0.1131591796875, -0.103759765625, -0.0943603515625, -0.0849609375, -0.0755615234375, -0.066162109375, -0.0567626953125, -0.04736328125, -0.0379638671875, -0.028564453125, -0.0191650390625, -0.009765625, -0.0003662109375, 0.009033203125, 0.0184326171875, 0.02783203125, 0.0372314453125, 0.046630859375, 0.0560302734375, 0.0654296875, 0.0748291015625, 0.084228515625, 0.0936279296875, 0.10302734375, 0.1124267578125, 0.121826171875, 0.1312255859375, 0.140625, 0.1500244140625, 0.159423828125, 0.1688232421875, 0.17822265625, 0.1876220703125, 0.197021484375, 0.2064208984375, 0.2158203125, 0.2252197265625, 0.234619140625, 0.2440185546875, 0.25341796875, 0.2628173828125, 0.272216796875, 0.2816162109375, 0.291015625, 0.3004150390625, 0.309814453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 3.0, 2.0, 8.0, 7.0, 6.0, 25.0, 30.0, 44.0, 74.0, 136.0, 248.0, 539.0, 1433.0, 5306.0, 56661.0, 949558.0, 28508.0, 3859.0, 1126.0, 464.0, 218.0, 98.0, 81.0, 36.0, 23.0, 15.0, 12.0, 9.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0433349609375, -0.04195451736450195, -0.040574073791503906, -0.03919363021850586, -0.03781318664550781, -0.036432743072509766, -0.03505229949951172, -0.03367185592651367, -0.032291412353515625, -0.030910968780517578, -0.02953052520751953, -0.028150081634521484, -0.026769638061523438, -0.02538919448852539, -0.024008750915527344, -0.022628307342529297, -0.02124786376953125, -0.019867420196533203, -0.018486976623535156, -0.01710653305053711, -0.015726089477539062, -0.014345645904541016, -0.012965202331542969, -0.011584758758544922, -0.010204315185546875, -0.008823871612548828, -0.007443428039550781, -0.006062984466552734, -0.0046825408935546875, -0.0033020973205566406, -0.0019216537475585938, -0.0005412101745605469, 0.0008392333984375, 0.002219676971435547, 0.0036001205444335938, 0.004980564117431641, 0.0063610076904296875, 0.007741451263427734, 0.009121894836425781, 0.010502338409423828, 0.011882781982421875, 0.013263225555419922, 0.014643669128417969, 0.016024112701416016, 0.017404556274414062, 0.01878499984741211, 0.020165443420410156, 0.021545886993408203, 0.02292633056640625, 0.024306774139404297, 0.025687217712402344, 0.02706766128540039, 0.028448104858398438, 0.029828548431396484, 0.03120899200439453, 0.03258943557739258, 0.033969879150390625, 0.03535032272338867, 0.03673076629638672, 0.038111209869384766, 0.03949165344238281, 0.04087209701538086, 0.042252540588378906, 0.04363298416137695, 0.045013427734375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 0.0, 5.0, 14.0, 13.0, 20.0, 24.0, 23.0, 64.0, 89.0, 129.0, 182.0, 158.0, 86.0, 48.0, 40.0, 36.0, 11.0, 8.0, 8.0, 7.0, 5.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.698204040527344e-05, -5.4838135838508606e-05, -5.2694231271743774e-05, -5.055032670497894e-05, -4.840642213821411e-05, -4.626251757144928e-05, -4.411861300468445e-05, -4.197470843791962e-05, -3.9830803871154785e-05, -3.7686899304389954e-05, -3.554299473762512e-05, -3.339909017086029e-05, -3.125518560409546e-05, -2.9111281037330627e-05, -2.6967376470565796e-05, -2.4823471903800964e-05, -2.2679567337036133e-05, -2.05356627702713e-05, -1.839175820350647e-05, -1.6247853636741638e-05, -1.4103949069976807e-05, -1.1960044503211975e-05, -9.816139936447144e-06, -7.672235369682312e-06, -5.5283308029174805e-06, -3.384426236152649e-06, -1.2405216693878174e-06, 9.033828973770142e-07, 3.0472874641418457e-06, 5.191192030906677e-06, 7.335096597671509e-06, 9.47900116443634e-06, 1.1622905731201172e-05, 1.3766810297966003e-05, 1.5910714864730835e-05, 1.8054619431495667e-05, 2.0198523998260498e-05, 2.234242856502533e-05, 2.448633313179016e-05, 2.6630237698554993e-05, 2.8774142265319824e-05, 3.0918046832084656e-05, 3.306195139884949e-05, 3.520585596561432e-05, 3.734976053237915e-05, 3.949366509914398e-05, 4.1637569665908813e-05, 4.3781474232673645e-05, 4.5925378799438477e-05, 4.806928336620331e-05, 5.021318793296814e-05, 5.235709249973297e-05, 5.45009970664978e-05, 5.6644901633262634e-05, 5.8788806200027466e-05, 6.09327107667923e-05, 6.307661533355713e-05, 6.522051990032196e-05, 6.736442446708679e-05, 6.950832903385162e-05, 7.165223360061646e-05, 7.379613816738129e-05, 7.594004273414612e-05, 7.808394730091095e-05, 8.022785186767578e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 8.0, 8.0, 14.0, 20.0, 22.0, 28.0, 61.0, 86.0, 161.0, 289.0, 494.0, 1095.0, 2334.0, 5576.0, 17101.0, 80855.0, 750950.0, 150917.0, 25351.0, 7454.0, 2945.0, 1285.0, 673.0, 381.0, 181.0, 92.0, 47.0, 38.0, 32.0, 18.0, 12.0, 8.0, 10.0, 2.0, 5.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.022064208984375, -0.02134418487548828, -0.020624160766601562, -0.019904136657714844, -0.019184112548828125, -0.018464088439941406, -0.017744064331054688, -0.01702404022216797, -0.01630401611328125, -0.015583992004394531, -0.014863967895507812, -0.014143943786621094, -0.013423919677734375, -0.012703895568847656, -0.011983871459960938, -0.011263847351074219, -0.0105438232421875, -0.009823799133300781, -0.009103775024414062, -0.008383750915527344, -0.007663726806640625, -0.006943702697753906, -0.0062236785888671875, -0.005503654479980469, -0.00478363037109375, -0.004063606262207031, -0.0033435821533203125, -0.0026235580444335938, -0.001903533935546875, -0.0011835098266601562, -0.0004634857177734375, 0.00025653839111328125, 0.0009765625, 0.0016965866088867188, 0.0024166107177734375, 0.0031366348266601562, 0.003856658935546875, 0.004576683044433594, 0.0052967071533203125, 0.006016731262207031, 0.00673675537109375, 0.007456779479980469, 0.008176803588867188, 0.008896827697753906, 0.009616851806640625, 0.010336875915527344, 0.011056900024414062, 0.011776924133300781, 0.0124969482421875, 0.013216972351074219, 0.013936996459960938, 0.014657020568847656, 0.015377044677734375, 0.016097068786621094, 0.016817092895507812, 0.01753711700439453, 0.01825714111328125, 0.01897716522216797, 0.019697189331054688, 0.020417213439941406, 0.021137237548828125, 0.021857261657714844, 0.022577285766601562, 0.02329730987548828, 0.024017333984375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 7.0, 8.0, 16.0, 10.0, 18.0, 27.0, 32.0, 52.0, 71.0, 110.0, 128.0, 123.0, 102.0, 78.0, 60.0, 40.0, 30.0, 26.0, 16.0, 6.0, 9.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019256591796875, -0.018428325653076172, -0.017600059509277344, -0.016771793365478516, -0.015943527221679688, -0.01511526107788086, -0.014286994934082031, -0.013458728790283203, -0.012630462646484375, -0.011802196502685547, -0.010973930358886719, -0.01014566421508789, -0.009317398071289062, -0.008489131927490234, -0.007660865783691406, -0.006832599639892578, -0.00600433349609375, -0.005176067352294922, -0.004347801208496094, -0.0035195350646972656, -0.0026912689208984375, -0.0018630027770996094, -0.0010347366333007812, -0.00020647048950195312, 0.000621795654296875, 0.0014500617980957031, 0.0022783279418945312, 0.0031065940856933594, 0.0039348602294921875, 0.004763126373291016, 0.005591392517089844, 0.006419658660888672, 0.0072479248046875, 0.008076190948486328, 0.008904457092285156, 0.009732723236083984, 0.010560989379882812, 0.01138925552368164, 0.012217521667480469, 0.013045787811279297, 0.013874053955078125, 0.014702320098876953, 0.015530586242675781, 0.01635885238647461, 0.017187118530273438, 0.018015384674072266, 0.018843650817871094, 0.019671916961669922, 0.02050018310546875, 0.021328449249267578, 0.022156715393066406, 0.022984981536865234, 0.023813247680664062, 0.02464151382446289, 0.02546977996826172, 0.026298046112060547, 0.027126312255859375, 0.027954578399658203, 0.02878284454345703, 0.02961111068725586, 0.030439376831054688, 0.031267642974853516, 0.032095909118652344, 0.03292417526245117, 0.03375244140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 5.0, 8.0, 11.0, 18.0, 24.0, 30.0, 63.0, 90.0, 176.0, 214.0, 123.0, 70.0, 36.0, 36.0, 21.0, 15.0, 15.0, 9.0, 5.0, 2.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.1755661964416504, -3.1022655963897705, -3.0289649963378906, -2.9556643962860107, -2.882363796234131, -2.809062957763672, -2.735762357711792, -2.662461757659912, -2.5891611576080322, -2.5158605575561523, -2.4425599575042725, -2.3692593574523926, -2.2959585189819336, -2.2226579189300537, -2.149357318878174, -2.076056718826294, -2.002756118774414, -1.9294555187225342, -1.8561549186706543, -1.7828541994094849, -1.709553599357605, -1.636252999305725, -1.5629522800445557, -1.4896516799926758, -1.416351079940796, -1.343050479888916, -1.2697498798370361, -1.1964491605758667, -1.1231485605239868, -1.049847960472107, -0.9765473008155823, -0.9032466411590576, -0.8299460411071777, -0.7566454410552979, -0.6833447813987732, -0.6100441217422485, -0.5367435216903687, -0.4634428918361664, -0.3901422619819641, -0.31684160232543945, -0.24354100227355957, -0.1702403724193573, -0.09693974256515503, -0.02363911271095276, 0.04966151714324951, 0.12296214699745178, 0.19626277685165405, 0.2695634365081787, 0.3428640365600586, 0.41616466641426086, 0.48946529626846313, 0.5627659559249878, 0.6360665559768677, 0.7093671560287476, 0.7826678156852722, 0.8559684753417969, 0.9292690753936768, 1.0025696754455566, 1.0758702754974365, 1.149170994758606, 1.2224715948104858, 1.2957721948623657, 1.3690729141235352, 1.442373514175415, 1.515674114227295]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 5.0, 3.0, 5.0, 10.0, 14.0, 23.0, 34.0, 57.0, 88.0, 187.0, 201.0, 150.0, 81.0, 47.0, 27.0, 15.0, 16.0, 12.0, 8.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.211030960083008, -8.9646577835083, -8.718283653259277, -8.47191047668457, -8.225537300109863, -7.979163646697998, -7.732790470123291, -7.486416816711426, -7.240043640136719, -6.9936699867248535, -6.7472968101501465, -6.500923156738281, -6.254549980163574, -6.008176326751709, -5.761803150177002, -5.515429496765137, -5.26905632019043, -5.0226826667785645, -4.776309490203857, -4.529935836791992, -4.283562660217285, -4.03718900680542, -3.790815830230713, -3.5444421768188477, -3.2980685234069824, -3.0516951084136963, -2.80532169342041, -2.558948278427124, -2.312574863433838, -2.0662012100219727, -1.819827914237976, -1.57345449924469, -1.3270812034606934, -1.0807077884674072, -0.8343343734741211, -0.5879608988761902, -0.34158748388290405, -0.09521400928497314, 0.151159405708313, 0.3975328207015991, 0.6439062356948853, 0.8902796506881714, 1.1366530656814575, 1.3830265998840332, 1.6294000148773193, 1.8757734298706055, 2.1221468448638916, 2.3685202598571777, 2.614893674850464, 2.86126708984375, 3.107640504837036, 3.3540139198303223, 3.6003873348236084, 3.8467607498168945, 4.09313440322876, 4.339507579803467, 4.585881233215332, 4.832254886627197, 5.078628063201904, 5.3250017166137695, 5.571374893188477, 5.817748546600342, 6.064121723175049, 6.310495376586914, 6.556868553161621]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 5.0, 11.0, 9.0, 16.0, 22.0, 23.0, 34.0, 36.0, 62.0, 89.0, 125.0, 140.0, 218.0, 313.0, 451.0, 681.0, 1008.0, 1601.0, 2653.0, 4503.0, 8020.0, 18447.0, 320644.0, 3798389.0, 19306.0, 7264.0, 3820.0, 2232.0, 1388.0, 829.0, 601.0, 389.0, 262.0, 167.0, 142.0, 102.0, 65.0, 61.0, 45.0, 26.0, 20.0, 12.0, 16.0, 9.0, 5.0, 4.0, 6.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8525390625, -0.82672119140625, -0.8009033203125, -0.77508544921875, -0.749267578125, -0.72344970703125, -0.6976318359375, -0.67181396484375, -0.64599609375, -0.62017822265625, -0.5943603515625, -0.56854248046875, -0.542724609375, -0.51690673828125, -0.4910888671875, -0.46527099609375, -0.439453125, -0.41363525390625, -0.3878173828125, -0.36199951171875, -0.336181640625, -0.31036376953125, -0.2845458984375, -0.25872802734375, -0.23291015625, -0.20709228515625, -0.1812744140625, -0.15545654296875, -0.129638671875, -0.10382080078125, -0.0780029296875, -0.05218505859375, -0.0263671875, -0.00054931640625, 0.0252685546875, 0.05108642578125, 0.076904296875, 0.10272216796875, 0.1285400390625, 0.15435791015625, 0.18017578125, 0.20599365234375, 0.2318115234375, 0.25762939453125, 0.283447265625, 0.30926513671875, 0.3350830078125, 0.36090087890625, 0.38671875, 0.41253662109375, 0.4383544921875, 0.46417236328125, 0.489990234375, 0.51580810546875, 0.5416259765625, 0.56744384765625, 0.59326171875, 0.61907958984375, 0.6448974609375, 0.67071533203125, 0.696533203125, 0.72235107421875, 0.7481689453125, 0.77398681640625, 0.7998046875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 5.0, 6.0, 7.0, 8.0, 4.0, 10.0, 9.0, 4.0, 12.0, 17.0, 56.0, 215.0, 409.0, 108.0, 31.0, 17.0, 10.0, 8.0, 8.0, 5.0, 5.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0648193359375, -0.06286191940307617, -0.060904502868652344, -0.058947086334228516, -0.05698966979980469, -0.05503225326538086, -0.05307483673095703, -0.0511174201965332, -0.049160003662109375, -0.04720258712768555, -0.04524517059326172, -0.04328775405883789, -0.04133033752441406, -0.039372920989990234, -0.037415504455566406, -0.03545808792114258, -0.03350067138671875, -0.03154325485229492, -0.029585838317871094, -0.027628421783447266, -0.025671005249023438, -0.02371358871459961, -0.02175617218017578, -0.019798755645751953, -0.017841339111328125, -0.015883922576904297, -0.013926506042480469, -0.01196908950805664, -0.010011672973632812, -0.008054256439208984, -0.006096839904785156, -0.004139423370361328, -0.0021820068359375, -0.00022459030151367188, 0.0017328262329101562, 0.0036902427673339844, 0.0056476593017578125, 0.007605075836181641, 0.009562492370605469, 0.011519908905029297, 0.013477325439453125, 0.015434741973876953, 0.01739215850830078, 0.01934957504272461, 0.021306991577148438, 0.023264408111572266, 0.025221824645996094, 0.027179241180419922, 0.02913665771484375, 0.031094074249267578, 0.033051490783691406, 0.035008907318115234, 0.03696632385253906, 0.03892374038696289, 0.04088115692138672, 0.04283857345581055, 0.044795989990234375, 0.0467534065246582, 0.04871082305908203, 0.05066823959350586, 0.05262565612792969, 0.054583072662353516, 0.056540489196777344, 0.05849790573120117, 0.060455322265625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 11.0, 21.0, 17.0, 25.0, 37.0, 72.0, 114.0, 165.0, 237.0, 418.0, 683.0, 1114.0, 2000.0, 3636.0, 6863.0, 13982.0, 33043.0, 98742.0, 3681769.0, 250098.0, 56956.0, 22182.0, 10084.0, 5074.0, 2861.0, 1616.0, 932.0, 566.0, 330.0, 186.0, 150.0, 97.0, 64.0, 45.0, 25.0, 21.0, 9.0, 8.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5625, -0.5458450317382812, -0.5291900634765625, -0.5125350952148438, -0.495880126953125, -0.47922515869140625, -0.4625701904296875, -0.44591522216796875, -0.42926025390625, -0.41260528564453125, -0.3959503173828125, -0.37929534912109375, -0.362640380859375, -0.34598541259765625, -0.3293304443359375, -0.31267547607421875, -0.2960205078125, -0.27936553955078125, -0.2627105712890625, -0.24605560302734375, -0.229400634765625, -0.21274566650390625, -0.1960906982421875, -0.17943572998046875, -0.16278076171875, -0.14612579345703125, -0.1294708251953125, -0.11281585693359375, -0.096160888671875, -0.07950592041015625, -0.0628509521484375, -0.04619598388671875, -0.029541015625, -0.01288604736328125, 0.0037689208984375, 0.02042388916015625, 0.037078857421875, 0.05373382568359375, 0.0703887939453125, 0.08704376220703125, 0.10369873046875, 0.12035369873046875, 0.1370086669921875, 0.15366363525390625, 0.170318603515625, 0.18697357177734375, 0.2036285400390625, 0.22028350830078125, 0.2369384765625, 0.25359344482421875, 0.2702484130859375, 0.28690338134765625, 0.303558349609375, 0.32021331787109375, 0.3368682861328125, 0.35352325439453125, 0.37017822265625, 0.38683319091796875, 0.4034881591796875, 0.42014312744140625, 0.436798095703125, 0.45345306396484375, 0.4701080322265625, 0.48676300048828125, 0.50341796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 6.0, 8.0, 10.0, 16.0, 6.0, 16.0, 24.0, 34.0, 46.0, 41.0, 68.0, 104.0, 181.0, 2996.0, 180.0, 62.0, 34.0, 52.0, 35.0, 29.0, 23.0, 20.0, 17.0, 7.0, 7.0, 9.0, 6.0, 6.0, 3.0, 8.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1141357421875, -0.1099853515625, -0.1058349609375, -0.1016845703125, -0.0975341796875, -0.0933837890625, -0.0892333984375, -0.0850830078125, -0.0809326171875, -0.0767822265625, -0.0726318359375, -0.0684814453125, -0.0643310546875, -0.0601806640625, -0.0560302734375, -0.0518798828125, -0.0477294921875, -0.0435791015625, -0.0394287109375, -0.0352783203125, -0.0311279296875, -0.0269775390625, -0.0228271484375, -0.0186767578125, -0.0145263671875, -0.0103759765625, -0.0062255859375, -0.0020751953125, 0.0020751953125, 0.0062255859375, 0.0103759765625, 0.0145263671875, 0.0186767578125, 0.0228271484375, 0.0269775390625, 0.0311279296875, 0.0352783203125, 0.0394287109375, 0.0435791015625, 0.0477294921875, 0.0518798828125, 0.0560302734375, 0.0601806640625, 0.0643310546875, 0.0684814453125, 0.0726318359375, 0.0767822265625, 0.0809326171875, 0.0850830078125, 0.0892333984375, 0.0933837890625, 0.0975341796875, 0.1016845703125, 0.1058349609375, 0.1099853515625, 0.1141357421875, 0.1182861328125, 0.1224365234375, 0.1265869140625, 0.1307373046875, 0.1348876953125, 0.1390380859375, 0.1431884765625, 0.1473388671875, 0.1514892578125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 13.0, 24.0, 79.0, 269.0, 404.0, 111.0, 58.0, 30.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9773894548416138, -0.9351291656494141, -0.8928689360618591, -0.8506086468696594, -0.8083484172821045, -0.7660881280899048, -0.7238278388977051, -0.6815675497055054, -0.6393073201179504, -0.5970470309257507, -0.5547868013381958, -0.5125265121459961, -0.4702662527561188, -0.42800599336624146, -0.38574570417404175, -0.34348544478416443, -0.3012251853942871, -0.2589649260044098, -0.21670465171337128, -0.17444437742233276, -0.13218411803245544, -0.08992385864257812, -0.04766356945037842, -0.005403310060501099, 0.03685694932937622, 0.07911721616983414, 0.12137748301029205, 0.16363775730133057, 0.20589801669120789, 0.2481582760810852, 0.2904185652732849, 0.33267882466316223, 0.3749392032623291, 0.4171994626522064, 0.45945972204208374, 0.5017200112342834, 0.5439802408218384, 0.5862405300140381, 0.6285008192062378, 0.6707611083984375, 0.7130213379859924, 0.7552816271781921, 0.7975418567657471, 0.8398021459579468, 0.8820624351501465, 0.9243226647377014, 0.9665829539299011, 1.008843183517456, 1.0511034727096558, 1.0933637619018555, 1.1356240510940552, 1.1778843402862549, 1.220144510269165, 1.2624047994613647, 1.3046650886535645, 1.3469253778457642, 1.3891856670379639, 1.4314459562301636, 1.4737062454223633, 1.5159664154052734, 1.5582267045974731, 1.6004869937896729, 1.6427472829818726, 1.6850075721740723, 1.7272677421569824]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 5.0, 7.0, 8.0, 10.0, 15.0, 25.0, 36.0, 42.0, 58.0, 83.0, 74.0, 72.0, 103.0, 81.0, 82.0, 66.0, 71.0, 35.0, 38.0, 30.0, 17.0, 13.0, 9.0, 8.0, 7.0, 1.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7235525250434875, -0.6980715990066528, -0.6725906133651733, -0.6471096277236938, -0.6216287016868591, -0.5961477756500244, -0.5706667900085449, -0.5451858043670654, -0.5197048783302307, -0.4942239224910736, -0.4687429666519165, -0.4432620108127594, -0.4177810549736023, -0.3923000991344452, -0.3668191432952881, -0.341338187456131, -0.3158572316169739, -0.2903762757778168, -0.26489531993865967, -0.23941436409950256, -0.21393340826034546, -0.18845245242118835, -0.16297149658203125, -0.13749054074287415, -0.11200958490371704, -0.08652862906455994, -0.06104767322540283, -0.03556671738624573, -0.010085761547088623, 0.015395194292068481, 0.040876150131225586, 0.06635710597038269, 0.0918380618095398, 0.1173190176486969, 0.142799973487854, 0.1682809293270111, 0.1937618851661682, 0.21924284100532532, 0.24472379684448242, 0.2702047526836395, 0.29568570852279663, 0.32116666436195374, 0.34664762020111084, 0.37212857604026794, 0.39760953187942505, 0.42309048771858215, 0.44857144355773926, 0.47405239939689636, 0.49953335523605347, 0.5250142812728882, 0.5504952669143677, 0.5759762525558472, 0.6014571785926819, 0.6269381046295166, 0.6524190902709961, 0.6779000759124756, 0.7033810019493103, 0.728861927986145, 0.7543429136276245, 0.779823899269104, 0.8053048253059387, 0.8307857513427734, 0.8562667369842529, 0.8817477226257324, 0.9072286486625671]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 3.0, 9.0, 16.0, 24.0, 31.0, 51.0, 65.0, 129.0, 173.0, 307.0, 481.0, 821.0, 1413.0, 2576.0, 4832.0, 10082.0, 28144.0, 429311.0, 519259.0, 29320.0, 10296.0, 4967.0, 2593.0, 1514.0, 802.0, 492.0, 290.0, 192.0, 106.0, 94.0, 56.0, 19.0, 16.0, 17.0, 18.0, 8.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5693359375, -0.549713134765625, -0.53009033203125, -0.510467529296875, -0.4908447265625, -0.471221923828125, -0.45159912109375, -0.431976318359375, -0.412353515625, -0.392730712890625, -0.37310791015625, -0.353485107421875, -0.3338623046875, -0.314239501953125, -0.29461669921875, -0.274993896484375, -0.25537109375, -0.235748291015625, -0.21612548828125, -0.196502685546875, -0.1768798828125, -0.157257080078125, -0.13763427734375, -0.118011474609375, -0.098388671875, -0.078765869140625, -0.05914306640625, -0.039520263671875, -0.0198974609375, -0.000274658203125, 0.01934814453125, 0.038970947265625, 0.05859375, 0.078216552734375, 0.09783935546875, 0.117462158203125, 0.1370849609375, 0.156707763671875, 0.17633056640625, 0.195953369140625, 0.215576171875, 0.235198974609375, 0.25482177734375, 0.274444580078125, 0.2940673828125, 0.313690185546875, 0.33331298828125, 0.352935791015625, 0.37255859375, 0.392181396484375, 0.41180419921875, 0.431427001953125, 0.4510498046875, 0.470672607421875, 0.49029541015625, 0.509918212890625, 0.529541015625, 0.549163818359375, 0.56878662109375, 0.588409423828125, 0.6080322265625, 0.627655029296875, 0.64727783203125, 0.666900634765625, 0.6865234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 4.0, 6.0, 10.0, 11.0, 2.0, 11.0, 20.0, 42.0, 105.0, 224.0, 273.0, 139.0, 55.0, 20.0, 12.0, 18.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 7.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078369140625, -0.07613849639892578, -0.07390785217285156, -0.07167720794677734, -0.06944656372070312, -0.0672159194946289, -0.06498527526855469, -0.06275463104248047, -0.06052398681640625, -0.05829334259033203, -0.05606269836425781, -0.053832054138183594, -0.051601409912109375, -0.049370765686035156, -0.04714012145996094, -0.04490947723388672, -0.0426788330078125, -0.04044818878173828, -0.03821754455566406, -0.035986900329589844, -0.033756256103515625, -0.031525611877441406, -0.029294967651367188, -0.02706432342529297, -0.02483367919921875, -0.02260303497314453, -0.020372390747070312, -0.018141746520996094, -0.015911102294921875, -0.013680458068847656, -0.011449813842773438, -0.009219169616699219, -0.006988525390625, -0.004757881164550781, -0.0025272369384765625, -0.00029659271240234375, 0.001934051513671875, 0.004164695739746094, 0.0063953399658203125, 0.008625984191894531, 0.01085662841796875, 0.013087272644042969, 0.015317916870117188, 0.017548561096191406, 0.019779205322265625, 0.022009849548339844, 0.024240493774414062, 0.02647113800048828, 0.0287017822265625, 0.03093242645263672, 0.03316307067871094, 0.035393714904785156, 0.037624359130859375, 0.039855003356933594, 0.04208564758300781, 0.04431629180908203, 0.04654693603515625, 0.04877758026123047, 0.05100822448730469, 0.053238868713378906, 0.055469512939453125, 0.057700157165527344, 0.05993080139160156, 0.06216144561767578, 0.06439208984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 5.0, 6.0, 7.0, 11.0, 13.0, 17.0, 15.0, 22.0, 29.0, 62.0, 82.0, 164.0, 329.0, 625.0, 1391.0, 2973.0, 7049.0, 16281.0, 40716.0, 116312.0, 425290.0, 297198.0, 85556.0, 31378.0, 12625.0, 5597.0, 2461.0, 1155.0, 516.0, 275.0, 139.0, 73.0, 59.0, 31.0, 12.0, 20.0, 15.0, 11.0, 5.0, 6.0, 7.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.295166015625, -0.284942626953125, -0.27471923828125, -0.264495849609375, -0.2542724609375, -0.244049072265625, -0.23382568359375, -0.223602294921875, -0.21337890625, -0.203155517578125, -0.19293212890625, -0.182708740234375, -0.1724853515625, -0.162261962890625, -0.15203857421875, -0.141815185546875, -0.131591796875, -0.121368408203125, -0.11114501953125, -0.100921630859375, -0.0906982421875, -0.080474853515625, -0.07025146484375, -0.060028076171875, -0.0498046875, -0.039581298828125, -0.02935791015625, -0.019134521484375, -0.0089111328125, 0.001312255859375, 0.01153564453125, 0.021759033203125, 0.031982421875, 0.042205810546875, 0.05242919921875, 0.062652587890625, 0.0728759765625, 0.083099365234375, 0.09332275390625, 0.103546142578125, 0.11376953125, 0.123992919921875, 0.13421630859375, 0.144439697265625, 0.1546630859375, 0.164886474609375, 0.17510986328125, 0.185333251953125, 0.195556640625, 0.205780029296875, 0.21600341796875, 0.226226806640625, 0.2364501953125, 0.246673583984375, 0.25689697265625, 0.267120361328125, 0.27734375, 0.287567138671875, 0.29779052734375, 0.308013916015625, 0.3182373046875, 0.328460693359375, 0.33868408203125, 0.348907470703125, 0.359130859375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 7.0, 13.0, 10.0, 11.0, 16.0, 11.0, 14.0, 19.0, 22.0, 33.0, 28.0, 34.0, 32.0, 34.0, 34.0, 45.0, 47.0, 37.0, 31.0, 41.0, 43.0, 36.0, 52.0, 30.0, 38.0, 38.0, 22.0, 31.0, 26.0, 16.0, 33.0, 21.0, 13.0, 12.0, 18.0, 9.0, 9.0, 7.0, 10.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1658935546875, -0.16012954711914062, -0.15436553955078125, -0.14860153198242188, -0.1428375244140625, -0.13707351684570312, -0.13130950927734375, -0.12554550170898438, -0.119781494140625, -0.11401748657226562, -0.10825347900390625, -0.10248947143554688, -0.0967254638671875, -0.09096145629882812, -0.08519744873046875, -0.07943344116210938, -0.07366943359375, -0.06790542602539062, -0.06214141845703125, -0.056377410888671875, -0.0506134033203125, -0.044849395751953125, -0.03908538818359375, -0.033321380615234375, -0.027557373046875, -0.021793365478515625, -0.01602935791015625, -0.010265350341796875, -0.0045013427734375, 0.001262664794921875, 0.00702667236328125, 0.012790679931640625, 0.0185546875, 0.024318695068359375, 0.03008270263671875, 0.035846710205078125, 0.0416107177734375, 0.047374725341796875, 0.05313873291015625, 0.058902740478515625, 0.064666748046875, 0.07043075561523438, 0.07619476318359375, 0.08195877075195312, 0.0877227783203125, 0.09348678588867188, 0.09925079345703125, 0.10501480102539062, 0.11077880859375, 0.11654281616210938, 0.12230682373046875, 0.12807083129882812, 0.1338348388671875, 0.13959884643554688, 0.14536285400390625, 0.15112686157226562, 0.156890869140625, 0.16265487670898438, 0.16841888427734375, 0.17418289184570312, 0.1799468994140625, 0.18571090698242188, 0.19147491455078125, 0.19723892211914062, 0.2030029296875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 9.0, 10.0, 13.0, 22.0, 31.0, 63.0, 100.0, 142.0, 249.0, 384.0, 786.0, 1770.0, 5149.0, 20592.0, 169203.0, 782445.0, 52325.0, 9827.0, 2925.0, 1152.0, 521.0, 286.0, 206.0, 111.0, 79.0, 44.0, 32.0, 21.0, 11.0, 7.0, 4.0, 8.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.060760498046875, -0.05881643295288086, -0.05687236785888672, -0.05492830276489258, -0.05298423767089844, -0.0510401725769043, -0.049096107482910156, -0.047152042388916016, -0.045207977294921875, -0.043263912200927734, -0.041319847106933594, -0.03937578201293945, -0.03743171691894531, -0.03548765182495117, -0.03354358673095703, -0.03159952163696289, -0.02965545654296875, -0.02771139144897461, -0.02576732635498047, -0.023823261260986328, -0.021879196166992188, -0.019935131072998047, -0.017991065979003906, -0.016047000885009766, -0.014102935791015625, -0.012158870697021484, -0.010214805603027344, -0.008270740509033203, -0.0063266754150390625, -0.004382610321044922, -0.0024385452270507812, -0.0004944801330566406, 0.0014495849609375, 0.0033936500549316406, 0.005337715148925781, 0.007281780242919922, 0.009225845336914062, 0.011169910430908203, 0.013113975524902344, 0.015058040618896484, 0.017002105712890625, 0.018946170806884766, 0.020890235900878906, 0.022834300994873047, 0.024778366088867188, 0.026722431182861328, 0.02866649627685547, 0.03061056137084961, 0.03255462646484375, 0.03449869155883789, 0.03644275665283203, 0.03838682174682617, 0.04033088684082031, 0.04227495193481445, 0.044219017028808594, 0.046163082122802734, 0.048107147216796875, 0.050051212310791016, 0.051995277404785156, 0.0539393424987793, 0.05588340759277344, 0.05782747268676758, 0.05977153778076172, 0.06171560287475586, 0.06365966796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 4.0, 10.0, 14.0, 11.0, 20.0, 20.0, 42.0, 43.0, 63.0, 90.0, 108.0, 129.0, 94.0, 92.0, 84.0, 34.0, 39.0, 28.0, 17.0, 17.0, 8.0, 11.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.2557716369628906e-05, -4.1425228118896484e-05, -4.029273986816406e-05, -3.916025161743164e-05, -3.802776336669922e-05, -3.68952751159668e-05, -3.5762786865234375e-05, -3.463029861450195e-05, -3.349781036376953e-05, -3.236532211303711e-05, -3.123283386230469e-05, -3.0100345611572266e-05, -2.8967857360839844e-05, -2.7835369110107422e-05, -2.6702880859375e-05, -2.5570392608642578e-05, -2.4437904357910156e-05, -2.3305416107177734e-05, -2.2172927856445312e-05, -2.104043960571289e-05, -1.990795135498047e-05, -1.8775463104248047e-05, -1.7642974853515625e-05, -1.6510486602783203e-05, -1.537799835205078e-05, -1.424551010131836e-05, -1.3113021850585938e-05, -1.1980533599853516e-05, -1.0848045349121094e-05, -9.715557098388672e-06, -8.58306884765625e-06, -7.450580596923828e-06, -6.318092346191406e-06, -5.185604095458984e-06, -4.0531158447265625e-06, -2.9206275939941406e-06, -1.7881393432617188e-06, -6.556510925292969e-07, 4.76837158203125e-07, 1.6093254089355469e-06, 2.7418136596679688e-06, 3.874301910400391e-06, 5.0067901611328125e-06, 6.139278411865234e-06, 7.271766662597656e-06, 8.404254913330078e-06, 9.5367431640625e-06, 1.0669231414794922e-05, 1.1801719665527344e-05, 1.2934207916259766e-05, 1.4066696166992188e-05, 1.519918441772461e-05, 1.633167266845703e-05, 1.7464160919189453e-05, 1.8596649169921875e-05, 1.9729137420654297e-05, 2.086162567138672e-05, 2.199411392211914e-05, 2.3126602172851562e-05, 2.4259090423583984e-05, 2.5391578674316406e-05, 2.6524066925048828e-05, 2.765655517578125e-05, 2.8789043426513672e-05, 2.9921531677246094e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 13.0, 20.0, 37.0, 63.0, 104.0, 176.0, 295.0, 606.0, 1196.0, 2506.0, 6017.0, 16876.0, 59031.0, 395299.0, 469227.0, 66581.0, 18658.0, 6570.0, 2666.0, 1166.0, 635.0, 349.0, 183.0, 94.0, 69.0, 37.0, 22.0, 12.0, 13.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03173828125, -0.030644893646240234, -0.02955150604248047, -0.028458118438720703, -0.027364730834960938, -0.026271343231201172, -0.025177955627441406, -0.02408456802368164, -0.022991180419921875, -0.02189779281616211, -0.020804405212402344, -0.019711017608642578, -0.018617630004882812, -0.017524242401123047, -0.01643085479736328, -0.015337467193603516, -0.01424407958984375, -0.013150691986083984, -0.012057304382324219, -0.010963916778564453, -0.009870529174804688, -0.008777141571044922, -0.007683753967285156, -0.006590366363525391, -0.005496978759765625, -0.004403591156005859, -0.0033102035522460938, -0.002216815948486328, -0.0011234283447265625, -3.0040740966796875e-05, 0.0010633468627929688, 0.0021567344665527344, 0.0032501220703125, 0.004343509674072266, 0.005436897277832031, 0.006530284881591797, 0.0076236724853515625, 0.008717060089111328, 0.009810447692871094, 0.01090383529663086, 0.011997222900390625, 0.01309061050415039, 0.014183998107910156, 0.015277385711669922, 0.016370773315429688, 0.017464160919189453, 0.01855754852294922, 0.019650936126708984, 0.02074432373046875, 0.021837711334228516, 0.02293109893798828, 0.024024486541748047, 0.025117874145507812, 0.026211261749267578, 0.027304649353027344, 0.02839803695678711, 0.029491424560546875, 0.03058481216430664, 0.031678199768066406, 0.03277158737182617, 0.03386497497558594, 0.0349583625793457, 0.03605175018310547, 0.037145137786865234, 0.038238525390625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 11.0, 12.0, 16.0, 21.0, 18.0, 19.0, 30.0, 40.0, 51.0, 73.0, 82.0, 99.0, 80.0, 69.0, 59.0, 56.0, 45.0, 43.0, 24.0, 34.0, 25.0, 22.0, 15.0, 11.0, 4.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0186004638671875, -0.017957210540771484, -0.01731395721435547, -0.016670703887939453, -0.016027450561523438, -0.015384197235107422, -0.014740943908691406, -0.01409769058227539, -0.013454437255859375, -0.01281118392944336, -0.012167930603027344, -0.011524677276611328, -0.010881423950195312, -0.010238170623779297, -0.009594917297363281, -0.008951663970947266, -0.00830841064453125, -0.007665157318115234, -0.007021903991699219, -0.006378650665283203, -0.0057353973388671875, -0.005092144012451172, -0.004448890686035156, -0.0038056373596191406, -0.003162384033203125, -0.0025191307067871094, -0.0018758773803710938, -0.0012326240539550781, -0.0005893707275390625, 5.3882598876953125e-05, 0.0006971359252929688, 0.0013403892517089844, 0.001983642578125, 0.0026268959045410156, 0.0032701492309570312, 0.003913402557373047, 0.0045566558837890625, 0.005199909210205078, 0.005843162536621094, 0.006486415863037109, 0.007129669189453125, 0.007772922515869141, 0.008416175842285156, 0.009059429168701172, 0.009702682495117188, 0.010345935821533203, 0.010989189147949219, 0.011632442474365234, 0.01227569580078125, 0.012918949127197266, 0.013562202453613281, 0.014205455780029297, 0.014848709106445312, 0.015491962432861328, 0.016135215759277344, 0.01677846908569336, 0.017421722412109375, 0.01806497573852539, 0.018708229064941406, 0.019351482391357422, 0.019994735717773438, 0.020637989044189453, 0.02128124237060547, 0.021924495697021484, 0.0225677490234375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 12.0, 39.0, 144.0, 590.0, 165.0, 38.0, 11.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.771942138671875, -3.578969717025757, -3.3859972953796387, -3.1930251121520996, -3.0000526905059814, -2.8070802688598633, -2.614107847213745, -2.421135425567627, -2.228163242340088, -2.0351908206939697, -1.8422185182571411, -1.649246096611023, -1.4562737941741943, -1.2633013725280762, -1.070328950881958, -0.8773566484451294, -0.6843841075897217, -0.4914117455482483, -0.2984393537044525, -0.10546696186065674, 0.08750540018081665, 0.28047776222229004, 0.4734501838684082, 0.6664224863052368, 0.859394907951355, 1.0523673295974731, 1.2453396320343018, 1.43831205368042, 1.631284475326538, 1.8242567777633667, 2.0172290802001953, 2.2102015018463135, 2.4031739234924316, 2.59614634513855, 2.789118766784668, 2.982090950012207, 3.175063371658325, 3.3680357933044434, 3.5610082149505615, 3.7539806365966797, 3.9469528198242188, 4.139925003051758, 4.332897663116455, 4.525869846343994, 4.718842506408691, 4.9118146896362305, 5.1047868728637695, 5.297759532928467, 5.490732192993164, 5.683704376220703, 5.8766770362854, 6.0696492195129395, 6.262621879577637, 6.455594062805176, 6.648566246032715, 6.841538906097412, 7.034511089324951, 7.22748327255249, 7.4204559326171875, 7.613428115844727, 7.806400775909424, 7.999372959136963, 8.19234561920166, 8.3853178024292, 8.578289985656738]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 12.0, 10.0, 19.0, 25.0, 33.0, 47.0, 64.0, 68.0, 74.0, 78.0, 105.0, 92.0, 89.0, 59.0, 51.0, 41.0, 27.0, 21.0, 14.0, 10.0, 9.0, 5.0, 4.0, 6.0, 4.0, 2.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1868035793304443, -2.1156365871429443, -2.0444695949554443, -1.9733024835586548, -1.9021354913711548, -1.8309684991836548, -1.7598013877868652, -1.6886343955993652, -1.6174674034118652, -1.5463004112243652, -1.4751334190368652, -1.4039663076400757, -1.3327993154525757, -1.2616323232650757, -1.1904652118682861, -1.1192982196807861, -1.0481312274932861, -0.9769642353057861, -0.9057971835136414, -0.8346301317214966, -0.7634631395339966, -0.6922961473464966, -0.6211290955543518, -0.549962043762207, -0.47879505157470703, -0.40762802958488464, -0.33646100759506226, -0.26529398560523987, -0.19412696361541748, -0.12295994162559509, -0.051792919635772705, 0.019374102354049683, 0.09054088592529297, 0.16170790791511536, 0.23287492990493774, 0.30404195189476013, 0.3752089738845825, 0.4463759958744049, 0.5175430178642273, 0.5887100696563721, 0.6598770618438721, 0.7310440540313721, 0.8022111058235168, 0.8733781576156616, 0.9445451498031616, 1.0157121419906616, 1.0868792533874512, 1.1580462455749512, 1.2292132377624512, 1.3003802299499512, 1.3715472221374512, 1.4427143335342407, 1.5138813257217407, 1.5850483179092407, 1.6562154293060303, 1.7273824214935303, 1.7985494136810303, 1.8697164058685303, 1.9408833980560303, 2.0120503902435303, 2.0832176208496094, 2.1543846130371094, 2.2255516052246094, 2.2967185974121094, 2.3678855895996094]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 2.0, 0.0, 7.0, 4.0, 6.0, 2.0, 7.0, 8.0, 6.0, 13.0, 18.0, 17.0, 25.0, 44.0, 54.0, 104.0, 122.0, 223.0, 308.0, 465.0, 711.0, 1134.0, 1996.0, 4022.0, 10605.0, 56391.0, 4075008.0, 28449.0, 7128.0, 3103.0, 1571.0, 924.0, 545.0, 389.0, 281.0, 188.0, 123.0, 88.0, 65.0, 42.0, 29.0, 25.0, 13.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0], "bins": [-1.89453125, -1.84869384765625, -1.8028564453125, -1.75701904296875, -1.711181640625, -1.66534423828125, -1.6195068359375, -1.57366943359375, -1.52783203125, -1.48199462890625, -1.4361572265625, -1.39031982421875, -1.344482421875, -1.29864501953125, -1.2528076171875, -1.20697021484375, -1.1611328125, -1.11529541015625, -1.0694580078125, -1.02362060546875, -0.977783203125, -0.93194580078125, -0.8861083984375, -0.84027099609375, -0.79443359375, -0.74859619140625, -0.7027587890625, -0.65692138671875, -0.611083984375, -0.56524658203125, -0.5194091796875, -0.47357177734375, -0.427734375, -0.38189697265625, -0.3360595703125, -0.29022216796875, -0.244384765625, -0.19854736328125, -0.1527099609375, -0.10687255859375, -0.06103515625, -0.01519775390625, 0.0306396484375, 0.07647705078125, 0.122314453125, 0.16815185546875, 0.2139892578125, 0.25982666015625, 0.3056640625, 0.35150146484375, 0.3973388671875, 0.44317626953125, 0.489013671875, 0.53485107421875, 0.5806884765625, 0.62652587890625, 0.67236328125, 0.71820068359375, 0.7640380859375, 0.80987548828125, 0.855712890625, 0.90155029296875, 0.9473876953125, 0.99322509765625, 1.0390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 7.0, 13.0, 17.0, 13.0, 26.0, 51.0, 78.0, 173.0, 202.0, 155.0, 101.0, 47.0, 20.0, 26.0, 11.0, 9.0, 7.0, 5.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.0750732421875, -0.07326364517211914, -0.07145404815673828, -0.06964445114135742, -0.06783485412597656, -0.0660252571105957, -0.06421566009521484, -0.062406063079833984, -0.060596466064453125, -0.058786869049072266, -0.056977272033691406, -0.05516767501831055, -0.05335807800292969, -0.05154848098754883, -0.04973888397216797, -0.04792928695678711, -0.04611968994140625, -0.04431009292602539, -0.04250049591064453, -0.04069089889526367, -0.03888130187988281, -0.03707170486450195, -0.035262107849121094, -0.033452510833740234, -0.031642913818359375, -0.029833316802978516, -0.028023719787597656, -0.026214122772216797, -0.024404525756835938, -0.022594928741455078, -0.02078533172607422, -0.01897573471069336, -0.0171661376953125, -0.01535654067993164, -0.013546943664550781, -0.011737346649169922, -0.009927749633789062, -0.008118152618408203, -0.006308555603027344, -0.004498958587646484, -0.002689361572265625, -0.0008797645568847656, 0.0009298324584960938, 0.002739429473876953, 0.0045490264892578125, 0.006358623504638672, 0.008168220520019531, 0.00997781753540039, 0.01178741455078125, 0.01359701156616211, 0.015406608581542969, 0.017216205596923828, 0.019025802612304688, 0.020835399627685547, 0.022644996643066406, 0.024454593658447266, 0.026264190673828125, 0.028073787689208984, 0.029883384704589844, 0.0316929817199707, 0.03350257873535156, 0.03531217575073242, 0.03712177276611328, 0.03893136978149414, 0.040740966796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 3.0, 3.0, 5.0, 9.0, 7.0, 9.0, 10.0, 21.0, 12.0, 16.0, 9.0, 30.0, 30.0, 113.0, 1148.0, 27353.0, 4146984.0, 17449.0, 799.0, 104.0, 32.0, 22.0, 12.0, 18.0, 16.0, 7.0, 12.0, 8.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.720703125, -2.621551513671875, -2.52239990234375, -2.423248291015625, -2.3240966796875, -2.224945068359375, -2.12579345703125, -2.026641845703125, -1.927490234375, -1.828338623046875, -1.72918701171875, -1.630035400390625, -1.5308837890625, -1.431732177734375, -1.33258056640625, -1.233428955078125, -1.13427734375, -1.035125732421875, -0.93597412109375, -0.836822509765625, -0.7376708984375, -0.638519287109375, -0.53936767578125, -0.440216064453125, -0.341064453125, -0.241912841796875, -0.14276123046875, -0.043609619140625, 0.0555419921875, 0.154693603515625, 0.25384521484375, 0.352996826171875, 0.4521484375, 0.551300048828125, 0.65045166015625, 0.749603271484375, 0.8487548828125, 0.947906494140625, 1.04705810546875, 1.146209716796875, 1.245361328125, 1.344512939453125, 1.44366455078125, 1.542816162109375, 1.6419677734375, 1.741119384765625, 1.84027099609375, 1.939422607421875, 2.03857421875, 2.137725830078125, 2.23687744140625, 2.336029052734375, 2.4351806640625, 2.534332275390625, 2.63348388671875, 2.732635498046875, 2.831787109375, 2.930938720703125, 3.03009033203125, 3.129241943359375, 3.2283935546875, 3.327545166015625, 3.42669677734375, 3.525848388671875, 3.625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 13.0, 6.0, 11.0, 8.0, 21.0, 16.0, 14.0, 26.0, 29.0, 41.0, 54.0, 216.0, 3305.0, 66.0, 38.0, 40.0, 19.0, 19.0, 15.0, 12.0, 18.0, 15.0, 7.0, 8.0, 9.0, 8.0, 4.0, 4.0, 3.0, 1.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.12237548828125, -0.11908149719238281, -0.11578750610351562, -0.11249351501464844, -0.10919952392578125, -0.10590553283691406, -0.10261154174804688, -0.09931755065917969, -0.0960235595703125, -0.09272956848144531, -0.08943557739257812, -0.08614158630371094, -0.08284759521484375, -0.07955360412597656, -0.07625961303710938, -0.07296562194824219, -0.069671630859375, -0.06637763977050781, -0.06308364868164062, -0.05978965759277344, -0.05649566650390625, -0.05320167541503906, -0.049907684326171875, -0.04661369323730469, -0.0433197021484375, -0.04002571105957031, -0.036731719970703125, -0.03343772888183594, -0.03014373779296875, -0.026849746704101562, -0.023555755615234375, -0.020261764526367188, -0.0169677734375, -0.013673782348632812, -0.010379791259765625, -0.0070858001708984375, -0.00379180908203125, -0.0004978179931640625, 0.002796173095703125, 0.0060901641845703125, 0.0093841552734375, 0.012678146362304688, 0.015972137451171875, 0.019266128540039062, 0.02256011962890625, 0.025854110717773438, 0.029148101806640625, 0.03244209289550781, 0.035736083984375, 0.03903007507324219, 0.042324066162109375, 0.04561805725097656, 0.04891204833984375, 0.05220603942871094, 0.055500030517578125, 0.05879402160644531, 0.0620880126953125, 0.06538200378417969, 0.06867599487304688, 0.07196998596191406, 0.07526397705078125, 0.07855796813964844, 0.08185195922851562, 0.08514595031738281, 0.08843994140625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 10.0, 18.0, 44.0, 138.0, 543.0, 181.0, 53.0, 18.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.260511636734009, -2.2157864570617676, -2.1710615158081055, -2.1263363361358643, -2.081611394882202, -2.036886215209961, -1.9921611547470093, -1.9474360942840576, -1.902711033821106, -1.8579859733581543, -1.8132609128952026, -1.768535852432251, -1.7238106727600098, -1.679085612297058, -1.6343605518341064, -1.5896354913711548, -1.5449104309082031, -1.5001853704452515, -1.4554603099822998, -1.4107352495193481, -1.3660101890563965, -1.3212850093841553, -1.2765599489212036, -1.231834888458252, -1.1871098279953003, -1.1423847675323486, -1.097659707069397, -1.0529346466064453, -1.008209466934204, -0.9634844660758972, -0.9187593460083008, -0.8740342855453491, -0.829309344291687, -0.7845842838287354, -0.7398592233657837, -0.6951341032981873, -0.6504090428352356, -0.6056839823722839, -0.5609588623046875, -0.5162338018417358, -0.4715087413787842, -0.4267836809158325, -0.38205859065055847, -0.3373335003852844, -0.29260843992233276, -0.2478833645582199, -0.20315828919410706, -0.158433198928833, -0.11370813846588135, -0.0689830631017685, -0.02425798773765564, 0.020467087626457214, 0.06519216299057007, 0.10991723835468292, 0.15464231371879578, 0.19936740398406982, 0.24409246444702148, 0.28881752490997314, 0.3335426151752472, 0.37826770544052124, 0.4229927659034729, 0.46771782636642456, 0.512442946434021, 0.5571680068969727, 0.6018930673599243]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 5.0, 5.0, 8.0, 8.0, 15.0, 29.0, 24.0, 37.0, 54.0, 59.0, 82.0, 76.0, 87.0, 87.0, 83.0, 78.0, 55.0, 72.0, 39.0, 24.0, 26.0, 12.0, 14.0, 8.0, 6.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7095207571983337, -0.6930294632911682, -0.6765381693840027, -0.6600468158721924, -0.6435555219650269, -0.6270642280578613, -0.6105729341506958, -0.5940816402435303, -0.57759028673172, -0.5610989928245544, -0.5446076989173889, -0.5281163454055786, -0.5116250514984131, -0.49513375759124756, -0.47864246368408203, -0.4621511399745941, -0.4456598460674286, -0.42916855216026306, -0.41267722845077515, -0.3961859345436096, -0.3796946108341217, -0.3632033169269562, -0.34671199321746826, -0.33022069931030273, -0.3137294054031372, -0.2972381114959717, -0.28074678778648376, -0.26425549387931824, -0.24776417016983032, -0.2312728762626648, -0.21478156745433807, -0.19829025864601135, -0.18179893493652344, -0.16530762612819672, -0.14881631731987, -0.13232502341270447, -0.11583370715379715, -0.09934239834547043, -0.0828510969877243, -0.06635978817939758, -0.04986847937107086, -0.03337717056274414, -0.016885865479707718, -0.00039456039667129517, 0.016096748411655426, 0.03258805721998215, 0.04907935857772827, 0.06557066738605499, 0.08206197619438171, 0.09855328500270844, 0.11504459381103516, 0.13153588771820068, 0.1480272114276886, 0.16451850533485413, 0.18100981414318085, 0.19750112295150757, 0.2139924317598343, 0.230483740568161, 0.24697504937648773, 0.26346635818481445, 0.27995765209198, 0.2964489758014679, 0.3129402697086334, 0.32943159341812134, 0.34592288732528687]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 9.0, 9.0, 12.0, 13.0, 17.0, 23.0, 33.0, 67.0, 116.0, 179.0, 320.0, 666.0, 1311.0, 3253.0, 9789.0, 47056.0, 793158.0, 163967.0, 19058.0, 5462.0, 2059.0, 887.0, 481.0, 234.0, 121.0, 78.0, 60.0, 27.0, 19.0, 19.0, 6.0, 11.0, 10.0, 8.0, 7.0, 5.0, 2.0, 0.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78515625, -0.7604217529296875, -0.735687255859375, -0.7109527587890625, -0.68621826171875, -0.6614837646484375, -0.636749267578125, -0.6120147705078125, -0.5872802734375, -0.5625457763671875, -0.537811279296875, -0.5130767822265625, -0.48834228515625, -0.4636077880859375, -0.438873291015625, -0.4141387939453125, -0.389404296875, -0.3646697998046875, -0.339935302734375, -0.3152008056640625, -0.29046630859375, -0.2657318115234375, -0.240997314453125, -0.2162628173828125, -0.1915283203125, -0.1667938232421875, -0.142059326171875, -0.1173248291015625, -0.09259033203125, -0.0678558349609375, -0.043121337890625, -0.0183868408203125, 0.00634765625, 0.0310821533203125, 0.055816650390625, 0.0805511474609375, 0.10528564453125, 0.1300201416015625, 0.154754638671875, 0.1794891357421875, 0.2042236328125, 0.2289581298828125, 0.253692626953125, 0.2784271240234375, 0.30316162109375, 0.3278961181640625, 0.352630615234375, 0.3773651123046875, 0.402099609375, 0.4268341064453125, 0.451568603515625, 0.4763031005859375, 0.50103759765625, 0.5257720947265625, 0.550506591796875, 0.5752410888671875, 0.5999755859375, 0.6247100830078125, 0.649444580078125, 0.6741790771484375, 0.69891357421875, 0.7236480712890625, 0.748382568359375, 0.7731170654296875, 0.7978515625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 18.0, 16.0, 16.0, 47.0, 80.0, 134.0, 183.0, 191.0, 130.0, 67.0, 37.0, 19.0, 13.0, 12.0, 4.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.08050537109375, -0.07866621017456055, -0.0768270492553711, -0.07498788833618164, -0.07314872741699219, -0.07130956649780273, -0.06947040557861328, -0.06763124465942383, -0.06579208374023438, -0.06395292282104492, -0.06211376190185547, -0.060274600982666016, -0.05843544006347656, -0.05659627914428711, -0.054757118225097656, -0.0529179573059082, -0.05107879638671875, -0.0492396354675293, -0.047400474548339844, -0.04556131362915039, -0.04372215270996094, -0.041882991790771484, -0.04004383087158203, -0.03820466995239258, -0.036365509033203125, -0.03452634811401367, -0.03268718719482422, -0.030848026275634766, -0.029008865356445312, -0.02716970443725586, -0.025330543518066406, -0.023491382598876953, -0.0216522216796875, -0.019813060760498047, -0.017973899841308594, -0.01613473892211914, -0.014295578002929688, -0.012456417083740234, -0.010617256164550781, -0.008778095245361328, -0.006938934326171875, -0.005099773406982422, -0.0032606124877929688, -0.0014214515686035156, 0.0004177093505859375, 0.0022568702697753906, 0.004096031188964844, 0.005935192108154297, 0.00777435302734375, 0.009613513946533203, 0.011452674865722656, 0.01329183578491211, 0.015130996704101562, 0.016970157623291016, 0.01880931854248047, 0.020648479461669922, 0.022487640380859375, 0.024326801300048828, 0.02616596221923828, 0.028005123138427734, 0.029844284057617188, 0.03168344497680664, 0.033522605895996094, 0.03536176681518555, 0.037200927734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 13.0, 5.0, 13.0, 22.0, 34.0, 31.0, 73.0, 91.0, 111.0, 216.0, 264.0, 435.0, 734.0, 1111.0, 1819.0, 3167.0, 5751.0, 10729.0, 20494.0, 40610.0, 91612.0, 249822.0, 368430.0, 137052.0, 57599.0, 27208.0, 13673.0, 7315.0, 4053.0, 2247.0, 1369.0, 853.0, 530.0, 339.0, 226.0, 169.0, 113.0, 61.0, 46.0, 33.0, 23.0, 22.0, 7.0, 5.0, 10.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2344970703125, -0.22698402404785156, -0.21947097778320312, -0.2119579315185547, -0.20444488525390625, -0.1969318389892578, -0.18941879272460938, -0.18190574645996094, -0.1743927001953125, -0.16687965393066406, -0.15936660766601562, -0.1518535614013672, -0.14434051513671875, -0.1368274688720703, -0.12931442260742188, -0.12180137634277344, -0.114288330078125, -0.10677528381347656, -0.09926223754882812, -0.09174919128417969, -0.08423614501953125, -0.07672309875488281, -0.06921005249023438, -0.06169700622558594, -0.0541839599609375, -0.04667091369628906, -0.039157867431640625, -0.03164482116699219, -0.02413177490234375, -0.016618728637695312, -0.009105682373046875, -0.0015926361083984375, 0.00592041015625, 0.013433456420898438, 0.020946502685546875, 0.028459548950195312, 0.03597259521484375, 0.04348564147949219, 0.050998687744140625, 0.05851173400878906, 0.0660247802734375, 0.07353782653808594, 0.08105087280273438, 0.08856391906738281, 0.09607696533203125, 0.10359001159667969, 0.11110305786132812, 0.11861610412597656, 0.126129150390625, 0.13364219665527344, 0.14115524291992188, 0.1486682891845703, 0.15618133544921875, 0.1636943817138672, 0.17120742797851562, 0.17872047424316406, 0.1862335205078125, 0.19374656677246094, 0.20125961303710938, 0.2087726593017578, 0.21628570556640625, 0.2237987518310547, 0.23131179809570312, 0.23882484436035156, 0.246337890625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 6.0, 6.0, 14.0, 15.0, 19.0, 12.0, 21.0, 19.0, 20.0, 31.0, 33.0, 38.0, 35.0, 46.0, 46.0, 54.0, 50.0, 49.0, 47.0, 41.0, 54.0, 42.0, 38.0, 43.0, 42.0, 43.0, 25.0, 26.0, 6.0, 15.0, 14.0, 8.0, 15.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.1467304229736328, -0.14136123657226562, -0.13599205017089844, -0.13062286376953125, -0.12525367736816406, -0.11988449096679688, -0.11451530456542969, -0.1091461181640625, -0.10377693176269531, -0.09840774536132812, -0.09303855895996094, -0.08766937255859375, -0.08230018615722656, -0.07693099975585938, -0.07156181335449219, -0.066192626953125, -0.06082344055175781, -0.055454254150390625, -0.05008506774902344, -0.04471588134765625, -0.03934669494628906, -0.033977508544921875, -0.028608322143554688, -0.0232391357421875, -0.017869949340820312, -0.012500762939453125, -0.0071315765380859375, -0.00176239013671875, 0.0036067962646484375, 0.008975982666015625, 0.014345169067382812, 0.01971435546875, 0.025083541870117188, 0.030452728271484375, 0.03582191467285156, 0.04119110107421875, 0.04656028747558594, 0.051929473876953125, 0.05729866027832031, 0.0626678466796875, 0.06803703308105469, 0.07340621948242188, 0.07877540588378906, 0.08414459228515625, 0.08951377868652344, 0.09488296508789062, 0.10025215148925781, 0.105621337890625, 0.11099052429199219, 0.11635971069335938, 0.12172889709472656, 0.12709808349609375, 0.13246726989746094, 0.13783645629882812, 0.1432056427001953, 0.1485748291015625, 0.1539440155029297, 0.15931320190429688, 0.16468238830566406, 0.17005157470703125, 0.17542076110839844, 0.18078994750976562, 0.1861591339111328, 0.1915283203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 7.0, 9.0, 7.0, 16.0, 10.0, 16.0, 28.0, 40.0, 52.0, 64.0, 126.0, 183.0, 305.0, 556.0, 1151.0, 2778.0, 8270.0, 38335.0, 702950.0, 259247.0, 24132.0, 5989.0, 2123.0, 897.0, 521.0, 271.0, 154.0, 97.0, 64.0, 40.0, 36.0, 15.0, 18.0, 7.0, 14.0, 9.0, 4.0, 7.0, 5.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.297607421875, -0.28826904296875, -0.2789306640625, -0.26959228515625, -0.26025390625, -0.25091552734375, -0.2415771484375, -0.23223876953125, -0.222900390625, -0.21356201171875, -0.2042236328125, -0.19488525390625, -0.185546875, -0.17620849609375, -0.1668701171875, -0.15753173828125, -0.148193359375, -0.13885498046875, -0.1295166015625, -0.12017822265625, -0.11083984375, -0.10150146484375, -0.0921630859375, -0.08282470703125, -0.073486328125, -0.06414794921875, -0.0548095703125, -0.04547119140625, -0.0361328125, -0.02679443359375, -0.0174560546875, -0.00811767578125, 0.001220703125, 0.01055908203125, 0.0198974609375, 0.02923583984375, 0.03857421875, 0.04791259765625, 0.0572509765625, 0.06658935546875, 0.075927734375, 0.08526611328125, 0.0946044921875, 0.10394287109375, 0.11328125, 0.12261962890625, 0.1319580078125, 0.14129638671875, 0.150634765625, 0.15997314453125, 0.1693115234375, 0.17864990234375, 0.18798828125, 0.19732666015625, 0.2066650390625, 0.21600341796875, 0.225341796875, 0.23468017578125, 0.2440185546875, 0.25335693359375, 0.2626953125, 0.27203369140625, 0.2813720703125, 0.29071044921875, 0.300048828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 5.0, 8.0, 7.0, 12.0, 26.0, 34.0, 64.0, 419.0, 257.0, 53.0, 22.0, 12.0, 8.0, 14.0, 5.0, 7.0, 7.0, 6.0, 0.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023865699768066406, -0.00023065879940986633, -0.0002226606011390686, -0.00021466240286827087, -0.00020666420459747314, -0.00019866600632667542, -0.00019066780805587769, -0.00018266960978507996, -0.00017467141151428223, -0.0001666732132434845, -0.00015867501497268677, -0.00015067681670188904, -0.0001426786184310913, -0.00013468042016029358, -0.00012668222188949585, -0.00011868402361869812, -0.00011068582534790039, -0.00010268762707710266, -9.468942880630493e-05, -8.66912305355072e-05, -7.869303226470947e-05, -7.069483399391174e-05, -6.269663572311401e-05, -5.4698437452316284e-05, -4.6700239181518555e-05, -3.8702040910720825e-05, -3.0703842639923096e-05, -2.2705644369125366e-05, -1.4707446098327637e-05, -6.709247827529907e-06, 1.2889504432678223e-06, 9.287148714065552e-06, 1.728534698486328e-05, 2.528354525566101e-05, 3.328174352645874e-05, 4.127994179725647e-05, 4.92781400680542e-05, 5.727633833885193e-05, 6.527453660964966e-05, 7.327273488044739e-05, 8.127093315124512e-05, 8.926913142204285e-05, 9.726732969284058e-05, 0.0001052655279636383, 0.00011326372623443604, 0.00012126192450523376, 0.0001292601227760315, 0.00013725832104682922, 0.00014525651931762695, 0.00015325471758842468, 0.0001612529158592224, 0.00016925111413002014, 0.00017724931240081787, 0.0001852475106716156, 0.00019324570894241333, 0.00020124390721321106, 0.0002092421054840088, 0.00021724030375480652, 0.00022523850202560425, 0.00023323670029640198, 0.0002412348985671997, 0.00024923309683799744, 0.00025723129510879517, 0.0002652294933795929, 0.0002732276916503906]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 4.0, 5.0, 16.0, 20.0, 22.0, 34.0, 44.0, 72.0, 73.0, 131.0, 224.0, 343.0, 566.0, 870.0, 1479.0, 2769.0, 5775.0, 14142.0, 44373.0, 305833.0, 580240.0, 59833.0, 17548.0, 6835.0, 3090.0, 1622.0, 903.0, 571.0, 359.0, 216.0, 168.0, 117.0, 82.0, 55.0, 40.0, 20.0, 14.0, 10.0, 7.0, 10.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19189453125, -0.18552017211914062, -0.17914581298828125, -0.17277145385742188, -0.1663970947265625, -0.16002273559570312, -0.15364837646484375, -0.14727401733398438, -0.140899658203125, -0.13452529907226562, -0.12815093994140625, -0.12177658081054688, -0.1154022216796875, -0.10902786254882812, -0.10265350341796875, -0.09627914428710938, -0.08990478515625, -0.08353042602539062, -0.07715606689453125, -0.07078170776367188, -0.0644073486328125, -0.058032989501953125, -0.05165863037109375, -0.045284271240234375, -0.038909912109375, -0.032535552978515625, -0.02616119384765625, -0.019786834716796875, -0.0134124755859375, -0.007038116455078125, -0.00066375732421875, 0.005710601806640625, 0.0120849609375, 0.018459320068359375, 0.02483367919921875, 0.031208038330078125, 0.0375823974609375, 0.043956756591796875, 0.05033111572265625, 0.056705474853515625, 0.063079833984375, 0.06945419311523438, 0.07582855224609375, 0.08220291137695312, 0.0885772705078125, 0.09495162963867188, 0.10132598876953125, 0.10770034790039062, 0.11407470703125, 0.12044906616210938, 0.12682342529296875, 0.13319778442382812, 0.1395721435546875, 0.14594650268554688, 0.15232086181640625, 0.15869522094726562, 0.165069580078125, 0.17144393920898438, 0.17781829833984375, 0.18419265747070312, 0.1905670166015625, 0.19694137573242188, 0.20331573486328125, 0.20969009399414062, 0.216064453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 12.0, 13.0, 16.0, 32.0, 31.0, 41.0, 80.0, 112.0, 166.0, 149.0, 94.0, 64.0, 47.0, 32.0, 26.0, 16.0, 17.0, 8.0, 7.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1131591796875, -0.10878372192382812, -0.10440826416015625, -0.10003280639648438, -0.0956573486328125, -0.09128189086914062, -0.08690643310546875, -0.08253097534179688, -0.078155517578125, -0.07378005981445312, -0.06940460205078125, -0.06502914428710938, -0.0606536865234375, -0.056278228759765625, -0.05190277099609375, -0.047527313232421875, -0.04315185546875, -0.038776397705078125, -0.03440093994140625, -0.030025482177734375, -0.0256500244140625, -0.021274566650390625, -0.01689910888671875, -0.012523651123046875, -0.008148193359375, -0.003772735595703125, 0.00060272216796875, 0.004978179931640625, 0.0093536376953125, 0.013729095458984375, 0.01810455322265625, 0.022480010986328125, 0.02685546875, 0.031230926513671875, 0.03560638427734375, 0.039981842041015625, 0.0443572998046875, 0.048732757568359375, 0.05310821533203125, 0.057483673095703125, 0.061859130859375, 0.06623458862304688, 0.07061004638671875, 0.07498550415039062, 0.0793609619140625, 0.08373641967773438, 0.08811187744140625, 0.09248733520507812, 0.09686279296875, 0.10123825073242188, 0.10561370849609375, 0.10998916625976562, 0.1143646240234375, 0.11874008178710938, 0.12311553955078125, 0.12749099731445312, 0.131866455078125, 0.13624191284179688, 0.14061737060546875, 0.14499282836914062, 0.1493682861328125, 0.15374374389648438, 0.15811920166015625, 0.16249465942382812, 0.1668701171875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 5.0, 7.0, 20.0, 23.0, 36.0, 72.0, 135.0, 243.0, 195.0, 101.0, 63.0, 42.0, 17.0, 14.0, 9.0, 8.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8489274978637695, -2.771926164627075, -2.69492506980896, -2.6179237365722656, -2.5409226417541504, -2.463921308517456, -2.3869199752807617, -2.3099188804626465, -2.232917547225952, -2.155916213989258, -2.0789151191711426, -2.0019137859344482, -1.9249125719070435, -1.8479113578796387, -1.7709100246429443, -1.6939088106155396, -1.6169075965881348, -1.53990638256073, -1.4629051685333252, -1.3859038352966309, -1.308902621269226, -1.2319014072418213, -1.154900074005127, -1.0778988599777222, -1.0008976459503174, -0.9238964319229126, -0.846895158290863, -0.7698938846588135, -0.6928926706314087, -0.6158914566040039, -0.5388901829719543, -0.4618889093399048, -0.3848876953125, -0.3078864514827728, -0.23088520765304565, -0.15388396382331848, -0.07688271999359131, 0.00011852383613586426, 0.07711976766586304, 0.1541210412979126, 0.23112225532531738, 0.30812349915504456, 0.38512474298477173, 0.4621259868144989, 0.5391272306442261, 0.6161284446716309, 0.6931297183036804, 0.77013099193573, 0.8471322059631348, 0.9241334199905396, 1.0011346340179443, 1.0781359672546387, 1.1551371812820435, 1.2321383953094482, 1.3091397285461426, 1.3861409425735474, 1.4631421566009521, 1.540143370628357, 1.6171445846557617, 1.694145917892456, 1.7711471319198608, 1.8481483459472656, 1.92514967918396, 2.0021510124206543, 2.0791521072387695]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 10.0, 18.0, 21.0, 36.0, 51.0, 50.0, 72.0, 83.0, 84.0, 103.0, 73.0, 91.0, 66.0, 58.0, 54.0, 41.0, 32.0, 14.0, 11.0, 9.0, 4.0, 1.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4346957206726074, -2.3685531616210938, -2.302410840988159, -2.2362682819366455, -2.170125961303711, -2.1039834022521973, -2.0378408432006836, -1.9716984033584595, -1.9055559635162354, -1.8394135236740112, -1.773271083831787, -1.7071285247802734, -1.6409860849380493, -1.5748436450958252, -1.5087010860443115, -1.4425586462020874, -1.3764162063598633, -1.3102737665176392, -1.244131326675415, -1.1779887676239014, -1.1118463277816772, -1.0457038879394531, -0.9795613884925842, -0.9134188890457153, -0.8472764492034912, -0.7811340093612671, -0.7149915099143982, -0.6488490104675293, -0.5827065706253052, -0.516564130783081, -0.45042163133621216, -0.38427916169166565, -0.31813669204711914, -0.25199422240257263, -0.18585175275802612, -0.11970928311347961, -0.053566813468933105, 0.012575656175613403, 0.07871812582015991, 0.14486059546470642, 0.21100306510925293, 0.27714553475379944, 0.34328800439834595, 0.40943047404289246, 0.47557294368743896, 0.5417153835296631, 0.607857882976532, 0.6740003824234009, 0.740142822265625, 0.8062852621078491, 0.872427761554718, 0.9385702610015869, 1.004712700843811, 1.0708551406860352, 1.1369976997375488, 1.203140139579773, 1.269282579421997, 1.3354250192642212, 1.4015674591064453, 1.467710018157959, 1.533852458000183, 1.5999948978424072, 1.666137456893921, 1.732279896736145, 1.7984223365783691]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 7.0, 9.0, 16.0, 18.0, 37.0, 41.0, 70.0, 121.0, 405.0, 1952.0, 33027.0, 4149003.0, 8113.0, 1032.0, 296.0, 76.0, 31.0, 10.0, 7.0, 6.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.56640625, -5.44354248046875, -5.3206787109375, -5.19781494140625, -5.074951171875, -4.95208740234375, -4.8292236328125, -4.70635986328125, -4.58349609375, -4.46063232421875, -4.3377685546875, -4.21490478515625, -4.092041015625, -3.96917724609375, -3.8463134765625, -3.72344970703125, -3.6005859375, -3.47772216796875, -3.3548583984375, -3.23199462890625, -3.109130859375, -2.98626708984375, -2.8634033203125, -2.74053955078125, -2.61767578125, -2.49481201171875, -2.3719482421875, -2.24908447265625, -2.126220703125, -2.00335693359375, -1.8804931640625, -1.75762939453125, -1.634765625, -1.51190185546875, -1.3890380859375, -1.26617431640625, -1.143310546875, -1.02044677734375, -0.8975830078125, -0.77471923828125, -0.65185546875, -0.52899169921875, -0.4061279296875, -0.28326416015625, -0.160400390625, -0.03753662109375, 0.0853271484375, 0.20819091796875, 0.3310546875, 0.45391845703125, 0.5767822265625, 0.69964599609375, 0.822509765625, 0.94537353515625, 1.0682373046875, 1.19110107421875, 1.31396484375, 1.43682861328125, 1.5596923828125, 1.68255615234375, 1.805419921875, 1.92828369140625, 2.0511474609375, 2.17401123046875, 2.296875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 1.0, 9.0, 12.0, 29.0, 23.0, 67.0, 137.0, 184.0, 190.0, 149.0, 91.0, 48.0, 19.0, 16.0, 7.0, 7.0, 4.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.11407470703125, -0.11154890060424805, -0.1090230941772461, -0.10649728775024414, -0.10397148132324219, -0.10144567489624023, -0.09891986846923828, -0.09639406204223633, -0.09386825561523438, -0.09134244918823242, -0.08881664276123047, -0.08629083633422852, -0.08376502990722656, -0.08123922348022461, -0.07871341705322266, -0.0761876106262207, -0.07366180419921875, -0.0711359977722168, -0.06861019134521484, -0.06608438491821289, -0.06355857849121094, -0.061032772064208984, -0.05850696563720703, -0.05598115921020508, -0.053455352783203125, -0.05092954635620117, -0.04840373992919922, -0.045877933502197266, -0.04335212707519531, -0.04082632064819336, -0.038300514221191406, -0.03577470779418945, -0.0332489013671875, -0.030723094940185547, -0.028197288513183594, -0.02567148208618164, -0.023145675659179688, -0.020619869232177734, -0.01809406280517578, -0.015568256378173828, -0.013042449951171875, -0.010516643524169922, -0.007990837097167969, -0.005465030670166016, -0.0029392242431640625, -0.0004134178161621094, 0.0021123886108398438, 0.004638195037841797, 0.00716400146484375, 0.009689807891845703, 0.012215614318847656, 0.01474142074584961, 0.017267227172851562, 0.019793033599853516, 0.02231884002685547, 0.024844646453857422, 0.027370452880859375, 0.029896259307861328, 0.03242206573486328, 0.034947872161865234, 0.03747367858886719, 0.03999948501586914, 0.042525291442871094, 0.04505109786987305, 0.047576904296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 4.0, 9.0, 11.0, 19.0, 32.0, 26.0, 40.0, 69.0, 116.0, 131.0, 218.0, 367.0, 582.0, 971.0, 1662.0, 2989.0, 5564.0, 11149.0, 24490.0, 66202.0, 782486.0, 3181529.0, 66624.0, 24588.0, 11341.0, 5691.0, 3073.0, 1660.0, 980.0, 594.0, 349.0, 244.0, 153.0, 94.0, 64.0, 46.0, 27.0, 22.0, 19.0, 13.0, 11.0, 9.0, 5.0, 4.0, 2.0, 2.0], "bins": [-0.5849609375, -0.5699653625488281, -0.5549697875976562, -0.5399742126464844, -0.5249786376953125, -0.5099830627441406, -0.49498748779296875, -0.4799919128417969, -0.464996337890625, -0.4500007629394531, -0.43500518798828125, -0.4200096130371094, -0.4050140380859375, -0.3900184631347656, -0.37502288818359375, -0.3600273132324219, -0.34503173828125, -0.3300361633300781, -0.31504058837890625, -0.3000450134277344, -0.2850494384765625, -0.2700538635253906, -0.25505828857421875, -0.24006271362304688, -0.225067138671875, -0.21007156372070312, -0.19507598876953125, -0.18008041381835938, -0.1650848388671875, -0.15008926391601562, -0.13509368896484375, -0.12009811401367188, -0.1051025390625, -0.09010696411132812, -0.07511138916015625, -0.060115814208984375, -0.0451202392578125, -0.030124664306640625, -0.01512908935546875, -0.000133514404296875, 0.014862060546875, 0.029857635498046875, 0.04485321044921875, 0.059848785400390625, 0.0748443603515625, 0.08983993530273438, 0.10483551025390625, 0.11983108520507812, 0.13482666015625, 0.14982223510742188, 0.16481781005859375, 0.17981338500976562, 0.1948089599609375, 0.20980453491210938, 0.22480010986328125, 0.23979568481445312, 0.254791259765625, 0.2697868347167969, 0.28478240966796875, 0.2997779846191406, 0.3147735595703125, 0.3297691345214844, 0.34476470947265625, 0.3597602844238281, 0.374755859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 6.0, 8.0, 4.0, 6.0, 7.0, 9.0, 10.0, 22.0, 26.0, 24.0, 32.0, 34.0, 49.0, 72.0, 151.0, 3053.0, 226.0, 96.0, 50.0, 38.0, 26.0, 28.0, 15.0, 15.0, 9.0, 11.0, 8.0, 8.0, 7.0, 8.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11639404296875, -0.11313056945800781, -0.10986709594726562, -0.10660362243652344, -0.10334014892578125, -0.10007667541503906, -0.09681320190429688, -0.09354972839355469, -0.0902862548828125, -0.08702278137207031, -0.08375930786132812, -0.08049583435058594, -0.07723236083984375, -0.07396888732910156, -0.07070541381835938, -0.06744194030761719, -0.064178466796875, -0.06091499328613281, -0.057651519775390625, -0.05438804626464844, -0.05112457275390625, -0.04786109924316406, -0.044597625732421875, -0.04133415222167969, -0.0380706787109375, -0.03480720520019531, -0.031543731689453125, -0.028280258178710938, -0.02501678466796875, -0.021753311157226562, -0.018489837646484375, -0.015226364135742188, -0.011962890625, -0.008699417114257812, -0.005435943603515625, -0.0021724700927734375, 0.00109100341796875, 0.0043544769287109375, 0.007617950439453125, 0.010881423950195312, 0.0141448974609375, 0.017408370971679688, 0.020671844482421875, 0.023935317993164062, 0.02719879150390625, 0.030462265014648438, 0.033725738525390625, 0.03698921203613281, 0.040252685546875, 0.04351615905761719, 0.046779632568359375, 0.05004310607910156, 0.05330657958984375, 0.05657005310058594, 0.059833526611328125, 0.06309700012207031, 0.0663604736328125, 0.06962394714355469, 0.07288742065429688, 0.07615089416503906, 0.07941436767578125, 0.08267784118652344, 0.08594131469726562, 0.08920478820800781, 0.09246826171875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 6.0, 5.0, 4.0, 13.0, 15.0, 22.0, 23.0, 41.0, 62.0, 77.0, 113.0, 161.0, 142.0, 89.0, 74.0, 38.0, 45.0, 17.0, 13.0, 10.0, 5.0, 9.0, 3.0, 6.0, 4.0, 6.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.418947696685791, -0.40444493293762207, -0.3899421691894531, -0.3754394054412842, -0.3609366714954376, -0.3464339077472687, -0.33193114399909973, -0.3174283802509308, -0.30292564630508423, -0.2884228825569153, -0.27392011880874634, -0.2594173550605774, -0.24491462111473083, -0.2304118573665619, -0.21590909361839294, -0.201406329870224, -0.18690356612205505, -0.1724008023738861, -0.15789805352687836, -0.1433952897787094, -0.12889254093170166, -0.11438977718353271, -0.09988701343536377, -0.08538425713777542, -0.07088150084018707, -0.056378744542598724, -0.04187598451972008, -0.02737322449684143, -0.012870468199253082, 0.0016322880983352661, 0.01613505184650421, 0.03063780814409256, 0.04514056444168091, 0.05964332073926926, 0.0741460770368576, 0.08864884078502655, 0.1031515970826149, 0.11765435338020325, 0.1321571171283722, 0.14665988087654114, 0.1611626297235489, 0.17566539347171783, 0.19016814231872559, 0.20467090606689453, 0.21917366981506348, 0.23367641866207123, 0.24817918241024017, 0.2626819312572479, 0.27718469500541687, 0.2916874587535858, 0.30619022250175476, 0.3206929564476013, 0.33519572019577026, 0.3496984839439392, 0.36420124769210815, 0.3787040114402771, 0.39320677518844604, 0.407709538936615, 0.42221230268478394, 0.4367150664329529, 0.45121780037879944, 0.4657205641269684, 0.48022332787513733, 0.4947260916233063, 0.5092288255691528]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 8.0, 6.0, 12.0, 20.0, 14.0, 26.0, 20.0, 26.0, 28.0, 38.0, 41.0, 44.0, 52.0, 57.0, 41.0, 46.0, 49.0, 46.0, 44.0, 43.0, 36.0, 30.0, 41.0, 36.0, 35.0, 29.0, 17.0, 23.0, 15.0, 16.0, 19.0, 5.0, 6.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.3641483187675476, -0.35382455587387085, -0.3435007929801941, -0.33317703008651733, -0.3228532671928406, -0.3125295042991638, -0.30220574140548706, -0.2918819785118103, -0.28155821561813354, -0.2712344527244568, -0.26091068983078003, -0.25058692693710327, -0.2402631640434265, -0.22993940114974976, -0.219615638256073, -0.20929187536239624, -0.1989680975675583, -0.18864433467388153, -0.17832057178020477, -0.16799680888652802, -0.15767304599285126, -0.1473492830991745, -0.13702550530433655, -0.1267017424106598, -0.11637798696756363, -0.10605422407388687, -0.09573046118021011, -0.08540669083595276, -0.075082927942276, -0.06475916504859924, -0.054435402154922485, -0.04411163926124573, -0.03378787636756897, -0.023464113473892212, -0.013140348717570305, -0.002816583961248398, 0.00750717893242836, 0.017830941826105118, 0.028154708445072174, 0.03847847133874893, 0.04880223423242569, 0.05912599712610245, 0.0694497600197792, 0.07977353036403656, 0.09009729325771332, 0.10042105615139008, 0.11074481904506683, 0.12106858193874359, 0.13139234483242035, 0.1417161077260971, 0.15203987061977386, 0.16236363351345062, 0.17268739640712738, 0.18301115930080414, 0.1933349370956421, 0.20365869998931885, 0.2139824628829956, 0.22430622577667236, 0.23462998867034912, 0.24495375156402588, 0.25527751445770264, 0.2656012773513794, 0.27592504024505615, 0.2862488031387329, 0.29657256603240967]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 7.0, 4.0, 11.0, 4.0, 8.0, 12.0, 15.0, 20.0, 27.0, 38.0, 68.0, 90.0, 165.0, 247.0, 522.0, 975.0, 2257.0, 6841.0, 37848.0, 632038.0, 333216.0, 25068.0, 5299.0, 1863.0, 838.0, 373.0, 239.0, 144.0, 85.0, 54.0, 39.0, 28.0, 30.0, 18.0, 11.0, 11.0, 10.0, 5.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.69677734375, -0.6749343872070312, -0.6530914306640625, -0.6312484741210938, -0.609405517578125, -0.5875625610351562, -0.5657196044921875, -0.5438766479492188, -0.52203369140625, -0.5001907348632812, -0.4783477783203125, -0.45650482177734375, -0.434661865234375, -0.41281890869140625, -0.3909759521484375, -0.36913299560546875, -0.3472900390625, -0.32544708251953125, -0.3036041259765625, -0.28176116943359375, -0.259918212890625, -0.23807525634765625, -0.2162322998046875, -0.19438934326171875, -0.17254638671875, -0.15070343017578125, -0.1288604736328125, -0.10701751708984375, -0.085174560546875, -0.06333160400390625, -0.0414886474609375, -0.01964569091796875, 0.002197265625, 0.02404022216796875, 0.0458831787109375, 0.06772613525390625, 0.089569091796875, 0.11141204833984375, 0.1332550048828125, 0.15509796142578125, 0.17694091796875, 0.19878387451171875, 0.2206268310546875, 0.24246978759765625, 0.264312744140625, 0.28615570068359375, 0.3079986572265625, 0.32984161376953125, 0.3516845703125, 0.37352752685546875, 0.3953704833984375, 0.41721343994140625, 0.439056396484375, 0.46089935302734375, 0.4827423095703125, 0.5045852661132812, 0.52642822265625, 0.5482711791992188, 0.5701141357421875, 0.5919570922851562, 0.613800048828125, 0.6356430053710938, 0.6574859619140625, 0.6793289184570312, 0.701171875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 6.0, 16.0, 38.0, 82.0, 126.0, 187.0, 186.0, 136.0, 107.0, 51.0, 26.0, 13.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.10980224609375, -0.10732030868530273, -0.10483837127685547, -0.1023564338684082, -0.09987449645996094, -0.09739255905151367, -0.0949106216430664, -0.09242868423461914, -0.08994674682617188, -0.08746480941772461, -0.08498287200927734, -0.08250093460083008, -0.08001899719238281, -0.07753705978393555, -0.07505512237548828, -0.07257318496704102, -0.07009124755859375, -0.06760931015014648, -0.06512737274169922, -0.06264543533325195, -0.06016349792480469, -0.05768156051635742, -0.055199623107910156, -0.05271768569946289, -0.050235748291015625, -0.04775381088256836, -0.045271873474121094, -0.04278993606567383, -0.04030799865722656, -0.0378260612487793, -0.03534412384033203, -0.032862186431884766, -0.0303802490234375, -0.027898311614990234, -0.02541637420654297, -0.022934436798095703, -0.020452499389648438, -0.017970561981201172, -0.015488624572753906, -0.01300668716430664, -0.010524749755859375, -0.00804281234741211, -0.005560874938964844, -0.003078937530517578, -0.0005970001220703125, 0.0018849372863769531, 0.004366874694824219, 0.006848812103271484, 0.00933074951171875, 0.011812686920166016, 0.014294624328613281, 0.016776561737060547, 0.019258499145507812, 0.021740436553955078, 0.024222373962402344, 0.02670431137084961, 0.029186248779296875, 0.03166818618774414, 0.034150123596191406, 0.03663206100463867, 0.03911399841308594, 0.0415959358215332, 0.04407787322998047, 0.046559810638427734, 0.049041748046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 4.0, 10.0, 6.0, 8.0, 23.0, 28.0, 25.0, 56.0, 100.0, 117.0, 229.0, 368.0, 549.0, 1037.0, 1856.0, 3452.0, 7120.0, 16365.0, 45737.0, 162472.0, 530883.0, 190293.0, 53000.0, 18419.0, 7994.0, 3676.0, 1981.0, 1046.0, 631.0, 368.0, 247.0, 148.0, 106.0, 83.0, 34.0, 25.0, 22.0, 18.0, 6.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.329345703125, -0.32033538818359375, -0.3113250732421875, -0.30231475830078125, -0.293304443359375, -0.28429412841796875, -0.2752838134765625, -0.26627349853515625, -0.25726318359375, -0.24825286865234375, -0.2392425537109375, -0.23023223876953125, -0.221221923828125, -0.21221160888671875, -0.2032012939453125, -0.19419097900390625, -0.1851806640625, -0.17617034912109375, -0.1671600341796875, -0.15814971923828125, -0.149139404296875, -0.14012908935546875, -0.1311187744140625, -0.12210845947265625, -0.11309814453125, -0.10408782958984375, -0.0950775146484375, -0.08606719970703125, -0.077056884765625, -0.06804656982421875, -0.0590362548828125, -0.05002593994140625, -0.041015625, -0.03200531005859375, -0.0229949951171875, -0.01398468017578125, -0.004974365234375, 0.00403594970703125, 0.0130462646484375, 0.02205657958984375, 0.03106689453125, 0.04007720947265625, 0.0490875244140625, 0.05809783935546875, 0.067108154296875, 0.07611846923828125, 0.0851287841796875, 0.09413909912109375, 0.1031494140625, 0.11215972900390625, 0.1211700439453125, 0.13018035888671875, 0.139190673828125, 0.14820098876953125, 0.1572113037109375, 0.16622161865234375, 0.17523193359375, 0.18424224853515625, 0.1932525634765625, 0.20226287841796875, 0.211273193359375, 0.22028350830078125, 0.2292938232421875, 0.23830413818359375, 0.247314453125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 10.0, 5.0, 29.0, 24.0, 26.0, 39.0, 59.0, 54.0, 55.0, 59.0, 70.0, 72.0, 60.0, 60.0, 54.0, 59.0, 45.0, 36.0, 45.0, 28.0, 27.0, 13.0, 10.0, 8.0, 8.0, 6.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2232666015625, -0.21695518493652344, -0.21064376831054688, -0.2043323516845703, -0.19802093505859375, -0.1917095184326172, -0.18539810180664062, -0.17908668518066406, -0.1727752685546875, -0.16646385192871094, -0.16015243530273438, -0.1538410186767578, -0.14752960205078125, -0.1412181854248047, -0.13490676879882812, -0.12859535217285156, -0.122283935546875, -0.11597251892089844, -0.10966110229492188, -0.10334968566894531, -0.09703826904296875, -0.09072685241699219, -0.08441543579101562, -0.07810401916503906, -0.0717926025390625, -0.06548118591308594, -0.059169769287109375, -0.05285835266113281, -0.04654693603515625, -0.04023551940917969, -0.033924102783203125, -0.027612686157226562, -0.02130126953125, -0.014989852905273438, -0.008678436279296875, -0.0023670196533203125, 0.00394439697265625, 0.010255813598632812, 0.016567230224609375, 0.022878646850585938, 0.0291900634765625, 0.03550148010253906, 0.041812896728515625, 0.04812431335449219, 0.05443572998046875, 0.06074714660644531, 0.06705856323242188, 0.07336997985839844, 0.079681396484375, 0.08599281311035156, 0.09230422973632812, 0.09861564636230469, 0.10492706298828125, 0.11123847961425781, 0.11754989624023438, 0.12386131286621094, 0.1301727294921875, 0.13648414611816406, 0.14279556274414062, 0.1491069793701172, 0.15541839599609375, 0.1617298126220703, 0.16804122924804688, 0.17435264587402344, 0.1806640625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 0.0, 5.0, 4.0, 6.0, 6.0, 5.0, 7.0, 16.0, 16.0, 32.0, 43.0, 77.0, 101.0, 204.0, 345.0, 676.0, 1481.0, 4155.0, 17975.0, 664243.0, 338509.0, 14334.0, 3500.0, 1385.0, 610.0, 319.0, 177.0, 105.0, 74.0, 43.0, 35.0, 19.0, 17.0, 7.0, 9.0, 8.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.446044921875, -0.4316291809082031, -0.41721343994140625, -0.4027976989746094, -0.3883819580078125, -0.3739662170410156, -0.35955047607421875, -0.3451347351074219, -0.330718994140625, -0.3163032531738281, -0.30188751220703125, -0.2874717712402344, -0.2730560302734375, -0.2586402893066406, -0.24422454833984375, -0.22980880737304688, -0.21539306640625, -0.20097732543945312, -0.18656158447265625, -0.17214584350585938, -0.1577301025390625, -0.14331436157226562, -0.12889862060546875, -0.11448287963867188, -0.100067138671875, -0.08565139770507812, -0.07123565673828125, -0.056819915771484375, -0.0424041748046875, -0.027988433837890625, -0.01357269287109375, 0.000843048095703125, 0.0152587890625, 0.029674530029296875, 0.04409027099609375, 0.058506011962890625, 0.0729217529296875, 0.08733749389648438, 0.10175323486328125, 0.11616897583007812, 0.130584716796875, 0.14500045776367188, 0.15941619873046875, 0.17383193969726562, 0.1882476806640625, 0.20266342163085938, 0.21707916259765625, 0.23149490356445312, 0.24591064453125, 0.2603263854980469, 0.27474212646484375, 0.2891578674316406, 0.3035736083984375, 0.3179893493652344, 0.33240509033203125, 0.3468208312988281, 0.361236572265625, 0.3756523132324219, 0.39006805419921875, 0.4044837951660156, 0.4188995361328125, 0.4333152770996094, 0.44773101806640625, 0.4621467590332031, 0.4765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 2.0, 8.0, 9.0, 25.0, 31.0, 46.0, 90.0, 319.0, 235.0, 77.0, 48.0, 27.0, 26.0, 13.0, 7.0, 5.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000492095947265625, -0.0004761815071105957, -0.0004602670669555664, -0.0004443526268005371, -0.0004284381866455078, -0.0004125237464904785, -0.0003966093063354492, -0.0003806948661804199, -0.0003647804260253906, -0.00034886598587036133, -0.00033295154571533203, -0.00031703710556030273, -0.00030112266540527344, -0.00028520822525024414, -0.00026929378509521484, -0.00025337934494018555, -0.00023746490478515625, -0.00022155046463012695, -0.00020563602447509766, -0.00018972158432006836, -0.00017380714416503906, -0.00015789270401000977, -0.00014197826385498047, -0.00012606382369995117, -0.00011014938354492188, -9.423494338989258e-05, -7.832050323486328e-05, -6.240606307983398e-05, -4.649162292480469e-05, -3.057718276977539e-05, -1.4662742614746094e-05, 1.2516975402832031e-06, 1.71661376953125e-05, 3.30805778503418e-05, 4.8995018005371094e-05, 6.490945816040039e-05, 8.082389831542969e-05, 9.673833847045898e-05, 0.00011265277862548828, 0.00012856721878051758, 0.00014448165893554688, 0.00016039609909057617, 0.00017631053924560547, 0.00019222497940063477, 0.00020813941955566406, 0.00022405385971069336, 0.00023996829986572266, 0.00025588274002075195, 0.00027179718017578125, 0.00028771162033081055, 0.00030362606048583984, 0.00031954050064086914, 0.00033545494079589844, 0.00035136938095092773, 0.00036728382110595703, 0.00038319826126098633, 0.0003991127014160156, 0.0004150271415710449, 0.0004309415817260742, 0.0004468560218811035, 0.0004627704620361328, 0.0004786849021911621, 0.0004945993423461914, 0.0005105137825012207, 0.00052642822265625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 6.0, 4.0, 9.0, 10.0, 7.0, 17.0, 22.0, 28.0, 32.0, 47.0, 80.0, 122.0, 138.0, 238.0, 366.0, 520.0, 766.0, 1303.0, 2205.0, 4044.0, 9127.0, 27924.0, 165683.0, 716853.0, 85714.0, 18574.0, 6713.0, 3215.0, 1678.0, 1036.0, 663.0, 430.0, 315.0, 192.0, 121.0, 107.0, 76.0, 44.0, 33.0, 19.0, 23.0, 10.0, 11.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.204345703125, -0.19821739196777344, -0.19208908081054688, -0.1859607696533203, -0.17983245849609375, -0.1737041473388672, -0.16757583618164062, -0.16144752502441406, -0.1553192138671875, -0.14919090270996094, -0.14306259155273438, -0.1369342803955078, -0.13080596923828125, -0.12467765808105469, -0.11854934692382812, -0.11242103576660156, -0.106292724609375, -0.10016441345214844, -0.09403610229492188, -0.08790779113769531, -0.08177947998046875, -0.07565116882324219, -0.06952285766601562, -0.06339454650878906, -0.0572662353515625, -0.05113792419433594, -0.045009613037109375, -0.03888130187988281, -0.03275299072265625, -0.026624679565429688, -0.020496368408203125, -0.014368057250976562, -0.00823974609375, -0.0021114349365234375, 0.004016876220703125, 0.010145187377929688, 0.01627349853515625, 0.022401809692382812, 0.028530120849609375, 0.03465843200683594, 0.0407867431640625, 0.04691505432128906, 0.053043365478515625, 0.05917167663574219, 0.06529998779296875, 0.07142829895019531, 0.07755661010742188, 0.08368492126464844, 0.089813232421875, 0.09594154357910156, 0.10206985473632812, 0.10819816589355469, 0.11432647705078125, 0.12045478820800781, 0.12658309936523438, 0.13271141052246094, 0.1388397216796875, 0.14496803283691406, 0.15109634399414062, 0.1572246551513672, 0.16335296630859375, 0.1694812774658203, 0.17560958862304688, 0.18173789978027344, 0.1878662109375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 3.0, 6.0, 6.0, 6.0, 17.0, 24.0, 33.0, 47.0, 88.0, 148.0, 162.0, 142.0, 105.0, 80.0, 41.0, 34.0, 14.0, 12.0, 10.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1790771484375, -0.1740550994873047, -0.16903305053710938, -0.16401100158691406, -0.15898895263671875, -0.15396690368652344, -0.14894485473632812, -0.1439228057861328, -0.1389007568359375, -0.1338787078857422, -0.12885665893554688, -0.12383460998535156, -0.11881256103515625, -0.11379051208496094, -0.10876846313476562, -0.10374641418457031, -0.098724365234375, -0.09370231628417969, -0.08868026733398438, -0.08365821838378906, -0.07863616943359375, -0.07361412048339844, -0.06859207153320312, -0.06357002258300781, -0.0585479736328125, -0.05352592468261719, -0.048503875732421875, -0.04348182678222656, -0.03845977783203125, -0.03343772888183594, -0.028415679931640625, -0.023393630981445312, -0.01837158203125, -0.013349533081054688, -0.008327484130859375, -0.0033054351806640625, 0.00171661376953125, 0.0067386627197265625, 0.011760711669921875, 0.016782760620117188, 0.0218048095703125, 0.026826858520507812, 0.031848907470703125, 0.03687095642089844, 0.04189300537109375, 0.04691505432128906, 0.051937103271484375, 0.05695915222167969, 0.061981201171875, 0.06700325012207031, 0.07202529907226562, 0.07704734802246094, 0.08206939697265625, 0.08709144592285156, 0.09211349487304688, 0.09713554382324219, 0.1021575927734375, 0.10717964172363281, 0.11220169067382812, 0.11722373962402344, 0.12224578857421875, 0.12726783752441406, 0.13228988647460938, 0.1373119354248047, 0.142333984375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 8.0, 48.0, 182.0, 488.0, 204.0, 57.0, 17.0, 8.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.388756036758423, -2.2235968112945557, -2.0584378242492676, -1.8932785987854004, -1.7281194925308228, -1.5629603862762451, -1.397801160812378, -1.2326420545578003, -1.0674829483032227, -0.902323842048645, -0.7371646761894226, -0.5720055103302002, -0.40684640407562256, -0.24168729782104492, -0.07652813196182251, 0.0886310338973999, 0.25379014015197754, 0.41894927620887756, 0.5841084122657776, 0.749267578125, 0.9144266843795776, 1.0795857906341553, 1.2447450160980225, 1.4099041223526, 1.5750632286071777, 1.7402223348617554, 1.905381441116333, 2.0705406665802, 2.2356996536254883, 2.4008588790893555, 2.5660181045532227, 2.73117733001709, 2.896336555480957, 3.061495780944824, 3.2266547679901123, 3.3918139934539795, 3.5569729804992676, 3.7221322059631348, 3.887291431427002, 4.052450656890869, 4.217609405517578, 4.382768630981445, 4.5479278564453125, 4.7130866050720215, 4.878245830535889, 5.043405055999756, 5.208564281463623, 5.37372350692749, 5.538882732391357, 5.704041957855225, 5.869201183319092, 6.034359931945801, 6.199519157409668, 6.364678382873535, 6.529837608337402, 6.6949968338012695, 6.860156059265137, 7.025315284729004, 7.190474510192871, 7.35563325881958, 7.520792484283447, 7.6859517097473145, 7.851110935211182, 8.01626968383789, 8.181428909301758]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 7.0, 8.0, 11.0, 15.0, 15.0, 13.0, 16.0, 27.0, 30.0, 34.0, 40.0, 49.0, 47.0, 54.0, 62.0, 62.0, 51.0, 41.0, 53.0, 59.0, 40.0, 38.0, 43.0, 40.0, 25.0, 14.0, 13.0, 13.0, 18.0, 12.0, 14.0, 8.0, 6.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9719880819320679, -0.9380923509597778, -0.904196560382843, -0.870300829410553, -0.8364050388336182, -0.8025093078613281, -0.7686135768890381, -0.734717845916748, -0.7008220553398132, -0.6669263243675232, -0.6330305337905884, -0.5991348028182983, -0.5652390718460083, -0.5313432812690735, -0.49744755029678345, -0.463551789522171, -0.4296560287475586, -0.39576026797294617, -0.36186450719833374, -0.3279687762260437, -0.2940730154514313, -0.26017725467681885, -0.22628150880336761, -0.19238576292991638, -0.15849000215530396, -0.12459424883127213, -0.0906984955072403, -0.056802742183208466, -0.022906988859176636, 0.010988771915435791, 0.044884517788887024, 0.07878026366233826, 0.11267602443695068, 0.1465717852115631, 0.18046753108501434, 0.21436327695846558, 0.248259037733078, 0.28215479850769043, 0.31605052947998047, 0.3499462902545929, 0.3838420510292053, 0.41773781180381775, 0.4516335725784302, 0.4855293035507202, 0.5194250345230103, 0.5533208250999451, 0.5872165560722351, 0.6211123466491699, 0.65500807762146, 0.68890380859375, 0.7227995991706848, 0.7566953301429749, 0.7905911207199097, 0.8244868516921997, 0.8583825826644897, 0.8922783136367798, 0.9261741042137146, 0.9600698351860046, 0.9939656257629395, 1.0278613567352295, 1.0617570877075195, 1.0956528186798096, 1.1295486688613892, 1.1634443998336792, 1.1973401308059692]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 18.0, 20.0, 30.0, 51.0, 94.0, 149.0, 316.0, 1319.0, 14432.0, 4129983.0, 43969.0, 2711.0, 728.0, 267.0, 91.0, 46.0, 16.0, 10.0, 5.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.9580078125, -1.9109954833984375, -1.863983154296875, -1.8169708251953125, -1.76995849609375, -1.7229461669921875, -1.675933837890625, -1.6289215087890625, -1.5819091796875, -1.5348968505859375, -1.487884521484375, -1.4408721923828125, -1.39385986328125, -1.3468475341796875, -1.299835205078125, -1.2528228759765625, -1.205810546875, -1.1587982177734375, -1.111785888671875, -1.0647735595703125, -1.01776123046875, -0.9707489013671875, -0.923736572265625, -0.8767242431640625, -0.8297119140625, -0.7826995849609375, -0.735687255859375, -0.6886749267578125, -0.64166259765625, -0.5946502685546875, -0.547637939453125, -0.5006256103515625, -0.45361328125, -0.4066009521484375, -0.359588623046875, -0.3125762939453125, -0.26556396484375, -0.2185516357421875, -0.171539306640625, -0.1245269775390625, -0.0775146484375, -0.0305023193359375, 0.016510009765625, 0.0635223388671875, 0.11053466796875, 0.1575469970703125, 0.204559326171875, 0.2515716552734375, 0.298583984375, 0.3455963134765625, 0.392608642578125, 0.4396209716796875, 0.48663330078125, 0.5336456298828125, 0.580657958984375, 0.6276702880859375, 0.6746826171875, 0.7216949462890625, 0.768707275390625, 0.8157196044921875, 0.86273193359375, 0.9097442626953125, 0.956756591796875, 1.0037689208984375, 1.05078125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 10.0, 15.0, 15.0, 37.0, 54.0, 92.0, 135.0, 152.0, 135.0, 133.0, 91.0, 64.0, 38.0, 10.0, 9.0, 6.0, 3.0, 0.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.10235595703125, -0.1000823974609375, -0.097808837890625, -0.0955352783203125, -0.09326171875, -0.0909881591796875, -0.088714599609375, -0.0864410400390625, -0.08416748046875, -0.0818939208984375, -0.079620361328125, -0.0773468017578125, -0.0750732421875, -0.0727996826171875, -0.070526123046875, -0.0682525634765625, -0.06597900390625, -0.0637054443359375, -0.061431884765625, -0.0591583251953125, -0.056884765625, -0.0546112060546875, -0.052337646484375, -0.0500640869140625, -0.04779052734375, -0.0455169677734375, -0.043243408203125, -0.0409698486328125, -0.0386962890625, -0.0364227294921875, -0.034149169921875, -0.0318756103515625, -0.02960205078125, -0.0273284912109375, -0.025054931640625, -0.0227813720703125, -0.0205078125, -0.0182342529296875, -0.015960693359375, -0.0136871337890625, -0.01141357421875, -0.0091400146484375, -0.006866455078125, -0.0045928955078125, -0.0023193359375, -4.57763671875e-05, 0.002227783203125, 0.0045013427734375, 0.00677490234375, 0.0090484619140625, 0.011322021484375, 0.0135955810546875, 0.015869140625, 0.0181427001953125, 0.020416259765625, 0.0226898193359375, 0.02496337890625, 0.0272369384765625, 0.029510498046875, 0.0317840576171875, 0.0340576171875, 0.0363311767578125, 0.038604736328125, 0.0408782958984375, 0.04315185546875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 12.0, 16.0, 38.0, 59.0, 131.0, 258.0, 530.0, 1101.0, 2434.0, 5923.0, 18467.0, 96773.0, 3886697.0, 146158.0, 23484.0, 7051.0, 2796.0, 1238.0, 594.0, 276.0, 125.0, 64.0, 31.0, 11.0, 9.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51416015625, -0.5001068115234375, -0.486053466796875, -0.4720001220703125, -0.45794677734375, -0.4438934326171875, -0.429840087890625, -0.4157867431640625, -0.4017333984375, -0.3876800537109375, -0.373626708984375, -0.3595733642578125, -0.34552001953125, -0.3314666748046875, -0.317413330078125, -0.3033599853515625, -0.289306640625, -0.2752532958984375, -0.261199951171875, -0.2471466064453125, -0.23309326171875, -0.2190399169921875, -0.204986572265625, -0.1909332275390625, -0.1768798828125, -0.1628265380859375, -0.148773193359375, -0.1347198486328125, -0.12066650390625, -0.1066131591796875, -0.092559814453125, -0.0785064697265625, -0.064453125, -0.0503997802734375, -0.036346435546875, -0.0222930908203125, -0.00823974609375, 0.0058135986328125, 0.019866943359375, 0.0339202880859375, 0.0479736328125, 0.0620269775390625, 0.076080322265625, 0.0901336669921875, 0.10418701171875, 0.1182403564453125, 0.132293701171875, 0.1463470458984375, 0.160400390625, 0.1744537353515625, 0.188507080078125, 0.2025604248046875, 0.21661376953125, 0.2306671142578125, 0.244720458984375, 0.2587738037109375, 0.2728271484375, 0.2868804931640625, 0.300933837890625, 0.3149871826171875, 0.32904052734375, 0.3430938720703125, 0.357147216796875, 0.3712005615234375, 0.38525390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 5.0, 3.0, 3.0, 8.0, 5.0, 6.0, 8.0, 10.0, 18.0, 12.0, 30.0, 25.0, 55.0, 68.0, 110.0, 190.0, 2357.0, 666.0, 157.0, 107.0, 58.0, 39.0, 24.0, 17.0, 20.0, 15.0, 7.0, 8.0, 10.0, 3.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0], "bins": [-0.08148193359375, -0.07933378219604492, -0.07718563079833984, -0.07503747940063477, -0.07288932800292969, -0.07074117660522461, -0.06859302520751953, -0.06644487380981445, -0.06429672241210938, -0.0621485710144043, -0.06000041961669922, -0.05785226821899414, -0.05570411682128906, -0.053555965423583984, -0.051407814025878906, -0.04925966262817383, -0.04711151123046875, -0.04496335983276367, -0.042815208435058594, -0.040667057037353516, -0.03851890563964844, -0.03637075424194336, -0.03422260284423828, -0.0320744514465332, -0.029926300048828125, -0.027778148651123047, -0.02562999725341797, -0.02348184585571289, -0.021333694458007812, -0.019185543060302734, -0.017037391662597656, -0.014889240264892578, -0.0127410888671875, -0.010592937469482422, -0.008444786071777344, -0.006296634674072266, -0.0041484832763671875, -0.0020003318786621094, 0.00014781951904296875, 0.002295970916748047, 0.004444122314453125, 0.006592273712158203, 0.008740425109863281, 0.01088857650756836, 0.013036727905273438, 0.015184879302978516, 0.017333030700683594, 0.019481182098388672, 0.02162933349609375, 0.023777484893798828, 0.025925636291503906, 0.028073787689208984, 0.030221939086914062, 0.03237009048461914, 0.03451824188232422, 0.0366663932800293, 0.038814544677734375, 0.04096269607543945, 0.04311084747314453, 0.04525899887084961, 0.04740715026855469, 0.049555301666259766, 0.051703453063964844, 0.05385160446166992, 0.055999755859375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 9.0, 25.0, 96.0, 401.0, 363.0, 87.0, 24.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1147541999816895, -2.0706465244293213, -2.026538848876953, -1.982431173324585, -1.9383234977722168, -1.8942158222198486, -1.8501081466674805, -1.8060004711151123, -1.7618927955627441, -1.717785120010376, -1.6736774444580078, -1.6295697689056396, -1.5854620933532715, -1.5413544178009033, -1.4972467422485352, -1.453139066696167, -1.4090313911437988, -1.3649237155914307, -1.3208160400390625, -1.2767083644866943, -1.2326006889343262, -1.188493013381958, -1.1443853378295898, -1.1002776622772217, -1.056170105934143, -1.012062430381775, -0.9679547548294067, -0.9238470792770386, -0.8797394037246704, -0.8356317281723022, -0.7915240526199341, -0.7474163770675659, -0.7033087611198425, -0.6592010855674744, -0.6150934100151062, -0.570985734462738, -0.5268780589103699, -0.4827703833580017, -0.43866273760795593, -0.39455506205558777, -0.3504473865032196, -0.30633971095085144, -0.2622320353984833, -0.2181243747472763, -0.17401669919490814, -0.12990902364253998, -0.08580136299133301, -0.041693687438964844, 0.0024139881134033203, 0.046521659940481186, 0.09062933176755905, 0.13473699986934662, 0.17884467542171478, 0.22295235097408295, 0.2670600116252899, 0.3111676871776581, 0.35527536273002625, 0.3993830382823944, 0.4434907138347626, 0.48759835958480835, 0.5317060351371765, 0.5758137106895447, 0.6199213862419128, 0.664029061794281, 0.7081367373466492]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 10.0, 11.0, 13.0, 6.0, 9.0, 13.0, 22.0, 26.0, 22.0, 32.0, 36.0, 35.0, 42.0, 30.0, 44.0, 43.0, 54.0, 42.0, 34.0, 50.0, 50.0, 43.0, 39.0, 36.0, 39.0, 26.0, 31.0, 25.0, 18.0, 15.0, 20.0, 21.0, 16.0, 13.0, 11.0, 4.0, 3.0, 4.0, 3.0, 2.0, 6.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.21758371591567993, -0.21080443263053894, -0.20402516424655914, -0.19724588096141815, -0.19046659767627716, -0.18368732929229736, -0.17690804600715637, -0.17012876272201538, -0.1633494794368744, -0.1565701961517334, -0.1497909277677536, -0.1430116444826126, -0.13623236119747162, -0.12945309281349182, -0.12267380952835083, -0.11589452624320984, -0.10911525785923004, -0.10233598202466965, -0.09555669873952866, -0.08877742290496826, -0.08199813961982727, -0.07521886378526688, -0.06843958795070648, -0.06166030839085579, -0.054881028831005096, -0.048101749271154404, -0.04132246971130371, -0.03454319387674332, -0.027763914316892624, -0.02098463475704193, -0.014205358922481537, -0.007426079362630844, -0.0006467998027801514, 0.006132478825747967, 0.012911757454276085, 0.01969103515148163, 0.02647031471133232, 0.033249594271183014, 0.04002887010574341, 0.0468081496655941, 0.053587429225444794, 0.060366708785295486, 0.06714598834514618, 0.07392526417970657, 0.08070454001426697, 0.08748382329940796, 0.09426309913396835, 0.10104237496852875, 0.10782165825366974, 0.11460093408823013, 0.12138021737337112, 0.12815949320793152, 0.1349387764930725, 0.1417180597782135, 0.1484973281621933, 0.1552766114473343, 0.1620558798313141, 0.16883516311645508, 0.17561443150043488, 0.18239371478557587, 0.18917299807071686, 0.19595226645469666, 0.20273154973983765, 0.20951083302497864, 0.21629011631011963]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 9.0, 6.0, 9.0, 14.0, 10.0, 17.0, 25.0, 26.0, 45.0, 77.0, 131.0, 212.0, 449.0, 1050.0, 2779.0, 10221.0, 70101.0, 747976.0, 189411.0, 18939.0, 4192.0, 1381.0, 654.0, 343.0, 172.0, 94.0, 56.0, 43.0, 32.0, 20.0, 13.0, 8.0, 14.0, 7.0, 8.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.611328125, -0.59466552734375, -0.5780029296875, -0.56134033203125, -0.544677734375, -0.52801513671875, -0.5113525390625, -0.49468994140625, -0.47802734375, -0.46136474609375, -0.4447021484375, -0.42803955078125, -0.411376953125, -0.39471435546875, -0.3780517578125, -0.36138916015625, -0.3447265625, -0.32806396484375, -0.3114013671875, -0.29473876953125, -0.278076171875, -0.26141357421875, -0.2447509765625, -0.22808837890625, -0.21142578125, -0.19476318359375, -0.1781005859375, -0.16143798828125, -0.144775390625, -0.12811279296875, -0.1114501953125, -0.09478759765625, -0.078125, -0.06146240234375, -0.0447998046875, -0.02813720703125, -0.011474609375, 0.00518798828125, 0.0218505859375, 0.03851318359375, 0.05517578125, 0.07183837890625, 0.0885009765625, 0.10516357421875, 0.121826171875, 0.13848876953125, 0.1551513671875, 0.17181396484375, 0.1884765625, 0.20513916015625, 0.2218017578125, 0.23846435546875, 0.255126953125, 0.27178955078125, 0.2884521484375, 0.30511474609375, 0.32177734375, 0.33843994140625, 0.3551025390625, 0.37176513671875, 0.388427734375, 0.40509033203125, 0.4217529296875, 0.43841552734375, 0.455078125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 13.0, 14.0, 40.0, 63.0, 92.0, 150.0, 162.0, 137.0, 130.0, 86.0, 49.0, 26.0, 10.0, 11.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.105224609375, -0.10288047790527344, -0.10053634643554688, -0.09819221496582031, -0.09584808349609375, -0.09350395202636719, -0.09115982055664062, -0.08881568908691406, -0.0864715576171875, -0.08412742614746094, -0.08178329467773438, -0.07943916320800781, -0.07709503173828125, -0.07475090026855469, -0.07240676879882812, -0.07006263732910156, -0.067718505859375, -0.06537437438964844, -0.06303024291992188, -0.06068611145019531, -0.05834197998046875, -0.05599784851074219, -0.053653717041015625, -0.05130958557128906, -0.0489654541015625, -0.04662132263183594, -0.044277191162109375, -0.04193305969238281, -0.03958892822265625, -0.03724479675292969, -0.034900665283203125, -0.03255653381347656, -0.03021240234375, -0.027868270874023438, -0.025524139404296875, -0.023180007934570312, -0.02083587646484375, -0.018491744995117188, -0.016147613525390625, -0.013803482055664062, -0.0114593505859375, -0.009115219116210938, -0.006771087646484375, -0.0044269561767578125, -0.00208282470703125, 0.0002613067626953125, 0.002605438232421875, 0.0049495697021484375, 0.007293701171875, 0.009637832641601562, 0.011981964111328125, 0.014326095581054688, 0.01667022705078125, 0.019014358520507812, 0.021358489990234375, 0.023702621459960938, 0.0260467529296875, 0.028390884399414062, 0.030735015869140625, 0.03307914733886719, 0.03542327880859375, 0.03776741027832031, 0.040111541748046875, 0.04245567321777344, 0.0447998046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 4.0, 9.0, 14.0, 23.0, 30.0, 51.0, 64.0, 93.0, 161.0, 214.0, 365.0, 569.0, 923.0, 1483.0, 2617.0, 4521.0, 8247.0, 15817.0, 31743.0, 68441.0, 160074.0, 366375.0, 215657.0, 87861.0, 40280.0, 19673.0, 10097.0, 5346.0, 3021.0, 1843.0, 1067.0, 654.0, 423.0, 237.0, 181.0, 127.0, 73.0, 60.0, 36.0, 27.0, 19.0, 15.0, 8.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1318359375, -0.12723541259765625, -0.1226348876953125, -0.11803436279296875, -0.113433837890625, -0.10883331298828125, -0.1042327880859375, -0.09963226318359375, -0.09503173828125, -0.09043121337890625, -0.0858306884765625, -0.08123016357421875, -0.076629638671875, -0.07202911376953125, -0.0674285888671875, -0.06282806396484375, -0.0582275390625, -0.05362701416015625, -0.0490264892578125, -0.04442596435546875, -0.039825439453125, -0.03522491455078125, -0.0306243896484375, -0.02602386474609375, -0.02142333984375, -0.01682281494140625, -0.0122222900390625, -0.00762176513671875, -0.003021240234375, 0.00157928466796875, 0.0061798095703125, 0.01078033447265625, 0.015380859375, 0.01998138427734375, 0.0245819091796875, 0.02918243408203125, 0.033782958984375, 0.03838348388671875, 0.0429840087890625, 0.04758453369140625, 0.05218505859375, 0.05678558349609375, 0.0613861083984375, 0.06598663330078125, 0.070587158203125, 0.07518768310546875, 0.0797882080078125, 0.08438873291015625, 0.0889892578125, 0.09358978271484375, 0.0981903076171875, 0.10279083251953125, 0.107391357421875, 0.11199188232421875, 0.1165924072265625, 0.12119293212890625, 0.12579345703125, 0.13039398193359375, 0.1349945068359375, 0.13959503173828125, 0.144195556640625, 0.14879608154296875, 0.1533966064453125, 0.15799713134765625, 0.16259765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 12.0, 4.0, 13.0, 17.0, 19.0, 28.0, 28.0, 27.0, 30.0, 35.0, 43.0, 48.0, 52.0, 51.0, 51.0, 67.0, 54.0, 51.0, 39.0, 48.0, 41.0, 35.0, 28.0, 27.0, 27.0, 18.0, 21.0, 15.0, 17.0, 7.0, 8.0, 9.0, 5.0, 3.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135498046875, -0.13073348999023438, -0.12596893310546875, -0.12120437622070312, -0.1164398193359375, -0.11167526245117188, -0.10691070556640625, -0.10214614868164062, -0.097381591796875, -0.09261703491210938, -0.08785247802734375, -0.08308792114257812, -0.0783233642578125, -0.07355880737304688, -0.06879425048828125, -0.06402969360351562, -0.05926513671875, -0.054500579833984375, -0.04973602294921875, -0.044971466064453125, -0.0402069091796875, -0.035442352294921875, -0.03067779541015625, -0.025913238525390625, -0.021148681640625, -0.016384124755859375, -0.01161956787109375, -0.006855010986328125, -0.0020904541015625, 0.002674102783203125, 0.00743865966796875, 0.012203216552734375, 0.0169677734375, 0.021732330322265625, 0.02649688720703125, 0.031261444091796875, 0.0360260009765625, 0.040790557861328125, 0.04555511474609375, 0.050319671630859375, 0.055084228515625, 0.059848785400390625, 0.06461334228515625, 0.06937789916992188, 0.0741424560546875, 0.07890701293945312, 0.08367156982421875, 0.08843612670898438, 0.09320068359375, 0.09796524047851562, 0.10272979736328125, 0.10749435424804688, 0.1122589111328125, 0.11702346801757812, 0.12178802490234375, 0.12655258178710938, 0.131317138671875, 0.13608169555664062, 0.14084625244140625, 0.14561080932617188, 0.1503753662109375, 0.15513992309570312, 0.15990447998046875, 0.16466903686523438, 0.16943359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 7.0, 2.0, 9.0, 10.0, 23.0, 26.0, 37.0, 59.0, 132.0, 260.0, 605.0, 1510.0, 4867.0, 21559.0, 237932.0, 722995.0, 46381.0, 8320.0, 2335.0, 797.0, 356.0, 143.0, 91.0, 40.0, 27.0, 12.0, 12.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1927490234375, -0.18676185607910156, -0.18077468872070312, -0.1747875213623047, -0.16880035400390625, -0.1628131866455078, -0.15682601928710938, -0.15083885192871094, -0.1448516845703125, -0.13886451721191406, -0.13287734985351562, -0.1268901824951172, -0.12090301513671875, -0.11491584777832031, -0.10892868041992188, -0.10294151306152344, -0.096954345703125, -0.09096717834472656, -0.08498001098632812, -0.07899284362792969, -0.07300567626953125, -0.06701850891113281, -0.061031341552734375, -0.05504417419433594, -0.0490570068359375, -0.04306983947753906, -0.037082672119140625, -0.031095504760742188, -0.02510833740234375, -0.019121170043945312, -0.013134002685546875, -0.0071468353271484375, -0.00115966796875, 0.0048274993896484375, 0.010814666748046875, 0.016801834106445312, 0.02278900146484375, 0.028776168823242188, 0.034763336181640625, 0.04075050354003906, 0.0467376708984375, 0.05272483825683594, 0.058712005615234375, 0.06469917297363281, 0.07068634033203125, 0.07667350769042969, 0.08266067504882812, 0.08864784240722656, 0.094635009765625, 0.10062217712402344, 0.10660934448242188, 0.11259651184082031, 0.11858367919921875, 0.12457084655761719, 0.13055801391601562, 0.13654518127441406, 0.1425323486328125, 0.14851951599121094, 0.15450668334960938, 0.1604938507080078, 0.16648101806640625, 0.1724681854248047, 0.17845535278320312, 0.18444252014160156, 0.1904296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 4.0, 9.0, 23.0, 18.0, 40.0, 79.0, 153.0, 363.0, 118.0, 62.0, 29.0, 26.0, 12.0, 16.0, 14.0, 4.0, 3.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004100799560546875, -0.0003966018557548523, -0.0003831237554550171, -0.0003696456551551819, -0.0003561675548553467, -0.0003426894545555115, -0.00032921135425567627, -0.00031573325395584106, -0.00030225515365600586, -0.00028877705335617065, -0.00027529895305633545, -0.00026182085275650024, -0.00024834275245666504, -0.00023486465215682983, -0.00022138655185699463, -0.00020790845155715942, -0.00019443035125732422, -0.00018095225095748901, -0.0001674741506576538, -0.0001539960503578186, -0.0001405179500579834, -0.0001270398497581482, -0.00011356174945831299, -0.00010008364915847778, -8.660554885864258e-05, -7.312744855880737e-05, -5.964934825897217e-05, -4.617124795913696e-05, -3.269314765930176e-05, -1.9215047359466553e-05, -5.736947059631348e-06, 7.741153240203857e-06, 2.1219253540039062e-05, 3.469735383987427e-05, 4.817545413970947e-05, 6.165355443954468e-05, 7.513165473937988e-05, 8.860975503921509e-05, 0.00010208785533905029, 0.0001155659556388855, 0.0001290440559387207, 0.0001425221562385559, 0.0001560002565383911, 0.00016947835683822632, 0.00018295645713806152, 0.00019643455743789673, 0.00020991265773773193, 0.00022339075803756714, 0.00023686885833740234, 0.00025034695863723755, 0.00026382505893707275, 0.00027730315923690796, 0.00029078125953674316, 0.00030425935983657837, 0.0003177374601364136, 0.0003312155604362488, 0.000344693660736084, 0.0003581717610359192, 0.0003716498613357544, 0.0003851279616355896, 0.0003986060619354248, 0.00041208416223526, 0.0004255622625350952, 0.0004390403628349304, 0.0004525184631347656]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 12.0, 21.0, 25.0, 29.0, 55.0, 76.0, 129.0, 240.0, 358.0, 605.0, 1075.0, 2000.0, 3979.0, 8997.0, 24788.0, 99937.0, 646539.0, 198611.0, 37717.0, 12452.0, 5184.0, 2491.0, 1351.0, 750.0, 425.0, 271.0, 165.0, 92.0, 71.0, 32.0, 23.0, 15.0, 14.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1168212890625, -0.11324596405029297, -0.10967063903808594, -0.1060953140258789, -0.10251998901367188, -0.09894466400146484, -0.09536933898925781, -0.09179401397705078, -0.08821868896484375, -0.08464336395263672, -0.08106803894042969, -0.07749271392822266, -0.07391738891601562, -0.0703420639038086, -0.06676673889160156, -0.06319141387939453, -0.0596160888671875, -0.05604076385498047, -0.05246543884277344, -0.048890113830566406, -0.045314788818359375, -0.041739463806152344, -0.03816413879394531, -0.03458881378173828, -0.03101348876953125, -0.02743816375732422, -0.023862838745117188, -0.020287513732910156, -0.016712188720703125, -0.013136863708496094, -0.009561538696289062, -0.005986213684082031, -0.002410888671875, 0.0011644363403320312, 0.0047397613525390625, 0.008315086364746094, 0.011890411376953125, 0.015465736389160156, 0.019041061401367188, 0.02261638641357422, 0.02619171142578125, 0.02976703643798828, 0.03334236145019531, 0.036917686462402344, 0.040493011474609375, 0.044068336486816406, 0.04764366149902344, 0.05121898651123047, 0.0547943115234375, 0.05836963653564453, 0.06194496154785156, 0.0655202865600586, 0.06909561157226562, 0.07267093658447266, 0.07624626159667969, 0.07982158660888672, 0.08339691162109375, 0.08697223663330078, 0.09054756164550781, 0.09412288665771484, 0.09769821166992188, 0.1012735366821289, 0.10484886169433594, 0.10842418670654297, 0.11199951171875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 4.0, 9.0, 13.0, 15.0, 28.0, 30.0, 39.0, 54.0, 79.0, 120.0, 134.0, 99.0, 99.0, 66.0, 48.0, 27.0, 32.0, 18.0, 9.0, 19.0, 10.0, 5.0, 6.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09600830078125, -0.09288501739501953, -0.08976173400878906, -0.0866384506225586, -0.08351516723632812, -0.08039188385009766, -0.07726860046386719, -0.07414531707763672, -0.07102203369140625, -0.06789875030517578, -0.06477546691894531, -0.061652183532714844, -0.058528900146484375, -0.055405616760253906, -0.05228233337402344, -0.04915904998779297, -0.0460357666015625, -0.04291248321533203, -0.03978919982910156, -0.036665916442871094, -0.033542633056640625, -0.030419349670410156, -0.027296066284179688, -0.02417278289794922, -0.02104949951171875, -0.01792621612548828, -0.014802932739257812, -0.011679649353027344, -0.008556365966796875, -0.005433082580566406, -0.0023097991943359375, 0.0008134841918945312, 0.003936767578125, 0.007060050964355469, 0.010183334350585938, 0.013306617736816406, 0.016429901123046875, 0.019553184509277344, 0.022676467895507812, 0.02579975128173828, 0.02892303466796875, 0.03204631805419922, 0.03516960144042969, 0.038292884826660156, 0.041416168212890625, 0.044539451599121094, 0.04766273498535156, 0.05078601837158203, 0.0539093017578125, 0.05703258514404297, 0.06015586853027344, 0.0632791519165039, 0.06640243530273438, 0.06952571868896484, 0.07264900207519531, 0.07577228546142578, 0.07889556884765625, 0.08201885223388672, 0.08514213562011719, 0.08826541900634766, 0.09138870239257812, 0.0945119857788086, 0.09763526916503906, 0.10075855255126953, 0.1038818359375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 6.0, 8.0, 8.0, 28.0, 46.0, 80.0, 166.0, 228.0, 196.0, 93.0, 59.0, 37.0, 20.0, 13.0, 2.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.867201566696167, -1.8060872554779053, -1.744972825050354, -1.6838585138320923, -1.622744083404541, -1.5616297721862793, -1.500515341758728, -1.4394010305404663, -1.378286600112915, -1.3171722888946533, -1.256057858467102, -1.1949435472488403, -1.133829116821289, -1.0727148056030273, -1.011600375175476, -0.9504860639572144, -0.8893716931343079, -0.8282573223114014, -0.7671429514884949, -0.7060285806655884, -0.6449142098426819, -0.5837998390197754, -0.5226855278015137, -0.4615711271762848, -0.4004567563533783, -0.3393423855304718, -0.2782280147075653, -0.21711365878582, -0.1559992879629135, -0.09488493204116821, -0.03377056121826172, 0.027343809604644775, 0.08845818042755127, 0.14957255125045776, 0.21068692207336426, 0.27180129289627075, 0.33291566371917725, 0.39403000473976135, 0.45514437556266785, 0.516258716583252, 0.5773731470108032, 0.6384875178337097, 0.6996018886566162, 0.7607162594795227, 0.8218306303024292, 0.8829449415206909, 0.9440593719482422, 1.005173683166504, 1.0662879943847656, 1.1274023056030273, 1.1885167360305786, 1.2496310472488403, 1.3107454776763916, 1.3718597888946533, 1.4329742193222046, 1.4940885305404663, 1.5552029609680176, 1.6163172721862793, 1.6774317026138306, 1.7385460138320923, 1.7996604442596436, 1.8607747554779053, 1.9218891859054565, 1.9830034971237183, 2.0441179275512695]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 2.0, 11.0, 11.0, 7.0, 13.0, 22.0, 23.0, 22.0, 42.0, 43.0, 48.0, 52.0, 38.0, 41.0, 48.0, 62.0, 54.0, 48.0, 60.0, 38.0, 27.0, 50.0, 35.0, 38.0, 34.0, 26.0, 22.0, 24.0, 11.0, 9.0, 9.0, 6.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1428098678588867, -1.1130892038345337, -1.0833685398101807, -1.0536479949951172, -1.0239273309707642, -0.9942066669464111, -0.9644860625267029, -0.9347654581069946, -0.9050447940826416, -0.8753241300582886, -0.8456035256385803, -0.8158829212188721, -0.786162257194519, -0.756441593170166, -0.7267209887504578, -0.6970003843307495, -0.6672797203063965, -0.6375590562820435, -0.6078384518623352, -0.578117847442627, -0.5483971834182739, -0.5186765193939209, -0.48895591497421265, -0.459235280752182, -0.42951464653015137, -0.3997940123081207, -0.3700733780860901, -0.34035274386405945, -0.3106321096420288, -0.28091147541999817, -0.25119084119796753, -0.2214702069759369, -0.19174951314926147, -0.16202887892723083, -0.1323082447052002, -0.10258761048316956, -0.07286697626113892, -0.043146342039108276, -0.013425707817077637, 0.016294926404953003, 0.04601556062698364, 0.07573619484901428, 0.10545682907104492, 0.13517746329307556, 0.1648980975151062, 0.19461873173713684, 0.22433936595916748, 0.2540600001811981, 0.28378063440322876, 0.3135012686252594, 0.34322190284729004, 0.3729425370693207, 0.4026631712913513, 0.43238380551338196, 0.4621044397354126, 0.49182507395744324, 0.5215457081794739, 0.5512663125991821, 0.5809869766235352, 0.6107076406478882, 0.6404282450675964, 0.6701488494873047, 0.6998695135116577, 0.7295901775360107, 0.759310781955719]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 7.0, 8.0, 6.0, 6.0, 17.0, 24.0, 33.0, 39.0, 46.0, 89.0, 151.0, 305.0, 620.0, 1472.0, 4713.0, 24617.0, 3988276.0, 156167.0, 12227.0, 3001.0, 1150.0, 526.0, 302.0, 145.0, 105.0, 92.0, 37.0, 33.0, 23.0, 12.0, 7.0, 0.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5196685791015625, -0.505157470703125, -0.4906463623046875, -0.47613525390625, -0.4616241455078125, -0.447113037109375, -0.4326019287109375, -0.4180908203125, -0.4035797119140625, -0.389068603515625, -0.3745574951171875, -0.36004638671875, -0.3455352783203125, -0.331024169921875, -0.3165130615234375, -0.302001953125, -0.2874908447265625, -0.272979736328125, -0.2584686279296875, -0.24395751953125, -0.2294464111328125, -0.214935302734375, -0.2004241943359375, -0.1859130859375, -0.1714019775390625, -0.156890869140625, -0.1423797607421875, -0.12786865234375, -0.1133575439453125, -0.098846435546875, -0.0843353271484375, -0.06982421875, -0.0553131103515625, -0.040802001953125, -0.0262908935546875, -0.01177978515625, 0.0027313232421875, 0.017242431640625, 0.0317535400390625, 0.0462646484375, 0.0607757568359375, 0.075286865234375, 0.0897979736328125, 0.10430908203125, 0.1188201904296875, 0.133331298828125, 0.1478424072265625, 0.162353515625, 0.1768646240234375, 0.191375732421875, 0.2058868408203125, 0.22039794921875, 0.2349090576171875, 0.249420166015625, 0.2639312744140625, 0.2784423828125, 0.2929534912109375, 0.307464599609375, 0.3219757080078125, 0.33648681640625, 0.3509979248046875, 0.365509033203125, 0.3800201416015625, 0.39453125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 9.0, 10.0, 7.0, 33.0, 39.0, 70.0, 104.0, 137.0, 140.0, 131.0, 119.0, 89.0, 46.0, 27.0, 17.0, 12.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.099853515625, -0.09761953353881836, -0.09538555145263672, -0.09315156936645508, -0.09091758728027344, -0.0886836051940918, -0.08644962310791016, -0.08421564102172852, -0.08198165893554688, -0.07974767684936523, -0.0775136947631836, -0.07527971267700195, -0.07304573059082031, -0.07081174850463867, -0.06857776641845703, -0.06634378433227539, -0.06410980224609375, -0.06187582015991211, -0.05964183807373047, -0.05740785598754883, -0.05517387390136719, -0.05293989181518555, -0.050705909729003906, -0.048471927642822266, -0.046237945556640625, -0.044003963470458984, -0.041769981384277344, -0.0395359992980957, -0.03730201721191406, -0.03506803512573242, -0.03283405303955078, -0.03060007095336914, -0.0283660888671875, -0.02613210678100586, -0.02389812469482422, -0.021664142608642578, -0.019430160522460938, -0.017196178436279297, -0.014962196350097656, -0.012728214263916016, -0.010494232177734375, -0.008260250091552734, -0.006026268005371094, -0.003792285919189453, -0.0015583038330078125, 0.0006756782531738281, 0.0029096603393554688, 0.005143642425537109, 0.00737762451171875, 0.00961160659790039, 0.011845588684082031, 0.014079570770263672, 0.016313552856445312, 0.018547534942626953, 0.020781517028808594, 0.023015499114990234, 0.025249481201171875, 0.027483463287353516, 0.029717445373535156, 0.0319514274597168, 0.03418540954589844, 0.03641939163208008, 0.03865337371826172, 0.04088735580444336, 0.043121337890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 6.0, 7.0, 4.0, 9.0, 16.0, 27.0, 36.0, 45.0, 56.0, 71.0, 120.0, 124.0, 218.0, 330.0, 531.0, 850.0, 1412.0, 2674.0, 5121.0, 11071.0, 28910.0, 123749.0, 3769360.0, 186690.0, 36439.0, 13205.0, 5966.0, 3040.0, 1680.0, 977.0, 594.0, 282.0, 210.0, 143.0, 90.0, 72.0, 40.0, 29.0, 23.0, 10.0, 18.0, 11.0, 7.0, 9.0, 0.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1700439453125, -0.16409683227539062, -0.15814971923828125, -0.15220260620117188, -0.1462554931640625, -0.14030838012695312, -0.13436126708984375, -0.12841415405273438, -0.122467041015625, -0.11651992797851562, -0.11057281494140625, -0.10462570190429688, -0.0986785888671875, -0.09273147583007812, -0.08678436279296875, -0.08083724975585938, -0.07489013671875, -0.06894302368164062, -0.06299591064453125, -0.057048797607421875, -0.0511016845703125, -0.045154571533203125, -0.03920745849609375, -0.033260345458984375, -0.027313232421875, -0.021366119384765625, -0.01541900634765625, -0.009471893310546875, -0.0035247802734375, 0.002422332763671875, 0.00836944580078125, 0.014316558837890625, 0.020263671875, 0.026210784912109375, 0.03215789794921875, 0.038105010986328125, 0.0440521240234375, 0.049999237060546875, 0.05594635009765625, 0.061893463134765625, 0.067840576171875, 0.07378768920898438, 0.07973480224609375, 0.08568191528320312, 0.0916290283203125, 0.09757614135742188, 0.10352325439453125, 0.10947036743164062, 0.11541748046875, 0.12136459350585938, 0.12731170654296875, 0.13325881958007812, 0.1392059326171875, 0.14515304565429688, 0.15110015869140625, 0.15704727172851562, 0.162994384765625, 0.16894149780273438, 0.17488861083984375, 0.18083572387695312, 0.1867828369140625, 0.19272994995117188, 0.19867706298828125, 0.20462417602539062, 0.2105712890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 10.0, 9.0, 10.0, 19.0, 21.0, 32.0, 58.0, 105.0, 207.0, 2773.0, 449.0, 135.0, 87.0, 37.0, 24.0, 33.0, 9.0, 8.0, 10.0, 5.0, 4.0, 5.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06964111328125, -0.06751346588134766, -0.06538581848144531, -0.06325817108154297, -0.061130523681640625, -0.05900287628173828, -0.05687522888183594, -0.054747581481933594, -0.05261993408203125, -0.050492286682128906, -0.04836463928222656, -0.04623699188232422, -0.044109344482421875, -0.04198169708251953, -0.03985404968261719, -0.037726402282714844, -0.0355987548828125, -0.033471107482910156, -0.03134346008300781, -0.02921581268310547, -0.027088165283203125, -0.02496051788330078, -0.022832870483398438, -0.020705223083496094, -0.01857757568359375, -0.016449928283691406, -0.014322280883789062, -0.012194633483886719, -0.010066986083984375, -0.007939338684082031, -0.0058116912841796875, -0.0036840438842773438, -0.001556396484375, 0.0005712509155273438, 0.0026988983154296875, 0.004826545715332031, 0.006954193115234375, 0.009081840515136719, 0.011209487915039062, 0.013337135314941406, 0.01546478271484375, 0.017592430114746094, 0.019720077514648438, 0.02184772491455078, 0.023975372314453125, 0.02610301971435547, 0.028230667114257812, 0.030358314514160156, 0.0324859619140625, 0.034613609313964844, 0.03674125671386719, 0.03886890411376953, 0.040996551513671875, 0.04312419891357422, 0.04525184631347656, 0.047379493713378906, 0.04950714111328125, 0.051634788513183594, 0.05376243591308594, 0.05589008331298828, 0.058017730712890625, 0.06014537811279297, 0.06227302551269531, 0.06440067291259766, 0.0665283203125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 21.0, 75.0, 426.0, 394.0, 77.0, 10.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.846519947052002, -1.8109623193740845, -1.775404691696167, -1.73984694480896, -1.7042893171310425, -1.668731689453125, -1.6331740617752075, -1.59761643409729, -1.562058687210083, -1.5265010595321655, -1.490943431854248, -1.455385684967041, -1.4198280572891235, -1.384270429611206, -1.3487128019332886, -1.313155174255371, -1.2775975465774536, -1.2420399188995361, -1.2064822912216187, -1.1709245443344116, -1.1353669166564941, -1.0998092889785767, -1.0642516613006592, -1.0286940336227417, -0.9931363463401794, -0.957578718662262, -0.9220210313796997, -0.8864634037017822, -0.8509057760238647, -0.8153480887413025, -0.779790461063385, -0.7442327737808228, -0.7086750268936157, -0.6731173992156982, -0.637559711933136, -0.6020020842552185, -0.5664443969726562, -0.5308867692947388, -0.4953291416168213, -0.4597714841365814, -0.42421382665634155, -0.3886561691761017, -0.3530985116958618, -0.31754088401794434, -0.28198322653770447, -0.2464255690574646, -0.21086792647838593, -0.17531028389930725, -0.13975262641906738, -0.10419497638940811, -0.06863732635974884, -0.03307967633008957, 0.002477973699569702, 0.03803563117980957, 0.07359327375888824, 0.10915091633796692, 0.1447085738182068, 0.18026623129844666, 0.21582387387752533, 0.251381516456604, 0.28693917393684387, 0.32249683141708374, 0.3580544590950012, 0.3936121165752411, 0.42916977405548096]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 5.0, 7.0, 20.0, 16.0, 54.0, 44.0, 44.0, 66.0, 86.0, 71.0, 83.0, 74.0, 77.0, 56.0, 51.0, 50.0, 60.0, 37.0, 33.0, 19.0, 14.0, 11.0, 13.0, 5.0, 6.0, 2.0, 2.0], "bins": [-0.41808414459228516, -0.4095260202884674, -0.40096792578697205, -0.3924098014831543, -0.38385167717933655, -0.3752935528755188, -0.36673545837402344, -0.3581773340702057, -0.34961920976638794, -0.3410610854625702, -0.33250299096107483, -0.3239448666572571, -0.31538674235343933, -0.3068286180496216, -0.2982705235481262, -0.28971239924430847, -0.2811542749404907, -0.272596150636673, -0.2640380561351776, -0.25547993183135986, -0.24692180752754211, -0.23836369812488556, -0.229805588722229, -0.22124746441841125, -0.2126893699169159, -0.20413126051425934, -0.1955731362104416, -0.18701502680778503, -0.17845690250396729, -0.16989879310131073, -0.16134068369865417, -0.15278255939483643, -0.14422443509101868, -0.13566632568836212, -0.12710820138454437, -0.11855009198188782, -0.10999196767807007, -0.10143385827541351, -0.09287574142217636, -0.08431762456893921, -0.07575950771570206, -0.0672013908624649, -0.05864327400922775, -0.0500851608812809, -0.04152704402804375, -0.032968927174806595, -0.02441081404685974, -0.01585269719362259, -0.007294580340385437, 0.0012635355815291405, 0.009821651503443718, 0.01837976649403572, 0.026937883347272873, 0.035496000200510025, 0.04405411332845688, 0.05261223018169403, 0.06117034703493118, 0.06972846388816833, 0.07828658074140549, 0.08684469759464264, 0.0954028069972992, 0.10396093130111694, 0.1125190407037735, 0.12107715755701065, 0.1296352744102478]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 6.0, 2.0, 4.0, 6.0, 13.0, 6.0, 16.0, 10.0, 29.0, 15.0, 33.0, 49.0, 85.0, 118.0, 166.0, 300.0, 478.0, 807.0, 1334.0, 2697.0, 7036.0, 25274.0, 132770.0, 631351.0, 195764.0, 34172.0, 8812.0, 3403.0, 1584.0, 831.0, 493.0, 302.0, 174.0, 122.0, 71.0, 55.0, 36.0, 23.0, 28.0, 15.0, 17.0, 11.0, 6.0, 15.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.328125, -0.318359375, -0.30859375, -0.298828125, -0.2890625, -0.279296875, -0.26953125, -0.259765625, -0.25, -0.240234375, -0.23046875, -0.220703125, -0.2109375, -0.201171875, -0.19140625, -0.181640625, -0.171875, -0.162109375, -0.15234375, -0.142578125, -0.1328125, -0.123046875, -0.11328125, -0.103515625, -0.09375, -0.083984375, -0.07421875, -0.064453125, -0.0546875, -0.044921875, -0.03515625, -0.025390625, -0.015625, -0.005859375, 0.00390625, 0.013671875, 0.0234375, 0.033203125, 0.04296875, 0.052734375, 0.0625, 0.072265625, 0.08203125, 0.091796875, 0.1015625, 0.111328125, 0.12109375, 0.130859375, 0.140625, 0.150390625, 0.16015625, 0.169921875, 0.1796875, 0.189453125, 0.19921875, 0.208984375, 0.21875, 0.228515625, 0.23828125, 0.248046875, 0.2578125, 0.267578125, 0.27734375, 0.287109375, 0.296875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 8.0, 20.0, 52.0, 70.0, 96.0, 115.0, 136.0, 142.0, 120.0, 97.0, 52.0, 31.0, 21.0, 8.0, 10.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.09930419921875, -0.0970926284790039, -0.09488105773925781, -0.09266948699951172, -0.09045791625976562, -0.08824634552001953, -0.08603477478027344, -0.08382320404052734, -0.08161163330078125, -0.07940006256103516, -0.07718849182128906, -0.07497692108154297, -0.07276535034179688, -0.07055377960205078, -0.06834220886230469, -0.0661306381225586, -0.0639190673828125, -0.061707496643066406, -0.05949592590332031, -0.05728435516357422, -0.055072784423828125, -0.05286121368408203, -0.05064964294433594, -0.048438072204589844, -0.04622650146484375, -0.044014930725097656, -0.04180335998535156, -0.03959178924560547, -0.037380218505859375, -0.03516864776611328, -0.03295707702636719, -0.030745506286621094, -0.028533935546875, -0.026322364807128906, -0.024110794067382812, -0.02189922332763672, -0.019687652587890625, -0.01747608184814453, -0.015264511108398438, -0.013052940368652344, -0.01084136962890625, -0.008629798889160156, -0.0064182281494140625, -0.004206657409667969, -0.001995086669921875, 0.00021648406982421875, 0.0024280548095703125, 0.004639625549316406, 0.0068511962890625, 0.009062767028808594, 0.011274337768554688, 0.013485908508300781, 0.015697479248046875, 0.01790904998779297, 0.020120620727539062, 0.022332191467285156, 0.02454376220703125, 0.026755332946777344, 0.028966903686523438, 0.03117847442626953, 0.033390045166015625, 0.03560161590576172, 0.03781318664550781, 0.040024757385253906, 0.042236328125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 9.0, 10.0, 17.0, 50.0, 47.0, 82.0, 133.0, 219.0, 337.0, 636.0, 1135.0, 2235.0, 4570.0, 10121.0, 24979.0, 68452.0, 223924.0, 460899.0, 162641.0, 51985.0, 19801.0, 8189.0, 3835.0, 1864.0, 1000.0, 571.0, 297.0, 181.0, 117.0, 68.0, 38.0, 45.0, 23.0, 9.0, 10.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1566162109375, -0.15109634399414062, -0.14557647705078125, -0.14005661010742188, -0.1345367431640625, -0.12901687622070312, -0.12349700927734375, -0.11797714233398438, -0.112457275390625, -0.10693740844726562, -0.10141754150390625, -0.09589767456054688, -0.0903778076171875, -0.08485794067382812, -0.07933807373046875, -0.07381820678710938, -0.06829833984375, -0.06277847290039062, -0.05725860595703125, -0.051738739013671875, -0.0462188720703125, -0.040699005126953125, -0.03517913818359375, -0.029659271240234375, -0.024139404296875, -0.018619537353515625, -0.01309967041015625, -0.007579803466796875, -0.0020599365234375, 0.003459930419921875, 0.00897979736328125, 0.014499664306640625, 0.02001953125, 0.025539398193359375, 0.03105926513671875, 0.036579132080078125, 0.0420989990234375, 0.047618865966796875, 0.05313873291015625, 0.058658599853515625, 0.064178466796875, 0.06969833374023438, 0.07521820068359375, 0.08073806762695312, 0.0862579345703125, 0.09177780151367188, 0.09729766845703125, 0.10281753540039062, 0.10833740234375, 0.11385726928710938, 0.11937713623046875, 0.12489700317382812, 0.1304168701171875, 0.13593673706054688, 0.14145660400390625, 0.14697647094726562, 0.152496337890625, 0.15801620483398438, 0.16353607177734375, 0.16905593872070312, 0.1745758056640625, 0.18009567260742188, 0.18561553955078125, 0.19113540649414062, 0.1966552734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 0.0, 2.0, 3.0, 1.0, 10.0, 4.0, 6.0, 18.0, 12.0, 19.0, 20.0, 27.0, 33.0, 28.0, 33.0, 44.0, 35.0, 50.0, 33.0, 53.0, 57.0, 52.0, 47.0, 44.0, 53.0, 50.0, 41.0, 41.0, 30.0, 28.0, 25.0, 19.0, 12.0, 8.0, 21.0, 10.0, 12.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1322021484375, -0.1275196075439453, -0.12283706665039062, -0.11815452575683594, -0.11347198486328125, -0.10878944396972656, -0.10410690307617188, -0.09942436218261719, -0.0947418212890625, -0.09005928039550781, -0.08537673950195312, -0.08069419860839844, -0.07601165771484375, -0.07132911682128906, -0.06664657592773438, -0.06196403503417969, -0.057281494140625, -0.05259895324707031, -0.047916412353515625, -0.04323387145996094, -0.03855133056640625, -0.03386878967285156, -0.029186248779296875, -0.024503707885742188, -0.0198211669921875, -0.015138626098632812, -0.010456085205078125, -0.0057735443115234375, -0.00109100341796875, 0.0035915374755859375, 0.008274078369140625, 0.012956619262695312, 0.01763916015625, 0.022321701049804688, 0.027004241943359375, 0.03168678283691406, 0.03636932373046875, 0.04105186462402344, 0.045734405517578125, 0.05041694641113281, 0.0550994873046875, 0.05978202819824219, 0.06446456909179688, 0.06914710998535156, 0.07382965087890625, 0.07851219177246094, 0.08319473266601562, 0.08787727355957031, 0.092559814453125, 0.09724235534667969, 0.10192489624023438, 0.10660743713378906, 0.11128997802734375, 0.11597251892089844, 0.12065505981445312, 0.1253376007080078, 0.1300201416015625, 0.1347026824951172, 0.13938522338867188, 0.14406776428222656, 0.14875030517578125, 0.15343284606933594, 0.15811538696289062, 0.1627979278564453, 0.16748046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 1.0, 10.0, 14.0, 19.0, 26.0, 67.0, 174.0, 928.0, 21230.0, 1009261.0, 15674.0, 868.0, 144.0, 52.0, 22.0, 16.0, 16.0, 2.0, 10.0, 10.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6640625, -0.6480484008789062, -0.6320343017578125, -0.6160202026367188, -0.600006103515625, -0.5839920043945312, -0.5679779052734375, -0.5519638061523438, -0.53594970703125, -0.5199356079101562, -0.5039215087890625, -0.48790740966796875, -0.471893310546875, -0.45587921142578125, -0.4398651123046875, -0.42385101318359375, -0.4078369140625, -0.39182281494140625, -0.3758087158203125, -0.35979461669921875, -0.343780517578125, -0.32776641845703125, -0.3117523193359375, -0.29573822021484375, -0.27972412109375, -0.26371002197265625, -0.2476959228515625, -0.23168182373046875, -0.215667724609375, -0.19965362548828125, -0.1836395263671875, -0.16762542724609375, -0.151611328125, -0.13559722900390625, -0.1195831298828125, -0.10356903076171875, -0.087554931640625, -0.07154083251953125, -0.0555267333984375, -0.03951263427734375, -0.02349853515625, -0.00748443603515625, 0.0085296630859375, 0.02454376220703125, 0.040557861328125, 0.05657196044921875, 0.0725860595703125, 0.08860015869140625, 0.1046142578125, 0.12062835693359375, 0.1366424560546875, 0.15265655517578125, 0.168670654296875, 0.18468475341796875, 0.2006988525390625, 0.21671295166015625, 0.23272705078125, 0.24874114990234375, 0.2647552490234375, 0.28076934814453125, 0.296783447265625, 0.31279754638671875, 0.3288116455078125, 0.34482574462890625, 0.36083984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 8.0, 13.0, 12.0, 14.0, 23.0, 34.0, 58.0, 115.0, 268.0, 194.0, 92.0, 50.0, 35.0, 22.0, 11.0, 14.0, 5.0, 3.0, 2.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018310546875, -0.00017539411783218384, -0.00016768276691436768, -0.00015997141599655151, -0.00015226006507873535, -0.0001445487141609192, -0.00013683736324310303, -0.00012912601232528687, -0.0001214146614074707, -0.00011370331048965454, -0.00010599195957183838, -9.828060865402222e-05, -9.056925773620605e-05, -8.285790681838989e-05, -7.514655590057373e-05, -6.743520498275757e-05, -5.9723854064941406e-05, -5.2012503147125244e-05, -4.430115222930908e-05, -3.658980131149292e-05, -2.8878450393676758e-05, -2.1167099475860596e-05, -1.3455748558044434e-05, -5.7443976402282715e-06, 1.9669532775878906e-06, 9.678304195404053e-06, 1.7389655113220215e-05, 2.5101006031036377e-05, 3.281235694885254e-05, 4.05237078666687e-05, 4.823505878448486e-05, 5.5946409702301025e-05, 6.365776062011719e-05, 7.136911153793335e-05, 7.908046245574951e-05, 8.679181337356567e-05, 9.450316429138184e-05, 0.000102214515209198, 0.00010992586612701416, 0.00011763721704483032, 0.00012534856796264648, 0.00013305991888046265, 0.0001407712697982788, 0.00014848262071609497, 0.00015619397163391113, 0.0001639053225517273, 0.00017161667346954346, 0.00017932802438735962, 0.00018703937530517578, 0.00019475072622299194, 0.0002024620771408081, 0.00021017342805862427, 0.00021788477897644043, 0.0002255961298942566, 0.00023330748081207275, 0.00024101883172988892, 0.0002487301826477051, 0.00025644153356552124, 0.0002641528844833374, 0.00027186423540115356, 0.0002795755863189697, 0.0002872869372367859, 0.00029499828815460205, 0.0003027096390724182, 0.0003104209899902344]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 9.0, 15.0, 20.0, 30.0, 64.0, 89.0, 160.0, 343.0, 795.0, 2300.0, 8692.0, 53736.0, 746540.0, 208949.0, 20096.0, 4320.0, 1327.0, 512.0, 222.0, 125.0, 78.0, 40.0, 33.0, 19.0, 9.0, 11.0, 5.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18310546875, -0.17751502990722656, -0.17192459106445312, -0.1663341522216797, -0.16074371337890625, -0.1551532745361328, -0.14956283569335938, -0.14397239685058594, -0.1383819580078125, -0.13279151916503906, -0.12720108032226562, -0.12161064147949219, -0.11602020263671875, -0.11042976379394531, -0.10483932495117188, -0.09924888610839844, -0.093658447265625, -0.08806800842285156, -0.08247756958007812, -0.07688713073730469, -0.07129669189453125, -0.06570625305175781, -0.060115814208984375, -0.05452537536621094, -0.0489349365234375, -0.04334449768066406, -0.037754058837890625, -0.03216361999511719, -0.02657318115234375, -0.020982742309570312, -0.015392303466796875, -0.009801864624023438, -0.00421142578125, 0.0013790130615234375, 0.006969451904296875, 0.012559890747070312, 0.01815032958984375, 0.023740768432617188, 0.029331207275390625, 0.03492164611816406, 0.0405120849609375, 0.04610252380371094, 0.051692962646484375, 0.05728340148925781, 0.06287384033203125, 0.06846427917480469, 0.07405471801757812, 0.07964515686035156, 0.085235595703125, 0.09082603454589844, 0.09641647338867188, 0.10200691223144531, 0.10759735107421875, 0.11318778991699219, 0.11877822875976562, 0.12436866760253906, 0.1299591064453125, 0.13554954528808594, 0.14113998413085938, 0.1467304229736328, 0.15232086181640625, 0.1579113006591797, 0.16350173950195312, 0.16909217834472656, 0.1746826171875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 13.0, 9.0, 17.0, 29.0, 47.0, 60.0, 78.0, 127.0, 124.0, 138.0, 96.0, 72.0, 55.0, 41.0, 19.0, 22.0, 15.0, 9.0, 5.0, 9.0, 3.0, 1.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09002685546875, -0.08607959747314453, -0.08213233947753906, -0.0781850814819336, -0.07423782348632812, -0.07029056549072266, -0.06634330749511719, -0.06239604949951172, -0.05844879150390625, -0.05450153350830078, -0.05055427551269531, -0.046607017517089844, -0.042659759521484375, -0.038712501525878906, -0.03476524353027344, -0.03081798553466797, -0.0268707275390625, -0.02292346954345703, -0.018976211547851562, -0.015028953552246094, -0.011081695556640625, -0.007134437561035156, -0.0031871795654296875, 0.0007600784301757812, 0.00470733642578125, 0.008654594421386719, 0.012601852416992188, 0.016549110412597656, 0.020496368408203125, 0.024443626403808594, 0.028390884399414062, 0.03233814239501953, 0.036285400390625, 0.04023265838623047, 0.04417991638183594, 0.048127174377441406, 0.052074432373046875, 0.056021690368652344, 0.05996894836425781, 0.06391620635986328, 0.06786346435546875, 0.07181072235107422, 0.07575798034667969, 0.07970523834228516, 0.08365249633789062, 0.0875997543334961, 0.09154701232910156, 0.09549427032470703, 0.0994415283203125, 0.10338878631591797, 0.10733604431152344, 0.1112833023071289, 0.11523056030273438, 0.11917781829833984, 0.12312507629394531, 0.12707233428955078, 0.13101959228515625, 0.13496685028076172, 0.1389141082763672, 0.14286136627197266, 0.14680862426757812, 0.1507558822631836, 0.15470314025878906, 0.15865039825439453, 0.16259765625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 13.0, 11.0, 9.0, 26.0, 36.0, 39.0, 95.0, 148.0, 162.0, 160.0, 110.0, 68.0, 51.0, 21.0, 24.0, 12.0, 11.0, 2.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9016638994216919, -0.8558385968208313, -0.8100132942199707, -0.7641879916191101, -0.7183626890182495, -0.6725373864173889, -0.6267120838165283, -0.5808867812156677, -0.5350614786148071, -0.48923617601394653, -0.44341087341308594, -0.39758557081222534, -0.35176026821136475, -0.30593496561050415, -0.26010966300964355, -0.21428436040878296, -0.16845905780792236, -0.12263375520706177, -0.07680845260620117, -0.030983150005340576, 0.01484215259552002, 0.060667455196380615, 0.10649275779724121, 0.1523180603981018, 0.1981433629989624, 0.243968665599823, 0.2897939682006836, 0.3356192708015442, 0.3814445734024048, 0.4272698760032654, 0.473095178604126, 0.5189204812049866, 0.5647459030151367, 0.6105712056159973, 0.6563965082168579, 0.7022218108177185, 0.7480471134185791, 0.7938724160194397, 0.8396977186203003, 0.8855230212211609, 0.9313483238220215, 0.9771736264228821, 1.0229989290237427, 1.068824291229248, 1.1146495342254639, 1.1604747772216797, 1.206300139427185, 1.2521255016326904, 1.2979507446289062, 1.343775987625122, 1.3896013498306274, 1.4354267120361328, 1.4812519550323486, 1.5270771980285645, 1.5729025602340698, 1.6187279224395752, 1.664553165435791, 1.7103784084320068, 1.7562037706375122, 1.8020291328430176, 1.8478543758392334, 1.8936796188354492, 1.9395049810409546, 1.98533034324646, 2.031155586242676]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 10.0, 9.0, 8.0, 13.0, 12.0, 17.0, 30.0, 16.0, 16.0, 40.0, 29.0, 29.0, 42.0, 48.0, 53.0, 58.0, 56.0, 52.0, 50.0, 43.0, 50.0, 35.0, 28.0, 31.0, 38.0, 32.0, 25.0, 18.0, 23.0, 12.0, 11.0, 11.0, 12.0, 8.0, 11.0, 3.0, 1.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7087627053260803, -0.6819206476211548, -0.6550785899162292, -0.6282365322113037, -0.6013944149017334, -0.5745524168014526, -0.5477102994918823, -0.5208682417869568, -0.49402618408203125, -0.4671841263771057, -0.4403420686721802, -0.41349998116493225, -0.3866579234600067, -0.3598158657550812, -0.33297377824783325, -0.3061317205429077, -0.2792896628379822, -0.25244760513305664, -0.2256055325269699, -0.19876345992088318, -0.17192140221595764, -0.1450793445110321, -0.11823727190494537, -0.09139519929885864, -0.0645531415939331, -0.03771107643842697, -0.010869011282920837, 0.015973053872585297, 0.04281511902809143, 0.06965717673301697, 0.0964992493391037, 0.12334132194519043, 0.15018343925476074, 0.17702549695968628, 0.203867569565773, 0.23070964217185974, 0.2575516998767853, 0.2843937575817108, 0.31123584508895874, 0.3380779027938843, 0.3649199604988098, 0.39176201820373535, 0.4186040759086609, 0.4454461634159088, 0.47228822112083435, 0.4991302788257599, 0.5259723663330078, 0.5528144240379333, 0.5796564817428589, 0.6064985394477844, 0.63334059715271, 0.6601826548576355, 0.687024712562561, 0.7138668298721313, 0.7407088875770569, 0.7675509452819824, 0.794393002986908, 0.8212350606918335, 0.848077118396759, 0.8749191761016846, 0.9017612934112549, 0.9286032915115356, 0.955445408821106, 0.9822874665260315, 1.009129524230957]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 2.0, 8.0, 3.0, 3.0, 9.0, 9.0, 7.0, 19.0, 23.0, 17.0, 15.0, 38.0, 50.0, 74.0, 132.0, 204.0, 377.0, 741.0, 1756.0, 5145.0, 21613.0, 3054061.0, 1080081.0, 20991.0, 5041.0, 1921.0, 842.0, 408.0, 216.0, 142.0, 116.0, 59.0, 42.0, 47.0, 23.0, 15.0, 11.0, 2.0, 4.0, 7.0, 2.0, 4.0, 2.0], "bins": [-0.55908203125, -0.5460777282714844, -0.5330734252929688, -0.5200691223144531, -0.5070648193359375, -0.4940605163574219, -0.48105621337890625, -0.4680519104003906, -0.455047607421875, -0.4420433044433594, -0.42903900146484375, -0.4160346984863281, -0.4030303955078125, -0.3900260925292969, -0.37702178955078125, -0.3640174865722656, -0.35101318359375, -0.3380088806152344, -0.32500457763671875, -0.3120002746582031, -0.2989959716796875, -0.2859916687011719, -0.27298736572265625, -0.2599830627441406, -0.246978759765625, -0.23397445678710938, -0.22097015380859375, -0.20796585083007812, -0.1949615478515625, -0.18195724487304688, -0.16895294189453125, -0.15594863891601562, -0.1429443359375, -0.12994003295898438, -0.11693572998046875, -0.10393142700195312, -0.0909271240234375, -0.07792282104492188, -0.06491851806640625, -0.051914215087890625, -0.038909912109375, -0.025905609130859375, -0.01290130615234375, 0.000102996826171875, 0.0131072998046875, 0.026111602783203125, 0.03911590576171875, 0.052120208740234375, 0.06512451171875, 0.07812881469726562, 0.09113311767578125, 0.10413742065429688, 0.1171417236328125, 0.13014602661132812, 0.14315032958984375, 0.15615463256835938, 0.169158935546875, 0.18216323852539062, 0.19516754150390625, 0.20817184448242188, 0.2211761474609375, 0.23418045043945312, 0.24718475341796875, 0.2601890563964844, 0.273193359375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 11.0, 13.0, 19.0, 54.0, 86.0, 98.0, 126.0, 132.0, 137.0, 131.0, 75.0, 52.0, 25.0, 10.0, 10.0, 7.0, 0.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0972900390625, -0.09500646591186523, -0.09272289276123047, -0.0904393196105957, -0.08815574645996094, -0.08587217330932617, -0.0835886001586914, -0.08130502700805664, -0.07902145385742188, -0.07673788070678711, -0.07445430755615234, -0.07217073440551758, -0.06988716125488281, -0.06760358810424805, -0.06532001495361328, -0.06303644180297852, -0.06075286865234375, -0.058469295501708984, -0.05618572235107422, -0.05390214920043945, -0.05161857604980469, -0.04933500289916992, -0.047051429748535156, -0.04476785659790039, -0.042484283447265625, -0.04020071029663086, -0.037917137145996094, -0.03563356399536133, -0.03334999084472656, -0.031066417694091797, -0.02878284454345703, -0.026499271392822266, -0.0242156982421875, -0.021932125091552734, -0.01964855194091797, -0.017364978790283203, -0.015081405639648438, -0.012797832489013672, -0.010514259338378906, -0.00823068618774414, -0.005947113037109375, -0.0036635398864746094, -0.0013799667358398438, 0.0009036064147949219, 0.0031871795654296875, 0.005470752716064453, 0.007754325866699219, 0.010037899017333984, 0.01232147216796875, 0.014605045318603516, 0.01688861846923828, 0.019172191619873047, 0.021455764770507812, 0.023739337921142578, 0.026022911071777344, 0.02830648422241211, 0.030590057373046875, 0.03287363052368164, 0.035157203674316406, 0.03744077682495117, 0.03972434997558594, 0.0420079231262207, 0.04429149627685547, 0.046575069427490234, 0.048858642578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 6.0, 10.0, 12.0, 22.0, 37.0, 56.0, 98.0, 247.0, 499.0, 1066.0, 2751.0, 9117.0, 44722.0, 3656837.0, 439289.0, 29114.0, 6365.0, 2153.0, 887.0, 456.0, 212.0, 121.0, 70.0, 39.0, 31.0, 25.0, 11.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.419921875, -0.4091224670410156, -0.39832305908203125, -0.3875236511230469, -0.3767242431640625, -0.3659248352050781, -0.35512542724609375, -0.3443260192871094, -0.333526611328125, -0.3227272033691406, -0.31192779541015625, -0.3011283874511719, -0.2903289794921875, -0.2795295715332031, -0.26873016357421875, -0.2579307556152344, -0.24713134765625, -0.23633193969726562, -0.22553253173828125, -0.21473312377929688, -0.2039337158203125, -0.19313430786132812, -0.18233489990234375, -0.17153549194335938, -0.160736083984375, -0.14993667602539062, -0.13913726806640625, -0.12833786010742188, -0.1175384521484375, -0.10673904418945312, -0.09593963623046875, -0.08514022827148438, -0.0743408203125, -0.06354141235351562, -0.05274200439453125, -0.041942596435546875, -0.0311431884765625, -0.020343780517578125, -0.00954437255859375, 0.001255035400390625, 0.012054443359375, 0.022853851318359375, 0.03365325927734375, 0.044452667236328125, 0.0552520751953125, 0.06605148315429688, 0.07685089111328125, 0.08765029907226562, 0.09844970703125, 0.10924911499023438, 0.12004852294921875, 0.13084793090820312, 0.1416473388671875, 0.15244674682617188, 0.16324615478515625, 0.17404556274414062, 0.184844970703125, 0.19564437866210938, 0.20644378662109375, 0.21724319458007812, 0.2280426025390625, 0.23884201049804688, 0.24964141845703125, 0.2604408264160156, 0.271240234375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 6.0, 9.0, 12.0, 12.0, 23.0, 31.0, 28.0, 62.0, 127.0, 247.0, 2643.0, 467.0, 147.0, 81.0, 64.0, 35.0, 26.0, 14.0, 8.0, 9.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08331298828125, -0.07993602752685547, -0.07655906677246094, -0.0731821060180664, -0.06980514526367188, -0.06642818450927734, -0.06305122375488281, -0.05967426300048828, -0.05629730224609375, -0.05292034149169922, -0.04954338073730469, -0.046166419982910156, -0.042789459228515625, -0.039412498474121094, -0.03603553771972656, -0.03265857696533203, -0.0292816162109375, -0.02590465545654297, -0.022527694702148438, -0.019150733947753906, -0.015773773193359375, -0.012396812438964844, -0.009019851684570312, -0.005642890930175781, -0.00226593017578125, 0.0011110305786132812, 0.0044879913330078125, 0.007864952087402344, 0.011241912841796875, 0.014618873596191406, 0.017995834350585938, 0.02137279510498047, 0.024749755859375, 0.02812671661376953, 0.03150367736816406, 0.034880638122558594, 0.038257598876953125, 0.041634559631347656, 0.04501152038574219, 0.04838848114013672, 0.05176544189453125, 0.05514240264892578, 0.05851936340332031, 0.061896324157714844, 0.06527328491210938, 0.0686502456665039, 0.07202720642089844, 0.07540416717529297, 0.0787811279296875, 0.08215808868408203, 0.08553504943847656, 0.0889120101928711, 0.09228897094726562, 0.09566593170166016, 0.09904289245605469, 0.10241985321044922, 0.10579681396484375, 0.10917377471923828, 0.11255073547363281, 0.11592769622802734, 0.11930465698242188, 0.1226816177368164, 0.12605857849121094, 0.12943553924560547, 0.1328125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 57.0, 394.0, 465.0, 65.0, 16.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3852362632751465, -2.3208463191986084, -2.2564563751220703, -2.192066192626953, -2.127676248550415, -2.063286304473877, -1.9988962411880493, -1.9345061779022217, -1.8701162338256836, -1.8057262897491455, -1.7413362264633179, -1.6769461631774902, -1.6125562191009521, -1.548166275024414, -1.4837762117385864, -1.4193861484527588, -1.3549962043762207, -1.2906062602996826, -1.226216197013855, -1.1618261337280273, -1.0974361896514893, -1.0330462455749512, -0.9686561822891235, -0.9042661786079407, -0.8398761749267578, -0.775486171245575, -0.7110961675643921, -0.6467061638832092, -0.5823161602020264, -0.5179261565208435, -0.45353615283966064, -0.3891461491584778, -0.3247559070587158, -0.26036590337753296, -0.1959758996963501, -0.13158589601516724, -0.06719589233398438, -0.0028058886528015137, 0.06158411502838135, 0.1259741187095642, 0.19036412239074707, 0.25475412607192993, 0.3191441297531128, 0.38353413343429565, 0.4479241371154785, 0.5123141407966614, 0.5767041444778442, 0.6410941481590271, 0.70548415184021, 0.7698741555213928, 0.8342641592025757, 0.8986541628837585, 0.9630441665649414, 1.0274341106414795, 1.0918241739273071, 1.1562142372131348, 1.2206041812896729, 1.284994125366211, 1.3493841886520386, 1.4137742519378662, 1.4781641960144043, 1.5425541400909424, 1.60694420337677, 1.6713342666625977, 1.7357242107391357]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 8.0, 13.0, 10.0, 28.0, 23.0, 24.0, 24.0, 29.0, 47.0, 46.0, 61.0, 57.0, 61.0, 71.0, 65.0, 44.0, 55.0, 56.0, 54.0, 50.0, 44.0, 35.0, 25.0, 19.0, 16.0, 11.0, 5.0, 5.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3651965260505676, -0.3546462953090668, -0.34409603476524353, -0.3335458040237427, -0.32299554347991943, -0.3124453127384186, -0.3018950819969177, -0.2913448214530945, -0.28079459071159363, -0.2702443599700928, -0.25969409942626953, -0.24914386868476868, -0.23859362304210663, -0.22804337739944458, -0.21749314665794373, -0.20694290101528168, -0.19639265537261963, -0.18584240972995758, -0.17529216408729553, -0.16474193334579468, -0.15419168770313263, -0.14364144206047058, -0.13309121131896973, -0.12254096567630768, -0.11199072003364563, -0.10144047439098358, -0.09089023619890213, -0.08033999800682068, -0.06978975236415863, -0.05923951044678688, -0.04868926852941513, -0.03813903033733368, -0.02758878469467163, -0.01703854277729988, -0.006488300859928131, 0.004061941057443619, 0.014612182974815369, 0.02516242489218712, 0.03571266680955887, 0.04626290500164032, 0.05681315064430237, 0.06736339628696442, 0.07791363447904587, 0.08846387267112732, 0.09901411831378937, 0.10956436395645142, 0.12011460214853287, 0.13066484034061432, 0.14121508598327637, 0.15176533162593842, 0.16231557726860046, 0.17286580801010132, 0.18341605365276337, 0.19396629929542542, 0.20451653003692627, 0.21506677567958832, 0.22561702132225037, 0.23616726696491241, 0.24671751260757446, 0.2572677433490753, 0.26781797409057617, 0.2783682346343994, 0.28891846537590027, 0.2994686961174011, 0.31001895666122437]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 6.0, 7.0, 16.0, 23.0, 23.0, 43.0, 51.0, 56.0, 84.0, 104.0, 183.0, 219.0, 371.0, 531.0, 867.0, 1550.0, 3022.0, 7585.0, 28433.0, 161700.0, 642550.0, 158799.0, 27653.0, 7615.0, 2943.0, 1519.0, 820.0, 543.0, 383.0, 226.0, 179.0, 135.0, 88.0, 60.0, 46.0, 40.0, 26.0, 12.0, 10.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.31494140625, -0.30606842041015625, -0.2971954345703125, -0.28832244873046875, -0.279449462890625, -0.27057647705078125, -0.2617034912109375, -0.25283050537109375, -0.24395751953125, -0.23508453369140625, -0.2262115478515625, -0.21733856201171875, -0.208465576171875, -0.19959259033203125, -0.1907196044921875, -0.18184661865234375, -0.1729736328125, -0.16410064697265625, -0.1552276611328125, -0.14635467529296875, -0.137481689453125, -0.12860870361328125, -0.1197357177734375, -0.11086273193359375, -0.10198974609375, -0.09311676025390625, -0.0842437744140625, -0.07537078857421875, -0.066497802734375, -0.05762481689453125, -0.0487518310546875, -0.03987884521484375, -0.031005859375, -0.02213287353515625, -0.0132598876953125, -0.00438690185546875, 0.004486083984375, 0.01335906982421875, 0.0222320556640625, 0.03110504150390625, 0.03997802734375, 0.04885101318359375, 0.0577239990234375, 0.06659698486328125, 0.075469970703125, 0.08434295654296875, 0.0932159423828125, 0.10208892822265625, 0.1109619140625, 0.11983489990234375, 0.1287078857421875, 0.13758087158203125, 0.146453857421875, 0.15532684326171875, 0.1641998291015625, 0.17307281494140625, 0.18194580078125, 0.19081878662109375, 0.1996917724609375, 0.20856475830078125, 0.217437744140625, 0.22631072998046875, 0.2351837158203125, 0.24405670166015625, 0.2529296875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 14.0, 16.0, 51.0, 75.0, 103.0, 128.0, 125.0, 145.0, 136.0, 91.0, 42.0, 27.0, 14.0, 9.0, 3.0, 3.0, 2.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09063720703125, -0.08830022811889648, -0.08596324920654297, -0.08362627029418945, -0.08128929138183594, -0.07895231246948242, -0.0766153335571289, -0.07427835464477539, -0.07194137573242188, -0.06960439682006836, -0.06726741790771484, -0.06493043899536133, -0.06259346008300781, -0.0602564811706543, -0.05791950225830078, -0.055582523345947266, -0.05324554443359375, -0.050908565521240234, -0.04857158660888672, -0.0462346076965332, -0.04389762878417969, -0.04156064987182617, -0.039223670959472656, -0.03688669204711914, -0.034549713134765625, -0.03221273422241211, -0.029875755310058594, -0.027538776397705078, -0.025201797485351562, -0.022864818572998047, -0.02052783966064453, -0.018190860748291016, -0.0158538818359375, -0.013516902923583984, -0.011179924011230469, -0.008842945098876953, -0.0065059661865234375, -0.004168987274169922, -0.0018320083618164062, 0.0005049705505371094, 0.002841949462890625, 0.005178928375244141, 0.007515907287597656, 0.009852886199951172, 0.012189865112304688, 0.014526844024658203, 0.01686382293701172, 0.019200801849365234, 0.02153778076171875, 0.023874759674072266, 0.02621173858642578, 0.028548717498779297, 0.030885696411132812, 0.03322267532348633, 0.035559654235839844, 0.03789663314819336, 0.040233612060546875, 0.04257059097290039, 0.044907569885253906, 0.04724454879760742, 0.04958152770996094, 0.05191850662231445, 0.05425548553466797, 0.056592464447021484, 0.058929443359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 4.0, 4.0, 7.0, 11.0, 12.0, 22.0, 27.0, 56.0, 80.0, 114.0, 207.0, 315.0, 471.0, 817.0, 1391.0, 2362.0, 3832.0, 6920.0, 12609.0, 22556.0, 42987.0, 85359.0, 176835.0, 294668.0, 196539.0, 95582.0, 47371.0, 25184.0, 13828.0, 7634.0, 4271.0, 2511.0, 1482.0, 954.0, 546.0, 325.0, 225.0, 135.0, 80.0, 75.0, 45.0, 31.0, 25.0, 15.0, 12.0, 6.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.094970703125, -0.0920553207397461, -0.08913993835449219, -0.08622455596923828, -0.08330917358398438, -0.08039379119873047, -0.07747840881347656, -0.07456302642822266, -0.07164764404296875, -0.06873226165771484, -0.06581687927246094, -0.06290149688720703, -0.059986114501953125, -0.05707073211669922, -0.05415534973144531, -0.051239967346191406, -0.0483245849609375, -0.045409202575683594, -0.04249382019042969, -0.03957843780517578, -0.036663055419921875, -0.03374767303466797, -0.030832290649414062, -0.027916908264160156, -0.02500152587890625, -0.022086143493652344, -0.019170761108398438, -0.01625537872314453, -0.013339996337890625, -0.010424613952636719, -0.0075092315673828125, -0.004593849182128906, -0.001678466796875, 0.0012369155883789062, 0.0041522979736328125, 0.007067680358886719, 0.009983062744140625, 0.012898445129394531, 0.015813827514648438, 0.018729209899902344, 0.02164459228515625, 0.024559974670410156, 0.027475357055664062, 0.03039073944091797, 0.033306121826171875, 0.03622150421142578, 0.03913688659667969, 0.042052268981933594, 0.0449676513671875, 0.047883033752441406, 0.05079841613769531, 0.05371379852294922, 0.056629180908203125, 0.05954456329345703, 0.06245994567871094, 0.06537532806396484, 0.06829071044921875, 0.07120609283447266, 0.07412147521972656, 0.07703685760498047, 0.07995223999023438, 0.08286762237548828, 0.08578300476074219, 0.0886983871459961, 0.09161376953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 7.0, 15.0, 6.0, 19.0, 10.0, 26.0, 22.0, 15.0, 20.0, 22.0, 36.0, 42.0, 34.0, 36.0, 41.0, 48.0, 37.0, 43.0, 46.0, 38.0, 46.0, 55.0, 38.0, 43.0, 38.0, 33.0, 24.0, 30.0, 18.0, 19.0, 23.0, 18.0, 10.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 7.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1021728515625, -0.09841537475585938, -0.09465789794921875, -0.09090042114257812, -0.0871429443359375, -0.08338546752929688, -0.07962799072265625, -0.07587051391601562, -0.072113037109375, -0.06835556030273438, -0.06459808349609375, -0.060840606689453125, -0.0570831298828125, -0.053325653076171875, -0.04956817626953125, -0.045810699462890625, -0.04205322265625, -0.038295745849609375, -0.03453826904296875, -0.030780792236328125, -0.0270233154296875, -0.023265838623046875, -0.01950836181640625, -0.015750885009765625, -0.011993408203125, -0.008235931396484375, -0.00447845458984375, -0.000720977783203125, 0.0030364990234375, 0.006793975830078125, 0.01055145263671875, 0.014308929443359375, 0.01806640625, 0.021823883056640625, 0.02558135986328125, 0.029338836669921875, 0.0330963134765625, 0.036853790283203125, 0.04061126708984375, 0.044368743896484375, 0.048126220703125, 0.051883697509765625, 0.05564117431640625, 0.059398651123046875, 0.0631561279296875, 0.06691360473632812, 0.07067108154296875, 0.07442855834960938, 0.07818603515625, 0.08194351196289062, 0.08570098876953125, 0.08945846557617188, 0.0932159423828125, 0.09697341918945312, 0.10073089599609375, 0.10448837280273438, 0.108245849609375, 0.11200332641601562, 0.11576080322265625, 0.11951828002929688, 0.1232757568359375, 0.12703323364257812, 0.13079071044921875, 0.13454818725585938, 0.1383056640625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 3.0, 11.0, 16.0, 9.0, 19.0, 40.0, 62.0, 87.0, 158.0, 301.0, 570.0, 1181.0, 2992.0, 8815.0, 33301.0, 204506.0, 670549.0, 96334.0, 19595.0, 5895.0, 2172.0, 893.0, 475.0, 236.0, 119.0, 72.0, 47.0, 40.0, 15.0, 13.0, 9.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.075927734375, -0.07267189025878906, -0.06941604614257812, -0.06616020202636719, -0.06290435791015625, -0.05964851379394531, -0.056392669677734375, -0.05313682556152344, -0.0498809814453125, -0.04662513732910156, -0.043369293212890625, -0.04011344909667969, -0.03685760498046875, -0.03360176086425781, -0.030345916748046875, -0.027090072631835938, -0.023834228515625, -0.020578384399414062, -0.017322540283203125, -0.014066696166992188, -0.01081085205078125, -0.0075550079345703125, -0.004299163818359375, -0.0010433197021484375, 0.0022125244140625, 0.0054683685302734375, 0.008724212646484375, 0.011980056762695312, 0.01523590087890625, 0.018491744995117188, 0.021747589111328125, 0.025003433227539062, 0.02825927734375, 0.03151512145996094, 0.034770965576171875, 0.03802680969238281, 0.04128265380859375, 0.04453849792480469, 0.047794342041015625, 0.05105018615722656, 0.0543060302734375, 0.05756187438964844, 0.060817718505859375, 0.06407356262207031, 0.06732940673828125, 0.07058525085449219, 0.07384109497070312, 0.07709693908691406, 0.080352783203125, 0.08360862731933594, 0.08686447143554688, 0.09012031555175781, 0.09337615966796875, 0.09663200378417969, 0.09988784790039062, 0.10314369201660156, 0.1063995361328125, 0.10965538024902344, 0.11291122436523438, 0.11616706848144531, 0.11942291259765625, 0.12267875671386719, 0.12593460083007812, 0.12919044494628906, 0.1324462890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 8.0, 14.0, 19.0, 60.0, 80.0, 181.0, 276.0, 183.0, 74.0, 45.0, 19.0, 8.0, 8.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00013637542724609375, -0.00013203173875808716, -0.00012768805027008057, -0.00012334436178207397, -0.00011900067329406738, -0.00011465698480606079, -0.0001103132963180542, -0.00010596960783004761, -0.00010162591934204102, -9.728223085403442e-05, -9.293854236602783e-05, -8.859485387802124e-05, -8.425116539001465e-05, -7.990747690200806e-05, -7.556378841400146e-05, -7.122009992599487e-05, -6.687641143798828e-05, -6.253272294998169e-05, -5.81890344619751e-05, -5.3845345973968506e-05, -4.9501657485961914e-05, -4.515796899795532e-05, -4.081428050994873e-05, -3.647059202194214e-05, -3.212690353393555e-05, -2.7783215045928955e-05, -2.3439526557922363e-05, -1.909583806991577e-05, -1.475214958190918e-05, -1.0408461093902588e-05, -6.064772605895996e-06, -1.7210841178894043e-06, 2.6226043701171875e-06, 6.966292858123779e-06, 1.1309981346130371e-05, 1.5653669834136963e-05, 1.9997358322143555e-05, 2.4341046810150146e-05, 2.8684735298156738e-05, 3.302842378616333e-05, 3.737211227416992e-05, 4.1715800762176514e-05, 4.6059489250183105e-05, 5.04031777381897e-05, 5.474686622619629e-05, 5.909055471420288e-05, 6.343424320220947e-05, 6.777793169021606e-05, 7.212162017822266e-05, 7.646530866622925e-05, 8.080899715423584e-05, 8.515268564224243e-05, 8.949637413024902e-05, 9.384006261825562e-05, 9.818375110626221e-05, 0.0001025274395942688, 0.00010687112808227539, 0.00011121481657028198, 0.00011555850505828857, 0.00011990219354629517, 0.00012424588203430176, 0.00012858957052230835, 0.00013293325901031494, 0.00013727694749832153, 0.00014162063598632812]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 5.0, 10.0, 14.0, 19.0, 28.0, 43.0, 57.0, 88.0, 160.0, 246.0, 427.0, 696.0, 1112.0, 2080.0, 4020.0, 7668.0, 15953.0, 36602.0, 97546.0, 327136.0, 368748.0, 109698.0, 40599.0, 17611.0, 8323.0, 4258.0, 2244.0, 1256.0, 727.0, 433.0, 246.0, 157.0, 107.0, 66.0, 52.0, 33.0, 28.0, 14.0, 8.0, 10.0, 12.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050689697265625, -0.04900312423706055, -0.047316551208496094, -0.04562997817993164, -0.04394340515136719, -0.042256832122802734, -0.04057025909423828, -0.03888368606567383, -0.037197113037109375, -0.03551054000854492, -0.03382396697998047, -0.032137393951416016, -0.030450820922851562, -0.02876424789428711, -0.027077674865722656, -0.025391101837158203, -0.02370452880859375, -0.022017955780029297, -0.020331382751464844, -0.01864480972290039, -0.016958236694335938, -0.015271663665771484, -0.013585090637207031, -0.011898517608642578, -0.010211944580078125, -0.008525371551513672, -0.006838798522949219, -0.005152225494384766, -0.0034656524658203125, -0.0017790794372558594, -9.250640869140625e-05, 0.0015940666198730469, 0.0032806396484375, 0.004967212677001953, 0.006653785705566406, 0.00834035873413086, 0.010026931762695312, 0.011713504791259766, 0.013400077819824219, 0.015086650848388672, 0.016773223876953125, 0.018459796905517578, 0.02014636993408203, 0.021832942962646484, 0.023519515991210938, 0.02520608901977539, 0.026892662048339844, 0.028579235076904297, 0.03026580810546875, 0.0319523811340332, 0.033638954162597656, 0.03532552719116211, 0.03701210021972656, 0.038698673248291016, 0.04038524627685547, 0.04207181930541992, 0.043758392333984375, 0.04544496536254883, 0.04713153839111328, 0.048818111419677734, 0.05050468444824219, 0.05219125747680664, 0.053877830505371094, 0.05556440353393555, 0.0572509765625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 4.0, 8.0, 11.0, 13.0, 12.0, 8.0, 15.0, 18.0, 21.0, 32.0, 46.0, 54.0, 63.0, 87.0, 74.0, 82.0, 86.0, 70.0, 50.0, 55.0, 40.0, 39.0, 24.0, 23.0, 14.0, 10.0, 13.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07244873046875, -0.07020854949951172, -0.06796836853027344, -0.06572818756103516, -0.06348800659179688, -0.061247825622558594, -0.05900764465332031, -0.05676746368408203, -0.05452728271484375, -0.05228710174560547, -0.05004692077636719, -0.047806739807128906, -0.045566558837890625, -0.043326377868652344, -0.04108619689941406, -0.03884601593017578, -0.0366058349609375, -0.03436565399169922, -0.03212547302246094, -0.029885292053222656, -0.027645111083984375, -0.025404930114746094, -0.023164749145507812, -0.02092456817626953, -0.01868438720703125, -0.01644420623779297, -0.014204025268554688, -0.011963844299316406, -0.009723663330078125, -0.007483482360839844, -0.0052433013916015625, -0.0030031204223632812, -0.000762939453125, 0.0014772415161132812, 0.0037174224853515625, 0.005957603454589844, 0.008197784423828125, 0.010437965393066406, 0.012678146362304688, 0.014918327331542969, 0.01715850830078125, 0.01939868927001953, 0.021638870239257812, 0.023879051208496094, 0.026119232177734375, 0.028359413146972656, 0.030599594116210938, 0.03283977508544922, 0.0350799560546875, 0.03732013702392578, 0.03956031799316406, 0.041800498962402344, 0.044040679931640625, 0.046280860900878906, 0.04852104187011719, 0.05076122283935547, 0.05300140380859375, 0.05524158477783203, 0.05748176574707031, 0.059721946716308594, 0.061962127685546875, 0.06420230865478516, 0.06644248962402344, 0.06868267059326172, 0.0709228515625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 3.0, 15.0, 43.0, 93.0, 277.0, 352.0, 134.0, 48.0, 28.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4928957223892212, -1.4060356616973877, -1.3191754817962646, -1.2323154211044312, -1.145455241203308, -1.0585951805114746, -0.9717350602149963, -0.8848749399185181, -0.7980148196220398, -0.7111546993255615, -0.6242945790290833, -0.537434458732605, -0.4505743682384491, -0.3637142479419708, -0.27685415744781494, -0.18999403715133667, -0.1031339168548584, -0.016273804008960724, 0.07058630883693695, 0.15744641423225403, 0.2443065345287323, 0.33116665482521057, 0.41802674531936646, 0.5048868656158447, 0.591746985912323, 0.6786071062088013, 0.7654672265052795, 0.8523273468017578, 0.9391874074935913, 1.0260475873947144, 1.1129076480865479, 1.199767827987671, 1.286628007888794, 1.3734880685806274, 1.4603482484817505, 1.547208309173584, 1.634068489074707, 1.7209285497665405, 1.807788610458374, 1.894648790359497, 1.9815089702606201, 2.068369150161743, 2.155229091644287, 2.24208927154541, 2.328949451446533, 2.4158096313476562, 2.5026695728302, 2.5895297527313232, 2.676389694213867, 2.7632498741149902, 2.850109815597534, 2.9369699954986572, 3.0238301753997803, 3.1106903553009033, 3.1975502967834473, 3.2844104766845703, 3.3712706565856934, 3.4581308364868164, 3.5449907779693604, 3.6318509578704834, 3.7187111377716064, 3.8055713176727295, 3.8924312591552734, 3.9792914390563965, 4.0661516189575195]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 13.0, 8.0, 7.0, 9.0, 11.0, 17.0, 19.0, 12.0, 23.0, 25.0, 35.0, 42.0, 38.0, 41.0, 47.0, 50.0, 56.0, 48.0, 47.0, 48.0, 46.0, 57.0, 46.0, 45.0, 29.0, 31.0, 24.0, 28.0, 15.0, 19.0, 15.0, 15.0, 10.0, 9.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8184596300125122, -0.794048011302948, -0.7696363925933838, -0.7452247142791748, -0.7208130955696106, -0.6964014768600464, -0.6719898581504822, -0.647578239440918, -0.6231666207313538, -0.5987550020217896, -0.5743433833122253, -0.5499317646026611, -0.5255200862884521, -0.5011084675788879, -0.47669684886932373, -0.4522852301597595, -0.4278735816478729, -0.4034619629383087, -0.3790503144264221, -0.3546386957168579, -0.3302270770072937, -0.3058154582977295, -0.2814038097858429, -0.2569921910762787, -0.23258055746555328, -0.20816892385482788, -0.18375730514526367, -0.15934567153453827, -0.13493403792381287, -0.11052241921424866, -0.08611078560352325, -0.061699166893959045, -0.03728753328323364, -0.012875905260443687, 0.011535722762346268, 0.03594735264778137, 0.06035897880792618, 0.08477060496807098, 0.10918223857879639, 0.1335938572883606, 0.158005490899086, 0.1824171245098114, 0.2068287432193756, 0.231240376830101, 0.2556520104408264, 0.2800636291503906, 0.30447524785995483, 0.32888686656951904, 0.35329851508140564, 0.37771013379096985, 0.40212178230285645, 0.42653340101242065, 0.45094501972198486, 0.4753566384315491, 0.49976828694343567, 0.5241799354553223, 0.5485915541648865, 0.5730031728744507, 0.5974147915840149, 0.6218264102935791, 0.6462380886077881, 0.6706497073173523, 0.6950613260269165, 0.7194729447364807, 0.7438845634460449]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 10.0, 8.0, 12.0, 20.0, 23.0, 26.0, 28.0, 69.0, 92.0, 201.0, 402.0, 1001.0, 3476.0, 20633.0, 4096880.0, 62257.0, 6098.0, 1664.0, 625.0, 306.0, 138.0, 94.0, 63.0, 39.0, 27.0, 21.0, 25.0, 12.0, 5.0, 7.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.404541015625, -0.3932037353515625, -0.381866455078125, -0.3705291748046875, -0.35919189453125, -0.3478546142578125, -0.336517333984375, -0.3251800537109375, -0.3138427734375, -0.3025054931640625, -0.291168212890625, -0.2798309326171875, -0.26849365234375, -0.2571563720703125, -0.245819091796875, -0.2344818115234375, -0.22314453125, -0.2118072509765625, -0.200469970703125, -0.1891326904296875, -0.17779541015625, -0.1664581298828125, -0.155120849609375, -0.1437835693359375, -0.1324462890625, -0.1211090087890625, -0.109771728515625, -0.0984344482421875, -0.08709716796875, -0.0757598876953125, -0.064422607421875, -0.0530853271484375, -0.041748046875, -0.0304107666015625, -0.019073486328125, -0.0077362060546875, 0.00360107421875, 0.0149383544921875, 0.026275634765625, 0.0376129150390625, 0.0489501953125, 0.0602874755859375, 0.071624755859375, 0.0829620361328125, 0.09429931640625, 0.1056365966796875, 0.116973876953125, 0.1283111572265625, 0.1396484375, 0.1509857177734375, 0.162322998046875, 0.1736602783203125, 0.18499755859375, 0.1963348388671875, 0.207672119140625, 0.2190093994140625, 0.2303466796875, 0.2416839599609375, 0.253021240234375, 0.2643585205078125, 0.27569580078125, 0.2870330810546875, 0.298370361328125, 0.3097076416015625, 0.321044921875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 11.0, 12.0, 27.0, 49.0, 79.0, 101.0, 135.0, 141.0, 138.0, 116.0, 75.0, 47.0, 25.0, 17.0, 8.0, 3.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0914306640625, -0.08906269073486328, -0.08669471740722656, -0.08432674407958984, -0.08195877075195312, -0.0795907974243164, -0.07722282409667969, -0.07485485076904297, -0.07248687744140625, -0.07011890411376953, -0.06775093078613281, -0.0653829574584961, -0.06301498413085938, -0.060647010803222656, -0.05827903747558594, -0.05591106414794922, -0.0535430908203125, -0.05117511749267578, -0.04880714416503906, -0.046439170837402344, -0.044071197509765625, -0.041703224182128906, -0.03933525085449219, -0.03696727752685547, -0.03459930419921875, -0.03223133087158203, -0.029863357543945312, -0.027495384216308594, -0.025127410888671875, -0.022759437561035156, -0.020391464233398438, -0.01802349090576172, -0.015655517578125, -0.013287544250488281, -0.010919570922851562, -0.008551597595214844, -0.006183624267578125, -0.0038156509399414062, -0.0014476776123046875, 0.0009202957153320312, 0.00328826904296875, 0.005656242370605469, 0.008024215698242188, 0.010392189025878906, 0.012760162353515625, 0.015128135681152344, 0.017496109008789062, 0.01986408233642578, 0.0222320556640625, 0.02460002899169922, 0.026968002319335938, 0.029335975646972656, 0.031703948974609375, 0.034071922302246094, 0.03643989562988281, 0.03880786895751953, 0.04117584228515625, 0.04354381561279297, 0.04591178894042969, 0.048279762268066406, 0.050647735595703125, 0.053015708923339844, 0.05538368225097656, 0.05775165557861328, 0.06011962890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 9.0, 26.0, 30.0, 40.0, 84.0, 121.0, 212.0, 314.0, 593.0, 1135.0, 2692.0, 7286.0, 26544.0, 366148.0, 3733942.0, 39565.0, 9314.0, 3276.0, 1334.0, 679.0, 369.0, 199.0, 144.0, 88.0, 48.0, 27.0, 14.0, 15.0, 9.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.197265625, -0.19025039672851562, -0.18323516845703125, -0.17621994018554688, -0.1692047119140625, -0.16218948364257812, -0.15517425537109375, -0.14815902709960938, -0.141143798828125, -0.13412857055664062, -0.12711334228515625, -0.12009811401367188, -0.1130828857421875, -0.10606765747070312, -0.09905242919921875, -0.09203720092773438, -0.08502197265625, -0.07800674438476562, -0.07099151611328125, -0.06397628784179688, -0.0569610595703125, -0.049945831298828125, -0.04293060302734375, -0.035915374755859375, -0.028900146484375, -0.021884918212890625, -0.01486968994140625, -0.007854461669921875, -0.0008392333984375, 0.006175994873046875, 0.01319122314453125, 0.020206451416015625, 0.0272216796875, 0.034236907958984375, 0.04125213623046875, 0.048267364501953125, 0.0552825927734375, 0.062297821044921875, 0.06931304931640625, 0.07632827758789062, 0.083343505859375, 0.09035873413085938, 0.09737396240234375, 0.10438919067382812, 0.1114044189453125, 0.11841964721679688, 0.12543487548828125, 0.13245010375976562, 0.13946533203125, 0.14648056030273438, 0.15349578857421875, 0.16051101684570312, 0.1675262451171875, 0.17454147338867188, 0.18155670166015625, 0.18857192993164062, 0.195587158203125, 0.20260238647460938, 0.20961761474609375, 0.21663284301757812, 0.2236480712890625, 0.23066329956054688, 0.23767852783203125, 0.24469375610351562, 0.251708984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 3.0, 4.0, 7.0, 7.0, 7.0, 11.0, 12.0, 13.0, 31.0, 50.0, 92.0, 188.0, 2847.0, 498.0, 129.0, 64.0, 37.0, 14.0, 16.0, 15.0, 8.0, 4.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0843505859375, -0.08205747604370117, -0.07976436614990234, -0.07747125625610352, -0.07517814636230469, -0.07288503646850586, -0.07059192657470703, -0.0682988166809082, -0.06600570678710938, -0.06371259689331055, -0.06141948699951172, -0.05912637710571289, -0.05683326721191406, -0.054540157318115234, -0.052247047424316406, -0.04995393753051758, -0.04766082763671875, -0.04536771774291992, -0.043074607849121094, -0.040781497955322266, -0.03848838806152344, -0.03619527816772461, -0.03390216827392578, -0.03160905838012695, -0.029315948486328125, -0.027022838592529297, -0.02472972869873047, -0.02243661880493164, -0.020143508911132812, -0.017850399017333984, -0.015557289123535156, -0.013264179229736328, -0.0109710693359375, -0.008677959442138672, -0.006384849548339844, -0.004091739654541016, -0.0017986297607421875, 0.0004944801330566406, 0.0027875900268554688, 0.005080699920654297, 0.007373809814453125, 0.009666919708251953, 0.011960029602050781, 0.01425313949584961, 0.016546249389648438, 0.018839359283447266, 0.021132469177246094, 0.023425579071044922, 0.02571868896484375, 0.028011798858642578, 0.030304908752441406, 0.032598018646240234, 0.03489112854003906, 0.03718423843383789, 0.03947734832763672, 0.04177045822143555, 0.044063568115234375, 0.0463566780090332, 0.04864978790283203, 0.05094289779663086, 0.05323600769042969, 0.055529117584228516, 0.057822227478027344, 0.06011533737182617, 0.062408447265625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 10.0, 43.0, 134.0, 371.0, 312.0, 92.0, 21.0, 15.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8899651765823364, -0.8644610047340393, -0.8389568328857422, -0.8134527206420898, -0.7879485487937927, -0.7624443769454956, -0.7369402050971985, -0.7114360332489014, -0.685931921005249, -0.6604277491569519, -0.6349235773086548, -0.6094194650650024, -0.5839152932167053, -0.5584111213684082, -0.5329069495201111, -0.507402777671814, -0.48189860582351685, -0.4563944339752197, -0.430890291929245, -0.4053861200809479, -0.37988197803497314, -0.354377806186676, -0.3288736343383789, -0.3033694624900818, -0.27786532044410706, -0.25236114859580994, -0.2268570065498352, -0.20135283470153809, -0.17584867775440216, -0.15034452080726624, -0.12484034895896912, -0.09933619201183319, -0.07383203506469727, -0.04832787439227104, -0.022823713719844818, 0.002680450677871704, 0.02818460762500763, 0.053688764572143555, 0.07919293642044067, 0.1046970933675766, 0.13020125031471252, 0.15570540726184845, 0.18120956420898438, 0.2067137360572815, 0.23221789300441742, 0.25772204995155334, 0.28322622179985046, 0.3087303638458252, 0.3342345356941223, 0.35973870754241943, 0.38524284958839417, 0.4107470214366913, 0.436251163482666, 0.46175533533096313, 0.48725950717926025, 0.5127636790275574, 0.5382678508758545, 0.5637720227241516, 0.5892761945724487, 0.6147803068161011, 0.6402844786643982, 0.6657886505126953, 0.6912928223609924, 0.7167969942092896, 0.7423011064529419]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 11.0, 6.0, 10.0, 24.0, 19.0, 24.0, 20.0, 20.0, 36.0, 28.0, 20.0, 43.0, 37.0, 38.0, 38.0, 52.0, 47.0, 49.0, 22.0, 38.0, 39.0, 39.0, 41.0, 49.0, 32.0, 24.0, 23.0, 27.0, 13.0, 19.0, 16.0, 14.0, 12.0, 12.0, 6.0, 9.0, 5.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.15403872728347778, -0.14933548867702484, -0.1446322500705719, -0.13992901146411896, -0.13522577285766602, -0.13052251935005188, -0.12581928074359894, -0.121116042137146, -0.11641280353069305, -0.11170956492424011, -0.10700632631778717, -0.10230308026075363, -0.09759984165430069, -0.09289660304784775, -0.08819335699081421, -0.08349011838436127, -0.07878687977790833, -0.07408364117145538, -0.06938040256500244, -0.0646771565079689, -0.05997391790151596, -0.05527067929506302, -0.05056743696331978, -0.04586419463157654, -0.041160956025123596, -0.036457717418670654, -0.031754475086927414, -0.027051234617829323, -0.02234799414873123, -0.01764475367963314, -0.01294151321053505, -0.008238270878791809, -0.003535032272338867, 0.001168208196759224, 0.005871448665857315, 0.010574689134955406, 0.015277929604053497, 0.01998117007315159, 0.02468441054224968, 0.02938765287399292, 0.03409089148044586, 0.038794130086898804, 0.043497372418642044, 0.048200614750385284, 0.052903853356838226, 0.05760709196329117, 0.06231033429503441, 0.06701357662677765, 0.07171681523323059, 0.07642005383968353, 0.08112329244613647, 0.08582653850317001, 0.09052977710962296, 0.0952330157160759, 0.09993626177310944, 0.10463950037956238, 0.10934273898601532, 0.11404597759246826, 0.1187492161989212, 0.12345246225595474, 0.12815570831298828, 0.13285894691944122, 0.13756218552589417, 0.1422654241323471, 0.14696866273880005]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 7.0, 8.0, 14.0, 7.0, 22.0, 22.0, 38.0, 34.0, 64.0, 86.0, 99.0, 154.0, 168.0, 271.0, 384.0, 572.0, 862.0, 1462.0, 2846.0, 7188.0, 24378.0, 116452.0, 588543.0, 241384.0, 43258.0, 11338.0, 3969.0, 1755.0, 1029.0, 582.0, 429.0, 267.0, 215.0, 162.0, 110.0, 77.0, 65.0, 59.0, 35.0, 41.0, 20.0, 17.0, 22.0, 11.0, 10.0, 10.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2291259765625, -0.22189712524414062, -0.21466827392578125, -0.20743942260742188, -0.2002105712890625, -0.19298171997070312, -0.18575286865234375, -0.17852401733398438, -0.171295166015625, -0.16406631469726562, -0.15683746337890625, -0.14960861206054688, -0.1423797607421875, -0.13515090942382812, -0.12792205810546875, -0.12069320678710938, -0.11346435546875, -0.10623550415039062, -0.09900665283203125, -0.09177780151367188, -0.0845489501953125, -0.07732009887695312, -0.07009124755859375, -0.06286239624023438, -0.055633544921875, -0.048404693603515625, -0.04117584228515625, -0.033946990966796875, -0.0267181396484375, -0.019489288330078125, -0.01226043701171875, -0.005031585693359375, 0.002197265625, 0.009426116943359375, 0.01665496826171875, 0.023883819580078125, 0.0311126708984375, 0.038341522216796875, 0.04557037353515625, 0.052799224853515625, 0.060028076171875, 0.06725692749023438, 0.07448577880859375, 0.08171463012695312, 0.0889434814453125, 0.09617233276367188, 0.10340118408203125, 0.11063003540039062, 0.11785888671875, 0.12508773803710938, 0.13231658935546875, 0.13954544067382812, 0.1467742919921875, 0.15400314331054688, 0.16123199462890625, 0.16846084594726562, 0.175689697265625, 0.18291854858398438, 0.19014739990234375, 0.19737625122070312, 0.2046051025390625, 0.21183395385742188, 0.21906280517578125, 0.22629165649414062, 0.2335205078125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 13.0, 19.0, 38.0, 63.0, 91.0, 116.0, 137.0, 134.0, 138.0, 95.0, 62.0, 35.0, 18.0, 19.0, 4.0, 4.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08843994140625, -0.08612203598022461, -0.08380413055419922, -0.08148622512817383, -0.07916831970214844, -0.07685041427612305, -0.07453250885009766, -0.07221460342407227, -0.06989669799804688, -0.06757879257202148, -0.0652608871459961, -0.0629429817199707, -0.06062507629394531, -0.05830717086791992, -0.05598926544189453, -0.05367136001586914, -0.05135345458984375, -0.04903554916381836, -0.04671764373779297, -0.04439973831176758, -0.04208183288574219, -0.0397639274597168, -0.037446022033691406, -0.035128116607666016, -0.032810211181640625, -0.030492305755615234, -0.028174400329589844, -0.025856494903564453, -0.023538589477539062, -0.021220684051513672, -0.01890277862548828, -0.01658487319946289, -0.0142669677734375, -0.01194906234741211, -0.009631156921386719, -0.007313251495361328, -0.0049953460693359375, -0.002677440643310547, -0.00035953521728515625, 0.0019583702087402344, 0.004276275634765625, 0.006594181060791016, 0.008912086486816406, 0.011229991912841797, 0.013547897338867188, 0.015865802764892578, 0.01818370819091797, 0.02050161361694336, 0.02281951904296875, 0.02513742446899414, 0.02745532989501953, 0.029773235321044922, 0.03209114074707031, 0.0344090461730957, 0.036726951599121094, 0.039044857025146484, 0.041362762451171875, 0.043680667877197266, 0.045998573303222656, 0.04831647872924805, 0.05063438415527344, 0.05295228958129883, 0.05527019500732422, 0.05758810043334961, 0.059906005859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 10.0, 7.0, 15.0, 27.0, 37.0, 63.0, 112.0, 221.0, 384.0, 727.0, 1525.0, 3189.0, 7215.0, 17643.0, 47374.0, 140784.0, 417914.0, 274596.0, 84965.0, 30264.0, 11866.0, 5040.0, 2231.0, 1060.0, 570.0, 306.0, 157.0, 99.0, 44.0, 39.0, 16.0, 15.0, 7.0, 10.0, 3.0, 5.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11492919921875, -0.1110696792602539, -0.10721015930175781, -0.10335063934326172, -0.09949111938476562, -0.09563159942626953, -0.09177207946777344, -0.08791255950927734, -0.08405303955078125, -0.08019351959228516, -0.07633399963378906, -0.07247447967529297, -0.06861495971679688, -0.06475543975830078, -0.06089591979980469, -0.057036399841308594, -0.0531768798828125, -0.049317359924316406, -0.04545783996582031, -0.04159832000732422, -0.037738800048828125, -0.03387928009033203, -0.030019760131835938, -0.026160240173339844, -0.02230072021484375, -0.018441200256347656, -0.014581680297851562, -0.010722160339355469, -0.006862640380859375, -0.0030031204223632812, 0.0008563995361328125, 0.004715919494628906, 0.008575439453125, 0.012434959411621094, 0.016294479370117188, 0.02015399932861328, 0.024013519287109375, 0.02787303924560547, 0.03173255920410156, 0.035592079162597656, 0.03945159912109375, 0.043311119079589844, 0.04717063903808594, 0.05103015899658203, 0.054889678955078125, 0.05874919891357422, 0.06260871887207031, 0.0664682388305664, 0.0703277587890625, 0.0741872787475586, 0.07804679870605469, 0.08190631866455078, 0.08576583862304688, 0.08962535858154297, 0.09348487854003906, 0.09734439849853516, 0.10120391845703125, 0.10506343841552734, 0.10892295837402344, 0.11278247833251953, 0.11664199829101562, 0.12050151824951172, 0.12436103820800781, 0.1282205581665039, 0.132080078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 1.0, 4.0, 16.0, 15.0, 12.0, 16.0, 12.0, 15.0, 25.0, 23.0, 28.0, 41.0, 38.0, 36.0, 51.0, 52.0, 30.0, 32.0, 40.0, 53.0, 53.0, 32.0, 51.0, 25.0, 35.0, 25.0, 48.0, 29.0, 23.0, 25.0, 23.0, 14.0, 18.0, 7.0, 7.0, 10.0, 5.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1156005859375, -0.11217594146728516, -0.10875129699707031, -0.10532665252685547, -0.10190200805664062, -0.09847736358642578, -0.09505271911621094, -0.0916280746459961, -0.08820343017578125, -0.0847787857055664, -0.08135414123535156, -0.07792949676513672, -0.07450485229492188, -0.07108020782470703, -0.06765556335449219, -0.06423091888427734, -0.0608062744140625, -0.057381629943847656, -0.05395698547363281, -0.05053234100341797, -0.047107696533203125, -0.04368305206298828, -0.04025840759277344, -0.036833763122558594, -0.03340911865234375, -0.029984474182128906, -0.026559829711914062, -0.02313518524169922, -0.019710540771484375, -0.01628589630126953, -0.012861251831054688, -0.009436607360839844, -0.006011962890625, -0.0025873184204101562, 0.0008373260498046875, 0.004261970520019531, 0.007686614990234375, 0.011111259460449219, 0.014535903930664062, 0.017960548400878906, 0.02138519287109375, 0.024809837341308594, 0.028234481811523438, 0.03165912628173828, 0.035083770751953125, 0.03850841522216797, 0.04193305969238281, 0.045357704162597656, 0.0487823486328125, 0.052206993103027344, 0.05563163757324219, 0.05905628204345703, 0.062480926513671875, 0.06590557098388672, 0.06933021545410156, 0.0727548599243164, 0.07617950439453125, 0.0796041488647461, 0.08302879333496094, 0.08645343780517578, 0.08987808227539062, 0.09330272674560547, 0.09672737121582031, 0.10015201568603516, 0.10357666015625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 5.0, 6.0, 16.0, 17.0, 23.0, 38.0, 65.0, 115.0, 194.0, 350.0, 841.0, 2121.0, 6168.0, 22295.0, 107091.0, 609580.0, 241506.0, 41977.0, 10547.0, 3248.0, 1181.0, 529.0, 294.0, 119.0, 87.0, 57.0, 28.0, 16.0, 21.0, 8.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.090576171875, -0.0884556770324707, -0.0863351821899414, -0.08421468734741211, -0.08209419250488281, -0.07997369766235352, -0.07785320281982422, -0.07573270797729492, -0.07361221313476562, -0.07149171829223633, -0.06937122344970703, -0.06725072860717773, -0.06513023376464844, -0.06300973892211914, -0.060889244079589844, -0.05876874923706055, -0.05664825439453125, -0.05452775955200195, -0.052407264709472656, -0.05028676986694336, -0.04816627502441406, -0.046045780181884766, -0.04392528533935547, -0.04180479049682617, -0.039684295654296875, -0.03756380081176758, -0.03544330596923828, -0.033322811126708984, -0.031202316284179688, -0.02908182144165039, -0.026961326599121094, -0.024840831756591797, -0.0227203369140625, -0.020599842071533203, -0.018479347229003906, -0.01635885238647461, -0.014238357543945312, -0.012117862701416016, -0.009997367858886719, -0.007876873016357422, -0.005756378173828125, -0.003635883331298828, -0.0015153884887695312, 0.0006051063537597656, 0.0027256011962890625, 0.004846096038818359, 0.006966590881347656, 0.009087085723876953, 0.01120758056640625, 0.013328075408935547, 0.015448570251464844, 0.01756906509399414, 0.019689559936523438, 0.021810054779052734, 0.02393054962158203, 0.026051044464111328, 0.028171539306640625, 0.030292034149169922, 0.03241252899169922, 0.034533023834228516, 0.03665351867675781, 0.03877401351928711, 0.040894508361816406, 0.0430150032043457, 0.045135498046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 7.0, 7.0, 16.0, 10.0, 50.0, 74.0, 163.0, 270.0, 200.0, 90.0, 45.0, 20.0, 11.0, 4.0, 10.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18235969543457e-05, -6.849970668554306e-05, -6.517581641674042e-05, -6.185192614793777e-05, -5.852803587913513e-05, -5.520414561033249e-05, -5.1880255341529846e-05, -4.85563650727272e-05, -4.523247480392456e-05, -4.190858453512192e-05, -3.8584694266319275e-05, -3.526080399751663e-05, -3.193691372871399e-05, -2.8613023459911346e-05, -2.5289133191108704e-05, -2.196524292230606e-05, -1.8641352653503418e-05, -1.5317462384700775e-05, -1.1993572115898132e-05, -8.66968184709549e-06, -5.345791578292847e-06, -2.021901309490204e-06, 1.301988959312439e-06, 4.625879228115082e-06, 7.949769496917725e-06, 1.1273659765720367e-05, 1.459755003452301e-05, 1.7921440303325653e-05, 2.1245330572128296e-05, 2.456922084093094e-05, 2.789311110973358e-05, 3.1217001378536224e-05, 3.454089164733887e-05, 3.786478191614151e-05, 4.118867218494415e-05, 4.4512562453746796e-05, 4.783645272254944e-05, 5.116034299135208e-05, 5.4484233260154724e-05, 5.780812352895737e-05, 6.113201379776001e-05, 6.445590406656265e-05, 6.77797943353653e-05, 7.110368460416794e-05, 7.442757487297058e-05, 7.775146514177322e-05, 8.107535541057587e-05, 8.439924567937851e-05, 8.772313594818115e-05, 9.10470262169838e-05, 9.437091648578644e-05, 9.769480675458908e-05, 0.00010101869702339172, 0.00010434258729219437, 0.00010766647756099701, 0.00011099036782979965, 0.0001143142580986023, 0.00011763814836740494, 0.00012096203863620758, 0.00012428592890501022, 0.00012760981917381287, 0.0001309337094426155, 0.00013425759971141815, 0.0001375814899802208, 0.00014090538024902344]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 3.0, 8.0, 19.0, 32.0, 41.0, 80.0, 158.0, 322.0, 739.0, 1767.0, 4762.0, 16510.0, 88362.0, 622328.0, 263127.0, 36712.0, 8731.0, 2757.0, 1105.0, 485.0, 219.0, 134.0, 73.0, 31.0, 17.0, 14.0, 9.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083251953125, -0.08110380172729492, -0.07895565032958984, -0.07680749893188477, -0.07465934753417969, -0.07251119613647461, -0.07036304473876953, -0.06821489334106445, -0.06606674194335938, -0.0639185905456543, -0.06177043914794922, -0.05962228775024414, -0.05747413635253906, -0.055325984954833984, -0.053177833557128906, -0.05102968215942383, -0.04888153076171875, -0.04673337936401367, -0.044585227966308594, -0.042437076568603516, -0.04028892517089844, -0.03814077377319336, -0.03599262237548828, -0.0338444709777832, -0.031696319580078125, -0.029548168182373047, -0.02740001678466797, -0.02525186538696289, -0.023103713989257812, -0.020955562591552734, -0.018807411193847656, -0.016659259796142578, -0.0145111083984375, -0.012362957000732422, -0.010214805603027344, -0.008066654205322266, -0.0059185028076171875, -0.0037703514099121094, -0.0016222000122070312, 0.0005259513854980469, 0.002674102783203125, 0.004822254180908203, 0.006970405578613281, 0.00911855697631836, 0.011266708374023438, 0.013414859771728516, 0.015563011169433594, 0.017711162567138672, 0.01985931396484375, 0.022007465362548828, 0.024155616760253906, 0.026303768157958984, 0.028451919555664062, 0.03060007095336914, 0.03274822235107422, 0.0348963737487793, 0.037044525146484375, 0.03919267654418945, 0.04134082794189453, 0.04348897933959961, 0.04563713073730469, 0.047785282135009766, 0.049933433532714844, 0.05208158493041992, 0.054229736328125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 3.0, 5.0, 7.0, 4.0, 10.0, 5.0, 17.0, 25.0, 39.0, 33.0, 53.0, 71.0, 96.0, 83.0, 79.0, 90.0, 68.0, 63.0, 65.0, 34.0, 43.0, 31.0, 22.0, 12.0, 9.0, 6.0, 8.0, 5.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0491943359375, -0.04763984680175781, -0.046085357666015625, -0.04453086853027344, -0.04297637939453125, -0.04142189025878906, -0.039867401123046875, -0.03831291198730469, -0.0367584228515625, -0.03520393371582031, -0.033649444580078125, -0.03209495544433594, -0.03054046630859375, -0.028985977172851562, -0.027431488037109375, -0.025876998901367188, -0.024322509765625, -0.022768020629882812, -0.021213531494140625, -0.019659042358398438, -0.01810455322265625, -0.016550064086914062, -0.014995574951171875, -0.013441085815429688, -0.0118865966796875, -0.010332107543945312, -0.008777618408203125, -0.0072231292724609375, -0.00566864013671875, -0.0041141510009765625, -0.002559661865234375, -0.0010051727294921875, 0.00054931640625, 0.0021038055419921875, 0.003658294677734375, 0.0052127838134765625, 0.00676727294921875, 0.008321762084960938, 0.009876251220703125, 0.011430740356445312, 0.0129852294921875, 0.014539718627929688, 0.016094207763671875, 0.017648696899414062, 0.01920318603515625, 0.020757675170898438, 0.022312164306640625, 0.023866653442382812, 0.025421142578125, 0.026975631713867188, 0.028530120849609375, 0.030084609985351562, 0.03163909912109375, 0.03319358825683594, 0.034748077392578125, 0.03630256652832031, 0.0378570556640625, 0.03941154479980469, 0.040966033935546875, 0.04252052307128906, 0.04407501220703125, 0.04562950134277344, 0.047183990478515625, 0.04873847961425781, 0.05029296875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 9.0, 30.0, 87.0, 244.0, 390.0, 152.0, 63.0, 23.0, 8.0, 4.0, 0.0, 0.0, 3.0], "bins": [-4.071187973022461, -3.997525691986084, -3.923863410949707, -3.850201368331909, -3.7765390872955322, -3.7028768062591553, -3.6292145252227783, -3.5555522441864014, -3.4818902015686035, -3.4082279205322266, -3.3345656394958496, -3.2609035968780518, -3.187241315841675, -3.113579034805298, -3.039916753768921, -2.966254472732544, -2.892592191696167, -2.81892991065979, -2.745267629623413, -2.6716055870056152, -2.5979433059692383, -2.5242810249328613, -2.4506187438964844, -2.3769564628601074, -2.3032941818237305, -2.2296319007873535, -2.1559696197509766, -2.0823075771331787, -2.0086452960968018, -1.9349830150604248, -1.8613207340240479, -1.787658452987671, -1.713996171951294, -1.640333890914917, -1.5666717290878296, -1.4930094480514526, -1.4193472862243652, -1.3456850051879883, -1.2720227241516113, -1.1983604431152344, -1.1246984004974365, -1.0510361194610596, -0.9773739576339722, -0.9037116765975952, -0.830049455165863, -0.7563872337341309, -0.6827249526977539, -0.6090627312660217, -0.5354004502296448, -0.4617382287979126, -0.38807597756385803, -0.31441372632980347, -0.2407515048980713, -0.1670892834663391, -0.09342703223228455, -0.01976478099822998, 0.0538974404335022, 0.12755967676639557, 0.20122191309928894, 0.2748841643333435, 0.3485463857650757, 0.42220860719680786, 0.4958708584308624, 0.569533109664917, 0.6431953310966492]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 4.0, 8.0, 12.0, 14.0, 10.0, 17.0, 18.0, 18.0, 28.0, 21.0, 26.0, 32.0, 30.0, 26.0, 32.0, 33.0, 43.0, 46.0, 59.0, 45.0, 37.0, 51.0, 37.0, 34.0, 51.0, 43.0, 33.0, 29.0, 18.0, 22.0, 18.0, 16.0, 18.0, 12.0, 9.0, 9.0, 8.0, 8.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5050162076950073, -0.487313836812973, -0.46961143612861633, -0.45190906524658203, -0.43420666456222534, -0.41650429368019104, -0.39880192279815674, -0.38109952211380005, -0.36339715123176575, -0.34569478034973145, -0.32799237966537476, -0.31029000878334045, -0.29258763790130615, -0.27488523721694946, -0.25718286633491516, -0.23948048055171967, -0.22177809476852417, -0.20407570898532867, -0.18637332320213318, -0.16867095232009888, -0.15096856653690338, -0.13326618075370789, -0.11556380242109299, -0.09786142408847809, -0.08015903830528259, -0.062456656247377396, -0.0447542741894722, -0.027051892131567, -0.009349510073661804, 0.008352875709533691, 0.02605525404214859, 0.04375763237476349, 0.06146007776260376, 0.07916246354579926, 0.09686484187841415, 0.11456722021102905, 0.13226960599422455, 0.14997199177742004, 0.16767436265945435, 0.18537674844264984, 0.20307913422584534, 0.22078152000904083, 0.23848390579223633, 0.25618627667427063, 0.27388864755630493, 0.2915910482406616, 0.3092934191226959, 0.3269957900047302, 0.3446981906890869, 0.3624005615711212, 0.3801029622554779, 0.3978053331375122, 0.4155077338218689, 0.4332101047039032, 0.4509124755859375, 0.4686148762702942, 0.4863172471523285, 0.5040196180343628, 0.5217220187187195, 0.5394244194030762, 0.5571267604827881, 0.5748291611671448, 0.5925315618515015, 0.6102339029312134, 0.6279363036155701]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 2.0, 6.0, 7.0, 5.0, 7.0, 15.0, 13.0, 21.0, 32.0, 34.0, 86.0, 153.0, 276.0, 605.0, 1746.0, 7285.0, 447195.0, 3725286.0, 8180.0, 1897.0, 670.0, 318.0, 164.0, 85.0, 63.0, 32.0, 31.0, 19.0, 14.0, 11.0, 6.0, 5.0, 5.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.47900390625, -0.4670372009277344, -0.45507049560546875, -0.4431037902832031, -0.4311370849609375, -0.4191703796386719, -0.40720367431640625, -0.3952369689941406, -0.383270263671875, -0.3713035583496094, -0.35933685302734375, -0.3473701477050781, -0.3354034423828125, -0.3234367370605469, -0.31147003173828125, -0.2995033264160156, -0.28753662109375, -0.2755699157714844, -0.26360321044921875, -0.2516365051269531, -0.2396697998046875, -0.22770309448242188, -0.21573638916015625, -0.20376968383789062, -0.191802978515625, -0.17983627319335938, -0.16786956787109375, -0.15590286254882812, -0.1439361572265625, -0.13196945190429688, -0.12000274658203125, -0.10803604125976562, -0.0960693359375, -0.08410263061523438, -0.07213592529296875, -0.060169219970703125, -0.0482025146484375, -0.036235809326171875, -0.02426910400390625, -0.012302398681640625, -0.000335693359375, 0.011631011962890625, 0.02359771728515625, 0.035564422607421875, 0.0475311279296875, 0.059497833251953125, 0.07146453857421875, 0.08343124389648438, 0.09539794921875, 0.10736465454101562, 0.11933135986328125, 0.13129806518554688, 0.1432647705078125, 0.15523147583007812, 0.16719818115234375, 0.17916488647460938, 0.191131591796875, 0.20309829711914062, 0.21506500244140625, 0.22703170776367188, 0.2389984130859375, 0.2509651184082031, 0.26293182373046875, 0.2748985290527344, 0.286865234375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 10.0, 16.0, 33.0, 62.0, 92.0, 112.0, 128.0, 135.0, 152.0, 97.0, 70.0, 40.0, 17.0, 11.0, 10.0, 1.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09674072265625, -0.09427833557128906, -0.09181594848632812, -0.08935356140136719, -0.08689117431640625, -0.08442878723144531, -0.08196640014648438, -0.07950401306152344, -0.0770416259765625, -0.07457923889160156, -0.07211685180664062, -0.06965446472167969, -0.06719207763671875, -0.06472969055175781, -0.062267303466796875, -0.05980491638183594, -0.057342529296875, -0.05488014221191406, -0.052417755126953125, -0.04995536804199219, -0.04749298095703125, -0.04503059387207031, -0.042568206787109375, -0.04010581970214844, -0.0376434326171875, -0.03518104553222656, -0.032718658447265625, -0.030256271362304688, -0.02779388427734375, -0.025331497192382812, -0.022869110107421875, -0.020406723022460938, -0.0179443359375, -0.015481948852539062, -0.013019561767578125, -0.010557174682617188, -0.00809478759765625, -0.0056324005126953125, -0.003170013427734375, -0.0007076263427734375, 0.0017547607421875, 0.0042171478271484375, 0.006679534912109375, 0.009141921997070312, 0.01160430908203125, 0.014066696166992188, 0.016529083251953125, 0.018991470336914062, 0.021453857421875, 0.023916244506835938, 0.026378631591796875, 0.028841018676757812, 0.03130340576171875, 0.03376579284667969, 0.036228179931640625, 0.03869056701660156, 0.0411529541015625, 0.04361534118652344, 0.046077728271484375, 0.04854011535644531, 0.05100250244140625, 0.05346488952636719, 0.055927276611328125, 0.05838966369628906, 0.06085205078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 9.0, 6.0, 12.0, 10.0, 24.0, 43.0, 51.0, 86.0, 181.0, 339.0, 564.0, 1320.0, 2867.0, 7462.0, 24597.0, 173783.0, 3896289.0, 63140.0, 14534.0, 4827.0, 2004.0, 932.0, 517.0, 276.0, 164.0, 88.0, 62.0, 24.0, 23.0, 20.0, 10.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177734375, -0.1723957061767578, -0.16705703735351562, -0.16171836853027344, -0.15637969970703125, -0.15104103088378906, -0.14570236206054688, -0.1403636932373047, -0.1350250244140625, -0.1296863555908203, -0.12434768676757812, -0.11900901794433594, -0.11367034912109375, -0.10833168029785156, -0.10299301147460938, -0.09765434265136719, -0.092315673828125, -0.08697700500488281, -0.08163833618164062, -0.07629966735839844, -0.07096099853515625, -0.06562232971191406, -0.060283660888671875, -0.05494499206542969, -0.0496063232421875, -0.04426765441894531, -0.038928985595703125, -0.03359031677246094, -0.02825164794921875, -0.022912979125976562, -0.017574310302734375, -0.012235641479492188, -0.00689697265625, -0.0015583038330078125, 0.003780364990234375, 0.009119033813476562, 0.01445770263671875, 0.019796371459960938, 0.025135040283203125, 0.030473709106445312, 0.0358123779296875, 0.04115104675292969, 0.046489715576171875, 0.05182838439941406, 0.05716705322265625, 0.06250572204589844, 0.06784439086914062, 0.07318305969238281, 0.078521728515625, 0.08386039733886719, 0.08919906616210938, 0.09453773498535156, 0.09987640380859375, 0.10521507263183594, 0.11055374145507812, 0.11589241027832031, 0.1212310791015625, 0.1265697479248047, 0.13190841674804688, 0.13724708557128906, 0.14258575439453125, 0.14792442321777344, 0.15326309204101562, 0.1586017608642578, 0.1639404296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 12.0, 11.0, 7.0, 20.0, 20.0, 47.0, 81.0, 198.0, 2871.0, 516.0, 106.0, 59.0, 32.0, 28.0, 12.0, 18.0, 8.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0606689453125, -0.05821514129638672, -0.05576133728027344, -0.053307533264160156, -0.050853729248046875, -0.048399925231933594, -0.04594612121582031, -0.04349231719970703, -0.04103851318359375, -0.03858470916748047, -0.03613090515136719, -0.033677101135253906, -0.031223297119140625, -0.028769493103027344, -0.026315689086914062, -0.02386188507080078, -0.0214080810546875, -0.01895427703857422, -0.016500473022460938, -0.014046669006347656, -0.011592864990234375, -0.009139060974121094, -0.0066852569580078125, -0.004231452941894531, -0.00177764892578125, 0.0006761550903320312, 0.0031299591064453125, 0.005583763122558594, 0.008037567138671875, 0.010491371154785156, 0.012945175170898438, 0.015398979187011719, 0.017852783203125, 0.02030658721923828, 0.022760391235351562, 0.025214195251464844, 0.027667999267578125, 0.030121803283691406, 0.03257560729980469, 0.03502941131591797, 0.03748321533203125, 0.03993701934814453, 0.04239082336425781, 0.044844627380371094, 0.047298431396484375, 0.049752235412597656, 0.05220603942871094, 0.05465984344482422, 0.0571136474609375, 0.05956745147705078, 0.06202125549316406, 0.06447505950927734, 0.06692886352539062, 0.0693826675415039, 0.07183647155761719, 0.07429027557373047, 0.07674407958984375, 0.07919788360595703, 0.08165168762207031, 0.0841054916381836, 0.08655929565429688, 0.08901309967041016, 0.09146690368652344, 0.09392070770263672, 0.09637451171875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 46.0, 298.0, 506.0, 112.0, 28.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38780465722084045, -0.353226900100708, -0.31864914298057556, -0.2840713858604431, -0.24949364364147186, -0.21491588652133942, -0.18033814430236816, -0.14576038718223572, -0.11118263006210327, -0.07660487294197083, -0.042027123272418976, -0.0074493736028671265, 0.02712838351726532, 0.061706140637397766, 0.09628388285636902, 0.13086163997650146, 0.1654393970966339, 0.20001715421676636, 0.2345949113368988, 0.26917266845703125, 0.3037503957748413, 0.33832818269729614, 0.3729059100151062, 0.40748366713523865, 0.4420614242553711, 0.47663918137550354, 0.511216938495636, 0.545794665813446, 0.5803724527359009, 0.6149501800537109, 0.649527907371521, 0.6841056942939758, 0.7186833620071411, 0.7532610893249512, 0.787838876247406, 0.8224166035652161, 0.8569943904876709, 0.891572117805481, 0.926149845123291, 0.9607276320457458, 0.9953054189682007, 1.0298831462860107, 1.0644608736038208, 1.0990387201309204, 1.1336164474487305, 1.1681941747665405, 1.2027719020843506, 1.2373497486114502, 1.2719273567199707, 1.3065050840377808, 1.3410828113555908, 1.3756606578826904, 1.4102383852005005, 1.4448161125183105, 1.4793938398361206, 1.5139715671539307, 1.5485494136810303, 1.5831271409988403, 1.6177048683166504, 1.65228271484375, 1.68686044216156, 1.7214381694793701, 1.7560158967971802, 1.7905936241149902, 1.8251714706420898]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 11.0, 7.0, 10.0, 12.0, 22.0, 28.0, 24.0, 41.0, 55.0, 61.0, 67.0, 75.0, 64.0, 67.0, 59.0, 89.0, 62.0, 55.0, 54.0, 28.0, 29.0, 21.0, 18.0, 13.0, 12.0, 6.0, 6.0, 4.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2892959713935852, -0.28160953521728516, -0.2739230990409851, -0.26623666286468506, -0.258550226688385, -0.25086379051208496, -0.2431773692369461, -0.23549093306064606, -0.2278045117855072, -0.22011807560920715, -0.2124316394329071, -0.20474520325660706, -0.1970587819814682, -0.18937234580516815, -0.1816859096288681, -0.17399947345256805, -0.166313037276268, -0.15862660109996796, -0.1509401649236679, -0.14325374364852905, -0.135567307472229, -0.12788087129592896, -0.1201944351196289, -0.11250799894332886, -0.1048215702176094, -0.09713513404130936, -0.0894487053155899, -0.08176226913928986, -0.07407583296298981, -0.06638940423727036, -0.058702968060970306, -0.051016535609960556, -0.043330103158950806, -0.035643670707941055, -0.027957236394286156, -0.020270802080631256, -0.012584369629621506, -0.004897937178611755, 0.0027884989976882935, 0.010474931448698044, 0.018161363899707794, 0.025847796350717545, 0.033534228801727295, 0.041220664978027344, 0.048907097429037094, 0.056593529880046844, 0.0642799660563469, 0.07196639478206635, 0.0796528309583664, 0.08733926713466644, 0.0950256958603859, 0.10271213203668594, 0.1103985607624054, 0.11808499693870544, 0.1257714331150055, 0.13345786929130554, 0.1411443054676056, 0.14883074164390564, 0.1565171778202057, 0.16420361399650574, 0.1718900352716446, 0.17957647144794464, 0.1872629076242447, 0.19494934380054474, 0.2026357650756836]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 10.0, 8.0, 19.0, 28.0, 27.0, 39.0, 67.0, 86.0, 154.0, 172.0, 236.0, 452.0, 716.0, 1313.0, 2817.0, 8714.0, 47696.0, 555483.0, 382442.0, 35313.0, 7322.0, 2519.0, 1118.0, 620.0, 340.0, 241.0, 165.0, 117.0, 84.0, 63.0, 36.0, 35.0, 15.0, 20.0, 21.0, 8.0, 9.0, 9.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.328125, -0.3187294006347656, -0.30933380126953125, -0.2999382019042969, -0.2905426025390625, -0.2811470031738281, -0.27175140380859375, -0.2623558044433594, -0.252960205078125, -0.24356460571289062, -0.23416900634765625, -0.22477340698242188, -0.2153778076171875, -0.20598220825195312, -0.19658660888671875, -0.18719100952148438, -0.17779541015625, -0.16839981079101562, -0.15900421142578125, -0.14960861206054688, -0.1402130126953125, -0.13081741333007812, -0.12142181396484375, -0.11202621459960938, -0.102630615234375, -0.09323501586914062, -0.08383941650390625, -0.07444381713867188, -0.0650482177734375, -0.055652618408203125, -0.04625701904296875, -0.036861419677734375, -0.0274658203125, -0.018070220947265625, -0.00867462158203125, 0.000720977783203125, 0.0101165771484375, 0.019512176513671875, 0.02890777587890625, 0.038303375244140625, 0.047698974609375, 0.057094573974609375, 0.06649017333984375, 0.07588577270507812, 0.0852813720703125, 0.09467697143554688, 0.10407257080078125, 0.11346817016601562, 0.12286376953125, 0.13225936889648438, 0.14165496826171875, 0.15105056762695312, 0.1604461669921875, 0.16984176635742188, 0.17923736572265625, 0.18863296508789062, 0.198028564453125, 0.20742416381835938, 0.21681976318359375, 0.22621536254882812, 0.2356109619140625, 0.24500656127929688, 0.25440216064453125, 0.2637977600097656, 0.273193359375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 3.0, 18.0, 30.0, 56.0, 80.0, 114.0, 141.0, 127.0, 151.0, 111.0, 72.0, 45.0, 16.0, 11.0, 8.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09869384765625, -0.09618997573852539, -0.09368610382080078, -0.09118223190307617, -0.08867835998535156, -0.08617448806762695, -0.08367061614990234, -0.08116674423217773, -0.07866287231445312, -0.07615900039672852, -0.0736551284790039, -0.0711512565612793, -0.06864738464355469, -0.06614351272583008, -0.06363964080810547, -0.06113576889038086, -0.05863189697265625, -0.05612802505493164, -0.05362415313720703, -0.05112028121948242, -0.04861640930175781, -0.0461125373840332, -0.043608665466308594, -0.041104793548583984, -0.038600921630859375, -0.036097049713134766, -0.033593177795410156, -0.031089305877685547, -0.028585433959960938, -0.026081562042236328, -0.02357769012451172, -0.02107381820678711, -0.0185699462890625, -0.01606607437133789, -0.013562202453613281, -0.011058330535888672, -0.008554458618164062, -0.006050586700439453, -0.0035467147827148438, -0.0010428428649902344, 0.001461029052734375, 0.003964900970458984, 0.006468772888183594, 0.008972644805908203, 0.011476516723632812, 0.013980388641357422, 0.01648426055908203, 0.01898813247680664, 0.02149200439453125, 0.02399587631225586, 0.02649974822998047, 0.029003620147705078, 0.03150749206542969, 0.0340113639831543, 0.036515235900878906, 0.039019107818603516, 0.041522979736328125, 0.044026851654052734, 0.046530723571777344, 0.04903459548950195, 0.05153846740722656, 0.05404233932495117, 0.05654621124267578, 0.05905008316040039, 0.061553955078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 9.0, 4.0, 15.0, 19.0, 29.0, 26.0, 44.0, 78.0, 111.0, 213.0, 412.0, 912.0, 2108.0, 5408.0, 16306.0, 55086.0, 213357.0, 516726.0, 171053.0, 45009.0, 13559.0, 4624.0, 1811.0, 743.0, 329.0, 220.0, 128.0, 72.0, 46.0, 28.0, 15.0, 9.0, 10.0, 8.0, 12.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.156982421875, -0.1524219512939453, -0.14786148071289062, -0.14330101013183594, -0.13874053955078125, -0.13418006896972656, -0.12961959838867188, -0.1250591278076172, -0.1204986572265625, -0.11593818664550781, -0.11137771606445312, -0.10681724548339844, -0.10225677490234375, -0.09769630432128906, -0.09313583374023438, -0.08857536315917969, -0.084014892578125, -0.07945442199707031, -0.07489395141601562, -0.07033348083496094, -0.06577301025390625, -0.06121253967285156, -0.056652069091796875, -0.05209159851074219, -0.0475311279296875, -0.04297065734863281, -0.038410186767578125, -0.03384971618652344, -0.02928924560546875, -0.024728775024414062, -0.020168304443359375, -0.015607833862304688, -0.01104736328125, -0.0064868927001953125, -0.001926422119140625, 0.0026340484619140625, 0.00719451904296875, 0.011754989624023438, 0.016315460205078125, 0.020875930786132812, 0.0254364013671875, 0.029996871948242188, 0.034557342529296875, 0.03911781311035156, 0.04367828369140625, 0.04823875427246094, 0.052799224853515625, 0.05735969543457031, 0.061920166015625, 0.06648063659667969, 0.07104110717773438, 0.07560157775878906, 0.08016204833984375, 0.08472251892089844, 0.08928298950195312, 0.09384346008300781, 0.0984039306640625, 0.10296440124511719, 0.10752487182617188, 0.11208534240722656, 0.11664581298828125, 0.12120628356933594, 0.12576675415039062, 0.1303272247314453, 0.1348876953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 12.0, 8.0, 10.0, 9.0, 19.0, 15.0, 18.0, 18.0, 26.0, 26.0, 31.0, 26.0, 38.0, 36.0, 42.0, 37.0, 34.0, 60.0, 39.0, 51.0, 39.0, 48.0, 41.0, 50.0, 38.0, 21.0, 28.0, 36.0, 20.0, 19.0, 18.0, 17.0, 15.0, 9.0, 14.0, 10.0, 4.0, 9.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11663818359375, -0.11319637298583984, -0.10975456237792969, -0.10631275177001953, -0.10287094116210938, -0.09942913055419922, -0.09598731994628906, -0.0925455093383789, -0.08910369873046875, -0.0856618881225586, -0.08222007751464844, -0.07877826690673828, -0.07533645629882812, -0.07189464569091797, -0.06845283508300781, -0.06501102447509766, -0.0615692138671875, -0.058127403259277344, -0.05468559265136719, -0.05124378204345703, -0.047801971435546875, -0.04436016082763672, -0.04091835021972656, -0.037476539611816406, -0.03403472900390625, -0.030592918395996094, -0.027151107788085938, -0.02370929718017578, -0.020267486572265625, -0.01682567596435547, -0.013383865356445312, -0.009942054748535156, -0.006500244140625, -0.0030584335327148438, 0.0003833770751953125, 0.0038251876831054688, 0.007266998291015625, 0.010708808898925781, 0.014150619506835938, 0.017592430114746094, 0.02103424072265625, 0.024476051330566406, 0.027917861938476562, 0.03135967254638672, 0.034801483154296875, 0.03824329376220703, 0.04168510437011719, 0.045126914978027344, 0.0485687255859375, 0.052010536193847656, 0.05545234680175781, 0.05889415740966797, 0.062335968017578125, 0.06577777862548828, 0.06921958923339844, 0.0726613998413086, 0.07610321044921875, 0.0795450210571289, 0.08298683166503906, 0.08642864227294922, 0.08987045288085938, 0.09331226348876953, 0.09675407409667969, 0.10019588470458984, 0.1036376953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 7.0, 7.0, 6.0, 15.0, 19.0, 31.0, 55.0, 61.0, 88.0, 160.0, 223.0, 350.0, 597.0, 980.0, 1845.0, 4096.0, 10553.0, 39355.0, 254097.0, 627708.0, 78359.0, 18206.0, 6014.0, 2543.0, 1236.0, 716.0, 435.0, 279.0, 156.0, 121.0, 87.0, 49.0, 40.0, 23.0, 17.0, 9.0, 7.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.064208984375, -0.06221580505371094, -0.060222625732421875, -0.05822944641113281, -0.05623626708984375, -0.05424308776855469, -0.052249908447265625, -0.05025672912597656, -0.0482635498046875, -0.04627037048339844, -0.044277191162109375, -0.04228401184082031, -0.04029083251953125, -0.03829765319824219, -0.036304473876953125, -0.03431129455566406, -0.032318115234375, -0.030324935913085938, -0.028331756591796875, -0.026338577270507812, -0.02434539794921875, -0.022352218627929688, -0.020359039306640625, -0.018365859985351562, -0.0163726806640625, -0.014379501342773438, -0.012386322021484375, -0.010393142700195312, -0.00839996337890625, -0.0064067840576171875, -0.004413604736328125, -0.0024204254150390625, -0.00042724609375, 0.0015659332275390625, 0.003559112548828125, 0.0055522918701171875, 0.00754547119140625, 0.009538650512695312, 0.011531829833984375, 0.013525009155273438, 0.0155181884765625, 0.017511367797851562, 0.019504547119140625, 0.021497726440429688, 0.02349090576171875, 0.025484085083007812, 0.027477264404296875, 0.029470443725585938, 0.031463623046875, 0.03345680236816406, 0.035449981689453125, 0.03744316101074219, 0.03943634033203125, 0.04142951965332031, 0.043422698974609375, 0.04541587829589844, 0.0474090576171875, 0.04940223693847656, 0.051395416259765625, 0.05338859558105469, 0.05538177490234375, 0.05737495422363281, 0.059368133544921875, 0.06136131286621094, 0.0633544921875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 4.0, 5.0, 6.0, 13.0, 20.0, 19.0, 35.0, 77.0, 178.0, 309.0, 162.0, 65.0, 29.0, 23.0, 13.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013256072998046875, -0.00012754276394844055, -0.00012252479791641235, -0.00011750683188438416, -0.00011248886585235596, -0.00010747089982032776, -0.00010245293378829956, -9.743496775627136e-05, -9.241700172424316e-05, -8.739903569221497e-05, -8.238106966018677e-05, -7.736310362815857e-05, -7.234513759613037e-05, -6.732717156410217e-05, -6.230920553207397e-05, -5.7291239500045776e-05, -5.227327346801758e-05, -4.725530743598938e-05, -4.223734140396118e-05, -3.7219375371932983e-05, -3.2201409339904785e-05, -2.7183443307876587e-05, -2.216547727584839e-05, -1.714751124382019e-05, -1.2129545211791992e-05, -7.111579179763794e-06, -2.0936131477355957e-06, 2.9243528842926025e-06, 7.9423189163208e-06, 1.2960284948348999e-05, 1.7978250980377197e-05, 2.2996217012405396e-05, 2.8014183044433594e-05, 3.303214907646179e-05, 3.805011510848999e-05, 4.306808114051819e-05, 4.808604717254639e-05, 5.3104013204574585e-05, 5.812197923660278e-05, 6.313994526863098e-05, 6.815791130065918e-05, 7.317587733268738e-05, 7.819384336471558e-05, 8.321180939674377e-05, 8.822977542877197e-05, 9.324774146080017e-05, 9.826570749282837e-05, 0.00010328367352485657, 0.00010830163955688477, 0.00011331960558891296, 0.00011833757162094116, 0.00012335553765296936, 0.00012837350368499756, 0.00013339146971702576, 0.00013840943574905396, 0.00014342740178108215, 0.00014844536781311035, 0.00015346333384513855, 0.00015848129987716675, 0.00016349926590919495, 0.00016851723194122314, 0.00017353519797325134, 0.00017855316400527954, 0.00018357113003730774, 0.00018858909606933594]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 8.0, 5.0, 8.0, 8.0, 13.0, 30.0, 31.0, 73.0, 112.0, 225.0, 416.0, 878.0, 2056.0, 5094.0, 16216.0, 86052.0, 727478.0, 172581.0, 25482.0, 6995.0, 2599.0, 1092.0, 505.0, 238.0, 156.0, 69.0, 43.0, 31.0, 17.0, 17.0, 10.0, 4.0, 7.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0887451171875, -0.08625602722167969, -0.08376693725585938, -0.08127784729003906, -0.07878875732421875, -0.07629966735839844, -0.07381057739257812, -0.07132148742675781, -0.0688323974609375, -0.06634330749511719, -0.06385421752929688, -0.06136512756347656, -0.05887603759765625, -0.05638694763183594, -0.053897857666015625, -0.05140876770019531, -0.048919677734375, -0.04643058776855469, -0.043941497802734375, -0.04145240783691406, -0.03896331787109375, -0.03647422790527344, -0.033985137939453125, -0.03149604797363281, -0.0290069580078125, -0.026517868041992188, -0.024028778076171875, -0.021539688110351562, -0.01905059814453125, -0.016561508178710938, -0.014072418212890625, -0.011583328247070312, -0.00909423828125, -0.0066051483154296875, -0.004116058349609375, -0.0016269683837890625, 0.00086212158203125, 0.0033512115478515625, 0.005840301513671875, 0.008329391479492188, 0.0108184814453125, 0.013307571411132812, 0.015796661376953125, 0.018285751342773438, 0.02077484130859375, 0.023263931274414062, 0.025753021240234375, 0.028242111206054688, 0.030731201171875, 0.03322029113769531, 0.035709381103515625, 0.03819847106933594, 0.04068756103515625, 0.04317665100097656, 0.045665740966796875, 0.04815483093261719, 0.0506439208984375, 0.05313301086425781, 0.055622100830078125, 0.05811119079589844, 0.06060028076171875, 0.06308937072753906, 0.06557846069335938, 0.06806755065917969, 0.070556640625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 11.0, 11.0, 6.0, 19.0, 29.0, 42.0, 41.0, 57.0, 59.0, 83.0, 110.0, 97.0, 85.0, 75.0, 54.0, 44.0, 27.0, 36.0, 24.0, 16.0, 17.0, 3.0, 7.0, 5.0, 10.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.060638427734375, -0.05891895294189453, -0.05719947814941406, -0.055480003356933594, -0.053760528564453125, -0.052041053771972656, -0.05032157897949219, -0.04860210418701172, -0.04688262939453125, -0.04516315460205078, -0.04344367980957031, -0.041724205017089844, -0.040004730224609375, -0.038285255432128906, -0.03656578063964844, -0.03484630584716797, -0.0331268310546875, -0.03140735626220703, -0.029687881469726562, -0.027968406677246094, -0.026248931884765625, -0.024529457092285156, -0.022809982299804688, -0.02109050750732422, -0.01937103271484375, -0.01765155792236328, -0.015932083129882812, -0.014212608337402344, -0.012493133544921875, -0.010773658752441406, -0.009054183959960938, -0.007334709167480469, -0.005615234375, -0.0038957595825195312, -0.0021762847900390625, -0.00045680999755859375, 0.001262664794921875, 0.0029821395874023438, 0.0047016143798828125, 0.006421089172363281, 0.00814056396484375, 0.009860038757324219, 0.011579513549804688, 0.013298988342285156, 0.015018463134765625, 0.016737937927246094, 0.018457412719726562, 0.02017688751220703, 0.0218963623046875, 0.02361583709716797, 0.025335311889648438, 0.027054786682128906, 0.028774261474609375, 0.030493736267089844, 0.03221321105957031, 0.03393268585205078, 0.03565216064453125, 0.03737163543701172, 0.03909111022949219, 0.040810585021972656, 0.042530059814453125, 0.044249534606933594, 0.04596900939941406, 0.04768848419189453, 0.049407958984375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 11.0, 35.0, 46.0, 120.0, 241.0, 280.0, 143.0, 63.0, 27.0, 15.0, 5.0, 9.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9402272701263428, -1.8894137144088745, -1.8386001586914062, -1.787786602973938, -1.7369730472564697, -1.6861594915390015, -1.6353459358215332, -1.584532380104065, -1.5337188243865967, -1.4829052686691284, -1.4320917129516602, -1.381278157234192, -1.3304646015167236, -1.2796510457992554, -1.228837490081787, -1.1780239343643188, -1.1272103786468506, -1.0763968229293823, -1.025583267211914, -0.9747697114944458, -0.9239561557769775, -0.8731426000595093, -0.822329044342041, -0.7715154886245728, -0.720702052116394, -0.6698884963989258, -0.6190749406814575, -0.5682613849639893, -0.517447829246521, -0.4666343033313751, -0.41582074761390686, -0.3650071918964386, -0.31419360637664795, -0.2633800506591797, -0.21256649494171143, -0.16175295412540436, -0.1109393984079361, -0.06012585759162903, -0.009312301874160767, 0.041501253843307495, 0.09231480956077576, 0.14312836527824402, 0.19394192099571228, 0.24475546181201935, 0.2955690026283264, 0.3463825583457947, 0.39719611406326294, 0.4480096697807312, 0.49882322549819946, 0.5496367812156677, 0.600450336933136, 0.6512638926506042, 0.7020774483680725, 0.752890944480896, 0.8037045001983643, 0.8545180559158325, 0.9053316116333008, 0.956145167350769, 1.0069587230682373, 1.0577722787857056, 1.1085858345031738, 1.159399390220642, 1.2102129459381104, 1.2610265016555786, 1.3118400573730469]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 12.0, 11.0, 11.0, 18.0, 14.0, 17.0, 23.0, 27.0, 17.0, 31.0, 35.0, 35.0, 35.0, 36.0, 51.0, 48.0, 47.0, 44.0, 59.0, 46.0, 42.0, 39.0, 36.0, 37.0, 33.0, 34.0, 26.0, 21.0, 18.0, 17.0, 14.0, 13.0, 11.0, 10.0, 6.0, 5.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5247740149497986, -0.5074394941329956, -0.49010494351387024, -0.4727703928947449, -0.4554358720779419, -0.4381013512611389, -0.42076680064201355, -0.4034322500228882, -0.3860977292060852, -0.3687632083892822, -0.35142865777015686, -0.3340941071510315, -0.3167595863342285, -0.29942506551742554, -0.28209051489830017, -0.2647559642791748, -0.24742144346237183, -0.23008690774440765, -0.21275237202644348, -0.1954178363084793, -0.17808330059051514, -0.16074876487255096, -0.1434142291545868, -0.12607969343662262, -0.10874515771865845, -0.09141062200069427, -0.0740760862827301, -0.05674155056476593, -0.03940701484680176, -0.022072479128837585, -0.004737943410873413, 0.01259659230709076, 0.029931187629699707, 0.04726572334766388, 0.06460025906562805, 0.08193479478359222, 0.0992693305015564, 0.11660386621952057, 0.13393840193748474, 0.1512729376554489, 0.16860747337341309, 0.18594200909137726, 0.20327654480934143, 0.2206110805273056, 0.23794561624526978, 0.25528013706207275, 0.2726146876811981, 0.2899492383003235, 0.30728375911712646, 0.32461827993392944, 0.3419528305530548, 0.3592873811721802, 0.37662190198898315, 0.39395642280578613, 0.4112909734249115, 0.42862552404403687, 0.44596004486083984, 0.4632945656776428, 0.4806291162967682, 0.49796366691589355, 0.5152981877326965, 0.5326327085494995, 0.5499672889709473, 0.5673018097877502, 0.5846363306045532]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 7.0, 3.0, 8.0, 13.0, 18.0, 22.0, 24.0, 33.0, 62.0, 89.0, 153.0, 333.0, 872.0, 2919.0, 20325.0, 4136401.0, 27494.0, 3503.0, 1010.0, 444.0, 188.0, 110.0, 81.0, 40.0, 32.0, 24.0, 17.0, 9.0, 11.0, 4.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.302734375, -0.29488182067871094, -0.2870292663574219, -0.2791767120361328, -0.27132415771484375, -0.2634716033935547, -0.2556190490722656, -0.24776649475097656, -0.2399139404296875, -0.23206138610839844, -0.22420883178710938, -0.2163562774658203, -0.20850372314453125, -0.2006511688232422, -0.19279861450195312, -0.18494606018066406, -0.177093505859375, -0.16924095153808594, -0.16138839721679688, -0.1535358428955078, -0.14568328857421875, -0.1378307342529297, -0.12997817993164062, -0.12212562561035156, -0.1142730712890625, -0.10642051696777344, -0.09856796264648438, -0.09071540832519531, -0.08286285400390625, -0.07501029968261719, -0.06715774536132812, -0.05930519104003906, -0.05145263671875, -0.04360008239746094, -0.035747528076171875, -0.027894973754882812, -0.02004241943359375, -0.012189865112304688, -0.004337310791015625, 0.0035152435302734375, 0.0113677978515625, 0.019220352172851562, 0.027072906494140625, 0.03492546081542969, 0.04277801513671875, 0.05063056945800781, 0.058483123779296875, 0.06633567810058594, 0.074188232421875, 0.08204078674316406, 0.08989334106445312, 0.09774589538574219, 0.10559844970703125, 0.11345100402832031, 0.12130355834960938, 0.12915611267089844, 0.1370086669921875, 0.14486122131347656, 0.15271377563476562, 0.1605663299560547, 0.16841888427734375, 0.1762714385986328, 0.18412399291992188, 0.19197654724121094, 0.1998291015625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 9.0, 4.0, 18.0, 36.0, 67.0, 99.0, 126.0, 136.0, 155.0, 126.0, 93.0, 66.0, 25.0, 22.0, 4.0, 5.0, 3.0, 1.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10357666015625, -0.10098886489868164, -0.09840106964111328, -0.09581327438354492, -0.09322547912597656, -0.0906376838684082, -0.08804988861083984, -0.08546209335327148, -0.08287429809570312, -0.08028650283813477, -0.0776987075805664, -0.07511091232299805, -0.07252311706542969, -0.06993532180786133, -0.06734752655029297, -0.06475973129272461, -0.06217193603515625, -0.05958414077758789, -0.05699634552001953, -0.05440855026245117, -0.05182075500488281, -0.04923295974731445, -0.046645164489746094, -0.044057369232177734, -0.041469573974609375, -0.038881778717041016, -0.036293983459472656, -0.0337061882019043, -0.031118392944335938, -0.028530597686767578, -0.02594280242919922, -0.02335500717163086, -0.0207672119140625, -0.01817941665649414, -0.015591621398925781, -0.013003826141357422, -0.010416030883789062, -0.007828235626220703, -0.005240440368652344, -0.0026526451110839844, -6.4849853515625e-05, 0.0025229454040527344, 0.005110740661621094, 0.007698535919189453, 0.010286331176757812, 0.012874126434326172, 0.015461921691894531, 0.01804971694946289, 0.02063751220703125, 0.02322530746459961, 0.02581310272216797, 0.028400897979736328, 0.030988693237304688, 0.03357648849487305, 0.036164283752441406, 0.038752079010009766, 0.041339874267578125, 0.043927669525146484, 0.046515464782714844, 0.0491032600402832, 0.05169105529785156, 0.05427885055541992, 0.05686664581298828, 0.05945444107055664, 0.062042236328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 3.0, 5.0, 5.0, 21.0, 31.0, 40.0, 41.0, 76.0, 146.0, 278.0, 576.0, 1477.0, 6539.0, 119024.0, 4049027.0, 13129.0, 2233.0, 794.0, 353.0, 184.0, 103.0, 57.0, 31.0, 32.0, 27.0, 22.0, 8.0, 8.0, 10.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.40625, -0.3963813781738281, -0.38651275634765625, -0.3766441345214844, -0.3667755126953125, -0.3569068908691406, -0.34703826904296875, -0.3371696472167969, -0.327301025390625, -0.3174324035644531, -0.30756378173828125, -0.2976951599121094, -0.2878265380859375, -0.2779579162597656, -0.26808929443359375, -0.2582206726074219, -0.24835205078125, -0.23848342895507812, -0.22861480712890625, -0.21874618530273438, -0.2088775634765625, -0.19900894165039062, -0.18914031982421875, -0.17927169799804688, -0.169403076171875, -0.15953445434570312, -0.14966583251953125, -0.13979721069335938, -0.1299285888671875, -0.12005996704101562, -0.11019134521484375, -0.10032272338867188, -0.0904541015625, -0.08058547973632812, -0.07071685791015625, -0.060848236083984375, -0.0509796142578125, -0.041110992431640625, -0.03124237060546875, -0.021373748779296875, -0.011505126953125, -0.001636505126953125, 0.00823211669921875, 0.018100738525390625, 0.0279693603515625, 0.037837982177734375, 0.04770660400390625, 0.057575225830078125, 0.06744384765625, 0.07731246948242188, 0.08718109130859375, 0.09704971313476562, 0.1069183349609375, 0.11678695678710938, 0.12665557861328125, 0.13652420043945312, 0.146392822265625, 0.15626144409179688, 0.16613006591796875, 0.17599868774414062, 0.1858673095703125, 0.19573593139648438, 0.20560455322265625, 0.21547317504882812, 0.225341796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 11.0, 20.0, 46.0, 118.0, 3573.0, 220.0, 46.0, 15.0, 7.0, 12.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06951904296875, -0.06578731536865234, -0.06205558776855469, -0.05832386016845703, -0.054592132568359375, -0.05086040496826172, -0.04712867736816406, -0.043396949768066406, -0.03966522216796875, -0.035933494567871094, -0.03220176696777344, -0.02847003936767578, -0.024738311767578125, -0.02100658416748047, -0.017274856567382812, -0.013543128967285156, -0.0098114013671875, -0.006079673767089844, -0.0023479461669921875, 0.0013837814331054688, 0.005115509033203125, 0.008847236633300781, 0.012578964233398438, 0.016310691833496094, 0.02004241943359375, 0.023774147033691406, 0.027505874633789062, 0.03123760223388672, 0.034969329833984375, 0.03870105743408203, 0.04243278503417969, 0.046164512634277344, 0.049896240234375, 0.053627967834472656, 0.05735969543457031, 0.06109142303466797, 0.06482315063476562, 0.06855487823486328, 0.07228660583496094, 0.0760183334350586, 0.07975006103515625, 0.0834817886352539, 0.08721351623535156, 0.09094524383544922, 0.09467697143554688, 0.09840869903564453, 0.10214042663574219, 0.10587215423583984, 0.1096038818359375, 0.11333560943603516, 0.11706733703613281, 0.12079906463623047, 0.12453079223632812, 0.12826251983642578, 0.13199424743652344, 0.1357259750366211, 0.13945770263671875, 0.1431894302368164, 0.14692115783691406, 0.15065288543701172, 0.15438461303710938, 0.15811634063720703, 0.1618480682373047, 0.16557979583740234, 0.1693115234375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 9.0, 11.0, 86.0, 279.0, 421.0, 140.0, 31.0, 14.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3846874237060547, -0.3673533499240875, -0.35001927614212036, -0.3326852023601532, -0.31535112857818604, -0.29801705479621887, -0.2806829810142517, -0.26334890723228455, -0.24601483345031738, -0.22868075966835022, -0.21134668588638306, -0.1940126121044159, -0.17667853832244873, -0.15934446454048157, -0.1420103907585144, -0.12467631697654724, -0.10734224319458008, -0.09000816941261292, -0.07267409563064575, -0.05534002184867859, -0.038005948066711426, -0.020671874284744263, -0.0033378005027770996, 0.013996273279190063, 0.03133034706115723, 0.04866442084312439, 0.06599849462509155, 0.08333256840705872, 0.10066664218902588, 0.11800071597099304, 0.1353347897529602, 0.15266886353492737, 0.1700029969215393, 0.18733707070350647, 0.20467114448547363, 0.2220052182674408, 0.23933929204940796, 0.2566733658313751, 0.2740074396133423, 0.29134151339530945, 0.3086755871772766, 0.3260096609592438, 0.34334373474121094, 0.3606778085231781, 0.37801188230514526, 0.3953459560871124, 0.4126800298690796, 0.43001410365104675, 0.4473481774330139, 0.4646822512149811, 0.48201632499694824, 0.4993503987789154, 0.5166844725608826, 0.5340185165405273, 0.5513526201248169, 0.5686867237091064, 0.5860207676887512, 0.603354811668396, 0.6206889152526855, 0.6380230188369751, 0.6553570628166199, 0.6726911067962646, 0.6900252103805542, 0.7073593139648438, 0.7246933579444885]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 14.0, 25.0, 35.0, 80.0, 98.0, 158.0, 156.0, 117.0, 123.0, 66.0, 57.0, 40.0, 15.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3285573124885559, -0.31906038522720337, -0.3095634877681732, -0.3000665605068207, -0.2905696630477905, -0.281072735786438, -0.27157580852508545, -0.2620789110660553, -0.25258198380470276, -0.2430850714445114, -0.23358815908432007, -0.22409123182296753, -0.21459431946277618, -0.20509740710258484, -0.1956004947423935, -0.18610358238220215, -0.1766066700220108, -0.16710975766181946, -0.1576128453016281, -0.14811593294143677, -0.13861900568008423, -0.12912209331989288, -0.11962518095970154, -0.1101282611489296, -0.10063134878873825, -0.0911344364285469, -0.08163751661777496, -0.07214060425758362, -0.06264369189739227, -0.05314677208662033, -0.043649859726428986, -0.03415293991565704, -0.024656027555465698, -0.01515911240130663, -0.00566219724714756, 0.0038347169756889343, 0.013331633061170578, 0.02282854914665222, 0.03232546150684357, 0.04182238131761551, 0.051319293677806854, 0.0608162097632885, 0.07031312584877014, 0.07981003820896149, 0.08930695056915283, 0.09880387037992477, 0.10830078274011612, 0.11779770255088806, 0.1272946149110794, 0.13679152727127075, 0.1462884396314621, 0.15578535199165344, 0.16528227925300598, 0.17477919161319733, 0.18427610397338867, 0.1937730312347412, 0.20326992869377136, 0.2127668410539627, 0.22226375341415405, 0.2317606806755066, 0.24125759303569794, 0.2507545053958893, 0.26025140285491943, 0.269748330116272, 0.2792452573776245]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 12.0, 13.0, 8.0, 12.0, 15.0, 22.0, 39.0, 35.0, 56.0, 75.0, 76.0, 100.0, 135.0, 188.0, 251.0, 424.0, 538.0, 845.0, 1574.0, 3148.0, 8878.0, 38014.0, 261664.0, 609553.0, 94857.0, 17367.0, 5025.0, 1982.0, 1171.0, 710.0, 495.0, 324.0, 223.0, 178.0, 124.0, 87.0, 73.0, 68.0, 35.0, 37.0, 26.0, 19.0, 16.0, 20.0, 10.0, 9.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.193359375, -0.18717193603515625, -0.1809844970703125, -0.17479705810546875, -0.168609619140625, -0.16242218017578125, -0.1562347412109375, -0.15004730224609375, -0.14385986328125, -0.13767242431640625, -0.1314849853515625, -0.12529754638671875, -0.119110107421875, -0.11292266845703125, -0.1067352294921875, -0.10054779052734375, -0.0943603515625, -0.08817291259765625, -0.0819854736328125, -0.07579803466796875, -0.069610595703125, -0.06342315673828125, -0.0572357177734375, -0.05104827880859375, -0.04486083984375, -0.03867340087890625, -0.0324859619140625, -0.02629852294921875, -0.020111083984375, -0.01392364501953125, -0.0077362060546875, -0.00154876708984375, 0.004638671875, 0.01082611083984375, 0.0170135498046875, 0.02320098876953125, 0.029388427734375, 0.03557586669921875, 0.0417633056640625, 0.04795074462890625, 0.05413818359375, 0.06032562255859375, 0.0665130615234375, 0.07270050048828125, 0.078887939453125, 0.08507537841796875, 0.0912628173828125, 0.09745025634765625, 0.1036376953125, 0.10982513427734375, 0.1160125732421875, 0.12220001220703125, 0.128387451171875, 0.13457489013671875, 0.1407623291015625, 0.14694976806640625, 0.15313720703125, 0.15932464599609375, 0.1655120849609375, 0.17169952392578125, 0.177886962890625, 0.18407440185546875, 0.1902618408203125, 0.19644927978515625, 0.20263671875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 6.0, 25.0, 42.0, 86.0, 114.0, 146.0, 160.0, 145.0, 119.0, 75.0, 34.0, 24.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1129150390625, -0.11012649536132812, -0.10733795166015625, -0.10454940795898438, -0.1017608642578125, -0.09897232055664062, -0.09618377685546875, -0.09339523315429688, -0.090606689453125, -0.08781814575195312, -0.08502960205078125, -0.08224105834960938, -0.0794525146484375, -0.07666397094726562, -0.07387542724609375, -0.07108688354492188, -0.06829833984375, -0.06550979614257812, -0.06272125244140625, -0.059932708740234375, -0.0571441650390625, -0.054355621337890625, -0.05156707763671875, -0.048778533935546875, -0.045989990234375, -0.043201446533203125, -0.04041290283203125, -0.037624359130859375, -0.0348358154296875, -0.032047271728515625, -0.02925872802734375, -0.026470184326171875, -0.023681640625, -0.020893096923828125, -0.01810455322265625, -0.015316009521484375, -0.0125274658203125, -0.009738922119140625, -0.00695037841796875, -0.004161834716796875, -0.001373291015625, 0.001415252685546875, 0.00420379638671875, 0.006992340087890625, 0.0097808837890625, 0.012569427490234375, 0.01535797119140625, 0.018146514892578125, 0.02093505859375, 0.023723602294921875, 0.02651214599609375, 0.029300689697265625, 0.0320892333984375, 0.034877777099609375, 0.03766632080078125, 0.040454864501953125, 0.043243408203125, 0.046031951904296875, 0.04882049560546875, 0.051609039306640625, 0.0543975830078125, 0.057186126708984375, 0.05997467041015625, 0.06276321411132812, 0.0655517578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 4.0, 5.0, 9.0, 15.0, 22.0, 16.0, 21.0, 25.0, 53.0, 94.0, 195.0, 376.0, 766.0, 1598.0, 3544.0, 8470.0, 20617.0, 53286.0, 151649.0, 413138.0, 255118.0, 85171.0, 31490.0, 12877.0, 5438.0, 2443.0, 1012.0, 451.0, 254.0, 125.0, 59.0, 47.0, 36.0, 21.0, 13.0, 17.0, 12.0, 8.0, 13.0, 6.0, 6.0, 5.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 4.0, 4.0], "bins": [-0.10107421875, -0.09807777404785156, -0.09508132934570312, -0.09208488464355469, -0.08908843994140625, -0.08609199523925781, -0.08309555053710938, -0.08009910583496094, -0.0771026611328125, -0.07410621643066406, -0.07110977172851562, -0.06811332702636719, -0.06511688232421875, -0.06212043762207031, -0.059123992919921875, -0.05612754821777344, -0.053131103515625, -0.05013465881347656, -0.047138214111328125, -0.04414176940917969, -0.04114532470703125, -0.03814888000488281, -0.035152435302734375, -0.03215599060058594, -0.0291595458984375, -0.026163101196289062, -0.023166656494140625, -0.020170211791992188, -0.01717376708984375, -0.014177322387695312, -0.011180877685546875, -0.008184432983398438, -0.00518798828125, -0.0021915435791015625, 0.000804901123046875, 0.0038013458251953125, 0.00679779052734375, 0.009794235229492188, 0.012790679931640625, 0.015787124633789062, 0.0187835693359375, 0.021780014038085938, 0.024776458740234375, 0.027772903442382812, 0.03076934814453125, 0.03376579284667969, 0.036762237548828125, 0.03975868225097656, 0.042755126953125, 0.04575157165527344, 0.048748016357421875, 0.05174446105957031, 0.05474090576171875, 0.05773735046386719, 0.060733795166015625, 0.06373023986816406, 0.0667266845703125, 0.06972312927246094, 0.07271957397460938, 0.07571601867675781, 0.07871246337890625, 0.08170890808105469, 0.08470535278320312, 0.08770179748535156, 0.0906982421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 6.0, 9.0, 12.0, 15.0, 14.0, 9.0, 13.0, 14.0, 16.0, 13.0, 25.0, 19.0, 21.0, 33.0, 37.0, 31.0, 44.0, 38.0, 41.0, 41.0, 40.0, 31.0, 40.0, 46.0, 34.0, 38.0, 32.0, 30.0, 35.0, 31.0, 21.0, 17.0, 29.0, 13.0, 15.0, 13.0, 11.0, 12.0, 10.0, 14.0, 6.0, 8.0, 8.0, 3.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0809326171875, -0.07821178436279297, -0.07549095153808594, -0.0727701187133789, -0.07004928588867188, -0.06732845306396484, -0.06460762023925781, -0.06188678741455078, -0.05916595458984375, -0.05644512176513672, -0.05372428894042969, -0.051003456115722656, -0.048282623291015625, -0.045561790466308594, -0.04284095764160156, -0.04012012481689453, -0.0373992919921875, -0.03467845916748047, -0.03195762634277344, -0.029236793518066406, -0.026515960693359375, -0.023795127868652344, -0.021074295043945312, -0.01835346221923828, -0.01563262939453125, -0.012911796569824219, -0.010190963745117188, -0.007470130920410156, -0.004749298095703125, -0.0020284652709960938, 0.0006923675537109375, 0.0034132003784179688, 0.006134033203125, 0.008854866027832031, 0.011575698852539062, 0.014296531677246094, 0.017017364501953125, 0.019738197326660156, 0.022459030151367188, 0.02517986297607422, 0.02790069580078125, 0.03062152862548828, 0.03334236145019531, 0.036063194274902344, 0.038784027099609375, 0.041504859924316406, 0.04422569274902344, 0.04694652557373047, 0.0496673583984375, 0.05238819122314453, 0.05510902404785156, 0.057829856872558594, 0.060550689697265625, 0.06327152252197266, 0.06599235534667969, 0.06871318817138672, 0.07143402099609375, 0.07415485382080078, 0.07687568664550781, 0.07959651947021484, 0.08231735229492188, 0.0850381851196289, 0.08775901794433594, 0.09047985076904297, 0.09320068359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 8.0, 6.0, 4.0, 5.0, 15.0, 25.0, 27.0, 55.0, 75.0, 126.0, 245.0, 377.0, 674.0, 1324.0, 2687.0, 6293.0, 16660.0, 63133.0, 517232.0, 364722.0, 50212.0, 14174.0, 5442.0, 2315.0, 1216.0, 608.0, 361.0, 205.0, 103.0, 81.0, 61.0, 20.0, 22.0, 16.0, 10.0, 9.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0430908203125, -0.04160118103027344, -0.040111541748046875, -0.03862190246582031, -0.03713226318359375, -0.03564262390136719, -0.034152984619140625, -0.03266334533691406, -0.0311737060546875, -0.029684066772460938, -0.028194427490234375, -0.026704788208007812, -0.02521514892578125, -0.023725509643554688, -0.022235870361328125, -0.020746231079101562, -0.019256591796875, -0.017766952514648438, -0.016277313232421875, -0.014787673950195312, -0.01329803466796875, -0.011808395385742188, -0.010318756103515625, -0.008829116821289062, -0.0073394775390625, -0.0058498382568359375, -0.004360198974609375, -0.0028705596923828125, -0.00138092041015625, 0.0001087188720703125, 0.001598358154296875, 0.0030879974365234375, 0.00457763671875, 0.0060672760009765625, 0.007556915283203125, 0.009046554565429688, 0.01053619384765625, 0.012025833129882812, 0.013515472412109375, 0.015005111694335938, 0.0164947509765625, 0.017984390258789062, 0.019474029541015625, 0.020963668823242188, 0.02245330810546875, 0.023942947387695312, 0.025432586669921875, 0.026922225952148438, 0.028411865234375, 0.029901504516601562, 0.031391143798828125, 0.03288078308105469, 0.03437042236328125, 0.03586006164550781, 0.037349700927734375, 0.03883934020996094, 0.0403289794921875, 0.04181861877441406, 0.043308258056640625, 0.04479789733886719, 0.04628753662109375, 0.04777717590332031, 0.049266815185546875, 0.05075645446777344, 0.05224609375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 4.0, 18.0, 18.0, 28.0, 47.0, 83.0, 145.0, 221.0, 185.0, 93.0, 59.0, 28.0, 11.0, 13.0, 10.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022161006927490234, -0.0002161506563425064, -0.00021069124341011047, -0.00020523183047771454, -0.0001997724175453186, -0.00019431300461292267, -0.00018885359168052673, -0.0001833941787481308, -0.00017793476581573486, -0.00017247535288333893, -0.000167015939950943, -0.00016155652701854706, -0.00015609711408615112, -0.0001506377011537552, -0.00014517828822135925, -0.00013971887528896332, -0.00013425946235656738, -0.00012880004942417145, -0.0001233406364917755, -0.00011788122355937958, -0.00011242181062698364, -0.00010696239769458771, -0.00010150298476219177, -9.604357182979584e-05, -9.05841588973999e-05, -8.512474596500397e-05, -7.966533303260803e-05, -7.42059201002121e-05, -6.874650716781616e-05, -6.328709423542023e-05, -5.782768130302429e-05, -5.236826837062836e-05, -4.690885543823242e-05, -4.144944250583649e-05, -3.599002957344055e-05, -3.053061664104462e-05, -2.507120370864868e-05, -1.9611790776252747e-05, -1.4152377843856812e-05, -8.692964911460876e-06, -3.2335519790649414e-06, 2.2258609533309937e-06, 7.685273885726929e-06, 1.3144686818122864e-05, 1.86040997505188e-05, 2.4063512682914734e-05, 2.952292561531067e-05, 3.4982338547706604e-05, 4.044175148010254e-05, 4.5901164412498474e-05, 5.136057734489441e-05, 5.6819990277290344e-05, 6.227940320968628e-05, 6.773881614208221e-05, 7.319822907447815e-05, 7.865764200687408e-05, 8.411705493927002e-05, 8.957646787166595e-05, 9.503588080406189e-05, 0.00010049529373645782, 0.00010595470666885376, 0.0001114141196012497, 0.00011687353253364563, 0.00012233294546604156, 0.0001277923583984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 10.0, 20.0, 32.0, 53.0, 106.0, 142.0, 307.0, 603.0, 1200.0, 3631.0, 13876.0, 107925.0, 810255.0, 92268.0, 12384.0, 3303.0, 1229.0, 575.0, 273.0, 152.0, 83.0, 51.0, 27.0, 16.0, 9.0, 4.0, 5.0, 5.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078369140625, -0.07595539093017578, -0.07354164123535156, -0.07112789154052734, -0.06871414184570312, -0.0663003921508789, -0.06388664245605469, -0.06147289276123047, -0.05905914306640625, -0.05664539337158203, -0.05423164367675781, -0.051817893981933594, -0.049404144287109375, -0.046990394592285156, -0.04457664489746094, -0.04216289520263672, -0.0397491455078125, -0.03733539581298828, -0.03492164611816406, -0.032507896423339844, -0.030094146728515625, -0.027680397033691406, -0.025266647338867188, -0.02285289764404297, -0.02043914794921875, -0.01802539825439453, -0.015611648559570312, -0.013197898864746094, -0.010784149169921875, -0.008370399475097656, -0.0059566497802734375, -0.0035429000854492188, -0.001129150390625, 0.0012845993041992188, 0.0036983489990234375, 0.006112098693847656, 0.008525848388671875, 0.010939598083496094, 0.013353347778320312, 0.01576709747314453, 0.01818084716796875, 0.02059459686279297, 0.023008346557617188, 0.025422096252441406, 0.027835845947265625, 0.030249595642089844, 0.03266334533691406, 0.03507709503173828, 0.0374908447265625, 0.03990459442138672, 0.04231834411621094, 0.044732093811035156, 0.047145843505859375, 0.049559593200683594, 0.05197334289550781, 0.05438709259033203, 0.05680084228515625, 0.05921459197998047, 0.06162834167480469, 0.0640420913696289, 0.06645584106445312, 0.06886959075927734, 0.07128334045410156, 0.07369709014892578, 0.07611083984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 7.0, 9.0, 12.0, 11.0, 12.0, 23.0, 51.0, 64.0, 99.0, 132.0, 172.0, 143.0, 77.0, 65.0, 39.0, 33.0, 18.0, 14.0, 11.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0677490234375, -0.06572341918945312, -0.06369781494140625, -0.061672210693359375, -0.0596466064453125, -0.057621002197265625, -0.05559539794921875, -0.053569793701171875, -0.051544189453125, -0.049518585205078125, -0.04749298095703125, -0.045467376708984375, -0.0434417724609375, -0.041416168212890625, -0.03939056396484375, -0.037364959716796875, -0.03533935546875, -0.033313751220703125, -0.03128814697265625, -0.029262542724609375, -0.0272369384765625, -0.025211334228515625, -0.02318572998046875, -0.021160125732421875, -0.019134521484375, -0.017108917236328125, -0.01508331298828125, -0.013057708740234375, -0.0110321044921875, -0.009006500244140625, -0.00698089599609375, -0.004955291748046875, -0.0029296875, -0.000904083251953125, 0.00112152099609375, 0.003147125244140625, 0.0051727294921875, 0.007198333740234375, 0.00922393798828125, 0.011249542236328125, 0.013275146484375, 0.015300750732421875, 0.01732635498046875, 0.019351959228515625, 0.0213775634765625, 0.023403167724609375, 0.02542877197265625, 0.027454376220703125, 0.02947998046875, 0.031505584716796875, 0.03353118896484375, 0.035556793212890625, 0.0375823974609375, 0.039608001708984375, 0.04163360595703125, 0.043659210205078125, 0.045684814453125, 0.047710418701171875, 0.04973602294921875, 0.051761627197265625, 0.0537872314453125, 0.055812835693359375, 0.05783843994140625, 0.059864044189453125, 0.0618896484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 11.0, 22.0, 38.0, 91.0, 204.0, 293.0, 165.0, 108.0, 33.0, 18.0, 12.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0629701614379883, -1.0213743448257446, -0.979778528213501, -0.9381826519966125, -0.8965868353843689, -0.8549910187721252, -0.8133951425552368, -0.7717993259429932, -0.7302035093307495, -0.6886076927185059, -0.6470118761062622, -0.6054159998893738, -0.5638201832771301, -0.5222243666648865, -0.48062852025032043, -0.4390326738357544, -0.39743685722351074, -0.3558410406112671, -0.31424519419670105, -0.272649347782135, -0.23105353116989136, -0.1894576996564865, -0.14786186814308167, -0.10626602172851562, -0.06467020511627197, -0.023074373602867126, 0.01852145791053772, 0.060117289423942566, 0.10171312093734741, 0.14330895245075226, 0.1849047839641571, 0.22650063037872314, 0.2680964469909668, 0.30969226360321045, 0.3512881100177765, 0.39288395643234253, 0.4344797730445862, 0.47607558965682983, 0.5176714658737183, 0.5592672824859619, 0.6008630990982056, 0.6424589157104492, 0.6840547323226929, 0.7256506085395813, 0.767246425151825, 0.8088422417640686, 0.850438117980957, 0.8920339345932007, 0.9336297512054443, 0.975225567817688, 1.0168213844299316, 1.0584172010421753, 1.100013017654419, 1.1416089534759521, 1.1832047700881958, 1.2248005867004395, 1.266396403312683, 1.3079922199249268, 1.3495880365371704, 1.391183853149414, 1.4327797889709473, 1.474375605583191, 1.5159714221954346, 1.5575672388076782, 1.5991630554199219]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 0.0, 3.0, 12.0, 8.0, 11.0, 9.0, 10.0, 7.0, 10.0, 12.0, 20.0, 20.0, 19.0, 25.0, 33.0, 29.0, 34.0, 30.0, 36.0, 44.0, 36.0, 50.0, 34.0, 33.0, 40.0, 31.0, 33.0, 29.0, 35.0, 24.0, 28.0, 33.0, 35.0, 20.0, 18.0, 25.0, 14.0, 18.0, 10.0, 8.0, 10.0, 11.0, 9.0, 11.0, 8.0, 8.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0], "bins": [-0.3973597288131714, -0.38521525263786316, -0.37307077646255493, -0.3609262704849243, -0.3487817943096161, -0.33663731813430786, -0.32449284195899963, -0.3123483657836914, -0.3002038598060608, -0.28805938363075256, -0.27591490745544434, -0.2637704014778137, -0.2516259253025055, -0.23948144912719727, -0.22733697295188904, -0.2151924967765808, -0.20304802060127258, -0.19090354442596436, -0.17875905334949493, -0.1666145771741867, -0.15447008609771729, -0.14232560992240906, -0.13018113374710083, -0.118036650121212, -0.10589216649532318, -0.09374768286943436, -0.08160319924354553, -0.0694587230682373, -0.05731423944234848, -0.045169755816459656, -0.03302527964115143, -0.020880796015262604, -0.00873631238937378, 0.003408169373869896, 0.015552651137113571, 0.027697131037712097, 0.03984161466360092, 0.051986098289489746, 0.06413057446479797, 0.0762750580906868, 0.08841954171657562, 0.10056402534246445, 0.11270850896835327, 0.1248529851436615, 0.13699746131896973, 0.14914195239543915, 0.16128642857074738, 0.1734309196472168, 0.18557539582252502, 0.19771987199783325, 0.20986436307430267, 0.2220088392496109, 0.23415333032608032, 0.24629780650138855, 0.2584422826766968, 0.270586758852005, 0.28273123502731323, 0.29487571120262146, 0.3070201873779297, 0.3191646933555603, 0.33130916953086853, 0.34345364570617676, 0.355598121881485, 0.3677425980567932, 0.37988710403442383]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 7.0, 5.0, 6.0, 10.0, 10.0, 8.0, 18.0, 14.0, 22.0, 30.0, 32.0, 52.0, 106.0, 157.0, 396.0, 1431.0, 7548.0, 4122418.0, 56029.0, 4085.0, 1044.0, 403.0, 168.0, 121.0, 55.0, 44.0, 23.0, 13.0, 9.0, 6.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.609375, -0.5936851501464844, -0.5779953002929688, -0.5623054504394531, -0.5466156005859375, -0.5309257507324219, -0.5152359008789062, -0.4995460510253906, -0.483856201171875, -0.4681663513183594, -0.45247650146484375, -0.4367866516113281, -0.4210968017578125, -0.4054069519042969, -0.38971710205078125, -0.3740272521972656, -0.35833740234375, -0.3426475524902344, -0.32695770263671875, -0.3112678527832031, -0.2955780029296875, -0.2798881530761719, -0.26419830322265625, -0.24850845336914062, -0.232818603515625, -0.21712875366210938, -0.20143890380859375, -0.18574905395507812, -0.1700592041015625, -0.15436935424804688, -0.13867950439453125, -0.12298965454101562, -0.1072998046875, -0.09160995483398438, -0.07592010498046875, -0.060230255126953125, -0.0445404052734375, -0.028850555419921875, -0.01316070556640625, 0.002529144287109375, 0.018218994140625, 0.033908843994140625, 0.04959869384765625, 0.06528854370117188, 0.0809783935546875, 0.09666824340820312, 0.11235809326171875, 0.12804794311523438, 0.14373779296875, 0.15942764282226562, 0.17511749267578125, 0.19080734252929688, 0.2064971923828125, 0.22218704223632812, 0.23787689208984375, 0.2535667419433594, 0.269256591796875, 0.2849464416503906, 0.30063629150390625, 0.3163261413574219, 0.3320159912109375, 0.3477058410644531, 0.36339569091796875, 0.3790855407714844, 0.394775390625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 10.0, 22.0, 37.0, 63.0, 117.0, 131.0, 178.0, 140.0, 117.0, 101.0, 40.0, 21.0, 9.0, 4.0, 0.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11468505859375, -0.11186885833740234, -0.10905265808105469, -0.10623645782470703, -0.10342025756835938, -0.10060405731201172, -0.09778785705566406, -0.0949716567993164, -0.09215545654296875, -0.0893392562866211, -0.08652305603027344, -0.08370685577392578, -0.08089065551757812, -0.07807445526123047, -0.07525825500488281, -0.07244205474853516, -0.0696258544921875, -0.06680965423583984, -0.06399345397949219, -0.06117725372314453, -0.058361053466796875, -0.05554485321044922, -0.05272865295410156, -0.049912452697753906, -0.04709625244140625, -0.044280052185058594, -0.04146385192871094, -0.03864765167236328, -0.035831451416015625, -0.03301525115966797, -0.030199050903320312, -0.027382850646972656, -0.024566650390625, -0.021750450134277344, -0.018934249877929688, -0.01611804962158203, -0.013301849365234375, -0.010485649108886719, -0.0076694488525390625, -0.004853248596191406, -0.00203704833984375, 0.0007791519165039062, 0.0035953521728515625, 0.006411552429199219, 0.009227752685546875, 0.012043952941894531, 0.014860153198242188, 0.017676353454589844, 0.0204925537109375, 0.023308753967285156, 0.026124954223632812, 0.02894115447998047, 0.031757354736328125, 0.03457355499267578, 0.03738975524902344, 0.040205955505371094, 0.04302215576171875, 0.045838356018066406, 0.04865455627441406, 0.05147075653076172, 0.054286956787109375, 0.05710315704345703, 0.05991935729980469, 0.06273555755615234, 0.0655517578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 13.0, 16.0, 13.0, 15.0, 40.0, 68.0, 103.0, 149.0, 272.0, 499.0, 940.0, 2103.0, 5734.0, 23111.0, 4008737.0, 132143.0, 12976.0, 3962.0, 1612.0, 772.0, 410.0, 208.0, 127.0, 97.0, 51.0, 30.0, 24.0, 22.0, 16.0, 8.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.287353515625, -0.27955055236816406, -0.2717475891113281, -0.2639446258544922, -0.25614166259765625, -0.2483386993408203, -0.24053573608398438, -0.23273277282714844, -0.2249298095703125, -0.21712684631347656, -0.20932388305664062, -0.2015209197998047, -0.19371795654296875, -0.1859149932861328, -0.17811203002929688, -0.17030906677246094, -0.162506103515625, -0.15470314025878906, -0.14690017700195312, -0.1390972137451172, -0.13129425048828125, -0.12349128723144531, -0.11568832397460938, -0.10788536071777344, -0.1000823974609375, -0.09227943420410156, -0.08447647094726562, -0.07667350769042969, -0.06887054443359375, -0.06106758117675781, -0.053264617919921875, -0.04546165466308594, -0.03765869140625, -0.029855728149414062, -0.022052764892578125, -0.014249801635742188, -0.00644683837890625, 0.0013561248779296875, 0.009159088134765625, 0.016962051391601562, 0.0247650146484375, 0.03256797790527344, 0.040370941162109375, 0.04817390441894531, 0.05597686767578125, 0.06377983093261719, 0.07158279418945312, 0.07938575744628906, 0.087188720703125, 0.09499168395996094, 0.10279464721679688, 0.11059761047363281, 0.11840057373046875, 0.1262035369873047, 0.13400650024414062, 0.14180946350097656, 0.1496124267578125, 0.15741539001464844, 0.16521835327148438, 0.1730213165283203, 0.18082427978515625, 0.1886272430419922, 0.19643020629882812, 0.20423316955566406, 0.2120361328125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 2.0, 5.0, 10.0, 11.0, 20.0, 40.0, 138.0, 3649.0, 111.0, 40.0, 21.0, 11.0, 3.0, 4.0, 1.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09356689453125, -0.08988666534423828, -0.08620643615722656, -0.08252620697021484, -0.07884597778320312, -0.0751657485961914, -0.07148551940917969, -0.06780529022216797, -0.06412506103515625, -0.06044483184814453, -0.05676460266113281, -0.053084373474121094, -0.049404144287109375, -0.045723915100097656, -0.04204368591308594, -0.03836345672607422, -0.0346832275390625, -0.03100299835205078, -0.027322769165039062, -0.023642539978027344, -0.019962310791015625, -0.016282081604003906, -0.012601852416992188, -0.008921623229980469, -0.00524139404296875, -0.0015611648559570312, 0.0021190643310546875, 0.005799293518066406, 0.009479522705078125, 0.013159751892089844, 0.016839981079101562, 0.02052021026611328, 0.024200439453125, 0.02788066864013672, 0.03156089782714844, 0.035241127014160156, 0.038921356201171875, 0.042601585388183594, 0.04628181457519531, 0.04996204376220703, 0.05364227294921875, 0.05732250213623047, 0.06100273132324219, 0.0646829605102539, 0.06836318969726562, 0.07204341888427734, 0.07572364807128906, 0.07940387725830078, 0.0830841064453125, 0.08676433563232422, 0.09044456481933594, 0.09412479400634766, 0.09780502319335938, 0.1014852523803711, 0.10516548156738281, 0.10884571075439453, 0.11252593994140625, 0.11620616912841797, 0.11988639831542969, 0.1235666275024414, 0.12724685668945312, 0.13092708587646484, 0.13460731506347656, 0.13828754425048828, 0.1419677734375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 24.0, 144.0, 556.0, 205.0, 53.0, 11.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7478407621383667, -0.7255522012710571, -0.7032635807991028, -0.6809750199317932, -0.6586863994598389, -0.6363978385925293, -0.6141092777252197, -0.5918206572532654, -0.569532036781311, -0.5472434759140015, -0.5249548554420471, -0.5026662945747375, -0.4803776741027832, -0.45808911323547363, -0.4358005225658417, -0.4135119318962097, -0.39122337102890015, -0.3689347803592682, -0.34664618968963623, -0.32435762882232666, -0.3020690083503723, -0.27978044748306274, -0.2574918568134308, -0.23520326614379883, -0.21291467547416687, -0.1906260848045349, -0.16833749413490295, -0.1460489183664322, -0.12376032769680023, -0.10147173702716827, -0.07918316125869751, -0.05689457058906555, -0.034605979919433594, -0.012317392975091934, 0.009971193969249725, 0.032259777188301086, 0.054548367857933044, 0.076836958527565, 0.09912553429603577, 0.12141412496566772, 0.14370271563529968, 0.16599130630493164, 0.1882798969745636, 0.21056847274303436, 0.23285706341266632, 0.2551456689834595, 0.27743422985076904, 0.299722820520401, 0.32201141119003296, 0.3443000018596649, 0.3665885925292969, 0.38887715339660645, 0.4111657738685608, 0.43345433473587036, 0.4557429254055023, 0.4780315160751343, 0.5003200769424438, 0.5226086378097534, 0.5448972582817078, 0.5671858191490173, 0.5894744396209717, 0.6117630004882812, 0.6340515613555908, 0.6563401818275452, 0.6786288022994995]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 12.0, 19.0, 49.0, 75.0, 124.0, 137.0, 116.0, 143.0, 120.0, 90.0, 59.0, 23.0, 18.0, 12.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.486997127532959, -0.4758654236793518, -0.46473371982574463, -0.45360201597213745, -0.4424703121185303, -0.4313386082649231, -0.4202069044113159, -0.40907520055770874, -0.39794349670410156, -0.3868117928504944, -0.3756800889968872, -0.36454838514328003, -0.35341668128967285, -0.3422849774360657, -0.3311532735824585, -0.3200215697288513, -0.30888983607292175, -0.2977581322193146, -0.2866264283657074, -0.2754947245121002, -0.26436302065849304, -0.25323131680488586, -0.2420995980501175, -0.23096789419651031, -0.21983619034290314, -0.20870448648929596, -0.19757278263568878, -0.1864410638809204, -0.17530936002731323, -0.16417765617370605, -0.15304595232009888, -0.1419142484664917, -0.13078254461288452, -0.11965084075927734, -0.10851913690567017, -0.09738742560148239, -0.08625572174787521, -0.07512401789426804, -0.06399230659008026, -0.052860602736473083, -0.041728898882865906, -0.03059719316661358, -0.019465487450361252, -0.008333779871463776, 0.002797923982143402, 0.01392962783575058, 0.025061339139938354, 0.03619304299354553, 0.04732474684715271, 0.05845645070075989, 0.06958815455436707, 0.08071986585855484, 0.09185156971216202, 0.1029832735657692, 0.11411498486995697, 0.12524668872356415, 0.13637839257717133, 0.1475100964307785, 0.15864180028438568, 0.16977351903915405, 0.18090522289276123, 0.1920369267463684, 0.20316863059997559, 0.21430033445358276, 0.22543203830718994]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 8.0, 5.0, 16.0, 21.0, 20.0, 27.0, 45.0, 36.0, 56.0, 95.0, 114.0, 154.0, 196.0, 291.0, 404.0, 630.0, 1052.0, 1769.0, 4042.0, 14277.0, 86033.0, 640936.0, 252983.0, 31933.0, 7043.0, 2537.0, 1314.0, 754.0, 498.0, 332.0, 246.0, 171.0, 119.0, 88.0, 68.0, 48.0, 40.0, 49.0, 25.0, 14.0, 12.0, 14.0, 9.0, 8.0, 9.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.21728515625, -0.20998001098632812, -0.20267486572265625, -0.19536972045898438, -0.1880645751953125, -0.18075942993164062, -0.17345428466796875, -0.16614913940429688, -0.158843994140625, -0.15153884887695312, -0.14423370361328125, -0.13692855834960938, -0.1296234130859375, -0.12231826782226562, -0.11501312255859375, -0.10770797729492188, -0.10040283203125, -0.09309768676757812, -0.08579254150390625, -0.07848739624023438, -0.0711822509765625, -0.06387710571289062, -0.05657196044921875, -0.049266815185546875, -0.041961669921875, -0.034656524658203125, -0.02735137939453125, -0.020046234130859375, -0.0127410888671875, -0.005435943603515625, 0.00186920166015625, 0.009174346923828125, 0.0164794921875, 0.023784637451171875, 0.03108978271484375, 0.038394927978515625, 0.0457000732421875, 0.053005218505859375, 0.06031036376953125, 0.06761550903320312, 0.074920654296875, 0.08222579956054688, 0.08953094482421875, 0.09683609008789062, 0.1041412353515625, 0.11144638061523438, 0.11875152587890625, 0.12605667114257812, 0.13336181640625, 0.14066696166992188, 0.14797210693359375, 0.15527725219726562, 0.1625823974609375, 0.16988754272460938, 0.17719268798828125, 0.18449783325195312, 0.191802978515625, 0.19910812377929688, 0.20641326904296875, 0.21371841430664062, 0.2210235595703125, 0.22832870483398438, 0.23563385009765625, 0.24293899536132812, 0.250244140625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 17.0, 43.0, 62.0, 119.0, 144.0, 183.0, 141.0, 129.0, 88.0, 35.0, 15.0, 6.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12371826171875, -0.12074565887451172, -0.11777305603027344, -0.11480045318603516, -0.11182785034179688, -0.1088552474975586, -0.10588264465332031, -0.10291004180908203, -0.09993743896484375, -0.09696483612060547, -0.09399223327636719, -0.0910196304321289, -0.08804702758789062, -0.08507442474365234, -0.08210182189941406, -0.07912921905517578, -0.0761566162109375, -0.07318401336669922, -0.07021141052246094, -0.06723880767822266, -0.06426620483398438, -0.061293601989746094, -0.05832099914550781, -0.05534839630126953, -0.05237579345703125, -0.04940319061279297, -0.04643058776855469, -0.043457984924316406, -0.040485382080078125, -0.037512779235839844, -0.03454017639160156, -0.03156757354736328, -0.028594970703125, -0.02562236785888672, -0.022649765014648438, -0.019677162170410156, -0.016704559326171875, -0.013731956481933594, -0.010759353637695312, -0.007786750793457031, -0.00481414794921875, -0.0018415451049804688, 0.0011310577392578125, 0.004103660583496094, 0.007076263427734375, 0.010048866271972656, 0.013021469116210938, 0.01599407196044922, 0.0189666748046875, 0.02193927764892578, 0.024911880493164062, 0.027884483337402344, 0.030857086181640625, 0.033829689025878906, 0.03680229187011719, 0.03977489471435547, 0.04274749755859375, 0.04572010040283203, 0.04869270324707031, 0.051665306091308594, 0.054637908935546875, 0.057610511779785156, 0.06058311462402344, 0.06355571746826172, 0.0665283203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 5.0, 2.0, 7.0, 16.0, 27.0, 24.0, 40.0, 54.0, 82.0, 152.0, 279.0, 528.0, 1011.0, 2137.0, 4788.0, 11331.0, 28437.0, 75570.0, 213206.0, 425467.0, 178766.0, 63867.0, 24509.0, 9964.0, 4191.0, 1981.0, 966.0, 493.0, 254.0, 143.0, 86.0, 50.0, 33.0, 21.0, 22.0, 9.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09405517578125, -0.09115409851074219, -0.08825302124023438, -0.08535194396972656, -0.08245086669921875, -0.07954978942871094, -0.07664871215820312, -0.07374763488769531, -0.0708465576171875, -0.06794548034667969, -0.06504440307617188, -0.06214332580566406, -0.05924224853515625, -0.05634117126464844, -0.053440093994140625, -0.05053901672363281, -0.047637939453125, -0.04473686218261719, -0.041835784912109375, -0.03893470764160156, -0.03603363037109375, -0.03313255310058594, -0.030231475830078125, -0.027330398559570312, -0.0244293212890625, -0.021528244018554688, -0.018627166748046875, -0.015726089477539062, -0.01282501220703125, -0.009923934936523438, -0.007022857666015625, -0.0041217803955078125, -0.001220703125, 0.0016803741455078125, 0.004581451416015625, 0.0074825286865234375, 0.01038360595703125, 0.013284683227539062, 0.016185760498046875, 0.019086837768554688, 0.0219879150390625, 0.024888992309570312, 0.027790069580078125, 0.030691146850585938, 0.03359222412109375, 0.03649330139160156, 0.039394378662109375, 0.04229545593261719, 0.045196533203125, 0.04809761047363281, 0.050998687744140625, 0.05389976501464844, 0.05680084228515625, 0.05970191955566406, 0.06260299682617188, 0.06550407409667969, 0.0684051513671875, 0.07130622863769531, 0.07420730590820312, 0.07710838317871094, 0.08000946044921875, 0.08291053771972656, 0.08581161499023438, 0.08871269226074219, 0.09161376953125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 1.0, 3.0, 8.0, 7.0, 11.0, 3.0, 18.0, 17.0, 14.0, 20.0, 21.0, 25.0, 38.0, 32.0, 35.0, 28.0, 28.0, 42.0, 29.0, 47.0, 49.0, 45.0, 43.0, 45.0, 36.0, 44.0, 41.0, 32.0, 35.0, 23.0, 28.0, 21.0, 24.0, 21.0, 17.0, 7.0, 13.0, 4.0, 12.0, 8.0, 6.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.100830078125, -0.09771060943603516, -0.09459114074707031, -0.09147167205810547, -0.08835220336914062, -0.08523273468017578, -0.08211326599121094, -0.0789937973022461, -0.07587432861328125, -0.0727548599243164, -0.06963539123535156, -0.06651592254638672, -0.06339645385742188, -0.06027698516845703, -0.05715751647949219, -0.054038047790527344, -0.0509185791015625, -0.047799110412597656, -0.04467964172363281, -0.04156017303466797, -0.038440704345703125, -0.03532123565673828, -0.03220176696777344, -0.029082298278808594, -0.02596282958984375, -0.022843360900878906, -0.019723892211914062, -0.01660442352294922, -0.013484954833984375, -0.010365486145019531, -0.0072460174560546875, -0.004126548767089844, -0.001007080078125, 0.0021123886108398438, 0.0052318572998046875, 0.008351325988769531, 0.011470794677734375, 0.014590263366699219, 0.017709732055664062, 0.020829200744628906, 0.02394866943359375, 0.027068138122558594, 0.030187606811523438, 0.03330707550048828, 0.036426544189453125, 0.03954601287841797, 0.04266548156738281, 0.045784950256347656, 0.0489044189453125, 0.052023887634277344, 0.05514335632324219, 0.05826282501220703, 0.061382293701171875, 0.06450176239013672, 0.06762123107910156, 0.0707406997680664, 0.07386016845703125, 0.0769796371459961, 0.08009910583496094, 0.08321857452392578, 0.08633804321289062, 0.08945751190185547, 0.09257698059082031, 0.09569644927978516, 0.09881591796875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 9.0, 15.0, 12.0, 16.0, 23.0, 57.0, 81.0, 134.0, 209.0, 395.0, 707.0, 1326.0, 2657.0, 6555.0, 18694.0, 68429.0, 423821.0, 426496.0, 68145.0, 18385.0, 6593.0, 2839.0, 1361.0, 709.0, 388.0, 192.0, 112.0, 63.0, 54.0, 24.0, 12.0, 12.0, 10.0, 12.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.04449462890625, -0.04332375526428223, -0.04215288162231445, -0.04098200798034668, -0.039811134338378906, -0.03864026069641113, -0.03746938705444336, -0.036298513412475586, -0.03512763977050781, -0.03395676612854004, -0.032785892486572266, -0.03161501884460449, -0.03044414520263672, -0.029273271560668945, -0.028102397918701172, -0.0269315242767334, -0.025760650634765625, -0.02458977699279785, -0.023418903350830078, -0.022248029708862305, -0.02107715606689453, -0.019906282424926758, -0.018735408782958984, -0.01756453514099121, -0.016393661499023438, -0.015222787857055664, -0.01405191421508789, -0.012881040573120117, -0.011710166931152344, -0.01053929328918457, -0.009368419647216797, -0.008197546005249023, -0.00702667236328125, -0.0058557987213134766, -0.004684925079345703, -0.0035140514373779297, -0.0023431777954101562, -0.0011723041534423828, -1.430511474609375e-06, 0.001169443130493164, 0.0023403167724609375, 0.003511190414428711, 0.004682064056396484, 0.005852937698364258, 0.007023811340332031, 0.008194684982299805, 0.009365558624267578, 0.010536432266235352, 0.011707305908203125, 0.012878179550170898, 0.014049053192138672, 0.015219926834106445, 0.01639080047607422, 0.017561674118041992, 0.018732547760009766, 0.01990342140197754, 0.021074295043945312, 0.022245168685913086, 0.02341604232788086, 0.024586915969848633, 0.025757789611816406, 0.02692866325378418, 0.028099536895751953, 0.029270410537719727, 0.0304412841796875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 6.0, 6.0, 5.0, 9.0, 14.0, 16.0, 27.0, 32.0, 60.0, 110.0, 244.0, 243.0, 84.0, 57.0, 29.0, 18.0, 13.0, 7.0, 7.0, 10.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017154216766357422, -0.0001659989356994629, -0.00016045570373535156, -0.00015491247177124023, -0.0001493692398071289, -0.00014382600784301758, -0.00013828277587890625, -0.00013273954391479492, -0.0001271963119506836, -0.00012165307998657227, -0.00011610984802246094, -0.00011056661605834961, -0.00010502338409423828, -9.948015213012695e-05, -9.393692016601562e-05, -8.83936882019043e-05, -8.285045623779297e-05, -7.730722427368164e-05, -7.176399230957031e-05, -6.622076034545898e-05, -6.0677528381347656e-05, -5.513429641723633e-05, -4.9591064453125e-05, -4.404783248901367e-05, -3.8504600524902344e-05, -3.2961368560791016e-05, -2.7418136596679688e-05, -2.187490463256836e-05, -1.633167266845703e-05, -1.0788440704345703e-05, -5.245208740234375e-06, 2.980232238769531e-07, 5.841255187988281e-06, 1.138448715209961e-05, 1.6927719116210938e-05, 2.2470951080322266e-05, 2.8014183044433594e-05, 3.355741500854492e-05, 3.910064697265625e-05, 4.464387893676758e-05, 5.0187110900878906e-05, 5.5730342864990234e-05, 6.127357482910156e-05, 6.681680679321289e-05, 7.236003875732422e-05, 7.790327072143555e-05, 8.344650268554688e-05, 8.89897346496582e-05, 9.453296661376953e-05, 0.00010007619857788086, 0.00010561943054199219, 0.00011116266250610352, 0.00011670589447021484, 0.00012224912643432617, 0.0001277923583984375, 0.00013333559036254883, 0.00013887882232666016, 0.00014442205429077148, 0.0001499652862548828, 0.00015550851821899414, 0.00016105175018310547, 0.0001665949821472168, 0.00017213821411132812, 0.00017768144607543945, 0.00018322467803955078]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 10.0, 14.0, 17.0, 18.0, 40.0, 90.0, 174.0, 293.0, 838.0, 2962.0, 13167.0, 90736.0, 731920.0, 180705.0, 21291.0, 4270.0, 1189.0, 431.0, 182.0, 88.0, 45.0, 39.0, 19.0, 9.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059295654296875, -0.0576319694519043, -0.055968284606933594, -0.05430459976196289, -0.05264091491699219, -0.050977230072021484, -0.04931354522705078, -0.04764986038208008, -0.045986175537109375, -0.04432249069213867, -0.04265880584716797, -0.040995121002197266, -0.03933143615722656, -0.03766775131225586, -0.036004066467285156, -0.03434038162231445, -0.03267669677734375, -0.031013011932373047, -0.029349327087402344, -0.02768564224243164, -0.026021957397460938, -0.024358272552490234, -0.02269458770751953, -0.021030902862548828, -0.019367218017578125, -0.017703533172607422, -0.01603984832763672, -0.014376163482666016, -0.012712478637695312, -0.01104879379272461, -0.009385108947753906, -0.007721424102783203, -0.0060577392578125, -0.004394054412841797, -0.0027303695678710938, -0.0010666847229003906, 0.0005970001220703125, 0.0022606849670410156, 0.003924369812011719, 0.005588054656982422, 0.007251739501953125, 0.008915424346923828, 0.010579109191894531, 0.012242794036865234, 0.013906478881835938, 0.01557016372680664, 0.017233848571777344, 0.018897533416748047, 0.02056121826171875, 0.022224903106689453, 0.023888587951660156, 0.02555227279663086, 0.027215957641601562, 0.028879642486572266, 0.03054332733154297, 0.03220701217651367, 0.033870697021484375, 0.03553438186645508, 0.03719806671142578, 0.038861751556396484, 0.04052543640136719, 0.04218912124633789, 0.043852806091308594, 0.0455164909362793, 0.04718017578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 4.0, 9.0, 15.0, 25.0, 30.0, 35.0, 55.0, 76.0, 104.0, 125.0, 110.0, 118.0, 100.0, 70.0, 45.0, 26.0, 17.0, 13.0, 7.0, 7.0, 8.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0640869140625, -0.06270146369934082, -0.06131601333618164, -0.05993056297302246, -0.05854511260986328, -0.0571596622467041, -0.05577421188354492, -0.05438876152038574, -0.05300331115722656, -0.05161786079406738, -0.0502324104309082, -0.04884696006774902, -0.047461509704589844, -0.046076059341430664, -0.044690608978271484, -0.043305158615112305, -0.041919708251953125, -0.040534257888793945, -0.039148807525634766, -0.037763357162475586, -0.036377906799316406, -0.03499245643615723, -0.03360700607299805, -0.03222155570983887, -0.030836105346679688, -0.029450654983520508, -0.028065204620361328, -0.02667975425720215, -0.02529430389404297, -0.02390885353088379, -0.02252340316772461, -0.02113795280456543, -0.01975250244140625, -0.01836705207824707, -0.01698160171508789, -0.015596151351928711, -0.014210700988769531, -0.012825250625610352, -0.011439800262451172, -0.010054349899291992, -0.008668899536132812, -0.007283449172973633, -0.005897998809814453, -0.0045125484466552734, -0.0031270980834960938, -0.001741647720336914, -0.0003561973571777344, 0.0010292530059814453, 0.002414703369140625, 0.0038001537322998047, 0.005185604095458984, 0.006571054458618164, 0.007956504821777344, 0.009341955184936523, 0.010727405548095703, 0.012112855911254883, 0.013498306274414062, 0.014883756637573242, 0.016269207000732422, 0.0176546573638916, 0.01904010772705078, 0.02042555809020996, 0.02181100845336914, 0.02319645881652832, 0.0245819091796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 12.0, 14.0, 15.0, 27.0, 44.0, 49.0, 94.0, 138.0, 133.0, 162.0, 107.0, 78.0, 41.0, 31.0, 14.0, 21.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0081660747528076, -0.9827969074249268, -0.9574277997016907, -0.9320586323738098, -0.9066895246505737, -0.8813203573226929, -0.855951189994812, -0.8305820822715759, -0.8052129745483398, -0.779843807220459, -0.7544746994972229, -0.729105532169342, -0.703736424446106, -0.6783672571182251, -0.6529980897903442, -0.6276289820671082, -0.6022598147392273, -0.5768906474113464, -0.5515215396881104, -0.5261523723602295, -0.5007832646369934, -0.47541409730911255, -0.4500449597835541, -0.4246758222579956, -0.39930668473243713, -0.37393754720687866, -0.3485684096813202, -0.3231992721557617, -0.29783010482788086, -0.2724609971046448, -0.24709182977676392, -0.22172269225120544, -0.19635355472564697, -0.1709844172000885, -0.14561527967453003, -0.12024612724781036, -0.09487698972225189, -0.06950785219669342, -0.044138699769973755, -0.018769562244415283, 0.0065995752811431885, 0.03196871653199196, 0.05733785778284073, 0.0827070027589798, 0.10807614028453827, 0.13344527781009674, 0.1588144302368164, 0.18418356776237488, 0.20955270528793335, 0.23492184281349182, 0.2602909803390503, 0.28566014766693115, 0.31102925539016724, 0.3363984227180481, 0.36176756024360657, 0.38713669776916504, 0.4125058352947235, 0.437874972820282, 0.46324411034584045, 0.4886132478713989, 0.5139824151992798, 0.5393515229225159, 0.5647206902503967, 0.5900897979736328, 0.6154589653015137]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 8.0, 4.0, 8.0, 6.0, 13.0, 18.0, 21.0, 21.0, 29.0, 26.0, 25.0, 34.0, 35.0, 43.0, 49.0, 34.0, 53.0, 51.0, 54.0, 54.0, 37.0, 43.0, 52.0, 40.0, 33.0, 32.0, 28.0, 21.0, 26.0, 17.0, 13.0, 18.0, 11.0, 10.0, 8.0, 10.0, 7.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5147621631622314, -0.4973222017288208, -0.47988224029541016, -0.4624422788619995, -0.44500231742858887, -0.4275623559951782, -0.41012242436408997, -0.3926824629306793, -0.3752425014972687, -0.35780254006385803, -0.3403625786304474, -0.32292261719703674, -0.3054826855659485, -0.28804272413253784, -0.2706027626991272, -0.25316280126571655, -0.2357228398323059, -0.21828287839889526, -0.20084291696548462, -0.18340297043323517, -0.16596300899982452, -0.14852304756641388, -0.13108310103416443, -0.11364313960075378, -0.09620317816734314, -0.0787632167339325, -0.06132326275110245, -0.0438833050429821, -0.026443347334861755, -0.00900338590145111, 0.008436568081378937, 0.025876522064208984, 0.04331648349761963, 0.060756441205739975, 0.07819639891386032, 0.09563635289669037, 0.11307631433010101, 0.13051627576351166, 0.1479562222957611, 0.16539618372917175, 0.1828361451625824, 0.20027610659599304, 0.2177160680294037, 0.23515601456165314, 0.2525959610939026, 0.27003592252731323, 0.2874758839607239, 0.3049158453941345, 0.32235580682754517, 0.3397957682609558, 0.35723572969436646, 0.3746756911277771, 0.39211565256118774, 0.4095556139945984, 0.42699554562568665, 0.4444355070590973, 0.46187546849250793, 0.4793154299259186, 0.4967553913593292, 0.5141953229904175, 0.5316352844238281, 0.5490752458572388, 0.5665152072906494, 0.5839551687240601, 0.6013951301574707]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 4.0, 5.0, 5.0, 11.0, 6.0, 11.0, 10.0, 10.0, 15.0, 16.0, 23.0, 26.0, 28.0, 58.0, 67.0, 125.0, 220.0, 512.0, 1495.0, 5942.0, 107310.0, 4065869.0, 8825.0, 2127.0, 743.0, 334.0, 161.0, 103.0, 78.0, 42.0, 31.0, 24.0, 7.0, 11.0, 6.0, 8.0, 5.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.6025390625, -0.5885581970214844, -0.5745773315429688, -0.5605964660644531, -0.5466156005859375, -0.5326347351074219, -0.5186538696289062, -0.5046730041503906, -0.490692138671875, -0.4767112731933594, -0.46273040771484375, -0.4487495422363281, -0.4347686767578125, -0.4207878112792969, -0.40680694580078125, -0.3928260803222656, -0.37884521484375, -0.3648643493652344, -0.35088348388671875, -0.3369026184082031, -0.3229217529296875, -0.3089408874511719, -0.29496002197265625, -0.2809791564941406, -0.266998291015625, -0.2530174255371094, -0.23903656005859375, -0.22505569458007812, -0.2110748291015625, -0.19709396362304688, -0.18311309814453125, -0.16913223266601562, -0.1551513671875, -0.14117050170898438, -0.12718963623046875, -0.11320877075195312, -0.0992279052734375, -0.08524703979492188, -0.07126617431640625, -0.057285308837890625, -0.043304443359375, -0.029323577880859375, -0.01534271240234375, -0.001361846923828125, 0.0126190185546875, 0.026599884033203125, 0.04058074951171875, 0.054561614990234375, 0.06854248046875, 0.08252334594726562, 0.09650421142578125, 0.11048507690429688, 0.1244659423828125, 0.13844680786132812, 0.15242767333984375, 0.16640853881835938, 0.180389404296875, 0.19437026977539062, 0.20835113525390625, 0.22233200073242188, 0.2363128662109375, 0.2502937316894531, 0.26427459716796875, 0.2782554626464844, 0.292236328125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 19.0, 40.0, 61.0, 102.0, 150.0, 191.0, 161.0, 118.0, 81.0, 46.0, 10.0, 4.0, 5.0, 1.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1253662109375, -0.1223592758178711, -0.11935234069824219, -0.11634540557861328, -0.11333847045898438, -0.11033153533935547, -0.10732460021972656, -0.10431766510009766, -0.10131072998046875, -0.09830379486083984, -0.09529685974121094, -0.09228992462158203, -0.08928298950195312, -0.08627605438232422, -0.08326911926269531, -0.0802621841430664, -0.0772552490234375, -0.0742483139038086, -0.07124137878417969, -0.06823444366455078, -0.06522750854492188, -0.06222057342529297, -0.05921363830566406, -0.056206703186035156, -0.05319976806640625, -0.050192832946777344, -0.04718589782714844, -0.04417896270751953, -0.041172027587890625, -0.03816509246826172, -0.03515815734863281, -0.032151222229003906, -0.029144287109375, -0.026137351989746094, -0.023130416870117188, -0.02012348175048828, -0.017116546630859375, -0.014109611511230469, -0.011102676391601562, -0.008095741271972656, -0.00508880615234375, -0.0020818710327148438, 0.0009250640869140625, 0.003931999206542969, 0.006938934326171875, 0.009945869445800781, 0.012952804565429688, 0.015959739685058594, 0.0189666748046875, 0.021973609924316406, 0.024980545043945312, 0.02798748016357422, 0.030994415283203125, 0.03400135040283203, 0.03700828552246094, 0.040015220642089844, 0.04302215576171875, 0.046029090881347656, 0.04903602600097656, 0.05204296112060547, 0.055049896240234375, 0.05805683135986328, 0.06106376647949219, 0.0640707015991211, 0.06707763671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 13.0, 18.0, 18.0, 34.0, 37.0, 74.0, 97.0, 187.0, 342.0, 768.0, 2055.0, 6661.0, 40218.0, 4088710.0, 44314.0, 7056.0, 1994.0, 786.0, 363.0, 200.0, 116.0, 72.0, 51.0, 29.0, 20.0, 11.0, 15.0, 5.0, 3.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2471923828125, -0.2378711700439453, -0.22854995727539062, -0.21922874450683594, -0.20990753173828125, -0.20058631896972656, -0.19126510620117188, -0.1819438934326172, -0.1726226806640625, -0.1633014678955078, -0.15398025512695312, -0.14465904235839844, -0.13533782958984375, -0.12601661682128906, -0.11669540405273438, -0.10737419128417969, -0.098052978515625, -0.08873176574707031, -0.07941055297851562, -0.07008934020996094, -0.06076812744140625, -0.05144691467285156, -0.042125701904296875, -0.03280448913574219, -0.0234832763671875, -0.014162063598632812, -0.004840850830078125, 0.0044803619384765625, 0.01380157470703125, 0.023122787475585938, 0.032444000244140625, 0.04176521301269531, 0.05108642578125, 0.06040763854980469, 0.06972885131835938, 0.07905006408691406, 0.08837127685546875, 0.09769248962402344, 0.10701370239257812, 0.11633491516113281, 0.1256561279296875, 0.1349773406982422, 0.14429855346679688, 0.15361976623535156, 0.16294097900390625, 0.17226219177246094, 0.18158340454101562, 0.1909046173095703, 0.200225830078125, 0.2095470428466797, 0.21886825561523438, 0.22818946838378906, 0.23751068115234375, 0.24683189392089844, 0.2561531066894531, 0.2654743194580078, 0.2747955322265625, 0.2841167449951172, 0.2934379577636719, 0.30275917053222656, 0.31208038330078125, 0.32140159606933594, 0.3307228088378906, 0.3400440216064453, 0.349365234375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 5.0, 4.0, 8.0, 8.0, 9.0, 17.0, 28.0, 72.0, 3430.0, 363.0, 60.0, 32.0, 17.0, 9.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11749267578125, -0.11327266693115234, -0.10905265808105469, -0.10483264923095703, -0.10061264038085938, -0.09639263153076172, -0.09217262268066406, -0.0879526138305664, -0.08373260498046875, -0.0795125961303711, -0.07529258728027344, -0.07107257843017578, -0.06685256958007812, -0.06263256072998047, -0.05841255187988281, -0.054192543029785156, -0.0499725341796875, -0.045752525329589844, -0.04153251647949219, -0.03731250762939453, -0.033092498779296875, -0.02887248992919922, -0.024652481079101562, -0.020432472229003906, -0.01621246337890625, -0.011992454528808594, -0.0077724456787109375, -0.0035524368286132812, 0.000667572021484375, 0.004887580871582031, 0.009107589721679688, 0.013327598571777344, 0.017547607421875, 0.021767616271972656, 0.025987625122070312, 0.03020763397216797, 0.034427642822265625, 0.03864765167236328, 0.04286766052246094, 0.047087669372558594, 0.05130767822265625, 0.055527687072753906, 0.05974769592285156, 0.06396770477294922, 0.06818771362304688, 0.07240772247314453, 0.07662773132324219, 0.08084774017333984, 0.0850677490234375, 0.08928775787353516, 0.09350776672363281, 0.09772777557373047, 0.10194778442382812, 0.10616779327392578, 0.11038780212402344, 0.1146078109741211, 0.11882781982421875, 0.1230478286743164, 0.12726783752441406, 0.13148784637451172, 0.13570785522460938, 0.13992786407470703, 0.1441478729248047, 0.14836788177490234, 0.152587890625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 10.0, 19.0, 55.0, 217.0, 447.0, 169.0, 47.0, 18.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9195607900619507, -0.8955643177032471, -0.8715678453445435, -0.8475714325904846, -0.823574960231781, -0.7995784878730774, -0.7755820751190186, -0.7515856027603149, -0.7275891304016113, -0.7035926580429077, -0.6795961856842041, -0.6555997729301453, -0.6316033005714417, -0.607606828212738, -0.5836104154586792, -0.5596139430999756, -0.535617470741272, -0.5116209983825684, -0.48762455582618713, -0.4636281132698059, -0.4396316409111023, -0.4156351685523987, -0.39163872599601746, -0.36764228343963623, -0.3436458110809326, -0.319649338722229, -0.2956528961658478, -0.27165645360946655, -0.24765998125076294, -0.22366352379322052, -0.1996670663356781, -0.17567060887813568, -0.15167415142059326, -0.12767769396305084, -0.10368123650550842, -0.079684779047966, -0.055688321590423584, -0.031691864132881165, -0.007695406675338745, 0.016301050782203674, 0.040297508239746094, 0.06429396569728851, 0.08829042315483093, 0.11228688061237335, 0.13628333806991577, 0.1602797955274582, 0.1842762529850006, 0.20827271044254303, 0.23226916790008545, 0.25626564025878906, 0.2802620828151703, 0.3042585253715515, 0.3282549977302551, 0.35225147008895874, 0.37624791264533997, 0.4002443552017212, 0.4242408275604248, 0.4482372999191284, 0.47223374247550964, 0.49623018503189087, 0.5202266573905945, 0.5442231297492981, 0.5682195425033569, 0.5922160148620605, 0.6162124872207642]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 4.0, 11.0, 17.0, 23.0, 49.0, 58.0, 78.0, 97.0, 101.0, 127.0, 77.0, 102.0, 69.0, 53.0, 42.0, 34.0, 24.0, 11.0, 7.0, 5.0, 6.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.36791157722473145, -0.3569802939891815, -0.3460490107536316, -0.33511772751808167, -0.32418644428253174, -0.3132551610469818, -0.3023238778114319, -0.29139259457588196, -0.28046131134033203, -0.2695300281047821, -0.2585987448692322, -0.24766746163368225, -0.23673617839813232, -0.2258048951625824, -0.21487361192703247, -0.20394232869148254, -0.19301104545593262, -0.1820797622203827, -0.17114847898483276, -0.16021719574928284, -0.1492859125137329, -0.13835462927818298, -0.12742334604263306, -0.11649206280708313, -0.1055607795715332, -0.09462949633598328, -0.08369821310043335, -0.07276692986488342, -0.061835646629333496, -0.05090436339378357, -0.03997308015823364, -0.029041796922683716, -0.01811051368713379, -0.007179230451583862, 0.0037520527839660645, 0.014683336019515991, 0.025614619255065918, 0.036545902490615845, 0.04747718572616577, 0.0584084689617157, 0.06933975219726562, 0.08027103543281555, 0.09120231866836548, 0.1021336019039154, 0.11306488513946533, 0.12399616837501526, 0.13492745161056519, 0.1458587348461151, 0.15679001808166504, 0.16772130131721497, 0.1786525845527649, 0.18958386778831482, 0.20051515102386475, 0.21144643425941467, 0.2223777174949646, 0.23330900073051453, 0.24424028396606445, 0.2551715672016144, 0.2661028504371643, 0.27703413367271423, 0.28796541690826416, 0.2988967001438141, 0.309827983379364, 0.32075926661491394, 0.33169054985046387]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 7.0, 13.0, 14.0, 7.0, 17.0, 23.0, 37.0, 68.0, 71.0, 110.0, 156.0, 224.0, 372.0, 701.0, 1149.0, 2705.0, 8919.0, 80115.0, 805894.0, 129604.0, 12067.0, 2980.0, 1332.0, 691.0, 427.0, 256.0, 202.0, 119.0, 73.0, 46.0, 43.0, 27.0, 35.0, 17.0, 11.0, 6.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.361328125, -0.3502388000488281, -0.33914947509765625, -0.3280601501464844, -0.3169708251953125, -0.3058815002441406, -0.29479217529296875, -0.2837028503417969, -0.272613525390625, -0.2615242004394531, -0.25043487548828125, -0.23934555053710938, -0.2282562255859375, -0.21716690063476562, -0.20607757568359375, -0.19498825073242188, -0.18389892578125, -0.17280960083007812, -0.16172027587890625, -0.15063095092773438, -0.1395416259765625, -0.12845230102539062, -0.11736297607421875, -0.10627365112304688, -0.095184326171875, -0.08409500122070312, -0.07300567626953125, -0.061916351318359375, -0.0508270263671875, -0.039737701416015625, -0.02864837646484375, -0.017559051513671875, -0.0064697265625, 0.004619598388671875, 0.01570892333984375, 0.026798248291015625, 0.0378875732421875, 0.048976898193359375, 0.06006622314453125, 0.07115554809570312, 0.082244873046875, 0.09333419799804688, 0.10442352294921875, 0.11551284790039062, 0.1266021728515625, 0.13769149780273438, 0.14878082275390625, 0.15987014770507812, 0.17095947265625, 0.18204879760742188, 0.19313812255859375, 0.20422744750976562, 0.2153167724609375, 0.22640609741210938, 0.23749542236328125, 0.24858474731445312, 0.259674072265625, 0.2707633972167969, 0.28185272216796875, 0.2929420471191406, 0.3040313720703125, 0.3151206970214844, 0.32621002197265625, 0.3372993469238281, 0.348388671875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 22.0, 39.0, 72.0, 109.0, 161.0, 201.0, 159.0, 103.0, 77.0, 25.0, 8.0, 8.0, 2.0, 1.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1278076171875, -0.1247243881225586, -0.12164115905761719, -0.11855792999267578, -0.11547470092773438, -0.11239147186279297, -0.10930824279785156, -0.10622501373291016, -0.10314178466796875, -0.10005855560302734, -0.09697532653808594, -0.09389209747314453, -0.09080886840820312, -0.08772563934326172, -0.08464241027832031, -0.0815591812133789, -0.0784759521484375, -0.0753927230834961, -0.07230949401855469, -0.06922626495361328, -0.06614303588867188, -0.06305980682373047, -0.05997657775878906, -0.056893348693847656, -0.05381011962890625, -0.050726890563964844, -0.04764366149902344, -0.04456043243408203, -0.041477203369140625, -0.03839397430419922, -0.03531074523925781, -0.032227516174316406, -0.029144287109375, -0.026061058044433594, -0.022977828979492188, -0.01989459991455078, -0.016811370849609375, -0.013728141784667969, -0.010644912719726562, -0.007561683654785156, -0.00447845458984375, -0.0013952255249023438, 0.0016880035400390625, 0.004771232604980469, 0.007854461669921875, 0.010937690734863281, 0.014020919799804688, 0.017104148864746094, 0.0201873779296875, 0.023270606994628906, 0.026353836059570312, 0.02943706512451172, 0.032520294189453125, 0.03560352325439453, 0.03868675231933594, 0.041769981384277344, 0.04485321044921875, 0.047936439514160156, 0.05101966857910156, 0.05410289764404297, 0.057186126708984375, 0.06026935577392578, 0.06335258483886719, 0.0664358139038086, 0.06951904296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 16.0, 22.0, 38.0, 61.0, 99.0, 165.0, 314.0, 603.0, 1612.0, 5041.0, 18565.0, 89839.0, 516311.0, 339996.0, 57057.0, 12707.0, 3686.0, 1287.0, 532.0, 258.0, 131.0, 71.0, 44.0, 29.0, 16.0, 22.0, 11.0, 5.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2044677734375, -0.1990680694580078, -0.19366836547851562, -0.18826866149902344, -0.18286895751953125, -0.17746925354003906, -0.17206954956054688, -0.1666698455810547, -0.1612701416015625, -0.1558704376220703, -0.15047073364257812, -0.14507102966308594, -0.13967132568359375, -0.13427162170410156, -0.12887191772460938, -0.12347221374511719, -0.118072509765625, -0.11267280578613281, -0.10727310180664062, -0.10187339782714844, -0.09647369384765625, -0.09107398986816406, -0.08567428588867188, -0.08027458190917969, -0.0748748779296875, -0.06947517395019531, -0.06407546997070312, -0.05867576599121094, -0.05327606201171875, -0.04787635803222656, -0.042476654052734375, -0.03707695007324219, -0.03167724609375, -0.026277542114257812, -0.020877838134765625, -0.015478134155273438, -0.01007843017578125, -0.0046787261962890625, 0.000720977783203125, 0.0061206817626953125, 0.0115203857421875, 0.016920089721679688, 0.022319793701171875, 0.027719497680664062, 0.03311920166015625, 0.03851890563964844, 0.043918609619140625, 0.04931831359863281, 0.054718017578125, 0.06011772155761719, 0.06551742553710938, 0.07091712951660156, 0.07631683349609375, 0.08171653747558594, 0.08711624145507812, 0.09251594543457031, 0.0979156494140625, 0.10331535339355469, 0.10871505737304688, 0.11411476135253906, 0.11951446533203125, 0.12491416931152344, 0.13031387329101562, 0.1357135772705078, 0.14111328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 10.0, 11.0, 28.0, 36.0, 44.0, 71.0, 75.0, 60.0, 86.0, 107.0, 88.0, 76.0, 86.0, 59.0, 38.0, 38.0, 29.0, 15.0, 16.0, 5.0, 6.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2484130859375, -0.24182701110839844, -0.23524093627929688, -0.2286548614501953, -0.22206878662109375, -0.2154827117919922, -0.20889663696289062, -0.20231056213378906, -0.1957244873046875, -0.18913841247558594, -0.18255233764648438, -0.1759662628173828, -0.16938018798828125, -0.1627941131591797, -0.15620803833007812, -0.14962196350097656, -0.143035888671875, -0.13644981384277344, -0.12986373901367188, -0.12327766418457031, -0.11669158935546875, -0.11010551452636719, -0.10351943969726562, -0.09693336486816406, -0.0903472900390625, -0.08376121520996094, -0.07717514038085938, -0.07058906555175781, -0.06400299072265625, -0.05741691589355469, -0.050830841064453125, -0.04424476623535156, -0.03765869140625, -0.031072616577148438, -0.024486541748046875, -0.017900466918945312, -0.01131439208984375, -0.0047283172607421875, 0.001857757568359375, 0.008443832397460938, 0.0150299072265625, 0.021615982055664062, 0.028202056884765625, 0.03478813171386719, 0.04137420654296875, 0.04796028137207031, 0.054546356201171875, 0.06113243103027344, 0.067718505859375, 0.07430458068847656, 0.08089065551757812, 0.08747673034667969, 0.09406280517578125, 0.10064888000488281, 0.10723495483398438, 0.11382102966308594, 0.1204071044921875, 0.12699317932128906, 0.13357925415039062, 0.1401653289794922, 0.14675140380859375, 0.1533374786376953, 0.15992355346679688, 0.16650962829589844, 0.173095703125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 6.0, 4.0, 4.0, 4.0, 7.0, 16.0, 21.0, 25.0, 32.0, 50.0, 87.0, 130.0, 155.0, 258.0, 413.0, 761.0, 1357.0, 2981.0, 7535.0, 26086.0, 145564.0, 711600.0, 116479.0, 22285.0, 6838.0, 2746.0, 1276.0, 693.0, 388.0, 236.0, 152.0, 114.0, 63.0, 57.0, 32.0, 34.0, 18.0, 13.0, 11.0, 3.0, 7.0, 3.0, 3.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06256103515625, -0.06057167053222656, -0.058582305908203125, -0.05659294128417969, -0.05460357666015625, -0.05261421203613281, -0.050624847412109375, -0.04863548278808594, -0.0466461181640625, -0.04465675354003906, -0.042667388916015625, -0.04067802429199219, -0.03868865966796875, -0.03669929504394531, -0.034709930419921875, -0.03272056579589844, -0.030731201171875, -0.028741836547851562, -0.026752471923828125, -0.024763107299804688, -0.02277374267578125, -0.020784378051757812, -0.018795013427734375, -0.016805648803710938, -0.0148162841796875, -0.012826919555664062, -0.010837554931640625, -0.008848190307617188, -0.00685882568359375, -0.0048694610595703125, -0.002880096435546875, -0.0008907318115234375, 0.0010986328125, 0.0030879974365234375, 0.005077362060546875, 0.0070667266845703125, 0.00905609130859375, 0.011045455932617188, 0.013034820556640625, 0.015024185180664062, 0.0170135498046875, 0.019002914428710938, 0.020992279052734375, 0.022981643676757812, 0.02497100830078125, 0.026960372924804688, 0.028949737548828125, 0.030939102172851562, 0.032928466796875, 0.03491783142089844, 0.036907196044921875, 0.03889656066894531, 0.04088592529296875, 0.04287528991699219, 0.044864654541015625, 0.04685401916503906, 0.0488433837890625, 0.05083274841308594, 0.052822113037109375, 0.05481147766113281, 0.05680084228515625, 0.05879020690917969, 0.060779571533203125, 0.06276893615722656, 0.06475830078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 2.0, 7.0, 6.0, 7.0, 10.0, 19.0, 18.0, 27.0, 37.0, 57.0, 90.0, 187.0, 187.0, 120.0, 67.0, 35.0, 30.0, 25.0, 13.0, 9.0, 9.0, 7.0, 6.0, 6.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019168853759765625, -0.00018637627363204956, -0.00018106400966644287, -0.00017575174570083618, -0.0001704394817352295, -0.0001651272177696228, -0.0001598149538040161, -0.00015450268983840942, -0.00014919042587280273, -0.00014387816190719604, -0.00013856589794158936, -0.00013325363397598267, -0.00012794137001037598, -0.0001226291060447693, -0.0001173168420791626, -0.00011200457811355591, -0.00010669231414794922, -0.00010138005018234253, -9.606778621673584e-05, -9.075552225112915e-05, -8.544325828552246e-05, -8.013099431991577e-05, -7.481873035430908e-05, -6.950646638870239e-05, -6.41942024230957e-05, -5.8881938457489014e-05, -5.3569674491882324e-05, -4.8257410526275635e-05, -4.2945146560668945e-05, -3.7632882595062256e-05, -3.2320618629455566e-05, -2.7008354663848877e-05, -2.1696090698242188e-05, -1.6383826732635498e-05, -1.1071562767028809e-05, -5.759298801422119e-06, -4.470348358154297e-07, 4.86522912979126e-06, 1.017749309539795e-05, 1.548975706100464e-05, 2.0802021026611328e-05, 2.6114284992218018e-05, 3.142654895782471e-05, 3.6738812923431396e-05, 4.2051076889038086e-05, 4.7363340854644775e-05, 5.2675604820251465e-05, 5.7987868785858154e-05, 6.330013275146484e-05, 6.861239671707153e-05, 7.392466068267822e-05, 7.923692464828491e-05, 8.45491886138916e-05, 8.986145257949829e-05, 9.517371654510498e-05, 0.00010048598051071167, 0.00010579824447631836, 0.00011111050844192505, 0.00011642277240753174, 0.00012173503637313843, 0.00012704730033874512, 0.0001323595643043518, 0.0001376718282699585, 0.00014298409223556519, 0.00014829635620117188]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 7.0, 12.0, 18.0, 20.0, 35.0, 49.0, 111.0, 227.0, 410.0, 817.0, 1613.0, 3230.0, 7797.0, 24794.0, 110279.0, 610607.0, 226518.0, 41314.0, 11950.0, 4503.0, 2068.0, 1001.0, 550.0, 262.0, 150.0, 82.0, 47.0, 31.0, 13.0, 9.0, 3.0, 8.0, 9.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0501708984375, -0.048587799072265625, -0.04700469970703125, -0.045421600341796875, -0.0438385009765625, -0.042255401611328125, -0.04067230224609375, -0.039089202880859375, -0.037506103515625, -0.035923004150390625, -0.03433990478515625, -0.032756805419921875, -0.0311737060546875, -0.029590606689453125, -0.02800750732421875, -0.026424407958984375, -0.02484130859375, -0.023258209228515625, -0.02167510986328125, -0.020092010498046875, -0.0185089111328125, -0.016925811767578125, -0.01534271240234375, -0.013759613037109375, -0.012176513671875, -0.010593414306640625, -0.00901031494140625, -0.007427215576171875, -0.0058441162109375, -0.004261016845703125, -0.00267791748046875, -0.001094818115234375, 0.00048828125, 0.002071380615234375, 0.00365447998046875, 0.005237579345703125, 0.0068206787109375, 0.008403778076171875, 0.00998687744140625, 0.011569976806640625, 0.013153076171875, 0.014736175537109375, 0.01631927490234375, 0.017902374267578125, 0.0194854736328125, 0.021068572998046875, 0.02265167236328125, 0.024234771728515625, 0.02581787109375, 0.027400970458984375, 0.02898406982421875, 0.030567169189453125, 0.0321502685546875, 0.033733367919921875, 0.03531646728515625, 0.036899566650390625, 0.038482666015625, 0.040065765380859375, 0.04164886474609375, 0.043231964111328125, 0.0448150634765625, 0.046398162841796875, 0.04798126220703125, 0.049564361572265625, 0.0511474609375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 24.0, 25.0, 40.0, 40.0, 56.0, 93.0, 87.0, 118.0, 118.0, 103.0, 74.0, 63.0, 38.0, 33.0, 23.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.04937744140625, -0.047616004943847656, -0.04585456848144531, -0.04409313201904297, -0.042331695556640625, -0.04057025909423828, -0.03880882263183594, -0.037047386169433594, -0.03528594970703125, -0.033524513244628906, -0.03176307678222656, -0.03000164031982422, -0.028240203857421875, -0.02647876739501953, -0.024717330932617188, -0.022955894470214844, -0.0211944580078125, -0.019433021545410156, -0.017671585083007812, -0.01591014862060547, -0.014148712158203125, -0.012387275695800781, -0.010625839233398438, -0.008864402770996094, -0.00710296630859375, -0.005341529846191406, -0.0035800933837890625, -0.0018186569213867188, -5.7220458984375e-05, 0.0017042160034179688, 0.0034656524658203125, 0.005227088928222656, 0.006988525390625, 0.008749961853027344, 0.010511398315429688, 0.012272834777832031, 0.014034271240234375, 0.01579570770263672, 0.017557144165039062, 0.019318580627441406, 0.02108001708984375, 0.022841453552246094, 0.024602890014648438, 0.02636432647705078, 0.028125762939453125, 0.02988719940185547, 0.03164863586425781, 0.033410072326660156, 0.0351715087890625, 0.036932945251464844, 0.03869438171386719, 0.04045581817626953, 0.042217254638671875, 0.04397869110107422, 0.04574012756347656, 0.047501564025878906, 0.04926300048828125, 0.051024436950683594, 0.05278587341308594, 0.05454730987548828, 0.056308746337890625, 0.05807018280029297, 0.05983161926269531, 0.061593055725097656, 0.0633544921875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 20.0, 85.0, 458.0, 376.0, 57.0, 11.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.944631814956665, -2.8104360103607178, -2.6762404441833496, -2.5420446395874023, -2.407849073410034, -2.273653268814087, -2.1394577026367188, -2.0052618980407715, -1.8710662126541138, -1.736870527267456, -1.6026748418807983, -1.4684791564941406, -1.3342833518981934, -1.2000877857208252, -1.065891981124878, -0.9316962957382202, -0.7975006103515625, -0.6633049249649048, -0.5291092395782471, -0.3949134945869446, -0.26071780920028687, -0.12652212381362915, 0.00767362117767334, 0.14186930656433105, 0.27606499195098877, 0.4102606773376465, 0.5444563627243042, 0.6786521077156067, 0.8128477931022644, 0.9470434784889221, 1.0812392234802246, 1.2154349088668823, 1.3496308326721191, 1.4838265180587769, 1.6180222034454346, 1.7522180080413818, 1.88641357421875, 2.0206093788146973, 2.1548051834106445, 2.2890007495880127, 2.423196315765381, 2.557392120361328, 2.6915876865386963, 2.8257834911346436, 2.9599790573120117, 3.094174861907959, 3.2283706665039062, 3.3625662326812744, 3.4967620372772217, 3.630957841873169, 3.765153408050537, 3.8993492126464844, 4.033545017242432, 4.167740345001221, 4.301936149597168, 4.436131954193115, 4.5703277587890625, 4.70452356338501, 4.838719367980957, 4.972914695739746, 5.107110500335693, 5.241306304931641, 5.375502109527588, 5.509697914123535, 5.643893241882324]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 1.0, 8.0, 5.0, 14.0, 14.0, 24.0, 18.0, 25.0, 26.0, 47.0, 54.0, 43.0, 68.0, 56.0, 63.0, 65.0, 63.0, 60.0, 49.0, 51.0, 30.0, 38.0, 41.0, 35.0, 31.0, 26.0, 12.0, 16.0, 13.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9334578514099121, -0.9087934494018555, -0.8841290473937988, -0.8594646453857422, -0.8348002433776855, -0.8101358413696289, -0.7854714393615723, -0.7608070373535156, -0.736142635345459, -0.7114782333374023, -0.6868138313293457, -0.6621494293212891, -0.6374850273132324, -0.6128206253051758, -0.5881562232971191, -0.5634918212890625, -0.5388274192810059, -0.5141630172729492, -0.4894986152648926, -0.46483421325683594, -0.4401698112487793, -0.41550540924072266, -0.390841007232666, -0.3661766052246094, -0.3415122628211975, -0.31684786081314087, -0.29218345880508423, -0.2675190567970276, -0.24285465478897095, -0.2181902527809143, -0.19352586567401886, -0.16886146366596222, -0.14419704675674438, -0.11953264474868774, -0.0948682427406311, -0.07020384818315506, -0.04553944617509842, -0.02087504416704178, 0.003789350390434265, 0.028453752398490906, 0.053118154406547546, 0.07778255641460419, 0.10244695842266083, 0.12711134552955627, 0.15177574753761292, 0.17644014954566956, 0.2011045515537262, 0.22576895356178284, 0.2504333555698395, 0.2750977575778961, 0.29976215958595276, 0.3244265615940094, 0.34909096360206604, 0.3737553656101227, 0.39841973781585693, 0.4230841398239136, 0.4477485418319702, 0.47241294384002686, 0.4970773458480835, 0.5217417478561401, 0.5464061498641968, 0.5710705518722534, 0.5957349538803101, 0.6203993558883667, 0.6450637578964233]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 10.0, 25.0, 37.0, 91.0, 240.0, 1241.0, 4187118.0, 4824.0, 430.0, 136.0, 54.0, 32.0, 13.0, 4.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31298828125, -0.3044624328613281, -0.29593658447265625, -0.2874107360839844, -0.2788848876953125, -0.2703590393066406, -0.26183319091796875, -0.2533073425292969, -0.244781494140625, -0.23625564575195312, -0.22772979736328125, -0.21920394897460938, -0.2106781005859375, -0.20215225219726562, -0.19362640380859375, -0.18510055541992188, -0.17657470703125, -0.16804885864257812, -0.15952301025390625, -0.15099716186523438, -0.1424713134765625, -0.13394546508789062, -0.12541961669921875, -0.11689376831054688, -0.108367919921875, -0.09984207153320312, -0.09131622314453125, -0.08279037475585938, -0.0742645263671875, -0.06573867797851562, -0.05721282958984375, -0.048686981201171875, -0.0401611328125, -0.031635284423828125, -0.02310943603515625, -0.014583587646484375, -0.0060577392578125, 0.002468109130859375, 0.01099395751953125, 0.019519805908203125, 0.028045654296875, 0.036571502685546875, 0.04509735107421875, 0.053623199462890625, 0.0621490478515625, 0.07067489624023438, 0.07920074462890625, 0.08772659301757812, 0.09625244140625, 0.10477828979492188, 0.11330413818359375, 0.12182998657226562, 0.1303558349609375, 0.13888168334960938, 0.14740753173828125, 0.15593338012695312, 0.164459228515625, 0.17298507690429688, 0.18151092529296875, 0.19003677368164062, 0.1985626220703125, 0.20708847045898438, 0.21561431884765625, 0.22414016723632812, 0.232666015625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 9.0, 26.0, 52.0, 96.0, 139.0, 181.0, 189.0, 148.0, 80.0, 40.0, 20.0, 4.0, 7.0, 1.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.13330078125, -0.13012409210205078, -0.12694740295410156, -0.12377071380615234, -0.12059402465820312, -0.1174173355102539, -0.11424064636230469, -0.11106395721435547, -0.10788726806640625, -0.10471057891845703, -0.10153388977050781, -0.0983572006225586, -0.09518051147460938, -0.09200382232666016, -0.08882713317871094, -0.08565044403076172, -0.0824737548828125, -0.07929706573486328, -0.07612037658691406, -0.07294368743896484, -0.06976699829101562, -0.0665903091430664, -0.06341361999511719, -0.06023693084716797, -0.05706024169921875, -0.05388355255126953, -0.05070686340332031, -0.047530174255371094, -0.044353485107421875, -0.041176795959472656, -0.03800010681152344, -0.03482341766357422, -0.031646728515625, -0.02847003936767578, -0.025293350219726562, -0.022116661071777344, -0.018939971923828125, -0.015763282775878906, -0.012586593627929688, -0.009409904479980469, -0.00623321533203125, -0.0030565261840820312, 0.0001201629638671875, 0.0032968521118164062, 0.006473541259765625, 0.009650230407714844, 0.012826919555664062, 0.01600360870361328, 0.0191802978515625, 0.02235698699951172, 0.025533676147460938, 0.028710365295410156, 0.031887054443359375, 0.035063743591308594, 0.03824043273925781, 0.04141712188720703, 0.04459381103515625, 0.04777050018310547, 0.05094718933105469, 0.054123878479003906, 0.057300567626953125, 0.060477256774902344, 0.06365394592285156, 0.06683063507080078, 0.07000732421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 7.0, 10.0, 24.0, 41.0, 56.0, 75.0, 138.0, 146.0, 252.0, 398.0, 619.0, 1035.0, 2011.0, 5499.0, 4108306.0, 66890.0, 4358.0, 1806.0, 976.0, 564.0, 350.0, 224.0, 167.0, 106.0, 68.0, 58.0, 37.0, 20.0, 12.0, 10.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0875244140625, -0.08478260040283203, -0.08204078674316406, -0.0792989730834961, -0.07655715942382812, -0.07381534576416016, -0.07107353210449219, -0.06833171844482422, -0.06558990478515625, -0.06284809112548828, -0.06010627746582031, -0.057364463806152344, -0.054622650146484375, -0.051880836486816406, -0.04913902282714844, -0.04639720916748047, -0.0436553955078125, -0.04091358184814453, -0.03817176818847656, -0.035429954528808594, -0.032688140869140625, -0.029946327209472656, -0.027204513549804688, -0.02446269989013672, -0.02172088623046875, -0.01897907257080078, -0.016237258911132812, -0.013495445251464844, -0.010753631591796875, -0.008011817932128906, -0.0052700042724609375, -0.0025281906127929688, 0.000213623046875, 0.0029554367065429688, 0.0056972503662109375, 0.008439064025878906, 0.011180877685546875, 0.013922691345214844, 0.016664505004882812, 0.01940631866455078, 0.02214813232421875, 0.02488994598388672, 0.027631759643554688, 0.030373573303222656, 0.033115386962890625, 0.035857200622558594, 0.03859901428222656, 0.04134082794189453, 0.0440826416015625, 0.04682445526123047, 0.04956626892089844, 0.052308082580566406, 0.055049896240234375, 0.057791709899902344, 0.06053352355957031, 0.06327533721923828, 0.06601715087890625, 0.06875896453857422, 0.07150077819824219, 0.07424259185791016, 0.07698440551757812, 0.0797262191772461, 0.08246803283691406, 0.08520984649658203, 0.08795166015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 9.0, 3.0, 24.0, 3916.0, 75.0, 26.0, 8.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0124969482421875, -0.012076258659362793, -0.011655569076538086, -0.011234879493713379, -0.010814189910888672, -0.010393500328063965, -0.009972810745239258, -0.00955212116241455, -0.009131431579589844, -0.008710741996765137, -0.00829005241394043, -0.007869362831115723, -0.007448673248291016, -0.007027983665466309, -0.0066072940826416016, -0.0061866044998168945, -0.0057659149169921875, -0.0053452253341674805, -0.0049245357513427734, -0.004503846168518066, -0.004083156585693359, -0.0036624670028686523, -0.0032417774200439453, -0.0028210878372192383, -0.0024003982543945312, -0.0019797086715698242, -0.0015590190887451172, -0.0011383295059204102, -0.0007176399230957031, -0.0002969503402709961, 0.00012373924255371094, 0.000544428825378418, 0.000965118408203125, 0.001385807991027832, 0.001806497573852539, 0.002227187156677246, 0.002647876739501953, 0.00306856632232666, 0.003489255905151367, 0.003909945487976074, 0.004330635070800781, 0.004751324653625488, 0.005172014236450195, 0.005592703819274902, 0.006013393402099609, 0.006434082984924316, 0.0068547725677490234, 0.0072754621505737305, 0.0076961517333984375, 0.008116841316223145, 0.008537530899047852, 0.008958220481872559, 0.009378910064697266, 0.009799599647521973, 0.01022028923034668, 0.010640978813171387, 0.011061668395996094, 0.0114823579788208, 0.011903047561645508, 0.012323737144470215, 0.012744426727294922, 0.013165116310119629, 0.013585805892944336, 0.014006495475769043, 0.01442718505859375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 26.0, 58.0, 257.0, 443.0, 166.0, 40.0, 16.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02175716683268547, -0.018298236653208733, -0.014839304611086845, -0.011380374431610107, -0.007921443320810795, -0.004462512210011482, -0.0010035820305347443, 0.002455350011587143, 0.005914280191063881, 0.009373211301863194, 0.012832142412662506, 0.016291072592139244, 0.019750002771615982, 0.02320893481373787, 0.026667864993214607, 0.030126797035336494, 0.03358572721481323, 0.03704465925693512, 0.04050358757376671, 0.043962519615888596, 0.04742145165801048, 0.05088037997484207, 0.05433931201696396, 0.057798244059085846, 0.06125717610120773, 0.06471610814332962, 0.06817504018545151, 0.0716339647769928, 0.07509289681911469, 0.07855182886123657, 0.08201076090335846, 0.08546969294548035, 0.08892861753702164, 0.09238754957914352, 0.09584648162126541, 0.0993054062128067, 0.10276433825492859, 0.10622327029705048, 0.10968220233917236, 0.11314113438129425, 0.11660006642341614, 0.12005899846553802, 0.12351793050765991, 0.1269768625497818, 0.1304357945919037, 0.13389472663402557, 0.13735365867614746, 0.14081257581710815, 0.14427150785923004, 0.14773043990135193, 0.15118937194347382, 0.1546483039855957, 0.1581072360277176, 0.16156616806983948, 0.16502508521080017, 0.16848403215408325, 0.17194296419620514, 0.17540189623832703, 0.1788608282804489, 0.1823197603225708, 0.1857786923646927, 0.18923762440681458, 0.19269654154777527, 0.19615548849105835, 0.19961440563201904]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 9.0, 9.0, 12.0, 13.0, 22.0, 27.0, 29.0, 34.0, 38.0, 48.0, 43.0, 51.0, 51.0, 49.0, 64.0, 63.0, 49.0, 52.0, 54.0, 50.0, 38.0, 40.0, 38.0, 22.0, 27.0, 15.0, 17.0, 9.0, 7.0, 11.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02491670846939087, -0.02418903261423111, -0.0234613586217165, -0.02273368462920189, -0.02200600877404213, -0.02127833291888237, -0.02055065892636776, -0.01982298493385315, -0.01909530907869339, -0.01836763322353363, -0.01763995923101902, -0.01691228523850441, -0.01618460938334465, -0.015456934459507465, -0.01472925953567028, -0.014001584611833096, -0.01327390968799591, -0.012546234764158726, -0.01181855984032154, -0.011090884916484356, -0.010363209992647171, -0.009635535068809986, -0.008907860144972801, -0.008180185221135616, -0.007452510297298431, -0.0067248353734612465, -0.005997160449624062, -0.005269485525786877, -0.004541810601949692, -0.003814135678112507, -0.003086460754275322, -0.002358785830438137, -0.0016311109066009521, -0.0009034359827637672, -0.00017576105892658234, 0.0005519138649106026, 0.0012795887887477875, 0.0020072637125849724, 0.0027349386364221573, 0.003462613560259342, 0.004190288484096527, 0.004917963407933712, 0.005645638331770897, 0.006373313255608082, 0.007100988179445267, 0.007828663103282452, 0.008556338027119637, 0.009284012950956821, 0.010011687874794006, 0.010739362798631191, 0.011467037722468376, 0.012194712646305561, 0.012922387570142746, 0.013650062493979931, 0.014377737417817116, 0.0151054123416543, 0.015833087265491486, 0.016560763120651245, 0.017288437113165855, 0.018016111105680466, 0.018743786960840225, 0.019471462815999985, 0.020199136808514595, 0.020926810801029205, 0.021654486656188965]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 3.0, 10.0, 7.0, 13.0, 17.0, 28.0, 32.0, 50.0, 65.0, 113.0, 148.0, 206.0, 302.0, 588.0, 997.0, 1857.0, 4633.0, 22341.0, 304704.0, 654459.0, 45824.0, 6796.0, 2400.0, 1140.0, 627.0, 353.0, 259.0, 173.0, 102.0, 84.0, 61.0, 41.0, 28.0, 27.0, 25.0, 10.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.331787109375, -0.32234954833984375, -0.3129119873046875, -0.30347442626953125, -0.294036865234375, -0.28459930419921875, -0.2751617431640625, -0.26572418212890625, -0.25628662109375, -0.24684906005859375, -0.2374114990234375, -0.22797393798828125, -0.218536376953125, -0.20909881591796875, -0.1996612548828125, -0.19022369384765625, -0.1807861328125, -0.17134857177734375, -0.1619110107421875, -0.15247344970703125, -0.143035888671875, -0.13359832763671875, -0.1241607666015625, -0.11472320556640625, -0.10528564453125, -0.09584808349609375, -0.0864105224609375, -0.07697296142578125, -0.067535400390625, -0.05809783935546875, -0.0486602783203125, -0.03922271728515625, -0.02978515625, -0.02034759521484375, -0.0109100341796875, -0.00147247314453125, 0.007965087890625, 0.01740264892578125, 0.0268402099609375, 0.03627777099609375, 0.04571533203125, 0.05515289306640625, 0.0645904541015625, 0.07402801513671875, 0.083465576171875, 0.09290313720703125, 0.1023406982421875, 0.11177825927734375, 0.1212158203125, 0.13065338134765625, 0.1400909423828125, 0.14952850341796875, 0.158966064453125, 0.16840362548828125, 0.1778411865234375, 0.18727874755859375, 0.19671630859375, 0.20615386962890625, 0.2155914306640625, 0.22502899169921875, 0.234466552734375, 0.24390411376953125, 0.2533416748046875, 0.26277923583984375, 0.272216796875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 9.0, 26.0, 56.0, 94.0, 140.0, 180.0, 192.0, 147.0, 80.0, 37.0, 19.0, 5.0, 6.0, 1.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.1300039291381836, -0.1268291473388672, -0.12365436553955078, -0.12047958374023438, -0.11730480194091797, -0.11413002014160156, -0.11095523834228516, -0.10778045654296875, -0.10460567474365234, -0.10143089294433594, -0.09825611114501953, -0.09508132934570312, -0.09190654754638672, -0.08873176574707031, -0.0855569839477539, -0.0823822021484375, -0.0792074203491211, -0.07603263854980469, -0.07285785675048828, -0.06968307495117188, -0.06650829315185547, -0.06333351135253906, -0.060158729553222656, -0.05698394775390625, -0.053809165954589844, -0.05063438415527344, -0.04745960235595703, -0.044284820556640625, -0.04111003875732422, -0.03793525695800781, -0.034760475158691406, -0.031585693359375, -0.028410911560058594, -0.025236129760742188, -0.02206134796142578, -0.018886566162109375, -0.01571178436279297, -0.012537002563476562, -0.009362220764160156, -0.00618743896484375, -0.0030126571655273438, 0.0001621246337890625, 0.0033369064331054688, 0.006511688232421875, 0.009686470031738281, 0.012861251831054688, 0.016036033630371094, 0.0192108154296875, 0.022385597229003906, 0.025560379028320312, 0.02873516082763672, 0.031909942626953125, 0.03508472442626953, 0.03825950622558594, 0.041434288024902344, 0.04460906982421875, 0.047783851623535156, 0.05095863342285156, 0.05413341522216797, 0.057308197021484375, 0.06048297882080078, 0.06365776062011719, 0.0668325424194336, 0.07000732421875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 7.0, 13.0, 7.0, 14.0, 19.0, 26.0, 34.0, 93.0, 120.0, 187.0, 341.0, 593.0, 1137.0, 2315.0, 4844.0, 11264.0, 27497.0, 73601.0, 218574.0, 436271.0, 172102.0, 59274.0, 22530.0, 9294.0, 4116.0, 1981.0, 1001.0, 553.0, 274.0, 161.0, 89.0, 59.0, 49.0, 32.0, 22.0, 15.0, 14.0, 4.0, 6.0, 3.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07763671875, -0.0752401351928711, -0.07284355163574219, -0.07044696807861328, -0.06805038452148438, -0.06565380096435547, -0.06325721740722656, -0.060860633850097656, -0.05846405029296875, -0.056067466735839844, -0.05367088317871094, -0.05127429962158203, -0.048877716064453125, -0.04648113250732422, -0.04408454895019531, -0.041687965393066406, -0.0392913818359375, -0.036894798278808594, -0.03449821472167969, -0.03210163116455078, -0.029705047607421875, -0.02730846405029297, -0.024911880493164062, -0.022515296936035156, -0.02011871337890625, -0.017722129821777344, -0.015325546264648438, -0.012928962707519531, -0.010532379150390625, -0.008135795593261719, -0.0057392120361328125, -0.0033426284790039062, -0.000946044921875, 0.0014505386352539062, 0.0038471221923828125, 0.006243705749511719, 0.008640289306640625, 0.011036872863769531, 0.013433456420898438, 0.015830039978027344, 0.01822662353515625, 0.020623207092285156, 0.023019790649414062, 0.02541637420654297, 0.027812957763671875, 0.03020954132080078, 0.03260612487792969, 0.035002708435058594, 0.0373992919921875, 0.039795875549316406, 0.04219245910644531, 0.04458904266357422, 0.046985626220703125, 0.04938220977783203, 0.05177879333496094, 0.054175376892089844, 0.05657196044921875, 0.058968544006347656, 0.06136512756347656, 0.06376171112060547, 0.06615829467773438, 0.06855487823486328, 0.07095146179199219, 0.0733480453491211, 0.07574462890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 6.0, 12.0, 14.0, 17.0, 15.0, 22.0, 23.0, 30.0, 35.0, 41.0, 44.0, 60.0, 56.0, 40.0, 58.0, 66.0, 71.0, 45.0, 40.0, 54.0, 47.0, 33.0, 25.0, 21.0, 28.0, 20.0, 19.0, 18.0, 10.0, 13.0, 11.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09649658203125, -0.09310054779052734, -0.08970451354980469, -0.08630847930908203, -0.08291244506835938, -0.07951641082763672, -0.07612037658691406, -0.0727243423461914, -0.06932830810546875, -0.0659322738647461, -0.06253623962402344, -0.05914020538330078, -0.055744171142578125, -0.05234813690185547, -0.04895210266113281, -0.045556068420410156, -0.0421600341796875, -0.038763999938964844, -0.03536796569824219, -0.03197193145751953, -0.028575897216796875, -0.02517986297607422, -0.021783828735351562, -0.018387794494628906, -0.01499176025390625, -0.011595726013183594, -0.008199691772460938, -0.004803657531738281, -0.001407623291015625, 0.0019884109497070312, 0.0053844451904296875, 0.008780479431152344, 0.012176513671875, 0.015572547912597656, 0.018968582153320312, 0.02236461639404297, 0.025760650634765625, 0.02915668487548828, 0.03255271911621094, 0.035948753356933594, 0.03934478759765625, 0.042740821838378906, 0.04613685607910156, 0.04953289031982422, 0.052928924560546875, 0.05632495880126953, 0.05972099304199219, 0.06311702728271484, 0.0665130615234375, 0.06990909576416016, 0.07330513000488281, 0.07670116424560547, 0.08009719848632812, 0.08349323272705078, 0.08688926696777344, 0.0902853012084961, 0.09368133544921875, 0.0970773696899414, 0.10047340393066406, 0.10386943817138672, 0.10726547241210938, 0.11066150665283203, 0.11405754089355469, 0.11745357513427734, 0.120849609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 13.0, 12.0, 20.0, 29.0, 26.0, 44.0, 82.0, 133.0, 219.0, 331.0, 572.0, 1064.0, 2048.0, 4177.0, 10098.0, 27914.0, 107877.0, 633574.0, 194202.0, 41376.0, 13647.0, 5463.0, 2593.0, 1233.0, 694.0, 408.0, 253.0, 144.0, 101.0, 58.0, 31.0, 35.0, 20.0, 19.0, 8.0, 5.0, 8.0, 9.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033935546875, -0.03282880783081055, -0.031722068786621094, -0.03061532974243164, -0.029508590698242188, -0.028401851654052734, -0.02729511260986328, -0.026188373565673828, -0.025081634521484375, -0.023974895477294922, -0.02286815643310547, -0.021761417388916016, -0.020654678344726562, -0.01954793930053711, -0.018441200256347656, -0.017334461212158203, -0.01622772216796875, -0.015120983123779297, -0.014014244079589844, -0.01290750503540039, -0.011800765991210938, -0.010694026947021484, -0.009587287902832031, -0.008480548858642578, -0.007373809814453125, -0.006267070770263672, -0.005160331726074219, -0.004053592681884766, -0.0029468536376953125, -0.0018401145935058594, -0.0007333755493164062, 0.0003733634948730469, 0.0014801025390625, 0.002586841583251953, 0.0036935806274414062, 0.004800319671630859, 0.0059070587158203125, 0.007013797760009766, 0.008120536804199219, 0.009227275848388672, 0.010334014892578125, 0.011440753936767578, 0.012547492980957031, 0.013654232025146484, 0.014760971069335938, 0.01586771011352539, 0.016974449157714844, 0.018081188201904297, 0.01918792724609375, 0.020294666290283203, 0.021401405334472656, 0.02250814437866211, 0.023614883422851562, 0.024721622467041016, 0.02582836151123047, 0.026935100555419922, 0.028041839599609375, 0.029148578643798828, 0.03025531768798828, 0.031362056732177734, 0.03246879577636719, 0.03357553482055664, 0.034682273864746094, 0.03578901290893555, 0.036895751953125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 7.0, 13.0, 7.0, 11.0, 18.0, 23.0, 19.0, 23.0, 27.0, 33.0, 48.0, 57.0, 71.0, 107.0, 95.0, 78.0, 65.0, 55.0, 37.0, 35.0, 27.0, 25.0, 21.0, 18.0, 12.0, 10.0, 10.0, 8.0, 2.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.900331497192383e-05, -9.592156857252121e-05, -9.283982217311859e-05, -8.975807577371597e-05, -8.667632937431335e-05, -8.359458297491074e-05, -8.051283657550812e-05, -7.74310901761055e-05, -7.434934377670288e-05, -7.126759737730026e-05, -6.818585097789764e-05, -6.510410457849503e-05, -6.202235817909241e-05, -5.894061177968979e-05, -5.585886538028717e-05, -5.277711898088455e-05, -4.9695372581481934e-05, -4.6613626182079315e-05, -4.35318797826767e-05, -4.045013338327408e-05, -3.736838698387146e-05, -3.428664058446884e-05, -3.120489418506622e-05, -2.8123147785663605e-05, -2.5041401386260986e-05, -2.1959654986858368e-05, -1.887790858745575e-05, -1.579616218805313e-05, -1.2714415788650513e-05, -9.632669389247894e-06, -6.550922989845276e-06, -3.4691765904426575e-06, -3.8743019104003906e-07, 2.6943162083625793e-06, 5.776062607765198e-06, 8.857809007167816e-06, 1.1939555406570435e-05, 1.5021301805973053e-05, 1.810304820537567e-05, 2.118479460477829e-05, 2.4266541004180908e-05, 2.7348287403583527e-05, 3.0430033802986145e-05, 3.3511780202388763e-05, 3.659352660179138e-05, 3.9675273001194e-05, 4.275701940059662e-05, 4.583876579999924e-05, 4.8920512199401855e-05, 5.2002258598804474e-05, 5.508400499820709e-05, 5.816575139760971e-05, 6.124749779701233e-05, 6.432924419641495e-05, 6.741099059581757e-05, 7.049273699522018e-05, 7.35744833946228e-05, 7.665622979402542e-05, 7.973797619342804e-05, 8.281972259283066e-05, 8.590146899223328e-05, 8.89832153916359e-05, 9.206496179103851e-05, 9.514670819044113e-05, 9.822845458984375e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 0.0, 9.0, 10.0, 9.0, 15.0, 22.0, 24.0, 27.0, 55.0, 116.0, 150.0, 268.0, 472.0, 894.0, 1882.0, 4940.0, 15821.0, 76246.0, 677390.0, 224045.0, 31972.0, 8398.0, 2942.0, 1304.0, 638.0, 344.0, 186.0, 135.0, 76.0, 50.0, 29.0, 33.0, 10.0, 13.0, 9.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.04339599609375, -0.041886329650878906, -0.04037666320800781, -0.03886699676513672, -0.037357330322265625, -0.03584766387939453, -0.03433799743652344, -0.032828330993652344, -0.03131866455078125, -0.029808998107910156, -0.028299331665039062, -0.02678966522216797, -0.025279998779296875, -0.02377033233642578, -0.022260665893554688, -0.020750999450683594, -0.0192413330078125, -0.017731666564941406, -0.016222000122070312, -0.014712333679199219, -0.013202667236328125, -0.011693000793457031, -0.010183334350585938, -0.008673667907714844, -0.00716400146484375, -0.005654335021972656, -0.0041446685791015625, -0.0026350021362304688, -0.001125335693359375, 0.00038433074951171875, 0.0018939971923828125, 0.0034036636352539062, 0.004913330078125, 0.006422996520996094, 0.007932662963867188, 0.009442329406738281, 0.010951995849609375, 0.012461662292480469, 0.013971328735351562, 0.015480995178222656, 0.01699066162109375, 0.018500328063964844, 0.020009994506835938, 0.02151966094970703, 0.023029327392578125, 0.02453899383544922, 0.026048660278320312, 0.027558326721191406, 0.0290679931640625, 0.030577659606933594, 0.03208732604980469, 0.03359699249267578, 0.035106658935546875, 0.03661632537841797, 0.03812599182128906, 0.039635658264160156, 0.04114532470703125, 0.042654991149902344, 0.04416465759277344, 0.04567432403564453, 0.047183990478515625, 0.04869365692138672, 0.05020332336425781, 0.051712989807128906, 0.05322265625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 16.0, 14.0, 24.0, 22.0, 49.0, 61.0, 116.0, 145.0, 165.0, 113.0, 97.0, 57.0, 34.0, 26.0, 20.0, 20.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0657958984375, -0.0636281967163086, -0.06146049499511719, -0.05929279327392578, -0.057125091552734375, -0.05495738983154297, -0.05278968811035156, -0.050621986389160156, -0.04845428466796875, -0.046286582946777344, -0.04411888122558594, -0.04195117950439453, -0.039783477783203125, -0.03761577606201172, -0.03544807434082031, -0.033280372619628906, -0.0311126708984375, -0.028944969177246094, -0.026777267456054688, -0.02460956573486328, -0.022441864013671875, -0.02027416229248047, -0.018106460571289062, -0.015938758850097656, -0.01377105712890625, -0.011603355407714844, -0.009435653686523438, -0.007267951965332031, -0.005100250244140625, -0.0029325485229492188, -0.0007648468017578125, 0.0014028549194335938, 0.003570556640625, 0.005738258361816406, 0.007905960083007812, 0.010073661804199219, 0.012241363525390625, 0.014409065246582031, 0.016576766967773438, 0.018744468688964844, 0.02091217041015625, 0.023079872131347656, 0.025247573852539062, 0.02741527557373047, 0.029582977294921875, 0.03175067901611328, 0.03391838073730469, 0.036086082458496094, 0.0382537841796875, 0.040421485900878906, 0.04258918762207031, 0.04475688934326172, 0.046924591064453125, 0.04909229278564453, 0.05125999450683594, 0.053427696228027344, 0.05559539794921875, 0.057763099670410156, 0.05993080139160156, 0.06209850311279297, 0.06426620483398438, 0.06643390655517578, 0.06860160827636719, 0.0707693099975586, 0.07293701171875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 22.0, 88.0, 256.0, 395.0, 180.0, 48.0, 19.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.401869535446167, -2.335577964782715, -2.2692861557006836, -2.2029945850372314, -2.1367027759552, -2.070411205291748, -2.004119396209717, -1.9378278255462646, -1.871536135673523, -1.8052444458007812, -1.7389527559280396, -1.6726610660552979, -1.6063694953918457, -1.5400776863098145, -1.4737861156463623, -1.4074944257736206, -1.341202735900879, -1.2749110460281372, -1.2086193561553955, -1.1423276662826538, -1.076035976409912, -1.00974440574646, -0.9434527158737183, -0.8771610260009766, -0.8108693361282349, -0.7445776462554932, -0.6782859563827515, -0.6119943261146545, -0.5457026362419128, -0.47941094636917114, -0.41311928629875183, -0.3468276262283325, -0.2805356979370117, -0.2142440229654312, -0.1479523479938507, -0.0816606730222702, -0.015368998050689697, 0.050922691822052, 0.11721435189247131, 0.18350601196289062, 0.24979770183563232, 0.316089391708374, 0.38238105177879333, 0.44867271184921265, 0.5149644017219543, 0.581256091594696, 0.647547721862793, 0.7138394117355347, 0.7801311016082764, 0.8464227914810181, 0.9127144813537598, 0.9790061116218567, 1.0452978610992432, 1.1115894317626953, 1.177881121635437, 1.2441728115081787, 1.3104645013809204, 1.376756191253662, 1.4430478811264038, 1.5093395709991455, 1.5756311416625977, 1.641922950744629, 1.708214521408081, 1.7745062112808228, 1.8407979011535645]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 10.0, 4.0, 2.0, 9.0, 14.0, 13.0, 12.0, 8.0, 19.0, 17.0, 24.0, 23.0, 32.0, 30.0, 28.0, 46.0, 39.0, 40.0, 49.0, 49.0, 49.0, 41.0, 45.0, 35.0, 31.0, 42.0, 37.0, 36.0, 30.0, 21.0, 17.0, 22.0, 17.0, 27.0, 12.0, 12.0, 8.0, 13.0, 7.0, 5.0, 1.0, 5.0, 3.0, 6.0, 2.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.4238309860229492, -0.41121748089790344, -0.39860397577285767, -0.3859904408454895, -0.3733769357204437, -0.36076343059539795, -0.3481499254703522, -0.3355364203453064, -0.32292288541793823, -0.31030938029289246, -0.2976958751678467, -0.2850823402404785, -0.27246883511543274, -0.25985532999038696, -0.2472418248653412, -0.2346283197402954, -0.22201481461524963, -0.20940130949020386, -0.1967877894639969, -0.1841742843389511, -0.17156076431274414, -0.15894725918769836, -0.1463337540626526, -0.1337202489376068, -0.12110672891139984, -0.10849321633577347, -0.0958797037601471, -0.08326619863510132, -0.07065268605947495, -0.05803917348384857, -0.045425668358802795, -0.03281215578317642, -0.02019864320755005, -0.007585132494568825, 0.005028378218412399, 0.017641887068748474, 0.030255399644374847, 0.04286891222000122, 0.055482417345047, 0.06809592992067337, 0.08070944249629974, 0.09332295507192612, 0.10593646764755249, 0.11854997277259827, 0.13116347789764404, 0.143776997923851, 0.1563905030488968, 0.16900402307510376, 0.18161752820014954, 0.1942310333251953, 0.20684455335140228, 0.21945805847644806, 0.23207157850265503, 0.2446850836277008, 0.2572985887527466, 0.26991209387779236, 0.28252559900283813, 0.2951391041278839, 0.3077526092529297, 0.32036614418029785, 0.33297964930534363, 0.3455931544303894, 0.3582066595554352, 0.37082016468048096, 0.3834336996078491]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 6.0, 4.0, 10.0, 11.0, 10.0, 23.0, 39.0, 99.0, 329.0, 1275.0, 15065.0, 4174600.0, 2034.0, 428.0, 159.0, 68.0, 39.0, 20.0, 22.0, 10.0, 6.0, 7.0, 7.0, 0.0, 1.0, 2.0, 2.0, 3.0], "bins": [-0.33203125, -0.32498645782470703, -0.31794166564941406, -0.3108968734741211, -0.3038520812988281, -0.29680728912353516, -0.2897624969482422, -0.2827177047729492, -0.27567291259765625, -0.2686281204223633, -0.2615833282470703, -0.25453853607177734, -0.24749374389648438, -0.2404489517211914, -0.23340415954589844, -0.22635936737060547, -0.2193145751953125, -0.21226978302001953, -0.20522499084472656, -0.1981801986694336, -0.19113540649414062, -0.18409061431884766, -0.1770458221435547, -0.17000102996826172, -0.16295623779296875, -0.15591144561767578, -0.1488666534423828, -0.14182186126708984, -0.13477706909179688, -0.1277322769165039, -0.12068748474121094, -0.11364269256591797, -0.106597900390625, -0.09955310821533203, -0.09250831604003906, -0.0854635238647461, -0.07841873168945312, -0.07137393951416016, -0.06432914733886719, -0.05728435516357422, -0.05023956298828125, -0.04319477081298828, -0.03614997863769531, -0.029105186462402344, -0.022060394287109375, -0.015015602111816406, -0.007970809936523438, -0.0009260177612304688, 0.0061187744140625, 0.013163566589355469, 0.020208358764648438, 0.027253150939941406, 0.034297943115234375, 0.041342735290527344, 0.04838752746582031, 0.05543231964111328, 0.06247711181640625, 0.06952190399169922, 0.07656669616699219, 0.08361148834228516, 0.09065628051757812, 0.0977010726928711, 0.10474586486816406, 0.11179065704345703, 0.11883544921875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 27.0, 57.0, 82.0, 139.0, 190.0, 194.0, 147.0, 81.0, 39.0, 17.0, 4.0, 7.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.1300048828125, -0.1268310546875, -0.1236572265625, -0.1204833984375, -0.1173095703125, -0.1141357421875, -0.1109619140625, -0.1077880859375, -0.1046142578125, -0.1014404296875, -0.0982666015625, -0.0950927734375, -0.0919189453125, -0.0887451171875, -0.0855712890625, -0.0823974609375, -0.0792236328125, -0.0760498046875, -0.0728759765625, -0.0697021484375, -0.0665283203125, -0.0633544921875, -0.0601806640625, -0.0570068359375, -0.0538330078125, -0.0506591796875, -0.0474853515625, -0.0443115234375, -0.0411376953125, -0.0379638671875, -0.0347900390625, -0.0316162109375, -0.0284423828125, -0.0252685546875, -0.0220947265625, -0.0189208984375, -0.0157470703125, -0.0125732421875, -0.0093994140625, -0.0062255859375, -0.0030517578125, 0.0001220703125, 0.0032958984375, 0.0064697265625, 0.0096435546875, 0.0128173828125, 0.0159912109375, 0.0191650390625, 0.0223388671875, 0.0255126953125, 0.0286865234375, 0.0318603515625, 0.0350341796875, 0.0382080078125, 0.0413818359375, 0.0445556640625, 0.0477294921875, 0.0509033203125, 0.0540771484375, 0.0572509765625, 0.0604248046875, 0.0635986328125, 0.0667724609375, 0.0699462890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 6.0, 19.0, 30.0, 35.0, 53.0, 91.0, 161.0, 289.0, 550.0, 1239.0, 3549.0, 23424.0, 4152883.0, 8103.0, 2055.0, 861.0, 423.0, 208.0, 118.0, 67.0, 37.0, 31.0, 15.0, 9.0, 8.0, 6.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0689697265625, -0.06612873077392578, -0.06328773498535156, -0.060446739196777344, -0.057605743408203125, -0.054764747619628906, -0.05192375183105469, -0.04908275604248047, -0.04624176025390625, -0.04340076446533203, -0.04055976867675781, -0.037718772888183594, -0.034877777099609375, -0.032036781311035156, -0.029195785522460938, -0.02635478973388672, -0.0235137939453125, -0.02067279815673828, -0.017831802368164062, -0.014990806579589844, -0.012149810791015625, -0.009308815002441406, -0.0064678192138671875, -0.0036268234252929688, -0.00078582763671875, 0.0020551681518554688, 0.0048961639404296875, 0.007737159729003906, 0.010578155517578125, 0.013419151306152344, 0.016260147094726562, 0.01910114288330078, 0.021942138671875, 0.02478313446044922, 0.027624130249023438, 0.030465126037597656, 0.033306121826171875, 0.036147117614746094, 0.03898811340332031, 0.04182910919189453, 0.04467010498046875, 0.04751110076904297, 0.05035209655761719, 0.053193092346191406, 0.056034088134765625, 0.058875083923339844, 0.06171607971191406, 0.06455707550048828, 0.0673980712890625, 0.07023906707763672, 0.07308006286621094, 0.07592105865478516, 0.07876205444335938, 0.0816030502319336, 0.08444404602050781, 0.08728504180908203, 0.09012603759765625, 0.09296703338623047, 0.09580802917480469, 0.0986490249633789, 0.10149002075195312, 0.10433101654052734, 0.10717201232910156, 0.11001300811767578, 0.11285400390625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 7.0, 26.0, 3884.0, 94.0, 23.0, 8.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01016998291015625, -0.009775638580322266, -0.009381294250488281, -0.008986949920654297, -0.008592605590820312, -0.008198261260986328, -0.007803916931152344, -0.007409572601318359, -0.007015228271484375, -0.006620883941650391, -0.006226539611816406, -0.005832195281982422, -0.0054378509521484375, -0.005043506622314453, -0.004649162292480469, -0.004254817962646484, -0.0038604736328125, -0.0034661293029785156, -0.0030717849731445312, -0.002677440643310547, -0.0022830963134765625, -0.0018887519836425781, -0.0014944076538085938, -0.0011000633239746094, -0.000705718994140625, -0.0003113746643066406, 8.296966552734375e-05, 0.0004773139953613281, 0.0008716583251953125, 0.0012660026550292969, 0.0016603469848632812, 0.0020546913146972656, 0.00244903564453125, 0.0028433799743652344, 0.0032377243041992188, 0.003632068634033203, 0.0040264129638671875, 0.004420757293701172, 0.004815101623535156, 0.005209445953369141, 0.005603790283203125, 0.005998134613037109, 0.006392478942871094, 0.006786823272705078, 0.0071811676025390625, 0.007575511932373047, 0.007969856262207031, 0.008364200592041016, 0.008758544921875, 0.009152889251708984, 0.009547233581542969, 0.009941577911376953, 0.010335922241210938, 0.010730266571044922, 0.011124610900878906, 0.01151895523071289, 0.011913299560546875, 0.01230764389038086, 0.012701988220214844, 0.013096332550048828, 0.013490676879882812, 0.013885021209716797, 0.014279365539550781, 0.014673709869384766, 0.01506805419921875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 10.0, 14.0, 63.0, 194.0, 339.0, 228.0, 100.0, 41.0, 15.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03993437439203262, -0.03752191364765167, -0.03510945290327072, -0.03269699215888977, -0.03028452955186367, -0.02787206880748272, -0.02545960620045662, -0.02304714545607567, -0.020634684711694717, -0.018222223967313766, -0.015809763222932816, -0.013397300615906715, -0.010984839871525764, -0.008572379127144814, -0.006159917451441288, -0.0037474557757377625, -0.0013349950313568115, 0.0010774661786854267, 0.003489927388727665, 0.005902388598769903, 0.008314849808812141, 0.010727310553193092, 0.013139772228896618, 0.015552233904600143, 0.017964694648981094, 0.020377155393362045, 0.022789616137742996, 0.025202078744769096, 0.027614539489150047, 0.030027000233530998, 0.0324394628405571, 0.03485192358493805, 0.0372643768787384, 0.039676837623119354, 0.042089298367500305, 0.044501759111881256, 0.04691421985626221, 0.04932668060064316, 0.05173914507031441, 0.05415160581469536, 0.05656406655907631, 0.05897652730345726, 0.06138898804783821, 0.06380145251750946, 0.06621391326189041, 0.06862637400627136, 0.07103883475065231, 0.07345129549503326, 0.07586375623941422, 0.07827621698379517, 0.08068867772817612, 0.08310113847255707, 0.08551359921693802, 0.08792605996131897, 0.09033852070569992, 0.09275098145008087, 0.09516344964504242, 0.09757591038942337, 0.09998837113380432, 0.10240083187818527, 0.10481329262256622, 0.10722575336694717, 0.10963821411132812, 0.11205068230628967, 0.11446313560009003]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 11.0, 10.0, 2.0, 10.0, 13.0, 15.0, 14.0, 30.0, 29.0, 22.0, 32.0, 32.0, 33.0, 40.0, 45.0, 47.0, 46.0, 50.0, 52.0, 42.0, 37.0, 51.0, 53.0, 46.0, 30.0, 37.0, 24.0, 29.0, 30.0, 17.0, 11.0, 6.0, 13.0, 12.0, 8.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016213417053222656, -0.015672829002141953, -0.015132240951061249, -0.014591652899980545, -0.014051064848899841, -0.013510476797819138, -0.012969888746738434, -0.01242930069565773, -0.011888712644577026, -0.011348124593496323, -0.010807536542415619, -0.010266948491334915, -0.009726360440254211, -0.009185772389173508, -0.008645184338092804, -0.0081045962870121, -0.0075640082359313965, -0.007023420184850693, -0.006482832133769989, -0.005942244082689285, -0.0054016560316085815, -0.004861067980527878, -0.004320479929447174, -0.0037798918783664703, -0.0032393038272857666, -0.002698715776205063, -0.002158127725124359, -0.0016175396740436554, -0.0010769516229629517, -0.0005363635718822479, 4.2244791984558105e-06, 0.0005448125302791595, 0.0010854005813598633, 0.001625988632440567, 0.0021665766835212708, 0.0027071647346019745, 0.0032477527856826782, 0.003788340836763382, 0.004328928887844086, 0.004869516938924789, 0.005410104990005493, 0.005950693041086197, 0.006491281092166901, 0.007031869143247604, 0.007572457194328308, 0.008113045245409012, 0.008653633296489716, 0.00919422134757042, 0.009734809398651123, 0.010275397449731827, 0.01081598550081253, 0.011356573551893234, 0.011897161602973938, 0.012437749654054642, 0.012978337705135345, 0.01351892575621605, 0.014059513807296753, 0.014600101858377457, 0.01514068990945816, 0.015681277960538864, 0.016221866011619568, 0.01676245406270027, 0.017303042113780975, 0.01784363016486168, 0.018384218215942383]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 5.0, 8.0, 8.0, 17.0, 22.0, 35.0, 34.0, 47.0, 77.0, 89.0, 151.0, 208.0, 356.0, 464.0, 819.0, 1384.0, 2993.0, 9317.0, 65309.0, 690845.0, 243884.0, 22798.0, 4915.0, 1841.0, 1016.0, 612.0, 369.0, 297.0, 170.0, 106.0, 94.0, 62.0, 42.0, 44.0, 21.0, 23.0, 13.0, 13.0, 12.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2578125, -0.2499408721923828, -0.24206924438476562, -0.23419761657714844, -0.22632598876953125, -0.21845436096191406, -0.21058273315429688, -0.2027111053466797, -0.1948394775390625, -0.1869678497314453, -0.17909622192382812, -0.17122459411621094, -0.16335296630859375, -0.15548133850097656, -0.14760971069335938, -0.1397380828857422, -0.131866455078125, -0.12399482727050781, -0.11612319946289062, -0.10825157165527344, -0.10037994384765625, -0.09250831604003906, -0.08463668823242188, -0.07676506042480469, -0.0688934326171875, -0.06102180480957031, -0.053150177001953125, -0.04527854919433594, -0.03740692138671875, -0.029535293579101562, -0.021663665771484375, -0.013792037963867188, -0.00592041015625, 0.0019512176513671875, 0.009822845458984375, 0.017694473266601562, 0.02556610107421875, 0.03343772888183594, 0.041309356689453125, 0.04918098449707031, 0.0570526123046875, 0.06492424011230469, 0.07279586791992188, 0.08066749572753906, 0.08853912353515625, 0.09641075134277344, 0.10428237915039062, 0.11215400695800781, 0.120025634765625, 0.1278972625732422, 0.13576889038085938, 0.14364051818847656, 0.15151214599609375, 0.15938377380371094, 0.16725540161132812, 0.1751270294189453, 0.1829986572265625, 0.1908702850341797, 0.19874191284179688, 0.20661354064941406, 0.21448516845703125, 0.22235679626464844, 0.23022842407226562, 0.2381000518798828, 0.2459716796875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 27.0, 53.0, 81.0, 147.0, 187.0, 193.0, 146.0, 82.0, 41.0, 18.0, 3.0, 7.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.13330078125, -0.1301250457763672, -0.12694931030273438, -0.12377357482910156, -0.12059783935546875, -0.11742210388183594, -0.11424636840820312, -0.11107063293457031, -0.1078948974609375, -0.10471916198730469, -0.10154342651367188, -0.09836769104003906, -0.09519195556640625, -0.09201622009277344, -0.08884048461914062, -0.08566474914550781, -0.082489013671875, -0.07931327819824219, -0.07613754272460938, -0.07296180725097656, -0.06978607177734375, -0.06661033630371094, -0.06343460083007812, -0.06025886535644531, -0.0570831298828125, -0.05390739440917969, -0.050731658935546875, -0.04755592346191406, -0.04438018798828125, -0.04120445251464844, -0.038028717041015625, -0.03485298156738281, -0.03167724609375, -0.028501510620117188, -0.025325775146484375, -0.022150039672851562, -0.01897430419921875, -0.015798568725585938, -0.012622833251953125, -0.009447097778320312, -0.0062713623046875, -0.0030956268310546875, 8.0108642578125e-05, 0.0032558441162109375, 0.00643157958984375, 0.009607315063476562, 0.012783050537109375, 0.015958786010742188, 0.019134521484375, 0.022310256958007812, 0.025485992431640625, 0.028661727905273438, 0.03183746337890625, 0.03501319885253906, 0.038188934326171875, 0.04136466979980469, 0.0445404052734375, 0.04771614074707031, 0.050891876220703125, 0.05406761169433594, 0.05724334716796875, 0.06041908264160156, 0.06359481811523438, 0.06677055358886719, 0.0699462890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 4.0, 8.0, 11.0, 11.0, 20.0, 24.0, 35.0, 76.0, 97.0, 163.0, 235.0, 545.0, 1001.0, 1994.0, 4376.0, 10111.0, 25770.0, 76556.0, 263829.0, 451640.0, 139634.0, 43916.0, 15865.0, 6614.0, 2870.0, 1407.0, 754.0, 386.0, 236.0, 118.0, 81.0, 45.0, 36.0, 25.0, 17.0, 9.0, 6.0, 7.0, 10.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0762939453125, -0.0738525390625, -0.0714111328125, -0.0689697265625, -0.0665283203125, -0.0640869140625, -0.0616455078125, -0.0592041015625, -0.0567626953125, -0.0543212890625, -0.0518798828125, -0.0494384765625, -0.0469970703125, -0.0445556640625, -0.0421142578125, -0.0396728515625, -0.0372314453125, -0.0347900390625, -0.0323486328125, -0.0299072265625, -0.0274658203125, -0.0250244140625, -0.0225830078125, -0.0201416015625, -0.0177001953125, -0.0152587890625, -0.0128173828125, -0.0103759765625, -0.0079345703125, -0.0054931640625, -0.0030517578125, -0.0006103515625, 0.0018310546875, 0.0042724609375, 0.0067138671875, 0.0091552734375, 0.0115966796875, 0.0140380859375, 0.0164794921875, 0.0189208984375, 0.0213623046875, 0.0238037109375, 0.0262451171875, 0.0286865234375, 0.0311279296875, 0.0335693359375, 0.0360107421875, 0.0384521484375, 0.0408935546875, 0.0433349609375, 0.0457763671875, 0.0482177734375, 0.0506591796875, 0.0531005859375, 0.0555419921875, 0.0579833984375, 0.0604248046875, 0.0628662109375, 0.0653076171875, 0.0677490234375, 0.0701904296875, 0.0726318359375, 0.0750732421875, 0.0775146484375, 0.0799560546875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 7.0, 12.0, 13.0, 17.0, 4.0, 23.0, 25.0, 30.0, 39.0, 33.0, 37.0, 53.0, 50.0, 63.0, 52.0, 55.0, 57.0, 51.0, 37.0, 42.0, 49.0, 40.0, 29.0, 37.0, 27.0, 21.0, 26.0, 17.0, 10.0, 12.0, 13.0, 8.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.081298828125, -0.07800865173339844, -0.07471847534179688, -0.07142829895019531, -0.06813812255859375, -0.06484794616699219, -0.061557769775390625, -0.05826759338378906, -0.0549774169921875, -0.05168724060058594, -0.048397064208984375, -0.04510688781738281, -0.04181671142578125, -0.03852653503417969, -0.035236358642578125, -0.03194618225097656, -0.028656005859375, -0.025365829467773438, -0.022075653076171875, -0.018785476684570312, -0.01549530029296875, -0.012205123901367188, -0.008914947509765625, -0.0056247711181640625, -0.0023345947265625, 0.0009555816650390625, 0.004245758056640625, 0.0075359344482421875, 0.01082611083984375, 0.014116287231445312, 0.017406463623046875, 0.020696640014648438, 0.02398681640625, 0.027276992797851562, 0.030567169189453125, 0.03385734558105469, 0.03714752197265625, 0.04043769836425781, 0.043727874755859375, 0.04701805114746094, 0.0503082275390625, 0.05359840393066406, 0.056888580322265625, 0.06017875671386719, 0.06346893310546875, 0.06675910949707031, 0.07004928588867188, 0.07333946228027344, 0.076629638671875, 0.07991981506347656, 0.08320999145507812, 0.08650016784667969, 0.08979034423828125, 0.09308052062988281, 0.09637069702148438, 0.09966087341308594, 0.1029510498046875, 0.10624122619628906, 0.10953140258789062, 0.11282157897949219, 0.11611175537109375, 0.11940193176269531, 0.12269210815429688, 0.12598228454589844, 0.1292724609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 4.0, 5.0, 12.0, 9.0, 15.0, 26.0, 33.0, 43.0, 50.0, 88.0, 96.0, 134.0, 198.0, 323.0, 559.0, 863.0, 1532.0, 2779.0, 6047.0, 15034.0, 50087.0, 371145.0, 509828.0, 58853.0, 16903.0, 6547.0, 3156.0, 1576.0, 905.0, 558.0, 343.0, 247.0, 150.0, 107.0, 93.0, 51.0, 40.0, 32.0, 25.0, 18.0, 7.0, 7.0, 7.0, 4.0, 3.0, 0.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.041595458984375, -0.04025602340698242, -0.038916587829589844, -0.037577152252197266, -0.03623771667480469, -0.03489828109741211, -0.03355884552001953, -0.03221940994262695, -0.030879974365234375, -0.029540538787841797, -0.02820110321044922, -0.02686166763305664, -0.025522232055664062, -0.024182796478271484, -0.022843360900878906, -0.021503925323486328, -0.02016448974609375, -0.018825054168701172, -0.017485618591308594, -0.016146183013916016, -0.014806747436523438, -0.01346731185913086, -0.012127876281738281, -0.010788440704345703, -0.009449005126953125, -0.008109569549560547, -0.006770133972167969, -0.005430698394775391, -0.0040912628173828125, -0.0027518272399902344, -0.0014123916625976562, -7.295608520507812e-05, 0.0012664794921875, 0.002605915069580078, 0.003945350646972656, 0.005284786224365234, 0.0066242218017578125, 0.00796365737915039, 0.009303092956542969, 0.010642528533935547, 0.011981964111328125, 0.013321399688720703, 0.014660835266113281, 0.01600027084350586, 0.017339706420898438, 0.018679141998291016, 0.020018577575683594, 0.021358013153076172, 0.02269744873046875, 0.024036884307861328, 0.025376319885253906, 0.026715755462646484, 0.028055191040039062, 0.02939462661743164, 0.03073406219482422, 0.0320734977722168, 0.033412933349609375, 0.03475236892700195, 0.03609180450439453, 0.03743124008178711, 0.03877067565917969, 0.040110111236572266, 0.041449546813964844, 0.04278898239135742, 0.04412841796875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 6.0, 7.0, 9.0, 19.0, 16.0, 27.0, 32.0, 39.0, 51.0, 74.0, 123.0, 146.0, 131.0, 76.0, 60.0, 30.0, 30.0, 15.0, 15.0, 15.0, 10.0, 14.0, 9.0, 7.0, 5.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0001277923583984375, -0.00012397393584251404, -0.00012015551328659058, -0.00011633709073066711, -0.00011251866817474365, -0.00010870024561882019, -0.00010488182306289673, -0.00010106340050697327, -9.72449779510498e-05, -9.342655539512634e-05, -8.960813283920288e-05, -8.578971028327942e-05, -8.197128772735596e-05, -7.81528651714325e-05, -7.433444261550903e-05, -7.051602005958557e-05, -6.669759750366211e-05, -6.287917494773865e-05, -5.9060752391815186e-05, -5.5242329835891724e-05, -5.142390727996826e-05, -4.76054847240448e-05, -4.378706216812134e-05, -3.9968639612197876e-05, -3.6150217056274414e-05, -3.233179450035095e-05, -2.851337194442749e-05, -2.469494938850403e-05, -2.0876526832580566e-05, -1.7058104276657104e-05, -1.3239681720733643e-05, -9.42125916481018e-06, -5.602836608886719e-06, -1.7844140529632568e-06, 2.034008502960205e-06, 5.852431058883667e-06, 9.670853614807129e-06, 1.348927617073059e-05, 1.7307698726654053e-05, 2.1126121282577515e-05, 2.4944543838500977e-05, 2.876296639442444e-05, 3.25813889503479e-05, 3.639981150627136e-05, 4.0218234062194824e-05, 4.4036656618118286e-05, 4.785507917404175e-05, 5.167350172996521e-05, 5.549192428588867e-05, 5.9310346841812134e-05, 6.31287693977356e-05, 6.694719195365906e-05, 7.076561450958252e-05, 7.458403706550598e-05, 7.840245962142944e-05, 8.22208821773529e-05, 8.603930473327637e-05, 8.985772728919983e-05, 9.367614984512329e-05, 9.749457240104675e-05, 0.00010131299495697021, 0.00010513141751289368, 0.00010894984006881714, 0.0001127682626247406, 0.00011658668518066406]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 10.0, 14.0, 26.0, 35.0, 59.0, 102.0, 202.0, 377.0, 848.0, 2798.0, 14173.0, 205901.0, 788242.0, 28824.0, 4568.0, 1271.0, 524.0, 243.0, 130.0, 73.0, 43.0, 29.0, 10.0, 18.0, 6.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.113525390625, -0.11038684844970703, -0.10724830627441406, -0.1041097640991211, -0.10097122192382812, -0.09783267974853516, -0.09469413757324219, -0.09155559539794922, -0.08841705322265625, -0.08527851104736328, -0.08213996887207031, -0.07900142669677734, -0.07586288452148438, -0.0727243423461914, -0.06958580017089844, -0.06644725799560547, -0.0633087158203125, -0.06017017364501953, -0.05703163146972656, -0.053893089294433594, -0.050754547119140625, -0.047616004943847656, -0.04447746276855469, -0.04133892059326172, -0.03820037841796875, -0.03506183624267578, -0.03192329406738281, -0.028784751892089844, -0.025646209716796875, -0.022507667541503906, -0.019369125366210938, -0.01623058319091797, -0.013092041015625, -0.009953498840332031, -0.0068149566650390625, -0.0036764144897460938, -0.000537872314453125, 0.0026006698608398438, 0.0057392120361328125, 0.008877754211425781, 0.01201629638671875, 0.015154838562011719, 0.018293380737304688, 0.021431922912597656, 0.024570465087890625, 0.027709007263183594, 0.030847549438476562, 0.03398609161376953, 0.0371246337890625, 0.04026317596435547, 0.04340171813964844, 0.046540260314941406, 0.049678802490234375, 0.052817344665527344, 0.05595588684082031, 0.05909442901611328, 0.06223297119140625, 0.06537151336669922, 0.06851005554199219, 0.07164859771728516, 0.07478713989257812, 0.0779256820678711, 0.08106422424316406, 0.08420276641845703, 0.08734130859375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 14.0, 23.0, 25.0, 32.0, 42.0, 73.0, 111.0, 155.0, 151.0, 113.0, 86.0, 39.0, 36.0, 20.0, 26.0, 12.0, 10.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05389404296875, -0.051903724670410156, -0.04991340637207031, -0.04792308807373047, -0.045932769775390625, -0.04394245147705078, -0.04195213317871094, -0.039961814880371094, -0.03797149658203125, -0.035981178283691406, -0.03399085998535156, -0.03200054168701172, -0.030010223388671875, -0.02801990509033203, -0.026029586791992188, -0.024039268493652344, -0.0220489501953125, -0.020058631896972656, -0.018068313598632812, -0.01607799530029297, -0.014087677001953125, -0.012097358703613281, -0.010107040405273438, -0.008116722106933594, -0.00612640380859375, -0.004136085510253906, -0.0021457672119140625, -0.00015544891357421875, 0.001834869384765625, 0.0038251876831054688, 0.0058155059814453125, 0.007805824279785156, 0.009796142578125, 0.011786460876464844, 0.013776779174804688, 0.01576709747314453, 0.017757415771484375, 0.01974773406982422, 0.021738052368164062, 0.023728370666503906, 0.02571868896484375, 0.027709007263183594, 0.029699325561523438, 0.03168964385986328, 0.033679962158203125, 0.03567028045654297, 0.03766059875488281, 0.039650917053222656, 0.0416412353515625, 0.043631553649902344, 0.04562187194824219, 0.04761219024658203, 0.049602508544921875, 0.05159282684326172, 0.05358314514160156, 0.055573463439941406, 0.05756378173828125, 0.059554100036621094, 0.06154441833496094, 0.06353473663330078, 0.06552505493164062, 0.06751537322998047, 0.06950569152832031, 0.07149600982666016, 0.073486328125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 13.0, 38.0, 93.0, 223.0, 303.0, 223.0, 59.0, 36.0, 13.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.7570199966430664, -2.704591989517212, -2.6521639823913574, -2.599735975265503, -2.5473079681396484, -2.494879722595215, -2.4424517154693604, -2.390023708343506, -2.3375957012176514, -2.285167694091797, -2.2327396869659424, -2.180311679840088, -2.1278834342956543, -2.0754554271698, -2.0230274200439453, -1.9705994129180908, -1.9181714057922363, -1.8657433986663818, -1.8133153915405273, -1.7608872652053833, -1.7084592580795288, -1.6560312509536743, -1.6036031246185303, -1.5511751174926758, -1.4987471103668213, -1.4463191032409668, -1.3938910961151123, -1.3414629697799683, -1.2890349626541138, -1.2366069555282593, -1.1841788291931152, -1.1317508220672607, -1.0793226957321167, -1.0268946886062622, -0.9744666218757629, -0.9220385551452637, -0.8696105480194092, -0.8171825408935547, -0.7647544741630554, -0.7123264074325562, -0.6598984003067017, -0.6074703931808472, -0.5550423264503479, -0.5026142597198486, -0.45018625259399414, -0.39775821566581726, -0.3453301787376404, -0.2929021418094635, -0.24047410488128662, -0.18804606795310974, -0.13561803102493286, -0.08318999409675598, -0.0307619571685791, 0.02166607975959778, 0.07409411668777466, 0.12652215361595154, 0.17895019054412842, 0.2313782274723053, 0.2838062644004822, 0.33623430132865906, 0.38866233825683594, 0.4410903751850128, 0.4935184121131897, 0.545946478843689, 0.5983744859695435]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 0.0, 5.0, 7.0, 13.0, 4.0, 7.0, 4.0, 15.0, 16.0, 16.0, 16.0, 29.0, 25.0, 23.0, 32.0, 33.0, 46.0, 32.0, 51.0, 41.0, 50.0, 54.0, 53.0, 44.0, 49.0, 40.0, 33.0, 29.0, 23.0, 32.0, 22.0, 27.0, 20.0, 20.0, 18.0, 20.0, 14.0, 9.0, 9.0, 6.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.40834635496139526, -0.3949120342731476, -0.3814776837825775, -0.36804336309432983, -0.35460904240608215, -0.3411746919155121, -0.3277403712272644, -0.31430602073669434, -0.30087170004844666, -0.287437379360199, -0.2740030288696289, -0.2605687081813812, -0.24713437259197235, -0.23370003700256348, -0.2202657163143158, -0.20683138072490692, -0.19339706003665924, -0.17996272444725037, -0.16652840375900269, -0.1530940681695938, -0.13965973258018494, -0.12622541189193726, -0.11279107630252838, -0.0993567407131195, -0.08592241257429123, -0.07248808443546295, -0.05905374884605408, -0.0456194207072258, -0.032185088843107224, -0.018750756978988647, -0.00531642884016037, 0.008117906749248505, 0.021552234888076782, 0.03498656675219536, 0.048420898616313934, 0.06185522675514221, 0.07528956234455109, 0.08872389048337936, 0.10215821862220764, 0.11559255421161652, 0.1290268898010254, 0.14246122539043427, 0.15589554607868195, 0.16932988166809082, 0.1827642172574997, 0.19619855284690857, 0.20963287353515625, 0.22306720912456512, 0.2365015298128128, 0.24993586540222168, 0.26337018609046936, 0.27680450677871704, 0.2902388572692871, 0.3036731779575348, 0.31710749864578247, 0.33054184913635254, 0.3439761698246002, 0.3574104905128479, 0.37084484100341797, 0.38427916169166565, 0.39771348237991333, 0.4111478328704834, 0.4245821535587311, 0.43801647424697876, 0.45145082473754883]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 21.0, 13.0, 33.0, 57.0, 100.0, 253.0, 736.0, 14507.0, 4177191.0, 839.0, 260.0, 110.0, 62.0, 23.0, 20.0, 10.0, 12.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.415771484375, -0.4031867980957031, -0.39060211181640625, -0.3780174255371094, -0.3654327392578125, -0.3528480529785156, -0.34026336669921875, -0.3276786804199219, -0.315093994140625, -0.3025093078613281, -0.28992462158203125, -0.2773399353027344, -0.2647552490234375, -0.2521705627441406, -0.23958587646484375, -0.22700119018554688, -0.21441650390625, -0.20183181762695312, -0.18924713134765625, -0.17666244506835938, -0.1640777587890625, -0.15149307250976562, -0.13890838623046875, -0.12632369995117188, -0.113739013671875, -0.10115432739257812, -0.08856964111328125, -0.07598495483398438, -0.0634002685546875, -0.050815582275390625, -0.03823089599609375, -0.025646209716796875, -0.0130615234375, -0.000476837158203125, 0.01210784912109375, 0.024692535400390625, 0.0372772216796875, 0.049861907958984375, 0.06244659423828125, 0.07503128051757812, 0.087615966796875, 0.10020065307617188, 0.11278533935546875, 0.12537002563476562, 0.1379547119140625, 0.15053939819335938, 0.16312408447265625, 0.17570877075195312, 0.18829345703125, 0.20087814331054688, 0.21346282958984375, 0.22604751586914062, 0.2386322021484375, 0.2512168884277344, 0.26380157470703125, 0.2763862609863281, 0.288970947265625, 0.3015556335449219, 0.31414031982421875, 0.3267250061035156, 0.3393096923828125, 0.3518943786621094, 0.36447906494140625, 0.3770637512207031, 0.3896484375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 22.0, 50.0, 86.0, 144.0, 190.0, 199.0, 138.0, 89.0, 35.0, 21.0, 7.0, 5.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.133544921875, -0.13036537170410156, -0.12718582153320312, -0.12400627136230469, -0.12082672119140625, -0.11764717102050781, -0.11446762084960938, -0.11128807067871094, -0.1081085205078125, -0.10492897033691406, -0.10174942016601562, -0.09856986999511719, -0.09539031982421875, -0.09221076965332031, -0.08903121948242188, -0.08585166931152344, -0.082672119140625, -0.07949256896972656, -0.07631301879882812, -0.07313346862792969, -0.06995391845703125, -0.06677436828613281, -0.06359481811523438, -0.06041526794433594, -0.0572357177734375, -0.05405616760253906, -0.050876617431640625, -0.04769706726074219, -0.04451751708984375, -0.04133796691894531, -0.038158416748046875, -0.03497886657714844, -0.03179931640625, -0.028619766235351562, -0.025440216064453125, -0.022260665893554688, -0.01908111572265625, -0.015901565551757812, -0.012722015380859375, -0.009542465209960938, -0.0063629150390625, -0.0031833648681640625, -3.814697265625e-06, 0.0031757354736328125, 0.00635528564453125, 0.009534835815429688, 0.012714385986328125, 0.015893936157226562, 0.019073486328125, 0.022253036499023438, 0.025432586669921875, 0.028612136840820312, 0.03179168701171875, 0.03497123718261719, 0.038150787353515625, 0.04133033752441406, 0.0445098876953125, 0.04768943786621094, 0.050868988037109375, 0.05404853820800781, 0.05722808837890625, 0.06040763854980469, 0.06358718872070312, 0.06676673889160156, 0.0699462890625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 12.0, 4.0, 9.0, 6.0, 13.0, 14.0, 21.0, 29.0, 40.0, 59.0, 82.0, 151.0, 221.0, 358.0, 642.0, 1162.0, 2314.0, 7023.0, 4170655.0, 6431.0, 2145.0, 1187.0, 633.0, 396.0, 236.0, 140.0, 90.0, 62.0, 37.0, 21.0, 15.0, 14.0, 13.0, 9.0, 4.0, 14.0, 5.0, 5.0, 5.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10406494140625, -0.100860595703125, -0.09765625, -0.094451904296875, -0.09124755859375, -0.088043212890625, -0.0848388671875, -0.081634521484375, -0.07843017578125, -0.075225830078125, -0.072021484375, -0.068817138671875, -0.06561279296875, -0.062408447265625, -0.0592041015625, -0.055999755859375, -0.05279541015625, -0.049591064453125, -0.04638671875, -0.043182373046875, -0.03997802734375, -0.036773681640625, -0.0335693359375, -0.030364990234375, -0.02716064453125, -0.023956298828125, -0.020751953125, -0.017547607421875, -0.01434326171875, -0.011138916015625, -0.0079345703125, -0.004730224609375, -0.00152587890625, 0.001678466796875, 0.0048828125, 0.008087158203125, 0.01129150390625, 0.014495849609375, 0.0177001953125, 0.020904541015625, 0.02410888671875, 0.027313232421875, 0.030517578125, 0.033721923828125, 0.03692626953125, 0.040130615234375, 0.0433349609375, 0.046539306640625, 0.04974365234375, 0.052947998046875, 0.05615234375, 0.059356689453125, 0.06256103515625, 0.065765380859375, 0.0689697265625, 0.072174072265625, 0.07537841796875, 0.078582763671875, 0.081787109375, 0.084991455078125, 0.08819580078125, 0.091400146484375, 0.0946044921875, 0.097808837890625, 0.10101318359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 29.0, 4014.0, 20.0, 5.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011627197265625, -0.010914802551269531, -0.010202407836914062, -0.009490013122558594, -0.008777618408203125, -0.008065223693847656, -0.0073528289794921875, -0.006640434265136719, -0.00592803955078125, -0.005215644836425781, -0.0045032501220703125, -0.0037908554077148438, -0.003078460693359375, -0.0023660659790039062, -0.0016536712646484375, -0.0009412765502929688, -0.0002288818359375, 0.00048351287841796875, 0.0011959075927734375, 0.0019083023071289062, 0.002620697021484375, 0.0033330917358398438, 0.0040454864501953125, 0.004757881164550781, 0.00547027587890625, 0.006182670593261719, 0.0068950653076171875, 0.007607460021972656, 0.008319854736328125, 0.009032249450683594, 0.009744644165039062, 0.010457038879394531, 0.01116943359375, 0.011881828308105469, 0.012594223022460938, 0.013306617736816406, 0.014019012451171875, 0.014731407165527344, 0.015443801879882812, 0.01615619659423828, 0.01686859130859375, 0.01758098602294922, 0.018293380737304688, 0.019005775451660156, 0.019718170166015625, 0.020430564880371094, 0.021142959594726562, 0.02185535430908203, 0.0225677490234375, 0.02328014373779297, 0.023992538452148438, 0.024704933166503906, 0.025417327880859375, 0.026129722595214844, 0.026842117309570312, 0.02755451202392578, 0.02826690673828125, 0.02897930145263672, 0.029691696166992188, 0.030404090881347656, 0.031116485595703125, 0.031828880310058594, 0.03254127502441406, 0.03325366973876953, 0.033966064453125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 11.0, 66.0, 471.0, 356.0, 85.0, 19.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25576069951057434, -0.24949349462985992, -0.2432262897491455, -0.2369590699672699, -0.23069186508655548, -0.22442466020584106, -0.21815745532512665, -0.21189025044441223, -0.20562304556369781, -0.1993558406829834, -0.19308863580226898, -0.18682143092155457, -0.18055421113967896, -0.17428700625896454, -0.16801980137825012, -0.1617525964975357, -0.1554853916168213, -0.14921818673610687, -0.14295098185539246, -0.13668376207351685, -0.13041655719280243, -0.12414935231208801, -0.1178821474313736, -0.11161494255065918, -0.10534772276878357, -0.09908051788806915, -0.09281330555677414, -0.08654610067605972, -0.0802788957953453, -0.07401168346405029, -0.06774447858333588, -0.06147727370262146, -0.05521006882190704, -0.04894286021590233, -0.04267565533518791, -0.0364084467291832, -0.03014123998582363, -0.023874033242464066, -0.01760682463645935, -0.011339619755744934, -0.005072411149740219, 0.001194796059280634, 0.007462003268301487, 0.013729210942983627, 0.019996417686343193, 0.02626362442970276, 0.032530833035707474, 0.03879803791642189, 0.045065246522426605, 0.05133245512843132, 0.05759966000914574, 0.06386686861515045, 0.07013407349586487, 0.07640127837657928, 0.0826684907078743, 0.08893569558858871, 0.09520290791988373, 0.10147011280059814, 0.10773732513189316, 0.11400453001260757, 0.12027173489332199, 0.126538947224617, 0.13280615210533142, 0.13907335698604584, 0.14534056186676025]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 10.0, 9.0, 15.0, 25.0, 33.0, 31.0, 45.0, 50.0, 52.0, 57.0, 86.0, 84.0, 72.0, 63.0, 55.0, 47.0, 52.0, 46.0, 34.0, 36.0, 31.0, 16.0, 21.0, 7.0, 6.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04196751117706299, -0.04075542464852333, -0.03954333811998367, -0.03833124786615372, -0.03711916133761406, -0.0359070748090744, -0.034694984555244446, -0.03348289802670479, -0.03227081149816513, -0.031058724969625473, -0.029846636578440666, -0.02863454818725586, -0.027422461658716202, -0.026210375130176544, -0.024998286738991737, -0.02378619834780693, -0.022574111819267273, -0.021362025290727615, -0.02014993689954281, -0.018937848508358, -0.017725761979818344, -0.016513675451278687, -0.01530158706009388, -0.014089499600231647, -0.012877412140369415, -0.011665324680507183, -0.01045323722064495, -0.009241149760782719, -0.008029062300920486, -0.006816974841058254, -0.005604887381196022, -0.00439279992133379, -0.0031807124614715576, -0.0019686250016093254, -0.0007565375417470932, 0.000455549918115139, 0.0016676373779773712, 0.0028797248378396034, 0.004091812297701836, 0.005303899757564068, 0.0065159872174263, 0.007728074677288532, 0.008940162137150764, 0.010152249597012997, 0.011364337056875229, 0.012576424516737461, 0.013788511976599693, 0.015000599436461926, 0.016212686896324158, 0.017424773424863815, 0.018636861816048622, 0.01984895020723343, 0.021061036735773087, 0.022273123264312744, 0.02348521165549755, 0.024697300046682358, 0.025909386575222015, 0.027121473103761673, 0.02833356149494648, 0.029545649886131287, 0.030757736414670944, 0.0319698229432106, 0.03318191319704056, 0.034393999725580215, 0.03560608625411987]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 13.0, 16.0, 22.0, 30.0, 53.0, 83.0, 117.0, 237.0, 392.0, 697.0, 1555.0, 3955.0, 23843.0, 662143.0, 335209.0, 14391.0, 3071.0, 1218.0, 625.0, 307.0, 177.0, 142.0, 74.0, 43.0, 42.0, 22.0, 19.0, 14.0, 8.0, 4.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.422607421875, -0.4104957580566406, -0.39838409423828125, -0.3862724304199219, -0.3741607666015625, -0.3620491027832031, -0.34993743896484375, -0.3378257751464844, -0.325714111328125, -0.3136024475097656, -0.30149078369140625, -0.2893791198730469, -0.2772674560546875, -0.2651557922363281, -0.25304412841796875, -0.24093246459960938, -0.22882080078125, -0.21670913696289062, -0.20459747314453125, -0.19248580932617188, -0.1803741455078125, -0.16826248168945312, -0.15615081787109375, -0.14403915405273438, -0.131927490234375, -0.11981582641601562, -0.10770416259765625, -0.09559249877929688, -0.0834808349609375, -0.07136917114257812, -0.05925750732421875, -0.047145843505859375, -0.0350341796875, -0.022922515869140625, -0.01081085205078125, 0.001300811767578125, 0.0134124755859375, 0.025524139404296875, 0.03763580322265625, 0.049747467041015625, 0.061859130859375, 0.07397079467773438, 0.08608245849609375, 0.09819412231445312, 0.1103057861328125, 0.12241744995117188, 0.13452911376953125, 0.14664077758789062, 0.15875244140625, 0.17086410522460938, 0.18297576904296875, 0.19508743286132812, 0.2071990966796875, 0.21931076049804688, 0.23142242431640625, 0.24353408813476562, 0.255645751953125, 0.2677574157714844, 0.27986907958984375, 0.2919807434082031, 0.3040924072265625, 0.3162040710449219, 0.32831573486328125, 0.3404273986816406, 0.3525390625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 23.0, 43.0, 96.0, 143.0, 189.0, 194.0, 141.0, 90.0, 35.0, 20.0, 6.0, 6.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.133544921875, -0.13036727905273438, -0.12718963623046875, -0.12401199340820312, -0.1208343505859375, -0.11765670776367188, -0.11447906494140625, -0.11130142211914062, -0.108123779296875, -0.10494613647460938, -0.10176849365234375, -0.09859085083007812, -0.0954132080078125, -0.09223556518554688, -0.08905792236328125, -0.08588027954101562, -0.08270263671875, -0.07952499389648438, -0.07634735107421875, -0.07316970825195312, -0.0699920654296875, -0.06681442260742188, -0.06363677978515625, -0.060459136962890625, -0.057281494140625, -0.054103851318359375, -0.05092620849609375, -0.047748565673828125, -0.0445709228515625, -0.041393280029296875, -0.03821563720703125, -0.035037994384765625, -0.0318603515625, -0.028682708740234375, -0.02550506591796875, -0.022327423095703125, -0.0191497802734375, -0.015972137451171875, -0.01279449462890625, -0.009616851806640625, -0.006439208984375, -0.003261566162109375, -8.392333984375e-05, 0.003093719482421875, 0.0062713623046875, 0.009449005126953125, 0.01262664794921875, 0.015804290771484375, 0.01898193359375, 0.022159576416015625, 0.02533721923828125, 0.028514862060546875, 0.0316925048828125, 0.034870147705078125, 0.03804779052734375, 0.041225433349609375, 0.044403076171875, 0.047580718994140625, 0.05075836181640625, 0.053936004638671875, 0.0571136474609375, 0.060291290283203125, 0.06346893310546875, 0.06664657592773438, 0.06982421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 7.0, 8.0, 7.0, 9.0, 24.0, 21.0, 25.0, 35.0, 49.0, 94.0, 154.0, 264.0, 462.0, 887.0, 2296.0, 6741.0, 25691.0, 144726.0, 686026.0, 144016.0, 25791.0, 6775.0, 2331.0, 943.0, 459.0, 262.0, 144.0, 108.0, 66.0, 41.0, 23.0, 24.0, 18.0, 10.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1419677734375, -0.13746070861816406, -0.13295364379882812, -0.1284465789794922, -0.12393951416015625, -0.11943244934082031, -0.11492538452148438, -0.11041831970214844, -0.1059112548828125, -0.10140419006347656, -0.09689712524414062, -0.09239006042480469, -0.08788299560546875, -0.08337593078613281, -0.07886886596679688, -0.07436180114746094, -0.069854736328125, -0.06534767150878906, -0.060840606689453125, -0.05633354187011719, -0.05182647705078125, -0.04731941223144531, -0.042812347412109375, -0.03830528259277344, -0.0337982177734375, -0.029291152954101562, -0.024784088134765625, -0.020277023315429688, -0.01576995849609375, -0.011262893676757812, -0.006755828857421875, -0.0022487640380859375, 0.00225830078125, 0.0067653656005859375, 0.011272430419921875, 0.015779495239257812, 0.02028656005859375, 0.024793624877929688, 0.029300689697265625, 0.03380775451660156, 0.0383148193359375, 0.04282188415527344, 0.047328948974609375, 0.05183601379394531, 0.05634307861328125, 0.06085014343261719, 0.06535720825195312, 0.06986427307128906, 0.074371337890625, 0.07887840270996094, 0.08338546752929688, 0.08789253234863281, 0.09239959716796875, 0.09690666198730469, 0.10141372680664062, 0.10592079162597656, 0.1104278564453125, 0.11493492126464844, 0.11944198608398438, 0.12394905090332031, 0.12845611572265625, 0.1329631805419922, 0.13747024536132812, 0.14197731018066406, 0.146484375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 6.0, 6.0, 5.0, 10.0, 13.0, 14.0, 22.0, 19.0, 22.0, 32.0, 32.0, 32.0, 49.0, 48.0, 39.0, 47.0, 39.0, 50.0, 54.0, 66.0, 52.0, 40.0, 39.0, 37.0, 27.0, 29.0, 29.0, 26.0, 24.0, 26.0, 16.0, 11.0, 17.0, 6.0, 6.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08770751953125, -0.08431529998779297, -0.08092308044433594, -0.0775308609008789, -0.07413864135742188, -0.07074642181396484, -0.06735420227050781, -0.06396198272705078, -0.06056976318359375, -0.05717754364013672, -0.05378532409667969, -0.050393104553222656, -0.047000885009765625, -0.043608665466308594, -0.04021644592285156, -0.03682422637939453, -0.0334320068359375, -0.03003978729248047, -0.026647567749023438, -0.023255348205566406, -0.019863128662109375, -0.016470909118652344, -0.013078689575195312, -0.009686470031738281, -0.00629425048828125, -0.0029020309448242188, 0.0004901885986328125, 0.0038824081420898438, 0.007274627685546875, 0.010666847229003906, 0.014059066772460938, 0.01745128631591797, 0.020843505859375, 0.02423572540283203, 0.027627944946289062, 0.031020164489746094, 0.034412384033203125, 0.037804603576660156, 0.04119682312011719, 0.04458904266357422, 0.04798126220703125, 0.05137348175048828, 0.05476570129394531, 0.058157920837402344, 0.061550140380859375, 0.0649423599243164, 0.06833457946777344, 0.07172679901123047, 0.0751190185546875, 0.07851123809814453, 0.08190345764160156, 0.0852956771850586, 0.08868789672851562, 0.09208011627197266, 0.09547233581542969, 0.09886455535888672, 0.10225677490234375, 0.10564899444580078, 0.10904121398925781, 0.11243343353271484, 0.11582565307617188, 0.1192178726196289, 0.12261009216308594, 0.12600231170654297, 0.12939453125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 8.0, 5.0, 5.0, 9.0, 8.0, 17.0, 16.0, 35.0, 36.0, 49.0, 85.0, 116.0, 171.0, 282.0, 626.0, 1515.0, 4673.0, 31205.0, 967066.0, 34806.0, 4769.0, 1551.0, 667.0, 296.0, 162.0, 127.0, 77.0, 48.0, 28.0, 21.0, 16.0, 10.0, 8.0, 8.0, 8.0, 6.0, 4.0, 0.0, 4.0, 4.0, 1.0, 6.0, 0.0, 1.0, 1.0], "bins": [-0.2061767578125, -0.2006816864013672, -0.19518661499023438, -0.18969154357910156, -0.18419647216796875, -0.17870140075683594, -0.17320632934570312, -0.1677112579345703, -0.1622161865234375, -0.1567211151123047, -0.15122604370117188, -0.14573097229003906, -0.14023590087890625, -0.13474082946777344, -0.12924575805664062, -0.12375068664550781, -0.118255615234375, -0.11276054382324219, -0.10726547241210938, -0.10177040100097656, -0.09627532958984375, -0.09078025817871094, -0.08528518676757812, -0.07979011535644531, -0.0742950439453125, -0.06879997253417969, -0.06330490112304688, -0.05780982971191406, -0.05231475830078125, -0.04681968688964844, -0.041324615478515625, -0.03582954406738281, -0.03033447265625, -0.024839401245117188, -0.019344329833984375, -0.013849258422851562, -0.00835418701171875, -0.0028591156005859375, 0.002635955810546875, 0.008131027221679688, 0.0136260986328125, 0.019121170043945312, 0.024616241455078125, 0.030111312866210938, 0.03560638427734375, 0.04110145568847656, 0.046596527099609375, 0.05209159851074219, 0.057586669921875, 0.06308174133300781, 0.06857681274414062, 0.07407188415527344, 0.07956695556640625, 0.08506202697753906, 0.09055709838867188, 0.09605216979980469, 0.1015472412109375, 0.10704231262207031, 0.11253738403320312, 0.11803245544433594, 0.12352752685546875, 0.12902259826660156, 0.13451766967773438, 0.1400127410888672, 0.1455078125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 8.0, 11.0, 13.0, 14.0, 26.0, 31.0, 51.0, 66.0, 117.0, 165.0, 175.0, 97.0, 66.0, 49.0, 30.0, 19.0, 15.0, 9.0, 6.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0002484321594238281, -0.00024206936359405518, -0.00023570656776428223, -0.00022934377193450928, -0.00022298097610473633, -0.00021661818027496338, -0.00021025538444519043, -0.00020389258861541748, -0.00019752979278564453, -0.00019116699695587158, -0.00018480420112609863, -0.00017844140529632568, -0.00017207860946655273, -0.00016571581363677979, -0.00015935301780700684, -0.0001529902219772339, -0.00014662742614746094, -0.000140264630317688, -0.00013390183448791504, -0.0001275390386581421, -0.00012117624282836914, -0.00011481344699859619, -0.00010845065116882324, -0.00010208785533905029, -9.572505950927734e-05, -8.93622636795044e-05, -8.299946784973145e-05, -7.66366720199585e-05, -7.027387619018555e-05, -6.39110803604126e-05, -5.754828453063965e-05, -5.11854887008667e-05, -4.482269287109375e-05, -3.84598970413208e-05, -3.209710121154785e-05, -2.5734305381774902e-05, -1.9371509552001953e-05, -1.3008713722229004e-05, -6.645917892456055e-06, -2.8312206268310547e-07, 6.079673767089844e-06, 1.2442469596862793e-05, 1.8805265426635742e-05, 2.516806125640869e-05, 3.153085708618164e-05, 3.789365291595459e-05, 4.425644874572754e-05, 5.061924457550049e-05, 5.698204040527344e-05, 6.334483623504639e-05, 6.970763206481934e-05, 7.607042789459229e-05, 8.243322372436523e-05, 8.879601955413818e-05, 9.515881538391113e-05, 0.00010152161121368408, 0.00010788440704345703, 0.00011424720287322998, 0.00012060999870300293, 0.00012697279453277588, 0.00013333559036254883, 0.00013969838619232178, 0.00014606118202209473, 0.00015242397785186768, 0.00015878677368164062]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 7.0, 11.0, 19.0, 29.0, 36.0, 60.0, 104.0, 169.0, 406.0, 1003.0, 3470.0, 37093.0, 990103.0, 12488.0, 2148.0, 698.0, 323.0, 174.0, 74.0, 44.0, 30.0, 16.0, 11.0, 9.0, 1.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.2979469299316406, -0.28900909423828125, -0.2800712585449219, -0.2711334228515625, -0.2621955871582031, -0.25325775146484375, -0.24431991577148438, -0.235382080078125, -0.22644424438476562, -0.21750640869140625, -0.20856857299804688, -0.1996307373046875, -0.19069290161132812, -0.18175506591796875, -0.17281723022460938, -0.16387939453125, -0.15494155883789062, -0.14600372314453125, -0.13706588745117188, -0.1281280517578125, -0.11919021606445312, -0.11025238037109375, -0.10131454467773438, -0.092376708984375, -0.08343887329101562, -0.07450103759765625, -0.06556320190429688, -0.0566253662109375, -0.047687530517578125, -0.03874969482421875, -0.029811859130859375, -0.0208740234375, -0.011936187744140625, -0.00299835205078125, 0.005939483642578125, 0.0148773193359375, 0.023815155029296875, 0.03275299072265625, 0.041690826416015625, 0.050628662109375, 0.059566497802734375, 0.06850433349609375, 0.07744216918945312, 0.0863800048828125, 0.09531784057617188, 0.10425567626953125, 0.11319351196289062, 0.12213134765625, 0.13106918334960938, 0.14000701904296875, 0.14894485473632812, 0.1578826904296875, 0.16682052612304688, 0.17575836181640625, 0.18469619750976562, 0.193634033203125, 0.20257186889648438, 0.21150970458984375, 0.22044754028320312, 0.2293853759765625, 0.23832321166992188, 0.24726104736328125, 0.2561988830566406, 0.26513671875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 9.0, 19.0, 17.0, 43.0, 81.0, 141.0, 268.0, 171.0, 103.0, 45.0, 39.0, 19.0, 16.0, 8.0, 10.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11175537109375, -0.10811710357666016, -0.10447883605957031, -0.10084056854248047, -0.09720230102539062, -0.09356403350830078, -0.08992576599121094, -0.0862874984741211, -0.08264923095703125, -0.0790109634399414, -0.07537269592285156, -0.07173442840576172, -0.06809616088867188, -0.06445789337158203, -0.06081962585449219, -0.057181358337402344, -0.0535430908203125, -0.049904823303222656, -0.04626655578613281, -0.04262828826904297, -0.038990020751953125, -0.03535175323486328, -0.03171348571777344, -0.028075218200683594, -0.02443695068359375, -0.020798683166503906, -0.017160415649414062, -0.013522148132324219, -0.009883880615234375, -0.006245613098144531, -0.0026073455810546875, 0.0010309219360351562, 0.004669189453125, 0.008307456970214844, 0.011945724487304688, 0.015583992004394531, 0.019222259521484375, 0.02286052703857422, 0.026498794555664062, 0.030137062072753906, 0.03377532958984375, 0.037413597106933594, 0.04105186462402344, 0.04469013214111328, 0.048328399658203125, 0.05196666717529297, 0.05560493469238281, 0.059243202209472656, 0.0628814697265625, 0.06651973724365234, 0.07015800476074219, 0.07379627227783203, 0.07743453979492188, 0.08107280731201172, 0.08471107482910156, 0.0883493423461914, 0.09198760986328125, 0.0956258773803711, 0.09926414489746094, 0.10290241241455078, 0.10654067993164062, 0.11017894744873047, 0.11381721496582031, 0.11745548248291016, 0.12109375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 0.0, 8.0, 9.0, 7.0, 22.0, 35.0, 51.0, 67.0, 111.0, 169.0, 181.0, 133.0, 73.0, 48.0, 33.0, 19.0, 18.0, 4.0, 5.0, 1.0, 5.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4616219997406006, -1.4269235134124756, -1.392224907875061, -1.357526421546936, -1.322827935218811, -1.2881293296813965, -1.2534308433532715, -1.2187323570251465, -1.184033751487732, -1.149335265159607, -1.1146366596221924, -1.0799381732940674, -1.0452396869659424, -1.0105410814285278, -0.9758425951004028, -0.9411440491676331, -0.9064455628395081, -0.8717470169067383, -0.8370485305786133, -0.8023499846458435, -0.7676514387130737, -0.7329529523849487, -0.698254406452179, -0.6635558605194092, -0.6288573741912842, -0.5941588282585144, -0.5594603419303894, -0.5247617959976196, -0.49006325006484985, -0.45536473393440247, -0.4206662178039551, -0.3859676718711853, -0.3512691259384155, -0.31657060980796814, -0.28187206387519836, -0.24717354774475098, -0.2124750167131424, -0.1777764856815338, -0.14307796955108643, -0.10837943851947784, -0.07368090748786926, -0.03898238018155098, -0.0042838528752326965, 0.030414670705795288, 0.06511320173740387, 0.09981173276901245, 0.13451024889945984, 0.16920877993106842, 0.203907310962677, 0.23860584199428558, 0.27330437302589417, 0.30800288915634155, 0.34270143508911133, 0.3773999512195587, 0.4120984673500061, 0.4467970132827759, 0.48149552941322327, 0.5161940455436707, 0.5508925914764404, 0.5855910778045654, 0.6202896237373352, 0.654988169670105, 0.68968665599823, 0.7243852019309998, 0.7590837478637695]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 5.0, 1.0, 6.0, 7.0, 6.0, 10.0, 14.0, 10.0, 18.0, 25.0, 18.0, 25.0, 28.0, 31.0, 31.0, 46.0, 45.0, 41.0, 44.0, 39.0, 40.0, 42.0, 47.0, 48.0, 33.0, 38.0, 45.0, 26.0, 21.0, 31.0, 31.0, 27.0, 12.0, 18.0, 25.0, 16.0, 13.0, 14.0, 8.0, 6.0, 4.0, 1.0, 6.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.4322248101234436, -0.4184243977069855, -0.40462398529052734, -0.3908235728740692, -0.3770231604576111, -0.36322277784347534, -0.3494223654270172, -0.3356219530105591, -0.32182154059410095, -0.3080211281776428, -0.2942207157611847, -0.28042030334472656, -0.2666199207305908, -0.2528194785118103, -0.23901909589767456, -0.22521868348121643, -0.2114182710647583, -0.19761785864830017, -0.18381744623184204, -0.1700170487165451, -0.15621663630008698, -0.14241622388362885, -0.1286158263683319, -0.11481541395187378, -0.10101500153541565, -0.08721458911895752, -0.07341418415307999, -0.059613775461912155, -0.045813366770744324, -0.032012954354286194, -0.01821254938840866, -0.004412144422531128, 0.009388267993927002, 0.023188676685094833, 0.036989085376262665, 0.050789494067430496, 0.06458990275859833, 0.07839031517505646, 0.09219072014093399, 0.10599112510681152, 0.11979153752326965, 0.13359194993972778, 0.1473923623561859, 0.16119275987148285, 0.17499317228794098, 0.1887935847043991, 0.20259398221969604, 0.21639439463615417, 0.2301948070526123, 0.24399521946907043, 0.25779563188552856, 0.2715960443019867, 0.2853964567184448, 0.29919683933258057, 0.3129972517490387, 0.3267976641654968, 0.34059807658195496, 0.3543984889984131, 0.3681989014148712, 0.38199931383132935, 0.3957996964454651, 0.4096001386642456, 0.42340052127838135, 0.4372009336948395, 0.4510013461112976]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 6.0, 14.0, 27.0, 74.0, 145.0, 490.0, 2040.0, 4186934.0, 3598.0, 580.0, 205.0, 68.0, 28.0, 18.0, 15.0, 7.0, 4.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62109375, -0.6001052856445312, -0.5791168212890625, -0.5581283569335938, -0.537139892578125, -0.5161514282226562, -0.4951629638671875, -0.47417449951171875, -0.45318603515625, -0.43219757080078125, -0.4112091064453125, -0.39022064208984375, -0.369232177734375, -0.34824371337890625, -0.3272552490234375, -0.30626678466796875, -0.2852783203125, -0.26428985595703125, -0.2433013916015625, -0.22231292724609375, -0.201324462890625, -0.18033599853515625, -0.1593475341796875, -0.13835906982421875, -0.11737060546875, -0.09638214111328125, -0.0753936767578125, -0.05440521240234375, -0.033416748046875, -0.01242828369140625, 0.0085601806640625, 0.02954864501953125, 0.050537109375, 0.07152557373046875, 0.0925140380859375, 0.11350250244140625, 0.134490966796875, 0.15547943115234375, 0.1764678955078125, 0.19745635986328125, 0.21844482421875, 0.23943328857421875, 0.2604217529296875, 0.28141021728515625, 0.302398681640625, 0.32338714599609375, 0.3443756103515625, 0.36536407470703125, 0.3863525390625, 0.40734100341796875, 0.4283294677734375, 0.44931793212890625, 0.470306396484375, 0.49129486083984375, 0.5122833251953125, 0.5332717895507812, 0.55426025390625, 0.5752487182617188, 0.5962371826171875, 0.6172256469726562, 0.638214111328125, 0.6592025756835938, 0.6801910400390625, 0.7011795043945312, 0.72216796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 18.0, 46.0, 89.0, 148.0, 186.0, 178.0, 169.0, 80.0, 39.0, 21.0, 2.0, 9.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1336669921875, -0.13048839569091797, -0.12730979919433594, -0.1241312026977539, -0.12095260620117188, -0.11777400970458984, -0.11459541320800781, -0.11141681671142578, -0.10823822021484375, -0.10505962371826172, -0.10188102722167969, -0.09870243072509766, -0.09552383422851562, -0.0923452377319336, -0.08916664123535156, -0.08598804473876953, -0.0828094482421875, -0.07963085174560547, -0.07645225524902344, -0.0732736587524414, -0.07009506225585938, -0.06691646575927734, -0.06373786926269531, -0.06055927276611328, -0.05738067626953125, -0.05420207977294922, -0.05102348327636719, -0.047844886779785156, -0.044666290283203125, -0.041487693786621094, -0.03830909729003906, -0.03513050079345703, -0.031951904296875, -0.02877330780029297, -0.025594711303710938, -0.022416114807128906, -0.019237518310546875, -0.016058921813964844, -0.012880325317382812, -0.009701728820800781, -0.00652313232421875, -0.0033445358276367188, -0.0001659393310546875, 0.0030126571655273438, 0.006191253662109375, 0.009369850158691406, 0.012548446655273438, 0.01572704315185547, 0.0189056396484375, 0.02208423614501953, 0.025262832641601562, 0.028441429138183594, 0.031620025634765625, 0.034798622131347656, 0.03797721862792969, 0.04115581512451172, 0.04433441162109375, 0.04751300811767578, 0.05069160461425781, 0.053870201110839844, 0.057048797607421875, 0.060227394104003906, 0.06340599060058594, 0.06658458709716797, 0.06976318359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 5.0, 16.0, 15.0, 25.0, 43.0, 81.0, 121.0, 258.0, 428.0, 877.0, 1734.0, 3965.0, 13742.0, 4104755.0, 56238.0, 6853.0, 2578.0, 1176.0, 585.0, 315.0, 192.0, 110.0, 55.0, 41.0, 30.0, 15.0, 6.0, 2.0, 5.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09503173828125, -0.09147930145263672, -0.08792686462402344, -0.08437442779541016, -0.08082199096679688, -0.0772695541381836, -0.07371711730957031, -0.07016468048095703, -0.06661224365234375, -0.06305980682373047, -0.05950736999511719, -0.055954933166503906, -0.052402496337890625, -0.048850059509277344, -0.04529762268066406, -0.04174518585205078, -0.0381927490234375, -0.03464031219482422, -0.031087875366210938, -0.027535438537597656, -0.023983001708984375, -0.020430564880371094, -0.016878128051757812, -0.013325691223144531, -0.00977325439453125, -0.006220817565917969, -0.0026683807373046875, 0.0008840560913085938, 0.004436492919921875, 0.007988929748535156, 0.011541366577148438, 0.015093803405761719, 0.018646240234375, 0.02219867706298828, 0.025751113891601562, 0.029303550720214844, 0.032855987548828125, 0.036408424377441406, 0.03996086120605469, 0.04351329803466797, 0.04706573486328125, 0.05061817169189453, 0.05417060852050781, 0.057723045349121094, 0.061275482177734375, 0.06482791900634766, 0.06838035583496094, 0.07193279266357422, 0.0754852294921875, 0.07903766632080078, 0.08259010314941406, 0.08614253997802734, 0.08969497680664062, 0.0932474136352539, 0.09679985046386719, 0.10035228729248047, 0.10390472412109375, 0.10745716094970703, 0.11100959777832031, 0.1145620346069336, 0.11811447143554688, 0.12166690826416016, 0.12521934509277344, 0.12877178192138672, 0.13232421875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 5.0, 14.0, 11.0, 60.0, 744.0, 3084.0, 91.0, 19.0, 12.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0229949951171875, -0.021999597549438477, -0.021004199981689453, -0.02000880241394043, -0.019013404846191406, -0.018018007278442383, -0.01702260971069336, -0.016027212142944336, -0.015031814575195312, -0.014036417007446289, -0.013041019439697266, -0.012045621871948242, -0.011050224304199219, -0.010054826736450195, -0.009059429168701172, -0.008064031600952148, -0.007068634033203125, -0.0060732364654541016, -0.005077838897705078, -0.004082441329956055, -0.0030870437622070312, -0.002091646194458008, -0.0010962486267089844, -0.00010085105895996094, 0.0008945465087890625, 0.001889944076538086, 0.0028853416442871094, 0.003880739212036133, 0.004876136779785156, 0.00587153434753418, 0.006866931915283203, 0.007862329483032227, 0.00885772705078125, 0.009853124618530273, 0.010848522186279297, 0.01184391975402832, 0.012839317321777344, 0.013834714889526367, 0.01483011245727539, 0.015825510025024414, 0.016820907592773438, 0.01781630516052246, 0.018811702728271484, 0.019807100296020508, 0.02080249786376953, 0.021797895431518555, 0.022793292999267578, 0.0237886905670166, 0.024784088134765625, 0.02577948570251465, 0.026774883270263672, 0.027770280838012695, 0.02876567840576172, 0.029761075973510742, 0.030756473541259766, 0.03175187110900879, 0.03274726867675781, 0.033742666244506836, 0.03473806381225586, 0.03573346138000488, 0.036728858947753906, 0.03772425651550293, 0.03871965408325195, 0.03971505165100098, 0.04071044921875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 9.0, 4.0, 6.0, 7.0, 14.0, 12.0, 31.0, 32.0, 51.0, 73.0, 103.0, 108.0, 110.0, 117.0, 76.0, 66.0, 52.0, 34.0, 20.0, 18.0, 20.0, 13.0, 5.0, 3.0, 7.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07730314880609512, -0.07460027933120728, -0.07189741730690002, -0.06919455528259277, -0.06649168580770493, -0.06378881633281708, -0.06108595430850983, -0.05838308855891228, -0.05568022280931473, -0.05297735705971718, -0.05027449131011963, -0.04757162556052208, -0.04486875981092453, -0.04216589406132698, -0.03946302831172943, -0.03676016256213188, -0.03405729681253433, -0.03135443106293678, -0.028651565313339233, -0.025948699563741684, -0.023245833814144135, -0.020542968064546585, -0.017840102314949036, -0.015137236565351486, -0.012434370815753937, -0.009731505066156387, -0.007028639316558838, -0.0043257735669612885, -0.001622907817363739, 0.0010799579322338104, 0.00378282368183136, 0.006485689431428909, 0.009188562631607056, 0.011891428381204605, 0.014594294130802155, 0.017297159880399704, 0.020000025629997253, 0.022702891379594803, 0.025405757129192352, 0.0281086228787899, 0.03081148862838745, 0.033514354377985, 0.03621722012758255, 0.0389200858771801, 0.04162295162677765, 0.0443258173763752, 0.04702868312597275, 0.0497315488755703, 0.05243441462516785, 0.055137280374765396, 0.057840146124362946, 0.060543011873960495, 0.06324587762355804, 0.0659487396478653, 0.06865160912275314, 0.07135447859764099, 0.07405734062194824, 0.0767602026462555, 0.07946307212114334, 0.08216594159603119, 0.08486880362033844, 0.08757166564464569, 0.09027453511953354, 0.09297740459442139, 0.09568026661872864]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 3.0, 13.0, 8.0, 14.0, 20.0, 16.0, 28.0, 35.0, 39.0, 47.0, 48.0, 49.0, 50.0, 52.0, 57.0, 51.0, 46.0, 55.0, 37.0, 54.0, 43.0, 53.0, 31.0, 27.0, 22.0, 26.0, 19.0, 13.0, 10.0, 10.0, 7.0, 5.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.07715767621994019, -0.07499028742313385, -0.07282289862632751, -0.07065550982952118, -0.06848812103271484, -0.06632072478532791, -0.06415333598852158, -0.06198594719171524, -0.059818558394908905, -0.05765116959810257, -0.055483780801296234, -0.0533163882791996, -0.051148999482393265, -0.04898161068558693, -0.046814218163490295, -0.04464682936668396, -0.042479440569877625, -0.04031205177307129, -0.038144662976264954, -0.03597727045416832, -0.033809881657361984, -0.03164249286055565, -0.029475102201104164, -0.02730771154165268, -0.025140322744846344, -0.02297293394804001, -0.020805543288588524, -0.01863815262913704, -0.016470763832330704, -0.014303374104201794, -0.012135984376072884, -0.009968594647943974, -0.0078012049198150635, -0.005633815191686153, -0.0034664254635572433, -0.0012990357354283333, 0.0008683539927005768, 0.003035743720829487, 0.005203133448958397, 0.007370523177087307, 0.009537912905216217, 0.011705302633345127, 0.013872692361474037, 0.016040083020925522, 0.018207471817731857, 0.020374860614538193, 0.022542251273989677, 0.024709641933441162, 0.026877030730247498, 0.029044419527053833, 0.031211810186505318, 0.0333792008459568, 0.03554658964276314, 0.03771397843956947, 0.03988137096166611, 0.04204875975847244, 0.04421614855527878, 0.046383537352085114, 0.04855092614889145, 0.05071831867098808, 0.05288570746779442, 0.055053096264600754, 0.05722048878669739, 0.05938787758350372, 0.06155526638031006]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 11.0, 17.0, 13.0, 13.0, 30.0, 65.0, 96.0, 169.0, 280.0, 507.0, 1214.0, 3322.0, 31156.0, 942410.0, 61707.0, 4731.0, 1491.0, 616.0, 280.0, 146.0, 103.0, 64.0, 31.0, 23.0, 23.0, 8.0, 8.0, 7.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8076171875, -0.784271240234375, -0.76092529296875, -0.737579345703125, -0.7142333984375, -0.690887451171875, -0.66754150390625, -0.644195556640625, -0.620849609375, -0.597503662109375, -0.57415771484375, -0.550811767578125, -0.5274658203125, -0.504119873046875, -0.48077392578125, -0.457427978515625, -0.43408203125, -0.410736083984375, -0.38739013671875, -0.364044189453125, -0.3406982421875, -0.317352294921875, -0.29400634765625, -0.270660400390625, -0.247314453125, -0.223968505859375, -0.20062255859375, -0.177276611328125, -0.1539306640625, -0.130584716796875, -0.10723876953125, -0.083892822265625, -0.060546875, -0.037200927734375, -0.01385498046875, 0.009490966796875, 0.0328369140625, 0.056182861328125, 0.07952880859375, 0.102874755859375, 0.126220703125, 0.149566650390625, 0.17291259765625, 0.196258544921875, 0.2196044921875, 0.242950439453125, 0.26629638671875, 0.289642333984375, 0.31298828125, 0.336334228515625, 0.35968017578125, 0.383026123046875, 0.4063720703125, 0.429718017578125, 0.45306396484375, 0.476409912109375, 0.499755859375, 0.523101806640625, 0.54644775390625, 0.569793701171875, 0.5931396484375, 0.616485595703125, 0.63983154296875, 0.663177490234375, 0.6865234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 19.0, 50.0, 90.0, 145.0, 183.0, 183.0, 162.0, 83.0, 40.0, 21.0, 2.0, 9.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.133544921875, -0.1303691864013672, -0.12719345092773438, -0.12401771545410156, -0.12084197998046875, -0.11766624450683594, -0.11449050903320312, -0.11131477355957031, -0.1081390380859375, -0.10496330261230469, -0.10178756713867188, -0.09861183166503906, -0.09543609619140625, -0.09226036071777344, -0.08908462524414062, -0.08590888977050781, -0.082733154296875, -0.07955741882324219, -0.07638168334960938, -0.07320594787597656, -0.07003021240234375, -0.06685447692871094, -0.06367874145507812, -0.06050300598144531, -0.0573272705078125, -0.05415153503417969, -0.050975799560546875, -0.04780006408691406, -0.04462432861328125, -0.04144859313964844, -0.038272857666015625, -0.03509712219238281, -0.03192138671875, -0.028745651245117188, -0.025569915771484375, -0.022394180297851562, -0.01921844482421875, -0.016042709350585938, -0.012866973876953125, -0.009691238403320312, -0.0065155029296875, -0.0033397674560546875, -0.000164031982421875, 0.0030117034912109375, 0.00618743896484375, 0.009363174438476562, 0.012538909912109375, 0.015714645385742188, 0.018890380859375, 0.022066116333007812, 0.025241851806640625, 0.028417587280273438, 0.03159332275390625, 0.03476905822753906, 0.037944793701171875, 0.04112052917480469, 0.0442962646484375, 0.04747200012207031, 0.050647735595703125, 0.05382347106933594, 0.05699920654296875, 0.06017494201660156, 0.06335067749023438, 0.06652641296386719, 0.0697021484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 4.0, 4.0, 10.0, 13.0, 14.0, 20.0, 27.0, 39.0, 48.0, 76.0, 122.0, 199.0, 331.0, 577.0, 1162.0, 2788.0, 7821.0, 30713.0, 194986.0, 681893.0, 99199.0, 18891.0, 5393.0, 2043.0, 915.0, 496.0, 264.0, 145.0, 111.0, 74.0, 58.0, 34.0, 29.0, 11.0, 13.0, 6.0, 8.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1658935546875, -0.1609172821044922, -0.15594100952148438, -0.15096473693847656, -0.14598846435546875, -0.14101219177246094, -0.13603591918945312, -0.1310596466064453, -0.1260833740234375, -0.12110710144042969, -0.11613082885742188, -0.11115455627441406, -0.10617828369140625, -0.10120201110839844, -0.09622573852539062, -0.09124946594238281, -0.086273193359375, -0.08129692077636719, -0.07632064819335938, -0.07134437561035156, -0.06636810302734375, -0.06139183044433594, -0.056415557861328125, -0.05143928527832031, -0.0464630126953125, -0.04148674011230469, -0.036510467529296875, -0.03153419494628906, -0.02655792236328125, -0.021581649780273438, -0.016605377197265625, -0.011629104614257812, -0.00665283203125, -0.0016765594482421875, 0.003299713134765625, 0.008275985717773438, 0.01325225830078125, 0.018228530883789062, 0.023204803466796875, 0.028181076049804688, 0.0331573486328125, 0.03813362121582031, 0.043109893798828125, 0.04808616638183594, 0.05306243896484375, 0.05803871154785156, 0.06301498413085938, 0.06799125671386719, 0.072967529296875, 0.07794380187988281, 0.08292007446289062, 0.08789634704589844, 0.09287261962890625, 0.09784889221191406, 0.10282516479492188, 0.10780143737792969, 0.1127777099609375, 0.11775398254394531, 0.12273025512695312, 0.12770652770996094, 0.13268280029296875, 0.13765907287597656, 0.14263534545898438, 0.1476116180419922, 0.152587890625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 9.0, 5.0, 11.0, 11.0, 18.0, 11.0, 20.0, 23.0, 27.0, 22.0, 26.0, 26.0, 34.0, 29.0, 35.0, 34.0, 44.0, 56.0, 42.0, 47.0, 44.0, 42.0, 37.0, 49.0, 40.0, 26.0, 36.0, 23.0, 24.0, 34.0, 20.0, 16.0, 15.0, 15.0, 9.0, 10.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09796142578125, -0.09490585327148438, -0.09185028076171875, -0.08879470825195312, -0.0857391357421875, -0.08268356323242188, -0.07962799072265625, -0.07657241821289062, -0.073516845703125, -0.07046127319335938, -0.06740570068359375, -0.06435012817382812, -0.0612945556640625, -0.058238983154296875, -0.05518341064453125, -0.052127838134765625, -0.049072265625, -0.046016693115234375, -0.04296112060546875, -0.039905548095703125, -0.0368499755859375, -0.033794403076171875, -0.03073883056640625, -0.027683258056640625, -0.024627685546875, -0.021572113037109375, -0.01851654052734375, -0.015460968017578125, -0.0124053955078125, -0.009349822998046875, -0.00629425048828125, -0.003238677978515625, -0.00018310546875, 0.002872467041015625, 0.00592803955078125, 0.008983612060546875, 0.0120391845703125, 0.015094757080078125, 0.01815032958984375, 0.021205902099609375, 0.024261474609375, 0.027317047119140625, 0.03037261962890625, 0.033428192138671875, 0.0364837646484375, 0.039539337158203125, 0.04259490966796875, 0.045650482177734375, 0.0487060546875, 0.051761627197265625, 0.05481719970703125, 0.057872772216796875, 0.0609283447265625, 0.06398391723632812, 0.06703948974609375, 0.07009506225585938, 0.073150634765625, 0.07620620727539062, 0.07926177978515625, 0.08231735229492188, 0.0853729248046875, 0.08842849731445312, 0.09148406982421875, 0.09453964233398438, 0.09759521484375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 9.0, 7.0, 12.0, 16.0, 12.0, 33.0, 37.0, 56.0, 64.0, 108.0, 143.0, 296.0, 491.0, 830.0, 1856.0, 5601.0, 26001.0, 818482.0, 174020.0, 13618.0, 3712.0, 1452.0, 640.0, 349.0, 229.0, 157.0, 87.0, 69.0, 41.0, 31.0, 30.0, 19.0, 12.0, 11.0, 9.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.116943359375, -0.11314964294433594, -0.10935592651367188, -0.10556221008300781, -0.10176849365234375, -0.09797477722167969, -0.09418106079101562, -0.09038734436035156, -0.0865936279296875, -0.08279991149902344, -0.07900619506835938, -0.07521247863769531, -0.07141876220703125, -0.06762504577636719, -0.06383132934570312, -0.06003761291503906, -0.056243896484375, -0.05245018005371094, -0.048656463623046875, -0.04486274719238281, -0.04106903076171875, -0.03727531433105469, -0.033481597900390625, -0.029687881469726562, -0.0258941650390625, -0.022100448608398438, -0.018306732177734375, -0.014513015747070312, -0.01071929931640625, -0.0069255828857421875, -0.003131866455078125, 0.0006618499755859375, 0.00445556640625, 0.008249282836914062, 0.012042999267578125, 0.015836715698242188, 0.01963043212890625, 0.023424148559570312, 0.027217864990234375, 0.031011581420898438, 0.0348052978515625, 0.03859901428222656, 0.042392730712890625, 0.04618644714355469, 0.04998016357421875, 0.05377388000488281, 0.057567596435546875, 0.06136131286621094, 0.065155029296875, 0.06894874572753906, 0.07274246215820312, 0.07653617858886719, 0.08032989501953125, 0.08412361145019531, 0.08791732788085938, 0.09171104431152344, 0.0955047607421875, 0.09929847717285156, 0.10309219360351562, 0.10688591003417969, 0.11067962646484375, 0.11447334289550781, 0.11826705932617188, 0.12206077575683594, 0.1258544921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 8.0, 5.0, 4.0, 24.0, 18.0, 27.0, 37.0, 73.0, 109.0, 184.0, 186.0, 121.0, 70.0, 41.0, 23.0, 18.0, 18.0, 5.0, 6.0, 9.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.0003476142883300781, -0.0003398917615413666, -0.00033216923475265503, -0.0003244467079639435, -0.00031672418117523193, -0.0003090016543865204, -0.00030127912759780884, -0.0002935566008090973, -0.00028583407402038574, -0.0002781115472316742, -0.00027038902044296265, -0.0002626664936542511, -0.00025494396686553955, -0.000247221440076828, -0.00023949891328811646, -0.0002317763864994049, -0.00022405385971069336, -0.0002163313329219818, -0.00020860880613327026, -0.00020088627934455872, -0.00019316375255584717, -0.00018544122576713562, -0.00017771869897842407, -0.00016999617218971252, -0.00016227364540100098, -0.00015455111861228943, -0.00014682859182357788, -0.00013910606503486633, -0.00013138353824615479, -0.00012366101145744324, -0.00011593848466873169, -0.00010821595788002014, -0.0001004934310913086, -9.277090430259705e-05, -8.50483775138855e-05, -7.732585072517395e-05, -6.96033239364624e-05, -6.188079714775085e-05, -5.415827035903931e-05, -4.643574357032776e-05, -3.871321678161621e-05, -3.099068999290466e-05, -2.3268163204193115e-05, -1.5545636415481567e-05, -7.82310962677002e-06, -1.0058283805847168e-07, 7.621943950653076e-06, 1.5344470739364624e-05, 2.3066997528076172e-05, 3.078952431678772e-05, 3.851205110549927e-05, 4.6234577894210815e-05, 5.395710468292236e-05, 6.167963147163391e-05, 6.940215826034546e-05, 7.712468504905701e-05, 8.484721183776855e-05, 9.25697386264801e-05, 0.00010029226541519165, 0.0001080147922039032, 0.00011573731899261475, 0.0001234598457813263, 0.00013118237257003784, 0.0001389048993587494, 0.00014662742614746094]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 7.0, 5.0, 3.0, 12.0, 9.0, 12.0, 18.0, 19.0, 37.0, 52.0, 110.0, 189.0, 338.0, 630.0, 1380.0, 3669.0, 14403.0, 148320.0, 835054.0, 33927.0, 6423.0, 2131.0, 879.0, 404.0, 182.0, 120.0, 75.0, 64.0, 33.0, 21.0, 10.0, 5.0, 10.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1451416015625, -0.1409015655517578, -0.13666152954101562, -0.13242149353027344, -0.12818145751953125, -0.12394142150878906, -0.11970138549804688, -0.11546134948730469, -0.1112213134765625, -0.10698127746582031, -0.10274124145507812, -0.09850120544433594, -0.09426116943359375, -0.09002113342285156, -0.08578109741210938, -0.08154106140136719, -0.077301025390625, -0.07306098937988281, -0.06882095336914062, -0.06458091735839844, -0.06034088134765625, -0.05610084533691406, -0.051860809326171875, -0.04762077331542969, -0.0433807373046875, -0.03914070129394531, -0.034900665283203125, -0.030660629272460938, -0.02642059326171875, -0.022180557250976562, -0.017940521240234375, -0.013700485229492188, -0.00946044921875, -0.0052204132080078125, -0.000980377197265625, 0.0032596588134765625, 0.00749969482421875, 0.011739730834960938, 0.015979766845703125, 0.020219802856445312, 0.0244598388671875, 0.028699874877929688, 0.032939910888671875, 0.03717994689941406, 0.04141998291015625, 0.04566001892089844, 0.049900054931640625, 0.05414009094238281, 0.058380126953125, 0.06262016296386719, 0.06686019897460938, 0.07110023498535156, 0.07534027099609375, 0.07958030700683594, 0.08382034301757812, 0.08806037902832031, 0.0923004150390625, 0.09654045104980469, 0.10078048706054688, 0.10502052307128906, 0.10926055908203125, 0.11350059509277344, 0.11774063110351562, 0.12198066711425781, 0.126220703125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 8.0, 11.0, 17.0, 23.0, 31.0, 44.0, 63.0, 106.0, 148.0, 159.0, 124.0, 82.0, 46.0, 35.0, 12.0, 17.0, 6.0, 8.0, 14.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083984375, -0.0815286636352539, -0.07907295227050781, -0.07661724090576172, -0.07416152954101562, -0.07170581817626953, -0.06925010681152344, -0.06679439544677734, -0.06433868408203125, -0.061882972717285156, -0.05942726135253906, -0.05697154998779297, -0.054515838623046875, -0.05206012725830078, -0.04960441589355469, -0.047148704528808594, -0.0446929931640625, -0.042237281799316406, -0.03978157043457031, -0.03732585906982422, -0.034870147705078125, -0.03241443634033203, -0.029958724975585938, -0.027503013610839844, -0.02504730224609375, -0.022591590881347656, -0.020135879516601562, -0.01768016815185547, -0.015224456787109375, -0.012768745422363281, -0.010313034057617188, -0.007857322692871094, -0.005401611328125, -0.0029458999633789062, -0.0004901885986328125, 0.0019655227661132812, 0.004421234130859375, 0.006876945495605469, 0.009332656860351562, 0.011788368225097656, 0.01424407958984375, 0.016699790954589844, 0.019155502319335938, 0.02161121368408203, 0.024066925048828125, 0.02652263641357422, 0.028978347778320312, 0.031434059143066406, 0.0338897705078125, 0.036345481872558594, 0.03880119323730469, 0.04125690460205078, 0.043712615966796875, 0.04616832733154297, 0.04862403869628906, 0.051079750061035156, 0.05353546142578125, 0.055991172790527344, 0.05844688415527344, 0.06090259552001953, 0.06335830688476562, 0.06581401824951172, 0.06826972961425781, 0.0707254409790039, 0.07318115234375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 4.0, 10.0, 11.0, 19.0, 16.0, 23.0, 24.0, 39.0, 61.0, 62.0, 102.0, 109.0, 118.0, 90.0, 80.0, 55.0, 41.0, 32.0, 30.0, 18.0, 12.0, 9.0, 7.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4781157970428467, -0.45712828636169434, -0.436140775680542, -0.41515326499938965, -0.3941657245159149, -0.3731782138347626, -0.35219070315361023, -0.3312031626701355, -0.31021565198898315, -0.2892281413078308, -0.26824063062667847, -0.24725310504436493, -0.2262655794620514, -0.20527806878089905, -0.1842905580997467, -0.16330303251743317, -0.14231553673744202, -0.12132801860570908, -0.10034050047397614, -0.07935298979282379, -0.05836547166109085, -0.03737795352935791, -0.016390442848205566, 0.004597082734107971, 0.025584593415260315, 0.046572111546993256, 0.0675596296787262, 0.08854714035987854, 0.10953465849161148, 0.13052217662334442, 0.15150968730449677, 0.1724972128868103, 0.19348472356796265, 0.214472234249115, 0.23545975983142853, 0.2564472556114197, 0.2774347960948944, 0.29842230677604675, 0.3194098174571991, 0.34039735794067383, 0.36138486862182617, 0.3823723793029785, 0.40335988998413086, 0.4243474006652832, 0.44533494114875793, 0.4663224518299103, 0.4873099625110626, 0.5082975029945374, 0.5292849540710449, 0.5502724647521973, 0.5712599754333496, 0.592247486114502, 0.6132349967956543, 0.6342225074768066, 0.655210018157959, 0.6761975884437561, 0.6971850991249084, 0.7181726098060608, 0.7391601204872131, 0.7601476311683655, 0.7811351418495178, 0.8021227121353149, 0.8231102228164673, 0.8440977334976196, 0.865085244178772]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 3.0, 6.0, 4.0, 10.0, 10.0, 4.0, 19.0, 12.0, 24.0, 16.0, 20.0, 28.0, 31.0, 27.0, 39.0, 38.0, 43.0, 40.0, 40.0, 54.0, 38.0, 49.0, 40.0, 47.0, 46.0, 44.0, 29.0, 39.0, 31.0, 29.0, 22.0, 23.0, 18.0, 19.0, 15.0, 16.0, 7.0, 6.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4817732572555542, -0.46676936745643616, -0.4517654478549957, -0.4367615580558777, -0.42175763845443726, -0.4067537486553192, -0.3917498290538788, -0.37674593925476074, -0.3617420196533203, -0.34673812985420227, -0.33173421025276184, -0.3167303204536438, -0.30172640085220337, -0.2867225110530853, -0.2717185914516449, -0.25671470165252686, -0.24171079695224762, -0.22670689225196838, -0.21170298755168915, -0.1966990828514099, -0.18169517815113068, -0.16669127345085144, -0.1516873836517334, -0.13668346405029297, -0.12167956680059433, -0.1066756621003151, -0.09167175740003586, -0.07666786015033722, -0.061663951724767685, -0.04666005074977875, -0.03165614604949951, -0.016652241349220276, -0.00164833664894104, 0.013355567120015621, 0.028359470888972282, 0.04336337372660637, 0.058367278426885605, 0.07337117940187454, 0.08837508410215378, 0.10337898880243301, 0.11838289350271225, 0.1333867907524109, 0.14839069545269012, 0.16339460015296936, 0.1783985048532486, 0.19340240955352783, 0.20840631425380707, 0.2234102189540863, 0.23841412365436554, 0.2534180283546448, 0.2684219181537628, 0.28342583775520325, 0.2984297275543213, 0.3134336471557617, 0.32843753695487976, 0.3434414565563202, 0.35844534635543823, 0.3734492361545563, 0.3884531557559967, 0.40345704555511475, 0.4184609651565552, 0.4334648549556732, 0.44846877455711365, 0.4634726643562317, 0.4784765839576721]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 16.0, 12.0, 15.0, 20.0, 26.0, 27.0, 62.0, 84.0, 134.0, 189.0, 329.0, 564.0, 1188.0, 3175.0, 14327.0, 219819.0, 3882796.0, 57631.0, 8319.0, 2611.0, 1269.0, 599.0, 382.0, 247.0, 135.0, 97.0, 59.0, 49.0, 30.0, 14.0, 13.0, 9.0, 4.0, 7.0, 3.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51953125, -0.5059700012207031, -0.49240875244140625, -0.4788475036621094, -0.4652862548828125, -0.4517250061035156, -0.43816375732421875, -0.4246025085449219, -0.411041259765625, -0.3974800109863281, -0.38391876220703125, -0.3703575134277344, -0.3567962646484375, -0.3432350158691406, -0.32967376708984375, -0.3161125183105469, -0.30255126953125, -0.2889900207519531, -0.27542877197265625, -0.2618675231933594, -0.2483062744140625, -0.23474502563476562, -0.22118377685546875, -0.20762252807617188, -0.194061279296875, -0.18050003051757812, -0.16693878173828125, -0.15337753295898438, -0.1398162841796875, -0.12625503540039062, -0.11269378662109375, -0.09913253784179688, -0.0855712890625, -0.07201004028320312, -0.05844879150390625, -0.044887542724609375, -0.0313262939453125, -0.017765045166015625, -0.00420379638671875, 0.009357452392578125, 0.022918701171875, 0.036479949951171875, 0.05004119873046875, 0.06360244750976562, 0.0771636962890625, 0.09072494506835938, 0.10428619384765625, 0.11784744262695312, 0.13140869140625, 0.14496994018554688, 0.15853118896484375, 0.17209243774414062, 0.1856536865234375, 0.19921493530273438, 0.21277618408203125, 0.22633743286132812, 0.239898681640625, 0.2534599304199219, 0.26702117919921875, 0.2805824279785156, 0.2941436767578125, 0.3077049255371094, 0.32126617431640625, 0.3348274230957031, 0.348388671875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 22.0, 41.0, 93.0, 157.0, 181.0, 194.0, 154.0, 83.0, 35.0, 17.0, 6.0, 6.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13330078125, -0.1301288604736328, -0.12695693969726562, -0.12378501892089844, -0.12061309814453125, -0.11744117736816406, -0.11426925659179688, -0.11109733581542969, -0.1079254150390625, -0.10475349426269531, -0.10158157348632812, -0.09840965270996094, -0.09523773193359375, -0.09206581115722656, -0.08889389038085938, -0.08572196960449219, -0.082550048828125, -0.07937812805175781, -0.07620620727539062, -0.07303428649902344, -0.06986236572265625, -0.06669044494628906, -0.06351852416992188, -0.06034660339355469, -0.0571746826171875, -0.05400276184082031, -0.050830841064453125, -0.04765892028808594, -0.04448699951171875, -0.04131507873535156, -0.038143157958984375, -0.03497123718261719, -0.03179931640625, -0.028627395629882812, -0.025455474853515625, -0.022283554077148438, -0.01911163330078125, -0.015939712524414062, -0.012767791748046875, -0.009595870971679688, -0.0064239501953125, -0.0032520294189453125, -8.0108642578125e-05, 0.0030918121337890625, 0.00626373291015625, 0.009435653686523438, 0.012607574462890625, 0.015779495239257812, 0.018951416015625, 0.022123336791992188, 0.025295257568359375, 0.028467178344726562, 0.03163909912109375, 0.03481101989746094, 0.037982940673828125, 0.04115486145019531, 0.0443267822265625, 0.04749870300292969, 0.050670623779296875, 0.05384254455566406, 0.05701446533203125, 0.06018638610839844, 0.06335830688476562, 0.06653022766113281, 0.0697021484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 8.0, 11.0, 18.0, 31.0, 64.0, 80.0, 117.0, 184.0, 345.0, 643.0, 1250.0, 2720.0, 7784.0, 32501.0, 266374.0, 3644687.0, 199140.0, 26328.0, 6794.0, 2608.0, 1157.0, 581.0, 314.0, 203.0, 115.0, 76.0, 42.0, 34.0, 17.0, 9.0, 4.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1663818359375, -0.1612548828125, -0.1561279296875, -0.1510009765625, -0.1458740234375, -0.1407470703125, -0.1356201171875, -0.1304931640625, -0.1253662109375, -0.1202392578125, -0.1151123046875, -0.1099853515625, -0.1048583984375, -0.0997314453125, -0.0946044921875, -0.0894775390625, -0.0843505859375, -0.0792236328125, -0.0740966796875, -0.0689697265625, -0.0638427734375, -0.0587158203125, -0.0535888671875, -0.0484619140625, -0.0433349609375, -0.0382080078125, -0.0330810546875, -0.0279541015625, -0.0228271484375, -0.0177001953125, -0.0125732421875, -0.0074462890625, -0.0023193359375, 0.0028076171875, 0.0079345703125, 0.0130615234375, 0.0181884765625, 0.0233154296875, 0.0284423828125, 0.0335693359375, 0.0386962890625, 0.0438232421875, 0.0489501953125, 0.0540771484375, 0.0592041015625, 0.0643310546875, 0.0694580078125, 0.0745849609375, 0.0797119140625, 0.0848388671875, 0.0899658203125, 0.0950927734375, 0.1002197265625, 0.1053466796875, 0.1104736328125, 0.1156005859375, 0.1207275390625, 0.1258544921875, 0.1309814453125, 0.1361083984375, 0.1412353515625, 0.1463623046875, 0.1514892578125, 0.1566162109375, 0.1617431640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 6.0, 8.0, 15.0, 29.0, 39.0, 77.0, 104.0, 167.0, 315.0, 634.0, 1489.0, 635.0, 266.0, 119.0, 74.0, 33.0, 23.0, 9.0, 5.0, 8.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1712646484375, -0.16629791259765625, -0.1613311767578125, -0.15636444091796875, -0.151397705078125, -0.14643096923828125, -0.1414642333984375, -0.13649749755859375, -0.13153076171875, -0.12656402587890625, -0.1215972900390625, -0.11663055419921875, -0.111663818359375, -0.10669708251953125, -0.1017303466796875, -0.09676361083984375, -0.091796875, -0.08683013916015625, -0.0818634033203125, -0.07689666748046875, -0.071929931640625, -0.06696319580078125, -0.0619964599609375, -0.05702972412109375, -0.05206298828125, -0.04709625244140625, -0.0421295166015625, -0.03716278076171875, -0.032196044921875, -0.02722930908203125, -0.0222625732421875, -0.01729583740234375, -0.0123291015625, -0.00736236572265625, -0.0023956298828125, 0.00257110595703125, 0.007537841796875, 0.01250457763671875, 0.0174713134765625, 0.02243804931640625, 0.02740478515625, 0.03237152099609375, 0.0373382568359375, 0.04230499267578125, 0.047271728515625, 0.05223846435546875, 0.0572052001953125, 0.06217193603515625, 0.067138671875, 0.07210540771484375, 0.0770721435546875, 0.08203887939453125, 0.087005615234375, 0.09197235107421875, 0.0969390869140625, 0.10190582275390625, 0.10687255859375, 0.11183929443359375, 0.1168060302734375, 0.12177276611328125, 0.126739501953125, 0.13170623779296875, 0.1366729736328125, 0.14163970947265625, 0.1466064453125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 9.0, 9.0, 8.0, 11.0, 16.0, 20.0, 32.0, 32.0, 37.0, 47.0, 52.0, 70.0, 89.0, 99.0, 111.0, 87.0, 89.0, 60.0, 40.0, 30.0, 11.0, 6.0, 6.0, 8.0, 3.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2237436771392822, -1.1884782314300537, -1.1532129049301147, -1.1179474592208862, -1.0826821327209473, -1.0474166870117188, -1.0121513605117798, -0.9768859148025513, -0.9416205883026123, -0.9063552021980286, -0.8710898160934448, -0.8358244299888611, -0.8005590438842773, -0.7652936577796936, -0.7300282716751099, -0.6947628259658813, -0.6594974398612976, -0.6242320537567139, -0.5889666676521301, -0.5537012815475464, -0.5184358954429626, -0.4831705093383789, -0.4479050934314728, -0.41263970732688904, -0.3773743212223053, -0.34210893511772156, -0.3068435490131378, -0.2715781331062317, -0.23631276190280914, -0.2010473757982254, -0.16578197479248047, -0.13051658868789673, -0.09525120258331299, -0.05998581275343895, -0.02472042292356491, 0.010544970631599426, 0.045810356736183167, 0.0810757428407669, 0.11634114384651184, 0.15160652995109558, 0.18687191605567932, 0.22213730216026306, 0.2574026882648468, 0.29266810417175293, 0.32793349027633667, 0.3631988763809204, 0.39846426248550415, 0.4337296485900879, 0.46899503469467163, 0.5042604207992554, 0.5395258069038391, 0.5747911930084229, 0.6100565791130066, 0.6453219652175903, 0.6805874109268188, 0.7158527374267578, 0.7511181831359863, 0.7863835692405701, 0.8216489553451538, 0.8569143414497375, 0.8921797275543213, 0.927445113658905, 0.9627104997634888, 0.9979759454727173, 1.0332412719726562]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 5.0, 10.0, 10.0, 9.0, 14.0, 17.0, 34.0, 31.0, 33.0, 46.0, 31.0, 30.0, 45.0, 44.0, 35.0, 37.0, 36.0, 35.0, 39.0, 34.0, 46.0, 49.0, 31.0, 45.0, 37.0, 34.0, 37.0, 33.0, 19.0, 28.0, 18.0, 14.0, 5.0, 10.0, 2.0, 4.0, 4.0, 4.0, 0.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7265638113021851, -0.6995563507080078, -0.6725489497184753, -0.6455414891242981, -0.6185340881347656, -0.5915266275405884, -0.5645192265510559, -0.5375117659568787, -0.5105043649673462, -0.48349693417549133, -0.4564895033836365, -0.4294820725917816, -0.40247464179992676, -0.3754671812057495, -0.34845978021621704, -0.3214523196220398, -0.29444488883018494, -0.2674374580383301, -0.24043002724647522, -0.21342259645462036, -0.1864151656627655, -0.15940771996974945, -0.1324002891778946, -0.10539285838603973, -0.07838542759418488, -0.05137799680233002, -0.02437056228518486, 0.0026368722319602966, 0.029644303023815155, 0.05665174126625061, 0.08365917205810547, 0.11066660284996033, 0.13767403364181519, 0.16468146443367004, 0.1916888952255249, 0.21869632601737976, 0.24570375680923462, 0.27271121740341187, 0.29971861839294434, 0.3267260789871216, 0.35373347997665405, 0.3807409107685089, 0.40774834156036377, 0.43475577235221863, 0.4617632031440735, 0.48877066373825073, 0.5157780647277832, 0.5427855253219604, 0.5697929859161377, 0.5968004465103149, 0.6238078474998474, 0.6508153080940247, 0.6778227090835571, 0.7048301696777344, 0.7318375706672668, 0.7588450312614441, 0.7858524322509766, 0.8128598928451538, 0.8398672938346863, 0.8668747544288635, 0.893882155418396, 0.9208896160125732, 0.9478970170021057, 0.974904477596283, 1.0019118785858154]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 7.0, 9.0, 10.0, 13.0, 20.0, 36.0, 47.0, 62.0, 104.0, 200.0, 417.0, 976.0, 3170.0, 19156.0, 887227.0, 126954.0, 7028.0, 1708.0, 629.0, 281.0, 146.0, 106.0, 69.0, 48.0, 38.0, 24.0, 15.0, 10.0, 8.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0439453125, -1.013916015625, -0.98388671875, -0.953857421875, -0.923828125, -0.893798828125, -0.86376953125, -0.833740234375, -0.8037109375, -0.773681640625, -0.74365234375, -0.713623046875, -0.68359375, -0.653564453125, -0.62353515625, -0.593505859375, -0.5634765625, -0.533447265625, -0.50341796875, -0.473388671875, -0.443359375, -0.413330078125, -0.38330078125, -0.353271484375, -0.3232421875, -0.293212890625, -0.26318359375, -0.233154296875, -0.203125, -0.173095703125, -0.14306640625, -0.113037109375, -0.0830078125, -0.052978515625, -0.02294921875, 0.007080078125, 0.037109375, 0.067138671875, 0.09716796875, 0.127197265625, 0.1572265625, 0.187255859375, 0.21728515625, 0.247314453125, 0.27734375, 0.307373046875, 0.33740234375, 0.367431640625, 0.3974609375, 0.427490234375, 0.45751953125, 0.487548828125, 0.517578125, 0.547607421875, 0.57763671875, 0.607666015625, 0.6376953125, 0.667724609375, 0.69775390625, 0.727783203125, 0.7578125, 0.787841796875, 0.81787109375, 0.847900390625, 0.8779296875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 21.0, 38.0, 79.0, 110.0, 164.0, 147.0, 167.0, 107.0, 72.0, 50.0, 16.0, 8.0, 5.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1336669921875, -0.13045215606689453, -0.12723731994628906, -0.1240224838256836, -0.12080764770507812, -0.11759281158447266, -0.11437797546386719, -0.11116313934326172, -0.10794830322265625, -0.10473346710205078, -0.10151863098144531, -0.09830379486083984, -0.09508895874023438, -0.0918741226196289, -0.08865928649902344, -0.08544445037841797, -0.0822296142578125, -0.07901477813720703, -0.07579994201660156, -0.0725851058959961, -0.06937026977539062, -0.06615543365478516, -0.06294059753417969, -0.05972576141357422, -0.05651092529296875, -0.05329608917236328, -0.05008125305175781, -0.046866416931152344, -0.043651580810546875, -0.040436744689941406, -0.03722190856933594, -0.03400707244873047, -0.030792236328125, -0.02757740020751953, -0.024362564086914062, -0.021147727966308594, -0.017932891845703125, -0.014718055725097656, -0.011503219604492188, -0.008288383483886719, -0.00507354736328125, -0.0018587112426757812, 0.0013561248779296875, 0.004570960998535156, 0.007785797119140625, 0.011000633239746094, 0.014215469360351562, 0.01743030548095703, 0.0206451416015625, 0.02385997772216797, 0.027074813842773438, 0.030289649963378906, 0.033504486083984375, 0.036719322204589844, 0.03993415832519531, 0.04314899444580078, 0.04636383056640625, 0.04957866668701172, 0.05279350280761719, 0.056008338928222656, 0.059223175048828125, 0.062438011169433594, 0.06565284729003906, 0.06886768341064453, 0.07208251953125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 5.0, 13.0, 14.0, 15.0, 31.0, 48.0, 63.0, 107.0, 213.0, 352.0, 668.0, 1573.0, 4757.0, 23615.0, 413698.0, 568603.0, 26717.0, 5028.0, 1561.0, 696.0, 323.0, 163.0, 98.0, 57.0, 37.0, 24.0, 24.0, 9.0, 11.0, 7.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.39306640625, -0.3815155029296875, -0.369964599609375, -0.3584136962890625, -0.34686279296875, -0.3353118896484375, -0.323760986328125, -0.3122100830078125, -0.3006591796875, -0.2891082763671875, -0.277557373046875, -0.2660064697265625, -0.25445556640625, -0.2429046630859375, -0.231353759765625, -0.2198028564453125, -0.208251953125, -0.1967010498046875, -0.185150146484375, -0.1735992431640625, -0.16204833984375, -0.1504974365234375, -0.138946533203125, -0.1273956298828125, -0.1158447265625, -0.1042938232421875, -0.092742919921875, -0.0811920166015625, -0.06964111328125, -0.0580902099609375, -0.046539306640625, -0.0349884033203125, -0.0234375, -0.0118865966796875, -0.000335693359375, 0.0112152099609375, 0.02276611328125, 0.0343170166015625, 0.045867919921875, 0.0574188232421875, 0.0689697265625, 0.0805206298828125, 0.092071533203125, 0.1036224365234375, 0.11517333984375, 0.1267242431640625, 0.138275146484375, 0.1498260498046875, 0.161376953125, 0.1729278564453125, 0.184478759765625, 0.1960296630859375, 0.20758056640625, 0.2191314697265625, 0.230682373046875, 0.2422332763671875, 0.2537841796875, 0.2653350830078125, 0.276885986328125, 0.2884368896484375, 0.29998779296875, 0.3115386962890625, 0.323089599609375, 0.3346405029296875, 0.34619140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 7.0, 2.0, 6.0, 7.0, 12.0, 18.0, 12.0, 14.0, 20.0, 34.0, 33.0, 32.0, 45.0, 53.0, 69.0, 65.0, 73.0, 64.0, 65.0, 53.0, 58.0, 47.0, 48.0, 37.0, 28.0, 27.0, 19.0, 17.0, 14.0, 7.0, 6.0, 3.0, 8.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.155029296875, -0.14899444580078125, -0.1429595947265625, -0.13692474365234375, -0.130889892578125, -0.12485504150390625, -0.1188201904296875, -0.11278533935546875, -0.10675048828125, -0.10071563720703125, -0.0946807861328125, -0.08864593505859375, -0.082611083984375, -0.07657623291015625, -0.0705413818359375, -0.06450653076171875, -0.0584716796875, -0.05243682861328125, -0.0464019775390625, -0.04036712646484375, -0.034332275390625, -0.02829742431640625, -0.0222625732421875, -0.01622772216796875, -0.01019287109375, -0.00415802001953125, 0.0018768310546875, 0.00791168212890625, 0.013946533203125, 0.01998138427734375, 0.0260162353515625, 0.03205108642578125, 0.0380859375, 0.04412078857421875, 0.0501556396484375, 0.05619049072265625, 0.062225341796875, 0.06826019287109375, 0.0742950439453125, 0.08032989501953125, 0.08636474609375, 0.09239959716796875, 0.0984344482421875, 0.10446929931640625, 0.110504150390625, 0.11653900146484375, 0.1225738525390625, 0.12860870361328125, 0.1346435546875, 0.14067840576171875, 0.1467132568359375, 0.15274810791015625, 0.158782958984375, 0.16481781005859375, 0.1708526611328125, 0.17688751220703125, 0.18292236328125, 0.18895721435546875, 0.1949920654296875, 0.20102691650390625, 0.207061767578125, 0.21309661865234375, 0.2191314697265625, 0.22516632080078125, 0.231201171875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 6.0, 12.0, 24.0, 28.0, 59.0, 112.0, 201.0, 465.0, 1169.0, 5629.0, 381108.0, 651829.0, 5745.0, 1180.0, 461.0, 241.0, 99.0, 63.0, 33.0, 20.0, 16.0, 9.0, 6.0, 1.0, 2.0, 1.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.88525390625, -0.8641815185546875, -0.843109130859375, -0.8220367431640625, -0.80096435546875, -0.7798919677734375, -0.758819580078125, -0.7377471923828125, -0.7166748046875, -0.6956024169921875, -0.674530029296875, -0.6534576416015625, -0.63238525390625, -0.6113128662109375, -0.590240478515625, -0.5691680908203125, -0.548095703125, -0.5270233154296875, -0.505950927734375, -0.4848785400390625, -0.46380615234375, -0.4427337646484375, -0.421661376953125, -0.4005889892578125, -0.3795166015625, -0.3584442138671875, -0.337371826171875, -0.3162994384765625, -0.29522705078125, -0.2741546630859375, -0.253082275390625, -0.2320098876953125, -0.2109375, -0.1898651123046875, -0.168792724609375, -0.1477203369140625, -0.12664794921875, -0.1055755615234375, -0.084503173828125, -0.0634307861328125, -0.0423583984375, -0.0212860107421875, -0.000213623046875, 0.0208587646484375, 0.04193115234375, 0.0630035400390625, 0.084075927734375, 0.1051483154296875, 0.126220703125, 0.1472930908203125, 0.168365478515625, 0.1894378662109375, 0.21051025390625, 0.2315826416015625, 0.252655029296875, 0.2737274169921875, 0.2947998046875, 0.3158721923828125, 0.336944580078125, 0.3580169677734375, 0.37908935546875, 0.4001617431640625, 0.421234130859375, 0.4423065185546875, 0.46337890625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 11.0, 8.0, 8.0, 13.0, 19.0, 22.0, 15.0, 32.0, 27.0, 29.0, 47.0, 56.0, 80.0, 79.0, 102.0, 88.0, 74.0, 54.0, 43.0, 45.0, 26.0, 26.0, 16.0, 17.0, 9.0, 11.0, 4.0, 10.0, 4.0, 8.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010591745376586914, -0.0001021726056933403, -9.842775762081146e-05, -9.468290954828262e-05, -9.093806147575378e-05, -8.719321340322495e-05, -8.34483653306961e-05, -7.970351725816727e-05, -7.595866918563843e-05, -7.221382111310959e-05, -6.846897304058075e-05, -6.472412496805191e-05, -6.097927689552307e-05, -5.723442882299423e-05, -5.348958075046539e-05, -4.9744732677936554e-05, -4.5999884605407715e-05, -4.2255036532878876e-05, -3.851018846035004e-05, -3.47653403878212e-05, -3.102049231529236e-05, -2.727564424276352e-05, -2.353079617023468e-05, -1.978594809770584e-05, -1.6041100025177002e-05, -1.2296251952648163e-05, -8.551403880119324e-06, -4.806555807590485e-06, -1.0617077350616455e-06, 2.6831403374671936e-06, 6.427988409996033e-06, 1.0172836482524872e-05, 1.3917684555053711e-05, 1.766253262758255e-05, 2.140738070011139e-05, 2.5152228772640228e-05, 2.8897076845169067e-05, 3.2641924917697906e-05, 3.6386772990226746e-05, 4.0131621062755585e-05, 4.3876469135284424e-05, 4.762131720781326e-05, 5.13661652803421e-05, 5.511101335287094e-05, 5.885586142539978e-05, 6.260070949792862e-05, 6.634555757045746e-05, 7.00904056429863e-05, 7.383525371551514e-05, 7.758010178804398e-05, 8.132494986057281e-05, 8.506979793310165e-05, 8.881464600563049e-05, 9.255949407815933e-05, 9.630434215068817e-05, 0.00010004919022321701, 0.00010379403829574585, 0.00010753888636827469, 0.00011128373444080353, 0.00011502858251333237, 0.0001187734305858612, 0.00012251827865839005, 0.00012626312673091888, 0.00013000797480344772, 0.00013375282287597656]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 8.0, 8.0, 7.0, 17.0, 18.0, 18.0, 33.0, 34.0, 49.0, 93.0, 94.0, 186.0, 279.0, 433.0, 682.0, 1266.0, 2560.0, 5943.0, 17407.0, 111175.0, 822329.0, 63047.0, 13028.0, 4751.0, 2167.0, 1118.0, 613.0, 380.0, 240.0, 155.0, 95.0, 99.0, 52.0, 44.0, 36.0, 19.0, 14.0, 12.0, 7.0, 9.0, 6.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.2138671875, -0.2074604034423828, -0.20105361938476562, -0.19464683532714844, -0.18824005126953125, -0.18183326721191406, -0.17542648315429688, -0.1690196990966797, -0.1626129150390625, -0.1562061309814453, -0.14979934692382812, -0.14339256286621094, -0.13698577880859375, -0.13057899475097656, -0.12417221069335938, -0.11776542663574219, -0.111358642578125, -0.10495185852050781, -0.09854507446289062, -0.09213829040527344, -0.08573150634765625, -0.07932472229003906, -0.07291793823242188, -0.06651115417480469, -0.0601043701171875, -0.05369758605957031, -0.047290802001953125, -0.04088401794433594, -0.03447723388671875, -0.028070449829101562, -0.021663665771484375, -0.015256881713867188, -0.00885009765625, -0.0024433135986328125, 0.003963470458984375, 0.010370254516601562, 0.01677703857421875, 0.023183822631835938, 0.029590606689453125, 0.03599739074707031, 0.0424041748046875, 0.04881095886230469, 0.055217742919921875, 0.06162452697753906, 0.06803131103515625, 0.07443809509277344, 0.08084487915039062, 0.08725166320800781, 0.093658447265625, 0.10006523132324219, 0.10647201538085938, 0.11287879943847656, 0.11928558349609375, 0.12569236755371094, 0.13209915161132812, 0.1385059356689453, 0.1449127197265625, 0.1513195037841797, 0.15772628784179688, 0.16413307189941406, 0.17053985595703125, 0.17694664001464844, 0.18335342407226562, 0.1897602081298828, 0.1961669921875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 1.0, 4.0, 8.0, 15.0, 14.0, 31.0, 58.0, 99.0, 137.0, 243.0, 160.0, 97.0, 45.0, 30.0, 14.0, 9.0, 5.0, 5.0, 8.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2398681640625, -0.23308753967285156, -0.22630691528320312, -0.2195262908935547, -0.21274566650390625, -0.2059650421142578, -0.19918441772460938, -0.19240379333496094, -0.1856231689453125, -0.17884254455566406, -0.17206192016601562, -0.1652812957763672, -0.15850067138671875, -0.1517200469970703, -0.14493942260742188, -0.13815879821777344, -0.131378173828125, -0.12459754943847656, -0.11781692504882812, -0.11103630065917969, -0.10425567626953125, -0.09747505187988281, -0.09069442749023438, -0.08391380310058594, -0.0771331787109375, -0.07035255432128906, -0.06357192993164062, -0.05679130554199219, -0.05001068115234375, -0.04323005676269531, -0.036449432373046875, -0.029668807983398438, -0.02288818359375, -0.016107559204101562, -0.009326934814453125, -0.0025463104248046875, 0.00423431396484375, 0.011014938354492188, 0.017795562744140625, 0.024576187133789062, 0.0313568115234375, 0.03813743591308594, 0.044918060302734375, 0.05169868469238281, 0.05847930908203125, 0.06525993347167969, 0.07204055786132812, 0.07882118225097656, 0.085601806640625, 0.09238243103027344, 0.09916305541992188, 0.10594367980957031, 0.11272430419921875, 0.11950492858886719, 0.12628555297851562, 0.13306617736816406, 0.1398468017578125, 0.14662742614746094, 0.15340805053710938, 0.1601886749267578, 0.16696929931640625, 0.1737499237060547, 0.18053054809570312, 0.18731117248535156, 0.194091796875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 14.0, 28.0, 51.0, 114.0, 296.0, 278.0, 134.0, 49.0, 22.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.948605060577393, -5.8271331787109375, -5.705661296844482, -5.584188938140869, -5.462717056274414, -5.341245174407959, -5.219773292541504, -5.098301410675049, -4.976829528808594, -4.855357646942139, -4.733885765075684, -4.61241340637207, -4.490941524505615, -4.36946964263916, -4.247997760772705, -4.12652587890625, -4.005053520202637, -3.8835816383361816, -3.7621095180511475, -3.6406376361846924, -3.519165515899658, -3.397693634033203, -3.276221752166748, -3.154749870300293, -3.033277750015259, -2.9118058681488037, -2.7903337478637695, -2.6688618659973145, -2.5473899841308594, -2.425917863845825, -2.30444598197937, -2.182973861694336, -2.061501979827881, -1.9400299787521362, -1.8185579776763916, -1.6970860958099365, -1.575614094734192, -1.4541420936584473, -1.3326702117919922, -1.2111982107162476, -1.0897260904312134, -0.9682540893554688, -0.8467821478843689, -0.725310206413269, -0.6038382053375244, -0.4823662042617798, -0.36089426279067993, -0.23942232131958008, -0.11795032024383545, 0.003521651029586792, 0.12499362230300903, 0.24646559357643127, 0.3679375648498535, 0.48940956592559814, 0.610881507396698, 0.7323534488677979, 0.8538254499435425, 0.9752974510192871, 1.0967693328857422, 1.2182413339614868, 1.3397133350372314, 1.461185336112976, 1.5826573371887207, 1.7041292190551758, 1.8256012201309204]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 15.0, 14.0, 20.0, 26.0, 26.0, 27.0, 31.0, 50.0, 49.0, 51.0, 51.0, 75.0, 75.0, 63.0, 78.0, 65.0, 51.0, 42.0, 47.0, 23.0, 24.0, 21.0, 20.0, 17.0, 12.0, 7.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0], "bins": [-1.3496026992797852, -1.3180228471755981, -1.2864429950714111, -1.2548632621765137, -1.2232834100723267, -1.1917035579681396, -1.1601238250732422, -1.1285439729690552, -1.0969641208648682, -1.0653842687606812, -1.0338044166564941, -1.0022246837615967, -0.9706448316574097, -0.9390649795532227, -0.9074851870536804, -0.8759053945541382, -0.8443255424499512, -0.8127456903457642, -0.7811658978462219, -0.7495861053466797, -0.7180062532424927, -0.6864264011383057, -0.6548466086387634, -0.6232668161392212, -0.5916869640350342, -0.5601071119308472, -0.5285273194313049, -0.4969474971294403, -0.4653676748275757, -0.43378785252571106, -0.40220803022384644, -0.3706282079219818, -0.3390483856201172, -0.30746856331825256, -0.27588874101638794, -0.24430891871452332, -0.2127290964126587, -0.18114927411079407, -0.14956945180892944, -0.11798962950706482, -0.0864098072052002, -0.05482998490333557, -0.023250162601470947, 0.008329659700393677, 0.0399094820022583, 0.07148930430412292, 0.10306912660598755, 0.13464894890785217, 0.1662287712097168, 0.19780859351158142, 0.22938841581344604, 0.26096823811531067, 0.2925480604171753, 0.3241278827190399, 0.35570770502090454, 0.38728752732276917, 0.4188673496246338, 0.4504471719264984, 0.48202699422836304, 0.5136067867279053, 0.5451866388320923, 0.5767664909362793, 0.6083462834358215, 0.6399260759353638, 0.6715059280395508]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 4.0, 7.0, 9.0, 8.0, 10.0, 10.0, 20.0, 16.0, 21.0, 21.0, 29.0, 38.0, 58.0, 66.0, 90.0, 117.0, 152.0, 200.0, 250.0, 410.0, 610.0, 1068.0, 2025.0, 5305.0, 22277.0, 351671.0, 3716857.0, 73207.0, 11984.0, 4044.0, 1720.0, 812.0, 421.0, 264.0, 156.0, 96.0, 68.0, 58.0, 28.0, 20.0, 12.0, 11.0, 6.0, 5.0, 4.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0], "bins": [-0.325927734375, -0.3176250457763672, -0.3093223571777344, -0.30101966857910156, -0.29271697998046875, -0.28441429138183594, -0.2761116027832031, -0.2678089141845703, -0.2595062255859375, -0.2512035369873047, -0.24290084838867188, -0.23459815979003906, -0.22629547119140625, -0.21799278259277344, -0.20969009399414062, -0.2013874053955078, -0.193084716796875, -0.1847820281982422, -0.17647933959960938, -0.16817665100097656, -0.15987396240234375, -0.15157127380371094, -0.14326858520507812, -0.1349658966064453, -0.1266632080078125, -0.11836051940917969, -0.11005783081054688, -0.10175514221191406, -0.09345245361328125, -0.08514976501464844, -0.07684707641601562, -0.06854438781738281, -0.06024169921875, -0.05193901062011719, -0.043636322021484375, -0.03533363342285156, -0.02703094482421875, -0.018728256225585938, -0.010425567626953125, -0.0021228790283203125, 0.0061798095703125, 0.014482498168945312, 0.022785186767578125, 0.031087875366210938, 0.03939056396484375, 0.04769325256347656, 0.055995941162109375, 0.06429862976074219, 0.072601318359375, 0.08090400695800781, 0.08920669555664062, 0.09750938415527344, 0.10581207275390625, 0.11411476135253906, 0.12241744995117188, 0.1307201385498047, 0.1390228271484375, 0.1473255157470703, 0.15562820434570312, 0.16393089294433594, 0.17223358154296875, 0.18053627014160156, 0.18883895874023438, 0.1971416473388672, 0.2054443359375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 21.0, 43.0, 94.0, 114.0, 173.0, 148.0, 149.0, 103.0, 69.0, 33.0, 24.0, 2.0, 8.0, 1.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.12853050231933594, -0.12534713745117188, -0.12216377258300781, -0.11898040771484375, -0.11579704284667969, -0.11261367797851562, -0.10943031311035156, -0.1062469482421875, -0.10306358337402344, -0.09988021850585938, -0.09669685363769531, -0.09351348876953125, -0.09033012390136719, -0.08714675903320312, -0.08396339416503906, -0.080780029296875, -0.07759666442871094, -0.07441329956054688, -0.07122993469238281, -0.06804656982421875, -0.06486320495605469, -0.061679840087890625, -0.05849647521972656, -0.0553131103515625, -0.05212974548339844, -0.048946380615234375, -0.04576301574707031, -0.04257965087890625, -0.03939628601074219, -0.036212921142578125, -0.03302955627441406, -0.02984619140625, -0.026662826538085938, -0.023479461669921875, -0.020296096801757812, -0.01711273193359375, -0.013929367065429688, -0.010746002197265625, -0.0075626373291015625, -0.0043792724609375, -0.0011959075927734375, 0.001987457275390625, 0.0051708221435546875, 0.00835418701171875, 0.011537551879882812, 0.014720916748046875, 0.017904281616210938, 0.021087646484375, 0.024271011352539062, 0.027454376220703125, 0.030637741088867188, 0.03382110595703125, 0.03700447082519531, 0.040187835693359375, 0.04337120056152344, 0.0465545654296875, 0.04973793029785156, 0.052921295166015625, 0.05610466003417969, 0.05928802490234375, 0.06247138977050781, 0.06565475463867188, 0.06883811950683594, 0.072021484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 4.0, 9.0, 17.0, 34.0, 34.0, 55.0, 93.0, 168.0, 227.0, 279.0, 473.0, 654.0, 891.0, 1418.0, 2043.0, 3591.0, 6830.0, 15964.0, 52036.0, 327579.0, 3365309.0, 327194.0, 55344.0, 17421.0, 7585.0, 3750.0, 2099.0, 1139.0, 720.0, 446.0, 248.0, 203.0, 133.0, 94.0, 54.0, 48.0, 44.0, 26.0, 12.0, 2.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1378173828125, -0.1329803466796875, -0.128143310546875, -0.1233062744140625, -0.11846923828125, -0.1136322021484375, -0.108795166015625, -0.1039581298828125, -0.09912109375, -0.0942840576171875, -0.089447021484375, -0.0846099853515625, -0.07977294921875, -0.0749359130859375, -0.070098876953125, -0.0652618408203125, -0.0604248046875, -0.0555877685546875, -0.050750732421875, -0.0459136962890625, -0.04107666015625, -0.0362396240234375, -0.031402587890625, -0.0265655517578125, -0.021728515625, -0.0168914794921875, -0.012054443359375, -0.0072174072265625, -0.00238037109375, 0.0024566650390625, 0.007293701171875, 0.0121307373046875, 0.0169677734375, 0.0218048095703125, 0.026641845703125, 0.0314788818359375, 0.03631591796875, 0.0411529541015625, 0.045989990234375, 0.0508270263671875, 0.0556640625, 0.0605010986328125, 0.065338134765625, 0.0701751708984375, 0.07501220703125, 0.0798492431640625, 0.084686279296875, 0.0895233154296875, 0.0943603515625, 0.0991973876953125, 0.104034423828125, 0.1088714599609375, 0.11370849609375, 0.1185455322265625, 0.123382568359375, 0.1282196044921875, 0.133056640625, 0.1378936767578125, 0.142730712890625, 0.1475677490234375, 0.15240478515625, 0.1572418212890625, 0.162078857421875, 0.1669158935546875, 0.1717529296875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 18.0, 24.0, 42.0, 69.0, 93.0, 199.0, 370.0, 960.0, 1036.0, 482.0, 240.0, 152.0, 110.0, 65.0, 48.0, 26.0, 21.0, 22.0, 14.0, 11.0, 8.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.188232421875, -0.18329429626464844, -0.17835617065429688, -0.1734180450439453, -0.16847991943359375, -0.1635417938232422, -0.15860366821289062, -0.15366554260253906, -0.1487274169921875, -0.14378929138183594, -0.13885116577148438, -0.1339130401611328, -0.12897491455078125, -0.12403678894042969, -0.11909866333007812, -0.11416053771972656, -0.109222412109375, -0.10428428649902344, -0.09934616088867188, -0.09440803527832031, -0.08946990966796875, -0.08453178405761719, -0.07959365844726562, -0.07465553283691406, -0.0697174072265625, -0.06477928161621094, -0.059841156005859375, -0.05490303039550781, -0.04996490478515625, -0.04502677917480469, -0.040088653564453125, -0.03515052795410156, -0.03021240234375, -0.025274276733398438, -0.020336151123046875, -0.015398025512695312, -0.01045989990234375, -0.0055217742919921875, -0.000583648681640625, 0.0043544769287109375, 0.0092926025390625, 0.014230728149414062, 0.019168853759765625, 0.024106979370117188, 0.02904510498046875, 0.03398323059082031, 0.038921356201171875, 0.04385948181152344, 0.048797607421875, 0.05373573303222656, 0.058673858642578125, 0.06361198425292969, 0.06855010986328125, 0.07348823547363281, 0.07842636108398438, 0.08336448669433594, 0.0883026123046875, 0.09324073791503906, 0.09817886352539062, 0.10311698913574219, 0.10805511474609375, 0.11299324035644531, 0.11793136596679688, 0.12286949157714844, 0.1278076171875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 1.0, 1.0, 7.0, 13.0, 16.0, 17.0, 42.0, 45.0, 71.0, 94.0, 105.0, 145.0, 102.0, 90.0, 53.0, 52.0, 38.0, 27.0, 18.0, 15.0, 8.0, 15.0, 3.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.387558937072754, -1.3371734619140625, -1.2867878675460815, -1.2364022731781006, -1.1860167980194092, -1.1356313228607178, -1.0852457284927368, -1.0348601341247559, -0.9844746589660645, -0.9340891242027283, -0.8837035894393921, -0.8333180546760559, -0.7829325199127197, -0.7325469851493835, -0.6821614503860474, -0.6317759156227112, -0.581390380859375, -0.5310048460960388, -0.48061931133270264, -0.43023377656936646, -0.3798482418060303, -0.3294627070426941, -0.2790771722793579, -0.22869163751602173, -0.17830610275268555, -0.12792056798934937, -0.07753503322601318, -0.027149498462677002, 0.02323603630065918, 0.07362157106399536, 0.12400710582733154, 0.17439264059066772, 0.2247781753540039, 0.2751637101173401, 0.32554924488067627, 0.37593477964401245, 0.42632031440734863, 0.4767058491706848, 0.527091383934021, 0.5774769186973572, 0.6278624534606934, 0.6782479882240295, 0.7286335229873657, 0.7790190577507019, 0.8294045925140381, 0.8797901272773743, 0.9301756620407104, 0.9805611968040466, 1.0309467315673828, 1.0813322067260742, 1.1317178010940552, 1.1821033954620361, 1.2324888706207275, 1.282874345779419, 1.3332599401474, 1.3836455345153809, 1.4340310096740723, 1.4844164848327637, 1.5348020792007446, 1.5851876735687256, 1.635573148727417, 1.6859586238861084, 1.7363442182540894, 1.7867298126220703, 1.8371152877807617]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 4.0, 12.0, 10.0, 16.0, 12.0, 24.0, 27.0, 26.0, 41.0, 29.0, 35.0, 43.0, 56.0, 45.0, 45.0, 59.0, 58.0, 50.0, 38.0, 47.0, 45.0, 42.0, 30.0, 35.0, 30.0, 26.0, 26.0, 19.0, 22.0, 12.0, 9.0, 6.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.313619613647461, -1.2759904861450195, -1.2383614778518677, -1.2007323503494263, -1.1631033420562744, -1.125474214553833, -1.0878452062606812, -1.0502160787582397, -1.012587070465088, -0.9749580025672913, -0.9373289346694946, -0.899699866771698, -0.8620707988739014, -0.8244417309761047, -0.7868126630783081, -0.7491835355758667, -0.7115544676780701, -0.6739253997802734, -0.6362963318824768, -0.5986672639846802, -0.5610381960868835, -0.5234091281890869, -0.4857800304889679, -0.44815096259117126, -0.41052189469337463, -0.372892826795578, -0.33526375889778137, -0.29763466119766235, -0.2600055932998657, -0.22237654030323029, -0.18474745750427246, -0.14711838960647583, -0.1094893217086792, -0.07186025381088257, -0.03423117846250534, 0.003397896885871887, 0.04102696478366852, 0.07865603268146515, 0.11628511548042297, 0.1539141833782196, 0.19154325127601624, 0.22917231917381287, 0.2668013870716095, 0.3044304847717285, 0.34205955266952515, 0.3796886205673218, 0.4173176884651184, 0.45494675636291504, 0.49257582426071167, 0.5302048921585083, 0.5678339600563049, 0.6054630279541016, 0.6430920958518982, 0.6807211637496948, 0.7183502912521362, 0.7559792995452881, 0.7936084270477295, 0.8312374949455261, 0.8688665628433228, 0.9064956307411194, 0.944124698638916, 0.9817537665367126, 1.0193828344345093, 1.0570119619369507, 1.0946409702301025]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 4.0, 11.0, 16.0, 15.0, 26.0, 41.0, 65.0, 99.0, 165.0, 257.0, 424.0, 725.0, 1505.0, 3687.0, 13095.0, 87141.0, 757419.0, 156067.0, 19239.0, 4697.0, 1756.0, 873.0, 432.0, 270.0, 180.0, 115.0, 86.0, 50.0, 25.0, 23.0, 15.0, 4.0, 11.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.406982421875, -0.3945045471191406, -0.38202667236328125, -0.3695487976074219, -0.3570709228515625, -0.3445930480957031, -0.33211517333984375, -0.3196372985839844, -0.307159423828125, -0.2946815490722656, -0.28220367431640625, -0.2697257995605469, -0.2572479248046875, -0.24477005004882812, -0.23229217529296875, -0.21981430053710938, -0.20733642578125, -0.19485855102539062, -0.18238067626953125, -0.16990280151367188, -0.1574249267578125, -0.14494705200195312, -0.13246917724609375, -0.11999130249023438, -0.107513427734375, -0.09503555297851562, -0.08255767822265625, -0.07007980346679688, -0.0576019287109375, -0.045124053955078125, -0.03264617919921875, -0.020168304443359375, -0.0076904296875, 0.004787445068359375, 0.01726531982421875, 0.029743194580078125, 0.0422210693359375, 0.054698944091796875, 0.06717681884765625, 0.07965469360351562, 0.092132568359375, 0.10461044311523438, 0.11708831787109375, 0.12956619262695312, 0.1420440673828125, 0.15452194213867188, 0.16699981689453125, 0.17947769165039062, 0.19195556640625, 0.20443344116210938, 0.21691131591796875, 0.22938919067382812, 0.2418670654296875, 0.2543449401855469, 0.26682281494140625, 0.2793006896972656, 0.291778564453125, 0.3042564392089844, 0.31673431396484375, 0.3292121887207031, 0.3416900634765625, 0.3541679382324219, 0.36664581298828125, 0.3791236877441406, 0.3916015625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 9.0, 26.0, 37.0, 56.0, 83.0, 96.0, 124.0, 129.0, 117.0, 90.0, 86.0, 44.0, 32.0, 21.0, 14.0, 10.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.133056640625, -0.1296863555908203, -0.12631607055664062, -0.12294578552246094, -0.11957550048828125, -0.11620521545410156, -0.11283493041992188, -0.10946464538574219, -0.1060943603515625, -0.10272407531738281, -0.09935379028320312, -0.09598350524902344, -0.09261322021484375, -0.08924293518066406, -0.08587265014648438, -0.08250236511230469, -0.079132080078125, -0.07576179504394531, -0.07239151000976562, -0.06902122497558594, -0.06565093994140625, -0.06228065490722656, -0.058910369873046875, -0.05554008483886719, -0.0521697998046875, -0.04879951477050781, -0.045429229736328125, -0.04205894470214844, -0.03868865966796875, -0.03531837463378906, -0.031948089599609375, -0.028577804565429688, -0.02520751953125, -0.021837234497070312, -0.018466949462890625, -0.015096664428710938, -0.01172637939453125, -0.008356094360351562, -0.004985809326171875, -0.0016155242919921875, 0.0017547607421875, 0.0051250457763671875, 0.008495330810546875, 0.011865615844726562, 0.01523590087890625, 0.018606185913085938, 0.021976470947265625, 0.025346755981445312, 0.028717041015625, 0.03208732604980469, 0.035457611083984375, 0.03882789611816406, 0.04219818115234375, 0.04556846618652344, 0.048938751220703125, 0.05230903625488281, 0.0556793212890625, 0.05904960632324219, 0.062419891357421875, 0.06579017639160156, 0.06916046142578125, 0.07253074645996094, 0.07590103149414062, 0.07927131652832031, 0.0826416015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 10.0, 14.0, 42.0, 51.0, 79.0, 148.0, 267.0, 568.0, 1148.0, 2404.0, 5335.0, 12643.0, 32509.0, 101590.0, 487021.0, 288346.0, 73260.0, 24880.0, 9900.0, 4430.0, 1967.0, 904.0, 442.0, 254.0, 143.0, 75.0, 36.0, 28.0, 21.0, 8.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2203369140625, -0.21383094787597656, -0.20732498168945312, -0.2008190155029297, -0.19431304931640625, -0.1878070831298828, -0.18130111694335938, -0.17479515075683594, -0.1682891845703125, -0.16178321838378906, -0.15527725219726562, -0.1487712860107422, -0.14226531982421875, -0.1357593536376953, -0.12925338745117188, -0.12274742126464844, -0.116241455078125, -0.10973548889160156, -0.10322952270507812, -0.09672355651855469, -0.09021759033203125, -0.08371162414550781, -0.07720565795898438, -0.07069969177246094, -0.0641937255859375, -0.05768775939941406, -0.051181793212890625, -0.04467582702636719, -0.03816986083984375, -0.03166389465332031, -0.025157928466796875, -0.018651962280273438, -0.01214599609375, -0.0056400299072265625, 0.000865936279296875, 0.0073719024658203125, 0.01387786865234375, 0.020383834838867188, 0.026889801025390625, 0.03339576721191406, 0.0399017333984375, 0.04640769958496094, 0.052913665771484375, 0.05941963195800781, 0.06592559814453125, 0.07243156433105469, 0.07893753051757812, 0.08544349670410156, 0.091949462890625, 0.09845542907714844, 0.10496139526367188, 0.11146736145019531, 0.11797332763671875, 0.12447929382324219, 0.13098526000976562, 0.13749122619628906, 0.1439971923828125, 0.15050315856933594, 0.15700912475585938, 0.1635150909423828, 0.17002105712890625, 0.1765270233154297, 0.18303298950195312, 0.18953895568847656, 0.196044921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 7.0, 9.0, 11.0, 12.0, 11.0, 20.0, 25.0, 19.0, 16.0, 38.0, 35.0, 45.0, 39.0, 43.0, 47.0, 51.0, 55.0, 47.0, 63.0, 52.0, 34.0, 48.0, 43.0, 39.0, 39.0, 14.0, 24.0, 25.0, 11.0, 14.0, 17.0, 7.0, 5.0, 9.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.209228515625, -0.20272445678710938, -0.19622039794921875, -0.18971633911132812, -0.1832122802734375, -0.17670822143554688, -0.17020416259765625, -0.16370010375976562, -0.157196044921875, -0.15069198608398438, -0.14418792724609375, -0.13768386840820312, -0.1311798095703125, -0.12467575073242188, -0.11817169189453125, -0.11166763305664062, -0.10516357421875, -0.09865951538085938, -0.09215545654296875, -0.08565139770507812, -0.0791473388671875, -0.07264328002929688, -0.06613922119140625, -0.059635162353515625, -0.053131103515625, -0.046627044677734375, -0.04012298583984375, -0.033618927001953125, -0.0271148681640625, -0.020610809326171875, -0.01410675048828125, -0.007602691650390625, -0.0010986328125, 0.005405426025390625, 0.01190948486328125, 0.018413543701171875, 0.0249176025390625, 0.031421661376953125, 0.03792572021484375, 0.044429779052734375, 0.050933837890625, 0.057437896728515625, 0.06394195556640625, 0.07044601440429688, 0.0769500732421875, 0.08345413208007812, 0.08995819091796875, 0.09646224975585938, 0.10296630859375, 0.10947036743164062, 0.11597442626953125, 0.12247848510742188, 0.1289825439453125, 0.13548660278320312, 0.14199066162109375, 0.14849472045898438, 0.154998779296875, 0.16150283813476562, 0.16800689697265625, 0.17451095581054688, 0.1810150146484375, 0.18751907348632812, 0.19402313232421875, 0.20052719116210938, 0.20703125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 11.0, 18.0, 34.0, 45.0, 65.0, 138.0, 269.0, 678.0, 1874.0, 6868.0, 39760.0, 760367.0, 211723.0, 20315.0, 4153.0, 1255.0, 486.0, 216.0, 109.0, 66.0, 28.0, 18.0, 17.0, 14.0, 4.0, 5.0, 1.0, 6.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1529541015625, -0.14868450164794922, -0.14441490173339844, -0.14014530181884766, -0.13587570190429688, -0.1316061019897461, -0.1273365020751953, -0.12306690216064453, -0.11879730224609375, -0.11452770233154297, -0.11025810241699219, -0.1059885025024414, -0.10171890258789062, -0.09744930267333984, -0.09317970275878906, -0.08891010284423828, -0.0846405029296875, -0.08037090301513672, -0.07610130310058594, -0.07183170318603516, -0.06756210327148438, -0.0632925033569336, -0.05902290344238281, -0.05475330352783203, -0.05048370361328125, -0.04621410369873047, -0.04194450378417969, -0.037674903869628906, -0.033405303955078125, -0.029135704040527344, -0.024866104125976562, -0.02059650421142578, -0.016326904296875, -0.012057304382324219, -0.0077877044677734375, -0.0035181045532226562, 0.000751495361328125, 0.005021095275878906, 0.009290695190429688, 0.013560295104980469, 0.01782989501953125, 0.02209949493408203, 0.026369094848632812, 0.030638694763183594, 0.034908294677734375, 0.039177894592285156, 0.04344749450683594, 0.04771709442138672, 0.0519866943359375, 0.05625629425048828, 0.06052589416503906, 0.06479549407958984, 0.06906509399414062, 0.0733346939086914, 0.07760429382324219, 0.08187389373779297, 0.08614349365234375, 0.09041309356689453, 0.09468269348144531, 0.0989522933959961, 0.10322189331054688, 0.10749149322509766, 0.11176109313964844, 0.11603069305419922, 0.12030029296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 5.0, 4.0, 4.0, 13.0, 13.0, 12.0, 16.0, 21.0, 41.0, 81.0, 114.0, 150.0, 149.0, 138.0, 81.0, 42.0, 30.0, 18.0, 14.0, 7.0, 8.0, 6.0, 6.0, 8.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00014400482177734375, -0.00014023110270500183, -0.0001364573836326599, -0.000132683664560318, -0.00012890994548797607, -0.00012513622641563416, -0.00012136250734329224, -0.00011758878827095032, -0.0001138150691986084, -0.00011004135012626648, -0.00010626763105392456, -0.00010249391198158264, -9.872019290924072e-05, -9.49464738368988e-05, -9.117275476455688e-05, -8.739903569221497e-05, -8.362531661987305e-05, -7.985159754753113e-05, -7.607787847518921e-05, -7.230415940284729e-05, -6.853044033050537e-05, -6.475672125816345e-05, -6.098300218582153e-05, -5.7209283113479614e-05, -5.3435564041137695e-05, -4.9661844968795776e-05, -4.588812589645386e-05, -4.211440682411194e-05, -3.834068775177002e-05, -3.45669686794281e-05, -3.079324960708618e-05, -2.7019530534744263e-05, -2.3245811462402344e-05, -1.9472092390060425e-05, -1.5698373317718506e-05, -1.1924654245376587e-05, -8.150935173034668e-06, -4.377216100692749e-06, -6.034970283508301e-07, 3.170222043991089e-06, 6.943941116333008e-06, 1.0717660188674927e-05, 1.4491379261016846e-05, 1.8265098333358765e-05, 2.2038817405700684e-05, 2.5812536478042603e-05, 2.958625555038452e-05, 3.335997462272644e-05, 3.713369369506836e-05, 4.090741276741028e-05, 4.46811318397522e-05, 4.8454850912094116e-05, 5.2228569984436035e-05, 5.6002289056777954e-05, 5.977600812911987e-05, 6.354972720146179e-05, 6.732344627380371e-05, 7.109716534614563e-05, 7.487088441848755e-05, 7.864460349082947e-05, 8.241832256317139e-05, 8.61920416355133e-05, 8.996576070785522e-05, 9.373947978019714e-05, 9.751319885253906e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 9.0, 7.0, 24.0, 22.0, 47.0, 48.0, 62.0, 166.0, 242.0, 409.0, 756.0, 1501.0, 2854.0, 6087.0, 13811.0, 36006.0, 132010.0, 620415.0, 163123.0, 41851.0, 15546.0, 6877.0, 3146.0, 1592.0, 847.0, 427.0, 237.0, 163.0, 84.0, 64.0, 36.0, 24.0, 20.0, 9.0, 8.0, 3.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061492919921875, -0.059481143951416016, -0.05746936798095703, -0.05545759201049805, -0.05344581604003906, -0.05143404006958008, -0.049422264099121094, -0.04741048812866211, -0.045398712158203125, -0.04338693618774414, -0.041375160217285156, -0.03936338424682617, -0.03735160827636719, -0.0353398323059082, -0.03332805633544922, -0.031316280364990234, -0.02930450439453125, -0.027292728424072266, -0.02528095245361328, -0.023269176483154297, -0.021257400512695312, -0.019245624542236328, -0.017233848571777344, -0.01522207260131836, -0.013210296630859375, -0.01119852066040039, -0.009186744689941406, -0.007174968719482422, -0.0051631927490234375, -0.003151416778564453, -0.0011396408081054688, 0.0008721351623535156, 0.0028839111328125, 0.004895687103271484, 0.006907463073730469, 0.008919239044189453, 0.010931015014648438, 0.012942790985107422, 0.014954566955566406, 0.01696634292602539, 0.018978118896484375, 0.02098989486694336, 0.023001670837402344, 0.025013446807861328, 0.027025222778320312, 0.029036998748779297, 0.03104877471923828, 0.033060550689697266, 0.03507232666015625, 0.037084102630615234, 0.03909587860107422, 0.0411076545715332, 0.04311943054199219, 0.04513120651245117, 0.047142982482910156, 0.04915475845336914, 0.051166534423828125, 0.05317831039428711, 0.055190086364746094, 0.05720186233520508, 0.05921363830566406, 0.06122541427612305, 0.06323719024658203, 0.06524896621704102, 0.0672607421875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 11.0, 8.0, 4.0, 16.0, 12.0, 20.0, 28.0, 28.0, 29.0, 38.0, 60.0, 53.0, 91.0, 131.0, 100.0, 82.0, 53.0, 47.0, 41.0, 28.0, 16.0, 21.0, 17.0, 14.0, 10.0, 10.0, 10.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0699462890625, -0.06767082214355469, -0.06539535522460938, -0.06311988830566406, -0.06084442138671875, -0.05856895446777344, -0.056293487548828125, -0.05401802062988281, -0.0517425537109375, -0.04946708679199219, -0.047191619873046875, -0.04491615295410156, -0.04264068603515625, -0.04036521911621094, -0.038089752197265625, -0.03581428527832031, -0.033538818359375, -0.03126335144042969, -0.028987884521484375, -0.026712417602539062, -0.02443695068359375, -0.022161483764648438, -0.019886016845703125, -0.017610549926757812, -0.0153350830078125, -0.013059616088867188, -0.010784149169921875, -0.008508682250976562, -0.00623321533203125, -0.0039577484130859375, -0.001682281494140625, 0.0005931854248046875, 0.00286865234375, 0.0051441192626953125, 0.007419586181640625, 0.009695053100585938, 0.01197052001953125, 0.014245986938476562, 0.016521453857421875, 0.018796920776367188, 0.0210723876953125, 0.023347854614257812, 0.025623321533203125, 0.027898788452148438, 0.03017425537109375, 0.03244972229003906, 0.034725189208984375, 0.03700065612792969, 0.039276123046875, 0.04155158996582031, 0.043827056884765625, 0.04610252380371094, 0.04837799072265625, 0.05065345764160156, 0.052928924560546875, 0.05520439147949219, 0.0574798583984375, 0.05975532531738281, 0.062030792236328125, 0.06430625915527344, 0.06658172607421875, 0.06885719299316406, 0.07113265991210938, 0.07340812683105469, 0.07568359375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 8.0, 5.0, 5.0, 8.0, 9.0, 21.0, 25.0, 36.0, 29.0, 84.0, 92.0, 141.0, 144.0, 120.0, 77.0, 61.0, 38.0, 23.0, 16.0, 18.0, 14.0, 10.0, 5.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3173056840896606, -1.2774688005447388, -1.2376320362091064, -1.1977951526641846, -1.1579582691192627, -1.1181213855743408, -1.078284502029419, -1.0384477376937866, -0.9986108541488647, -0.9587739706039429, -0.9189371466636658, -0.8791003227233887, -0.8392634391784668, -0.7994265556335449, -0.7595897316932678, -0.7197529077529907, -0.6799160242080688, -0.640079140663147, -0.6002423167228699, -0.5604054927825928, -0.5205686092376709, -0.4807317554950714, -0.4408949017524719, -0.40105804800987244, -0.36122119426727295, -0.32138434052467346, -0.281547486782074, -0.2417106330394745, -0.201873779296875, -0.1620369255542755, -0.12220007181167603, -0.08236321806907654, -0.0425264835357666, -0.0026896297931671143, 0.03714722394943237, 0.07698407769203186, 0.11682093143463135, 0.15665778517723083, 0.19649463891983032, 0.2363314926624298, 0.2761683464050293, 0.3160052001476288, 0.35584205389022827, 0.39567890763282776, 0.43551576137542725, 0.47535261511802673, 0.5151894688606262, 0.5550262928009033, 0.5948631763458252, 0.6347000598907471, 0.6745368838310242, 0.7143737077713013, 0.7542105913162231, 0.794047474861145, 0.8338842988014221, 0.8737211227416992, 0.9135580062866211, 0.953394889831543, 0.9932317137718201, 1.0330685377120972, 1.072905421257019, 1.112742304801941, 1.1525790691375732, 1.1924159526824951, 1.232252836227417]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 6.0, 4.0, 10.0, 10.0, 23.0, 30.0, 27.0, 34.0, 45.0, 53.0, 59.0, 61.0, 87.0, 87.0, 73.0, 66.0, 60.0, 57.0, 28.0, 41.0, 29.0, 25.0, 16.0, 21.0, 9.0, 13.0, 6.0, 3.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3824677467346191, -1.344494104385376, -1.3065203428268433, -1.2685467004776, -1.230573058128357, -1.1925992965698242, -1.154625654220581, -1.116652011871338, -1.0786783695220947, -1.0407047271728516, -1.0027309656143188, -0.9647573232650757, -0.9267836809158325, -0.8888099789619446, -0.8508362770080566, -0.8128626346588135, -0.7748888731002808, -0.7369151711463928, -0.6989415287971497, -0.6609678268432617, -0.6229941844940186, -0.5850204825401306, -0.5470467805862427, -0.5090731382369995, -0.4710994362831116, -0.433125764131546, -0.39515209197998047, -0.35717839002609253, -0.319204717874527, -0.2812310457229614, -0.24325735867023468, -0.20528367161750793, -0.16730999946594238, -0.12933632731437683, -0.09136264026165009, -0.05338896065950394, -0.015415281057357788, 0.022558391094207764, 0.06053207814693451, 0.09850576519966125, 0.1364794373512268, 0.17445310950279236, 0.2124267965555191, 0.25040048360824585, 0.2883741557598114, 0.32634782791137695, 0.3643215298652649, 0.40229520201683044, 0.440268874168396, 0.47824254631996155, 0.5162162184715271, 0.554189920425415, 0.5921635627746582, 0.6301372647285461, 0.6681109666824341, 0.7060846090316772, 0.7440583109855652, 0.7820320129394531, 0.8200056552886963, 0.8579793572425842, 0.8959530591964722, 0.9339267015457153, 0.9719004034996033, 1.0098741054534912, 1.0478477478027344]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 8.0, 14.0, 15.0, 34.0, 55.0, 90.0, 176.0, 319.0, 593.0, 1979.0, 14845.0, 3811739.0, 352794.0, 8956.0, 1674.0, 566.0, 207.0, 101.0, 44.0, 23.0, 16.0, 11.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.76953125, -0.7515830993652344, -0.7336349487304688, -0.7156867980957031, -0.6977386474609375, -0.6797904968261719, -0.6618423461914062, -0.6438941955566406, -0.625946044921875, -0.6079978942871094, -0.5900497436523438, -0.5721015930175781, -0.5541534423828125, -0.5362052917480469, -0.5182571411132812, -0.5003089904785156, -0.48236083984375, -0.4644126892089844, -0.44646453857421875, -0.4285163879394531, -0.4105682373046875, -0.3926200866699219, -0.37467193603515625, -0.3567237854003906, -0.338775634765625, -0.3208274841308594, -0.30287933349609375, -0.2849311828613281, -0.2669830322265625, -0.24903488159179688, -0.23108673095703125, -0.21313858032226562, -0.1951904296875, -0.17724227905273438, -0.15929412841796875, -0.14134597778320312, -0.1233978271484375, -0.10544967651367188, -0.08750152587890625, -0.06955337524414062, -0.051605224609375, -0.033657073974609375, -0.01570892333984375, 0.002239227294921875, 0.0201873779296875, 0.038135528564453125, 0.05608367919921875, 0.07403182983398438, 0.09197998046875, 0.10992813110351562, 0.12787628173828125, 0.14582443237304688, 0.1637725830078125, 0.18172073364257812, 0.19966888427734375, 0.21761703491210938, 0.235565185546875, 0.2535133361816406, 0.27146148681640625, 0.2894096374511719, 0.3073577880859375, 0.3253059387207031, 0.34325408935546875, 0.3612022399902344, 0.379150390625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 10.0, 16.0, 40.0, 68.0, 86.0, 102.0, 109.0, 121.0, 125.0, 96.0, 87.0, 53.0, 27.0, 18.0, 13.0, 12.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1318359375, -0.12858009338378906, -0.12532424926757812, -0.12206840515136719, -0.11881256103515625, -0.11555671691894531, -0.11230087280273438, -0.10904502868652344, -0.1057891845703125, -0.10253334045410156, -0.09927749633789062, -0.09602165222167969, -0.09276580810546875, -0.08950996398925781, -0.08625411987304688, -0.08299827575683594, -0.079742431640625, -0.07648658752441406, -0.07323074340820312, -0.06997489929199219, -0.06671905517578125, -0.06346321105957031, -0.060207366943359375, -0.05695152282714844, -0.0536956787109375, -0.05043983459472656, -0.047183990478515625, -0.04392814636230469, -0.04067230224609375, -0.03741645812988281, -0.034160614013671875, -0.030904769897460938, -0.02764892578125, -0.024393081665039062, -0.021137237548828125, -0.017881393432617188, -0.01462554931640625, -0.011369705200195312, -0.008113861083984375, -0.0048580169677734375, -0.0016021728515625, 0.0016536712646484375, 0.004909515380859375, 0.008165359497070312, 0.01142120361328125, 0.014677047729492188, 0.017932891845703125, 0.021188735961914062, 0.024444580078125, 0.027700424194335938, 0.030956268310546875, 0.03421211242675781, 0.03746795654296875, 0.04072380065917969, 0.043979644775390625, 0.04723548889160156, 0.0504913330078125, 0.05374717712402344, 0.057003021240234375, 0.06025886535644531, 0.06351470947265625, 0.06677055358886719, 0.07002639770507812, 0.07328224182128906, 0.0765380859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 5.0, 6.0, 8.0, 18.0, 23.0, 34.0, 35.0, 53.0, 74.0, 137.0, 266.0, 469.0, 913.0, 1989.0, 4609.0, 11698.0, 34390.0, 150886.0, 3150758.0, 727770.0, 76762.0, 20262.0, 7078.0, 2882.0, 1326.0, 690.0, 416.0, 233.0, 157.0, 115.0, 63.0, 54.0, 38.0, 19.0, 8.0, 14.0, 13.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.206298828125, -0.1998138427734375, -0.193328857421875, -0.1868438720703125, -0.18035888671875, -0.1738739013671875, -0.167388916015625, -0.1609039306640625, -0.1544189453125, -0.1479339599609375, -0.141448974609375, -0.1349639892578125, -0.12847900390625, -0.1219940185546875, -0.115509033203125, -0.1090240478515625, -0.1025390625, -0.0960540771484375, -0.089569091796875, -0.0830841064453125, -0.07659912109375, -0.0701141357421875, -0.063629150390625, -0.0571441650390625, -0.0506591796875, -0.0441741943359375, -0.037689208984375, -0.0312042236328125, -0.02471923828125, -0.0182342529296875, -0.011749267578125, -0.0052642822265625, 0.001220703125, 0.0077056884765625, 0.014190673828125, 0.0206756591796875, 0.02716064453125, 0.0336456298828125, 0.040130615234375, 0.0466156005859375, 0.0531005859375, 0.0595855712890625, 0.066070556640625, 0.0725555419921875, 0.07904052734375, 0.0855255126953125, 0.092010498046875, 0.0984954833984375, 0.10498046875, 0.1114654541015625, 0.117950439453125, 0.1244354248046875, 0.13092041015625, 0.1374053955078125, 0.143890380859375, 0.1503753662109375, 0.1568603515625, 0.1633453369140625, 0.169830322265625, 0.1763153076171875, 0.18280029296875, 0.1892852783203125, 0.195770263671875, 0.2022552490234375, 0.208740234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 13.0, 10.0, 15.0, 21.0, 21.0, 31.0, 50.0, 57.0, 95.0, 175.0, 253.0, 577.0, 1304.0, 751.0, 275.0, 144.0, 74.0, 55.0, 43.0, 29.0, 20.0, 16.0, 7.0, 10.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2166748046875, -0.20980262756347656, -0.20293045043945312, -0.1960582733154297, -0.18918609619140625, -0.1823139190673828, -0.17544174194335938, -0.16856956481933594, -0.1616973876953125, -0.15482521057128906, -0.14795303344726562, -0.1410808563232422, -0.13420867919921875, -0.1273365020751953, -0.12046432495117188, -0.11359214782714844, -0.106719970703125, -0.09984779357910156, -0.09297561645507812, -0.08610343933105469, -0.07923126220703125, -0.07235908508300781, -0.06548690795898438, -0.05861473083496094, -0.0517425537109375, -0.04487037658691406, -0.037998199462890625, -0.031126022338867188, -0.02425384521484375, -0.017381668090820312, -0.010509490966796875, -0.0036373138427734375, 0.00323486328125, 0.010107040405273438, 0.016979217529296875, 0.023851394653320312, 0.03072357177734375, 0.03759574890136719, 0.044467926025390625, 0.05134010314941406, 0.0582122802734375, 0.06508445739746094, 0.07195663452148438, 0.07882881164550781, 0.08570098876953125, 0.09257316589355469, 0.09944534301757812, 0.10631752014160156, 0.113189697265625, 0.12006187438964844, 0.12693405151367188, 0.1338062286376953, 0.14067840576171875, 0.1475505828857422, 0.15442276000976562, 0.16129493713378906, 0.1681671142578125, 0.17503929138183594, 0.18191146850585938, 0.1887836456298828, 0.19565582275390625, 0.2025279998779297, 0.20940017700195312, 0.21627235412597656, 0.22314453125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 7.0, 6.0, 14.0, 17.0, 19.0, 41.0, 72.0, 97.0, 131.0, 174.0, 142.0, 108.0, 57.0, 40.0, 19.0, 15.0, 13.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9809967279434204, -1.9184601306915283, -1.8559236526489258, -1.7933870553970337, -1.7308504581451416, -1.668313980102539, -1.605777382850647, -1.5432407855987549, -1.4807043075561523, -1.4181677103042603, -1.3556312322616577, -1.2930946350097656, -1.230558156967163, -1.168021559715271, -1.105484962463379, -1.0429484844207764, -0.9804118871688843, -0.917875349521637, -0.8553388118743896, -0.7928022146224976, -0.7302656769752502, -0.6677291393280029, -0.6051925420761108, -0.5426560044288635, -0.4801194667816162, -0.4175829291343689, -0.3550463616847992, -0.2925097942352295, -0.22997325658798218, -0.16743671894073486, -0.10490015149116516, -0.04236358404159546, 0.020173072814941406, 0.08270962536334991, 0.14524617791175842, 0.20778273046016693, 0.27031928300857544, 0.33285582065582275, 0.39539238810539246, 0.45792895555496216, 0.5204654932022095, 0.5830020308494568, 0.6455385684967041, 0.7080751657485962, 0.7706117033958435, 0.8331482410430908, 0.8956848382949829, 0.9582213759422302, 1.0207579135894775, 1.0832945108413696, 1.1458309888839722, 1.2083675861358643, 1.2709040641784668, 1.3334406614303589, 1.395977258682251, 1.4585137367248535, 1.5210503339767456, 1.5835869312286377, 1.6461234092712402, 1.7086600065231323, 1.7711966037750244, 1.833733081817627, 1.896269679069519, 1.9588062763214111, 2.0213427543640137]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 6.0, 1.0, 6.0, 3.0, 9.0, 6.0, 10.0, 11.0, 9.0, 19.0, 14.0, 17.0, 20.0, 31.0, 31.0, 32.0, 57.0, 44.0, 40.0, 49.0, 48.0, 53.0, 41.0, 39.0, 40.0, 41.0, 41.0, 36.0, 41.0, 42.0, 22.0, 18.0, 27.0, 22.0, 17.0, 13.0, 13.0, 6.0, 9.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7867507338523865, -0.7595539093017578, -0.7323570847511292, -0.7051602602005005, -0.6779634952545166, -0.6507666707038879, -0.6235698461532593, -0.5963730216026306, -0.569176197052002, -0.5419793725013733, -0.5147825479507446, -0.48758575320243835, -0.4603889584541321, -0.4331921339035034, -0.40599530935287476, -0.3787984848022461, -0.3516017198562622, -0.32440489530563354, -0.29720810055732727, -0.2700112760066986, -0.24281446635723114, -0.21561765670776367, -0.188420832157135, -0.16122402250766754, -0.13402721285820007, -0.1068304032087326, -0.07963358610868454, -0.052436769008636475, -0.025239959359169006, 0.001956850290298462, 0.029153674840927124, 0.05635048449039459, 0.08354723453521729, 0.11074404418468475, 0.13794085383415222, 0.16513767838478088, 0.19233448803424835, 0.21953129768371582, 0.24672812223434448, 0.27392494678497314, 0.3011217415332794, 0.3283185660839081, 0.35551536083221436, 0.382712185382843, 0.4099090099334717, 0.43710580468177795, 0.4643026292324066, 0.4914994239807129, 0.5186962485313416, 0.5458930730819702, 0.5730898976325989, 0.6002867221832275, 0.6274834871292114, 0.6546803116798401, 0.6818771362304688, 0.7090739607810974, 0.7362707853317261, 0.7634676098823547, 0.7906644344329834, 0.8178611993789673, 0.845058023929596, 0.8722548484802246, 0.8994516730308533, 0.9266484975814819, 0.9538452625274658]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 2.0, 0.0, 4.0, 5.0, 11.0, 3.0, 17.0, 13.0, 17.0, 28.0, 40.0, 46.0, 67.0, 110.0, 193.0, 292.0, 510.0, 1010.0, 2443.0, 7067.0, 31027.0, 248966.0, 663268.0, 73462.0, 12996.0, 3682.0, 1435.0, 728.0, 404.0, 245.0, 141.0, 87.0, 68.0, 43.0, 40.0, 28.0, 18.0, 12.0, 6.0, 10.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43701171875, -0.42494964599609375, -0.4128875732421875, -0.40082550048828125, -0.388763427734375, -0.37670135498046875, -0.3646392822265625, -0.35257720947265625, -0.34051513671875, -0.32845306396484375, -0.3163909912109375, -0.30432891845703125, -0.292266845703125, -0.28020477294921875, -0.2681427001953125, -0.25608062744140625, -0.2440185546875, -0.23195648193359375, -0.2198944091796875, -0.20783233642578125, -0.195770263671875, -0.18370819091796875, -0.1716461181640625, -0.15958404541015625, -0.14752197265625, -0.13545989990234375, -0.1233978271484375, -0.11133575439453125, -0.099273681640625, -0.08721160888671875, -0.0751495361328125, -0.06308746337890625, -0.051025390625, -0.03896331787109375, -0.0269012451171875, -0.01483917236328125, -0.002777099609375, 0.00928497314453125, 0.0213470458984375, 0.03340911865234375, 0.04547119140625, 0.05753326416015625, 0.0695953369140625, 0.08165740966796875, 0.093719482421875, 0.10578155517578125, 0.1178436279296875, 0.12990570068359375, 0.1419677734375, 0.15402984619140625, 0.1660919189453125, 0.17815399169921875, 0.190216064453125, 0.20227813720703125, 0.2143402099609375, 0.22640228271484375, 0.23846435546875, 0.25052642822265625, 0.2625885009765625, 0.27465057373046875, 0.286712646484375, 0.29877471923828125, 0.3108367919921875, 0.32289886474609375, 0.3349609375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 16.0, 16.0, 37.0, 51.0, 83.0, 87.0, 106.0, 105.0, 120.0, 99.0, 91.0, 72.0, 42.0, 23.0, 13.0, 10.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1290283203125, -0.125946044921875, -0.12286376953125, -0.119781494140625, -0.11669921875, -0.113616943359375, -0.11053466796875, -0.107452392578125, -0.1043701171875, -0.101287841796875, -0.09820556640625, -0.095123291015625, -0.092041015625, -0.088958740234375, -0.08587646484375, -0.082794189453125, -0.0797119140625, -0.076629638671875, -0.07354736328125, -0.070465087890625, -0.0673828125, -0.064300537109375, -0.06121826171875, -0.058135986328125, -0.0550537109375, -0.051971435546875, -0.04888916015625, -0.045806884765625, -0.042724609375, -0.039642333984375, -0.03656005859375, -0.033477783203125, -0.0303955078125, -0.027313232421875, -0.02423095703125, -0.021148681640625, -0.01806640625, -0.014984130859375, -0.01190185546875, -0.008819580078125, -0.0057373046875, -0.002655029296875, 0.00042724609375, 0.003509521484375, 0.006591796875, 0.009674072265625, 0.01275634765625, 0.015838623046875, 0.0189208984375, 0.022003173828125, 0.02508544921875, 0.028167724609375, 0.03125, 0.034332275390625, 0.03741455078125, 0.040496826171875, 0.0435791015625, 0.046661376953125, 0.04974365234375, 0.052825927734375, 0.055908203125, 0.058990478515625, 0.06207275390625, 0.065155029296875, 0.0682373046875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 4.0, 8.0, 3.0, 13.0, 13.0, 22.0, 46.0, 64.0, 112.0, 202.0, 479.0, 960.0, 2496.0, 6833.0, 23653.0, 107866.0, 674713.0, 180666.0, 35066.0, 9633.0, 3274.0, 1258.0, 582.0, 248.0, 142.0, 84.0, 45.0, 15.0, 20.0, 10.0, 7.0, 6.0, 8.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.324462890625, -0.314208984375, -0.303955078125, -0.293701171875, -0.283447265625, -0.273193359375, -0.262939453125, -0.252685546875, -0.242431640625, -0.232177734375, -0.221923828125, -0.211669921875, -0.201416015625, -0.191162109375, -0.180908203125, -0.170654296875, -0.160400390625, -0.150146484375, -0.139892578125, -0.129638671875, -0.119384765625, -0.109130859375, -0.098876953125, -0.088623046875, -0.078369140625, -0.068115234375, -0.057861328125, -0.047607421875, -0.037353515625, -0.027099609375, -0.016845703125, -0.006591796875, 0.003662109375, 0.013916015625, 0.024169921875, 0.034423828125, 0.044677734375, 0.054931640625, 0.065185546875, 0.075439453125, 0.085693359375, 0.095947265625, 0.106201171875, 0.116455078125, 0.126708984375, 0.136962890625, 0.147216796875, 0.157470703125, 0.167724609375, 0.177978515625, 0.188232421875, 0.198486328125, 0.208740234375, 0.218994140625, 0.229248046875, 0.239501953125, 0.249755859375, 0.260009765625, 0.270263671875, 0.280517578125, 0.290771484375, 0.301025390625, 0.311279296875, 0.321533203125, 0.331787109375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 6.0, 6.0, 4.0, 7.0, 14.0, 7.0, 21.0, 29.0, 23.0, 37.0, 45.0, 56.0, 53.0, 58.0, 56.0, 60.0, 61.0, 74.0, 61.0, 61.0, 45.0, 48.0, 31.0, 29.0, 24.0, 20.0, 8.0, 20.0, 9.0, 11.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.293212890625, -0.2844123840332031, -0.27561187744140625, -0.2668113708496094, -0.2580108642578125, -0.24921035766601562, -0.24040985107421875, -0.23160934448242188, -0.222808837890625, -0.21400833129882812, -0.20520782470703125, -0.19640731811523438, -0.1876068115234375, -0.17880630493164062, -0.17000579833984375, -0.16120529174804688, -0.15240478515625, -0.14360427856445312, -0.13480377197265625, -0.12600326538085938, -0.1172027587890625, -0.10840225219726562, -0.09960174560546875, -0.09080123901367188, -0.082000732421875, -0.07320022583007812, -0.06439971923828125, -0.055599212646484375, -0.0467987060546875, -0.037998199462890625, -0.02919769287109375, -0.020397186279296875, -0.0115966796875, -0.002796173095703125, 0.00600433349609375, 0.014804840087890625, 0.0236053466796875, 0.032405853271484375, 0.04120635986328125, 0.050006866455078125, 0.058807373046875, 0.06760787963867188, 0.07640838623046875, 0.08520889282226562, 0.0940093994140625, 0.10280990600585938, 0.11161041259765625, 0.12041091918945312, 0.12921142578125, 0.13801193237304688, 0.14681243896484375, 0.15561294555664062, 0.1644134521484375, 0.17321395874023438, 0.18201446533203125, 0.19081497192382812, 0.199615478515625, 0.20841598510742188, 0.21721649169921875, 0.22601699829101562, 0.2348175048828125, 0.24361801147460938, 0.25241851806640625, 0.2612190246582031, 0.27001953125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 11.0, 11.0, 24.0, 32.0, 33.0, 33.0, 49.0, 85.0, 133.0, 161.0, 231.0, 375.0, 556.0, 990.0, 1519.0, 2648.0, 5176.0, 9937.0, 21840.0, 56781.0, 213959.0, 574457.0, 96693.0, 32930.0, 14058.0, 6832.0, 3585.0, 2022.0, 1225.0, 717.0, 482.0, 323.0, 172.0, 133.0, 93.0, 62.0, 46.0, 35.0, 28.0, 19.0, 14.0, 7.0, 10.0, 9.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0408935546875, -0.039540767669677734, -0.03818798065185547, -0.0368351936340332, -0.03548240661621094, -0.03412961959838867, -0.032776832580566406, -0.03142404556274414, -0.030071258544921875, -0.02871847152709961, -0.027365684509277344, -0.026012897491455078, -0.024660110473632812, -0.023307323455810547, -0.02195453643798828, -0.020601749420166016, -0.01924896240234375, -0.017896175384521484, -0.01654338836669922, -0.015190601348876953, -0.013837814331054688, -0.012485027313232422, -0.011132240295410156, -0.00977945327758789, -0.008426666259765625, -0.007073879241943359, -0.005721092224121094, -0.004368305206298828, -0.0030155181884765625, -0.0016627311706542969, -0.00030994415283203125, 0.0010428428649902344, 0.0023956298828125, 0.0037484169006347656, 0.005101203918457031, 0.006453990936279297, 0.0078067779541015625, 0.009159564971923828, 0.010512351989746094, 0.01186513900756836, 0.013217926025390625, 0.01457071304321289, 0.015923500061035156, 0.017276287078857422, 0.018629074096679688, 0.019981861114501953, 0.02133464813232422, 0.022687435150146484, 0.02404022216796875, 0.025393009185791016, 0.02674579620361328, 0.028098583221435547, 0.029451370239257812, 0.030804157257080078, 0.032156944274902344, 0.03350973129272461, 0.034862518310546875, 0.03621530532836914, 0.037568092346191406, 0.03892087936401367, 0.04027366638183594, 0.0416264533996582, 0.04297924041748047, 0.044332027435302734, 0.045684814453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 6.0, 2.0, 9.0, 9.0, 11.0, 13.0, 23.0, 58.0, 99.0, 224.0, 253.0, 129.0, 71.0, 33.0, 19.0, 5.0, 6.0, 8.0, 7.0, 6.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002808570861816406, -0.00027181580662727356, -0.0002627745270729065, -0.00025373324751853943, -0.00024469196796417236, -0.0002356506884098053, -0.00022660940885543823, -0.00021756812930107117, -0.0002085268497467041, -0.00019948557019233704, -0.00019044429063796997, -0.0001814030110836029, -0.00017236173152923584, -0.00016332045197486877, -0.0001542791724205017, -0.00014523789286613464, -0.00013619661331176758, -0.0001271553337574005, -0.00011811405420303345, -0.00010907277464866638, -0.00010003149509429932, -9.099021553993225e-05, -8.194893598556519e-05, -7.290765643119812e-05, -6.386637687683105e-05, -5.482509732246399e-05, -4.5783817768096924e-05, -3.674253821372986e-05, -2.7701258659362793e-05, -1.8659979104995728e-05, -9.618699550628662e-06, -5.774199962615967e-07, 8.463859558105469e-06, 1.7505139112472534e-05, 2.65464186668396e-05, 3.5587698221206665e-05, 4.462897777557373e-05, 5.3670257329940796e-05, 6.271153688430786e-05, 7.175281643867493e-05, 8.079409599304199e-05, 8.983537554740906e-05, 9.887665510177612e-05, 0.00010791793465614319, 0.00011695921421051025, 0.00012600049376487732, 0.00013504177331924438, 0.00014408305287361145, 0.00015312433242797852, 0.00016216561198234558, 0.00017120689153671265, 0.0001802481710910797, 0.00018928945064544678, 0.00019833073019981384, 0.0002073720097541809, 0.00021641328930854797, 0.00022545456886291504, 0.0002344958484172821, 0.00024353712797164917, 0.00025257840752601624, 0.0002616196870803833, 0.00027066096663475037, 0.00027970224618911743, 0.0002887435257434845, 0.00029778480529785156]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 9.0, 5.0, 11.0, 5.0, 13.0, 17.0, 29.0, 30.0, 51.0, 123.0, 204.0, 307.0, 618.0, 1369.0, 3223.0, 8270.0, 26583.0, 121455.0, 716625.0, 127348.0, 27591.0, 8574.0, 3265.0, 1388.0, 631.0, 336.0, 175.0, 115.0, 56.0, 43.0, 21.0, 11.0, 18.0, 4.0, 8.0, 9.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.061920166015625, -0.06001567840576172, -0.05811119079589844, -0.056206703186035156, -0.054302215576171875, -0.052397727966308594, -0.05049324035644531, -0.04858875274658203, -0.04668426513671875, -0.04477977752685547, -0.04287528991699219, -0.040970802307128906, -0.039066314697265625, -0.037161827087402344, -0.03525733947753906, -0.03335285186767578, -0.0314483642578125, -0.02954387664794922, -0.027639389038085938, -0.025734901428222656, -0.023830413818359375, -0.021925926208496094, -0.020021438598632812, -0.01811695098876953, -0.01621246337890625, -0.014307975769042969, -0.012403488159179688, -0.010499000549316406, -0.008594512939453125, -0.006690025329589844, -0.0047855377197265625, -0.0028810501098632812, -0.0009765625, 0.0009279251098632812, 0.0028324127197265625, 0.004736900329589844, 0.006641387939453125, 0.008545875549316406, 0.010450363159179688, 0.012354850769042969, 0.01425933837890625, 0.01616382598876953, 0.018068313598632812, 0.019972801208496094, 0.021877288818359375, 0.023781776428222656, 0.025686264038085938, 0.02759075164794922, 0.0294952392578125, 0.03139972686767578, 0.03330421447753906, 0.035208702087402344, 0.037113189697265625, 0.039017677307128906, 0.04092216491699219, 0.04282665252685547, 0.04473114013671875, 0.04663562774658203, 0.04854011535644531, 0.050444602966308594, 0.052349090576171875, 0.054253578186035156, 0.05615806579589844, 0.05806255340576172, 0.059967041015625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 4.0, 1.0, 8.0, 13.0, 14.0, 18.0, 19.0, 22.0, 32.0, 35.0, 51.0, 43.0, 60.0, 81.0, 77.0, 82.0, 75.0, 68.0, 43.0, 56.0, 36.0, 27.0, 25.0, 14.0, 23.0, 10.0, 7.0, 9.0, 8.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03790283203125, -0.036640167236328125, -0.03537750244140625, -0.034114837646484375, -0.0328521728515625, -0.031589508056640625, -0.03032684326171875, -0.029064178466796875, -0.027801513671875, -0.026538848876953125, -0.02527618408203125, -0.024013519287109375, -0.0227508544921875, -0.021488189697265625, -0.02022552490234375, -0.018962860107421875, -0.0177001953125, -0.016437530517578125, -0.01517486572265625, -0.013912200927734375, -0.0126495361328125, -0.011386871337890625, -0.01012420654296875, -0.008861541748046875, -0.007598876953125, -0.006336212158203125, -0.00507354736328125, -0.003810882568359375, -0.0025482177734375, -0.001285552978515625, -2.288818359375e-05, 0.001239776611328125, 0.00250244140625, 0.003765106201171875, 0.00502777099609375, 0.006290435791015625, 0.0075531005859375, 0.008815765380859375, 0.01007843017578125, 0.011341094970703125, 0.012603759765625, 0.013866424560546875, 0.01512908935546875, 0.016391754150390625, 0.0176544189453125, 0.018917083740234375, 0.02017974853515625, 0.021442413330078125, 0.022705078125, 0.023967742919921875, 0.02523040771484375, 0.026493072509765625, 0.0277557373046875, 0.029018402099609375, 0.03028106689453125, 0.031543731689453125, 0.032806396484375, 0.034069061279296875, 0.03533172607421875, 0.036594390869140625, 0.0378570556640625, 0.039119720458984375, 0.04038238525390625, 0.041645050048828125, 0.04290771484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 2.0, 0.0, 5.0, 4.0, 6.0, 13.0, 10.0, 7.0, 9.0, 13.0, 23.0, 16.0, 44.0, 32.0, 48.0, 67.0, 87.0, 112.0, 112.0, 87.0, 45.0, 47.0, 46.0, 35.0, 22.0, 22.0, 14.0, 11.0, 8.0, 6.0, 8.0, 5.0, 5.0, 7.0, 2.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8069772720336914, -0.7781876921653748, -0.7493980526924133, -0.7206084728240967, -0.6918188333511353, -0.6630292534828186, -0.634239673614502, -0.6054500341415405, -0.5766603946685791, -0.5478708148002625, -0.519081175327301, -0.4902915954589844, -0.46150195598602295, -0.4327123761177063, -0.40392276644706726, -0.3751331567764282, -0.3463435769081116, -0.31755396723747253, -0.2887643575668335, -0.25997477769851685, -0.2311851531267166, -0.20239554345607758, -0.17360594868659973, -0.1448163390159607, -0.11602672934532166, -0.08723711967468262, -0.058447517454624176, -0.029657915234565735, -0.0008683055639266968, 0.02792130410671234, 0.056710898876190186, 0.08550050854682922, 0.11429011821746826, 0.1430797278881073, 0.17186933755874634, 0.20065893232822418, 0.22944854199886322, 0.25823813676834106, 0.2870277464389801, 0.31581735610961914, 0.3446069657802582, 0.3733965754508972, 0.40218618512153625, 0.4309757947921753, 0.45976537466049194, 0.48855501413345337, 0.51734459400177, 0.5461342334747314, 0.5749238133430481, 0.6037133932113647, 0.6325030326843262, 0.6612926125526428, 0.6900822520256042, 0.7188718318939209, 0.7476614713668823, 0.776451051235199, 0.8052406311035156, 0.8340302109718323, 0.8628198504447937, 0.8916094303131104, 0.9203990697860718, 0.9491886496543884, 0.9779782295227051, 1.0067678689956665, 1.035557508468628]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 3.0, 3.0, 7.0, 6.0, 6.0, 12.0, 17.0, 19.0, 18.0, 14.0, 13.0, 13.0, 32.0, 28.0, 31.0, 22.0, 35.0, 36.0, 28.0, 36.0, 69.0, 63.0, 62.0, 51.0, 40.0, 39.0, 38.0, 41.0, 27.0, 20.0, 22.0, 15.0, 20.0, 16.0, 16.0, 13.0, 4.0, 10.0, 13.0, 9.0, 12.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.7811167240142822, -0.7565103769302368, -0.7319040894508362, -0.7072977423667908, -0.6826914548873901, -0.6580851078033447, -0.6334787607192993, -0.6088724732398987, -0.584266185760498, -0.5596598386764526, -0.535053551197052, -0.5104472041130066, -0.48584091663360596, -0.46123456954956055, -0.4366282522678375, -0.4120219349861145, -0.3874155879020691, -0.36280927062034607, -0.33820295333862305, -0.31359660625457764, -0.288990318775177, -0.2643839716911316, -0.23977765440940857, -0.21517133712768555, -0.19056501984596252, -0.1659587025642395, -0.14135238528251648, -0.11674605309963226, -0.09213973581790924, -0.06753341853618622, -0.042927086353302, -0.01832076907157898, 0.006285488605499268, 0.03089180961251259, 0.05549813061952591, 0.08010445535182953, 0.10471077263355255, 0.12931708991527557, 0.1539234220981598, 0.1785297393798828, 0.20313605666160583, 0.22774237394332886, 0.2523486912250519, 0.2769550085067749, 0.3015613555908203, 0.32616764307022095, 0.35077399015426636, 0.3753803074359894, 0.3999866247177124, 0.4245929419994354, 0.44919925928115845, 0.47380560636520386, 0.4984118938446045, 0.5230182409286499, 0.5476245880126953, 0.572230875492096, 0.5968371629714966, 0.621443510055542, 0.6460497975349426, 0.670656144618988, 0.6952624320983887, 0.7198687791824341, 0.7444751262664795, 0.7690814137458801, 0.7936877608299255]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 10.0, 11.0, 20.0, 31.0, 56.0, 71.0, 162.0, 294.0, 592.0, 1156.0, 3776.0, 43432.0, 4017908.0, 117679.0, 6780.0, 1481.0, 494.0, 158.0, 81.0, 33.0, 21.0, 13.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.87109375, -0.8511238098144531, -0.8311538696289062, -0.8111839294433594, -0.7912139892578125, -0.7712440490722656, -0.7512741088867188, -0.7313041687011719, -0.711334228515625, -0.6913642883300781, -0.6713943481445312, -0.6514244079589844, -0.6314544677734375, -0.6114845275878906, -0.5915145874023438, -0.5715446472167969, -0.55157470703125, -0.5316047668457031, -0.5116348266601562, -0.4916648864746094, -0.4716949462890625, -0.4517250061035156, -0.43175506591796875, -0.4117851257324219, -0.391815185546875, -0.3718452453613281, -0.35187530517578125, -0.3319053649902344, -0.3119354248046875, -0.2919654846191406, -0.27199554443359375, -0.2520256042480469, -0.2320556640625, -0.21208572387695312, -0.19211578369140625, -0.17214584350585938, -0.1521759033203125, -0.13220596313476562, -0.11223602294921875, -0.09226608276367188, -0.072296142578125, -0.052326202392578125, -0.03235626220703125, -0.012386322021484375, 0.0075836181640625, 0.027553558349609375, 0.04752349853515625, 0.06749343872070312, 0.08746337890625, 0.10743331909179688, 0.12740325927734375, 0.14737319946289062, 0.1673431396484375, 0.18731307983398438, 0.20728302001953125, 0.22725296020507812, 0.247222900390625, 0.2671928405761719, 0.28716278076171875, 0.3071327209472656, 0.3271026611328125, 0.3470726013183594, 0.36704254150390625, 0.3870124816894531, 0.406982421875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 5.0, 9.0, 16.0, 45.0, 47.0, 67.0, 89.0, 106.0, 104.0, 114.0, 113.0, 93.0, 55.0, 56.0, 32.0, 20.0, 13.0, 12.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.13134765625, -0.12822818756103516, -0.1251087188720703, -0.12198925018310547, -0.11886978149414062, -0.11575031280517578, -0.11263084411621094, -0.1095113754272461, -0.10639190673828125, -0.1032724380493164, -0.10015296936035156, -0.09703350067138672, -0.09391403198242188, -0.09079456329345703, -0.08767509460449219, -0.08455562591552734, -0.0814361572265625, -0.07831668853759766, -0.07519721984863281, -0.07207775115966797, -0.06895828247070312, -0.06583881378173828, -0.06271934509277344, -0.059599876403808594, -0.05648040771484375, -0.053360939025878906, -0.05024147033691406, -0.04712200164794922, -0.044002532958984375, -0.04088306427001953, -0.03776359558105469, -0.034644126892089844, -0.031524658203125, -0.028405189514160156, -0.025285720825195312, -0.02216625213623047, -0.019046783447265625, -0.01592731475830078, -0.012807846069335938, -0.009688377380371094, -0.00656890869140625, -0.0034494400024414062, -0.0003299713134765625, 0.0027894973754882812, 0.005908966064453125, 0.009028434753417969, 0.012147903442382812, 0.015267372131347656, 0.0183868408203125, 0.021506309509277344, 0.024625778198242188, 0.02774524688720703, 0.030864715576171875, 0.03398418426513672, 0.03710365295410156, 0.040223121643066406, 0.04334259033203125, 0.046462059020996094, 0.04958152770996094, 0.05270099639892578, 0.055820465087890625, 0.05893993377685547, 0.06205940246582031, 0.06517887115478516, 0.06829833984375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 4.0, 9.0, 15.0, 26.0, 35.0, 59.0, 83.0, 165.0, 290.0, 777.0, 2821.0, 16762.0, 206277.0, 3763735.0, 182853.0, 15976.0, 2706.0, 718.0, 382.0, 186.0, 121.0, 70.0, 70.0, 42.0, 50.0, 22.0, 15.0, 8.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.48388671875, -0.4713096618652344, -0.45873260498046875, -0.4461555480957031, -0.4335784912109375, -0.4210014343261719, -0.40842437744140625, -0.3958473205566406, -0.383270263671875, -0.3706932067871094, -0.35811614990234375, -0.3455390930175781, -0.3329620361328125, -0.3203849792480469, -0.30780792236328125, -0.2952308654785156, -0.28265380859375, -0.2700767517089844, -0.25749969482421875, -0.24492263793945312, -0.2323455810546875, -0.21976852416992188, -0.20719146728515625, -0.19461441040039062, -0.182037353515625, -0.16946029663085938, -0.15688323974609375, -0.14430618286132812, -0.1317291259765625, -0.11915206909179688, -0.10657501220703125, -0.09399795532226562, -0.0814208984375, -0.06884384155273438, -0.05626678466796875, -0.043689727783203125, -0.0311126708984375, -0.018535614013671875, -0.00595855712890625, 0.006618499755859375, 0.019195556640625, 0.031772613525390625, 0.04434967041015625, 0.056926727294921875, 0.0695037841796875, 0.08208084106445312, 0.09465789794921875, 0.10723495483398438, 0.11981201171875, 0.13238906860351562, 0.14496612548828125, 0.15754318237304688, 0.1701202392578125, 0.18269729614257812, 0.19527435302734375, 0.20785140991210938, 0.220428466796875, 0.23300552368164062, 0.24558258056640625, 0.2581596374511719, 0.2707366943359375, 0.2833137512207031, 0.29589080810546875, 0.3084678649902344, 0.321044921875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 8.0, 7.0, 9.0, 10.0, 26.0, 28.0, 46.0, 51.0, 85.0, 128.0, 204.0, 327.0, 703.0, 1023.0, 501.0, 292.0, 189.0, 140.0, 96.0, 59.0, 46.0, 21.0, 26.0, 22.0, 10.0, 6.0, 5.0, 6.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.140380859375, -0.13311767578125, -0.1258544921875, -0.11859130859375, -0.111328125, -0.10406494140625, -0.0968017578125, -0.08953857421875, -0.082275390625, -0.07501220703125, -0.0677490234375, -0.06048583984375, -0.05322265625, -0.04595947265625, -0.0386962890625, -0.03143310546875, -0.024169921875, -0.01690673828125, -0.0096435546875, -0.00238037109375, 0.0048828125, 0.01214599609375, 0.0194091796875, 0.02667236328125, 0.033935546875, 0.04119873046875, 0.0484619140625, 0.05572509765625, 0.06298828125, 0.07025146484375, 0.0775146484375, 0.08477783203125, 0.092041015625, 0.09930419921875, 0.1065673828125, 0.11383056640625, 0.12109375, 0.12835693359375, 0.1356201171875, 0.14288330078125, 0.150146484375, 0.15740966796875, 0.1646728515625, 0.17193603515625, 0.17919921875, 0.18646240234375, 0.1937255859375, 0.20098876953125, 0.208251953125, 0.21551513671875, 0.2227783203125, 0.23004150390625, 0.2373046875, 0.24456787109375, 0.2518310546875, 0.25909423828125, 0.266357421875, 0.27362060546875, 0.2808837890625, 0.28814697265625, 0.29541015625, 0.30267333984375, 0.3099365234375, 0.31719970703125, 0.324462890625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 7.0, 10.0, 18.0, 22.0, 45.0, 46.0, 71.0, 87.0, 115.0, 95.0, 108.0, 85.0, 61.0, 47.0, 43.0, 26.0, 21.0, 16.0, 17.0, 13.0, 10.0, 10.0, 6.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7761776447296143, -1.7270032167434692, -1.6778287887573242, -1.6286543607711792, -1.5794799327850342, -1.5303055047988892, -1.4811310768127441, -1.4319565296173096, -1.382782220840454, -1.333607792854309, -1.284433364868164, -1.235258936882019, -1.186084508895874, -1.136910080909729, -1.087735652923584, -1.0385611057281494, -0.9893866777420044, -0.9402122497558594, -0.8910378217697144, -0.8418633937835693, -0.7926889657974243, -0.7435145378112793, -0.6943400502204895, -0.6451656222343445, -0.5959911942481995, -0.5468167662620544, -0.4976423382759094, -0.448467880487442, -0.399293452501297, -0.350119024515152, -0.30094456672668457, -0.25177013874053955, -0.20259582996368408, -0.15342140197753906, -0.10424695909023285, -0.055072516202926636, -0.005898088216781616, 0.0432763397693634, 0.09245079755783081, 0.14162522554397583, 0.19079965353012085, 0.23997408151626587, 0.2891485095024109, 0.3383229672908783, 0.3874973952770233, 0.43667182326316833, 0.48584628105163574, 0.5350207090377808, 0.5841951370239258, 0.6333695650100708, 0.6825439929962158, 0.7317184209823608, 0.7808928489685059, 0.8300672769546509, 0.8792417645454407, 0.9284161925315857, 0.9775906205177307, 1.0267651081085205, 1.0759395360946655, 1.1251139640808105, 1.1742883920669556, 1.2234628200531006, 1.2726372480392456, 1.3218116760253906, 1.3709861040115356]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 14.0, 3.0, 13.0, 11.0, 15.0, 13.0, 16.0, 22.0, 17.0, 29.0, 36.0, 38.0, 37.0, 27.0, 35.0, 40.0, 40.0, 44.0, 46.0, 43.0, 36.0, 34.0, 40.0, 29.0, 31.0, 32.0, 28.0, 29.0, 22.0, 35.0, 16.0, 18.0, 16.0, 13.0, 7.0, 11.0, 8.0, 11.0, 5.0, 8.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0], "bins": [-0.8957594633102417, -0.868302583694458, -0.8408456444740295, -0.8133887052536011, -0.7859318256378174, -0.7584749460220337, -0.7310180068016052, -0.7035610675811768, -0.6761041879653931, -0.6486473083496094, -0.6211903691291809, -0.5937334299087524, -0.5662765502929688, -0.5388196706771851, -0.5113627314567566, -0.4839058220386505, -0.45644891262054443, -0.42899200320243835, -0.4015350937843323, -0.3740781843662262, -0.3466212749481201, -0.31916436553001404, -0.29170745611190796, -0.2642505466938019, -0.2367936372756958, -0.20933672785758972, -0.18187981843948364, -0.15442290902137756, -0.12696599960327148, -0.0995090901851654, -0.07205218076705933, -0.04459527134895325, -0.017138361930847168, 0.010318547487258911, 0.03777545690536499, 0.06523236632347107, 0.09268927574157715, 0.12014618515968323, 0.1476030945777893, 0.17506000399589539, 0.20251691341400146, 0.22997382283210754, 0.2574307322502136, 0.2848876416683197, 0.3123445510864258, 0.33980146050453186, 0.36725836992263794, 0.394715279340744, 0.4221721887588501, 0.4496290981769562, 0.47708600759506226, 0.5045429468154907, 0.5319998264312744, 0.5594567060470581, 0.5869136452674866, 0.614370584487915, 0.6418274641036987, 0.6692843437194824, 0.6967412829399109, 0.7241982221603394, 0.751655101776123, 0.7791119813919067, 0.8065689206123352, 0.8340258598327637, 0.8614827394485474]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 8.0, 6.0, 13.0, 12.0, 14.0, 11.0, 28.0, 31.0, 46.0, 51.0, 95.0, 104.0, 188.0, 344.0, 632.0, 1300.0, 2996.0, 8244.0, 28976.0, 133211.0, 649523.0, 172133.0, 34390.0, 9691.0, 3287.0, 1421.0, 689.0, 353.0, 253.0, 146.0, 115.0, 68.0, 37.0, 36.0, 26.0, 19.0, 13.0, 11.0, 5.0, 9.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3203125, -0.3098335266113281, -0.29935455322265625, -0.2888755798339844, -0.2783966064453125, -0.2679176330566406, -0.25743865966796875, -0.24695968627929688, -0.236480712890625, -0.22600173950195312, -0.21552276611328125, -0.20504379272460938, -0.1945648193359375, -0.18408584594726562, -0.17360687255859375, -0.16312789916992188, -0.15264892578125, -0.14216995239257812, -0.13169097900390625, -0.12121200561523438, -0.1107330322265625, -0.10025405883789062, -0.08977508544921875, -0.07929611206054688, -0.068817138671875, -0.058338165283203125, -0.04785919189453125, -0.037380218505859375, -0.0269012451171875, -0.016422271728515625, -0.00594329833984375, 0.004535675048828125, 0.0150146484375, 0.025493621826171875, 0.03597259521484375, 0.046451568603515625, 0.0569305419921875, 0.06740951538085938, 0.07788848876953125, 0.08836746215820312, 0.098846435546875, 0.10932540893554688, 0.11980438232421875, 0.13028335571289062, 0.1407623291015625, 0.15124130249023438, 0.16172027587890625, 0.17219924926757812, 0.18267822265625, 0.19315719604492188, 0.20363616943359375, 0.21411514282226562, 0.2245941162109375, 0.23507308959960938, 0.24555206298828125, 0.2560310363769531, 0.266510009765625, 0.2769889831542969, 0.28746795654296875, 0.2979469299316406, 0.3084259033203125, 0.3189048767089844, 0.32938385009765625, 0.3398628234863281, 0.350341796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 10.0, 16.0, 13.0, 26.0, 39.0, 56.0, 80.0, 85.0, 86.0, 89.0, 98.0, 87.0, 79.0, 72.0, 46.0, 48.0, 25.0, 19.0, 11.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.1336669921875, -0.13055801391601562, -0.12744903564453125, -0.12434005737304688, -0.1212310791015625, -0.11812210083007812, -0.11501312255859375, -0.11190414428710938, -0.108795166015625, -0.10568618774414062, -0.10257720947265625, -0.09946823120117188, -0.0963592529296875, -0.09325027465820312, -0.09014129638671875, -0.08703231811523438, -0.08392333984375, -0.08081436157226562, -0.07770538330078125, -0.07459640502929688, -0.0714874267578125, -0.06837844848632812, -0.06526947021484375, -0.062160491943359375, -0.059051513671875, -0.055942535400390625, -0.05283355712890625, -0.049724578857421875, -0.0466156005859375, -0.043506622314453125, -0.04039764404296875, -0.037288665771484375, -0.0341796875, -0.031070709228515625, -0.02796173095703125, -0.024852752685546875, -0.0217437744140625, -0.018634796142578125, -0.01552581787109375, -0.012416839599609375, -0.009307861328125, -0.006198883056640625, -0.00308990478515625, 1.9073486328125e-05, 0.0031280517578125, 0.006237030029296875, 0.00934600830078125, 0.012454986572265625, 0.01556396484375, 0.018672943115234375, 0.02178192138671875, 0.024890899658203125, 0.0279998779296875, 0.031108856201171875, 0.03421783447265625, 0.037326812744140625, 0.040435791015625, 0.043544769287109375, 0.04665374755859375, 0.049762725830078125, 0.0528717041015625, 0.055980682373046875, 0.05908966064453125, 0.062198638916015625, 0.0653076171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 5.0, 7.0, 6.0, 11.0, 8.0, 15.0, 22.0, 33.0, 52.0, 96.0, 146.0, 255.0, 550.0, 1055.0, 2386.0, 5832.0, 16030.0, 49560.0, 210255.0, 617609.0, 99529.0, 28097.0, 9850.0, 3808.0, 1677.0, 766.0, 389.0, 194.0, 96.0, 72.0, 44.0, 29.0, 16.0, 15.0, 8.0, 11.0, 5.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2802734375, -0.2699928283691406, -0.25971221923828125, -0.24943161010742188, -0.2391510009765625, -0.22887039184570312, -0.21858978271484375, -0.20830917358398438, -0.198028564453125, -0.18774795532226562, -0.17746734619140625, -0.16718673706054688, -0.1569061279296875, -0.14662551879882812, -0.13634490966796875, -0.12606430053710938, -0.11578369140625, -0.10550308227539062, -0.09522247314453125, -0.08494186401367188, -0.0746612548828125, -0.06438064575195312, -0.05410003662109375, -0.043819427490234375, -0.033538818359375, -0.023258209228515625, -0.01297760009765625, -0.002696990966796875, 0.0075836181640625, 0.017864227294921875, 0.02814483642578125, 0.038425445556640625, 0.0487060546875, 0.058986663818359375, 0.06926727294921875, 0.07954788208007812, 0.0898284912109375, 0.10010910034179688, 0.11038970947265625, 0.12067031860351562, 0.130950927734375, 0.14123153686523438, 0.15151214599609375, 0.16179275512695312, 0.1720733642578125, 0.18235397338867188, 0.19263458251953125, 0.20291519165039062, 0.21319580078125, 0.22347640991210938, 0.23375701904296875, 0.24403762817382812, 0.2543182373046875, 0.2645988464355469, 0.27487945556640625, 0.2851600646972656, 0.295440673828125, 0.3057212829589844, 0.31600189208984375, 0.3262825012207031, 0.3365631103515625, 0.3468437194824219, 0.35712432861328125, 0.3674049377441406, 0.377685546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 5.0, 4.0, 10.0, 8.0, 9.0, 12.0, 14.0, 17.0, 17.0, 34.0, 35.0, 52.0, 33.0, 49.0, 56.0, 56.0, 46.0, 55.0, 58.0, 50.0, 49.0, 49.0, 39.0, 33.0, 41.0, 31.0, 28.0, 16.0, 14.0, 16.0, 14.0, 13.0, 10.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.289306640625, -0.28113555908203125, -0.2729644775390625, -0.26479339599609375, -0.256622314453125, -0.24845123291015625, -0.2402801513671875, -0.23210906982421875, -0.22393798828125, -0.21576690673828125, -0.2075958251953125, -0.19942474365234375, -0.191253662109375, -0.18308258056640625, -0.1749114990234375, -0.16674041748046875, -0.1585693359375, -0.15039825439453125, -0.1422271728515625, -0.13405609130859375, -0.125885009765625, -0.11771392822265625, -0.1095428466796875, -0.10137176513671875, -0.09320068359375, -0.08502960205078125, -0.0768585205078125, -0.06868743896484375, -0.060516357421875, -0.05234527587890625, -0.0441741943359375, -0.03600311279296875, -0.02783203125, -0.01966094970703125, -0.0114898681640625, -0.00331878662109375, 0.004852294921875, 0.01302337646484375, 0.0211944580078125, 0.02936553955078125, 0.03753662109375, 0.04570770263671875, 0.0538787841796875, 0.06204986572265625, 0.070220947265625, 0.07839202880859375, 0.0865631103515625, 0.09473419189453125, 0.1029052734375, 0.11107635498046875, 0.1192474365234375, 0.12741851806640625, 0.135589599609375, 0.14376068115234375, 0.1519317626953125, 0.16010284423828125, 0.16827392578125, 0.17644500732421875, 0.1846160888671875, 0.19278717041015625, 0.200958251953125, 0.20912933349609375, 0.2173004150390625, 0.22547149658203125, 0.233642578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 7.0, 13.0, 17.0, 17.0, 41.0, 69.0, 93.0, 143.0, 189.0, 347.0, 570.0, 1009.0, 2054.0, 4214.0, 9650.0, 25125.0, 87157.0, 679379.0, 173863.0, 38990.0, 13883.0, 5777.0, 2646.0, 1387.0, 746.0, 435.0, 248.0, 147.0, 85.0, 68.0, 50.0, 27.0, 18.0, 26.0, 8.0, 10.0, 7.0, 10.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.072021484375, -0.07000398635864258, -0.06798648834228516, -0.06596899032592773, -0.06395149230957031, -0.06193399429321289, -0.05991649627685547, -0.05789899826049805, -0.055881500244140625, -0.0538640022277832, -0.05184650421142578, -0.04982900619506836, -0.04781150817871094, -0.045794010162353516, -0.043776512145996094, -0.04175901412963867, -0.03974151611328125, -0.03772401809692383, -0.035706520080566406, -0.033689022064208984, -0.03167152404785156, -0.02965402603149414, -0.02763652801513672, -0.025619029998779297, -0.023601531982421875, -0.021584033966064453, -0.01956653594970703, -0.01754903793334961, -0.015531539916992188, -0.013514041900634766, -0.011496543884277344, -0.009479045867919922, -0.0074615478515625, -0.005444049835205078, -0.0034265518188476562, -0.0014090538024902344, 0.0006084442138671875, 0.0026259422302246094, 0.004643440246582031, 0.006660938262939453, 0.008678436279296875, 0.010695934295654297, 0.012713432312011719, 0.01473093032836914, 0.016748428344726562, 0.018765926361083984, 0.020783424377441406, 0.022800922393798828, 0.02481842041015625, 0.026835918426513672, 0.028853416442871094, 0.030870914459228516, 0.03288841247558594, 0.03490591049194336, 0.03692340850830078, 0.0389409065246582, 0.040958404541015625, 0.04297590255737305, 0.04499340057373047, 0.04701089859008789, 0.04902839660644531, 0.051045894622802734, 0.053063392639160156, 0.05508089065551758, 0.057098388671875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 6.0, 2.0, 6.0, 5.0, 12.0, 12.0, 20.0, 17.0, 19.0, 19.0, 37.0, 52.0, 82.0, 163.0, 204.0, 93.0, 55.0, 40.0, 27.0, 29.0, 15.0, 29.0, 8.0, 15.0, 6.0, 6.0, 9.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00019073486328125, -0.00018532201647758484, -0.00017990916967391968, -0.00017449632287025452, -0.00016908347606658936, -0.0001636706292629242, -0.00015825778245925903, -0.00015284493565559387, -0.0001474320888519287, -0.00014201924204826355, -0.0001366063952445984, -0.00013119354844093323, -0.00012578070163726807, -0.0001203678548336029, -0.00011495500802993774, -0.00010954216122627258, -0.00010412931442260742, -9.871646761894226e-05, -9.33036208152771e-05, -8.789077401161194e-05, -8.247792720794678e-05, -7.706508040428162e-05, -7.165223360061646e-05, -6.62393867969513e-05, -6.082653999328613e-05, -5.541369318962097e-05, -5.000084638595581e-05, -4.458799958229065e-05, -3.917515277862549e-05, -3.376230597496033e-05, -2.8349459171295166e-05, -2.2936612367630005e-05, -1.7523765563964844e-05, -1.2110918760299683e-05, -6.6980719566345215e-06, -1.2852251529693604e-06, 4.127621650695801e-06, 9.540468454360962e-06, 1.4953315258026123e-05, 2.0366162061691284e-05, 2.5779008865356445e-05, 3.1191855669021606e-05, 3.660470247268677e-05, 4.201754927635193e-05, 4.743039608001709e-05, 5.284324288368225e-05, 5.825608968734741e-05, 6.366893649101257e-05, 6.908178329467773e-05, 7.44946300983429e-05, 7.990747690200806e-05, 8.532032370567322e-05, 9.073317050933838e-05, 9.614601731300354e-05, 0.0001015588641166687, 0.00010697171092033386, 0.00011238455772399902, 0.00011779740452766418, 0.00012321025133132935, 0.0001286230981349945, 0.00013403594493865967, 0.00013944879174232483, 0.00014486163854599, 0.00015027448534965515, 0.0001556873321533203]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 6.0, 6.0, 7.0, 18.0, 14.0, 39.0, 52.0, 104.0, 221.0, 441.0, 1131.0, 2886.0, 9045.0, 39179.0, 327133.0, 603826.0, 48077.0, 10813.0, 3276.0, 1232.0, 526.0, 244.0, 114.0, 58.0, 39.0, 11.0, 14.0, 11.0, 5.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05743408203125, -0.055230140686035156, -0.05302619934082031, -0.05082225799560547, -0.048618316650390625, -0.04641437530517578, -0.04421043395996094, -0.042006492614746094, -0.03980255126953125, -0.037598609924316406, -0.03539466857910156, -0.03319072723388672, -0.030986785888671875, -0.02878284454345703, -0.026578903198242188, -0.024374961853027344, -0.0221710205078125, -0.019967079162597656, -0.017763137817382812, -0.015559196472167969, -0.013355255126953125, -0.011151313781738281, -0.008947372436523438, -0.006743431091308594, -0.00453948974609375, -0.0023355484008789062, -0.0001316070556640625, 0.0020723342895507812, 0.004276275634765625, 0.006480216979980469, 0.008684158325195312, 0.010888099670410156, 0.013092041015625, 0.015295982360839844, 0.017499923706054688, 0.01970386505126953, 0.021907806396484375, 0.02411174774169922, 0.026315689086914062, 0.028519630432128906, 0.03072357177734375, 0.032927513122558594, 0.03513145446777344, 0.03733539581298828, 0.039539337158203125, 0.04174327850341797, 0.04394721984863281, 0.046151161193847656, 0.0483551025390625, 0.050559043884277344, 0.05276298522949219, 0.05496692657470703, 0.057170867919921875, 0.05937480926513672, 0.06157875061035156, 0.0637826919555664, 0.06598663330078125, 0.0681905746459961, 0.07039451599121094, 0.07259845733642578, 0.07480239868164062, 0.07700634002685547, 0.07921028137207031, 0.08141422271728516, 0.0836181640625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 9.0, 6.0, 7.0, 12.0, 19.0, 21.0, 20.0, 33.0, 34.0, 56.0, 63.0, 65.0, 84.0, 108.0, 100.0, 77.0, 59.0, 48.0, 45.0, 33.0, 22.0, 21.0, 11.0, 11.0, 11.0, 3.0, 3.0, 3.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05462646484375, -0.05313301086425781, -0.051639556884765625, -0.05014610290527344, -0.04865264892578125, -0.04715919494628906, -0.045665740966796875, -0.04417228698730469, -0.0426788330078125, -0.04118537902832031, -0.039691925048828125, -0.03819847106933594, -0.03670501708984375, -0.03521156311035156, -0.033718109130859375, -0.03222465515136719, -0.030731201171875, -0.029237747192382812, -0.027744293212890625, -0.026250839233398438, -0.02475738525390625, -0.023263931274414062, -0.021770477294921875, -0.020277023315429688, -0.0187835693359375, -0.017290115356445312, -0.015796661376953125, -0.014303207397460938, -0.01280975341796875, -0.011316299438476562, -0.009822845458984375, -0.008329391479492188, -0.0068359375, -0.0053424835205078125, -0.003849029541015625, -0.0023555755615234375, -0.00086212158203125, 0.0006313323974609375, 0.002124786376953125, 0.0036182403564453125, 0.0051116943359375, 0.0066051483154296875, 0.008098602294921875, 0.009592056274414062, 0.01108551025390625, 0.012578964233398438, 0.014072418212890625, 0.015565872192382812, 0.017059326171875, 0.018552780151367188, 0.020046234130859375, 0.021539688110351562, 0.02303314208984375, 0.024526596069335938, 0.026020050048828125, 0.027513504028320312, 0.0290069580078125, 0.030500411987304688, 0.031993865966796875, 0.03348731994628906, 0.03498077392578125, 0.03647422790527344, 0.037967681884765625, 0.03946113586425781, 0.04095458984375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 8.0, 12.0, 10.0, 20.0, 15.0, 24.0, 40.0, 43.0, 56.0, 78.0, 121.0, 198.0, 108.0, 66.0, 45.0, 30.0, 30.0, 12.0, 13.0, 9.0, 8.0, 7.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.693743348121643, -1.6537140607833862, -1.6136847734451294, -1.5736554861068726, -1.5336263179779053, -1.4935970306396484, -1.4535677433013916, -1.4135384559631348, -1.373509168624878, -1.333479881286621, -1.2934505939483643, -1.2534213066101074, -1.2133920192718506, -1.1733628511428833, -1.1333335638046265, -1.0933042764663696, -1.0532749891281128, -1.013245701789856, -0.9732164144515991, -0.9331871867179871, -0.8931578993797302, -0.8531286120414734, -0.8130993843078613, -0.7730700969696045, -0.7330408096313477, -0.6930115222930908, -0.652982234954834, -0.6129530072212219, -0.5729237198829651, -0.5328944325447083, -0.4928651750087738, -0.45283591747283936, -0.41280651092529297, -0.37277722358703613, -0.3327479660511017, -0.29271870851516724, -0.2526894211769104, -0.21266014873981476, -0.17263087630271912, -0.13260161876678467, -0.09257233142852783, -0.05254305899143219, -0.012513786554336548, 0.027515485882759094, 0.06754475831985474, 0.10757403075695038, 0.14760330319404602, 0.18763256072998047, 0.2276618480682373, 0.26769113540649414, 0.3077203929424286, 0.34774965047836304, 0.3877789378166199, 0.4278082251548767, 0.46783748269081116, 0.5078667402267456, 0.5478960275650024, 0.5879253149032593, 0.6279546022415161, 0.6679838299751282, 0.708013117313385, 0.7480424046516418, 0.7880716323852539, 0.8281009197235107, 0.8681302070617676]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 12.0, 7.0, 8.0, 13.0, 8.0, 10.0, 19.0, 17.0, 18.0, 35.0, 29.0, 29.0, 22.0, 40.0, 45.0, 45.0, 75.0, 66.0, 70.0, 52.0, 55.0, 40.0, 30.0, 38.0, 17.0, 44.0, 18.0, 24.0, 17.0, 18.0, 16.0, 7.0, 9.0, 11.0, 8.0, 10.0, 2.0, 2.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.864099383354187, -0.8332605361938477, -0.8024216890335083, -0.771582841873169, -0.7407439947128296, -0.7099051475524902, -0.6790663003921509, -0.6482274532318115, -0.6173886060714722, -0.5865497589111328, -0.5557109117507935, -0.5248720645904541, -0.49403321743011475, -0.4631943702697754, -0.43235552310943604, -0.4015166759490967, -0.37067779898643494, -0.3398389518260956, -0.3090001046657562, -0.27816125750541687, -0.24732241034507751, -0.21648354828357697, -0.1856447011232376, -0.15480585396289825, -0.1239670068025589, -0.09312815964221954, -0.06228930875658989, -0.031450457870960236, -0.0006116107106208801, 0.030227243900299072, 0.06106609106063843, 0.09190493822097778, 0.12274378538131714, 0.1535826325416565, 0.18442147970199585, 0.2152603268623352, 0.24609917402267456, 0.2769380211830139, 0.30777686834335327, 0.3386157155036926, 0.369454562664032, 0.40029340982437134, 0.4311322569847107, 0.46197110414505005, 0.4928099513053894, 0.5236487984657288, 0.5544876456260681, 0.5853264927864075, 0.6161653995513916, 0.647004246711731, 0.6778430938720703, 0.7086819410324097, 0.739520788192749, 0.7703596353530884, 0.8011984825134277, 0.8320373296737671, 0.8628761768341064, 0.8937150239944458, 0.9245538711547852, 0.9553927183151245, 0.9862315654754639, 1.0170704126358032, 1.0479092597961426, 1.078748106956482, 1.1095869541168213]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 8.0, 11.0, 16.0, 16.0, 24.0, 38.0, 48.0, 81.0, 130.0, 197.0, 381.0, 742.0, 1788.0, 5765.0, 29724.0, 1792447.0, 2321402.0, 31364.0, 6276.0, 2018.0, 857.0, 412.0, 195.0, 130.0, 75.0, 40.0, 28.0, 21.0, 12.0, 6.0, 5.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.5234375, -0.5112686157226562, -0.4990997314453125, -0.48693084716796875, -0.474761962890625, -0.46259307861328125, -0.4504241943359375, -0.43825531005859375, -0.42608642578125, -0.41391754150390625, -0.4017486572265625, -0.38957977294921875, -0.377410888671875, -0.36524200439453125, -0.3530731201171875, -0.34090423583984375, -0.3287353515625, -0.31656646728515625, -0.3043975830078125, -0.29222869873046875, -0.280059814453125, -0.26789093017578125, -0.2557220458984375, -0.24355316162109375, -0.23138427734375, -0.21921539306640625, -0.2070465087890625, -0.19487762451171875, -0.182708740234375, -0.17053985595703125, -0.1583709716796875, -0.14620208740234375, -0.134033203125, -0.12186431884765625, -0.1096954345703125, -0.09752655029296875, -0.085357666015625, -0.07318878173828125, -0.0610198974609375, -0.04885101318359375, -0.03668212890625, -0.02451324462890625, -0.0123443603515625, -0.00017547607421875, 0.011993408203125, 0.02416229248046875, 0.0363311767578125, 0.04850006103515625, 0.0606689453125, 0.07283782958984375, 0.0850067138671875, 0.09717559814453125, 0.109344482421875, 0.12151336669921875, 0.1336822509765625, 0.14585113525390625, 0.15802001953125, 0.17018890380859375, 0.1823577880859375, 0.19452667236328125, 0.206695556640625, 0.21886444091796875, 0.2310333251953125, 0.24320220947265625, 0.25537109375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 10.0, 13.0, 20.0, 36.0, 33.0, 67.0, 75.0, 88.0, 101.0, 101.0, 93.0, 99.0, 82.0, 64.0, 30.0, 39.0, 14.0, 14.0, 12.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1317138671875, -0.1286182403564453, -0.12552261352539062, -0.12242698669433594, -0.11933135986328125, -0.11623573303222656, -0.11314010620117188, -0.11004447937011719, -0.1069488525390625, -0.10385322570800781, -0.10075759887695312, -0.09766197204589844, -0.09456634521484375, -0.09147071838378906, -0.08837509155273438, -0.08527946472167969, -0.082183837890625, -0.07908821105957031, -0.07599258422851562, -0.07289695739746094, -0.06980133056640625, -0.06670570373535156, -0.06361007690429688, -0.06051445007324219, -0.0574188232421875, -0.05432319641113281, -0.051227569580078125, -0.04813194274902344, -0.04503631591796875, -0.04194068908691406, -0.038845062255859375, -0.03574943542480469, -0.03265380859375, -0.029558181762695312, -0.026462554931640625, -0.023366928100585938, -0.02027130126953125, -0.017175674438476562, -0.014080047607421875, -0.010984420776367188, -0.0078887939453125, -0.0047931671142578125, -0.001697540283203125, 0.0013980865478515625, 0.00449371337890625, 0.0075893402099609375, 0.010684967041015625, 0.013780593872070312, 0.016876220703125, 0.019971847534179688, 0.023067474365234375, 0.026163101196289062, 0.02925872802734375, 0.03235435485839844, 0.035449981689453125, 0.03854560852050781, 0.0416412353515625, 0.04473686218261719, 0.047832489013671875, 0.05092811584472656, 0.05402374267578125, 0.05711936950683594, 0.060214996337890625, 0.06331062316894531, 0.06640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 8.0, 12.0, 13.0, 27.0, 48.0, 49.0, 74.0, 87.0, 164.0, 223.0, 400.0, 783.0, 1738.0, 5098.0, 22108.0, 216899.0, 3839629.0, 87458.0, 12489.0, 3437.0, 1388.0, 730.0, 435.0, 302.0, 183.0, 149.0, 96.0, 74.0, 45.0, 31.0, 28.0, 22.0, 17.0, 13.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.310546875, -0.29779052734375, -0.2850341796875, -0.27227783203125, -0.259521484375, -0.24676513671875, -0.2340087890625, -0.22125244140625, -0.20849609375, -0.19573974609375, -0.1829833984375, -0.17022705078125, -0.157470703125, -0.14471435546875, -0.1319580078125, -0.11920166015625, -0.1064453125, -0.09368896484375, -0.0809326171875, -0.06817626953125, -0.055419921875, -0.04266357421875, -0.0299072265625, -0.01715087890625, -0.00439453125, 0.00836181640625, 0.0211181640625, 0.03387451171875, 0.046630859375, 0.05938720703125, 0.0721435546875, 0.08489990234375, 0.09765625, 0.11041259765625, 0.1231689453125, 0.13592529296875, 0.148681640625, 0.16143798828125, 0.1741943359375, 0.18695068359375, 0.19970703125, 0.21246337890625, 0.2252197265625, 0.23797607421875, 0.250732421875, 0.26348876953125, 0.2762451171875, 0.28900146484375, 0.3017578125, 0.31451416015625, 0.3272705078125, 0.34002685546875, 0.352783203125, 0.36553955078125, 0.3782958984375, 0.39105224609375, 0.40380859375, 0.41656494140625, 0.4293212890625, 0.44207763671875, 0.454833984375, 0.46759033203125, 0.4803466796875, 0.49310302734375, 0.505859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 9.0, 8.0, 9.0, 16.0, 20.0, 29.0, 37.0, 55.0, 107.0, 162.0, 437.0, 1875.0, 834.0, 194.0, 99.0, 63.0, 35.0, 26.0, 20.0, 10.0, 12.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.177978515625, -0.16790390014648438, -0.15782928466796875, -0.14775466918945312, -0.1376800537109375, -0.12760543823242188, -0.11753082275390625, -0.10745620727539062, -0.097381591796875, -0.08730697631835938, -0.07723236083984375, -0.06715774536132812, -0.0570831298828125, -0.047008514404296875, -0.03693389892578125, -0.026859283447265625, -0.01678466796875, -0.006710052490234375, 0.00336456298828125, 0.013439178466796875, 0.0235137939453125, 0.033588409423828125, 0.04366302490234375, 0.053737640380859375, 0.063812255859375, 0.07388687133789062, 0.08396148681640625, 0.09403610229492188, 0.1041107177734375, 0.11418533325195312, 0.12425994873046875, 0.13433456420898438, 0.1444091796875, 0.15448379516601562, 0.16455841064453125, 0.17463302612304688, 0.1847076416015625, 0.19478225708007812, 0.20485687255859375, 0.21493148803710938, 0.225006103515625, 0.23508071899414062, 0.24515533447265625, 0.2552299499511719, 0.2653045654296875, 0.2753791809082031, 0.28545379638671875, 0.2955284118652344, 0.30560302734375, 0.3156776428222656, 0.32575225830078125, 0.3358268737792969, 0.3459014892578125, 0.3559761047363281, 0.36605072021484375, 0.3761253356933594, 0.386199951171875, 0.3962745666503906, 0.40634918212890625, 0.4164237976074219, 0.4264984130859375, 0.4365730285644531, 0.44664764404296875, 0.4567222595214844, 0.466796875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 10.0, 10.0, 33.0, 41.0, 92.0, 157.0, 266.0, 190.0, 103.0, 43.0, 25.0, 18.0, 9.0, 6.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.710350513458252, -4.585576057434082, -4.460801601409912, -4.336026668548584, -4.211252212524414, -4.086477756500244, -3.961703300476074, -3.8369288444519043, -3.7121541500091553, -3.5873796939849854, -3.4626049995422363, -3.3378305435180664, -3.2130560874938965, -3.0882813930511475, -2.9635069370269775, -2.8387322425842285, -2.7139577865600586, -2.5891833305358887, -2.4644086360931396, -2.3396341800689697, -2.2148594856262207, -2.090085029602051, -1.9653105735778809, -1.8405359983444214, -1.715761423110962, -1.5909868478775024, -1.466212272644043, -1.341437816619873, -1.2166632413864136, -1.091888666152954, -0.9671141505241394, -0.8423396348953247, -0.7175650596618652, -0.5927904844284058, -0.46801596879959106, -0.343241423368454, -0.2184668779373169, -0.09369230270385742, 0.031082212924957275, 0.15585672855377197, 0.28063130378723145, 0.40540584921836853, 0.5301803946495056, 0.6549549102783203, 0.7797294855117798, 0.9045040607452393, 1.0292785167694092, 1.1540530920028687, 1.2788276672363281, 1.4036022424697876, 1.528376817703247, 1.653151273727417, 1.7779258489608765, 1.902700424194336, 2.027474880218506, 2.152249336242676, 2.277024030685425, 2.4017984867095947, 2.5265731811523438, 2.6513476371765137, 2.7761220932006836, 2.9008967876434326, 3.0256712436676025, 3.1504459381103516, 3.2752203941345215]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 3.0, 6.0, 2.0, 12.0, 18.0, 19.0, 27.0, 35.0, 51.0, 45.0, 47.0, 49.0, 65.0, 68.0, 60.0, 72.0, 62.0, 70.0, 53.0, 45.0, 35.0, 37.0, 30.0, 17.0, 16.0, 17.0, 12.0, 14.0, 7.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.3712878227233887, -2.3168811798095703, -2.262474298477173, -2.2080676555633545, -2.153660774230957, -2.0992541313171387, -2.044847249984741, -1.9904404878616333, -1.9360337257385254, -1.8816269636154175, -1.8272202014923096, -1.7728134393692017, -1.7184066772460938, -1.6639999151229858, -1.609593152999878, -1.55518639087677, -1.500779628753662, -1.4463728666305542, -1.3919661045074463, -1.3375593423843384, -1.2831525802612305, -1.2287458181381226, -1.1743390560150146, -1.1199322938919067, -1.0655256509780884, -1.0111188888549805, -0.9567121267318726, -0.9023053646087646, -0.8478986024856567, -0.7934918403625488, -0.7390850782394409, -0.684678316116333, -0.6302715539932251, -0.5758647918701172, -0.5214580297470093, -0.46705126762390137, -0.41264450550079346, -0.35823777318000793, -0.3038310110569, -0.24942424893379211, -0.1950174868106842, -0.1406107246875763, -0.08620397001504898, -0.03179721534252167, 0.022609546780586243, 0.07701629400253296, 0.13142305612564087, 0.18582981824874878, 0.2402365803718567, 0.2946433424949646, 0.3490501046180725, 0.4034568667411804, 0.45786362886428833, 0.5122703313827515, 0.5666770935058594, 0.6210838556289673, 0.6754906177520752, 0.7298973798751831, 0.784304141998291, 0.8387109041213989, 0.8931176662445068, 0.9475244283676147, 1.0019311904907227, 1.0563379526138306, 1.1107447147369385]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 9.0, 8.0, 13.0, 25.0, 23.0, 35.0, 60.0, 92.0, 125.0, 213.0, 408.0, 769.0, 1847.0, 5049.0, 16718.0, 74391.0, 617426.0, 272411.0, 42004.0, 10564.0, 3472.0, 1396.0, 644.0, 363.0, 166.0, 107.0, 68.0, 57.0, 27.0, 16.0, 13.0, 5.0, 6.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.76953125, -0.7460861206054688, -0.7226409912109375, -0.6991958618164062, -0.675750732421875, -0.6523056030273438, -0.6288604736328125, -0.6054153442382812, -0.58197021484375, -0.5585250854492188, -0.5350799560546875, -0.5116348266601562, -0.488189697265625, -0.46474456787109375, -0.4412994384765625, -0.41785430908203125, -0.3944091796875, -0.37096405029296875, -0.3475189208984375, -0.32407379150390625, -0.300628662109375, -0.27718353271484375, -0.2537384033203125, -0.23029327392578125, -0.20684814453125, -0.18340301513671875, -0.1599578857421875, -0.13651275634765625, -0.113067626953125, -0.08962249755859375, -0.0661773681640625, -0.04273223876953125, -0.019287109375, 0.00415802001953125, 0.0276031494140625, 0.05104827880859375, 0.074493408203125, 0.09793853759765625, 0.1213836669921875, 0.14482879638671875, 0.16827392578125, 0.19171905517578125, 0.2151641845703125, 0.23860931396484375, 0.262054443359375, 0.28549957275390625, 0.3089447021484375, 0.33238983154296875, 0.3558349609375, 0.37928009033203125, 0.4027252197265625, 0.42617034912109375, 0.449615478515625, 0.47306060791015625, 0.4965057373046875, 0.5199508666992188, 0.54339599609375, 0.5668411254882812, 0.5902862548828125, 0.6137313842773438, 0.637176513671875, 0.6606216430664062, 0.6840667724609375, 0.7075119018554688, 0.73095703125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 8.0, 7.0, 11.0, 18.0, 21.0, 29.0, 35.0, 57.0, 49.0, 69.0, 65.0, 80.0, 95.0, 72.0, 60.0, 70.0, 64.0, 48.0, 40.0, 35.0, 21.0, 15.0, 8.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1334228515625, -0.13029098510742188, -0.12715911865234375, -0.12402725219726562, -0.1208953857421875, -0.11776351928710938, -0.11463165283203125, -0.11149978637695312, -0.108367919921875, -0.10523605346679688, -0.10210418701171875, -0.09897232055664062, -0.0958404541015625, -0.09270858764648438, -0.08957672119140625, -0.08644485473632812, -0.08331298828125, -0.08018112182617188, -0.07704925537109375, -0.07391738891601562, -0.0707855224609375, -0.06765365600585938, -0.06452178955078125, -0.061389923095703125, -0.058258056640625, -0.055126190185546875, -0.05199432373046875, -0.048862457275390625, -0.0457305908203125, -0.042598724365234375, -0.03946685791015625, -0.036334991455078125, -0.033203125, -0.030071258544921875, -0.02693939208984375, -0.023807525634765625, -0.0206756591796875, -0.017543792724609375, -0.01441192626953125, -0.011280059814453125, -0.008148193359375, -0.005016326904296875, -0.00188446044921875, 0.001247406005859375, 0.0043792724609375, 0.007511138916015625, 0.01064300537109375, 0.013774871826171875, 0.01690673828125, 0.020038604736328125, 0.02317047119140625, 0.026302337646484375, 0.0294342041015625, 0.032566070556640625, 0.03569793701171875, 0.038829803466796875, 0.041961669921875, 0.045093536376953125, 0.04822540283203125, 0.051357269287109375, 0.0544891357421875, 0.057621002197265625, 0.06075286865234375, 0.06388473510742188, 0.0670166015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 1.0, 7.0, 7.0, 11.0, 20.0, 36.0, 63.0, 112.0, 234.0, 465.0, 1136.0, 3294.0, 10379.0, 42559.0, 589037.0, 347984.0, 38674.0, 9509.0, 2953.0, 1124.0, 478.0, 214.0, 114.0, 56.0, 34.0, 20.0, 16.0, 8.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8642578125, -0.8431625366210938, -0.8220672607421875, -0.8009719848632812, -0.779876708984375, -0.7587814331054688, -0.7376861572265625, -0.7165908813476562, -0.69549560546875, -0.6744003295898438, -0.6533050537109375, -0.6322097778320312, -0.611114501953125, -0.5900192260742188, -0.5689239501953125, -0.5478286743164062, -0.5267333984375, -0.5056381225585938, -0.4845428466796875, -0.46344757080078125, -0.442352294921875, -0.42125701904296875, -0.4001617431640625, -0.37906646728515625, -0.35797119140625, -0.33687591552734375, -0.3157806396484375, -0.29468536376953125, -0.273590087890625, -0.25249481201171875, -0.2313995361328125, -0.21030426025390625, -0.189208984375, -0.16811370849609375, -0.1470184326171875, -0.12592315673828125, -0.104827880859375, -0.08373260498046875, -0.0626373291015625, -0.04154205322265625, -0.02044677734375, 0.00064849853515625, 0.0217437744140625, 0.04283905029296875, 0.063934326171875, 0.08502960205078125, 0.1061248779296875, 0.12722015380859375, 0.1483154296875, 0.16941070556640625, 0.1905059814453125, 0.21160125732421875, 0.232696533203125, 0.25379180908203125, 0.2748870849609375, 0.29598236083984375, 0.31707763671875, 0.33817291259765625, 0.3592681884765625, 0.38036346435546875, 0.401458740234375, 0.42255401611328125, 0.4436492919921875, 0.46474456787109375, 0.48583984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 13.0, 10.0, 14.0, 14.0, 16.0, 34.0, 36.0, 50.0, 59.0, 67.0, 85.0, 97.0, 85.0, 81.0, 71.0, 57.0, 63.0, 31.0, 38.0, 26.0, 20.0, 12.0, 6.0, 5.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.56103515625, -0.5469741821289062, -0.5329132080078125, -0.5188522338867188, -0.504791259765625, -0.49073028564453125, -0.4766693115234375, -0.46260833740234375, -0.44854736328125, -0.43448638916015625, -0.4204254150390625, -0.40636444091796875, -0.392303466796875, -0.37824249267578125, -0.3641815185546875, -0.35012054443359375, -0.3360595703125, -0.32199859619140625, -0.3079376220703125, -0.29387664794921875, -0.279815673828125, -0.26575469970703125, -0.2516937255859375, -0.23763275146484375, -0.22357177734375, -0.20951080322265625, -0.1954498291015625, -0.18138885498046875, -0.167327880859375, -0.15326690673828125, -0.1392059326171875, -0.12514495849609375, -0.111083984375, -0.09702301025390625, -0.0829620361328125, -0.06890106201171875, -0.054840087890625, -0.04077911376953125, -0.0267181396484375, -0.01265716552734375, 0.00140380859375, 0.01546478271484375, 0.0295257568359375, 0.04358673095703125, 0.057647705078125, 0.07170867919921875, 0.0857696533203125, 0.09983062744140625, 0.1138916015625, 0.12795257568359375, 0.1420135498046875, 0.15607452392578125, 0.170135498046875, 0.18419647216796875, 0.1982574462890625, 0.21231842041015625, 0.22637939453125, 0.24044036865234375, 0.2545013427734375, 0.26856231689453125, 0.282623291015625, 0.29668426513671875, 0.3107452392578125, 0.32480621337890625, 0.3388671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 9.0, 13.0, 27.0, 21.0, 32.0, 51.0, 70.0, 117.0, 147.0, 283.0, 438.0, 795.0, 1621.0, 4031.0, 17222.0, 274971.0, 716161.0, 23524.0, 4944.0, 1826.0, 905.0, 485.0, 295.0, 186.0, 111.0, 76.0, 56.0, 33.0, 25.0, 14.0, 16.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.171142578125, -0.1661205291748047, -0.16109848022460938, -0.15607643127441406, -0.15105438232421875, -0.14603233337402344, -0.14101028442382812, -0.1359882354736328, -0.1309661865234375, -0.1259441375732422, -0.12092208862304688, -0.11590003967285156, -0.11087799072265625, -0.10585594177246094, -0.10083389282226562, -0.09581184387207031, -0.090789794921875, -0.08576774597167969, -0.08074569702148438, -0.07572364807128906, -0.07070159912109375, -0.06567955017089844, -0.060657501220703125, -0.05563545227050781, -0.0506134033203125, -0.04559135437011719, -0.040569305419921875, -0.03554725646972656, -0.03052520751953125, -0.025503158569335938, -0.020481109619140625, -0.015459060668945312, -0.01043701171875, -0.0054149627685546875, -0.000392913818359375, 0.0046291351318359375, 0.00965118408203125, 0.014673233032226562, 0.019695281982421875, 0.024717330932617188, 0.0297393798828125, 0.03476142883300781, 0.039783477783203125, 0.04480552673339844, 0.04982757568359375, 0.05484962463378906, 0.059871673583984375, 0.06489372253417969, 0.069915771484375, 0.07493782043457031, 0.07995986938476562, 0.08498191833496094, 0.09000396728515625, 0.09502601623535156, 0.10004806518554688, 0.10507011413574219, 0.1100921630859375, 0.11511421203613281, 0.12013626098632812, 0.12515830993652344, 0.13018035888671875, 0.13520240783691406, 0.14022445678710938, 0.1452465057373047, 0.1502685546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 0.0, 3.0, 5.0, 2.0, 4.0, 6.0, 8.0, 16.0, 10.0, 15.0, 18.0, 18.0, 26.0, 37.0, 60.0, 76.0, 115.0, 168.0, 121.0, 74.0, 53.0, 26.0, 19.0, 20.0, 15.0, 11.0, 9.0, 15.0, 8.0, 5.0, 5.0, 3.0, 6.0, 1.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0003180503845214844, -0.00030934810638427734, -0.0003006458282470703, -0.0002919435501098633, -0.00028324127197265625, -0.0002745389938354492, -0.0002658367156982422, -0.00025713443756103516, -0.0002484321594238281, -0.0002397298812866211, -0.00023102760314941406, -0.00022232532501220703, -0.000213623046875, -0.00020492076873779297, -0.00019621849060058594, -0.0001875162124633789, -0.00017881393432617188, -0.00017011165618896484, -0.0001614093780517578, -0.00015270709991455078, -0.00014400482177734375, -0.00013530254364013672, -0.0001266002655029297, -0.00011789798736572266, -0.00010919570922851562, -0.0001004934310913086, -9.179115295410156e-05, -8.308887481689453e-05, -7.43865966796875e-05, -6.568431854248047e-05, -5.698204040527344e-05, -4.8279762268066406e-05, -3.9577484130859375e-05, -3.0875205993652344e-05, -2.2172927856445312e-05, -1.3470649719238281e-05, -4.76837158203125e-06, 3.933906555175781e-06, 1.2636184692382812e-05, 2.1338462829589844e-05, 3.0040740966796875e-05, 3.8743019104003906e-05, 4.744529724121094e-05, 5.614757537841797e-05, 6.4849853515625e-05, 7.355213165283203e-05, 8.225440979003906e-05, 9.09566879272461e-05, 9.965896606445312e-05, 0.00010836124420166016, 0.00011706352233886719, 0.00012576580047607422, 0.00013446807861328125, 0.00014317035675048828, 0.0001518726348876953, 0.00016057491302490234, 0.00016927719116210938, 0.0001779794692993164, 0.00018668174743652344, 0.00019538402557373047, 0.0002040863037109375, 0.00021278858184814453, 0.00022149085998535156, 0.0002301931381225586, 0.00023889541625976562]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 9.0, 6.0, 6.0, 6.0, 12.0, 13.0, 24.0, 32.0, 69.0, 85.0, 119.0, 211.0, 334.0, 632.0, 1188.0, 2323.0, 4939.0, 11748.0, 35874.0, 178759.0, 699847.0, 76750.0, 20680.0, 7688.0, 3323.0, 1709.0, 918.0, 493.0, 292.0, 164.0, 106.0, 67.0, 31.0, 39.0, 23.0, 10.0, 10.0, 10.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06988525390625, -0.06757640838623047, -0.06526756286621094, -0.0629587173461914, -0.060649871826171875, -0.058341026306152344, -0.05603218078613281, -0.05372333526611328, -0.05141448974609375, -0.04910564422607422, -0.04679679870605469, -0.044487953186035156, -0.042179107666015625, -0.039870262145996094, -0.03756141662597656, -0.03525257110595703, -0.0329437255859375, -0.03063488006591797, -0.028326034545898438, -0.026017189025878906, -0.023708343505859375, -0.021399497985839844, -0.019090652465820312, -0.01678180694580078, -0.01447296142578125, -0.012164115905761719, -0.009855270385742188, -0.007546424865722656, -0.005237579345703125, -0.0029287338256835938, -0.0006198883056640625, 0.0016889572143554688, 0.003997802734375, 0.006306648254394531, 0.008615493774414062, 0.010924339294433594, 0.013233184814453125, 0.015542030334472656, 0.017850875854492188, 0.02015972137451172, 0.02246856689453125, 0.02477741241455078, 0.027086257934570312, 0.029395103454589844, 0.031703948974609375, 0.034012794494628906, 0.03632164001464844, 0.03863048553466797, 0.0409393310546875, 0.04324817657470703, 0.04555702209472656, 0.047865867614746094, 0.050174713134765625, 0.052483558654785156, 0.05479240417480469, 0.05710124969482422, 0.05941009521484375, 0.06171894073486328, 0.06402778625488281, 0.06633663177490234, 0.06864547729492188, 0.0709543228149414, 0.07326316833496094, 0.07557201385498047, 0.077880859375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 2.0, 5.0, 11.0, 8.0, 8.0, 14.0, 13.0, 30.0, 39.0, 49.0, 57.0, 78.0, 92.0, 97.0, 112.0, 83.0, 67.0, 57.0, 44.0, 33.0, 17.0, 23.0, 13.0, 5.0, 10.0, 4.0, 6.0, 0.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0567626953125, -0.054986000061035156, -0.05320930480957031, -0.05143260955810547, -0.049655914306640625, -0.04787921905517578, -0.04610252380371094, -0.044325828552246094, -0.04254913330078125, -0.040772438049316406, -0.03899574279785156, -0.03721904754638672, -0.035442352294921875, -0.03366565704345703, -0.03188896179199219, -0.030112266540527344, -0.0283355712890625, -0.026558876037597656, -0.024782180786132812, -0.02300548553466797, -0.021228790283203125, -0.01945209503173828, -0.017675399780273438, -0.015898704528808594, -0.01412200927734375, -0.012345314025878906, -0.010568618774414062, -0.008791923522949219, -0.007015228271484375, -0.005238533020019531, -0.0034618377685546875, -0.0016851425170898438, 9.1552734375e-05, 0.0018682479858398438, 0.0036449432373046875, 0.005421638488769531, 0.007198333740234375, 0.008975028991699219, 0.010751724243164062, 0.012528419494628906, 0.01430511474609375, 0.016081809997558594, 0.017858505249023438, 0.01963520050048828, 0.021411895751953125, 0.02318859100341797, 0.024965286254882812, 0.026741981506347656, 0.0285186767578125, 0.030295372009277344, 0.03207206726074219, 0.03384876251220703, 0.035625457763671875, 0.03740215301513672, 0.03917884826660156, 0.040955543518066406, 0.04273223876953125, 0.044508934020996094, 0.04628562927246094, 0.04806232452392578, 0.049839019775390625, 0.05161571502685547, 0.05339241027832031, 0.055169105529785156, 0.05694580078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 10.0, 21.0, 16.0, 49.0, 91.0, 191.0, 259.0, 123.0, 68.0, 38.0, 35.0, 20.0, 14.0, 19.0, 10.0, 9.0, 8.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.241309404373169, -1.1639025211334229, -1.0864956378936768, -1.0090887546539307, -0.9316819310188293, -0.8542750477790833, -0.7768682241439819, -0.6994613409042358, -0.6220544576644897, -0.5446475744247437, -0.46724072098731995, -0.38983386754989624, -0.31242698431015015, -0.23502010107040405, -0.15761324763298035, -0.08020639419555664, -0.002799510955810547, 0.07460735738277435, 0.15201422572135925, 0.22942109405994415, 0.30682796239852905, 0.38423484563827515, 0.46164169907569885, 0.5390485525131226, 0.6164554357528687, 0.6938623189926147, 0.7712692022323608, 0.8486760258674622, 0.9260829091072083, 1.0034897327423096, 1.0808966159820557, 1.1583034992218018, 1.2357103824615479, 1.313117265701294, 1.39052414894104, 1.4679310321807861, 1.5453379154205322, 1.6227447986602783, 1.7001515626907349, 1.777558445930481, 1.854965329170227, 1.9323722124099731, 2.0097789764404297, 2.087185859680176, 2.164592742919922, 2.241999626159668, 2.319406509399414, 2.39681339263916, 2.4742202758789062, 2.5516271591186523, 2.6290340423583984, 2.7064409255981445, 2.7838478088378906, 2.8612546920776367, 2.938661575317383, 3.016068458557129, 3.093475341796875, 3.170882225036621, 3.248289108276367, 3.3256959915161133, 3.4031028747558594, 3.4805097579956055, 3.5579166412353516, 3.6353235244750977, 3.7127301692962646]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 7.0, 8.0, 15.0, 10.0, 19.0, 19.0, 25.0, 28.0, 41.0, 39.0, 46.0, 31.0, 59.0, 83.0, 91.0, 99.0, 81.0, 40.0, 42.0, 29.0, 28.0, 35.0, 19.0, 27.0, 16.0, 12.0, 9.0, 19.0, 9.0, 5.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9773365259170532, -0.9343498349189758, -0.8913631439208984, -0.8483763933181763, -0.8053897023200989, -0.7624030113220215, -0.7194162607192993, -0.6764295697212219, -0.6334428787231445, -0.5904561877250671, -0.5474694967269897, -0.5044827461242676, -0.4614960551261902, -0.4185093641281128, -0.375522643327713, -0.33253592252731323, -0.28954923152923584, -0.24656252562999725, -0.20357581973075867, -0.16058911383152008, -0.1176024079322815, -0.07461570203304291, -0.03162899613380432, 0.011357724666595459, 0.05434441566467285, 0.09733112156391144, 0.14031782746315002, 0.1833045333623886, 0.2262912392616272, 0.2692779302597046, 0.31226465106010437, 0.35525137186050415, 0.39823806285858154, 0.44122475385665894, 0.4842114746570587, 0.5271981954574585, 0.5701848864555359, 0.6131715774536133, 0.6561583280563354, 0.6991450190544128, 0.7421317100524902, 0.7851184010505676, 0.828105092048645, 0.8710918426513672, 0.9140785336494446, 0.957065224647522, 1.0000519752502441, 1.0430386066436768, 1.086025357246399, 1.129012107849121, 1.1719987392425537, 1.2149854898452759, 1.257972240447998, 1.3009588718414307, 1.3439456224441528, 1.386932373046875, 1.4299190044403076, 1.4729057550430298, 1.5158923864364624, 1.5588791370391846, 1.6018657684326172, 1.6448525190353394, 1.6878392696380615, 1.7308259010314941, 1.7738126516342163]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 4.0, 0.0, 5.0, 8.0, 11.0, 14.0, 20.0, 27.0, 42.0, 58.0, 93.0, 152.0, 221.0, 442.0, 742.0, 1492.0, 3362.0, 13668.0, 275029.0, 3837368.0, 49025.0, 7592.0, 2566.0, 1068.0, 554.0, 253.0, 179.0, 100.0, 48.0, 46.0, 27.0, 21.0, 16.0, 4.0, 5.0, 3.0, 10.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0205078125, -0.99072265625, -0.9609375, -0.93115234375, -0.9013671875, -0.87158203125, -0.841796875, -0.81201171875, -0.7822265625, -0.75244140625, -0.72265625, -0.69287109375, -0.6630859375, -0.63330078125, -0.603515625, -0.57373046875, -0.5439453125, -0.51416015625, -0.484375, -0.45458984375, -0.4248046875, -0.39501953125, -0.365234375, -0.33544921875, -0.3056640625, -0.27587890625, -0.24609375, -0.21630859375, -0.1865234375, -0.15673828125, -0.126953125, -0.09716796875, -0.0673828125, -0.03759765625, -0.0078125, 0.02197265625, 0.0517578125, 0.08154296875, 0.111328125, 0.14111328125, 0.1708984375, 0.20068359375, 0.23046875, 0.26025390625, 0.2900390625, 0.31982421875, 0.349609375, 0.37939453125, 0.4091796875, 0.43896484375, 0.46875, 0.49853515625, 0.5283203125, 0.55810546875, 0.587890625, 0.61767578125, 0.6474609375, 0.67724609375, 0.70703125, 0.73681640625, 0.7666015625, 0.79638671875, 0.826171875, 0.85595703125, 0.8857421875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 9.0, 15.0, 19.0, 23.0, 28.0, 55.0, 50.0, 62.0, 81.0, 88.0, 92.0, 76.0, 85.0, 71.0, 59.0, 56.0, 38.0, 25.0, 17.0, 21.0, 8.0, 6.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.131103515625, -0.127960205078125, -0.12481689453125, -0.121673583984375, -0.1185302734375, -0.115386962890625, -0.11224365234375, -0.109100341796875, -0.10595703125, -0.102813720703125, -0.09967041015625, -0.096527099609375, -0.0933837890625, -0.090240478515625, -0.08709716796875, -0.083953857421875, -0.080810546875, -0.077667236328125, -0.07452392578125, -0.071380615234375, -0.0682373046875, -0.065093994140625, -0.06195068359375, -0.058807373046875, -0.0556640625, -0.052520751953125, -0.04937744140625, -0.046234130859375, -0.0430908203125, -0.039947509765625, -0.03680419921875, -0.033660888671875, -0.030517578125, -0.027374267578125, -0.02423095703125, -0.021087646484375, -0.0179443359375, -0.014801025390625, -0.01165771484375, -0.008514404296875, -0.00537109375, -0.002227783203125, 0.00091552734375, 0.004058837890625, 0.0072021484375, 0.010345458984375, 0.01348876953125, 0.016632080078125, 0.019775390625, 0.022918701171875, 0.02606201171875, 0.029205322265625, 0.0323486328125, 0.035491943359375, 0.03863525390625, 0.041778564453125, 0.044921875, 0.048065185546875, 0.05120849609375, 0.054351806640625, 0.0574951171875, 0.060638427734375, 0.06378173828125, 0.066925048828125, 0.070068359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 8.0, 17.0, 16.0, 27.0, 35.0, 43.0, 80.0, 130.0, 230.0, 358.0, 714.0, 1711.0, 6271.0, 54629.0, 3638589.0, 466628.0, 18929.0, 3378.0, 1224.0, 540.0, 297.0, 159.0, 98.0, 64.0, 36.0, 27.0, 12.0, 5.0, 9.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.818359375, -0.7972640991210938, -0.7761688232421875, -0.7550735473632812, -0.733978271484375, -0.7128829956054688, -0.6917877197265625, -0.6706924438476562, -0.64959716796875, -0.6285018920898438, -0.6074066162109375, -0.5863113403320312, -0.565216064453125, -0.5441207885742188, -0.5230255126953125, -0.5019302368164062, -0.4808349609375, -0.45973968505859375, -0.4386444091796875, -0.41754913330078125, -0.396453857421875, -0.37535858154296875, -0.3542633056640625, -0.33316802978515625, -0.31207275390625, -0.29097747802734375, -0.2698822021484375, -0.24878692626953125, -0.227691650390625, -0.20659637451171875, -0.1855010986328125, -0.16440582275390625, -0.143310546875, -0.12221527099609375, -0.1011199951171875, -0.08002471923828125, -0.058929443359375, -0.03783416748046875, -0.0167388916015625, 0.00435638427734375, 0.02545166015625, 0.04654693603515625, 0.0676422119140625, 0.08873748779296875, 0.109832763671875, 0.13092803955078125, 0.1520233154296875, 0.17311859130859375, 0.1942138671875, 0.21530914306640625, 0.2364044189453125, 0.25749969482421875, 0.278594970703125, 0.29969024658203125, 0.3207855224609375, 0.34188079833984375, 0.36297607421875, 0.38407135009765625, 0.4051666259765625, 0.42626190185546875, 0.447357177734375, 0.46845245361328125, 0.4895477294921875, 0.5106430053710938, 0.53173828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 11.0, 10.0, 32.0, 35.0, 93.0, 168.0, 370.0, 1024.0, 1412.0, 469.0, 230.0, 109.0, 52.0, 28.0, 11.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.80810546875, -0.788909912109375, -0.76971435546875, -0.750518798828125, -0.7313232421875, -0.712127685546875, -0.69293212890625, -0.673736572265625, -0.654541015625, -0.635345458984375, -0.61614990234375, -0.596954345703125, -0.5777587890625, -0.558563232421875, -0.53936767578125, -0.520172119140625, -0.5009765625, -0.481781005859375, -0.46258544921875, -0.443389892578125, -0.4241943359375, -0.404998779296875, -0.38580322265625, -0.366607666015625, -0.347412109375, -0.328216552734375, -0.30902099609375, -0.289825439453125, -0.2706298828125, -0.251434326171875, -0.23223876953125, -0.213043212890625, -0.19384765625, -0.174652099609375, -0.15545654296875, -0.136260986328125, -0.1170654296875, -0.097869873046875, -0.07867431640625, -0.059478759765625, -0.040283203125, -0.021087646484375, -0.00189208984375, 0.017303466796875, 0.0364990234375, 0.055694580078125, 0.07489013671875, 0.094085693359375, 0.11328125, 0.132476806640625, 0.15167236328125, 0.170867919921875, 0.1900634765625, 0.209259033203125, 0.22845458984375, 0.247650146484375, 0.266845703125, 0.286041259765625, 0.30523681640625, 0.324432373046875, 0.3436279296875, 0.362823486328125, 0.38201904296875, 0.401214599609375, 0.42041015625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 0.0, 5.0, 3.0, 6.0, 5.0, 4.0, 7.0, 7.0, 14.0, 6.0, 11.0, 25.0, 30.0, 30.0, 53.0, 65.0, 94.0, 116.0, 119.0, 106.0, 76.0, 53.0, 44.0, 31.0, 26.0, 19.0, 13.0, 13.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.063363075256348, -3.969193458557129, -3.875023603439331, -3.7808539867401123, -3.6866843700408936, -3.5925145149230957, -3.498344898223877, -3.404175281524658, -3.3100056648254395, -3.2158360481262207, -3.121666193008423, -3.027496576309204, -2.9333269596099854, -2.8391571044921875, -2.7449874877929688, -2.65081787109375, -2.556648015975952, -2.4624783992767334, -2.3683085441589355, -2.274138927459717, -2.179969310760498, -2.0857996940612793, -1.9916298389434814, -1.8974602222442627, -1.8032904863357544, -1.709120750427246, -1.6149511337280273, -1.520781397819519, -1.4266116619110107, -1.332442045211792, -1.2382723093032837, -1.1441025733947754, -1.0499327182769775, -0.955763041973114, -0.8615933656692505, -0.7674236297607422, -0.6732539534568787, -0.5790842771530151, -0.48491454124450684, -0.3907448649406433, -0.2965751886367798, -0.20240549743175507, -0.10823580622673035, -0.014066100120544434, 0.08010357618331909, 0.17427325248718262, 0.2684429883956909, 0.36261266469955444, 0.45678234100341797, 0.5509520173072815, 0.645121693611145, 0.7392914295196533, 0.8334611058235168, 0.9276307821273804, 1.0218005180358887, 1.1159701347351074, 1.2101398706436157, 1.304309606552124, 1.3984792232513428, 1.492648959159851, 1.5868186950683594, 1.6809883117675781, 1.7751580476760864, 1.8693277835845947, 1.9634974002838135]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 1.0, 4.0, 10.0, 18.0, 9.0, 8.0, 11.0, 14.0, 22.0, 17.0, 14.0, 34.0, 24.0, 31.0, 47.0, 42.0, 43.0, 51.0, 43.0, 39.0, 48.0, 36.0, 54.0, 39.0, 40.0, 19.0, 32.0, 22.0, 31.0, 29.0, 17.0, 23.0, 20.0, 12.0, 16.0, 8.0, 14.0, 11.0, 10.0, 5.0, 7.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.9230966567993164, -1.8669215440750122, -1.810746431350708, -1.7545711994171143, -1.69839608669281, -1.6422209739685059, -1.5860458612442017, -1.5298707485198975, -1.4736956357955933, -1.417520523071289, -1.3613454103469849, -1.3051702976226807, -1.248995065689087, -1.1928199529647827, -1.1366448402404785, -1.0804697275161743, -1.0242946147918701, -0.9681195020675659, -0.9119443297386169, -0.8557692170143127, -0.7995941042900085, -0.7434189319610596, -0.6872438192367554, -0.6310687065124512, -0.5748934745788574, -0.5187183618545532, -0.46254321932792664, -0.40636807680130005, -0.35019296407699585, -0.29401782155036926, -0.23784267902374268, -0.18166756629943848, -0.12549245357513428, -0.06931732594966888, -0.013142190873622894, 0.043032944202423096, 0.09920807182788849, 0.15538319945335388, 0.21155834197998047, 0.26773345470428467, 0.32390859723091125, 0.38008373975753784, 0.43625885248184204, 0.49243399500846863, 0.5486091375350952, 0.6047842502593994, 0.6609593629837036, 0.7171344757080078, 0.7733096480369568, 0.829484760761261, 0.88565993309021, 0.9418350458145142, 0.9980101585388184, 1.0541852712631226, 1.1103603839874268, 1.1665356159210205, 1.2227107286453247, 1.278885841369629, 1.335060954093933, 1.3912360668182373, 1.447411298751831, 1.5035864114761353, 1.5597615242004395, 1.6159366369247437, 1.6721117496490479]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 6.0, 6.0, 11.0, 12.0, 35.0, 43.0, 75.0, 90.0, 160.0, 279.0, 430.0, 736.0, 1385.0, 2604.0, 5290.0, 11768.0, 30116.0, 100071.0, 579093.0, 227486.0, 54158.0, 18918.0, 7754.0, 3646.0, 1877.0, 963.0, 585.0, 335.0, 223.0, 149.0, 82.0, 57.0, 29.0, 30.0, 16.0, 14.0, 10.0, 2.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.6229629516601562, -0.6033477783203125, -0.5837326049804688, -0.564117431640625, -0.5445022583007812, -0.5248870849609375, -0.5052719116210938, -0.48565673828125, -0.46604156494140625, -0.4464263916015625, -0.42681121826171875, -0.407196044921875, -0.38758087158203125, -0.3679656982421875, -0.34835052490234375, -0.3287353515625, -0.30912017822265625, -0.2895050048828125, -0.26988983154296875, -0.250274658203125, -0.23065948486328125, -0.2110443115234375, -0.19142913818359375, -0.17181396484375, -0.15219879150390625, -0.1325836181640625, -0.11296844482421875, -0.093353271484375, -0.07373809814453125, -0.0541229248046875, -0.03450775146484375, -0.014892578125, 0.00472259521484375, 0.0243377685546875, 0.04395294189453125, 0.063568115234375, 0.08318328857421875, 0.1027984619140625, 0.12241363525390625, 0.14202880859375, 0.16164398193359375, 0.1812591552734375, 0.20087432861328125, 0.220489501953125, 0.24010467529296875, 0.2597198486328125, 0.27933502197265625, 0.2989501953125, 0.31856536865234375, 0.3381805419921875, 0.35779571533203125, 0.377410888671875, 0.39702606201171875, 0.4166412353515625, 0.43625640869140625, 0.45587158203125, 0.47548675537109375, 0.4951019287109375, 0.5147171020507812, 0.534332275390625, 0.5539474487304688, 0.5735626220703125, 0.5931777954101562, 0.61279296875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 7.0, 6.0, 7.0, 11.0, 17.0, 14.0, 27.0, 17.0, 35.0, 49.0, 41.0, 44.0, 41.0, 56.0, 74.0, 54.0, 76.0, 59.0, 51.0, 56.0, 44.0, 26.0, 43.0, 28.0, 26.0, 22.0, 13.0, 10.0, 11.0, 4.0, 5.0, 11.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.14208984375, -0.13840484619140625, -0.1347198486328125, -0.13103485107421875, -0.127349853515625, -0.12366485595703125, -0.1199798583984375, -0.11629486083984375, -0.11260986328125, -0.10892486572265625, -0.1052398681640625, -0.10155487060546875, -0.097869873046875, -0.09418487548828125, -0.0904998779296875, -0.08681488037109375, -0.0831298828125, -0.07944488525390625, -0.0757598876953125, -0.07207489013671875, -0.068389892578125, -0.06470489501953125, -0.0610198974609375, -0.05733489990234375, -0.05364990234375, -0.04996490478515625, -0.0462799072265625, -0.04259490966796875, -0.038909912109375, -0.03522491455078125, -0.0315399169921875, -0.02785491943359375, -0.024169921875, -0.02048492431640625, -0.0167999267578125, -0.01311492919921875, -0.009429931640625, -0.00574493408203125, -0.0020599365234375, 0.00162506103515625, 0.00531005859375, 0.00899505615234375, 0.0126800537109375, 0.01636505126953125, 0.020050048828125, 0.02373504638671875, 0.0274200439453125, 0.03110504150390625, 0.0347900390625, 0.03847503662109375, 0.0421600341796875, 0.04584503173828125, 0.049530029296875, 0.05321502685546875, 0.0569000244140625, 0.06058502197265625, 0.06427001953125, 0.06795501708984375, 0.0716400146484375, 0.07532501220703125, 0.079010009765625, 0.08269500732421875, 0.0863800048828125, 0.09006500244140625, 0.09375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 7.0, 4.0, 5.0, 7.0, 12.0, 16.0, 30.0, 31.0, 53.0, 71.0, 98.0, 141.0, 189.0, 330.0, 562.0, 885.0, 1517.0, 2934.0, 5850.0, 13647.0, 37684.0, 175770.0, 695631.0, 73242.0, 21823.0, 8709.0, 4150.0, 2073.0, 1164.0, 726.0, 407.0, 241.0, 160.0, 112.0, 96.0, 52.0, 42.0, 25.0, 17.0, 9.0, 11.0, 4.0, 6.0, 8.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.576171875, -0.5564727783203125, -0.536773681640625, -0.5170745849609375, -0.49737548828125, -0.4776763916015625, -0.457977294921875, -0.4382781982421875, -0.4185791015625, -0.3988800048828125, -0.379180908203125, -0.3594818115234375, -0.33978271484375, -0.3200836181640625, -0.300384521484375, -0.2806854248046875, -0.260986328125, -0.2412872314453125, -0.221588134765625, -0.2018890380859375, -0.18218994140625, -0.1624908447265625, -0.142791748046875, -0.1230926513671875, -0.1033935546875, -0.0836944580078125, -0.063995361328125, -0.0442962646484375, -0.02459716796875, -0.0048980712890625, 0.014801025390625, 0.0345001220703125, 0.05419921875, 0.0738983154296875, 0.093597412109375, 0.1132965087890625, 0.13299560546875, 0.1526947021484375, 0.172393798828125, 0.1920928955078125, 0.2117919921875, 0.2314910888671875, 0.251190185546875, 0.2708892822265625, 0.29058837890625, 0.3102874755859375, 0.329986572265625, 0.3496856689453125, 0.369384765625, 0.3890838623046875, 0.408782958984375, 0.4284820556640625, 0.44818115234375, 0.4678802490234375, 0.487579345703125, 0.5072784423828125, 0.5269775390625, 0.5466766357421875, 0.566375732421875, 0.5860748291015625, 0.60577392578125, 0.6254730224609375, 0.645172119140625, 0.6648712158203125, 0.6845703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 5.0, 4.0, 9.0, 9.0, 8.0, 17.0, 16.0, 19.0, 28.0, 42.0, 43.0, 60.0, 69.0, 76.0, 72.0, 74.0, 72.0, 89.0, 53.0, 43.0, 35.0, 36.0, 24.0, 20.0, 15.0, 16.0, 12.0, 6.0, 6.0, 9.0, 5.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.67138671875, -0.650665283203125, -0.62994384765625, -0.609222412109375, -0.5885009765625, -0.567779541015625, -0.54705810546875, -0.526336669921875, -0.505615234375, -0.484893798828125, -0.46417236328125, -0.443450927734375, -0.4227294921875, -0.402008056640625, -0.38128662109375, -0.360565185546875, -0.33984375, -0.319122314453125, -0.29840087890625, -0.277679443359375, -0.2569580078125, -0.236236572265625, -0.21551513671875, -0.194793701171875, -0.174072265625, -0.153350830078125, -0.13262939453125, -0.111907958984375, -0.0911865234375, -0.070465087890625, -0.04974365234375, -0.029022216796875, -0.00830078125, 0.012420654296875, 0.03314208984375, 0.053863525390625, 0.0745849609375, 0.095306396484375, 0.11602783203125, 0.136749267578125, 0.157470703125, 0.178192138671875, 0.19891357421875, 0.219635009765625, 0.2403564453125, 0.261077880859375, 0.28179931640625, 0.302520751953125, 0.3232421875, 0.343963623046875, 0.36468505859375, 0.385406494140625, 0.4061279296875, 0.426849365234375, 0.44757080078125, 0.468292236328125, 0.489013671875, 0.509735107421875, 0.53045654296875, 0.551177978515625, 0.5718994140625, 0.592620849609375, 0.61334228515625, 0.634063720703125, 0.65478515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 6.0, 6.0, 4.0, 8.0, 13.0, 12.0, 8.0, 43.0, 58.0, 103.0, 153.0, 300.0, 522.0, 1004.0, 2033.0, 4758.0, 12792.0, 47160.0, 729224.0, 203781.0, 30159.0, 9295.0, 3658.0, 1636.0, 820.0, 421.0, 213.0, 143.0, 73.0, 52.0, 32.0, 24.0, 17.0, 20.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12347412109375, -0.11947154998779297, -0.11546897888183594, -0.1114664077758789, -0.10746383666992188, -0.10346126556396484, -0.09945869445800781, -0.09545612335205078, -0.09145355224609375, -0.08745098114013672, -0.08344841003417969, -0.07944583892822266, -0.07544326782226562, -0.0714406967163086, -0.06743812561035156, -0.06343555450439453, -0.0594329833984375, -0.05543041229248047, -0.05142784118652344, -0.047425270080566406, -0.043422698974609375, -0.039420127868652344, -0.03541755676269531, -0.03141498565673828, -0.02741241455078125, -0.02340984344482422, -0.019407272338867188, -0.015404701232910156, -0.011402130126953125, -0.007399559020996094, -0.0033969879150390625, 0.0006055831909179688, 0.004608154296875, 0.008610725402832031, 0.012613296508789062, 0.016615867614746094, 0.020618438720703125, 0.024621009826660156, 0.028623580932617188, 0.03262615203857422, 0.03662872314453125, 0.04063129425048828, 0.04463386535644531, 0.048636436462402344, 0.052639007568359375, 0.056641578674316406, 0.06064414978027344, 0.06464672088623047, 0.0686492919921875, 0.07265186309814453, 0.07665443420410156, 0.0806570053100586, 0.08465957641601562, 0.08866214752197266, 0.09266471862792969, 0.09666728973388672, 0.10066986083984375, 0.10467243194580078, 0.10867500305175781, 0.11267757415771484, 0.11668014526367188, 0.1206827163696289, 0.12468528747558594, 0.12868785858154297, 0.1326904296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 11.0, 26.0, 37.0, 90.0, 147.0, 263.0, 195.0, 97.0, 43.0, 24.0, 11.0, 10.0, 6.0, 9.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027561187744140625, -0.0002676434814929962, -0.0002596750855445862, -0.00025170668959617615, -0.0002437382936477661, -0.00023576989769935608, -0.00022780150175094604, -0.000219833105802536, -0.00021186470985412598, -0.00020389631390571594, -0.0001959279179573059, -0.00018795952200889587, -0.00017999112606048584, -0.0001720227301120758, -0.00016405433416366577, -0.00015608593821525574, -0.0001481175422668457, -0.00014014914631843567, -0.00013218075037002563, -0.0001242123544216156, -0.00011624395847320557, -0.00010827556252479553, -0.0001003071665763855, -9.233877062797546e-05, -8.437037467956543e-05, -7.64019787311554e-05, -6.843358278274536e-05, -6.046518683433533e-05, -5.249679088592529e-05, -4.452839493751526e-05, -3.6559998989105225e-05, -2.859160304069519e-05, -2.0623207092285156e-05, -1.2654811143875122e-05, -4.686415195465088e-06, 3.2819807529449463e-06, 1.125037670135498e-05, 1.9218772649765015e-05, 2.718716859817505e-05, 3.515556454658508e-05, 4.312396049499512e-05, 5.109235644340515e-05, 5.9060752391815186e-05, 6.702914834022522e-05, 7.499754428863525e-05, 8.296594023704529e-05, 9.093433618545532e-05, 9.890273213386536e-05, 0.00010687112808227539, 0.00011483952403068542, 0.00012280791997909546, 0.0001307763159275055, 0.00013874471187591553, 0.00014671310782432556, 0.0001546815037727356, 0.00016264989972114563, 0.00017061829566955566, 0.0001785866916179657, 0.00018655508756637573, 0.00019452348351478577, 0.0002024918794631958, 0.00021046027541160583, 0.00021842867136001587, 0.0002263970673084259, 0.00023436546325683594]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 1.0, 6.0, 8.0, 8.0, 12.0, 27.0, 27.0, 43.0, 46.0, 91.0, 120.0, 164.0, 289.0, 394.0, 611.0, 1055.0, 1778.0, 3114.0, 6206.0, 13655.0, 34000.0, 126776.0, 721771.0, 87525.0, 27257.0, 11210.0, 5308.0, 2816.0, 1611.0, 952.0, 537.0, 357.0, 243.0, 162.0, 118.0, 68.0, 44.0, 38.0, 30.0, 16.0, 17.0, 13.0, 7.0, 4.0, 10.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.07684326171875, -0.07447052001953125, -0.0720977783203125, -0.06972503662109375, -0.067352294921875, -0.06497955322265625, -0.0626068115234375, -0.06023406982421875, -0.057861328125, -0.05548858642578125, -0.0531158447265625, -0.05074310302734375, -0.048370361328125, -0.04599761962890625, -0.0436248779296875, -0.04125213623046875, -0.03887939453125, -0.03650665283203125, -0.0341339111328125, -0.03176116943359375, -0.029388427734375, -0.02701568603515625, -0.0246429443359375, -0.02227020263671875, -0.0198974609375, -0.01752471923828125, -0.0151519775390625, -0.01277923583984375, -0.010406494140625, -0.00803375244140625, -0.0056610107421875, -0.00328826904296875, -0.00091552734375, 0.00145721435546875, 0.0038299560546875, 0.00620269775390625, 0.008575439453125, 0.01094818115234375, 0.0133209228515625, 0.01569366455078125, 0.01806640625, 0.02043914794921875, 0.0228118896484375, 0.02518463134765625, 0.027557373046875, 0.02993011474609375, 0.0323028564453125, 0.03467559814453125, 0.03704833984375, 0.03942108154296875, 0.0417938232421875, 0.04416656494140625, 0.046539306640625, 0.04891204833984375, 0.0512847900390625, 0.05365753173828125, 0.0560302734375, 0.05840301513671875, 0.0607757568359375, 0.06314849853515625, 0.065521240234375, 0.06789398193359375, 0.0702667236328125, 0.07263946533203125, 0.07501220703125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 0.0, 3.0, 2.0, 3.0, 11.0, 9.0, 9.0, 16.0, 12.0, 18.0, 37.0, 29.0, 49.0, 40.0, 64.0, 99.0, 125.0, 110.0, 73.0, 62.0, 48.0, 35.0, 23.0, 21.0, 21.0, 25.0, 13.0, 5.0, 9.0, 8.0, 3.0, 7.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.081298828125, -0.07847118377685547, -0.07564353942871094, -0.0728158950805664, -0.06998825073242188, -0.06716060638427734, -0.06433296203613281, -0.06150531768798828, -0.05867767333984375, -0.05585002899169922, -0.05302238464355469, -0.050194740295410156, -0.047367095947265625, -0.044539451599121094, -0.04171180725097656, -0.03888416290283203, -0.0360565185546875, -0.03322887420654297, -0.030401229858398438, -0.027573585510253906, -0.024745941162109375, -0.021918296813964844, -0.019090652465820312, -0.01626300811767578, -0.01343536376953125, -0.010607719421386719, -0.0077800750732421875, -0.004952430725097656, -0.002124786376953125, 0.0007028579711914062, 0.0035305023193359375, 0.006358146667480469, 0.009185791015625, 0.012013435363769531, 0.014841079711914062, 0.017668724060058594, 0.020496368408203125, 0.023324012756347656, 0.026151657104492188, 0.02897930145263672, 0.03180694580078125, 0.03463459014892578, 0.03746223449707031, 0.040289878845214844, 0.043117523193359375, 0.045945167541503906, 0.04877281188964844, 0.05160045623779297, 0.0544281005859375, 0.05725574493408203, 0.06008338928222656, 0.0629110336303711, 0.06573867797851562, 0.06856632232666016, 0.07139396667480469, 0.07422161102294922, 0.07704925537109375, 0.07987689971923828, 0.08270454406738281, 0.08553218841552734, 0.08835983276367188, 0.0911874771118164, 0.09401512145996094, 0.09684276580810547, 0.09967041015625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 11.0, 9.0, 11.0, 10.0, 23.0, 35.0, 53.0, 72.0, 152.0, 411.0, 118.0, 39.0, 26.0, 9.0, 9.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.351711750030518, -6.17690372467041, -6.002095699310303, -5.827287673950195, -5.65247917175293, -5.477671146392822, -5.302863121032715, -5.128055095672607, -4.9532470703125, -4.778439044952393, -4.603631019592285, -4.4288225173950195, -4.254014492034912, -4.079206466674805, -3.9043984413146973, -3.72959041595459, -3.554781913757324, -3.379973888397217, -3.2051656246185303, -3.030357599258423, -2.8555493354797363, -2.680741310119629, -2.5059332847595215, -2.331125259399414, -2.1563169956207275, -1.9815088510513306, -1.8067007064819336, -1.6318926811218262, -1.4570845365524292, -1.2822763919830322, -1.1074683666229248, -0.9326602220535278, -0.7578525543212891, -0.5830444097518921, -0.4082363247871399, -0.2334282398223877, -0.05862009525299072, 0.11618804931640625, 0.29099607467651367, 0.46580421924591064, 0.6406123638153076, 0.8154205083847046, 0.9902285933494568, 1.165036678314209, 1.339844822883606, 1.514652967453003, 1.6894609928131104, 1.8642691373825073, 2.0390772819519043, 2.2138853073120117, 2.3886935710906982, 2.5635015964508057, 2.738309860229492, 2.9131178855895996, 3.087925910949707, 3.2627339363098145, 3.437542200088501, 3.6123502254486084, 3.787158489227295, 3.9619665145874023, 4.13677453994751, 4.311582565307617, 4.486391067504883, 4.66119909286499, 4.836007118225098]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 6.0, 7.0, 7.0, 7.0, 9.0, 14.0, 12.0, 24.0, 21.0, 19.0, 25.0, 36.0, 34.0, 29.0, 42.0, 59.0, 128.0, 122.0, 63.0, 51.0, 39.0, 33.0, 27.0, 37.0, 19.0, 23.0, 14.0, 19.0, 11.0, 16.0, 10.0, 10.0, 3.0, 1.0, 6.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.698139190673828, -2.616666555404663, -2.535193920135498, -2.453721046447754, -2.372248411178589, -2.290775775909424, -2.2093029022216797, -2.1278302669525146, -2.0463576316833496, -1.9648849964141846, -1.88341224193573, -1.8019394874572754, -1.7204668521881104, -1.6389942169189453, -1.5575214624404907, -1.4760487079620361, -1.394576072692871, -1.313103437423706, -1.2316306829452515, -1.1501579284667969, -1.0686852931976318, -0.987212598323822, -0.9057399034500122, -0.8242672085762024, -0.7427945137023926, -0.6613218188285828, -0.579849123954773, -0.49837642908096313, -0.4169037342071533, -0.3354310393333435, -0.2539583444595337, -0.17248564958572388, -0.09101319313049316, -0.00954049825668335, 0.07193219661712646, 0.15340489149093628, 0.2348775863647461, 0.3163502812385559, 0.3978229761123657, 0.47929567098617554, 0.5607683658599854, 0.6422410607337952, 0.723713755607605, 0.8051864504814148, 0.8866591453552246, 0.9681318402290344, 1.0496045351028442, 1.1310772895812988, 1.2125499248504639, 1.294022560119629, 1.3754953145980835, 1.456968069076538, 1.5384407043457031, 1.6199133396148682, 1.7013860940933228, 1.7828588485717773, 1.8643314838409424, 1.9458041191101074, 2.0272769927978516, 2.1087496280670166, 2.1902222633361816, 2.2716948986053467, 2.3531675338745117, 2.434640407562256, 2.516113042831421]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 11.0, 2.0, 6.0, 10.0, 10.0, 10.0, 17.0, 19.0, 16.0, 41.0, 56.0, 85.0, 107.0, 158.0, 230.0, 304.0, 494.0, 1527.0, 13528.0, 4046217.0, 125999.0, 3416.0, 768.0, 312.0, 241.0, 169.0, 127.0, 95.0, 74.0, 69.0, 28.0, 33.0, 19.0, 20.0, 22.0, 14.0, 6.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.82080078125, -0.799041748046875, -0.77728271484375, -0.755523681640625, -0.7337646484375, -0.712005615234375, -0.69024658203125, -0.668487548828125, -0.646728515625, -0.624969482421875, -0.60321044921875, -0.581451416015625, -0.5596923828125, -0.537933349609375, -0.51617431640625, -0.494415283203125, -0.47265625, -0.450897216796875, -0.42913818359375, -0.407379150390625, -0.3856201171875, -0.363861083984375, -0.34210205078125, -0.320343017578125, -0.298583984375, -0.276824951171875, -0.25506591796875, -0.233306884765625, -0.2115478515625, -0.189788818359375, -0.16802978515625, -0.146270751953125, -0.12451171875, -0.102752685546875, -0.08099365234375, -0.059234619140625, -0.0374755859375, -0.015716552734375, 0.00604248046875, 0.027801513671875, 0.049560546875, 0.071319580078125, 0.09307861328125, 0.114837646484375, 0.1365966796875, 0.158355712890625, 0.18011474609375, 0.201873779296875, 0.2236328125, 0.245391845703125, 0.26715087890625, 0.288909912109375, 0.3106689453125, 0.332427978515625, 0.35418701171875, 0.375946044921875, 0.397705078125, 0.419464111328125, 0.44122314453125, 0.462982177734375, 0.4847412109375, 0.506500244140625, 0.52825927734375, 0.550018310546875, 0.57177734375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 13.0, 20.0, 21.0, 26.0, 40.0, 47.0, 55.0, 58.0, 67.0, 62.0, 75.0, 75.0, 81.0, 62.0, 64.0, 55.0, 29.0, 31.0, 27.0, 24.0, 13.0, 9.0, 10.0, 7.0, 9.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1522216796875, -0.14770126342773438, -0.14318084716796875, -0.13866043090820312, -0.1341400146484375, -0.12961959838867188, -0.12509918212890625, -0.12057876586914062, -0.116058349609375, -0.11153793334960938, -0.10701751708984375, -0.10249710083007812, -0.0979766845703125, -0.09345626831054688, -0.08893585205078125, -0.08441543579101562, -0.07989501953125, -0.07537460327148438, -0.07085418701171875, -0.06633377075195312, -0.0618133544921875, -0.057292938232421875, -0.05277252197265625, -0.048252105712890625, -0.043731689453125, -0.039211273193359375, -0.03469085693359375, -0.030170440673828125, -0.0256500244140625, -0.021129608154296875, -0.01660919189453125, -0.012088775634765625, -0.007568359375, -0.003047943115234375, 0.00147247314453125, 0.005992889404296875, 0.0105133056640625, 0.015033721923828125, 0.01955413818359375, 0.024074554443359375, 0.028594970703125, 0.033115386962890625, 0.03763580322265625, 0.042156219482421875, 0.0466766357421875, 0.051197052001953125, 0.05571746826171875, 0.060237884521484375, 0.06475830078125, 0.06927871704101562, 0.07379913330078125, 0.07831954956054688, 0.0828399658203125, 0.08736038208007812, 0.09188079833984375, 0.09640121459960938, 0.100921630859375, 0.10544204711914062, 0.10996246337890625, 0.11448287963867188, 0.1190032958984375, 0.12352371215820312, 0.12804412841796875, 0.13256454467773438, 0.1370849609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 15.0, 34.0, 58.0, 111.0, 200.0, 368.0, 874.0, 2081.0, 9172.0, 386766.0, 3771239.0, 17831.0, 3188.0, 1158.0, 566.0, 279.0, 146.0, 75.0, 50.0, 19.0, 12.0, 9.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5791015625, -0.55694580078125, -0.5347900390625, -0.51263427734375, -0.490478515625, -0.46832275390625, -0.4461669921875, -0.42401123046875, -0.40185546875, -0.37969970703125, -0.3575439453125, -0.33538818359375, -0.313232421875, -0.29107666015625, -0.2689208984375, -0.24676513671875, -0.224609375, -0.20245361328125, -0.1802978515625, -0.15814208984375, -0.135986328125, -0.11383056640625, -0.0916748046875, -0.06951904296875, -0.04736328125, -0.02520751953125, -0.0030517578125, 0.01910400390625, 0.041259765625, 0.06341552734375, 0.0855712890625, 0.10772705078125, 0.1298828125, 0.15203857421875, 0.1741943359375, 0.19635009765625, 0.218505859375, 0.24066162109375, 0.2628173828125, 0.28497314453125, 0.30712890625, 0.32928466796875, 0.3514404296875, 0.37359619140625, 0.395751953125, 0.41790771484375, 0.4400634765625, 0.46221923828125, 0.484375, 0.50653076171875, 0.5286865234375, 0.55084228515625, 0.572998046875, 0.59515380859375, 0.6173095703125, 0.63946533203125, 0.66162109375, 0.68377685546875, 0.7059326171875, 0.72808837890625, 0.750244140625, 0.77239990234375, 0.7945556640625, 0.81671142578125, 0.8388671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 5.0, 12.0, 16.0, 20.0, 22.0, 62.0, 108.0, 224.0, 697.0, 1515.0, 837.0, 260.0, 111.0, 61.0, 36.0, 20.0, 16.0, 6.0, 5.0, 9.0, 7.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240234375, -0.2265777587890625, -0.212921142578125, -0.1992645263671875, -0.18560791015625, -0.1719512939453125, -0.158294677734375, -0.1446380615234375, -0.1309814453125, -0.1173248291015625, -0.103668212890625, -0.0900115966796875, -0.07635498046875, -0.0626983642578125, -0.049041748046875, -0.0353851318359375, -0.021728515625, -0.0080718994140625, 0.005584716796875, 0.0192413330078125, 0.03289794921875, 0.0465545654296875, 0.060211181640625, 0.0738677978515625, 0.0875244140625, 0.1011810302734375, 0.114837646484375, 0.1284942626953125, 0.14215087890625, 0.1558074951171875, 0.169464111328125, 0.1831207275390625, 0.19677734375, 0.2104339599609375, 0.224090576171875, 0.2377471923828125, 0.25140380859375, 0.2650604248046875, 0.278717041015625, 0.2923736572265625, 0.3060302734375, 0.3196868896484375, 0.333343505859375, 0.3470001220703125, 0.36065673828125, 0.3743133544921875, 0.387969970703125, 0.4016265869140625, 0.415283203125, 0.4289398193359375, 0.442596435546875, 0.4562530517578125, 0.46990966796875, 0.4835662841796875, 0.497222900390625, 0.5108795166015625, 0.5245361328125, 0.5381927490234375, 0.551849365234375, 0.5655059814453125, 0.57916259765625, 0.5928192138671875, 0.606475830078125, 0.6201324462890625, 0.6337890625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 11.0, 39.0, 87.0, 242.0, 312.0, 154.0, 66.0, 44.0, 14.0, 10.0, 10.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.582521915435791, -7.418257236480713, -7.253992557525635, -7.089727401733398, -6.92546272277832, -6.761198043823242, -6.596933364868164, -6.432668685913086, -6.268404006958008, -6.10413932800293, -5.939874649047852, -5.775609493255615, -5.611344814300537, -5.447080135345459, -5.282815456390381, -5.118550777435303, -4.954285621643066, -4.790020942687988, -4.62575626373291, -4.461491107940674, -4.297226428985596, -4.132961750030518, -3.9686970710754395, -3.8044323921203613, -3.640167474746704, -3.475902795791626, -3.3116378784179688, -3.1473731994628906, -2.9831085205078125, -2.8188436031341553, -2.654578924179077, -2.49031400680542, -2.3260498046875, -2.161785125732422, -1.9975202083587646, -1.8332555294036865, -1.6689907312393188, -1.5047259330749512, -1.340461254119873, -1.1761964559555054, -1.0119316577911377, -0.84766685962677, -0.6834021210670471, -0.5191373825073242, -0.35487258434295654, -0.19060778617858887, -0.026343047618865967, 0.13792169094085693, 0.3021864891052246, 0.4664512574672699, 0.6307160258293152, 0.7949807643890381, 0.9592455625534058, 1.1235103607177734, 1.2877750396728516, 1.4520398378372192, 1.616304636001587, 1.7805694341659546, 1.9448342323303223, 2.1090989112854004, 2.2733635902404785, 2.4376285076141357, 2.601893186569214, 2.766158103942871, 2.930422782897949]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 15.0, 9.0, 23.0, 26.0, 37.0, 44.0, 42.0, 48.0, 59.0, 67.0, 72.0, 100.0, 92.0, 83.0, 57.0, 56.0, 34.0, 41.0, 29.0, 22.0, 16.0, 6.0, 4.0, 2.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5968148708343506, -3.4969451427459717, -3.3970754146575928, -3.297205924987793, -3.197336196899414, -3.097466468811035, -2.9975967407226562, -2.8977270126342773, -2.7978575229644775, -2.6979877948760986, -2.5981180667877197, -2.49824857711792, -2.398378849029541, -2.298509120941162, -2.198639392852783, -2.0987696647644043, -1.998900055885315, -1.899030327796936, -1.7991607189178467, -1.6992909908294678, -1.5994213819503784, -1.4995516538619995, -1.3996820449829102, -1.2998123168945312, -1.1999425888061523, -1.1000728607177734, -1.000203251838684, -0.9003335237503052, -0.8004639148712158, -0.7005941867828369, -0.6007245182991028, -0.5008548498153687, -0.4009852409362793, -0.30111557245254517, -0.20124588906764984, -0.10137620568275452, -0.0015065371990203857, 0.09836313128471375, 0.19823282957077026, 0.2981024980545044, 0.3979721665382385, 0.49784183502197266, 0.5977115035057068, 0.6975811719894409, 0.7974509000778198, 0.8973205089569092, 0.9971902370452881, 1.097059965133667, 1.1969295740127563, 1.2967993021011353, 1.3966689109802246, 1.4965386390686035, 1.5964082479476929, 1.6962779760360718, 1.7961475849151611, 1.89601731300354, 1.995887041091919, 2.095756769180298, 2.1956264972686768, 2.2954959869384766, 2.3953657150268555, 2.4952354431152344, 2.5951051712036133, 2.694974899291992, 2.794844388961792]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 12.0, 10.0, 14.0, 27.0, 42.0, 52.0, 86.0, 146.0, 234.0, 351.0, 586.0, 1118.0, 2124.0, 4725.0, 11698.0, 35869.0, 168085.0, 635895.0, 136740.0, 31446.0, 10491.0, 4311.0, 1982.0, 1004.0, 599.0, 342.0, 190.0, 111.0, 93.0, 50.0, 40.0, 20.0, 15.0, 9.0, 7.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42578125, -0.4108123779296875, -0.395843505859375, -0.3808746337890625, -0.36590576171875, -0.3509368896484375, -0.335968017578125, -0.3209991455078125, -0.3060302734375, -0.2910614013671875, -0.276092529296875, -0.2611236572265625, -0.24615478515625, -0.2311859130859375, -0.216217041015625, -0.2012481689453125, -0.186279296875, -0.1713104248046875, -0.156341552734375, -0.1413726806640625, -0.12640380859375, -0.1114349365234375, -0.096466064453125, -0.0814971923828125, -0.0665283203125, -0.0515594482421875, -0.036590576171875, -0.0216217041015625, -0.00665283203125, 0.0083160400390625, 0.023284912109375, 0.0382537841796875, 0.05322265625, 0.0681915283203125, 0.083160400390625, 0.0981292724609375, 0.11309814453125, 0.1280670166015625, 0.143035888671875, 0.1580047607421875, 0.1729736328125, 0.1879425048828125, 0.202911376953125, 0.2178802490234375, 0.23284912109375, 0.2478179931640625, 0.262786865234375, 0.2777557373046875, 0.292724609375, 0.3076934814453125, 0.322662353515625, 0.3376312255859375, 0.35260009765625, 0.3675689697265625, 0.382537841796875, 0.3975067138671875, 0.4124755859375, 0.4274444580078125, 0.442413330078125, 0.4573822021484375, 0.47235107421875, 0.4873199462890625, 0.502288818359375, 0.5172576904296875, 0.5322265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 4.0, 7.0, 15.0, 17.0, 17.0, 30.0, 28.0, 28.0, 26.0, 48.0, 44.0, 37.0, 44.0, 53.0, 57.0, 62.0, 49.0, 53.0, 58.0, 47.0, 40.0, 41.0, 26.0, 32.0, 27.0, 17.0, 14.0, 15.0, 12.0, 7.0, 7.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1590576171875, -0.1545085906982422, -0.14995956420898438, -0.14541053771972656, -0.14086151123046875, -0.13631248474121094, -0.13176345825195312, -0.1272144317626953, -0.1226654052734375, -0.11811637878417969, -0.11356735229492188, -0.10901832580566406, -0.10446929931640625, -0.09992027282714844, -0.09537124633789062, -0.09082221984863281, -0.086273193359375, -0.08172416687011719, -0.07717514038085938, -0.07262611389160156, -0.06807708740234375, -0.06352806091308594, -0.058979034423828125, -0.05443000793457031, -0.0498809814453125, -0.04533195495605469, -0.040782928466796875, -0.03623390197753906, -0.03168487548828125, -0.027135848999023438, -0.022586822509765625, -0.018037796020507812, -0.01348876953125, -0.008939743041992188, -0.004390716552734375, 0.0001583099365234375, 0.00470733642578125, 0.009256362915039062, 0.013805389404296875, 0.018354415893554688, 0.0229034423828125, 0.027452468872070312, 0.032001495361328125, 0.03655052185058594, 0.04109954833984375, 0.04564857482910156, 0.050197601318359375, 0.05474662780761719, 0.059295654296875, 0.06384468078613281, 0.06839370727539062, 0.07294273376464844, 0.07749176025390625, 0.08204078674316406, 0.08658981323242188, 0.09113883972167969, 0.0956878662109375, 0.10023689270019531, 0.10478591918945312, 0.10933494567871094, 0.11388397216796875, 0.11843299865722656, 0.12298202514648438, 0.1275310516357422, 0.132080078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 5.0, 7.0, 11.0, 14.0, 23.0, 29.0, 33.0, 44.0, 53.0, 87.0, 115.0, 175.0, 261.0, 361.0, 696.0, 1512.0, 4018.0, 13392.0, 66204.0, 756699.0, 168406.0, 25297.0, 6475.0, 2235.0, 943.0, 505.0, 261.0, 174.0, 133.0, 101.0, 81.0, 57.0, 41.0, 29.0, 19.0, 17.0, 9.0, 7.0, 7.0, 11.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49365234375, -0.4785652160644531, -0.46347808837890625, -0.4483909606933594, -0.4333038330078125, -0.4182167053222656, -0.40312957763671875, -0.3880424499511719, -0.372955322265625, -0.3578681945800781, -0.34278106689453125, -0.3276939392089844, -0.3126068115234375, -0.2975196838378906, -0.28243255615234375, -0.2673454284667969, -0.25225830078125, -0.23717117309570312, -0.22208404541015625, -0.20699691772460938, -0.1919097900390625, -0.17682266235351562, -0.16173553466796875, -0.14664840698242188, -0.131561279296875, -0.11647415161132812, -0.10138702392578125, -0.08629989624023438, -0.0712127685546875, -0.056125640869140625, -0.04103851318359375, -0.025951385498046875, -0.0108642578125, 0.004222869873046875, 0.01930999755859375, 0.034397125244140625, 0.0494842529296875, 0.06457138061523438, 0.07965850830078125, 0.09474563598632812, 0.109832763671875, 0.12491989135742188, 0.14000701904296875, 0.15509414672851562, 0.1701812744140625, 0.18526840209960938, 0.20035552978515625, 0.21544265747070312, 0.23052978515625, 0.24561691284179688, 0.26070404052734375, 0.2757911682128906, 0.2908782958984375, 0.3059654235839844, 0.32105255126953125, 0.3361396789550781, 0.351226806640625, 0.3663139343261719, 0.38140106201171875, 0.3964881896972656, 0.4115753173828125, 0.4266624450683594, 0.44174957275390625, 0.4568367004394531, 0.471923828125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 11.0, 12.0, 11.0, 19.0, 21.0, 16.0, 26.0, 28.0, 44.0, 48.0, 49.0, 63.0, 66.0, 60.0, 70.0, 52.0, 66.0, 51.0, 42.0, 49.0, 35.0, 24.0, 26.0, 19.0, 19.0, 11.0, 11.0, 11.0, 8.0, 7.0, 4.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6416015625, -0.6211090087890625, -0.600616455078125, -0.5801239013671875, -0.55963134765625, -0.5391387939453125, -0.518646240234375, -0.4981536865234375, -0.4776611328125, -0.4571685791015625, -0.436676025390625, -0.4161834716796875, -0.39569091796875, -0.3751983642578125, -0.354705810546875, -0.3342132568359375, -0.313720703125, -0.2932281494140625, -0.272735595703125, -0.2522430419921875, -0.23175048828125, -0.2112579345703125, -0.190765380859375, -0.1702728271484375, -0.1497802734375, -0.1292877197265625, -0.108795166015625, -0.0883026123046875, -0.06781005859375, -0.0473175048828125, -0.026824951171875, -0.0063323974609375, 0.01416015625, 0.0346527099609375, 0.055145263671875, 0.0756378173828125, 0.09613037109375, 0.1166229248046875, 0.137115478515625, 0.1576080322265625, 0.1781005859375, 0.1985931396484375, 0.219085693359375, 0.2395782470703125, 0.26007080078125, 0.2805633544921875, 0.301055908203125, 0.3215484619140625, 0.342041015625, 0.3625335693359375, 0.383026123046875, 0.4035186767578125, 0.42401123046875, 0.4445037841796875, 0.464996337890625, 0.4854888916015625, 0.5059814453125, 0.5264739990234375, 0.546966552734375, 0.5674591064453125, 0.58795166015625, 0.6084442138671875, 0.628936767578125, 0.6494293212890625, 0.669921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 14.0, 24.0, 31.0, 82.0, 187.0, 351.0, 1042.0, 4498.0, 92872.0, 936436.0, 10376.0, 1677.0, 528.0, 199.0, 99.0, 59.0, 21.0, 11.0, 13.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.330810546875, -0.3202056884765625, -0.309600830078125, -0.2989959716796875, -0.28839111328125, -0.2777862548828125, -0.267181396484375, -0.2565765380859375, -0.2459716796875, -0.2353668212890625, -0.224761962890625, -0.2141571044921875, -0.20355224609375, -0.1929473876953125, -0.182342529296875, -0.1717376708984375, -0.1611328125, -0.1505279541015625, -0.139923095703125, -0.1293182373046875, -0.11871337890625, -0.1081085205078125, -0.097503662109375, -0.0868988037109375, -0.0762939453125, -0.0656890869140625, -0.055084228515625, -0.0444793701171875, -0.03387451171875, -0.0232696533203125, -0.012664794921875, -0.0020599365234375, 0.008544921875, 0.0191497802734375, 0.029754638671875, 0.0403594970703125, 0.05096435546875, 0.0615692138671875, 0.072174072265625, 0.0827789306640625, 0.0933837890625, 0.1039886474609375, 0.114593505859375, 0.1251983642578125, 0.13580322265625, 0.1464080810546875, 0.157012939453125, 0.1676177978515625, 0.17822265625, 0.1888275146484375, 0.199432373046875, 0.2100372314453125, 0.22064208984375, 0.2312469482421875, 0.241851806640625, 0.2524566650390625, 0.2630615234375, 0.2736663818359375, 0.284271240234375, 0.2948760986328125, 0.30548095703125, 0.3160858154296875, 0.326690673828125, 0.3372955322265625, 0.347900390625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 6.0, 11.0, 13.0, 14.0, 23.0, 30.0, 53.0, 57.0, 94.0, 157.0, 195.0, 107.0, 77.0, 46.0, 28.0, 24.0, 13.0, 15.0, 5.0, 5.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002334117889404297, -0.00022617727518081665, -0.0002189427614212036, -0.00021170824766159058, -0.00020447373390197754, -0.0001972392201423645, -0.00019000470638275146, -0.00018277019262313843, -0.0001755356788635254, -0.00016830116510391235, -0.00016106665134429932, -0.00015383213758468628, -0.00014659762382507324, -0.0001393631100654602, -0.00013212859630584717, -0.00012489408254623413, -0.0001176595687866211, -0.00011042505502700806, -0.00010319054126739502, -9.595602750778198e-05, -8.872151374816895e-05, -8.148699998855591e-05, -7.425248622894287e-05, -6.701797246932983e-05, -5.97834587097168e-05, -5.254894495010376e-05, -4.531443119049072e-05, -3.8079917430877686e-05, -3.084540367126465e-05, -2.361088991165161e-05, -1.6376376152038574e-05, -9.141862392425537e-06, -1.9073486328125e-06, 5.327165126800537e-06, 1.2561678886413574e-05, 1.979619264602661e-05, 2.703070640563965e-05, 3.4265220165252686e-05, 4.149973392486572e-05, 4.873424768447876e-05, 5.59687614440918e-05, 6.320327520370483e-05, 7.043778896331787e-05, 7.767230272293091e-05, 8.490681648254395e-05, 9.214133024215698e-05, 9.937584400177002e-05, 0.00010661035776138306, 0.0001138448715209961, 0.00012107938528060913, 0.00012831389904022217, 0.0001355484127998352, 0.00014278292655944824, 0.00015001744031906128, 0.00015725195407867432, 0.00016448646783828735, 0.0001717209815979004, 0.00017895549535751343, 0.00018619000911712646, 0.0001934245228767395, 0.00020065903663635254, 0.00020789355039596558, 0.0002151280641555786, 0.00022236257791519165, 0.0002295970916748047]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 5.0, 11.0, 14.0, 13.0, 28.0, 47.0, 95.0, 162.0, 397.0, 1348.0, 10519.0, 1016454.0, 16977.0, 1579.0, 448.0, 213.0, 97.0, 48.0, 33.0, 13.0, 18.0, 10.0, 3.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5771484375, -0.5604515075683594, -0.5437545776367188, -0.5270576477050781, -0.5103607177734375, -0.4936637878417969, -0.47696685791015625, -0.4602699279785156, -0.443572998046875, -0.4268760681152344, -0.41017913818359375, -0.3934822082519531, -0.3767852783203125, -0.3600883483886719, -0.34339141845703125, -0.3266944885253906, -0.30999755859375, -0.2933006286621094, -0.27660369873046875, -0.2599067687988281, -0.2432098388671875, -0.22651290893554688, -0.20981597900390625, -0.19311904907226562, -0.176422119140625, -0.15972518920898438, -0.14302825927734375, -0.12633132934570312, -0.1096343994140625, -0.09293746948242188, -0.07624053955078125, -0.059543609619140625, -0.0428466796875, -0.026149749755859375, -0.00945281982421875, 0.007244110107421875, 0.0239410400390625, 0.040637969970703125, 0.05733489990234375, 0.07403182983398438, 0.090728759765625, 0.10742568969726562, 0.12412261962890625, 0.14081954956054688, 0.1575164794921875, 0.17421340942382812, 0.19091033935546875, 0.20760726928710938, 0.22430419921875, 0.24100112915039062, 0.25769805908203125, 0.2743949890136719, 0.2910919189453125, 0.3077888488769531, 0.32448577880859375, 0.3411827087402344, 0.357879638671875, 0.3745765686035156, 0.39127349853515625, 0.4079704284667969, 0.4246673583984375, 0.4413642883300781, 0.45806121826171875, 0.4747581481933594, 0.491455078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 8.0, 8.0, 35.0, 61.0, 168.0, 387.0, 205.0, 66.0, 24.0, 21.0, 4.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64208984375, -0.6250076293945312, -0.6079254150390625, -0.5908432006835938, -0.573760986328125, -0.5566787719726562, -0.5395965576171875, -0.5225143432617188, -0.50543212890625, -0.48834991455078125, -0.4712677001953125, -0.45418548583984375, -0.437103271484375, -0.42002105712890625, -0.4029388427734375, -0.38585662841796875, -0.3687744140625, -0.35169219970703125, -0.3346099853515625, -0.31752777099609375, -0.300445556640625, -0.28336334228515625, -0.2662811279296875, -0.24919891357421875, -0.23211669921875, -0.21503448486328125, -0.1979522705078125, -0.18087005615234375, -0.163787841796875, -0.14670562744140625, -0.1296234130859375, -0.11254119873046875, -0.095458984375, -0.07837677001953125, -0.0612945556640625, -0.04421234130859375, -0.027130126953125, -0.01004791259765625, 0.0070343017578125, 0.02411651611328125, 0.04119873046875, 0.05828094482421875, 0.0753631591796875, 0.09244537353515625, 0.109527587890625, 0.12660980224609375, 0.1436920166015625, 0.16077423095703125, 0.1778564453125, 0.19493865966796875, 0.2120208740234375, 0.22910308837890625, 0.246185302734375, 0.26326751708984375, 0.2803497314453125, 0.29743194580078125, 0.31451416015625, 0.33159637451171875, 0.3486785888671875, 0.36576080322265625, 0.382843017578125, 0.39992523193359375, 0.4170074462890625, 0.43408966064453125, 0.451171875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 371.0, 567.0, 44.0, 13.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-31.435022354125977, -30.853286743164062, -30.27155113220215, -29.689815521240234, -29.108081817626953, -28.52634620666504, -27.944610595703125, -27.36287498474121, -26.781139373779297, -26.199403762817383, -25.61766815185547, -25.035932540893555, -24.45419692993164, -23.87246322631836, -23.290727615356445, -22.70899200439453, -22.127256393432617, -21.545520782470703, -20.96378517150879, -20.382049560546875, -19.800315856933594, -19.21858024597168, -18.636844635009766, -18.05510902404785, -17.473373413085938, -16.891637802124023, -16.30990219116211, -15.728167533874512, -15.146431922912598, -14.564696311950684, -13.982961654663086, -13.401226043701172, -12.819488525390625, -12.237752914428711, -11.656017303466797, -11.0742826461792, -10.492547035217285, -9.910811424255371, -9.329076766967773, -8.74734115600586, -8.165605545043945, -7.583869934082031, -7.002134799957275, -6.4203996658325195, -5.8386640548706055, -5.256928443908691, -4.6751933097839355, -4.09345817565918, -3.5117225646972656, -2.9299871921539307, -2.3482518196105957, -1.7665164470672607, -1.1847810745239258, -0.6030457019805908, -0.02131032943725586, 0.5604248046875, 1.142160415649414, 1.723895788192749, 2.305631160736084, 2.887366533279419, 3.469101905822754, 4.050837516784668, 4.632572650909424, 5.21430778503418, 5.796043395996094]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 11.0, 11.0, 22.0, 29.0, 36.0, 36.0, 53.0, 34.0, 107.0, 132.0, 115.0, 123.0, 61.0, 60.0, 45.0, 30.0, 25.0, 18.0, 15.0, 10.0, 13.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7437186241149902, -3.5891010761260986, -3.434483528137207, -3.2798657417297363, -3.1252481937408447, -2.970630645751953, -2.8160128593444824, -2.661395311355591, -2.506777763366699, -2.3521602153778076, -2.197542667388916, -2.0429248809814453, -1.8883073329925537, -1.733689785003662, -1.579072117805481, -1.4244544506072998, -1.2698369026184082, -1.1152193546295166, -0.9606016874313354, -0.8059840798377991, -0.6513664722442627, -0.4967488646507263, -0.34213125705718994, -0.1875135898590088, -0.03289604187011719, 0.12172156572341919, 0.27633917331695557, 0.43095678091049194, 0.5855743885040283, 0.7401919960975647, 0.8948096036911011, 1.0494272708892822, 1.204045295715332, 1.3586628437042236, 1.5132805109024048, 1.667898178100586, 1.8225157260894775, 1.9771332740783691, 2.13175106048584, 2.2863686084747314, 2.440986156463623, 2.5956037044525146, 2.7502212524414062, 2.904839038848877, 3.0594565868377686, 3.21407413482666, 3.368691921234131, 3.5233094692230225, 3.677927017211914, 3.8325445652008057, 3.9871621131896973, 4.141779899597168, 4.2963972091674805, 4.451014995574951, 4.605632781982422, 4.760250091552734, 4.914867877960205, 5.069485664367676, 5.224102973937988, 5.378720760345459, 5.53333854675293, 5.687955856323242, 5.842573642730713, 5.997191429138184, 6.151808738708496]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 8.0, 11.0, 13.0, 18.0, 14.0, 31.0, 49.0, 80.0, 83.0, 120.0, 183.0, 265.0, 444.0, 748.0, 1257.0, 2416.0, 5437.0, 15370.0, 52692.0, 270411.0, 1497725.0, 1857064.0, 384364.0, 72675.0, 19646.0, 6722.0, 2814.0, 1387.0, 773.0, 494.0, 286.0, 203.0, 122.0, 98.0, 69.0, 58.0, 34.0, 30.0, 21.0, 12.0, 8.0, 4.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.16008567810058594, -0.15476608276367188, -0.1494464874267578, -0.14412689208984375, -0.1388072967529297, -0.13348770141601562, -0.12816810607910156, -0.1228485107421875, -0.11752891540527344, -0.11220932006835938, -0.10688972473144531, -0.10157012939453125, -0.09625053405761719, -0.09093093872070312, -0.08561134338378906, -0.080291748046875, -0.07497215270996094, -0.06965255737304688, -0.06433296203613281, -0.05901336669921875, -0.05369377136230469, -0.048374176025390625, -0.04305458068847656, -0.0377349853515625, -0.03241539001464844, -0.027095794677734375, -0.021776199340820312, -0.01645660400390625, -0.011137008666992188, -0.005817413330078125, -0.0004978179931640625, 0.00482177734375, 0.010141372680664062, 0.015460968017578125, 0.020780563354492188, 0.02610015869140625, 0.03141975402832031, 0.036739349365234375, 0.04205894470214844, 0.0473785400390625, 0.05269813537597656, 0.058017730712890625, 0.06333732604980469, 0.06865692138671875, 0.07397651672363281, 0.07929611206054688, 0.08461570739746094, 0.089935302734375, 0.09525489807128906, 0.10057449340820312, 0.10589408874511719, 0.11121368408203125, 0.11653327941894531, 0.12185287475585938, 0.12717247009277344, 0.1324920654296875, 0.13781166076660156, 0.14313125610351562, 0.1484508514404297, 0.15377044677734375, 0.1590900421142578, 0.16440963745117188, 0.16972923278808594, 0.175048828125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 11.0, 7.0, 10.0, 7.0, 17.0, 15.0, 19.0, 25.0, 27.0, 29.0, 49.0, 39.0, 55.0, 59.0, 53.0, 73.0, 71.0, 42.0, 63.0, 65.0, 47.0, 42.0, 42.0, 26.0, 20.0, 16.0, 18.0, 12.0, 14.0, 8.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18310546875, -0.17754554748535156, -0.17198562622070312, -0.1664257049560547, -0.16086578369140625, -0.1553058624267578, -0.14974594116210938, -0.14418601989746094, -0.1386260986328125, -0.13306617736816406, -0.12750625610351562, -0.12194633483886719, -0.11638641357421875, -0.11082649230957031, -0.10526657104492188, -0.09970664978027344, -0.094146728515625, -0.08858680725097656, -0.08302688598632812, -0.07746696472167969, -0.07190704345703125, -0.06634712219238281, -0.060787200927734375, -0.05522727966308594, -0.0496673583984375, -0.04410743713378906, -0.038547515869140625, -0.03298759460449219, -0.02742767333984375, -0.021867752075195312, -0.016307830810546875, -0.010747909545898438, -0.00518798828125, 0.0003719329833984375, 0.005931854248046875, 0.011491775512695312, 0.01705169677734375, 0.022611618041992188, 0.028171539306640625, 0.03373146057128906, 0.0392913818359375, 0.04485130310058594, 0.050411224365234375, 0.05597114562988281, 0.06153106689453125, 0.06709098815917969, 0.07265090942382812, 0.07821083068847656, 0.083770751953125, 0.08933067321777344, 0.09489059448242188, 0.10045051574707031, 0.10601043701171875, 0.11157035827636719, 0.11713027954101562, 0.12269020080566406, 0.1282501220703125, 0.13381004333496094, 0.13936996459960938, 0.1449298858642578, 0.15048980712890625, 0.1560497283935547, 0.16160964965820312, 0.16716957092285156, 0.1727294921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 16.0, 28.0, 62.0, 106.0, 356.0, 1295.0, 49371.0, 4138407.0, 3557.0, 709.0, 205.0, 80.0, 41.0, 23.0, 7.0, 8.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9697265625, -1.913787841796875, -1.85784912109375, -1.801910400390625, -1.7459716796875, -1.690032958984375, -1.63409423828125, -1.578155517578125, -1.522216796875, -1.466278076171875, -1.41033935546875, -1.354400634765625, -1.2984619140625, -1.242523193359375, -1.18658447265625, -1.130645751953125, -1.07470703125, -1.018768310546875, -0.96282958984375, -0.906890869140625, -0.8509521484375, -0.795013427734375, -0.73907470703125, -0.683135986328125, -0.627197265625, -0.571258544921875, -0.51531982421875, -0.459381103515625, -0.4034423828125, -0.347503662109375, -0.29156494140625, -0.235626220703125, -0.1796875, -0.123748779296875, -0.06781005859375, -0.011871337890625, 0.0440673828125, 0.100006103515625, 0.15594482421875, 0.211883544921875, 0.267822265625, 0.323760986328125, 0.37969970703125, 0.435638427734375, 0.4915771484375, 0.547515869140625, 0.60345458984375, 0.659393310546875, 0.71533203125, 0.771270751953125, 0.82720947265625, 0.883148193359375, 0.9390869140625, 0.995025634765625, 1.05096435546875, 1.106903076171875, 1.162841796875, 1.218780517578125, 1.27471923828125, 1.330657958984375, 1.3865966796875, 1.442535400390625, 1.49847412109375, 1.554412841796875, 1.6103515625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 10.0, 25.0, 35.0, 104.0, 297.0, 942.0, 1667.0, 641.0, 195.0, 82.0, 33.0, 15.0, 13.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.499267578125, -0.4667930603027344, -0.43431854248046875, -0.4018440246582031, -0.3693695068359375, -0.3368949890136719, -0.30442047119140625, -0.2719459533691406, -0.239471435546875, -0.20699691772460938, -0.17452239990234375, -0.14204788208007812, -0.1095733642578125, -0.07709884643554688, -0.04462432861328125, -0.012149810791015625, 0.02032470703125, 0.052799224853515625, 0.08527374267578125, 0.11774826049804688, 0.1502227783203125, 0.18269729614257812, 0.21517181396484375, 0.24764633178710938, 0.280120849609375, 0.3125953674316406, 0.34506988525390625, 0.3775444030761719, 0.4100189208984375, 0.4424934387207031, 0.47496795654296875, 0.5074424743652344, 0.5399169921875, 0.5723915100097656, 0.6048660278320312, 0.6373405456542969, 0.6698150634765625, 0.7022895812988281, 0.7347640991210938, 0.7672386169433594, 0.799713134765625, 0.8321876525878906, 0.8646621704101562, 0.8971366882324219, 0.9296112060546875, 0.9620857238769531, 0.9945602416992188, 1.0270347595214844, 1.05950927734375, 1.0919837951660156, 1.1244583129882812, 1.1569328308105469, 1.1894073486328125, 1.2218818664550781, 1.2543563842773438, 1.2868309020996094, 1.319305419921875, 1.3517799377441406, 1.3842544555664062, 1.4167289733886719, 1.4492034912109375, 1.4816780090332031, 1.5141525268554688, 1.5466270446777344, 1.5791015625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 11.0, 22.0, 38.0, 89.0, 168.0, 305.0, 192.0, 88.0, 35.0, 12.0, 10.0, 8.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5666961669921875, -3.3871774673461914, -3.2076590061187744, -3.0281405448913574, -2.8486218452453613, -2.6691031455993652, -2.4895846843719482, -2.3100662231445312, -2.130547523498535, -1.9510289430618286, -1.771510362625122, -1.5919917821884155, -1.412473201751709, -1.2329546213150024, -1.053436040878296, -0.8739174604415894, -0.6943988800048828, -0.5148802995681763, -0.3353617191314697, -0.15584313869476318, 0.02367544174194336, 0.2031940221786499, 0.38271260261535645, 0.562231183052063, 0.7417497634887695, 0.9212683439254761, 1.1007869243621826, 1.2803055047988892, 1.4598240852355957, 1.6393426656723022, 1.8188612461090088, 1.9983798265457153, 2.1778979301452637, 2.3574166297912598, 2.5369350910186768, 2.7164535522460938, 2.89597225189209, 3.075490951538086, 3.255009412765503, 3.43452787399292, 3.614046573638916, 3.793565273284912, 3.973083734512329, 4.152602195739746, 4.332120895385742, 4.511639595031738, 4.691158294677734, 4.870676517486572, 5.050195217132568, 5.2297139167785645, 5.409232139587402, 5.588750839233398, 5.7682695388793945, 5.947788238525391, 6.127306938171387, 6.306825160980225, 6.486343860626221, 6.665862560272217, 6.845380783081055, 7.024899482727051, 7.204418182373047, 7.383936882019043, 7.563455581665039, 7.742973804473877, 7.922492504119873]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 8.0, 5.0, 8.0, 12.0, 16.0, 16.0, 27.0, 39.0, 44.0, 51.0, 61.0, 63.0, 92.0, 83.0, 84.0, 83.0, 66.0, 53.0, 49.0, 32.0, 30.0, 18.0, 11.0, 10.0, 4.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.638813018798828, -4.514854907989502, -4.390896797180176, -4.26693868637085, -4.142980575561523, -4.0190229415893555, -3.89506459236145, -3.771106481552124, -3.647148609161377, -3.523190498352051, -3.3992323875427246, -3.2752742767333984, -3.1513164043426514, -3.027358293533325, -2.903400182723999, -2.779442071914673, -2.6554839611053467, -2.5315258502960205, -2.4075677394866943, -2.2836098670959473, -2.159651756286621, -2.035693645477295, -1.9117355346679688, -1.7877774238586426, -1.663819432258606, -1.5398613214492798, -1.4159033298492432, -1.291945219039917, -1.1679871082305908, -1.0440291166305542, -0.920071005821228, -0.7961129546165466, -0.6721546649932861, -0.5481966137886047, -0.42423853278160095, -0.30028045177459717, -0.17632240056991577, -0.052364349365234375, 0.0715937614440918, 0.1955518126487732, 0.3195098638534546, 0.443467915058136, 0.5674259662628174, 0.6913840770721436, 0.815342128276825, 0.9393001794815063, 1.0632582902908325, 1.1872162818908691, 1.3111743927001953, 1.4351325035095215, 1.559090495109558, 1.6830486059188843, 1.807006597518921, 1.930964708328247, 2.0549228191375732, 2.1788809299468994, 2.3028388023376465, 2.4267969131469727, 2.550755023956299, 2.674713134765625, 2.798671007156372, 2.9226291179656982, 3.0465872287750244, 3.1705453395843506, 3.2945034503936768]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 4.0, 21.0, 25.0, 37.0, 78.0, 115.0, 197.0, 381.0, 949.0, 2404.0, 9362.0, 62802.0, 845566.0, 108214.0, 13041.0, 3164.0, 1161.0, 477.0, 218.0, 132.0, 74.0, 42.0, 20.0, 18.0, 12.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.66796875, -0.650665283203125, -0.63336181640625, -0.616058349609375, -0.5987548828125, -0.581451416015625, -0.56414794921875, -0.546844482421875, -0.529541015625, -0.512237548828125, -0.49493408203125, -0.477630615234375, -0.4603271484375, -0.443023681640625, -0.42572021484375, -0.408416748046875, -0.39111328125, -0.373809814453125, -0.35650634765625, -0.339202880859375, -0.3218994140625, -0.304595947265625, -0.28729248046875, -0.269989013671875, -0.252685546875, -0.235382080078125, -0.21807861328125, -0.200775146484375, -0.1834716796875, -0.166168212890625, -0.14886474609375, -0.131561279296875, -0.1142578125, -0.096954345703125, -0.07965087890625, -0.062347412109375, -0.0450439453125, -0.027740478515625, -0.01043701171875, 0.006866455078125, 0.024169921875, 0.041473388671875, 0.05877685546875, 0.076080322265625, 0.0933837890625, 0.110687255859375, 0.12799072265625, 0.145294189453125, 0.16259765625, 0.179901123046875, 0.19720458984375, 0.214508056640625, 0.2318115234375, 0.249114990234375, 0.26641845703125, 0.283721923828125, 0.301025390625, 0.318328857421875, 0.33563232421875, 0.352935791015625, 0.3702392578125, 0.387542724609375, 0.40484619140625, 0.422149658203125, 0.439453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 6.0, 3.0, 7.0, 7.0, 13.0, 15.0, 32.0, 34.0, 59.0, 58.0, 66.0, 93.0, 106.0, 108.0, 90.0, 85.0, 63.0, 52.0, 31.0, 27.0, 19.0, 9.0, 4.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.433837890625, -0.42322349548339844, -0.4126091003417969, -0.4019947052001953, -0.39138031005859375, -0.3807659149169922, -0.3701515197753906, -0.35953712463378906, -0.3489227294921875, -0.33830833435058594, -0.3276939392089844, -0.3170795440673828, -0.30646514892578125, -0.2958507537841797, -0.2852363586425781, -0.27462196350097656, -0.264007568359375, -0.25339317321777344, -0.24277877807617188, -0.2321643829345703, -0.22154998779296875, -0.2109355926513672, -0.20032119750976562, -0.18970680236816406, -0.1790924072265625, -0.16847801208496094, -0.15786361694335938, -0.1472492218017578, -0.13663482666015625, -0.1260204315185547, -0.11540603637695312, -0.10479164123535156, -0.09417724609375, -0.08356285095214844, -0.07294845581054688, -0.06233406066894531, -0.05171966552734375, -0.04110527038574219, -0.030490875244140625, -0.019876480102539062, -0.0092620849609375, 0.0013523101806640625, 0.011966705322265625, 0.022581100463867188, 0.03319549560546875, 0.04380989074707031, 0.054424285888671875, 0.06503868103027344, 0.075653076171875, 0.08626747131347656, 0.09688186645507812, 0.10749626159667969, 0.11811065673828125, 0.1287250518798828, 0.13933944702148438, 0.14995384216308594, 0.1605682373046875, 0.17118263244628906, 0.18179702758789062, 0.1924114227294922, 0.20302581787109375, 0.2136402130126953, 0.22425460815429688, 0.23486900329589844, 0.2454833984375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 3.0, 5.0, 8.0, 8.0, 7.0, 12.0, 12.0, 28.0, 34.0, 43.0, 58.0, 81.0, 103.0, 190.0, 319.0, 655.0, 1417.0, 4844.0, 28854.0, 883789.0, 112834.0, 10614.0, 2517.0, 901.0, 440.0, 254.0, 159.0, 112.0, 79.0, 48.0, 32.0, 27.0, 20.0, 12.0, 14.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52978515625, -0.5140876770019531, -0.49839019775390625, -0.4826927185058594, -0.4669952392578125, -0.4512977600097656, -0.43560028076171875, -0.4199028015136719, -0.404205322265625, -0.3885078430175781, -0.37281036376953125, -0.3571128845214844, -0.3414154052734375, -0.3257179260253906, -0.31002044677734375, -0.2943229675292969, -0.27862548828125, -0.2629280090332031, -0.24723052978515625, -0.23153305053710938, -0.2158355712890625, -0.20013809204101562, -0.18444061279296875, -0.16874313354492188, -0.153045654296875, -0.13734817504882812, -0.12165069580078125, -0.10595321655273438, -0.0902557373046875, -0.07455825805664062, -0.05886077880859375, -0.043163299560546875, -0.0274658203125, -0.011768341064453125, 0.00392913818359375, 0.019626617431640625, 0.0353240966796875, 0.051021575927734375, 0.06671905517578125, 0.08241653442382812, 0.098114013671875, 0.11381149291992188, 0.12950897216796875, 0.14520645141601562, 0.1609039306640625, 0.17660140991210938, 0.19229888916015625, 0.20799636840820312, 0.22369384765625, 0.23939132690429688, 0.25508880615234375, 0.2707862854003906, 0.2864837646484375, 0.3021812438964844, 0.31787872314453125, 0.3335762023925781, 0.349273681640625, 0.3649711608886719, 0.38066864013671875, 0.3963661193847656, 0.4120635986328125, 0.4277610778808594, 0.44345855712890625, 0.4591560363769531, 0.474853515625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 10.0, 6.0, 12.0, 12.0, 18.0, 15.0, 26.0, 37.0, 39.0, 37.0, 62.0, 78.0, 82.0, 89.0, 81.0, 84.0, 53.0, 50.0, 40.0, 31.0, 36.0, 23.0, 24.0, 6.0, 11.0, 8.0, 5.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.15234375, -1.1188507080078125, -1.085357666015625, -1.0518646240234375, -1.01837158203125, -0.9848785400390625, -0.951385498046875, -0.9178924560546875, -0.8843994140625, -0.8509063720703125, -0.817413330078125, -0.7839202880859375, -0.75042724609375, -0.7169342041015625, -0.683441162109375, -0.6499481201171875, -0.616455078125, -0.5829620361328125, -0.549468994140625, -0.5159759521484375, -0.48248291015625, -0.4489898681640625, -0.415496826171875, -0.3820037841796875, -0.3485107421875, -0.3150177001953125, -0.281524658203125, -0.2480316162109375, -0.21453857421875, -0.1810455322265625, -0.147552490234375, -0.1140594482421875, -0.08056640625, -0.0470733642578125, -0.013580322265625, 0.0199127197265625, 0.05340576171875, 0.0868988037109375, 0.120391845703125, 0.1538848876953125, 0.1873779296875, 0.2208709716796875, 0.254364013671875, 0.2878570556640625, 0.32135009765625, 0.3548431396484375, 0.388336181640625, 0.4218292236328125, 0.455322265625, 0.4888153076171875, 0.522308349609375, 0.5558013916015625, 0.58929443359375, 0.6227874755859375, 0.656280517578125, 0.6897735595703125, 0.7232666015625, 0.7567596435546875, 0.790252685546875, 0.8237457275390625, 0.85723876953125, 0.8907318115234375, 0.924224853515625, 0.9577178955078125, 0.9912109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 9.0, 11.0, 2.0, 13.0, 16.0, 25.0, 21.0, 33.0, 41.0, 58.0, 101.0, 188.0, 291.0, 512.0, 1081.0, 2507.0, 7305.0, 63856.0, 945748.0, 18811.0, 4304.0, 1734.0, 807.0, 384.0, 239.0, 142.0, 85.0, 66.0, 45.0, 20.0, 26.0, 14.0, 12.0, 4.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.1151123046875, -0.11154651641845703, -0.10798072814941406, -0.1044149398803711, -0.10084915161132812, -0.09728336334228516, -0.09371757507324219, -0.09015178680419922, -0.08658599853515625, -0.08302021026611328, -0.07945442199707031, -0.07588863372802734, -0.07232284545898438, -0.0687570571899414, -0.06519126892089844, -0.06162548065185547, -0.0580596923828125, -0.05449390411376953, -0.05092811584472656, -0.047362327575683594, -0.043796539306640625, -0.040230751037597656, -0.03666496276855469, -0.03309917449951172, -0.02953338623046875, -0.02596759796142578, -0.022401809692382812, -0.018836021423339844, -0.015270233154296875, -0.011704444885253906, -0.008138656616210938, -0.004572868347167969, -0.001007080078125, 0.0025587081909179688, 0.0061244964599609375, 0.009690284729003906, 0.013256072998046875, 0.016821861267089844, 0.020387649536132812, 0.02395343780517578, 0.02751922607421875, 0.03108501434326172, 0.03465080261230469, 0.038216590881347656, 0.041782379150390625, 0.045348167419433594, 0.04891395568847656, 0.05247974395751953, 0.0560455322265625, 0.05961132049560547, 0.06317710876464844, 0.0667428970336914, 0.07030868530273438, 0.07387447357177734, 0.07744026184082031, 0.08100605010986328, 0.08457183837890625, 0.08813762664794922, 0.09170341491699219, 0.09526920318603516, 0.09883499145507812, 0.1024007797241211, 0.10596656799316406, 0.10953235626220703, 0.11309814453125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 8.0, 9.0, 14.0, 20.0, 20.0, 17.0, 21.0, 27.0, 54.0, 57.0, 95.0, 150.0, 128.0, 85.0, 68.0, 52.0, 26.0, 21.0, 21.0, 21.0, 14.0, 14.0, 13.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0001518726348876953, -0.00014724396169185638, -0.00014261528849601746, -0.00013798661530017853, -0.0001333579421043396, -0.00012872926890850067, -0.00012410059571266174, -0.00011947192251682281, -0.00011484324932098389, -0.00011021457612514496, -0.00010558590292930603, -0.0001009572297334671, -9.632855653762817e-05, -9.169988334178925e-05, -8.707121014595032e-05, -8.244253695011139e-05, -7.781386375427246e-05, -7.318519055843353e-05, -6.85565173625946e-05, -6.392784416675568e-05, -5.929917097091675e-05, -5.467049777507782e-05, -5.004182457923889e-05, -4.541315138339996e-05, -4.0784478187561035e-05, -3.615580499172211e-05, -3.152713179588318e-05, -2.689845860004425e-05, -2.2269785404205322e-05, -1.7641112208366394e-05, -1.3012439012527466e-05, -8.383765816688538e-06, -3.7550926208496094e-06, 8.735805749893188e-07, 5.502253770828247e-06, 1.0130926966667175e-05, 1.4759600162506104e-05, 1.9388273358345032e-05, 2.401694655418396e-05, 2.8645619750022888e-05, 3.3274292945861816e-05, 3.7902966141700745e-05, 4.253163933753967e-05, 4.71603125333786e-05, 5.178898572921753e-05, 5.641765892505646e-05, 6.104633212089539e-05, 6.567500531673431e-05, 7.030367851257324e-05, 7.493235170841217e-05, 7.95610249042511e-05, 8.418969810009003e-05, 8.881837129592896e-05, 9.344704449176788e-05, 9.807571768760681e-05, 0.00010270439088344574, 0.00010733306407928467, 0.0001119617372751236, 0.00011659041047096252, 0.00012121908366680145, 0.00012584775686264038, 0.0001304764300584793, 0.00013510510325431824, 0.00013973377645015717, 0.0001443624496459961]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 2.0, 9.0, 13.0, 17.0, 34.0, 35.0, 68.0, 73.0, 121.0, 257.0, 490.0, 1134.0, 3102.0, 13991.0, 822543.0, 191357.0, 10624.0, 2632.0, 990.0, 438.0, 243.0, 148.0, 77.0, 42.0, 36.0, 21.0, 23.0, 10.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05908203125, -0.05688762664794922, -0.05469322204589844, -0.052498817443847656, -0.050304412841796875, -0.048110008239746094, -0.04591560363769531, -0.04372119903564453, -0.04152679443359375, -0.03933238983154297, -0.03713798522949219, -0.034943580627441406, -0.032749176025390625, -0.030554771423339844, -0.028360366821289062, -0.02616596221923828, -0.0239715576171875, -0.02177715301513672, -0.019582748413085938, -0.017388343811035156, -0.015193939208984375, -0.012999534606933594, -0.010805130004882812, -0.008610725402832031, -0.00641632080078125, -0.004221916198730469, -0.0020275115966796875, 0.00016689300537109375, 0.002361297607421875, 0.004555702209472656, 0.0067501068115234375, 0.008944511413574219, 0.011138916015625, 0.013333320617675781, 0.015527725219726562, 0.017722129821777344, 0.019916534423828125, 0.022110939025878906, 0.024305343627929688, 0.02649974822998047, 0.02869415283203125, 0.03088855743408203, 0.03308296203613281, 0.035277366638183594, 0.037471771240234375, 0.039666175842285156, 0.04186058044433594, 0.04405498504638672, 0.0462493896484375, 0.04844379425048828, 0.05063819885253906, 0.052832603454589844, 0.055027008056640625, 0.057221412658691406, 0.05941581726074219, 0.06161022186279297, 0.06380462646484375, 0.06599903106689453, 0.06819343566894531, 0.0703878402709961, 0.07258224487304688, 0.07477664947509766, 0.07697105407714844, 0.07916545867919922, 0.08135986328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 2.0, 7.0, 12.0, 8.0, 13.0, 12.0, 22.0, 57.0, 78.0, 172.0, 260.0, 141.0, 87.0, 52.0, 14.0, 18.0, 15.0, 6.0, 6.0, 9.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.103271484375, -0.09821319580078125, -0.0931549072265625, -0.08809661865234375, -0.083038330078125, -0.07798004150390625, -0.0729217529296875, -0.06786346435546875, -0.06280517578125, -0.05774688720703125, -0.0526885986328125, -0.04763031005859375, -0.042572021484375, -0.03751373291015625, -0.0324554443359375, -0.02739715576171875, -0.0223388671875, -0.01728057861328125, -0.0122222900390625, -0.00716400146484375, -0.002105712890625, 0.00295257568359375, 0.0080108642578125, 0.01306915283203125, 0.01812744140625, 0.02318572998046875, 0.0282440185546875, 0.03330230712890625, 0.038360595703125, 0.04341888427734375, 0.0484771728515625, 0.05353546142578125, 0.05859375, 0.06365203857421875, 0.0687103271484375, 0.07376861572265625, 0.078826904296875, 0.08388519287109375, 0.0889434814453125, 0.09400177001953125, 0.09906005859375, 0.10411834716796875, 0.1091766357421875, 0.11423492431640625, 0.119293212890625, 0.12435150146484375, 0.1294097900390625, 0.13446807861328125, 0.1395263671875, 0.14458465576171875, 0.1496429443359375, 0.15470123291015625, 0.159759521484375, 0.16481781005859375, 0.1698760986328125, 0.17493438720703125, 0.17999267578125, 0.18505096435546875, 0.1901092529296875, 0.19516754150390625, 0.200225830078125, 0.20528411865234375, 0.2103424072265625, 0.21540069580078125, 0.220458984375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 23.0, 39.0, 150.0, 497.0, 159.0, 65.0, 31.0, 14.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5795183181762695, -3.3853201866149902, -3.191122055053711, -2.9969239234924316, -2.8027257919311523, -2.608527660369873, -2.4143295288085938, -2.2201313972473145, -2.025933265686035, -1.8317351341247559, -1.6375370025634766, -1.4433388710021973, -1.249140739440918, -1.0549426078796387, -0.8607443571090698, -0.6665462255477905, -0.4723479747772217, -0.2781498432159424, -0.0839516818523407, 0.11024647951126099, 0.3044446110725403, 0.4986427426338196, 0.6928409337997437, 0.887039065361023, 1.0812371969223022, 1.2754353284835815, 1.4696334600448608, 1.6638317108154297, 1.858029842376709, 2.0522279739379883, 2.2464261054992676, 2.440624237060547, 2.634822368621826, 2.8290205001831055, 3.0232186317443848, 3.217416763305664, 3.4116148948669434, 3.6058130264282227, 3.800011157989502, 3.9942092895507812, 4.1884074211120605, 4.38260555267334, 4.576803684234619, 4.771001815795898, 4.965199947357178, 5.159398078918457, 5.353596210479736, 5.547794342041016, 5.741992950439453, 5.936191082000732, 6.130389213562012, 6.324587345123291, 6.51878547668457, 6.71298360824585, 6.907181739807129, 7.101379871368408, 7.2955780029296875, 7.489776134490967, 7.683974266052246, 7.878172397613525, 8.072370529174805, 8.266569137573242, 8.460766792297363, 8.6549654006958, 8.849163055419922]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 1.0, 0.0, 4.0, 7.0, 7.0, 6.0, 10.0, 15.0, 22.0, 18.0, 24.0, 26.0, 32.0, 68.0, 83.0, 96.0, 73.0, 98.0, 110.0, 80.0, 50.0, 28.0, 25.0, 17.0, 14.0, 11.0, 11.0, 11.0, 5.0, 11.0, 8.0, 10.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.550352096557617, -2.4510185718536377, -2.351685047149658, -2.2523515224456787, -2.153017997741699, -2.0536844730377197, -1.9543509483337402, -1.8550174236297607, -1.7556838989257812, -1.6563503742218018, -1.5570168495178223, -1.4576833248138428, -1.3583498001098633, -1.2590162754058838, -1.1596827507019043, -1.0603492259979248, -0.9610157012939453, -0.8616821765899658, -0.7623486518859863, -0.6630151271820068, -0.5636816024780273, -0.46434807777404785, -0.36501455307006836, -0.26568102836608887, -0.16634750366210938, -0.06701397895812988, 0.03231954574584961, 0.1316530704498291, 0.2309865951538086, 0.3303201198577881, 0.4296536445617676, 0.5289871692657471, 0.6283206939697266, 0.727654218673706, 0.8269877433776855, 0.926321268081665, 1.0256547927856445, 1.124988317489624, 1.2243218421936035, 1.323655366897583, 1.4229888916015625, 1.522322416305542, 1.6216559410095215, 1.720989465713501, 1.8203229904174805, 1.91965651512146, 2.0189900398254395, 2.118323564529419, 2.2176570892333984, 2.316990613937378, 2.4163241386413574, 2.515657663345337, 2.6149911880493164, 2.714324712753296, 2.8136582374572754, 2.912991762161255, 3.0123252868652344, 3.111658811569214, 3.2109923362731934, 3.310325860977173, 3.4096593856811523, 3.508992910385132, 3.6083264350891113, 3.707659959793091, 3.8069934844970703]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 5.0, 13.0, 5.0, 12.0, 10.0, 9.0, 14.0, 13.0, 18.0, 21.0, 27.0, 24.0, 39.0, 52.0, 168.0, 251.0, 50.0, 33.0, 32.0, 33.0, 22.0, 22.0, 14.0, 11.0, 15.0, 7.0, 7.0, 11.0, 7.0, 3.0, 6.0, 4.0, 4.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.144775390625, -0.14012527465820312, -0.13547515869140625, -0.13082504272460938, -0.1261749267578125, -0.12152481079101562, -0.11687469482421875, -0.11222457885742188, -0.107574462890625, -0.10292434692382812, -0.09827423095703125, -0.09362411499023438, -0.0889739990234375, -0.08432388305664062, -0.07967376708984375, -0.07502365112304688, -0.07037353515625, -0.06572341918945312, -0.06107330322265625, -0.056423187255859375, -0.0517730712890625, -0.047122955322265625, -0.04247283935546875, -0.037822723388671875, -0.033172607421875, -0.028522491455078125, -0.02387237548828125, -0.019222259521484375, -0.0145721435546875, -0.009922027587890625, -0.00527191162109375, -0.000621795654296875, 0.0040283203125, 0.008678436279296875, 0.01332855224609375, 0.017978668212890625, 0.0226287841796875, 0.027278900146484375, 0.03192901611328125, 0.036579132080078125, 0.041229248046875, 0.045879364013671875, 0.05052947998046875, 0.055179595947265625, 0.0598297119140625, 0.06447982788085938, 0.06912994384765625, 0.07378005981445312, 0.07843017578125, 0.08308029174804688, 0.08773040771484375, 0.09238052368164062, 0.0970306396484375, 0.10168075561523438, 0.10633087158203125, 0.11098098754882812, 0.115631103515625, 0.12028121948242188, 0.12493133544921875, 0.12958145141601562, 0.1342315673828125, 0.13888168334960938, 0.14353179931640625, 0.14818191528320312, 0.15283203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 11.0, 4.0, 18.0, 12.0, 38.0, 26.0, 20.0, 67.0, 116.0, 373.0, 1676.0, 64031.0, 8319340.0, 2116.0, 385.0, 117.0, 71.0, 56.0, 25.0, 8.0, 22.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0], "bins": [-2.3081440925598145, -2.242325782775879, -2.1765074729919434, -2.110689163208008, -2.0448708534240723, -1.9790524244308472, -1.9132341146469116, -1.847415804862976, -1.781597375869751, -1.7157790660858154, -1.6499607563018799, -1.5841424465179443, -1.5183240175247192, -1.4525057077407837, -1.3866873979568481, -1.3208690881729126, -1.255050778388977, -1.1892324686050415, -1.123414158821106, -1.0575957298278809, -0.9917774200439453, -0.9259591102600098, -0.8601408004760742, -0.7943224906921387, -0.7285041213035583, -0.6626858115196228, -0.5968674421310425, -0.5310491323471069, -0.465230792760849, -0.39941245317459106, -0.3335941433906555, -0.2677758038043976, -0.20195746421813965, -0.1361391246318817, -0.07032079994678497, -0.004502475261688232, 0.0613158643245697, 0.12713420391082764, 0.19295251369476318, 0.2587708532810211, 0.32458919286727905, 0.390407532453537, 0.4562258720397949, 0.5220441818237305, 0.587862491607666, 0.6536808609962463, 0.7194991707801819, 0.7853175401687622, 0.8511358499526978, 0.9169541597366333, 0.9827725291252136, 1.048590898513794, 1.1144092082977295, 1.180227518081665, 1.2460458278656006, 1.3118641376495361, 1.3776824474334717, 1.4435007572174072, 1.5093190670013428, 1.5751373767852783, 1.6409558057785034, 1.706774115562439, 1.7725924253463745, 1.83841073513031, 1.9042291641235352]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 3.0, 8.0, 4.0, 10.0, 6.0, 10.0, 6.0, 6.0, 2.0, 3.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.655138611793518, -1.6143183708190918, -1.573498249053955, -1.5326780080795288, -1.4918577671051025, -1.4510376453399658, -1.4102174043655396, -1.3693971633911133, -1.3285770416259766, -1.2877568006515503, -1.2469366788864136, -1.2061164379119873, -1.165296196937561, -1.1244760751724243, -1.083655834197998, -1.0428357124328613, -1.0020153522491455, -0.961195170879364, -0.9203749299049377, -0.8795547485351562, -0.8387345671653748, -0.7979143857955933, -0.757094144821167, -0.7162739634513855, -0.675453782081604, -0.6346336007118225, -0.5938133597373962, -0.5529931783676147, -0.5121729969978333, -0.47135278582572937, -0.4305325746536255, -0.389712393283844, -0.3488921523094177, -0.30807194113731384, -0.26725175976753235, -0.22643154859542847, -0.18561135232448578, -0.1447911560535431, -0.10397094488143921, -0.06315076351165771, -0.022330552339553833, 0.018489647656679153, 0.05930984765291214, 0.10013005137443542, 0.1409502476453781, 0.1817704439163208, 0.22259065508842468, 0.2634108364582062, 0.30423104763031006, 0.34505125880241394, 0.38587144017219543, 0.4266916513442993, 0.4675118327140808, 0.5083320140838623, 0.5491522550582886, 0.5899724364280701, 0.6307926177978516, 0.6716127991676331, 0.7124330401420593, 0.7532532215118408, 0.7940734028816223, 0.8348935842514038, 0.8757138252258301, 0.9165340065956116, 0.9573542475700378]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 6.0, 2.0, 9.0, 8.0, 11.0, 20.0, 22.0, 26.0, 42.0, 39.0, 80.0, 118.0, 164.0, 306.0, 641.0, 1415.0, 3641.0, 11106.0, 37881.0, 157886.0, 227122.0, 59996.0, 15485.0, 4701.0, 1781.0, 775.0, 369.0, 216.0, 122.0, 72.0, 45.0, 39.0, 37.0, 30.0, 11.0, 8.0, 9.0, 8.0, 4.0, 4.0, 3.0, 5.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.84716796875, -0.8199920654296875, -0.792816162109375, -0.7656402587890625, -0.73846435546875, -0.7112884521484375, -0.684112548828125, -0.6569366455078125, -0.6297607421875, -0.6025848388671875, -0.575408935546875, -0.5482330322265625, -0.52105712890625, -0.4938812255859375, -0.466705322265625, -0.4395294189453125, -0.412353515625, -0.3851776123046875, -0.358001708984375, -0.3308258056640625, -0.30364990234375, -0.2764739990234375, -0.249298095703125, -0.2221221923828125, -0.1949462890625, -0.1677703857421875, -0.140594482421875, -0.1134185791015625, -0.08624267578125, -0.0590667724609375, -0.031890869140625, -0.0047149658203125, 0.0224609375, 0.0496368408203125, 0.076812744140625, 0.1039886474609375, 0.13116455078125, 0.1583404541015625, 0.185516357421875, 0.2126922607421875, 0.2398681640625, 0.2670440673828125, 0.294219970703125, 0.3213958740234375, 0.34857177734375, 0.3757476806640625, 0.402923583984375, 0.4300994873046875, 0.457275390625, 0.4844512939453125, 0.511627197265625, 0.5388031005859375, 0.56597900390625, 0.5931549072265625, 0.620330810546875, 0.6475067138671875, 0.6746826171875, 0.7018585205078125, 0.729034423828125, 0.7562103271484375, 0.78338623046875, 0.8105621337890625, 0.837738037109375, 0.8649139404296875, 0.89208984375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 9.0, 16.0, 15.0, 39.0, 40.0, 61.0, 75.0, 90.0, 116.0, 122.0, 99.0, 80.0, 64.0, 41.0, 50.0, 20.0, 17.0, 12.0, 10.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.300048828125, -0.2902030944824219, -0.28035736083984375, -0.2705116271972656, -0.2606658935546875, -0.2508201599121094, -0.24097442626953125, -0.23112869262695312, -0.221282958984375, -0.21143722534179688, -0.20159149169921875, -0.19174575805664062, -0.1819000244140625, -0.17205429077148438, -0.16220855712890625, -0.15236282348632812, -0.14251708984375, -0.13267135620117188, -0.12282562255859375, -0.11297988891601562, -0.1031341552734375, -0.09328842163085938, -0.08344268798828125, -0.07359695434570312, -0.063751220703125, -0.053905487060546875, -0.04405975341796875, -0.034214019775390625, -0.0243682861328125, -0.014522552490234375, -0.00467681884765625, 0.005168914794921875, 0.0150146484375, 0.024860382080078125, 0.03470611572265625, 0.044551849365234375, 0.0543975830078125, 0.06424331665039062, 0.07408905029296875, 0.08393478393554688, 0.093780517578125, 0.10362625122070312, 0.11347198486328125, 0.12331771850585938, 0.1331634521484375, 0.14300918579101562, 0.15285491943359375, 0.16270065307617188, 0.17254638671875, 0.18239212036132812, 0.19223785400390625, 0.20208358764648438, 0.2119293212890625, 0.22177505493164062, 0.23162078857421875, 0.24146652221679688, 0.251312255859375, 0.2611579895019531, 0.27100372314453125, 0.2808494567871094, 0.2906951904296875, 0.3005409240722656, 0.31038665771484375, 0.3202323913574219, 0.330078125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 6.0, 5.0, 7.0, 30.0, 68.0, 157.0, 120.0, 45.0, 12.0, 8.0, 11.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2807621955871582, -1.2317323684692383, -1.1827025413513184, -1.1336725950241089, -1.084642767906189, -1.035612940788269, -0.9865831136703491, -0.9375532269477844, -0.8885233402252197, -0.8394935131072998, -0.7904636263847351, -0.7414337992668152, -0.6924039125442505, -0.6433740854263306, -0.5943442583084106, -0.545314371585846, -0.496284544467926, -0.4472546875476837, -0.3982248306274414, -0.3491950035095215, -0.3001651167869568, -0.25113528966903687, -0.20210543274879456, -0.15307557582855225, -0.10404571890830994, -0.055015865713357925, -0.005986012518405914, 0.0430438369512558, 0.09207369387149811, 0.14110355079174042, 0.19013339281082153, 0.23916324973106384, 0.28819310665130615, 0.33722296357154846, 0.38625282049179077, 0.4352826476097107, 0.4843125343322754, 0.5333423614501953, 0.5823721885681152, 0.6314020752906799, 0.6804319620132446, 0.7294617891311646, 0.7784916758537292, 0.8275215029716492, 0.8765513896942139, 0.9255812168121338, 0.9746110439300537, 1.0236408710479736, 1.0726706981658936, 1.1217005252838135, 1.1707303524017334, 1.2197602987289429, 1.2687901258468628, 1.3178199529647827, 1.3668497800827026, 1.415879726409912, 1.464909553527832, 1.513939380645752, 1.5629692077636719, 1.6119991540908813, 1.6610289812088013, 1.7100588083267212, 1.7590886354446411, 1.8081185817718506, 1.8571484088897705]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 9.0, 12.0, 32.0, 103.0, 154.0, 81.0, 36.0, 13.0, 7.0, 7.0, 10.0, 3.0, 4.0, 3.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.622973084449768, -1.5557844638824463, -1.4885958433151245, -1.4214072227478027, -1.354218602180481, -1.2870299816131592, -1.219841480255127, -1.1526527404785156, -1.0854642391204834, -1.0182756185531616, -0.9510869979858398, -0.8838983774185181, -0.8167097568511963, -0.7495211362838745, -0.6823325753211975, -0.6151439547538757, -0.5479552745819092, -0.4807666540145874, -0.4135780334472656, -0.34638944268226624, -0.27920082211494446, -0.21201220154762268, -0.1448236107826233, -0.07763499021530151, -0.010446369647979736, 0.056742243468761444, 0.12393085658550262, 0.1911194622516632, 0.258308082818985, 0.32549670338630676, 0.39268529415130615, 0.45987391471862793, 0.5270624160766602, 0.5942510366439819, 0.6614396572113037, 0.7286282777786255, 0.7958168983459473, 0.863005518913269, 0.930194079875946, 0.9973827004432678, 1.0645713806152344, 1.1317600011825562, 1.198948621749878, 1.2661372423171997, 1.3333258628845215, 1.4005144834518433, 1.467703104019165, 1.5348916053771973, 1.602080225944519, 1.6692688465118408, 1.7364574670791626, 1.8036460876464844, 1.8708347082138062, 1.938023328781128, 2.00521183013916, 2.0724005699157715, 2.1395890712738037, 2.206777572631836, 2.2739663124084473, 2.3411548137664795, 2.408343553543091, 2.475532054901123, 2.5427207946777344, 2.6099092960357666, 2.677098035812378]}, "eval/loss": 4.3373589515686035, "eval/wer": 2.4481753272510907, "eval/runtime": 1098.1378, "eval/samples_per_second": 2.406, "eval/steps_per_second": 0.301, "train/train_runtime": 6248.9422, "train/train_samples_per_second": 4.567, "train/train_steps_per_second": 0.143, "train/total_flos": 0.0, "train/train_loss": 4.35051649381227} \ No newline at end of file +{"train/loss": 3.9803, "train/learning_rate": 7.653061224489796e-07, "train/epoch": 1.0, "train/global_step": 892, "_runtime": 7639, "_timestamp": 1646172615, "_step": 894, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 14.0, 45.0, 311.0, 523.0, 99.0, 20.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.67470169067383, -27.166728973388672, -20.65875816345215, -14.150787353515625, -7.642814636230469, -1.1348419189453125, 5.373126983642578, 11.881099700927734, 18.38907241821289, 24.897045135498047, 31.40501594543457, 37.912986755371094, 44.42095947265625, 50.928932189941406, 57.4369010925293, 63.94487380981445, 70.45285034179688, 76.96082305908203, 83.46879577636719, 89.97676086425781, 96.4847412109375, 102.99270629882812, 109.50067901611328, 116.00865173339844, 122.51661682128906, 129.0245819091797, 135.53256225585938, 142.04052734375, 148.5485076904297, 155.0564727783203, 161.564453125, 168.07241821289062, 174.58038330078125, 181.08834838867188, 187.59632873535156, 194.1042938232422, 200.61227416992188, 207.1202392578125, 213.62820434570312, 220.1361846923828, 226.6441650390625, 233.15213012695312, 239.6601104736328, 246.16807556152344, 252.67605590820312, 259.18402099609375, 265.6919860839844, 272.199951171875, 278.70794677734375, 285.2159118652344, 291.723876953125, 298.23187255859375, 304.7398376464844, 311.247802734375, 317.7557678222656, 324.26373291015625, 330.7716979980469, 337.2796630859375, 343.7876281738281, 350.2956237792969, 356.8035888671875, 363.3115539550781, 369.81951904296875, 376.3275146484375, 382.8354797363281]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 7.0, 3.0, 5.0, 4.0, 6.0, 8.0, 11.0, 11.0, 6.0, 17.0, 11.0, 17.0, 24.0, 19.0, 25.0, 20.0, 35.0, 35.0, 34.0, 50.0, 50.0, 57.0, 63.0, 77.0, 57.0, 44.0, 38.0, 38.0, 39.0, 23.0, 33.0, 23.0, 21.0, 16.0, 10.0, 12.0, 15.0, 11.0, 4.0, 8.0, 5.0, 8.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-103.06948852539062, -100.24678039550781, -97.42407989501953, -94.60137176513672, -91.77867126464844, -88.95596313476562, -86.13325500488281, -83.310546875, -80.48784637451172, -77.6651382446289, -74.84243774414062, -72.01972961425781, -69.197021484375, -66.37432098388672, -63.551612854003906, -60.72890853881836, -57.90620422363281, -55.083499908447266, -52.26079559326172, -49.438087463378906, -46.61538314819336, -43.79267883300781, -40.969970703125, -38.14726638793945, -35.324562072753906, -32.50185775756836, -29.67915153503418, -26.8564453125, -24.033740997314453, -21.211036682128906, -18.388330459594727, -15.565624237060547, -12.742919921875, -9.920214653015137, -7.097509384155273, -4.27480411529541, -1.4520988464355469, 1.3706064224243164, 4.19331169128418, 7.016017913818359, 9.838722229003906, 12.66142749786377, 15.484132766723633, 18.306838989257812, 21.12954330444336, 23.952247619628906, 26.774953842163086, 29.597660064697266, 32.42036437988281, 35.24306869506836, 38.065773010253906, 40.88848114013672, 43.711185455322266, 46.53388977050781, 49.356597900390625, 52.17930221557617, 55.00200653076172, 57.824710845947266, 60.64741516113281, 63.470123291015625, 66.29283142089844, 69.11553192138672, 71.93824005126953, 74.76094055175781, 77.58364868164062]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 5.0, 7.0, 9.0, 9.0, 14.0, 11.0, 10.0, 17.0, 18.0, 29.0, 22.0, 24.0, 28.0, 38.0, 33.0, 45.0, 41.0, 62.0, 65.0, 55.0, 62.0, 50.0, 37.0, 45.0, 35.0, 30.0, 31.0, 17.0, 17.0, 24.0, 15.0, 20.0, 7.0, 12.0, 9.0, 6.0, 6.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-4.01171875, -3.9049072265625, -3.798095703125, -3.6912841796875, -3.58447265625, -3.4776611328125, -3.370849609375, -3.2640380859375, -3.1572265625, -3.0504150390625, -2.943603515625, -2.8367919921875, -2.72998046875, -2.6231689453125, -2.516357421875, -2.4095458984375, -2.302734375, -2.1959228515625, -2.089111328125, -1.9822998046875, -1.87548828125, -1.7686767578125, -1.661865234375, -1.5550537109375, -1.4482421875, -1.3414306640625, -1.234619140625, -1.1278076171875, -1.02099609375, -0.9141845703125, -0.807373046875, -0.7005615234375, -0.59375, -0.4869384765625, -0.380126953125, -0.2733154296875, -0.16650390625, -0.0596923828125, 0.047119140625, 0.1539306640625, 0.2607421875, 0.3675537109375, 0.474365234375, 0.5811767578125, 0.68798828125, 0.7947998046875, 0.901611328125, 1.0084228515625, 1.115234375, 1.2220458984375, 1.328857421875, 1.4356689453125, 1.54248046875, 1.6492919921875, 1.756103515625, 1.8629150390625, 1.9697265625, 2.0765380859375, 2.183349609375, 2.2901611328125, 2.39697265625, 2.5037841796875, 2.610595703125, 2.7174072265625, 2.82421875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 5.0, 5.0, 5.0, 9.0, 7.0, 21.0, 17.0, 31.0, 25.0, 43.0, 47.0, 79.0, 80.0, 117.0, 204.0, 272.0, 393.0, 616.0, 1065.0, 1927.0, 3802.0, 8734.0, 22726.0, 90580.0, 3263722.0, 728831.0, 45439.0, 14006.0, 5592.0, 2468.0, 1351.0, 716.0, 447.0, 294.0, 176.0, 110.0, 92.0, 62.0, 40.0, 29.0, 31.0, 18.0, 11.0, 14.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0], "bins": [-23.59375, -22.969482421875, -22.34521484375, -21.720947265625, -21.0966796875, -20.472412109375, -19.84814453125, -19.223876953125, -18.599609375, -17.975341796875, -17.35107421875, -16.726806640625, -16.1025390625, -15.478271484375, -14.85400390625, -14.229736328125, -13.60546875, -12.981201171875, -12.35693359375, -11.732666015625, -11.1083984375, -10.484130859375, -9.85986328125, -9.235595703125, -8.611328125, -7.987060546875, -7.36279296875, -6.738525390625, -6.1142578125, -5.489990234375, -4.86572265625, -4.241455078125, -3.6171875, -2.992919921875, -2.36865234375, -1.744384765625, -1.1201171875, -0.495849609375, 0.12841796875, 0.752685546875, 1.376953125, 2.001220703125, 2.62548828125, 3.249755859375, 3.8740234375, 4.498291015625, 5.12255859375, 5.746826171875, 6.37109375, 6.995361328125, 7.61962890625, 8.243896484375, 8.8681640625, 9.492431640625, 10.11669921875, 10.740966796875, 11.365234375, 11.989501953125, 12.61376953125, 13.238037109375, 13.8623046875, 14.486572265625, 15.11083984375, 15.735107421875, 16.359375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 12.0, 3.0, 11.0, 10.0, 10.0, 7.0, 26.0, 22.0, 48.0, 56.0, 68.0, 119.0, 185.0, 340.0, 615.0, 920.0, 646.0, 327.0, 211.0, 116.0, 98.0, 67.0, 46.0, 27.0, 28.0, 18.0, 15.0, 10.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.640625, -15.1103515625, -14.580078125, -14.0498046875, -13.51953125, -12.9892578125, -12.458984375, -11.9287109375, -11.3984375, -10.8681640625, -10.337890625, -9.8076171875, -9.27734375, -8.7470703125, -8.216796875, -7.6865234375, -7.15625, -6.6259765625, -6.095703125, -5.5654296875, -5.03515625, -4.5048828125, -3.974609375, -3.4443359375, -2.9140625, -2.3837890625, -1.853515625, -1.3232421875, -0.79296875, -0.2626953125, 0.267578125, 0.7978515625, 1.328125, 1.8583984375, 2.388671875, 2.9189453125, 3.44921875, 3.9794921875, 4.509765625, 5.0400390625, 5.5703125, 6.1005859375, 6.630859375, 7.1611328125, 7.69140625, 8.2216796875, 8.751953125, 9.2822265625, 9.8125, 10.3427734375, 10.873046875, 11.4033203125, 11.93359375, 12.4638671875, 12.994140625, 13.5244140625, 14.0546875, 14.5849609375, 15.115234375, 15.6455078125, 16.17578125, 16.7060546875, 17.236328125, 17.7666015625, 18.296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 7.0, 14.0, 14.0, 20.0, 20.0, 30.0, 28.0, 46.0, 75.0, 104.0, 175.0, 263.0, 450.0, 1315.0, 5967.0, 56379.0, 3534433.0, 566313.0, 23347.0, 3269.0, 905.0, 376.0, 242.0, 145.0, 90.0, 70.0, 48.0, 41.0, 29.0, 26.0, 7.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.90625, -45.33349609375, -43.7607421875, -42.18798828125, -40.615234375, -39.04248046875, -37.4697265625, -35.89697265625, -34.32421875, -32.75146484375, -31.1787109375, -29.60595703125, -28.033203125, -26.46044921875, -24.8876953125, -23.31494140625, -21.7421875, -20.16943359375, -18.5966796875, -17.02392578125, -15.451171875, -13.87841796875, -12.3056640625, -10.73291015625, -9.16015625, -7.58740234375, -6.0146484375, -4.44189453125, -2.869140625, -1.29638671875, 0.2763671875, 1.84912109375, 3.421875, 4.99462890625, 6.5673828125, 8.14013671875, 9.712890625, 11.28564453125, 12.8583984375, 14.43115234375, 16.00390625, 17.57666015625, 19.1494140625, 20.72216796875, 22.294921875, 23.86767578125, 25.4404296875, 27.01318359375, 28.5859375, 30.15869140625, 31.7314453125, 33.30419921875, 34.876953125, 36.44970703125, 38.0224609375, 39.59521484375, 41.16796875, 42.74072265625, 44.3134765625, 45.88623046875, 47.458984375, 49.03173828125, 50.6044921875, 52.17724609375, 53.75]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 9.0, 21.0, 104.0, 483.0, 332.0, 53.0, 13.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.2529296875, -266.1778869628906, -260.10284423828125, -254.02780151367188, -247.9527587890625, -241.87771606445312, -235.80267333984375, -229.72763061523438, -223.652587890625, -217.57754516601562, -211.50250244140625, -205.42745971679688, -199.3524169921875, -193.27737426757812, -187.20233154296875, -181.12728881835938, -175.05223083496094, -168.97718811035156, -162.9021453857422, -156.8271026611328, -150.75205993652344, -144.67701721191406, -138.60195922851562, -132.52691650390625, -126.4518814086914, -120.37683868408203, -114.30179595947266, -108.22674560546875, -102.15170288085938, -96.07666015625, -90.00161743164062, -83.92657470703125, -77.85153198242188, -71.7764892578125, -65.70144653320312, -59.626399993896484, -53.55135726928711, -47.476314544677734, -41.401268005371094, -35.32622528076172, -29.251182556152344, -23.17613983154297, -17.10109519958496, -11.026050567626953, -4.951007843017578, 1.1240348815917969, 7.1990814208984375, 13.274124145507812, 19.349166870117188, 25.424209594726562, 31.49925422668457, 37.57429885864258, 43.64934158325195, 49.72438430786133, 55.79943084716797, 61.874473571777344, 67.94951629638672, 74.0245590209961, 80.09960174560547, 86.17465209960938, 92.24969482421875, 98.32473754882812, 104.3997802734375, 110.47482299804688, 116.54986572265625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 2.0, 9.0, 9.0, 14.0, 15.0, 16.0, 13.0, 29.0, 26.0, 23.0, 25.0, 31.0, 28.0, 37.0, 28.0, 40.0, 34.0, 44.0, 59.0, 58.0, 45.0, 36.0, 36.0, 42.0, 28.0, 40.0, 28.0, 32.0, 34.0, 22.0, 19.0, 21.0, 12.0, 11.0, 13.0, 8.0, 3.0, 9.0, 4.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-48.5851936340332, -47.16765213012695, -45.7501106262207, -44.33256912231445, -42.9150276184082, -41.49748611450195, -40.0799446105957, -38.66240310668945, -37.2448616027832, -35.82732009887695, -34.4097785949707, -32.99223709106445, -31.574695587158203, -30.157154083251953, -28.739612579345703, -27.322071075439453, -25.904531478881836, -24.486989974975586, -23.069448471069336, -21.651906967163086, -20.234365463256836, -18.816823959350586, -17.39928436279297, -15.981741905212402, -14.564200401306152, -13.146658897399902, -11.729117393493652, -10.311576843261719, -8.894035339355469, -7.4764933586120605, -6.058952331542969, -4.641410827636719, -3.2238693237304688, -1.8063279390335083, -0.38878655433654785, 1.028754711151123, 2.446296215057373, 3.863837718963623, 5.281378746032715, 6.698920249938965, 8.116461753845215, 9.534003257751465, 10.951544761657715, 12.369085311889648, 13.786626815795898, 15.204168319702148, 16.6217098236084, 18.03925132751465, 19.4567928314209, 20.87433433532715, 22.2918758392334, 23.70941734313965, 25.1269588470459, 26.54450035095215, 27.962039947509766, 29.379581451416016, 30.797122955322266, 32.214664459228516, 33.632205963134766, 35.049747467041016, 36.467288970947266, 37.884830474853516, 39.302371978759766, 40.719913482666016, 42.137454986572266]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 9.0, 3.0, 9.0, 7.0, 9.0, 12.0, 14.0, 11.0, 22.0, 23.0, 23.0, 35.0, 31.0, 48.0, 41.0, 66.0, 49.0, 41.0, 44.0, 60.0, 57.0, 50.0, 49.0, 45.0, 33.0, 33.0, 37.0, 21.0, 27.0, 12.0, 14.0, 12.0, 10.0, 9.0, 10.0, 2.0, 4.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.3046875, -4.186553955078125, -4.06842041015625, -3.950286865234375, -3.8321533203125, -3.714019775390625, -3.59588623046875, -3.477752685546875, -3.359619140625, -3.241485595703125, -3.12335205078125, -3.005218505859375, -2.8870849609375, -2.768951416015625, -2.65081787109375, -2.532684326171875, -2.41455078125, -2.296417236328125, -2.17828369140625, -2.060150146484375, -1.9420166015625, -1.823883056640625, -1.70574951171875, -1.587615966796875, -1.469482421875, -1.351348876953125, -1.23321533203125, -1.115081787109375, -0.9969482421875, -0.878814697265625, -0.76068115234375, -0.642547607421875, -0.5244140625, -0.406280517578125, -0.28814697265625, -0.170013427734375, -0.0518798828125, 0.066253662109375, 0.18438720703125, 0.302520751953125, 0.420654296875, 0.538787841796875, 0.65692138671875, 0.775054931640625, 0.8931884765625, 1.011322021484375, 1.12945556640625, 1.247589111328125, 1.36572265625, 1.483856201171875, 1.60198974609375, 1.720123291015625, 1.8382568359375, 1.956390380859375, 2.07452392578125, 2.192657470703125, 2.310791015625, 2.428924560546875, 2.54705810546875, 2.665191650390625, 2.7833251953125, 2.901458740234375, 3.01959228515625, 3.137725830078125, 3.255859375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 9.0, 7.0, 10.0, 16.0, 26.0, 28.0, 48.0, 75.0, 117.0, 157.0, 211.0, 338.0, 458.0, 631.0, 960.0, 1513.0, 2313.0, 3592.0, 5436.0, 8635.0, 14289.0, 24015.0, 43710.0, 85741.0, 185679.0, 324605.0, 168142.0, 78243.0, 39973.0, 22379.0, 13286.0, 8343.0, 5485.0, 3345.0, 2240.0, 1490.0, 998.0, 623.0, 455.0, 277.0, 205.0, 145.0, 86.0, 60.0, 53.0, 46.0, 18.0, 15.0, 9.0, 6.0, 2.0, 7.0, 4.0, 2.0, 1.0, 2.0], "bins": [-0.1474609375, -0.1430511474609375, -0.138641357421875, -0.1342315673828125, -0.12982177734375, -0.1254119873046875, -0.121002197265625, -0.1165924072265625, -0.1121826171875, -0.1077728271484375, -0.103363037109375, -0.0989532470703125, -0.09454345703125, -0.0901336669921875, -0.085723876953125, -0.0813140869140625, -0.076904296875, -0.0724945068359375, -0.068084716796875, -0.0636749267578125, -0.05926513671875, -0.0548553466796875, -0.050445556640625, -0.0460357666015625, -0.0416259765625, -0.0372161865234375, -0.032806396484375, -0.0283966064453125, -0.02398681640625, -0.0195770263671875, -0.015167236328125, -0.0107574462890625, -0.00634765625, -0.0019378662109375, 0.002471923828125, 0.0068817138671875, 0.01129150390625, 0.0157012939453125, 0.020111083984375, 0.0245208740234375, 0.0289306640625, 0.0333404541015625, 0.037750244140625, 0.0421600341796875, 0.04656982421875, 0.0509796142578125, 0.055389404296875, 0.0597991943359375, 0.064208984375, 0.0686187744140625, 0.073028564453125, 0.0774383544921875, 0.08184814453125, 0.0862579345703125, 0.090667724609375, 0.0950775146484375, 0.0994873046875, 0.1038970947265625, 0.108306884765625, 0.1127166748046875, 0.11712646484375, 0.1215362548828125, 0.125946044921875, 0.1303558349609375, 0.134765625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 5.0, 6.0, 13.0, 10.0, 12.0, 18.0, 14.0, 27.0, 39.0, 30.0, 42.0, 22.0, 36.0, 43.0, 41.0, 39.0, 36.0, 43.0, 1076.0, 50.0, 41.0, 44.0, 38.0, 33.0, 30.0, 30.0, 26.0, 26.0, 19.0, 17.0, 15.0, 21.0, 15.0, 7.0, 11.0, 10.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.138702392578125, -2.06842041015625, -1.998138427734375, -1.9278564453125, -1.857574462890625, -1.78729248046875, -1.717010498046875, -1.646728515625, -1.576446533203125, -1.50616455078125, -1.435882568359375, -1.3656005859375, -1.295318603515625, -1.22503662109375, -1.154754638671875, -1.08447265625, -1.014190673828125, -0.94390869140625, -0.873626708984375, -0.8033447265625, -0.733062744140625, -0.66278076171875, -0.592498779296875, -0.522216796875, -0.451934814453125, -0.38165283203125, -0.311370849609375, -0.2410888671875, -0.170806884765625, -0.10052490234375, -0.030242919921875, 0.0400390625, 0.110321044921875, 0.18060302734375, 0.250885009765625, 0.3211669921875, 0.391448974609375, 0.46173095703125, 0.532012939453125, 0.602294921875, 0.672576904296875, 0.74285888671875, 0.813140869140625, 0.8834228515625, 0.953704833984375, 1.02398681640625, 1.094268798828125, 1.16455078125, 1.234832763671875, 1.30511474609375, 1.375396728515625, 1.4456787109375, 1.515960693359375, 1.58624267578125, 1.656524658203125, 1.726806640625, 1.797088623046875, 1.86737060546875, 1.937652587890625, 2.0079345703125, 2.078216552734375, 2.14849853515625, 2.218780517578125, 2.2890625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 6.0, 9.0, 12.0, 13.0, 20.0, 24.0, 24.0, 48.0, 57.0, 87.0, 138.0, 193.0, 277.0, 402.0, 574.0, 799.0, 1236.0, 1902.0, 2943.0, 4486.0, 7195.0, 11760.0, 19573.0, 33257.0, 57766.0, 104129.0, 199266.0, 1318704.0, 143786.0, 77899.0, 44167.0, 25558.0, 15186.0, 9211.0, 5821.0, 3682.0, 2255.0, 1528.0, 998.0, 668.0, 453.0, 311.0, 221.0, 152.0, 106.0, 63.0, 49.0, 45.0, 22.0, 23.0, 11.0, 4.0, 12.0, 2.0, 6.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.1075439453125, -0.10420989990234375, -0.1008758544921875, -0.09754180908203125, -0.094207763671875, -0.09087371826171875, -0.0875396728515625, -0.08420562744140625, -0.08087158203125, -0.07753753662109375, -0.0742034912109375, -0.07086944580078125, -0.067535400390625, -0.06420135498046875, -0.0608673095703125, -0.05753326416015625, -0.05419921875, -0.05086517333984375, -0.0475311279296875, -0.04419708251953125, -0.040863037109375, -0.03752899169921875, -0.0341949462890625, -0.03086090087890625, -0.02752685546875, -0.02419281005859375, -0.0208587646484375, -0.01752471923828125, -0.014190673828125, -0.01085662841796875, -0.0075225830078125, -0.00418853759765625, -0.0008544921875, 0.00247955322265625, 0.0058135986328125, 0.00914764404296875, 0.012481689453125, 0.01581573486328125, 0.0191497802734375, 0.02248382568359375, 0.02581787109375, 0.02915191650390625, 0.0324859619140625, 0.03582000732421875, 0.039154052734375, 0.04248809814453125, 0.0458221435546875, 0.04915618896484375, 0.052490234375, 0.05582427978515625, 0.0591583251953125, 0.06249237060546875, 0.065826416015625, 0.06916046142578125, 0.0724945068359375, 0.07582855224609375, 0.07916259765625, 0.08249664306640625, 0.0858306884765625, 0.08916473388671875, 0.092498779296875, 0.09583282470703125, 0.0991668701171875, 0.10250091552734375, 0.1058349609375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 2.0, 6.0, 4.0, 12.0, 7.0, 8.0, 11.0, 18.0, 35.0, 38.0, 53.0, 63.0, 75.0, 98.0, 124.0, 99.0, 87.0, 48.0, 46.0, 33.0, 28.0, 26.0, 17.0, 21.0, 10.0, 11.0, 6.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013017654418945312, -0.00012670084834098816, -0.0001232251524925232, -0.00011974945664405823, -0.00011627376079559326, -0.0001127980649471283, -0.00010932236909866333, -0.00010584667325019836, -0.0001023709774017334, -9.889528155326843e-05, -9.541958570480347e-05, -9.19438898563385e-05, -8.846819400787354e-05, -8.499249815940857e-05, -8.15168023109436e-05, -7.804110646247864e-05, -7.456541061401367e-05, -7.10897147655487e-05, -6.761401891708374e-05, -6.413832306861877e-05, -6.066262722015381e-05, -5.718693137168884e-05, -5.371123552322388e-05, -5.023553967475891e-05, -4.6759843826293945e-05, -4.328414797782898e-05, -3.9808452129364014e-05, -3.633275628089905e-05, -3.285706043243408e-05, -2.9381364583969116e-05, -2.590566873550415e-05, -2.2429972887039185e-05, -1.895427703857422e-05, -1.5478581190109253e-05, -1.2002885341644287e-05, -8.527189493179321e-06, -5.0514936447143555e-06, -1.5757977962493896e-06, 1.8998980522155762e-06, 5.375593900680542e-06, 8.851289749145508e-06, 1.2326985597610474e-05, 1.580268144607544e-05, 1.9278377294540405e-05, 2.275407314300537e-05, 2.6229768991470337e-05, 2.9705464839935303e-05, 3.318116068840027e-05, 3.6656856536865234e-05, 4.01325523853302e-05, 4.3608248233795166e-05, 4.708394408226013e-05, 5.05596399307251e-05, 5.4035335779190063e-05, 5.751103162765503e-05, 6.0986727476119995e-05, 6.446242332458496e-05, 6.793811917304993e-05, 7.141381502151489e-05, 7.488951086997986e-05, 7.836520671844482e-05, 8.184090256690979e-05, 8.531659841537476e-05, 8.879229426383972e-05, 9.226799011230469e-05]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 10.0, 8.0, 9.0, 22.0, 20.0, 24.0, 31.0, 47.0, 92.0, 120.0, 156.0, 275.0, 441.0, 3745.0, 1025156.0, 16854.0, 594.0, 293.0, 187.0, 123.0, 83.0, 62.0, 50.0, 41.0, 32.0, 17.0, 13.0, 10.0, 9.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022945404052734375, -0.002228289842605591, -0.002162039279937744, -0.0020957887172698975, -0.0020295381546020508, -0.001963287591934204, -0.0018970370292663574, -0.0018307864665985107, -0.001764535903930664, -0.0016982853412628174, -0.0016320347785949707, -0.001565784215927124, -0.0014995336532592773, -0.0014332830905914307, -0.001367032527923584, -0.0013007819652557373, -0.0012345314025878906, -0.001168280839920044, -0.0011020302772521973, -0.0010357797145843506, -0.0009695291519165039, -0.0009032785892486572, -0.0008370280265808105, -0.0007707774639129639, -0.0007045269012451172, -0.0006382763385772705, -0.0005720257759094238, -0.0005057752132415771, -0.00043952465057373047, -0.0003732740879058838, -0.0003070235252380371, -0.00024077296257019043, -0.00017452239990234375, -0.00010827183723449707, -4.202127456665039e-05, 2.422928810119629e-05, 9.047985076904297e-05, 0.00015673041343688965, 0.00022298097610473633, 0.000289231538772583, 0.0003554821014404297, 0.00042173266410827637, 0.00048798322677612305, 0.0005542337894439697, 0.0006204843521118164, 0.0006867349147796631, 0.0007529854774475098, 0.0008192360401153564, 0.0008854866027832031, 0.0009517371654510498, 0.0010179877281188965, 0.0010842382907867432, 0.0011504888534545898, 0.0012167394161224365, 0.0012829899787902832, 0.0013492405414581299, 0.0014154911041259766, 0.0014817416667938232, 0.00154799222946167, 0.0016142427921295166, 0.0016804933547973633, 0.00174674391746521, 0.0018129944801330566, 0.0018792450428009033, 0.00194549560546875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 48.0, 523.0, 425.0, 22.0], "bins": [-0.0006569771212525666, -0.0006463686586357653, -0.000635760254226625, -0.0006251517916098237, -0.0006145433289930224, -0.0006039348663762212, -0.0005933264037594199, -0.0005827179993502796, -0.0005721095367334783, -0.000561501074116677, -0.0005508926697075367, -0.0005402842070907354, -0.0005296757444739342, -0.0005190672818571329, -0.0005084588192403316, -0.0004978504148311913, -0.00048724195221439004, -0.0004766334895975888, -0.00046602505608461797, -0.00045541662257164717, -0.0004448081599548459, -0.00043419969733804464, -0.00042359126382507384, -0.00041298283031210303, -0.00040237436769530177, -0.0003917659050785005, -0.0003811574715655297, -0.0003705490380525589, -0.00035994057543575764, -0.0003493321128189564, -0.00033872367930598557, -0.00032811524579301476, -0.00031750675407238305, -0.00030689832055941224, -0.000296289857942611, -0.0002856813953258097, -0.0002750729618128389, -0.0002644645282998681, -0.00025385606568306684, -0.0002432476176181808, -0.00023263916955329478, -0.00022203072148840874, -0.0002114222734235227, -0.00020081382535863668, -0.00019020537729375064, -0.0001795969292288646, -0.00016898848116397858, -0.00015838003309909254, -0.0001477715850342065, -0.00013716313696932048, -0.00012655468890443444, -0.00011594624083954841, -0.00010533779277466238, -9.472934470977634e-05, -8.412089664489031e-05, -7.351244858000427e-05, -6.290400051511824e-05, -5.229555245023221e-05, -4.1687104385346174e-05, -3.107865632046014e-05, -2.0470208255574107e-05, -9.861760190688074e-06, 7.466878741979599e-07, 1.1355135939083993e-05, 2.1963582184980623e-05]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 3.0, 8.0, 3.0, 6.0, 3.0, 9.0, 14.0, 14.0, 11.0, 11.0, 11.0, 23.0, 18.0, 36.0, 27.0, 29.0, 22.0, 35.0, 42.0, 28.0, 40.0, 45.0, 40.0, 46.0, 49.0, 40.0, 42.0, 32.0, 39.0, 35.0, 26.0, 28.0, 24.0, 34.0, 18.0, 20.0, 13.0, 16.0, 14.0, 11.0, 10.0, 3.0, 5.0, 11.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.910064697265625e-05, -3.782566636800766e-05, -3.655068576335907e-05, -3.527570515871048e-05, -3.400072455406189e-05, -3.27257439494133e-05, -3.145076334476471e-05, -3.017578274011612e-05, -2.890080213546753e-05, -2.762582153081894e-05, -2.635084092617035e-05, -2.507586032152176e-05, -2.380087971687317e-05, -2.252589911222458e-05, -2.125091850757599e-05, -1.99759379029274e-05, -1.870095729827881e-05, -1.742597669363022e-05, -1.615099608898163e-05, -1.4876015484333038e-05, -1.3601034879684448e-05, -1.2326054275035858e-05, -1.1051073670387268e-05, -9.776093065738678e-06, -8.501112461090088e-06, -7.226131856441498e-06, -5.951151251792908e-06, -4.676170647144318e-06, -3.4011900424957275e-06, -2.1262094378471375e-06, -8.512288331985474e-07, 4.237517714500427e-07, 1.6987323760986328e-06, 2.973712980747223e-06, 4.248693585395813e-06, 5.523674190044403e-06, 6.798654794692993e-06, 8.073635399341583e-06, 9.348616003990173e-06, 1.0623596608638763e-05, 1.1898577213287354e-05, 1.3173557817935944e-05, 1.4448538422584534e-05, 1.5723519027233124e-05, 1.6998499631881714e-05, 1.8273480236530304e-05, 1.9548460841178894e-05, 2.0823441445827484e-05, 2.2098422050476074e-05, 2.3373402655124664e-05, 2.4648383259773254e-05, 2.5923363864421844e-05, 2.7198344469070435e-05, 2.8473325073719025e-05, 2.9748305678367615e-05, 3.1023286283016205e-05, 3.2298266887664795e-05, 3.3573247492313385e-05, 3.4848228096961975e-05, 3.6123208701610565e-05, 3.7398189306259155e-05, 3.8673169910907745e-05, 3.9948150515556335e-05, 4.1223131120204926e-05, 4.2498111724853516e-05]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 9.0, 3.0, 9.0, 7.0, 9.0, 12.0, 14.0, 11.0, 22.0, 23.0, 23.0, 35.0, 31.0, 48.0, 41.0, 66.0, 49.0, 41.0, 44.0, 60.0, 57.0, 50.0, 49.0, 45.0, 33.0, 33.0, 37.0, 21.0, 27.0, 12.0, 14.0, 12.0, 10.0, 9.0, 10.0, 2.0, 4.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.3046875, -4.186553955078125, -4.06842041015625, -3.950286865234375, -3.8321533203125, -3.714019775390625, -3.59588623046875, -3.477752685546875, -3.359619140625, -3.241485595703125, -3.12335205078125, -3.005218505859375, -2.8870849609375, -2.768951416015625, -2.65081787109375, -2.532684326171875, -2.41455078125, -2.296417236328125, -2.17828369140625, -2.060150146484375, -1.9420166015625, -1.823883056640625, -1.70574951171875, -1.587615966796875, -1.469482421875, -1.351348876953125, -1.23321533203125, -1.115081787109375, -0.9969482421875, -0.878814697265625, -0.76068115234375, -0.642547607421875, -0.5244140625, -0.406280517578125, -0.28814697265625, -0.170013427734375, -0.0518798828125, 0.066253662109375, 0.18438720703125, 0.302520751953125, 0.420654296875, 0.538787841796875, 0.65692138671875, 0.775054931640625, 0.8931884765625, 1.011322021484375, 1.12945556640625, 1.247589111328125, 1.36572265625, 1.483856201171875, 1.60198974609375, 1.720123291015625, 1.8382568359375, 1.956390380859375, 2.07452392578125, 2.192657470703125, 2.310791015625, 2.428924560546875, 2.54705810546875, 2.665191650390625, 2.7833251953125, 2.901458740234375, 3.01959228515625, 3.137725830078125, 3.255859375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 8.0, 14.0, 19.0, 29.0, 27.0, 40.0, 80.0, 77.0, 107.0, 149.0, 215.0, 282.0, 418.0, 654.0, 918.0, 1387.0, 2292.0, 3716.0, 6622.0, 13633.0, 34254.0, 136741.0, 618647.0, 158254.0, 37408.0, 14608.0, 6999.0, 3900.0, 2311.0, 1540.0, 975.0, 677.0, 424.0, 324.0, 209.0, 182.0, 116.0, 91.0, 52.0, 43.0, 33.0, 23.0, 10.0, 9.0, 14.0, 2.0, 4.0, 3.0, 0.0, 1.0, 4.0], "bins": [-11.921875, -11.58642578125, -11.2509765625, -10.91552734375, -10.580078125, -10.24462890625, -9.9091796875, -9.57373046875, -9.23828125, -8.90283203125, -8.5673828125, -8.23193359375, -7.896484375, -7.56103515625, -7.2255859375, -6.89013671875, -6.5546875, -6.21923828125, -5.8837890625, -5.54833984375, -5.212890625, -4.87744140625, -4.5419921875, -4.20654296875, -3.87109375, -3.53564453125, -3.2001953125, -2.86474609375, -2.529296875, -2.19384765625, -1.8583984375, -1.52294921875, -1.1875, -0.85205078125, -0.5166015625, -0.18115234375, 0.154296875, 0.48974609375, 0.8251953125, 1.16064453125, 1.49609375, 1.83154296875, 2.1669921875, 2.50244140625, 2.837890625, 3.17333984375, 3.5087890625, 3.84423828125, 4.1796875, 4.51513671875, 4.8505859375, 5.18603515625, 5.521484375, 5.85693359375, 6.1923828125, 6.52783203125, 6.86328125, 7.19873046875, 7.5341796875, 7.86962890625, 8.205078125, 8.54052734375, 8.8759765625, 9.21142578125, 9.546875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 9.0, 6.0, 17.0, 12.0, 13.0, 12.0, 22.0, 24.0, 28.0, 46.0, 33.0, 48.0, 47.0, 64.0, 77.0, 182.0, 1654.0, 262.0, 88.0, 60.0, 49.0, 36.0, 33.0, 32.0, 28.0, 38.0, 18.0, 17.0, 21.0, 18.0, 9.0, 13.0, 6.0, 5.0, 8.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.40625, -13.9903564453125, -13.574462890625, -13.1585693359375, -12.74267578125, -12.3267822265625, -11.910888671875, -11.4949951171875, -11.0791015625, -10.6632080078125, -10.247314453125, -9.8314208984375, -9.41552734375, -8.9996337890625, -8.583740234375, -8.1678466796875, -7.751953125, -7.3360595703125, -6.920166015625, -6.5042724609375, -6.08837890625, -5.6724853515625, -5.256591796875, -4.8406982421875, -4.4248046875, -4.0089111328125, -3.593017578125, -3.1771240234375, -2.76123046875, -2.3453369140625, -1.929443359375, -1.5135498046875, -1.09765625, -0.6817626953125, -0.265869140625, 0.1500244140625, 0.56591796875, 0.9818115234375, 1.397705078125, 1.8135986328125, 2.2294921875, 2.6453857421875, 3.061279296875, 3.4771728515625, 3.89306640625, 4.3089599609375, 4.724853515625, 5.1407470703125, 5.556640625, 5.9725341796875, 6.388427734375, 6.8043212890625, 7.22021484375, 7.6361083984375, 8.052001953125, 8.4678955078125, 8.8837890625, 9.2996826171875, 9.715576171875, 10.1314697265625, 10.54736328125, 10.9632568359375, 11.379150390625, 11.7950439453125, 12.2109375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 8.0, 5.0, 4.0, 3.0, 9.0, 11.0, 15.0, 19.0, 13.0, 19.0, 25.0, 37.0, 37.0, 38.0, 72.0, 127.0, 288.0, 1237.0, 212086.0, 2928476.0, 2353.0, 353.0, 162.0, 72.0, 43.0, 38.0, 40.0, 24.0, 19.0, 13.0, 8.0, 14.0, 10.0, 14.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.1875, -55.2236328125, -53.259765625, -51.2958984375, -49.33203125, -47.3681640625, -45.404296875, -43.4404296875, -41.4765625, -39.5126953125, -37.548828125, -35.5849609375, -33.62109375, -31.6572265625, -29.693359375, -27.7294921875, -25.765625, -23.8017578125, -21.837890625, -19.8740234375, -17.91015625, -15.9462890625, -13.982421875, -12.0185546875, -10.0546875, -8.0908203125, -6.126953125, -4.1630859375, -2.19921875, -0.2353515625, 1.728515625, 3.6923828125, 5.65625, 7.6201171875, 9.583984375, 11.5478515625, 13.51171875, 15.4755859375, 17.439453125, 19.4033203125, 21.3671875, 23.3310546875, 25.294921875, 27.2587890625, 29.22265625, 31.1865234375, 33.150390625, 35.1142578125, 37.078125, 39.0419921875, 41.005859375, 42.9697265625, 44.93359375, 46.8974609375, 48.861328125, 50.8251953125, 52.7890625, 54.7529296875, 56.716796875, 58.6806640625, 60.64453125, 62.6083984375, 64.572265625, 66.5361328125, 68.5]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 539.0, 477.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.96717834472656, -116.40142059326172, -101.83566284179688, -87.26991271972656, -72.70415496826172, -58.138397216796875, -43.57264709472656, -29.00688934326172, -14.441131591796875, 0.12462425231933594, 14.690380096435547, 29.256134033203125, 43.82189178466797, 58.38764953613281, 72.95339965820312, 87.51915740966797, 102.08491516113281, 116.65067291259766, 131.2164306640625, 145.7821807861328, 160.34793090820312, 174.9136962890625, 189.4794464111328, 204.04519653320312, 218.6109619140625, 233.1767120361328, 247.7424774169922, 262.3082275390625, 276.8739929199219, 291.43975830078125, 306.0054931640625, 320.5712585449219, 335.13702392578125, 349.7027893066406, 364.2685241699219, 378.83428955078125, 393.4000549316406, 407.9658203125, 422.53155517578125, 437.0973205566406, 451.6630859375, 466.2288513183594, 480.7945861816406, 495.3603515625, 509.9261169433594, 524.4918823242188, 539.0576171875, 553.6233520507812, 568.1890869140625, 582.7548217773438, 597.3206176757812, 611.8863525390625, 626.4520874023438, 641.0178833007812, 655.5836181640625, 670.1493530273438, 684.7151489257812, 699.2808837890625, 713.8466796875, 728.4124145507812, 742.9781494140625, 757.5439453125, 772.1096801757812, 786.6754150390625, 801.2412109375]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 5.0, 7.0, 7.0, 4.0, 9.0, 13.0, 13.0, 14.0, 20.0, 21.0, 39.0, 25.0, 30.0, 35.0, 32.0, 46.0, 45.0, 54.0, 51.0, 31.0, 47.0, 55.0, 42.0, 52.0, 42.0, 43.0, 34.0, 29.0, 32.0, 20.0, 21.0, 15.0, 15.0, 6.0, 7.0, 5.0, 8.0, 10.0, 9.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-48.69575119018555, -47.21363830566406, -45.73152542114258, -44.249412536621094, -42.76729965209961, -41.285186767578125, -39.803077697753906, -38.320960998535156, -36.83885192871094, -35.35673904418945, -33.87462615966797, -32.392513275146484, -30.910400390625, -29.428287506103516, -27.946176528930664, -26.46406364440918, -24.981948852539062, -23.499835968017578, -22.017723083496094, -20.53561019897461, -19.053497314453125, -17.57138442993164, -16.08927345275879, -14.607160568237305, -13.12504768371582, -11.642934799194336, -10.160821914672852, -8.678709983825684, -7.196597099304199, -5.714484214782715, -4.232372283935547, -2.7502593994140625, -1.2681465148925781, 0.21396613121032715, 1.6960787773132324, 3.1781911849975586, 4.660304069519043, 6.142416954040527, 7.624528884887695, 9.10664176940918, 10.588754653930664, 12.070867538452148, 13.552980422973633, 15.0350923538208, 16.51720428466797, 17.999317169189453, 19.481430053710938, 20.963542938232422, 22.445655822753906, 23.92776870727539, 25.409881591796875, 26.89199447631836, 28.374107360839844, 29.856220245361328, 31.33833122253418, 32.82044219970703, 34.30255889892578, 35.784671783447266, 37.26678466796875, 38.748897552490234, 40.23101043701172, 41.7131233215332, 43.19523620605469, 44.677345275878906, 46.15945816040039]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 1.0, 3.0, 6.0, 5.0, 9.0, 5.0, 8.0, 14.0, 11.0, 18.0, 21.0, 19.0, 24.0, 37.0, 25.0, 32.0, 53.0, 50.0, 48.0, 53.0, 63.0, 63.0, 55.0, 49.0, 45.0, 34.0, 34.0, 50.0, 26.0, 32.0, 19.0, 17.0, 14.0, 11.0, 17.0, 9.0, 5.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.59765625, -4.468719482421875, -4.33978271484375, -4.210845947265625, -4.0819091796875, -3.952972412109375, -3.82403564453125, -3.695098876953125, -3.566162109375, -3.437225341796875, -3.30828857421875, -3.179351806640625, -3.0504150390625, -2.921478271484375, -2.79254150390625, -2.663604736328125, -2.53466796875, -2.405731201171875, -2.27679443359375, -2.147857666015625, -2.0189208984375, -1.889984130859375, -1.76104736328125, -1.632110595703125, -1.503173828125, -1.374237060546875, -1.24530029296875, -1.116363525390625, -0.9874267578125, -0.858489990234375, -0.72955322265625, -0.600616455078125, -0.4716796875, -0.342742919921875, -0.21380615234375, -0.084869384765625, 0.0440673828125, 0.173004150390625, 0.30194091796875, 0.430877685546875, 0.559814453125, 0.688751220703125, 0.81768798828125, 0.946624755859375, 1.0755615234375, 1.204498291015625, 1.33343505859375, 1.462371826171875, 1.59130859375, 1.720245361328125, 1.84918212890625, 1.978118896484375, 2.1070556640625, 2.235992431640625, 2.36492919921875, 2.493865966796875, 2.622802734375, 2.751739501953125, 2.88067626953125, 3.009613037109375, 3.1385498046875, 3.267486572265625, 3.39642333984375, 3.525360107421875, 3.654296875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 4.0, 5.0, 8.0, 8.0, 7.0, 15.0, 14.0, 18.0, 20.0, 26.0, 34.0, 54.0, 82.0, 114.0, 199.0, 377.0, 945.0, 2514.0, 7476.0, 26079.0, 200900.0, 3825511.0, 103737.0, 17968.0, 5043.0, 1739.0, 616.0, 281.0, 149.0, 77.0, 73.0, 36.0, 26.0, 26.0, 22.0, 19.0, 16.0, 9.0, 8.0, 10.0, 4.0, 3.0, 3.0, 6.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-29.46875, -28.658935546875, -27.84912109375, -27.039306640625, -26.2294921875, -25.419677734375, -24.60986328125, -23.800048828125, -22.990234375, -22.180419921875, -21.37060546875, -20.560791015625, -19.7509765625, -18.941162109375, -18.13134765625, -17.321533203125, -16.51171875, -15.701904296875, -14.89208984375, -14.082275390625, -13.2724609375, -12.462646484375, -11.65283203125, -10.843017578125, -10.033203125, -9.223388671875, -8.41357421875, -7.603759765625, -6.7939453125, -5.984130859375, -5.17431640625, -4.364501953125, -3.5546875, -2.744873046875, -1.93505859375, -1.125244140625, -0.3154296875, 0.494384765625, 1.30419921875, 2.114013671875, 2.923828125, 3.733642578125, 4.54345703125, 5.353271484375, 6.1630859375, 6.972900390625, 7.78271484375, 8.592529296875, 9.40234375, 10.212158203125, 11.02197265625, 11.831787109375, 12.6416015625, 13.451416015625, 14.26123046875, 15.071044921875, 15.880859375, 16.690673828125, 17.50048828125, 18.310302734375, 19.1201171875, 19.929931640625, 20.73974609375, 21.549560546875, 22.359375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 3.0, 3.0, 10.0, 9.0, 4.0, 5.0, 7.0, 7.0, 6.0, 10.0, 17.0, 28.0, 23.0, 36.0, 44.0, 69.0, 92.0, 138.0, 222.0, 394.0, 616.0, 734.0, 566.0, 326.0, 191.0, 125.0, 103.0, 70.0, 57.0, 34.0, 31.0, 21.0, 15.0, 21.0, 7.0, 7.0, 7.0, 5.0, 2.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.2421875, -9.867919921875, -9.49365234375, -9.119384765625, -8.7451171875, -8.370849609375, -7.99658203125, -7.622314453125, -7.248046875, -6.873779296875, -6.49951171875, -6.125244140625, -5.7509765625, -5.376708984375, -5.00244140625, -4.628173828125, -4.25390625, -3.879638671875, -3.50537109375, -3.131103515625, -2.7568359375, -2.382568359375, -2.00830078125, -1.634033203125, -1.259765625, -0.885498046875, -0.51123046875, -0.136962890625, 0.2373046875, 0.611572265625, 0.98583984375, 1.360107421875, 1.734375, 2.108642578125, 2.48291015625, 2.857177734375, 3.2314453125, 3.605712890625, 3.97998046875, 4.354248046875, 4.728515625, 5.102783203125, 5.47705078125, 5.851318359375, 6.2255859375, 6.599853515625, 6.97412109375, 7.348388671875, 7.72265625, 8.096923828125, 8.47119140625, 8.845458984375, 9.2197265625, 9.593994140625, 9.96826171875, 10.342529296875, 10.716796875, 11.091064453125, 11.46533203125, 11.839599609375, 12.2138671875, 12.588134765625, 12.96240234375, 13.336669921875, 13.7109375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 10.0, 11.0, 19.0, 28.0, 51.0, 98.0, 114.0, 203.0, 363.0, 619.0, 1092.0, 1837.0, 3491.0, 6557.0, 12726.0, 28120.0, 68520.0, 247204.0, 2781544.0, 839604.0, 120062.0, 43419.0, 18980.0, 9255.0, 4580.0, 2482.0, 1387.0, 761.0, 429.0, 264.0, 161.0, 100.0, 59.0, 39.0, 29.0, 19.0, 11.0, 15.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-20.84375, -20.2607421875, -19.677734375, -19.0947265625, -18.51171875, -17.9287109375, -17.345703125, -16.7626953125, -16.1796875, -15.5966796875, -15.013671875, -14.4306640625, -13.84765625, -13.2646484375, -12.681640625, -12.0986328125, -11.515625, -10.9326171875, -10.349609375, -9.7666015625, -9.18359375, -8.6005859375, -8.017578125, -7.4345703125, -6.8515625, -6.2685546875, -5.685546875, -5.1025390625, -4.51953125, -3.9365234375, -3.353515625, -2.7705078125, -2.1875, -1.6044921875, -1.021484375, -0.4384765625, 0.14453125, 0.7275390625, 1.310546875, 1.8935546875, 2.4765625, 3.0595703125, 3.642578125, 4.2255859375, 4.80859375, 5.3916015625, 5.974609375, 6.5576171875, 7.140625, 7.7236328125, 8.306640625, 8.8896484375, 9.47265625, 10.0556640625, 10.638671875, 11.2216796875, 11.8046875, 12.3876953125, 12.970703125, 13.5537109375, 14.13671875, 14.7197265625, 15.302734375, 15.8857421875, 16.46875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 6.0, 14.0, 18.0, 41.0, 66.0, 125.0, 194.0, 217.0, 129.0, 89.0, 40.0, 32.0, 14.0, 10.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.10537338256836, -45.595149993896484, -43.084922790527344, -40.57469940185547, -38.064476013183594, -35.55425262451172, -33.044029235839844, -30.533802032470703, -28.023578643798828, -25.513355255126953, -23.003129959106445, -20.492904663085938, -17.982681274414062, -15.472456932067871, -12.96223258972168, -10.452007293701172, -7.941783905029297, -5.4315595626831055, -2.921335220336914, -0.41111087799072266, 2.0991134643554688, 4.60933780670166, 7.119562149047852, 9.62978744506836, 12.140010833740234, 14.650235176086426, 17.160459518432617, 19.670684814453125, 22.180908203125, 24.691131591796875, 27.201356887817383, 29.71158218383789, 32.2218017578125, 34.732025146484375, 37.24224853515625, 39.75247573852539, 42.262699127197266, 44.77292251586914, 47.28314971923828, 49.793373107910156, 52.30359649658203, 54.813819885253906, 57.32404327392578, 59.83427047729492, 62.3444938659668, 64.85472106933594, 67.36494445800781, 69.87516784667969, 72.38539123535156, 74.89561462402344, 77.40583801269531, 79.91606140136719, 82.42628479003906, 84.93651580810547, 87.44673919677734, 89.95696258544922, 92.4671859741211, 94.97740936279297, 97.48763275146484, 99.99785614013672, 102.50808715820312, 105.018310546875, 107.52853393554688, 110.03875732421875, 112.54898071289062]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 1.0, 0.0, 3.0, 6.0, 17.0, 15.0, 9.0, 14.0, 20.0, 20.0, 22.0, 20.0, 28.0, 41.0, 31.0, 46.0, 41.0, 51.0, 40.0, 35.0, 43.0, 44.0, 51.0, 40.0, 44.0, 40.0, 28.0, 33.0, 40.0, 34.0, 18.0, 22.0, 13.0, 18.0, 9.0, 11.0, 10.0, 12.0, 8.0, 10.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-41.330196380615234, -40.10775375366211, -38.885311126708984, -37.662872314453125, -36.4404296875, -35.217987060546875, -33.99554443359375, -32.773101806640625, -31.550662994384766, -30.32822036743164, -29.10577964782715, -27.883337020874023, -26.66089630126953, -25.438453674316406, -24.21601104736328, -22.99357032775879, -21.771127700805664, -20.54868507385254, -19.326244354248047, -18.103801727294922, -16.88136100769043, -15.658918380737305, -14.436476707458496, -13.214035034179688, -11.991593360900879, -10.76915168762207, -9.546710014343262, -8.324268341064453, -7.101826190948486, -5.879384517669678, -4.656942367553711, -3.4345006942749023, -2.2120590209960938, -0.9896172285079956, 0.23282456398010254, 1.4552664756774902, 2.677708148956299, 3.9001498222351074, 5.122591972351074, 6.345033645629883, 7.567475318908691, 8.7899169921875, 10.012358665466309, 11.234800338745117, 12.457242965698242, 13.679683685302734, 14.90212631225586, 16.124568939208984, 17.347009658813477, 18.5694522857666, 19.791893005371094, 21.01433563232422, 22.23677635192871, 23.459218978881836, 24.681659698486328, 25.904102325439453, 27.126544952392578, 28.348987579345703, 29.571428298950195, 30.79387092590332, 32.01631164550781, 33.23875427246094, 34.46119689941406, 35.68363952636719, 36.90607833862305]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 6.0, 4.0, 4.0, 3.0, 8.0, 7.0, 10.0, 12.0, 5.0, 12.0, 13.0, 25.0, 25.0, 22.0, 36.0, 24.0, 36.0, 39.0, 51.0, 52.0, 54.0, 55.0, 60.0, 49.0, 51.0, 41.0, 48.0, 25.0, 29.0, 37.0, 32.0, 18.0, 19.0, 24.0, 16.0, 8.0, 6.0, 10.0, 7.0, 3.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.3828125, -4.256591796875, -4.13037109375, -4.004150390625, -3.8779296875, -3.751708984375, -3.62548828125, -3.499267578125, -3.373046875, -3.246826171875, -3.12060546875, -2.994384765625, -2.8681640625, -2.741943359375, -2.61572265625, -2.489501953125, -2.36328125, -2.237060546875, -2.11083984375, -1.984619140625, -1.8583984375, -1.732177734375, -1.60595703125, -1.479736328125, -1.353515625, -1.227294921875, -1.10107421875, -0.974853515625, -0.8486328125, -0.722412109375, -0.59619140625, -0.469970703125, -0.34375, -0.217529296875, -0.09130859375, 0.034912109375, 0.1611328125, 0.287353515625, 0.41357421875, 0.539794921875, 0.666015625, 0.792236328125, 0.91845703125, 1.044677734375, 1.1708984375, 1.297119140625, 1.42333984375, 1.549560546875, 1.67578125, 1.802001953125, 1.92822265625, 2.054443359375, 2.1806640625, 2.306884765625, 2.43310546875, 2.559326171875, 2.685546875, 2.811767578125, 2.93798828125, 3.064208984375, 3.1904296875, 3.316650390625, 3.44287109375, 3.569091796875, 3.6953125]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 4.0, 7.0, 9.0, 19.0, 28.0, 34.0, 55.0, 74.0, 142.0, 213.0, 350.0, 507.0, 849.0, 1396.0, 2232.0, 3630.0, 6306.0, 11016.0, 20172.0, 38288.0, 78422.0, 186648.0, 365671.0, 175243.0, 74694.0, 36938.0, 19336.0, 10781.0, 5998.0, 3625.0, 2222.0, 1319.0, 874.0, 486.0, 356.0, 212.0, 138.0, 90.0, 52.0, 42.0, 30.0, 15.0, 14.0, 8.0, 10.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1624755859375, -0.156768798828125, -0.15106201171875, -0.145355224609375, -0.1396484375, -0.133941650390625, -0.12823486328125, -0.122528076171875, -0.1168212890625, -0.111114501953125, -0.10540771484375, -0.099700927734375, -0.093994140625, -0.088287353515625, -0.08258056640625, -0.076873779296875, -0.0711669921875, -0.065460205078125, -0.05975341796875, -0.054046630859375, -0.04833984375, -0.042633056640625, -0.03692626953125, -0.031219482421875, -0.0255126953125, -0.019805908203125, -0.01409912109375, -0.008392333984375, -0.002685546875, 0.003021240234375, 0.00872802734375, 0.014434814453125, 0.0201416015625, 0.025848388671875, 0.03155517578125, 0.037261962890625, 0.04296875, 0.048675537109375, 0.05438232421875, 0.060089111328125, 0.0657958984375, 0.071502685546875, 0.07720947265625, 0.082916259765625, 0.088623046875, 0.094329833984375, 0.10003662109375, 0.105743408203125, 0.1114501953125, 0.117156982421875, 0.12286376953125, 0.128570556640625, 0.13427734375, 0.139984130859375, 0.14569091796875, 0.151397705078125, 0.1571044921875, 0.162811279296875, 0.16851806640625, 0.174224853515625, 0.179931640625, 0.185638427734375, 0.19134521484375, 0.197052001953125, 0.2027587890625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 9.0, 7.0, 10.0, 7.0, 9.0, 9.0, 11.0, 14.0, 12.0, 16.0, 16.0, 20.0, 25.0, 23.0, 21.0, 37.0, 29.0, 37.0, 42.0, 36.0, 44.0, 38.0, 1068.0, 45.0, 32.0, 37.0, 37.0, 36.0, 27.0, 32.0, 33.0, 31.0, 24.0, 25.0, 20.0, 22.0, 19.0, 13.0, 10.0, 5.0, 8.0, 8.0, 6.0, 4.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.453125, -2.379608154296875, -2.30609130859375, -2.232574462890625, -2.1590576171875, -2.085540771484375, -2.01202392578125, -1.938507080078125, -1.864990234375, -1.791473388671875, -1.71795654296875, -1.644439697265625, -1.5709228515625, -1.497406005859375, -1.42388916015625, -1.350372314453125, -1.27685546875, -1.203338623046875, -1.12982177734375, -1.056304931640625, -0.9827880859375, -0.909271240234375, -0.83575439453125, -0.762237548828125, -0.688720703125, -0.615203857421875, -0.54168701171875, -0.468170166015625, -0.3946533203125, -0.321136474609375, -0.24761962890625, -0.174102783203125, -0.1005859375, -0.027069091796875, 0.04644775390625, 0.119964599609375, 0.1934814453125, 0.266998291015625, 0.34051513671875, 0.414031982421875, 0.487548828125, 0.561065673828125, 0.63458251953125, 0.708099365234375, 0.7816162109375, 0.855133056640625, 0.92864990234375, 1.002166748046875, 1.07568359375, 1.149200439453125, 1.22271728515625, 1.296234130859375, 1.3697509765625, 1.443267822265625, 1.51678466796875, 1.590301513671875, 1.663818359375, 1.737335205078125, 1.81085205078125, 1.884368896484375, 1.9578857421875, 2.031402587890625, 2.10491943359375, 2.178436279296875, 2.251953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 5.0, 10.0, 10.0, 12.0, 25.0, 28.0, 48.0, 84.0, 134.0, 180.0, 238.0, 345.0, 437.0, 696.0, 913.0, 1352.0, 1932.0, 2729.0, 4008.0, 5728.0, 8496.0, 12834.0, 19305.0, 29671.0, 46513.0, 74744.0, 122451.0, 1254527.0, 194284.0, 115861.0, 70317.0, 43686.0, 28407.0, 18543.0, 12137.0, 8203.0, 5563.0, 3742.0, 2735.0, 1803.0, 1316.0, 938.0, 641.0, 478.0, 317.0, 222.0, 146.0, 113.0, 84.0, 53.0, 29.0, 22.0, 19.0, 13.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.10076904296875, -0.09761428833007812, -0.09445953369140625, -0.09130477905273438, -0.0881500244140625, -0.08499526977539062, -0.08184051513671875, -0.07868576049804688, -0.075531005859375, -0.07237625122070312, -0.06922149658203125, -0.06606674194335938, -0.0629119873046875, -0.059757232666015625, -0.05660247802734375, -0.053447723388671875, -0.05029296875, -0.047138214111328125, -0.04398345947265625, -0.040828704833984375, -0.0376739501953125, -0.034519195556640625, -0.03136444091796875, -0.028209686279296875, -0.025054931640625, -0.021900177001953125, -0.01874542236328125, -0.015590667724609375, -0.0124359130859375, -0.009281158447265625, -0.00612640380859375, -0.002971649169921875, 0.00018310546875, 0.003337860107421875, 0.00649261474609375, 0.009647369384765625, 0.0128021240234375, 0.015956878662109375, 0.01911163330078125, 0.022266387939453125, 0.025421142578125, 0.028575897216796875, 0.03173065185546875, 0.034885406494140625, 0.0380401611328125, 0.041194915771484375, 0.04434967041015625, 0.047504425048828125, 0.0506591796875, 0.053813934326171875, 0.05696868896484375, 0.060123443603515625, 0.0632781982421875, 0.06643295288085938, 0.06958770751953125, 0.07274246215820312, 0.075897216796875, 0.07905197143554688, 0.08220672607421875, 0.08536148071289062, 0.0885162353515625, 0.09167098999023438, 0.09482574462890625, 0.09798049926757812, 0.10113525390625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 9.0, 20.0, 12.0, 27.0, 30.0, 37.0, 55.0, 57.0, 69.0, 90.0, 91.0, 101.0, 91.0, 79.0, 48.0, 38.0, 31.0, 17.0, 18.0, 11.0, 16.0, 10.0, 6.0, 11.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011271238327026367, -0.00010924879461526871, -0.00010578520596027374, -0.00010232161730527878, -9.885802865028381e-05, -9.539443999528885e-05, -9.193085134029388e-05, -8.846726268529892e-05, -8.500367403030396e-05, -8.154008537530899e-05, -7.807649672031403e-05, -7.461290806531906e-05, -7.11493194103241e-05, -6.768573075532913e-05, -6.422214210033417e-05, -6.07585534453392e-05, -5.729496479034424e-05, -5.3831376135349274e-05, -5.036778748035431e-05, -4.6904198825359344e-05, -4.344061017036438e-05, -3.9977021515369415e-05, -3.651343286037445e-05, -3.3049844205379486e-05, -2.958625555038452e-05, -2.6122666895389557e-05, -2.2659078240394592e-05, -1.9195489585399628e-05, -1.5731900930404663e-05, -1.2268312275409698e-05, -8.804723620414734e-06, -5.341134965419769e-06, -1.8775463104248047e-06, 1.58604234457016e-06, 5.0496309995651245e-06, 8.513219654560089e-06, 1.1976808309555054e-05, 1.544039696455002e-05, 1.8903985619544983e-05, 2.2367574274539948e-05, 2.5831162929534912e-05, 2.9294751584529877e-05, 3.275834023952484e-05, 3.6221928894519806e-05, 3.968551754951477e-05, 4.3149106204509735e-05, 4.66126948595047e-05, 5.0076283514499664e-05, 5.353987216949463e-05, 5.7003460824489594e-05, 6.046704947948456e-05, 6.393063813447952e-05, 6.739422678947449e-05, 7.085781544446945e-05, 7.432140409946442e-05, 7.778499275445938e-05, 8.124858140945435e-05, 8.471217006444931e-05, 8.817575871944427e-05, 9.163934737443924e-05, 9.51029360294342e-05, 9.856652468442917e-05, 0.00010203011333942413, 0.0001054937019944191, 0.00010895729064941406]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 10.0, 5.0, 13.0, 10.0, 16.0, 24.0, 27.0, 30.0, 40.0, 58.0, 92.0, 124.0, 207.0, 456.0, 1816.0, 15602.0, 949518.0, 75321.0, 3650.0, 733.0, 257.0, 149.0, 110.0, 70.0, 44.0, 49.0, 29.0, 24.0, 13.0, 13.0, 11.0, 6.0, 7.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0015802383422851562, -0.0015303939580917358, -0.0014805495738983154, -0.001430705189704895, -0.0013808608055114746, -0.0013310164213180542, -0.0012811720371246338, -0.0012313276529312134, -0.001181483268737793, -0.0011316388845443726, -0.0010817945003509521, -0.0010319501161575317, -0.0009821057319641113, -0.0009322613477706909, -0.0008824169635772705, -0.0008325725793838501, -0.0007827281951904297, -0.0007328838109970093, -0.0006830394268035889, -0.0006331950426101685, -0.000583350658416748, -0.0005335062742233276, -0.0004836618900299072, -0.0004338175058364868, -0.0003839731216430664, -0.000334128737449646, -0.0002842843532562256, -0.00023443996906280518, -0.00018459558486938477, -0.00013475120067596436, -8.490681648254395e-05, -3.5062432289123535e-05, 1.4781951904296875e-05, 6.462633609771729e-05, 0.0001144707202911377, 0.0001643151044845581, 0.00021415948867797852, 0.0002640038728713989, 0.00031384825706481934, 0.00036369264125823975, 0.00041353702545166016, 0.00046338140964508057, 0.000513225793838501, 0.0005630701780319214, 0.0006129145622253418, 0.0006627589464187622, 0.0007126033306121826, 0.000762447714805603, 0.0008122920989990234, 0.0008621364831924438, 0.0009119808673858643, 0.0009618252515792847, 0.001011669635772705, 0.0010615140199661255, 0.001111358404159546, 0.0011612027883529663, 0.0012110471725463867, 0.0012608915567398071, 0.0013107359409332275, 0.001360580325126648, 0.0014104247093200684, 0.0014602690935134888, 0.0015101134777069092, 0.0015599578619003296, 0.00160980224609375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 24.0, 47.0, 221.0, 456.0, 199.0, 52.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002675997093319893, -0.00025982767692767084, -0.00025205567362718284, -0.0002442836412228644, -0.0002365116379223764, -0.00022873962006997317, -0.00022096760221756995, -0.0002131955698132515, -0.0002054235665127635, -0.00019765154866036028, -0.00018987953080795705, -0.00018210751295555383, -0.0001743354951031506, -0.00016656347725074738, -0.00015879145939834416, -0.0001510194269940257, -0.00014324740914162248, -0.00013547539128921926, -0.00012770337343681604, -0.00011993135558441281, -0.00011215933773200959, -0.00010438731987960637, -9.661529475124553e-05, -8.88432768988423e-05, -8.107125904643908e-05, -7.329924119403586e-05, -6.552722334163263e-05, -5.7755201851250604e-05, -4.998318399884738e-05, -4.221116614644416e-05, -3.4439144656062126e-05, -2.6667126803658903e-05, -1.8895123503170907e-05, -1.1123104741272982e-05, -3.351085979375057e-06, 4.42093369201757e-06, 1.2192951544420794e-05, 1.9964969396824017e-05, 2.7736990887206048e-05, 3.550900873960927e-05, 4.3281026592012495e-05, 5.105304444441572e-05, 5.882506229681894e-05, 6.659708742517978e-05, 7.4369105277583e-05, 8.214112312998623e-05, 8.991314098238945e-05, 9.768515883479267e-05, 0.0001054571766871959, 0.00011322919453959912, 0.00012100121239200234, 0.00012877323024440557, 0.0001365452480968088, 0.00014431726594921201, 0.00015208928380161524, 0.0001598613162059337, 0.00016763331950642169, 0.0001754053373588249, 0.00018317735521122813, 0.00019094937306363136, 0.00019872139091603458, 0.0002064934087684378, 0.00021426542662084103, 0.00022203745902515948, 0.0002298094768775627]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 9.0, 4.0, 11.0, 11.0, 12.0, 12.0, 13.0, 16.0, 15.0, 21.0, 23.0, 23.0, 30.0, 29.0, 32.0, 35.0, 33.0, 36.0, 48.0, 23.0, 47.0, 39.0, 38.0, 30.0, 32.0, 46.0, 38.0, 41.0, 37.0, 30.0, 30.0, 15.0, 25.0, 12.0, 25.0, 8.0, 16.0, 13.0, 5.0, 6.0, 7.0, 7.0, 6.0, 8.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.100799560546875e-05, -3.972742706537247e-05, -3.8446858525276184e-05, -3.71662899851799e-05, -3.588572144508362e-05, -3.4605152904987335e-05, -3.332458436489105e-05, -3.204401582479477e-05, -3.0763447284698486e-05, -2.9482878744602203e-05, -2.820231020450592e-05, -2.6921741664409637e-05, -2.5641173124313354e-05, -2.436060458421707e-05, -2.308003604412079e-05, -2.1799467504024506e-05, -2.0518898963928223e-05, -1.923833042383194e-05, -1.7957761883735657e-05, -1.6677193343639374e-05, -1.539662480354309e-05, -1.4116056263446808e-05, -1.2835487723350525e-05, -1.1554919183254242e-05, -1.0274350643157959e-05, -8.993782103061676e-06, -7.713213562965393e-06, -6.43264502286911e-06, -5.152076482772827e-06, -3.871507942676544e-06, -2.5909394025802612e-06, -1.3103708624839783e-06, -2.9802322387695312e-08, 1.2507662177085876e-06, 2.5313347578048706e-06, 3.8119032979011536e-06, 5.0924718379974365e-06, 6.3730403780937195e-06, 7.653608918190002e-06, 8.934177458286285e-06, 1.0214745998382568e-05, 1.1495314538478851e-05, 1.2775883078575134e-05, 1.4056451618671417e-05, 1.53370201587677e-05, 1.6617588698863983e-05, 1.7898157238960266e-05, 1.917872577905655e-05, 2.0459294319152832e-05, 2.1739862859249115e-05, 2.3020431399345398e-05, 2.430099993944168e-05, 2.5581568479537964e-05, 2.6862137019634247e-05, 2.814270555973053e-05, 2.9423274099826813e-05, 3.0703842639923096e-05, 3.198441118001938e-05, 3.326497972011566e-05, 3.4545548260211945e-05, 3.582611680030823e-05, 3.710668534040451e-05, 3.8387253880500793e-05, 3.9667822420597076e-05, 4.094839096069336e-05]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 6.0, 4.0, 4.0, 3.0, 8.0, 7.0, 10.0, 12.0, 5.0, 12.0, 13.0, 25.0, 25.0, 22.0, 36.0, 24.0, 36.0, 39.0, 51.0, 52.0, 54.0, 55.0, 60.0, 49.0, 51.0, 41.0, 48.0, 25.0, 29.0, 37.0, 32.0, 18.0, 19.0, 24.0, 16.0, 8.0, 6.0, 10.0, 7.0, 3.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.3828125, -4.256591796875, -4.13037109375, -4.004150390625, -3.8779296875, -3.751708984375, -3.62548828125, -3.499267578125, -3.373046875, -3.246826171875, -3.12060546875, -2.994384765625, -2.8681640625, -2.741943359375, -2.61572265625, -2.489501953125, -2.36328125, -2.237060546875, -2.11083984375, -1.984619140625, -1.8583984375, -1.732177734375, -1.60595703125, -1.479736328125, -1.353515625, -1.227294921875, -1.10107421875, -0.974853515625, -0.8486328125, -0.722412109375, -0.59619140625, -0.469970703125, -0.34375, -0.217529296875, -0.09130859375, 0.034912109375, 0.1611328125, 0.287353515625, 0.41357421875, 0.539794921875, 0.666015625, 0.792236328125, 0.91845703125, 1.044677734375, 1.1708984375, 1.297119140625, 1.42333984375, 1.549560546875, 1.67578125, 1.802001953125, 1.92822265625, 2.054443359375, 2.1806640625, 2.306884765625, 2.43310546875, 2.559326171875, 2.685546875, 2.811767578125, 2.93798828125, 3.064208984375, 3.1904296875, 3.316650390625, 3.44287109375, 3.569091796875, 3.6953125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 4.0, 5.0, 4.0, 12.0, 13.0, 12.0, 28.0, 20.0, 34.0, 42.0, 61.0, 100.0, 115.0, 164.0, 268.0, 332.0, 534.0, 762.0, 1148.0, 1829.0, 3289.0, 7155.0, 31120.0, 458420.0, 493645.0, 33083.0, 7391.0, 3415.0, 1945.0, 1131.0, 783.0, 495.0, 348.0, 237.0, 185.0, 104.0, 79.0, 56.0, 46.0, 26.0, 27.0, 16.0, 22.0, 16.0, 9.0, 12.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-7.93359375, -7.67779541015625, -7.4219970703125, -7.16619873046875, -6.910400390625, -6.65460205078125, -6.3988037109375, -6.14300537109375, -5.88720703125, -5.63140869140625, -5.3756103515625, -5.11981201171875, -4.864013671875, -4.60821533203125, -4.3524169921875, -4.09661865234375, -3.8408203125, -3.58502197265625, -3.3292236328125, -3.07342529296875, -2.817626953125, -2.56182861328125, -2.3060302734375, -2.05023193359375, -1.79443359375, -1.53863525390625, -1.2828369140625, -1.02703857421875, -0.771240234375, -0.51544189453125, -0.2596435546875, -0.00384521484375, 0.251953125, 0.50775146484375, 0.7635498046875, 1.01934814453125, 1.275146484375, 1.53094482421875, 1.7867431640625, 2.04254150390625, 2.29833984375, 2.55413818359375, 2.8099365234375, 3.06573486328125, 3.321533203125, 3.57733154296875, 3.8331298828125, 4.08892822265625, 4.3447265625, 4.60052490234375, 4.8563232421875, 5.11212158203125, 5.367919921875, 5.62371826171875, 5.8795166015625, 6.13531494140625, 6.39111328125, 6.64691162109375, 6.9027099609375, 7.15850830078125, 7.414306640625, 7.67010498046875, 7.9259033203125, 8.18170166015625, 8.4375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 7.0, 5.0, 4.0, 9.0, 8.0, 10.0, 7.0, 18.0, 16.0, 15.0, 24.0, 26.0, 28.0, 26.0, 41.0, 39.0, 48.0, 43.0, 66.0, 94.0, 1776.0, 286.0, 61.0, 47.0, 51.0, 37.0, 24.0, 30.0, 30.0, 26.0, 22.0, 23.0, 23.0, 19.0, 16.0, 13.0, 7.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.078125, -15.58740234375, -15.0966796875, -14.60595703125, -14.115234375, -13.62451171875, -13.1337890625, -12.64306640625, -12.15234375, -11.66162109375, -11.1708984375, -10.68017578125, -10.189453125, -9.69873046875, -9.2080078125, -8.71728515625, -8.2265625, -7.73583984375, -7.2451171875, -6.75439453125, -6.263671875, -5.77294921875, -5.2822265625, -4.79150390625, -4.30078125, -3.81005859375, -3.3193359375, -2.82861328125, -2.337890625, -1.84716796875, -1.3564453125, -0.86572265625, -0.375, 0.11572265625, 0.6064453125, 1.09716796875, 1.587890625, 2.07861328125, 2.5693359375, 3.06005859375, 3.55078125, 4.04150390625, 4.5322265625, 5.02294921875, 5.513671875, 6.00439453125, 6.4951171875, 6.98583984375, 7.4765625, 7.96728515625, 8.4580078125, 8.94873046875, 9.439453125, 9.93017578125, 10.4208984375, 10.91162109375, 11.40234375, 11.89306640625, 12.3837890625, 12.87451171875, 13.365234375, 13.85595703125, 14.3466796875, 14.83740234375, 15.328125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 0.0, 2.0, 3.0, 5.0, 6.0, 5.0, 13.0, 6.0, 13.0, 23.0, 18.0, 24.0, 35.0, 37.0, 44.0, 59.0, 67.0, 132.0, 302.0, 1085.0, 4328.0, 56271.0, 3070332.0, 9604.0, 2109.0, 577.0, 181.0, 95.0, 72.0, 48.0, 46.0, 28.0, 27.0, 24.0, 17.0, 17.0, 5.0, 10.0, 6.0, 9.0, 5.0, 6.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.34375, -32.27685546875, -31.2099609375, -30.14306640625, -29.076171875, -28.00927734375, -26.9423828125, -25.87548828125, -24.80859375, -23.74169921875, -22.6748046875, -21.60791015625, -20.541015625, -19.47412109375, -18.4072265625, -17.34033203125, -16.2734375, -15.20654296875, -14.1396484375, -13.07275390625, -12.005859375, -10.93896484375, -9.8720703125, -8.80517578125, -7.73828125, -6.67138671875, -5.6044921875, -4.53759765625, -3.470703125, -2.40380859375, -1.3369140625, -0.27001953125, 0.796875, 1.86376953125, 2.9306640625, 3.99755859375, 5.064453125, 6.13134765625, 7.1982421875, 8.26513671875, 9.33203125, 10.39892578125, 11.4658203125, 12.53271484375, 13.599609375, 14.66650390625, 15.7333984375, 16.80029296875, 17.8671875, 18.93408203125, 20.0009765625, 21.06787109375, 22.134765625, 23.20166015625, 24.2685546875, 25.33544921875, 26.40234375, 27.46923828125, 28.5361328125, 29.60302734375, 30.669921875, 31.73681640625, 32.8037109375, 33.87060546875, 34.9375]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 6.0, 489.0, 519.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.175048828125, -10.110292434692383, -5.045536041259766, 0.019220352172851562, 5.083976745605469, 10.148733139038086, 15.213489532470703, 20.278244018554688, 25.343002319335938, 30.407758712768555, 35.47251510620117, 40.537269592285156, 45.602027893066406, 50.666786193847656, 55.73154067993164, 60.796295166015625, 65.86105346679688, 70.92581176757812, 75.99057006835938, 81.0553207397461, 86.12007904052734, 91.1848373413086, 96.24958801269531, 101.31434631347656, 106.37910461425781, 111.44386291503906, 116.50862121582031, 121.57337188720703, 126.63813018798828, 131.702880859375, 136.76763916015625, 141.8323974609375, 146.89715576171875, 151.9619140625, 157.02667236328125, 162.0914306640625, 167.15618896484375, 172.22093200683594, 177.2856903076172, 182.35044860839844, 187.4152069091797, 192.47996520996094, 197.5447235107422, 202.60948181152344, 207.67422485351562, 212.73898315429688, 217.80374145507812, 222.86849975585938, 227.93325805664062, 232.99801635742188, 238.06277465820312, 243.12753295898438, 248.19229125976562, 253.2570343017578, 258.3218078613281, 263.38653564453125, 268.4512939453125, 273.51605224609375, 278.580810546875, 283.64556884765625, 288.7103271484375, 293.77508544921875, 298.83984375, 303.90460205078125, 308.9693603515625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 10.0, 8.0, 8.0, 7.0, 15.0, 13.0, 15.0, 13.0, 17.0, 21.0, 18.0, 21.0, 24.0, 17.0, 27.0, 27.0, 37.0, 33.0, 33.0, 34.0, 37.0, 37.0, 39.0, 47.0, 38.0, 49.0, 36.0, 43.0, 39.0, 29.0, 27.0, 29.0, 17.0, 19.0, 14.0, 19.0, 20.0, 16.0, 6.0, 11.0, 9.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-47.5921516418457, -46.260528564453125, -44.92890167236328, -43.59727478027344, -42.26565170288086, -40.93402862548828, -39.60240173339844, -38.270774841308594, -36.939151763916016, -35.60752868652344, -34.275901794433594, -32.94427490234375, -31.612651824951172, -30.28102684020996, -28.94940185546875, -27.61777687072754, -26.286151885986328, -24.954526901245117, -23.622901916503906, -22.291276931762695, -20.959651947021484, -19.628026962280273, -18.296401977539062, -16.96477699279785, -15.63315200805664, -14.30152702331543, -12.969902038574219, -11.638277053833008, -10.306652069091797, -8.975027084350586, -7.643402099609375, -6.311777114868164, -4.980155944824219, -3.648530960083008, -2.316905975341797, -0.9852809906005859, 0.346343994140625, 1.677968978881836, 3.009593963623047, 4.341218948364258, 5.672843933105469, 7.00446891784668, 8.33609390258789, 9.667718887329102, 10.999343872070312, 12.330968856811523, 13.662593841552734, 14.994218826293945, 16.325843811035156, 17.657468795776367, 18.989093780517578, 20.32071876525879, 21.65234375, 22.98396873474121, 24.315593719482422, 25.647218704223633, 26.978843688964844, 28.310468673706055, 29.642093658447266, 30.973718643188477, 32.30534362792969, 33.63697052001953, 34.96859359741211, 36.30021667480469, 37.63184356689453]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 7.0, 3.0, 8.0, 14.0, 8.0, 7.0, 10.0, 16.0, 23.0, 25.0, 20.0, 36.0, 28.0, 28.0, 48.0, 45.0, 59.0, 48.0, 53.0, 60.0, 54.0, 46.0, 43.0, 35.0, 37.0, 32.0, 28.0, 36.0, 27.0, 19.0, 22.0, 18.0, 6.0, 9.0, 9.0, 6.0, 6.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.56640625, -4.435455322265625, -4.30450439453125, -4.173553466796875, -4.0426025390625, -3.911651611328125, -3.78070068359375, -3.649749755859375, -3.518798828125, -3.387847900390625, -3.25689697265625, -3.125946044921875, -2.9949951171875, -2.864044189453125, -2.73309326171875, -2.602142333984375, -2.47119140625, -2.340240478515625, -2.20928955078125, -2.078338623046875, -1.9473876953125, -1.816436767578125, -1.68548583984375, -1.554534912109375, -1.423583984375, -1.292633056640625, -1.16168212890625, -1.030731201171875, -0.8997802734375, -0.768829345703125, -0.63787841796875, -0.506927490234375, -0.3759765625, -0.245025634765625, -0.11407470703125, 0.016876220703125, 0.1478271484375, 0.278778076171875, 0.40972900390625, 0.540679931640625, 0.671630859375, 0.802581787109375, 0.93353271484375, 1.064483642578125, 1.1954345703125, 1.326385498046875, 1.45733642578125, 1.588287353515625, 1.71923828125, 1.850189208984375, 1.98114013671875, 2.112091064453125, 2.2430419921875, 2.373992919921875, 2.50494384765625, 2.635894775390625, 2.766845703125, 2.897796630859375, 3.02874755859375, 3.159698486328125, 3.2906494140625, 3.421600341796875, 3.55255126953125, 3.683502197265625, 3.814453125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 3.0, 6.0, 10.0, 8.0, 16.0, 12.0, 22.0, 30.0, 56.0, 65.0, 86.0, 174.0, 273.0, 432.0, 810.0, 1479.0, 2947.0, 6022.0, 13750.0, 34379.0, 159989.0, 3333900.0, 553164.0, 52594.0, 18343.0, 7813.0, 3652.0, 1864.0, 990.0, 531.0, 320.0, 208.0, 124.0, 59.0, 46.0, 24.0, 21.0, 15.0, 12.0, 4.0, 4.0, 5.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.671875, -16.191162109375, -15.71044921875, -15.229736328125, -14.7490234375, -14.268310546875, -13.78759765625, -13.306884765625, -12.826171875, -12.345458984375, -11.86474609375, -11.384033203125, -10.9033203125, -10.422607421875, -9.94189453125, -9.461181640625, -8.98046875, -8.499755859375, -8.01904296875, -7.538330078125, -7.0576171875, -6.576904296875, -6.09619140625, -5.615478515625, -5.134765625, -4.654052734375, -4.17333984375, -3.692626953125, -3.2119140625, -2.731201171875, -2.25048828125, -1.769775390625, -1.2890625, -0.808349609375, -0.32763671875, 0.153076171875, 0.6337890625, 1.114501953125, 1.59521484375, 2.075927734375, 2.556640625, 3.037353515625, 3.51806640625, 3.998779296875, 4.4794921875, 4.960205078125, 5.44091796875, 5.921630859375, 6.40234375, 6.883056640625, 7.36376953125, 7.844482421875, 8.3251953125, 8.805908203125, 9.28662109375, 9.767333984375, 10.248046875, 10.728759765625, 11.20947265625, 11.690185546875, 12.1708984375, 12.651611328125, 13.13232421875, 13.613037109375, 14.09375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 5.0, 4.0, 7.0, 9.0, 11.0, 20.0, 13.0, 24.0, 44.0, 48.0, 79.0, 88.0, 130.0, 248.0, 514.0, 796.0, 840.0, 473.0, 224.0, 135.0, 99.0, 55.0, 49.0, 42.0, 34.0, 22.0, 14.0, 8.0, 8.0, 7.0, 6.0, 5.0, 8.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.7890625, -14.341552734375, -13.89404296875, -13.446533203125, -12.9990234375, -12.551513671875, -12.10400390625, -11.656494140625, -11.208984375, -10.761474609375, -10.31396484375, -9.866455078125, -9.4189453125, -8.971435546875, -8.52392578125, -8.076416015625, -7.62890625, -7.181396484375, -6.73388671875, -6.286376953125, -5.8388671875, -5.391357421875, -4.94384765625, -4.496337890625, -4.048828125, -3.601318359375, -3.15380859375, -2.706298828125, -2.2587890625, -1.811279296875, -1.36376953125, -0.916259765625, -0.46875, -0.021240234375, 0.42626953125, 0.873779296875, 1.3212890625, 1.768798828125, 2.21630859375, 2.663818359375, 3.111328125, 3.558837890625, 4.00634765625, 4.453857421875, 4.9013671875, 5.348876953125, 5.79638671875, 6.243896484375, 6.69140625, 7.138916015625, 7.58642578125, 8.033935546875, 8.4814453125, 8.928955078125, 9.37646484375, 9.823974609375, 10.271484375, 10.718994140625, 11.16650390625, 11.614013671875, 12.0615234375, 12.509033203125, 12.95654296875, 13.404052734375, 13.8515625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 8.0, 8.0, 12.0, 19.0, 31.0, 52.0, 50.0, 92.0, 137.0, 191.0, 308.0, 434.0, 729.0, 1146.0, 1982.0, 3480.0, 6084.0, 11376.0, 22030.0, 45536.0, 114848.0, 672895.0, 2826327.0, 327185.0, 83237.0, 36220.0, 17938.0, 9334.0, 5062.0, 2923.0, 1704.0, 1026.0, 643.0, 432.0, 262.0, 182.0, 111.0, 78.0, 50.0, 38.0, 23.0, 21.0, 12.0, 8.0, 11.0, 0.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.71875, -16.201904296875, -15.68505859375, -15.168212890625, -14.6513671875, -14.134521484375, -13.61767578125, -13.100830078125, -12.583984375, -12.067138671875, -11.55029296875, -11.033447265625, -10.5166015625, -9.999755859375, -9.48291015625, -8.966064453125, -8.44921875, -7.932373046875, -7.41552734375, -6.898681640625, -6.3818359375, -5.864990234375, -5.34814453125, -4.831298828125, -4.314453125, -3.797607421875, -3.28076171875, -2.763916015625, -2.2470703125, -1.730224609375, -1.21337890625, -0.696533203125, -0.1796875, 0.337158203125, 0.85400390625, 1.370849609375, 1.8876953125, 2.404541015625, 2.92138671875, 3.438232421875, 3.955078125, 4.471923828125, 4.98876953125, 5.505615234375, 6.0224609375, 6.539306640625, 7.05615234375, 7.572998046875, 8.08984375, 8.606689453125, 9.12353515625, 9.640380859375, 10.1572265625, 10.674072265625, 11.19091796875, 11.707763671875, 12.224609375, 12.741455078125, 13.25830078125, 13.775146484375, 14.2919921875, 14.808837890625, 15.32568359375, 15.842529296875, 16.359375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 10.0, 11.0, 29.0, 45.0, 89.0, 160.0, 206.0, 180.0, 118.0, 71.0, 33.0, 23.0, 11.0, 12.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.14019012451172, -92.25006866455078, -89.35995483398438, -86.46983337402344, -83.5797119140625, -80.6895980834961, -77.79947662353516, -74.90936279296875, -72.01924133300781, -69.12911987304688, -66.23900604248047, -63.34888458251953, -60.45876693725586, -57.56864929199219, -54.67852783203125, -51.78841018676758, -48.898292541503906, -46.008174896240234, -43.11805725097656, -40.227935791015625, -37.33781814575195, -34.44770050048828, -31.557580947875977, -28.667461395263672, -25.77734375, -22.887226104736328, -19.997106552124023, -17.10698699951172, -14.216869354248047, -11.326750755310059, -8.43663215637207, -5.546512603759766, -2.656402587890625, 0.23371601104736328, 3.1238346099853516, 6.01395320892334, 8.904071807861328, 11.794190406799316, 14.684309005737305, 17.57442855834961, 20.46454620361328, 23.354663848876953, 26.244783401489258, 29.134902954101562, 32.025020599365234, 34.915138244628906, 37.805259704589844, 40.695377349853516, 43.58549499511719, 46.47561264038086, 49.36573028564453, 52.25585174560547, 55.14596939086914, 58.03608703613281, 60.92620849609375, 63.81632614135742, 66.7064437866211, 69.59656524658203, 72.48667907714844, 75.37680053710938, 78.26692199707031, 81.15703582763672, 84.04715728759766, 86.93727111816406, 89.827392578125]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 8.0, 0.0, 7.0, 12.0, 7.0, 2.0, 14.0, 11.0, 16.0, 17.0, 29.0, 27.0, 30.0, 30.0, 38.0, 34.0, 38.0, 30.0, 38.0, 44.0, 37.0, 53.0, 47.0, 44.0, 39.0, 36.0, 45.0, 33.0, 36.0, 33.0, 18.0, 26.0, 16.0, 21.0, 22.0, 15.0, 12.0, 9.0, 8.0, 4.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0], "bins": [-41.89741134643555, -40.713348388671875, -39.5292854309082, -38.34522247314453, -37.161155700683594, -35.97709274291992, -34.79302978515625, -33.60896682739258, -32.424903869628906, -31.240840911865234, -30.056777954101562, -28.872713088989258, -27.688650131225586, -26.504587173461914, -25.32052230834961, -24.136459350585938, -22.952396392822266, -21.768333435058594, -20.584270477294922, -19.400205612182617, -18.216142654418945, -17.032079696655273, -15.848015785217285, -14.663951873779297, -13.479888916015625, -12.295825958251953, -11.111762046813965, -9.927698135375977, -8.743635177612305, -7.559571743011475, -6.3755083084106445, -5.191444396972656, -4.007377624511719, -2.8233141899108887, -1.6392507553100586, -0.4551873207092285, 0.7288761138916016, 1.9129395484924316, 3.0970029830932617, 4.28106689453125, 5.465129852294922, 6.649193286895752, 7.833256721496582, 9.01732063293457, 10.201383590698242, 11.385446548461914, 12.569510459899902, 13.75357437133789, 14.937637329101562, 16.121700286865234, 17.305763244628906, 18.48982810974121, 19.673891067504883, 20.857954025268555, 22.04201889038086, 23.22608184814453, 24.410144805908203, 25.594207763671875, 26.778270721435547, 27.96233558654785, 29.146398544311523, 30.330461502075195, 31.5145263671875, 32.69858932495117, 33.882652282714844]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 7.0, 6.0, 9.0, 10.0, 12.0, 12.0, 17.0, 19.0, 23.0, 33.0, 20.0, 33.0, 29.0, 44.0, 45.0, 42.0, 52.0, 58.0, 48.0, 46.0, 63.0, 47.0, 31.0, 43.0, 30.0, 30.0, 26.0, 23.0, 24.0, 21.0, 19.0, 13.0, 10.0, 10.0, 9.0, 3.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-4.74609375, -4.6146240234375, -4.483154296875, -4.3516845703125, -4.22021484375, -4.0887451171875, -3.957275390625, -3.8258056640625, -3.6943359375, -3.5628662109375, -3.431396484375, -3.2999267578125, -3.16845703125, -3.0369873046875, -2.905517578125, -2.7740478515625, -2.642578125, -2.5111083984375, -2.379638671875, -2.2481689453125, -2.11669921875, -1.9852294921875, -1.853759765625, -1.7222900390625, -1.5908203125, -1.4593505859375, -1.327880859375, -1.1964111328125, -1.06494140625, -0.9334716796875, -0.802001953125, -0.6705322265625, -0.5390625, -0.4075927734375, -0.276123046875, -0.1446533203125, -0.01318359375, 0.1182861328125, 0.249755859375, 0.3812255859375, 0.5126953125, 0.6441650390625, 0.775634765625, 0.9071044921875, 1.03857421875, 1.1700439453125, 1.301513671875, 1.4329833984375, 1.564453125, 1.6959228515625, 1.827392578125, 1.9588623046875, 2.09033203125, 2.2218017578125, 2.353271484375, 2.4847412109375, 2.6162109375, 2.7476806640625, 2.879150390625, 3.0106201171875, 3.14208984375, 3.2735595703125, 3.405029296875, 3.5364990234375, 3.66796875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 12.0, 6.0, 9.0, 19.0, 21.0, 36.0, 48.0, 88.0, 115.0, 181.0, 278.0, 426.0, 665.0, 1042.0, 1719.0, 2845.0, 4853.0, 8487.0, 14961.0, 28255.0, 56483.0, 122081.0, 284971.0, 280710.0, 120635.0, 55790.0, 28028.0, 15139.0, 8394.0, 4835.0, 2852.0, 1716.0, 1057.0, 640.0, 395.0, 260.0, 173.0, 120.0, 74.0, 47.0, 27.0, 26.0, 17.0, 9.0, 4.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2103271484375, -0.20413970947265625, -0.1979522705078125, -0.19176483154296875, -0.185577392578125, -0.17938995361328125, -0.1732025146484375, -0.16701507568359375, -0.16082763671875, -0.15464019775390625, -0.1484527587890625, -0.14226531982421875, -0.136077880859375, -0.12989044189453125, -0.1237030029296875, -0.11751556396484375, -0.111328125, -0.10514068603515625, -0.0989532470703125, -0.09276580810546875, -0.086578369140625, -0.08039093017578125, -0.0742034912109375, -0.06801605224609375, -0.06182861328125, -0.05564117431640625, -0.0494537353515625, -0.04326629638671875, -0.037078857421875, -0.03089141845703125, -0.0247039794921875, -0.01851654052734375, -0.0123291015625, -0.00614166259765625, 4.57763671875e-05, 0.00623321533203125, 0.012420654296875, 0.01860809326171875, 0.0247955322265625, 0.03098297119140625, 0.03717041015625, 0.04335784912109375, 0.0495452880859375, 0.05573272705078125, 0.061920166015625, 0.06810760498046875, 0.0742950439453125, 0.08048248291015625, 0.086669921875, 0.09285736083984375, 0.0990447998046875, 0.10523223876953125, 0.111419677734375, 0.11760711669921875, 0.1237945556640625, 0.12998199462890625, 0.13616943359375, 0.14235687255859375, 0.1485443115234375, 0.15473175048828125, 0.160919189453125, 0.16710662841796875, 0.1732940673828125, 0.17948150634765625, 0.1856689453125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 8.0, 17.0, 9.0, 11.0, 15.0, 11.0, 22.0, 27.0, 17.0, 26.0, 24.0, 24.0, 38.0, 30.0, 42.0, 49.0, 33.0, 35.0, 28.0, 1071.0, 30.0, 32.0, 31.0, 25.0, 33.0, 35.0, 29.0, 28.0, 29.0, 24.0, 19.0, 22.0, 22.0, 25.0, 18.0, 8.0, 20.0, 3.0, 9.0, 7.0, 5.0, 8.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.30859375, -2.230865478515625, -2.15313720703125, -2.075408935546875, -1.9976806640625, -1.919952392578125, -1.84222412109375, -1.764495849609375, -1.686767578125, -1.609039306640625, -1.53131103515625, -1.453582763671875, -1.3758544921875, -1.298126220703125, -1.22039794921875, -1.142669677734375, -1.06494140625, -0.987213134765625, -0.90948486328125, -0.831756591796875, -0.7540283203125, -0.676300048828125, -0.59857177734375, -0.520843505859375, -0.443115234375, -0.365386962890625, -0.28765869140625, -0.209930419921875, -0.1322021484375, -0.054473876953125, 0.02325439453125, 0.100982666015625, 0.1787109375, 0.256439208984375, 0.33416748046875, 0.411895751953125, 0.4896240234375, 0.567352294921875, 0.64508056640625, 0.722808837890625, 0.800537109375, 0.878265380859375, 0.95599365234375, 1.033721923828125, 1.1114501953125, 1.189178466796875, 1.26690673828125, 1.344635009765625, 1.42236328125, 1.500091552734375, 1.57781982421875, 1.655548095703125, 1.7332763671875, 1.811004638671875, 1.88873291015625, 1.966461181640625, 2.044189453125, 2.121917724609375, 2.19964599609375, 2.277374267578125, 2.3551025390625, 2.432830810546875, 2.51055908203125, 2.588287353515625, 2.666015625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 6.0, 6.0, 16.0, 19.0, 21.0, 27.0, 32.0, 54.0, 63.0, 78.0, 137.0, 191.0, 241.0, 377.0, 480.0, 692.0, 924.0, 1359.0, 2012.0, 2738.0, 3975.0, 5869.0, 8671.0, 12908.0, 19730.0, 30042.0, 46657.0, 72746.0, 115748.0, 193768.0, 1240412.0, 120654.0, 75301.0, 47728.0, 30886.0, 20275.0, 13407.0, 8949.0, 5957.0, 4244.0, 2898.0, 1949.0, 1368.0, 990.0, 734.0, 518.0, 347.0, 243.0, 200.0, 148.0, 106.0, 82.0, 50.0, 28.0, 29.0, 11.0, 16.0, 15.0, 5.0, 3.0, 2.0, 5.0], "bins": [-0.1065673828125, -0.103240966796875, -0.09991455078125, -0.096588134765625, -0.09326171875, -0.089935302734375, -0.08660888671875, -0.083282470703125, -0.0799560546875, -0.076629638671875, -0.07330322265625, -0.069976806640625, -0.066650390625, -0.063323974609375, -0.05999755859375, -0.056671142578125, -0.0533447265625, -0.050018310546875, -0.04669189453125, -0.043365478515625, -0.0400390625, -0.036712646484375, -0.03338623046875, -0.030059814453125, -0.0267333984375, -0.023406982421875, -0.02008056640625, -0.016754150390625, -0.013427734375, -0.010101318359375, -0.00677490234375, -0.003448486328125, -0.0001220703125, 0.003204345703125, 0.00653076171875, 0.009857177734375, 0.01318359375, 0.016510009765625, 0.01983642578125, 0.023162841796875, 0.0264892578125, 0.029815673828125, 0.03314208984375, 0.036468505859375, 0.039794921875, 0.043121337890625, 0.04644775390625, 0.049774169921875, 0.0531005859375, 0.056427001953125, 0.05975341796875, 0.063079833984375, 0.06640625, 0.069732666015625, 0.07305908203125, 0.076385498046875, 0.0797119140625, 0.083038330078125, 0.08636474609375, 0.089691162109375, 0.093017578125, 0.096343994140625, 0.09967041015625, 0.102996826171875, 0.1063232421875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 0.0, 6.0, 3.0, 10.0, 9.0, 9.0, 15.0, 12.0, 19.0, 31.0, 31.0, 48.0, 60.0, 67.0, 90.0, 106.0, 110.0, 74.0, 72.0, 59.0, 46.0, 37.0, 26.0, 18.0, 11.0, 8.0, 6.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011920928955078125, -0.00011474266648292542, -0.00011027604341506958, -0.00010580942034721375, -0.00010134279727935791, -9.687617421150208e-05, -9.240955114364624e-05, -8.79429280757904e-05, -8.347630500793457e-05, -7.900968194007874e-05, -7.45430588722229e-05, -7.007643580436707e-05, -6.560981273651123e-05, -6.11431896686554e-05, -5.667656660079956e-05, -5.2209943532943726e-05, -4.774332046508789e-05, -4.3276697397232056e-05, -3.881007432937622e-05, -3.4343451261520386e-05, -2.987682819366455e-05, -2.5410205125808716e-05, -2.094358205795288e-05, -1.6476958990097046e-05, -1.2010335922241211e-05, -7.543712854385376e-06, -3.077089786529541e-06, 1.389533281326294e-06, 5.856156349182129e-06, 1.0322779417037964e-05, 1.4789402484893799e-05, 1.9256025552749634e-05, 2.372264862060547e-05, 2.8189271688461304e-05, 3.265589475631714e-05, 3.7122517824172974e-05, 4.158914089202881e-05, 4.6055763959884644e-05, 5.052238702774048e-05, 5.4989010095596313e-05, 5.945563316345215e-05, 6.392225623130798e-05, 6.838887929916382e-05, 7.285550236701965e-05, 7.732212543487549e-05, 8.178874850273132e-05, 8.625537157058716e-05, 9.072199463844299e-05, 9.518861770629883e-05, 9.965524077415466e-05, 0.0001041218638420105, 0.00010858848690986633, 0.00011305510997772217, 0.000117521733045578, 0.00012198835611343384, 0.00012645497918128967, 0.0001309216022491455, 0.00013538822531700134, 0.00013985484838485718, 0.000144321471452713, 0.00014878809452056885, 0.00015325471758842468, 0.00015772134065628052, 0.00016218796372413635, 0.0001666545867919922]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 0.0, 4.0, 5.0, 12.0, 10.0, 12.0, 8.0, 26.0, 39.0, 46.0, 73.0, 99.0, 139.0, 328.0, 1036.0, 5306.0, 53085.0, 891507.0, 87414.0, 7272.0, 1254.0, 361.0, 165.0, 113.0, 60.0, 57.0, 30.0, 22.0, 25.0, 20.0, 8.0, 6.0, 2.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0020046234130859375, -0.0019482821226119995, -0.0018919408321380615, -0.0018355995416641235, -0.0017792582511901855, -0.0017229169607162476, -0.0016665756702423096, -0.0016102343797683716, -0.0015538930892944336, -0.0014975517988204956, -0.0014412105083465576, -0.0013848692178726196, -0.0013285279273986816, -0.0012721866369247437, -0.0012158453464508057, -0.0011595040559768677, -0.0011031627655029297, -0.0010468214750289917, -0.0009904801845550537, -0.0009341388940811157, -0.0008777976036071777, -0.0008214563131332397, -0.0007651150226593018, -0.0007087737321853638, -0.0006524324417114258, -0.0005960911512374878, -0.0005397498607635498, -0.0004834085702896118, -0.00042706727981567383, -0.00037072598934173584, -0.00031438469886779785, -0.00025804340839385986, -0.00020170211791992188, -0.0001453608274459839, -8.90195369720459e-05, -3.267824649810791e-05, 2.3663043975830078e-05, 8.000433444976807e-05, 0.00013634562492370605, 0.00019268691539764404, 0.00024902820587158203, 0.00030536949634552, 0.000361710786819458, 0.000418052077293396, 0.000474393367767334, 0.000530734658241272, 0.00058707594871521, 0.000643417239189148, 0.0006997585296630859, 0.0007560998201370239, 0.0008124411106109619, 0.0008687824010848999, 0.0009251236915588379, 0.0009814649820327759, 0.0010378062725067139, 0.0010941475629806519, 0.0011504888534545898, 0.0012068301439285278, 0.0012631714344024658, 0.0013195127248764038, 0.0013758540153503418, 0.0014321953058242798, 0.0014885365962982178, 0.0015448778867721558, 0.0016012191772460938]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 11.0, 14.0, 29.0, 71.0, 148.0, 366.0, 213.0, 72.0, 45.0, 15.0, 14.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010348988143960014, -9.455355757381767e-05, -8.56172337080352e-05, -7.668090984225273e-05, -6.774459325242788e-05, -5.88082657486666e-05, -4.987194552086294e-05, -4.093562165508047e-05, -3.1999297789298e-05, -2.306297392351553e-05, -1.4126651876722462e-05, -5.1903298299293965e-06, 3.745994035853073e-06, 1.2682317901635543e-05, 2.1618638129439205e-05, 3.0554961995221674e-05, 3.9491285861004144e-05, 4.8427609726786613e-05, 5.736393359256908e-05, 6.630025745835155e-05, 7.523657404817641e-05, 8.417290518991649e-05, 9.310922177974135e-05, 0.00010204554564552382, 0.00011098186951130629, 0.00011991819337708876, 0.00012885451724287122, 0.00013779083383269608, 0.00014672716497443616, 0.00015566348156426102, 0.00016459979815408587, 0.00017353612929582596, 0.00018247246043756604, 0.0001914087770273909, 0.00020034510816913098, 0.00020928142475895584, 0.00021821775590069592, 0.00022715407249052078, 0.00023609038908034563, 0.0002450267202220857, 0.0002539630513638258, 0.0002628993825055659, 0.0002718356845434755, 0.0002807720156852156, 0.0002897083468269557, 0.00029864467796869576, 0.0003075809800066054, 0.00031651731114834547, 0.00032545364229008555, 0.00033438997343182564, 0.00034332627546973526, 0.00035226260661147535, 0.00036119893775321543, 0.0003701352688949555, 0.00037907157093286514, 0.0003880079020746052, 0.00039694420411251485, 0.00040588053525425494, 0.00041481683729216456, 0.00042375316843390465, 0.00043268949957564473, 0.0004416258307173848, 0.00045056213275529444, 0.0004594984638970345, 0.0004684347950387746]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 0.0, 3.0, 9.0, 13.0, 12.0, 7.0, 11.0, 21.0, 18.0, 17.0, 22.0, 21.0, 28.0, 25.0, 27.0, 34.0, 32.0, 30.0, 29.0, 36.0, 43.0, 46.0, 30.0, 34.0, 38.0, 38.0, 26.0, 28.0, 30.0, 31.0, 32.0, 28.0, 19.0, 36.0, 25.0, 17.0, 15.0, 16.0, 8.0, 16.0, 8.0, 4.0, 4.0, 5.0, 7.0, 4.0, 2.0, 3.0, 5.0, 5.0, 1.0, 3.0], "bins": [-5.5909156799316406e-05, -5.427934229373932e-05, -5.264952778816223e-05, -5.1019713282585144e-05, -4.938989877700806e-05, -4.776008427143097e-05, -4.613026976585388e-05, -4.4500455260276794e-05, -4.287064075469971e-05, -4.124082624912262e-05, -3.961101174354553e-05, -3.7981197237968445e-05, -3.635138273239136e-05, -3.472156822681427e-05, -3.309175372123718e-05, -3.1461939215660095e-05, -2.9832124710083008e-05, -2.820231020450592e-05, -2.6572495698928833e-05, -2.4942681193351746e-05, -2.3312866687774658e-05, -2.168305218219757e-05, -2.0053237676620483e-05, -1.8423423171043396e-05, -1.679360866546631e-05, -1.5163794159889221e-05, -1.3533979654312134e-05, -1.1904165148735046e-05, -1.0274350643157959e-05, -8.644536137580872e-06, -7.014721632003784e-06, -5.384907126426697e-06, -3.7550926208496094e-06, -2.125278115272522e-06, -4.954636096954346e-07, 1.1343508958816528e-06, 2.7641654014587402e-06, 4.393979907035828e-06, 6.023794412612915e-06, 7.653608918190002e-06, 9.28342342376709e-06, 1.0913237929344177e-05, 1.2543052434921265e-05, 1.4172866940498352e-05, 1.580268144607544e-05, 1.7432495951652527e-05, 1.9062310457229614e-05, 2.06921249628067e-05, 2.232193946838379e-05, 2.3951753973960876e-05, 2.5581568479537964e-05, 2.721138298511505e-05, 2.884119749069214e-05, 3.0471011996269226e-05, 3.2100826501846313e-05, 3.37306410074234e-05, 3.536045551300049e-05, 3.6990270018577576e-05, 3.862008452415466e-05, 4.024989902973175e-05, 4.187971353530884e-05, 4.3509528040885925e-05, 4.513934254646301e-05, 4.67691570520401e-05, 4.839897155761719e-05]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 5.0, 5.0, 7.0, 6.0, 9.0, 10.0, 12.0, 12.0, 17.0, 19.0, 23.0, 33.0, 20.0, 33.0, 29.0, 44.0, 45.0, 42.0, 52.0, 58.0, 48.0, 46.0, 63.0, 47.0, 31.0, 43.0, 30.0, 30.0, 26.0, 23.0, 24.0, 21.0, 19.0, 13.0, 10.0, 10.0, 9.0, 3.0, 6.0, 4.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-4.74609375, -4.6146240234375, -4.483154296875, -4.3516845703125, -4.22021484375, -4.0887451171875, -3.957275390625, -3.8258056640625, -3.6943359375, -3.5628662109375, -3.431396484375, -3.2999267578125, -3.16845703125, -3.0369873046875, -2.905517578125, -2.7740478515625, -2.642578125, -2.5111083984375, -2.379638671875, -2.2481689453125, -2.11669921875, -1.9852294921875, -1.853759765625, -1.7222900390625, -1.5908203125, -1.4593505859375, -1.327880859375, -1.1964111328125, -1.06494140625, -0.9334716796875, -0.802001953125, -0.6705322265625, -0.5390625, -0.4075927734375, -0.276123046875, -0.1446533203125, -0.01318359375, 0.1182861328125, 0.249755859375, 0.3812255859375, 0.5126953125, 0.6441650390625, 0.775634765625, 0.9071044921875, 1.03857421875, 1.1700439453125, 1.301513671875, 1.4329833984375, 1.564453125, 1.6959228515625, 1.827392578125, 1.9588623046875, 2.09033203125, 2.2218017578125, 2.353271484375, 2.4847412109375, 2.6162109375, 2.7476806640625, 2.879150390625, 3.0106201171875, 3.14208984375, 3.2735595703125, 3.405029296875, 3.5364990234375, 3.66796875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 3.0, 4.0, 9.0, 5.0, 13.0, 11.0, 22.0, 28.0, 27.0, 50.0, 71.0, 90.0, 134.0, 199.0, 247.0, 362.0, 511.0, 694.0, 1007.0, 1446.0, 1985.0, 2942.0, 5007.0, 12142.0, 64979.0, 645732.0, 262807.0, 27916.0, 7645.0, 3973.0, 2410.0, 1785.0, 1251.0, 854.0, 638.0, 467.0, 306.0, 222.0, 149.0, 114.0, 71.0, 58.0, 57.0, 36.0, 24.0, 20.0, 8.0, 11.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.8203125, -5.63720703125, -5.4541015625, -5.27099609375, -5.087890625, -4.90478515625, -4.7216796875, -4.53857421875, -4.35546875, -4.17236328125, -3.9892578125, -3.80615234375, -3.623046875, -3.43994140625, -3.2568359375, -3.07373046875, -2.890625, -2.70751953125, -2.5244140625, -2.34130859375, -2.158203125, -1.97509765625, -1.7919921875, -1.60888671875, -1.42578125, -1.24267578125, -1.0595703125, -0.87646484375, -0.693359375, -0.51025390625, -0.3271484375, -0.14404296875, 0.0390625, 0.22216796875, 0.4052734375, 0.58837890625, 0.771484375, 0.95458984375, 1.1376953125, 1.32080078125, 1.50390625, 1.68701171875, 1.8701171875, 2.05322265625, 2.236328125, 2.41943359375, 2.6025390625, 2.78564453125, 2.96875, 3.15185546875, 3.3349609375, 3.51806640625, 3.701171875, 3.88427734375, 4.0673828125, 4.25048828125, 4.43359375, 4.61669921875, 4.7998046875, 4.98291015625, 5.166015625, 5.34912109375, 5.5322265625, 5.71533203125, 5.8984375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 8.0, 10.0, 13.0, 10.0, 13.0, 15.0, 15.0, 13.0, 24.0, 27.0, 31.0, 32.0, 32.0, 32.0, 22.0, 34.0, 39.0, 33.0, 56.0, 47.0, 278.0, 1724.0, 96.0, 45.0, 45.0, 47.0, 45.0, 30.0, 30.0, 35.0, 24.0, 19.0, 16.0, 16.0, 16.0, 17.0, 15.0, 3.0, 8.0, 8.0, 8.0, 2.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.21875, -12.795166015625, -12.37158203125, -11.947998046875, -11.5244140625, -11.100830078125, -10.67724609375, -10.253662109375, -9.830078125, -9.406494140625, -8.98291015625, -8.559326171875, -8.1357421875, -7.712158203125, -7.28857421875, -6.864990234375, -6.44140625, -6.017822265625, -5.59423828125, -5.170654296875, -4.7470703125, -4.323486328125, -3.89990234375, -3.476318359375, -3.052734375, -2.629150390625, -2.20556640625, -1.781982421875, -1.3583984375, -0.934814453125, -0.51123046875, -0.087646484375, 0.3359375, 0.759521484375, 1.18310546875, 1.606689453125, 2.0302734375, 2.453857421875, 2.87744140625, 3.301025390625, 3.724609375, 4.148193359375, 4.57177734375, 4.995361328125, 5.4189453125, 5.842529296875, 6.26611328125, 6.689697265625, 7.11328125, 7.536865234375, 7.96044921875, 8.384033203125, 8.8076171875, 9.231201171875, 9.65478515625, 10.078369140625, 10.501953125, 10.925537109375, 11.34912109375, 11.772705078125, 12.1962890625, 12.619873046875, 13.04345703125, 13.467041015625, 13.890625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 3.0, 6.0, 13.0, 10.0, 9.0, 19.0, 25.0, 40.0, 31.0, 50.0, 108.0, 163.0, 268.0, 529.0, 1496.0, 4890.0, 25738.0, 3049823.0, 51751.0, 7089.0, 1996.0, 704.0, 323.0, 189.0, 113.0, 78.0, 55.0, 32.0, 38.0, 21.0, 21.0, 20.0, 18.0, 8.0, 10.0, 9.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.078125, -22.177490234375, -21.27685546875, -20.376220703125, -19.4755859375, -18.574951171875, -17.67431640625, -16.773681640625, -15.873046875, -14.972412109375, -14.07177734375, -13.171142578125, -12.2705078125, -11.369873046875, -10.46923828125, -9.568603515625, -8.66796875, -7.767333984375, -6.86669921875, -5.966064453125, -5.0654296875, -4.164794921875, -3.26416015625, -2.363525390625, -1.462890625, -0.562255859375, 0.33837890625, 1.239013671875, 2.1396484375, 3.040283203125, 3.94091796875, 4.841552734375, 5.7421875, 6.642822265625, 7.54345703125, 8.444091796875, 9.3447265625, 10.245361328125, 11.14599609375, 12.046630859375, 12.947265625, 13.847900390625, 14.74853515625, 15.649169921875, 16.5498046875, 17.450439453125, 18.35107421875, 19.251708984375, 20.15234375, 21.052978515625, 21.95361328125, 22.854248046875, 23.7548828125, 24.655517578125, 25.55615234375, 26.456787109375, 27.357421875, 28.258056640625, 29.15869140625, 30.059326171875, 30.9599609375, 31.860595703125, 32.76123046875, 33.661865234375, 34.5625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 16.0, 169.0, 634.0, 175.0, 18.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-177.4801788330078, -173.7400665283203, -169.9999542236328, -166.25982666015625, -162.51971435546875, -158.77960205078125, -155.03948974609375, -151.29937744140625, -147.5592498779297, -143.8191375732422, -140.0790252685547, -136.33889770507812, -132.59878540039062, -128.85867309570312, -125.11856079101562, -121.3784408569336, -117.63833618164062, -113.89822387695312, -110.1581039428711, -106.4179916381836, -102.67787170410156, -98.93775939941406, -95.19764709472656, -91.45752716064453, -87.7174072265625, -83.977294921875, -80.23717498779297, -76.49706268310547, -72.75694274902344, -69.01683044433594, -65.27671813964844, -61.536598205566406, -57.79648208618164, -54.056365966796875, -50.31624984741211, -46.576133728027344, -42.836021423339844, -39.09590530395508, -35.35578918457031, -31.61567497253418, -27.875558853149414, -24.13544273376465, -20.395328521728516, -16.65521240234375, -12.9150972366333, -9.174982070922852, -5.434865951538086, -1.6947517395019531, 2.0453643798828125, 5.785479545593262, 9.525594711303711, 13.265710830688477, 17.00582504272461, 20.745941162109375, 24.48605728149414, 28.226171493530273, 31.96628761291504, 35.70640182495117, 39.44651794433594, 43.1866340637207, 46.92675018310547, 50.66686248779297, 54.406982421875, 58.1470947265625, 61.887210845947266]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 7.0, 2.0, 3.0, 13.0, 13.0, 5.0, 14.0, 8.0, 16.0, 20.0, 18.0, 33.0, 30.0, 36.0, 23.0, 41.0, 42.0, 42.0, 45.0, 39.0, 42.0, 48.0, 46.0, 43.0, 37.0, 36.0, 39.0, 38.0, 36.0, 32.0, 20.0, 18.0, 16.0, 15.0, 21.0, 11.0, 18.0, 10.0, 10.0, 6.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.54596710205078, -49.972530364990234, -48.39908981323242, -46.825653076171875, -45.25221633911133, -43.67877960205078, -42.10533905029297, -40.53190231323242, -38.958465576171875, -37.38502883911133, -35.811588287353516, -34.23815155029297, -32.66471481323242, -31.091276168823242, -29.517837524414062, -27.944400787353516, -26.370960235595703, -24.797521591186523, -23.224084854125977, -21.650646209716797, -20.07720947265625, -18.50377082824707, -16.93033218383789, -15.356894493103027, -13.783456802368164, -12.2100191116333, -10.636581420898438, -9.063142776489258, -7.4897050857543945, -5.916267395019531, -4.342828750610352, -2.7693910598754883, -1.195953369140625, 0.3774845600128174, 1.9509224891662598, 3.5243606567382812, 5.0977983474731445, 6.671236038208008, 8.244674682617188, 9.81811237335205, 11.391550064086914, 12.964987754821777, 14.53842544555664, 16.11186408996582, 17.685302734375, 19.258739471435547, 20.832178115844727, 22.405616760253906, 23.979053497314453, 25.552492141723633, 27.12592887878418, 28.69936752319336, 30.272804260253906, 31.846242904663086, 33.419681549072266, 34.99311828613281, 36.566558837890625, 38.13999557495117, 39.713436126708984, 41.28687286376953, 42.86030960083008, 44.433746337890625, 46.00718688964844, 47.580623626708984, 49.15406036376953]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 5.0, 6.0, 5.0, 3.0, 7.0, 6.0, 6.0, 12.0, 12.0, 21.0, 13.0, 10.0, 22.0, 30.0, 23.0, 40.0, 41.0, 36.0, 46.0, 47.0, 39.0, 65.0, 47.0, 47.0, 40.0, 56.0, 48.0, 37.0, 27.0, 29.0, 25.0, 23.0, 18.0, 27.0, 23.0, 8.0, 16.0, 8.0, 8.0, 4.0, 3.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.88671875, -4.7510986328125, -4.615478515625, -4.4798583984375, -4.34423828125, -4.2086181640625, -4.072998046875, -3.9373779296875, -3.8017578125, -3.6661376953125, -3.530517578125, -3.3948974609375, -3.25927734375, -3.1236572265625, -2.988037109375, -2.8524169921875, -2.716796875, -2.5811767578125, -2.445556640625, -2.3099365234375, -2.17431640625, -2.0386962890625, -1.903076171875, -1.7674560546875, -1.6318359375, -1.4962158203125, -1.360595703125, -1.2249755859375, -1.08935546875, -0.9537353515625, -0.818115234375, -0.6824951171875, -0.546875, -0.4112548828125, -0.275634765625, -0.1400146484375, -0.00439453125, 0.1312255859375, 0.266845703125, 0.4024658203125, 0.5380859375, 0.6737060546875, 0.809326171875, 0.9449462890625, 1.08056640625, 1.2161865234375, 1.351806640625, 1.4874267578125, 1.623046875, 1.7586669921875, 1.894287109375, 2.0299072265625, 2.16552734375, 2.3011474609375, 2.436767578125, 2.5723876953125, 2.7080078125, 2.8436279296875, 2.979248046875, 3.1148681640625, 3.25048828125, 3.3861083984375, 3.521728515625, 3.6573486328125, 3.79296875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 7.0, 9.0, 8.0, 13.0, 18.0, 26.0, 53.0, 55.0, 101.0, 153.0, 236.0, 365.0, 647.0, 1125.0, 2015.0, 3697.0, 6986.0, 15007.0, 36032.0, 185140.0, 3196809.0, 648287.0, 57923.0, 20462.0, 9116.0, 4482.0, 2337.0, 1248.0, 777.0, 456.0, 256.0, 155.0, 96.0, 68.0, 36.0, 31.0, 13.0, 16.0, 9.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1015625, -12.6602783203125, -12.218994140625, -11.7777099609375, -11.33642578125, -10.8951416015625, -10.453857421875, -10.0125732421875, -9.5712890625, -9.1300048828125, -8.688720703125, -8.2474365234375, -7.80615234375, -7.3648681640625, -6.923583984375, -6.4822998046875, -6.041015625, -5.5997314453125, -5.158447265625, -4.7171630859375, -4.27587890625, -3.8345947265625, -3.393310546875, -2.9520263671875, -2.5107421875, -2.0694580078125, -1.628173828125, -1.1868896484375, -0.74560546875, -0.3043212890625, 0.136962890625, 0.5782470703125, 1.01953125, 1.4608154296875, 1.902099609375, 2.3433837890625, 2.78466796875, 3.2259521484375, 3.667236328125, 4.1085205078125, 4.5498046875, 4.9910888671875, 5.432373046875, 5.8736572265625, 6.31494140625, 6.7562255859375, 7.197509765625, 7.6387939453125, 8.080078125, 8.5213623046875, 8.962646484375, 9.4039306640625, 9.84521484375, 10.2864990234375, 10.727783203125, 11.1690673828125, 11.6103515625, 12.0516357421875, 12.492919921875, 12.9342041015625, 13.37548828125, 13.8167724609375, 14.258056640625, 14.6993408203125, 15.140625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 7.0, 5.0, 5.0, 6.0, 17.0, 10.0, 13.0, 21.0, 22.0, 32.0, 37.0, 44.0, 71.0, 101.0, 135.0, 284.0, 455.0, 610.0, 691.0, 482.0, 320.0, 191.0, 131.0, 85.0, 63.0, 46.0, 34.0, 30.0, 20.0, 20.0, 13.0, 17.0, 10.0, 5.0, 7.0, 2.0, 8.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.5078125, -11.1611328125, -10.814453125, -10.4677734375, -10.12109375, -9.7744140625, -9.427734375, -9.0810546875, -8.734375, -8.3876953125, -8.041015625, -7.6943359375, -7.34765625, -7.0009765625, -6.654296875, -6.3076171875, -5.9609375, -5.6142578125, -5.267578125, -4.9208984375, -4.57421875, -4.2275390625, -3.880859375, -3.5341796875, -3.1875, -2.8408203125, -2.494140625, -2.1474609375, -1.80078125, -1.4541015625, -1.107421875, -0.7607421875, -0.4140625, -0.0673828125, 0.279296875, 0.6259765625, 0.97265625, 1.3193359375, 1.666015625, 2.0126953125, 2.359375, 2.7060546875, 3.052734375, 3.3994140625, 3.74609375, 4.0927734375, 4.439453125, 4.7861328125, 5.1328125, 5.4794921875, 5.826171875, 6.1728515625, 6.51953125, 6.8662109375, 7.212890625, 7.5595703125, 7.90625, 8.2529296875, 8.599609375, 8.9462890625, 9.29296875, 9.6396484375, 9.986328125, 10.3330078125, 10.6796875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 11.0, 6.0, 16.0, 13.0, 23.0, 38.0, 50.0, 85.0, 127.0, 254.0, 437.0, 847.0, 1551.0, 2817.0, 5401.0, 11128.0, 25088.0, 65748.0, 307244.0, 3104498.0, 527954.0, 84086.0, 30304.0, 13101.0, 6362.0, 3186.0, 1704.0, 957.0, 496.0, 296.0, 149.0, 115.0, 50.0, 41.0, 33.0, 18.0, 1.0, 13.0, 5.0, 8.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.34375, -17.72412109375, -17.1044921875, -16.48486328125, -15.865234375, -15.24560546875, -14.6259765625, -14.00634765625, -13.38671875, -12.76708984375, -12.1474609375, -11.52783203125, -10.908203125, -10.28857421875, -9.6689453125, -9.04931640625, -8.4296875, -7.81005859375, -7.1904296875, -6.57080078125, -5.951171875, -5.33154296875, -4.7119140625, -4.09228515625, -3.47265625, -2.85302734375, -2.2333984375, -1.61376953125, -0.994140625, -0.37451171875, 0.2451171875, 0.86474609375, 1.484375, 2.10400390625, 2.7236328125, 3.34326171875, 3.962890625, 4.58251953125, 5.2021484375, 5.82177734375, 6.44140625, 7.06103515625, 7.6806640625, 8.30029296875, 8.919921875, 9.53955078125, 10.1591796875, 10.77880859375, 11.3984375, 12.01806640625, 12.6376953125, 13.25732421875, 13.876953125, 14.49658203125, 15.1162109375, 15.73583984375, 16.35546875, 16.97509765625, 17.5947265625, 18.21435546875, 18.833984375, 19.45361328125, 20.0732421875, 20.69287109375, 21.3125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 12.0, 6.0, 17.0, 29.0, 42.0, 47.0, 92.0, 146.0, 166.0, 143.0, 97.0, 71.0, 52.0, 30.0, 25.0, 9.0, 9.0, 4.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.87895202636719, -60.52501678466797, -58.171085357666016, -55.81715393066406, -53.463218688964844, -51.109283447265625, -48.75535202026367, -46.40142059326172, -44.0474853515625, -41.69355010986328, -39.33961868286133, -36.985687255859375, -34.631752014160156, -32.27781677246094, -29.923885345458984, -27.5699520111084, -25.216018676757812, -22.862085342407227, -20.50815200805664, -18.154218673706055, -15.800285339355469, -13.446352005004883, -11.092418670654297, -8.738485336303711, -6.384552001953125, -4.030618667602539, -1.6766853332519531, 0.6772480010986328, 3.0311813354492188, 5.385114669799805, 7.739048004150391, 10.092981338500977, 12.446907043457031, 14.800840377807617, 17.154773712158203, 19.50870704650879, 21.862640380859375, 24.21657371520996, 26.570507049560547, 28.924440383911133, 31.27837371826172, 33.63230895996094, 35.98624038696289, 38.340171813964844, 40.69410705566406, 43.04804229736328, 45.401973724365234, 47.75590515136719, 50.109840393066406, 52.463775634765625, 54.81770706176758, 57.17163848876953, 59.52557373046875, 61.87950897216797, 64.23344421386719, 66.58737182617188, 68.9413070678711, 71.29524230957031, 73.649169921875, 76.00310516357422, 78.35704040527344, 80.71097564697266, 83.06491088867188, 85.41883850097656, 87.77277374267578]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 15.0, 5.0, 7.0, 13.0, 17.0, 13.0, 18.0, 19.0, 21.0, 25.0, 19.0, 34.0, 31.0, 27.0, 32.0, 34.0, 32.0, 36.0, 40.0, 43.0, 38.0, 55.0, 40.0, 43.0, 38.0, 40.0, 33.0, 35.0, 33.0, 22.0, 23.0, 22.0, 22.0, 11.0, 17.0, 12.0, 8.0, 4.0, 4.0, 4.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.83740234375, -29.712251663208008, -28.587100982666016, -27.461950302124023, -26.33679962158203, -25.21164894104004, -24.086498260498047, -22.961347579956055, -21.836196899414062, -20.71104621887207, -19.585895538330078, -18.460744857788086, -17.335594177246094, -16.2104434967041, -15.08529281616211, -13.960142135620117, -12.834991455078125, -11.709840774536133, -10.58469009399414, -9.459539413452148, -8.334388732910156, -7.209238052368164, -6.084087371826172, -4.95893669128418, -3.8337860107421875, -2.7086353302001953, -1.5834846496582031, -0.45833396911621094, 0.6668167114257812, 1.7919673919677734, 2.9171180725097656, 4.042268753051758, 5.16741943359375, 6.292570114135742, 7.417720794677734, 8.542871475219727, 9.668022155761719, 10.793172836303711, 11.918323516845703, 13.043474197387695, 14.168624877929688, 15.29377555847168, 16.418926239013672, 17.544076919555664, 18.669227600097656, 19.79437828063965, 20.91952896118164, 22.044679641723633, 23.169830322265625, 24.294981002807617, 25.42013168334961, 26.5452823638916, 27.670433044433594, 28.795583724975586, 29.920734405517578, 31.04588508605957, 32.17103576660156, 33.29618835449219, 34.42133712768555, 35.546485900878906, 36.67163848876953, 37.796791076660156, 38.921939849853516, 40.047088623046875, 41.1722412109375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 2.0, 6.0, 6.0, 3.0, 8.0, 11.0, 5.0, 13.0, 13.0, 14.0, 22.0, 16.0, 19.0, 18.0, 46.0, 34.0, 35.0, 37.0, 42.0, 56.0, 54.0, 39.0, 50.0, 50.0, 38.0, 45.0, 26.0, 43.0, 34.0, 35.0, 25.0, 19.0, 26.0, 18.0, 14.0, 17.0, 9.0, 17.0, 10.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5859375, -4.45037841796875, -4.3148193359375, -4.17926025390625, -4.043701171875, -3.90814208984375, -3.7725830078125, -3.63702392578125, -3.50146484375, -3.36590576171875, -3.2303466796875, -3.09478759765625, -2.959228515625, -2.82366943359375, -2.6881103515625, -2.55255126953125, -2.4169921875, -2.28143310546875, -2.1458740234375, -2.01031494140625, -1.874755859375, -1.73919677734375, -1.6036376953125, -1.46807861328125, -1.33251953125, -1.19696044921875, -1.0614013671875, -0.92584228515625, -0.790283203125, -0.65472412109375, -0.5191650390625, -0.38360595703125, -0.248046875, -0.11248779296875, 0.0230712890625, 0.15863037109375, 0.294189453125, 0.42974853515625, 0.5653076171875, 0.70086669921875, 0.83642578125, 0.97198486328125, 1.1075439453125, 1.24310302734375, 1.378662109375, 1.51422119140625, 1.6497802734375, 1.78533935546875, 1.9208984375, 2.05645751953125, 2.1920166015625, 2.32757568359375, 2.463134765625, 2.59869384765625, 2.7342529296875, 2.86981201171875, 3.00537109375, 3.14093017578125, 3.2764892578125, 3.41204833984375, 3.547607421875, 3.68316650390625, 3.8187255859375, 3.95428466796875, 4.08984375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 7.0, 11.0, 23.0, 23.0, 26.0, 44.0, 53.0, 114.0, 152.0, 274.0, 428.0, 565.0, 923.0, 1324.0, 2170.0, 3612.0, 5823.0, 9344.0, 16295.0, 28390.0, 52544.0, 101748.0, 209119.0, 294309.0, 150298.0, 75696.0, 40080.0, 22142.0, 12761.0, 7549.0, 4722.0, 2866.0, 1814.0, 1143.0, 759.0, 482.0, 320.0, 205.0, 131.0, 105.0, 56.0, 41.0, 21.0, 18.0, 12.0, 10.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.1751708984375, -0.1695709228515625, -0.163970947265625, -0.1583709716796875, -0.15277099609375, -0.1471710205078125, -0.141571044921875, -0.1359710693359375, -0.13037109375, -0.1247711181640625, -0.119171142578125, -0.1135711669921875, -0.10797119140625, -0.1023712158203125, -0.096771240234375, -0.0911712646484375, -0.0855712890625, -0.0799713134765625, -0.074371337890625, -0.0687713623046875, -0.06317138671875, -0.0575714111328125, -0.051971435546875, -0.0463714599609375, -0.040771484375, -0.0351715087890625, -0.029571533203125, -0.0239715576171875, -0.01837158203125, -0.0127716064453125, -0.007171630859375, -0.0015716552734375, 0.0040283203125, 0.0096282958984375, 0.015228271484375, 0.0208282470703125, 0.02642822265625, 0.0320281982421875, 0.037628173828125, 0.0432281494140625, 0.048828125, 0.0544281005859375, 0.060028076171875, 0.0656280517578125, 0.07122802734375, 0.0768280029296875, 0.082427978515625, 0.0880279541015625, 0.0936279296875, 0.0992279052734375, 0.104827880859375, 0.1104278564453125, 0.11602783203125, 0.1216278076171875, 0.127227783203125, 0.1328277587890625, 0.138427734375, 0.1440277099609375, 0.149627685546875, 0.1552276611328125, 0.16082763671875, 0.1664276123046875, 0.172027587890625, 0.1776275634765625, 0.1832275390625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 4.0, 7.0, 5.0, 8.0, 13.0, 16.0, 13.0, 18.0, 24.0, 19.0, 19.0, 36.0, 28.0, 43.0, 33.0, 40.0, 39.0, 50.0, 46.0, 1062.0, 35.0, 43.0, 36.0, 39.0, 36.0, 36.0, 36.0, 30.0, 26.0, 18.0, 25.0, 20.0, 21.0, 17.0, 19.0, 6.0, 9.0, 12.0, 8.0, 4.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.8984375, -2.807220458984375, -2.71600341796875, -2.624786376953125, -2.5335693359375, -2.442352294921875, -2.35113525390625, -2.259918212890625, -2.168701171875, -2.077484130859375, -1.98626708984375, -1.895050048828125, -1.8038330078125, -1.712615966796875, -1.62139892578125, -1.530181884765625, -1.43896484375, -1.347747802734375, -1.25653076171875, -1.165313720703125, -1.0740966796875, -0.982879638671875, -0.89166259765625, -0.800445556640625, -0.709228515625, -0.618011474609375, -0.52679443359375, -0.435577392578125, -0.3443603515625, -0.253143310546875, -0.16192626953125, -0.070709228515625, 0.0205078125, 0.111724853515625, 0.20294189453125, 0.294158935546875, 0.3853759765625, 0.476593017578125, 0.56781005859375, 0.659027099609375, 0.750244140625, 0.841461181640625, 0.93267822265625, 1.023895263671875, 1.1151123046875, 1.206329345703125, 1.29754638671875, 1.388763427734375, 1.47998046875, 1.571197509765625, 1.66241455078125, 1.753631591796875, 1.8448486328125, 1.936065673828125, 2.02728271484375, 2.118499755859375, 2.209716796875, 2.300933837890625, 2.39215087890625, 2.483367919921875, 2.5745849609375, 2.665802001953125, 2.75701904296875, 2.848236083984375, 2.939453125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 6.0, 8.0, 7.0, 18.0, 28.0, 33.0, 59.0, 55.0, 102.0, 139.0, 199.0, 295.0, 449.0, 598.0, 810.0, 1263.0, 1845.0, 2653.0, 3849.0, 5855.0, 8819.0, 13332.0, 21441.0, 33907.0, 54278.0, 88494.0, 149461.0, 1286932.0, 164573.0, 96258.0, 58556.0, 36134.0, 22880.0, 14950.0, 9478.0, 6346.0, 4096.0, 2818.0, 1946.0, 1236.0, 905.0, 631.0, 420.0, 314.0, 189.0, 162.0, 106.0, 66.0, 48.0, 38.0, 17.0, 14.0, 8.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.11968994140625, -0.11590003967285156, -0.11211013793945312, -0.10832023620605469, -0.10453033447265625, -0.10074043273925781, -0.09695053100585938, -0.09316062927246094, -0.0893707275390625, -0.08558082580566406, -0.08179092407226562, -0.07800102233886719, -0.07421112060546875, -0.07042121887207031, -0.06663131713867188, -0.06284141540527344, -0.059051513671875, -0.05526161193847656, -0.051471710205078125, -0.04768180847167969, -0.04389190673828125, -0.04010200500488281, -0.036312103271484375, -0.03252220153808594, -0.0287322998046875, -0.024942398071289062, -0.021152496337890625, -0.017362594604492188, -0.01357269287109375, -0.009782791137695312, -0.005992889404296875, -0.0022029876708984375, 0.0015869140625, 0.0053768157958984375, 0.009166717529296875, 0.012956619262695312, 0.01674652099609375, 0.020536422729492188, 0.024326324462890625, 0.028116226196289062, 0.0319061279296875, 0.03569602966308594, 0.039485931396484375, 0.04327583312988281, 0.04706573486328125, 0.05085563659667969, 0.054645538330078125, 0.05843544006347656, 0.062225341796875, 0.06601524353027344, 0.06980514526367188, 0.07359504699707031, 0.07738494873046875, 0.08117485046386719, 0.08496475219726562, 0.08875465393066406, 0.0925445556640625, 0.09633445739746094, 0.10012435913085938, 0.10391426086425781, 0.10770416259765625, 0.11149406433105469, 0.11528396606445312, 0.11907386779785156, 0.12286376953125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 8.0, 8.0, 9.0, 9.0, 17.0, 19.0, 17.0, 22.0, 33.0, 42.0, 48.0, 84.0, 127.0, 142.0, 101.0, 81.0, 37.0, 19.0, 26.0, 19.0, 28.0, 27.0, 15.0, 12.0, 13.0, 4.0, 2.0, 5.0, 5.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018453598022460938, -0.00017823092639446259, -0.0001719258725643158, -0.000165620818734169, -0.00015931576490402222, -0.00015301071107387543, -0.00014670565724372864, -0.00014040060341358185, -0.00013409554958343506, -0.00012779049575328827, -0.00012148544192314148, -0.00011518038809299469, -0.0001088753342628479, -0.00010257028043270111, -9.626522660255432e-05, -8.996017277240753e-05, -8.365511894226074e-05, -7.735006511211395e-05, -7.104501128196716e-05, -6.473995745182037e-05, -5.8434903621673584e-05, -5.2129849791526794e-05, -4.5824795961380005e-05, -3.9519742131233215e-05, -3.3214688301086426e-05, -2.6909634470939636e-05, -2.0604580640792847e-05, -1.4299526810646057e-05, -7.994472980499268e-06, -1.689419150352478e-06, 4.6156346797943115e-06, 1.0920688509941101e-05, 1.722574234008789e-05, 2.353079617023468e-05, 2.983585000038147e-05, 3.614090383052826e-05, 4.244595766067505e-05, 4.875101149082184e-05, 5.505606532096863e-05, 6.136111915111542e-05, 6.766617298126221e-05, 7.3971226811409e-05, 8.027628064155579e-05, 8.658133447170258e-05, 9.288638830184937e-05, 9.919144213199615e-05, 0.00010549649596214294, 0.00011180154979228973, 0.00011810660362243652, 0.0001244116574525833, 0.0001307167112827301, 0.0001370217651128769, 0.00014332681894302368, 0.00014963187277317047, 0.00015593692660331726, 0.00016224198043346405, 0.00016854703426361084, 0.00017485208809375763, 0.00018115714192390442, 0.0001874621957540512, 0.000193767249584198, 0.0002000723034143448, 0.00020637735724449158, 0.00021268241107463837, 0.00021898746490478516]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 9.0, 3.0, 12.0, 12.0, 16.0, 21.0, 27.0, 40.0, 55.0, 62.0, 96.0, 167.0, 286.0, 717.0, 2330.0, 12102.0, 127233.0, 860822.0, 36618.0, 5536.0, 1239.0, 443.0, 245.0, 137.0, 84.0, 63.0, 40.0, 41.0, 28.0, 16.0, 10.0, 9.0, 4.0, 9.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00225067138671875, -0.002180933952331543, -0.002111196517944336, -0.002041459083557129, -0.001971721649169922, -0.0019019842147827148, -0.0018322467803955078, -0.0017625093460083008, -0.0016927719116210938, -0.0016230344772338867, -0.0015532970428466797, -0.0014835596084594727, -0.0014138221740722656, -0.0013440847396850586, -0.0012743473052978516, -0.0012046098709106445, -0.0011348724365234375, -0.0010651350021362305, -0.0009953975677490234, -0.0009256601333618164, -0.0008559226989746094, -0.0007861852645874023, -0.0007164478302001953, -0.0006467103958129883, -0.0005769729614257812, -0.0005072355270385742, -0.0004374980926513672, -0.00036776065826416016, -0.0002980232238769531, -0.0002282857894897461, -0.00015854835510253906, -8.881092071533203e-05, -1.9073486328125e-05, 5.066394805908203e-05, 0.00012040138244628906, 0.0001901388168334961, 0.0002598762512207031, 0.00032961368560791016, 0.0003993511199951172, 0.0004690885543823242, 0.0005388259887695312, 0.0006085634231567383, 0.0006783008575439453, 0.0007480382919311523, 0.0008177757263183594, 0.0008875131607055664, 0.0009572505950927734, 0.0010269880294799805, 0.0010967254638671875, 0.0011664628982543945, 0.0012362003326416016, 0.0013059377670288086, 0.0013756752014160156, 0.0014454126358032227, 0.0015151500701904297, 0.0015848875045776367, 0.0016546249389648438, 0.0017243623733520508, 0.0017940998077392578, 0.0018638372421264648, 0.0019335746765136719, 0.002003312110900879, 0.002073049545288086, 0.002142786979675293, 0.0022125244140625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 11.0, 24.0, 53.0, 91.0, 269.0, 320.0, 123.0, 56.0, 30.0, 15.0, 3.0, 12.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0005585396429523826, -0.0005473850178532302, -0.0005362303927540779, -0.0005250758258625865, -0.0005139212007634342, -0.0005027665756642818, -0.0004916119505651295, -0.0004804573254659772, -0.0004693027294706553, -0.000458148104371503, -0.0004469935083761811, -0.0004358388832770288, -0.00042468425817787647, -0.0004135296621825546, -0.0004023750370834023, -0.0003912204410880804, -0.0003800658159889281, -0.00036891119088977575, -0.0003577565948944539, -0.00034660196979530156, -0.0003354473737999797, -0.00032429274870082736, -0.00031313812360167503, -0.0003019834985025227, -0.00029082890250720084, -0.0002796742774080485, -0.00026851968141272664, -0.0002573650563135743, -0.000246210431214422, -0.00023505583521910012, -0.0002239012101199478, -0.0002127465995727107, -0.00020159201812930405, -0.00019043740758206695, -0.00017928279703482985, -0.00016812817193567753, -0.00015697356138844043, -0.00014581895084120333, -0.000134664325742051, -0.0001235097151948139, -0.00011235510464757681, -0.00010120049410033971, -9.0045876277145e-05, -7.889125845395029e-05, -6.773664790671319e-05, -5.658203372149728e-05, -4.542741953628138e-05, -3.4272801713086665e-05, -2.3118191165849566e-05, -1.1963576980633661e-05, -8.089627954177558e-07, 1.034565138979815e-05, 2.1500265575014055e-05, 3.265487976022996e-05, 4.3809493945445865e-05, 5.496411176864058e-05, 6.611872231587768e-05, 7.727333286311477e-05, 8.842795068630949e-05, 9.95825685095042e-05, 0.0001107371790567413, 0.0001218917896039784, 0.00013304641470313072, 0.00014420102525036782, 0.00015535563579760492]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 9.0, 4.0, 5.0, 7.0, 2.0, 10.0, 4.0, 17.0, 16.0, 20.0, 19.0, 18.0, 22.0, 26.0, 24.0, 27.0, 41.0, 36.0, 35.0, 29.0, 37.0, 38.0, 49.0, 47.0, 35.0, 39.0, 48.0, 44.0, 30.0, 28.0, 37.0, 23.0, 29.0, 25.0, 13.0, 15.0, 14.0, 13.0, 14.0, 11.0, 7.0, 6.0, 10.0, 12.0, 3.0, 0.0, 6.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.362531661987305e-05, -8.097290992736816e-05, -7.832050323486328e-05, -7.56680965423584e-05, -7.301568984985352e-05, -7.036328315734863e-05, -6.771087646484375e-05, -6.505846977233887e-05, -6.240606307983398e-05, -5.97536563873291e-05, -5.710124969482422e-05, -5.4448843002319336e-05, -5.179643630981445e-05, -4.914402961730957e-05, -4.649162292480469e-05, -4.3839216232299805e-05, -4.118680953979492e-05, -3.853440284729004e-05, -3.5881996154785156e-05, -3.3229589462280273e-05, -3.057718276977539e-05, -2.7924776077270508e-05, -2.5272369384765625e-05, -2.2619962692260742e-05, -1.996755599975586e-05, -1.7315149307250977e-05, -1.4662742614746094e-05, -1.2010335922241211e-05, -9.357929229736328e-06, -6.705522537231445e-06, -4.0531158447265625e-06, -1.4007091522216797e-06, 1.2516975402832031e-06, 3.904104232788086e-06, 6.556510925292969e-06, 9.208917617797852e-06, 1.1861324310302734e-05, 1.4513731002807617e-05, 1.71661376953125e-05, 1.9818544387817383e-05, 2.2470951080322266e-05, 2.512335777282715e-05, 2.777576446533203e-05, 3.0428171157836914e-05, 3.30805778503418e-05, 3.573298454284668e-05, 3.838539123535156e-05, 4.1037797927856445e-05, 4.369020462036133e-05, 4.634261131286621e-05, 4.8995018005371094e-05, 5.1647424697875977e-05, 5.429983139038086e-05, 5.695223808288574e-05, 5.9604644775390625e-05, 6.225705146789551e-05, 6.490945816040039e-05, 6.756186485290527e-05, 7.021427154541016e-05, 7.286667823791504e-05, 7.551908493041992e-05, 7.81714916229248e-05, 8.082389831542969e-05, 8.347630500793457e-05, 8.612871170043945e-05]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 2.0, 6.0, 6.0, 3.0, 8.0, 11.0, 5.0, 13.0, 13.0, 14.0, 22.0, 16.0, 19.0, 18.0, 46.0, 34.0, 35.0, 37.0, 42.0, 56.0, 54.0, 39.0, 50.0, 50.0, 38.0, 45.0, 26.0, 43.0, 34.0, 35.0, 25.0, 19.0, 26.0, 18.0, 14.0, 17.0, 9.0, 17.0, 10.0, 9.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5859375, -4.45037841796875, -4.3148193359375, -4.17926025390625, -4.043701171875, -3.90814208984375, -3.7725830078125, -3.63702392578125, -3.50146484375, -3.36590576171875, -3.2303466796875, -3.09478759765625, -2.959228515625, -2.82366943359375, -2.6881103515625, -2.55255126953125, -2.4169921875, -2.28143310546875, -2.1458740234375, -2.01031494140625, -1.874755859375, -1.73919677734375, -1.6036376953125, -1.46807861328125, -1.33251953125, -1.19696044921875, -1.0614013671875, -0.92584228515625, -0.790283203125, -0.65472412109375, -0.5191650390625, -0.38360595703125, -0.248046875, -0.11248779296875, 0.0230712890625, 0.15863037109375, 0.294189453125, 0.42974853515625, 0.5653076171875, 0.70086669921875, 0.83642578125, 0.97198486328125, 1.1075439453125, 1.24310302734375, 1.378662109375, 1.51422119140625, 1.6497802734375, 1.78533935546875, 1.9208984375, 2.05645751953125, 2.1920166015625, 2.32757568359375, 2.463134765625, 2.59869384765625, 2.7342529296875, 2.86981201171875, 3.00537109375, 3.14093017578125, 3.2764892578125, 3.41204833984375, 3.547607421875, 3.68316650390625, 3.8187255859375, 3.95428466796875, 4.08984375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 8.0, 8.0, 8.0, 12.0, 20.0, 21.0, 17.0, 28.0, 54.0, 53.0, 72.0, 102.0, 160.0, 244.0, 329.0, 461.0, 683.0, 1026.0, 1480.0, 2482.0, 4390.0, 10225.0, 33441.0, 168995.0, 597317.0, 171182.0, 33781.0, 10193.0, 4495.0, 2454.0, 1518.0, 990.0, 686.0, 453.0, 339.0, 234.0, 148.0, 105.0, 76.0, 79.0, 45.0, 29.0, 36.0, 14.0, 14.0, 15.0, 13.0, 9.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-4.03515625, -3.9110107421875, -3.786865234375, -3.6627197265625, -3.53857421875, -3.4144287109375, -3.290283203125, -3.1661376953125, -3.0419921875, -2.9178466796875, -2.793701171875, -2.6695556640625, -2.54541015625, -2.4212646484375, -2.297119140625, -2.1729736328125, -2.048828125, -1.9246826171875, -1.800537109375, -1.6763916015625, -1.55224609375, -1.4281005859375, -1.303955078125, -1.1798095703125, -1.0556640625, -0.9315185546875, -0.807373046875, -0.6832275390625, -0.55908203125, -0.4349365234375, -0.310791015625, -0.1866455078125, -0.0625, 0.0616455078125, 0.185791015625, 0.3099365234375, 0.43408203125, 0.5582275390625, 0.682373046875, 0.8065185546875, 0.9306640625, 1.0548095703125, 1.178955078125, 1.3031005859375, 1.42724609375, 1.5513916015625, 1.675537109375, 1.7996826171875, 1.923828125, 2.0479736328125, 2.172119140625, 2.2962646484375, 2.42041015625, 2.5445556640625, 2.668701171875, 2.7928466796875, 2.9169921875, 3.0411376953125, 3.165283203125, 3.2894287109375, 3.41357421875, 3.5377197265625, 3.661865234375, 3.7860107421875, 3.91015625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 6.0, 8.0, 7.0, 8.0, 8.0, 13.0, 25.0, 32.0, 32.0, 31.0, 38.0, 42.0, 30.0, 41.0, 42.0, 38.0, 71.0, 401.0, 1672.0, 74.0, 57.0, 49.0, 44.0, 32.0, 37.0, 36.0, 37.0, 29.0, 26.0, 19.0, 16.0, 9.0, 8.0, 9.0, 11.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.265625, -18.71630859375, -18.1669921875, -17.61767578125, -17.068359375, -16.51904296875, -15.9697265625, -15.42041015625, -14.87109375, -14.32177734375, -13.7724609375, -13.22314453125, -12.673828125, -12.12451171875, -11.5751953125, -11.02587890625, -10.4765625, -9.92724609375, -9.3779296875, -8.82861328125, -8.279296875, -7.72998046875, -7.1806640625, -6.63134765625, -6.08203125, -5.53271484375, -4.9833984375, -4.43408203125, -3.884765625, -3.33544921875, -2.7861328125, -2.23681640625, -1.6875, -1.13818359375, -0.5888671875, -0.03955078125, 0.509765625, 1.05908203125, 1.6083984375, 2.15771484375, 2.70703125, 3.25634765625, 3.8056640625, 4.35498046875, 4.904296875, 5.45361328125, 6.0029296875, 6.55224609375, 7.1015625, 7.65087890625, 8.2001953125, 8.74951171875, 9.298828125, 9.84814453125, 10.3974609375, 10.94677734375, 11.49609375, 12.04541015625, 12.5947265625, 13.14404296875, 13.693359375, 14.24267578125, 14.7919921875, 15.34130859375, 15.890625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 5.0, 4.0, 5.0, 9.0, 10.0, 8.0, 10.0, 16.0, 17.0, 37.0, 24.0, 42.0, 55.0, 77.0, 99.0, 175.0, 342.0, 964.0, 5095.0, 283253.0, 2844649.0, 8375.0, 1362.0, 405.0, 228.0, 111.0, 85.0, 50.0, 41.0, 32.0, 38.0, 27.0, 16.0, 10.0, 8.0, 10.0, 6.0, 5.0, 9.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.03125, -24.171630859375, -23.31201171875, -22.452392578125, -21.5927734375, -20.733154296875, -19.87353515625, -19.013916015625, -18.154296875, -17.294677734375, -16.43505859375, -15.575439453125, -14.7158203125, -13.856201171875, -12.99658203125, -12.136962890625, -11.27734375, -10.417724609375, -9.55810546875, -8.698486328125, -7.8388671875, -6.979248046875, -6.11962890625, -5.260009765625, -4.400390625, -3.540771484375, -2.68115234375, -1.821533203125, -0.9619140625, -0.102294921875, 0.75732421875, 1.616943359375, 2.4765625, 3.336181640625, 4.19580078125, 5.055419921875, 5.9150390625, 6.774658203125, 7.63427734375, 8.493896484375, 9.353515625, 10.213134765625, 11.07275390625, 11.932373046875, 12.7919921875, 13.651611328125, 14.51123046875, 15.370849609375, 16.23046875, 17.090087890625, 17.94970703125, 18.809326171875, 19.6689453125, 20.528564453125, 21.38818359375, 22.247802734375, 23.107421875, 23.967041015625, 24.82666015625, 25.686279296875, 26.5458984375, 27.405517578125, 28.26513671875, 29.124755859375, 29.984375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [2.0, 1.0, 78.0, 555.0, 361.0, 21.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.706419944763184, -7.173535346984863, -4.640650749206543, -2.1077661514282227, 0.42511844635009766, 2.958003044128418, 5.490887641906738, 8.023772239685059, 10.556656837463379, 13.0895414352417, 15.62242603302002, 18.155311584472656, 20.688194274902344, 23.221080780029297, 25.753963470458984, 28.286849975585938, 30.819732666015625, 33.35261535644531, 35.885501861572266, 38.41838836669922, 40.951271057128906, 43.484153747558594, 46.01704025268555, 48.5499267578125, 51.08280944824219, 53.615692138671875, 56.14857864379883, 58.68146514892578, 61.21434783935547, 63.747230529785156, 66.28012084960938, 68.81300354003906, 71.34588623046875, 73.87876892089844, 76.41165161132812, 78.94454193115234, 81.47742462158203, 84.01030731201172, 86.54319763183594, 89.07608032226562, 91.60896301269531, 94.141845703125, 96.67472839355469, 99.2076187133789, 101.7405014038086, 104.27338409423828, 106.8062744140625, 109.33915710449219, 111.87203979492188, 114.40492248535156, 116.93780517578125, 119.47069549560547, 122.00357818603516, 124.53646087646484, 127.06935119628906, 129.60223388671875, 132.13511657714844, 134.66799926757812, 137.2008819580078, 139.7337646484375, 142.26666259765625, 144.79954528808594, 147.33242797851562, 149.8653106689453, 152.398193359375]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 13.0, 9.0, 8.0, 10.0, 8.0, 16.0, 22.0, 18.0, 30.0, 29.0, 27.0, 31.0, 40.0, 30.0, 39.0, 42.0, 44.0, 44.0, 47.0, 41.0, 45.0, 61.0, 57.0, 27.0, 32.0, 30.0, 30.0, 25.0, 29.0, 24.0, 12.0, 17.0, 13.0, 13.0, 7.0, 3.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.50505447387695, -48.863956451416016, -47.22285461425781, -45.581756591796875, -43.94065856933594, -42.299560546875, -40.6584587097168, -39.01736068725586, -37.37626266479492, -35.735164642333984, -34.09406280517578, -32.452964782714844, -30.811866760253906, -29.170766830444336, -27.529666900634766, -25.888568878173828, -24.247468948364258, -22.606369018554688, -20.96527099609375, -19.32417106628418, -17.683073043823242, -16.041973114013672, -14.400874137878418, -12.759775161743164, -11.11867618560791, -9.477577209472656, -7.836478233337402, -6.19537878036499, -4.554279804229736, -2.913180351257324, -1.2720813751220703, 0.3690176010131836, 2.0101165771484375, 3.6512155532836914, 5.292314529418945, 6.933413982391357, 8.574512481689453, 10.215612411499023, 11.856711387634277, 13.497810363769531, 15.138909339904785, 16.78000831604004, 18.42110824584961, 20.062206268310547, 21.703306198120117, 23.344406127929688, 24.985504150390625, 26.626602172851562, 28.267702102661133, 29.908802032470703, 31.54990005493164, 33.19099807739258, 34.83209991455078, 36.47319793701172, 38.114295959472656, 39.755393981933594, 41.3964958190918, 43.037593841552734, 44.67869567871094, 46.319793701171875, 47.96089172363281, 49.60198974609375, 51.24309158325195, 52.88418960571289, 54.52528762817383]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 4.0, 5.0, 5.0, 8.0, 9.0, 8.0, 11.0, 13.0, 18.0, 14.0, 20.0, 16.0, 17.0, 34.0, 43.0, 26.0, 42.0, 43.0, 57.0, 41.0, 45.0, 46.0, 50.0, 41.0, 35.0, 45.0, 31.0, 34.0, 38.0, 32.0, 19.0, 22.0, 24.0, 18.0, 17.0, 10.0, 9.0, 13.0, 11.0, 6.0, 5.0, 6.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4609375, -4.32666015625, -4.1923828125, -4.05810546875, -3.923828125, -3.78955078125, -3.6552734375, -3.52099609375, -3.38671875, -3.25244140625, -3.1181640625, -2.98388671875, -2.849609375, -2.71533203125, -2.5810546875, -2.44677734375, -2.3125, -2.17822265625, -2.0439453125, -1.90966796875, -1.775390625, -1.64111328125, -1.5068359375, -1.37255859375, -1.23828125, -1.10400390625, -0.9697265625, -0.83544921875, -0.701171875, -0.56689453125, -0.4326171875, -0.29833984375, -0.1640625, -0.02978515625, 0.1044921875, 0.23876953125, 0.373046875, 0.50732421875, 0.6416015625, 0.77587890625, 0.91015625, 1.04443359375, 1.1787109375, 1.31298828125, 1.447265625, 1.58154296875, 1.7158203125, 1.85009765625, 1.984375, 2.11865234375, 2.2529296875, 2.38720703125, 2.521484375, 2.65576171875, 2.7900390625, 2.92431640625, 3.05859375, 3.19287109375, 3.3271484375, 3.46142578125, 3.595703125, 3.72998046875, 3.8642578125, 3.99853515625, 4.1328125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 7.0, 8.0, 12.0, 20.0, 28.0, 43.0, 46.0, 61.0, 93.0, 110.0, 168.0, 250.0, 362.0, 539.0, 726.0, 1136.0, 1713.0, 2542.0, 4223.0, 7002.0, 12309.0, 23572.0, 61232.0, 477667.0, 2889898.0, 579961.0, 72014.0, 25574.0, 13030.0, 7451.0, 4450.0, 2813.0, 1705.0, 1162.0, 722.0, 522.0, 340.0, 272.0, 145.0, 109.0, 76.0, 47.0, 32.0, 29.0, 21.0, 12.0, 12.0, 8.0, 2.0, 3.0, 1.0, 3.0, 1.0], "bins": [-11.5703125, -11.2447509765625, -10.919189453125, -10.5936279296875, -10.26806640625, -9.9425048828125, -9.616943359375, -9.2913818359375, -8.9658203125, -8.6402587890625, -8.314697265625, -7.9891357421875, -7.66357421875, -7.3380126953125, -7.012451171875, -6.6868896484375, -6.361328125, -6.0357666015625, -5.710205078125, -5.3846435546875, -5.05908203125, -4.7335205078125, -4.407958984375, -4.0823974609375, -3.7568359375, -3.4312744140625, -3.105712890625, -2.7801513671875, -2.45458984375, -2.1290283203125, -1.803466796875, -1.4779052734375, -1.15234375, -0.8267822265625, -0.501220703125, -0.1756591796875, 0.14990234375, 0.4754638671875, 0.801025390625, 1.1265869140625, 1.4521484375, 1.7777099609375, 2.103271484375, 2.4288330078125, 2.75439453125, 3.0799560546875, 3.405517578125, 3.7310791015625, 4.056640625, 4.3822021484375, 4.707763671875, 5.0333251953125, 5.35888671875, 5.6844482421875, 6.010009765625, 6.3355712890625, 6.6611328125, 6.9866943359375, 7.312255859375, 7.6378173828125, 7.96337890625, 8.2889404296875, 8.614501953125, 8.9400634765625, 9.265625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 1.0, 6.0, 8.0, 6.0, 16.0, 14.0, 16.0, 18.0, 11.0, 21.0, 36.0, 34.0, 49.0, 61.0, 73.0, 136.0, 207.0, 350.0, 582.0, 722.0, 563.0, 371.0, 226.0, 134.0, 85.0, 64.0, 50.0, 43.0, 32.0, 31.0, 26.0, 17.0, 13.0, 5.0, 10.0, 4.0, 8.0, 6.0, 7.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.53125, -11.1873779296875, -10.843505859375, -10.4996337890625, -10.15576171875, -9.8118896484375, -9.468017578125, -9.1241455078125, -8.7802734375, -8.4364013671875, -8.092529296875, -7.7486572265625, -7.40478515625, -7.0609130859375, -6.717041015625, -6.3731689453125, -6.029296875, -5.6854248046875, -5.341552734375, -4.9976806640625, -4.65380859375, -4.3099365234375, -3.966064453125, -3.6221923828125, -3.2783203125, -2.9344482421875, -2.590576171875, -2.2467041015625, -1.90283203125, -1.5589599609375, -1.215087890625, -0.8712158203125, -0.52734375, -0.1834716796875, 0.160400390625, 0.5042724609375, 0.84814453125, 1.1920166015625, 1.535888671875, 1.8797607421875, 2.2236328125, 2.5675048828125, 2.911376953125, 3.2552490234375, 3.59912109375, 3.9429931640625, 4.286865234375, 4.6307373046875, 4.974609375, 5.3184814453125, 5.662353515625, 6.0062255859375, 6.35009765625, 6.6939697265625, 7.037841796875, 7.3817138671875, 7.7255859375, 8.0694580078125, 8.413330078125, 8.7572021484375, 9.10107421875, 9.4449462890625, 9.788818359375, 10.1326904296875, 10.4765625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 7.0, 9.0, 13.0, 31.0, 50.0, 86.0, 133.0, 252.0, 456.0, 774.0, 1410.0, 2391.0, 4487.0, 8370.0, 16005.0, 33129.0, 78197.0, 336758.0, 2812588.0, 704921.0, 109840.0, 42362.0, 19953.0, 10102.0, 5363.0, 2895.0, 1592.0, 884.0, 467.0, 329.0, 160.0, 114.0, 54.0, 39.0, 16.0, 20.0, 7.0, 12.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7421875, -12.2454833984375, -11.748779296875, -11.2520751953125, -10.75537109375, -10.2586669921875, -9.761962890625, -9.2652587890625, -8.7685546875, -8.2718505859375, -7.775146484375, -7.2784423828125, -6.78173828125, -6.2850341796875, -5.788330078125, -5.2916259765625, -4.794921875, -4.2982177734375, -3.801513671875, -3.3048095703125, -2.80810546875, -2.3114013671875, -1.814697265625, -1.3179931640625, -0.8212890625, -0.3245849609375, 0.172119140625, 0.6688232421875, 1.16552734375, 1.6622314453125, 2.158935546875, 2.6556396484375, 3.15234375, 3.6490478515625, 4.145751953125, 4.6424560546875, 5.13916015625, 5.6358642578125, 6.132568359375, 6.6292724609375, 7.1259765625, 7.6226806640625, 8.119384765625, 8.6160888671875, 9.11279296875, 9.6094970703125, 10.106201171875, 10.6029052734375, 11.099609375, 11.5963134765625, 12.093017578125, 12.5897216796875, 13.08642578125, 13.5831298828125, 14.079833984375, 14.5765380859375, 15.0732421875, 15.5699462890625, 16.066650390625, 16.5633544921875, 17.06005859375, 17.5567626953125, 18.053466796875, 18.5501708984375, 19.046875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 4.0, 6.0, 11.0, 13.0, 17.0, 21.0, 47.0, 64.0, 92.0, 139.0, 108.0, 133.0, 101.0, 78.0, 60.0, 34.0, 21.0, 20.0, 11.0, 10.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-93.07738494873047, -91.0455093383789, -89.01364135742188, -86.98176574707031, -84.94989776611328, -82.91802215576172, -80.88615417480469, -78.85427856445312, -76.82240295410156, -74.79052734375, -72.75865936279297, -70.7267837524414, -68.69491577148438, -66.66304016113281, -64.63116455078125, -62.59929656982422, -60.56742477416992, -58.535552978515625, -56.50368118286133, -54.47180938720703, -52.43993377685547, -50.40806198120117, -48.376190185546875, -46.34431838989258, -44.31244659423828, -42.280574798583984, -40.24870300292969, -38.216827392578125, -36.18495559692383, -34.15308380126953, -32.121212005615234, -30.089340209960938, -28.05746078491211, -26.025588989257812, -23.993715286254883, -21.961843490600586, -19.929969787597656, -17.89809799194336, -15.866226196289062, -13.83435344696045, -11.802480697631836, -9.770607948303223, -7.738735675811768, -5.7068634033203125, -3.674990653991699, -1.643117904663086, 0.38875389099121094, 2.420626640319824, 4.4524993896484375, 6.484372138977051, 8.516244888305664, 10.548116683959961, 12.579989433288574, 14.611862182617188, 16.643733978271484, 18.67560577392578, 20.70747947692871, 22.739351272583008, 24.771224975585938, 26.803096771240234, 28.83496856689453, 30.86684226989746, 32.898712158203125, 34.93058776855469, 36.962459564208984]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 15.0, 10.0, 6.0, 10.0, 15.0, 12.0, 23.0, 25.0, 24.0, 27.0, 25.0, 31.0, 29.0, 35.0, 44.0, 35.0, 40.0, 41.0, 35.0, 37.0, 46.0, 45.0, 39.0, 33.0, 39.0, 47.0, 35.0, 30.0, 23.0, 21.0, 18.0, 18.0, 17.0, 11.0, 11.0, 14.0, 10.0, 11.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-41.79270935058594, -40.66359329223633, -39.53447341918945, -38.405357360839844, -37.27623748779297, -36.14712142944336, -35.01800537109375, -33.888885498046875, -32.759769439697266, -31.630651473999023, -30.50153350830078, -29.372417449951172, -28.24329948425293, -27.114181518554688, -25.985063552856445, -24.855945587158203, -23.72682762145996, -22.59770965576172, -21.468591690063477, -20.339473724365234, -19.210357666015625, -18.081239700317383, -16.95212173461914, -15.823003768920898, -14.693886756896973, -13.56476879119873, -12.435651779174805, -11.306533813476562, -10.17741584777832, -9.048298835754395, -7.919180870056152, -6.790063381195068, -5.660945892333984, -4.5318284034729, -3.4027106761932373, -2.273592948913574, -1.1444754600524902, -0.01535797119140625, 1.113759994506836, 2.24287748336792, 3.371994972229004, 4.501112461090088, 5.630229949951172, 6.759347915649414, 7.888465404510498, 9.017582893371582, 10.146700859069824, 11.27581787109375, 12.404935836791992, 13.534053802490234, 14.66317081451416, 15.792288780212402, 16.921405792236328, 18.05052375793457, 19.179641723632812, 20.308759689331055, 21.437877655029297, 22.56699562072754, 23.69611358642578, 24.82522964477539, 25.954347610473633, 27.083465576171875, 28.212583541870117, 29.34170150756836, 30.47081756591797]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 4.0, 2.0, 7.0, 5.0, 9.0, 7.0, 23.0, 21.0, 18.0, 12.0, 20.0, 31.0, 29.0, 41.0, 35.0, 44.0, 33.0, 50.0, 50.0, 54.0, 44.0, 45.0, 44.0, 48.0, 43.0, 38.0, 30.0, 37.0, 22.0, 24.0, 16.0, 27.0, 21.0, 15.0, 10.0, 4.0, 8.0, 7.0, 6.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.98828125, -4.8446044921875, -4.700927734375, -4.5572509765625, -4.41357421875, -4.2698974609375, -4.126220703125, -3.9825439453125, -3.8388671875, -3.6951904296875, -3.551513671875, -3.4078369140625, -3.26416015625, -3.1204833984375, -2.976806640625, -2.8331298828125, -2.689453125, -2.5457763671875, -2.402099609375, -2.2584228515625, -2.11474609375, -1.9710693359375, -1.827392578125, -1.6837158203125, -1.5400390625, -1.3963623046875, -1.252685546875, -1.1090087890625, -0.96533203125, -0.8216552734375, -0.677978515625, -0.5343017578125, -0.390625, -0.2469482421875, -0.103271484375, 0.0404052734375, 0.18408203125, 0.3277587890625, 0.471435546875, 0.6151123046875, 0.7587890625, 0.9024658203125, 1.046142578125, 1.1898193359375, 1.33349609375, 1.4771728515625, 1.620849609375, 1.7645263671875, 1.908203125, 2.0518798828125, 2.195556640625, 2.3392333984375, 2.48291015625, 2.6265869140625, 2.770263671875, 2.9139404296875, 3.0576171875, 3.2012939453125, 3.344970703125, 3.4886474609375, 3.63232421875, 3.7760009765625, 3.919677734375, 4.0633544921875, 4.20703125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 3.0, 5.0, 9.0, 18.0, 18.0, 24.0, 47.0, 68.0, 80.0, 119.0, 191.0, 247.0, 445.0, 644.0, 1034.0, 1591.0, 2662.0, 4189.0, 6840.0, 11641.0, 20344.0, 36698.0, 69608.0, 139366.0, 306871.0, 222974.0, 102228.0, 52635.0, 28047.0, 15872.0, 9178.0, 5523.0, 3341.0, 2063.0, 1285.0, 871.0, 586.0, 398.0, 287.0, 150.0, 101.0, 98.0, 51.0, 42.0, 24.0, 10.0, 15.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2137451171875, -0.20741844177246094, -0.20109176635742188, -0.1947650909423828, -0.18843841552734375, -0.1821117401123047, -0.17578506469726562, -0.16945838928222656, -0.1631317138671875, -0.15680503845214844, -0.15047836303710938, -0.1441516876220703, -0.13782501220703125, -0.1314983367919922, -0.12517166137695312, -0.11884498596191406, -0.112518310546875, -0.10619163513183594, -0.09986495971679688, -0.09353828430175781, -0.08721160888671875, -0.08088493347167969, -0.07455825805664062, -0.06823158264160156, -0.0619049072265625, -0.05557823181152344, -0.049251556396484375, -0.04292488098144531, -0.03659820556640625, -0.030271530151367188, -0.023944854736328125, -0.017618179321289062, -0.01129150390625, -0.0049648284912109375, 0.001361846923828125, 0.0076885223388671875, 0.01401519775390625, 0.020341873168945312, 0.026668548583984375, 0.03299522399902344, 0.0393218994140625, 0.04564857482910156, 0.051975250244140625, 0.05830192565917969, 0.06462860107421875, 0.07095527648925781, 0.07728195190429688, 0.08360862731933594, 0.089935302734375, 0.09626197814941406, 0.10258865356445312, 0.10891532897949219, 0.11524200439453125, 0.12156867980957031, 0.12789535522460938, 0.13422203063964844, 0.1405487060546875, 0.14687538146972656, 0.15320205688476562, 0.1595287322998047, 0.16585540771484375, 0.1721820831298828, 0.17850875854492188, 0.18483543395996094, 0.191162109375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 4.0, 7.0, 0.0, 3.0, 2.0, 9.0, 9.0, 6.0, 18.0, 14.0, 12.0, 24.0, 12.0, 19.0, 14.0, 25.0, 33.0, 37.0, 34.0, 27.0, 38.0, 40.0, 40.0, 42.0, 33.0, 1056.0, 50.0, 31.0, 32.0, 36.0, 23.0, 31.0, 30.0, 24.0, 28.0, 22.0, 22.0, 20.0, 25.0, 19.0, 15.0, 18.0, 10.0, 8.0, 10.0, 8.0, 8.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.39453125, -2.31005859375, -2.2255859375, -2.14111328125, -2.056640625, -1.97216796875, -1.8876953125, -1.80322265625, -1.71875, -1.63427734375, -1.5498046875, -1.46533203125, -1.380859375, -1.29638671875, -1.2119140625, -1.12744140625, -1.04296875, -0.95849609375, -0.8740234375, -0.78955078125, -0.705078125, -0.62060546875, -0.5361328125, -0.45166015625, -0.3671875, -0.28271484375, -0.1982421875, -0.11376953125, -0.029296875, 0.05517578125, 0.1396484375, 0.22412109375, 0.30859375, 0.39306640625, 0.4775390625, 0.56201171875, 0.646484375, 0.73095703125, 0.8154296875, 0.89990234375, 0.984375, 1.06884765625, 1.1533203125, 1.23779296875, 1.322265625, 1.40673828125, 1.4912109375, 1.57568359375, 1.66015625, 1.74462890625, 1.8291015625, 1.91357421875, 1.998046875, 2.08251953125, 2.1669921875, 2.25146484375, 2.3359375, 2.42041015625, 2.5048828125, 2.58935546875, 2.673828125, 2.75830078125, 2.8427734375, 2.92724609375, 3.01171875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 2.0, 6.0, 10.0, 7.0, 15.0, 15.0, 33.0, 54.0, 78.0, 136.0, 178.0, 278.0, 380.0, 547.0, 752.0, 1136.0, 1655.0, 2538.0, 3671.0, 5436.0, 8248.0, 12738.0, 19812.0, 30941.0, 49019.0, 78612.0, 130237.0, 1264701.0, 187489.0, 110952.0, 67545.0, 42326.0, 26635.0, 17440.0, 11213.0, 7199.0, 4963.0, 3279.0, 2157.0, 1471.0, 1039.0, 680.0, 483.0, 332.0, 231.0, 172.0, 99.0, 62.0, 38.0, 35.0, 25.0, 12.0, 9.0, 3.0, 8.0, 4.0, 1.0, 4.0, 0.0, 3.0], "bins": [-0.11883544921875, -0.11510372161865234, -0.11137199401855469, -0.10764026641845703, -0.10390853881835938, -0.10017681121826172, -0.09644508361816406, -0.0927133560180664, -0.08898162841796875, -0.0852499008178711, -0.08151817321777344, -0.07778644561767578, -0.07405471801757812, -0.07032299041748047, -0.06659126281738281, -0.06285953521728516, -0.0591278076171875, -0.055396080017089844, -0.05166435241699219, -0.04793262481689453, -0.044200897216796875, -0.04046916961669922, -0.03673744201660156, -0.033005714416503906, -0.02927398681640625, -0.025542259216308594, -0.021810531616210938, -0.01807880401611328, -0.014347076416015625, -0.010615348815917969, -0.0068836212158203125, -0.0031518936157226562, 0.000579833984375, 0.004311561584472656, 0.008043289184570312, 0.011775016784667969, 0.015506744384765625, 0.01923847198486328, 0.022970199584960938, 0.026701927185058594, 0.03043365478515625, 0.034165382385253906, 0.03789710998535156, 0.04162883758544922, 0.045360565185546875, 0.04909229278564453, 0.05282402038574219, 0.056555747985839844, 0.0602874755859375, 0.06401920318603516, 0.06775093078613281, 0.07148265838623047, 0.07521438598632812, 0.07894611358642578, 0.08267784118652344, 0.0864095687866211, 0.09014129638671875, 0.0938730239868164, 0.09760475158691406, 0.10133647918701172, 0.10506820678710938, 0.10879993438720703, 0.11253166198730469, 0.11626338958740234, 0.1199951171875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 5.0, 7.0, 8.0, 7.0, 9.0, 5.0, 16.0, 17.0, 21.0, 29.0, 43.0, 50.0, 72.0, 101.0, 123.0, 128.0, 92.0, 61.0, 53.0, 39.0, 27.0, 16.0, 14.0, 10.0, 11.0, 8.0, 3.0, 5.0, 6.0, 3.0, 7.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0002942085266113281, -0.0002866499125957489, -0.0002790912985801697, -0.00027153268456459045, -0.00026397407054901123, -0.000256415456533432, -0.0002488568425178528, -0.00024129822850227356, -0.00023373961448669434, -0.0002261810004711151, -0.0002186223864555359, -0.00021106377243995667, -0.00020350515842437744, -0.00019594654440879822, -0.000188387930393219, -0.00018082931637763977, -0.00017327070236206055, -0.00016571208834648132, -0.0001581534743309021, -0.00015059486031532288, -0.00014303624629974365, -0.00013547763228416443, -0.0001279190182685852, -0.00012036040425300598, -0.00011280179023742676, -0.00010524317622184753, -9.768456220626831e-05, -9.012594819068909e-05, -8.256733417510986e-05, -7.500872015953064e-05, -6.745010614395142e-05, -5.989149212837219e-05, -5.233287811279297e-05, -4.4774264097213745e-05, -3.721565008163452e-05, -2.9657036066055298e-05, -2.2098422050476074e-05, -1.453980803489685e-05, -6.981194019317627e-06, 5.774199962615967e-07, 8.13603401184082e-06, 1.5694648027420044e-05, 2.3253262042999268e-05, 3.081187605857849e-05, 3.8370490074157715e-05, 4.592910408973694e-05, 5.348771810531616e-05, 6.104633212089539e-05, 6.860494613647461e-05, 7.616356015205383e-05, 8.372217416763306e-05, 9.128078818321228e-05, 9.88394021987915e-05, 0.00010639801621437073, 0.00011395663022994995, 0.00012151524424552917, 0.0001290738582611084, 0.00013663247227668762, 0.00014419108629226685, 0.00015174970030784607, 0.0001593083143234253, 0.00016686692833900452, 0.00017442554235458374, 0.00018198415637016296, 0.0001895427703857422]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 7.0, 3.0, 8.0, 5.0, 10.0, 10.0, 11.0, 15.0, 28.0, 41.0, 46.0, 87.0, 178.0, 299.0, 730.0, 2614.0, 25632.0, 927766.0, 84161.0, 4984.0, 1045.0, 356.0, 179.0, 116.0, 67.0, 43.0, 32.0, 22.0, 13.0, 11.0, 14.0, 3.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025768280029296875, -0.0024836957454681396, -0.002390563488006592, -0.002297431230545044, -0.002204298973083496, -0.0021111667156219482, -0.0020180344581604004, -0.0019249022006988525, -0.0018317699432373047, -0.0017386376857757568, -0.001645505428314209, -0.0015523731708526611, -0.0014592409133911133, -0.0013661086559295654, -0.0012729763984680176, -0.0011798441410064697, -0.0010867118835449219, -0.000993579626083374, -0.0009004473686218262, -0.0008073151111602783, -0.0007141828536987305, -0.0006210505962371826, -0.0005279183387756348, -0.0004347860813140869, -0.00034165382385253906, -0.0002485215663909912, -0.00015538930892944336, -6.225705146789551e-05, 3.0875205993652344e-05, 0.0001240074634552002, 0.00021713972091674805, 0.0003102719783782959, 0.00040340423583984375, 0.0004965364933013916, 0.0005896687507629395, 0.0006828010082244873, 0.0007759332656860352, 0.000869065523147583, 0.0009621977806091309, 0.0010553300380706787, 0.0011484622955322266, 0.0012415945529937744, 0.0013347268104553223, 0.0014278590679168701, 0.001520991325378418, 0.0016141235828399658, 0.0017072558403015137, 0.0018003880977630615, 0.0018935203552246094, 0.0019866526126861572, 0.002079784870147705, 0.002172917127609253, 0.0022660493850708008, 0.0023591816425323486, 0.0024523138999938965, 0.0025454461574554443, 0.002638578414916992, 0.00273171067237854, 0.002824842929840088, 0.0029179751873016357, 0.0030111074447631836, 0.0031042397022247314, 0.0031973719596862793, 0.003290504217147827, 0.003383636474609375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 6.0, 19.0, 67.0, 276.0, 450.0, 142.0, 38.0, 9.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016187355504371226, -0.00014212331734597683, -0.0001223730796482414, -0.00010262283467454836, -8.287259697681293e-05, -6.31223592790775e-05, -4.337211430538446e-05, -2.3621876607649028e-05, -3.8716389099135995e-06, 1.5878600606811233e-05, 3.5628840123536065e-05, 5.53790814592503e-05, 7.512931915698573e-05, 9.487955685472116e-05, 0.0001146298018284142, 0.00013438003952614963, 0.00015413027722388506, 0.0001738805149216205, 0.00019363075261935592, 0.00021338099031709135, 0.00023313122801482677, 0.0002528814657125622, 0.00027263170341029763, 0.0002923819702118635, 0.0003121321788057685, 0.0003318824165035039, 0.00035163265420123935, 0.0003713828918989748, 0.0003911331295967102, 0.00041088336729444563, 0.00043063360499218106, 0.00045038387179374695, 0.00047013413859531283, 0.0004898844053968787, 0.0005096346139907837, 0.0005293848807923496, 0.0005491350893862545, 0.0005688853561878204, 0.0005886355647817254, 0.0006083858315832913, 0.0006281360401771963, 0.0006478863069787621, 0.0006676365155726671, 0.000687386782374233, 0.000707136990968138, 0.0007268872577697039, 0.0007466374663636088, 0.0007663877331651747, 0.0007861379999667406, 0.0008058882667683065, 0.0008256384753622115, 0.0008453887421637774, 0.0008651389507576823, 0.0008848892175592482, 0.0009046394261531532, 0.0009243896929547191, 0.000944139901548624, 0.0009638901683501899, 0.0009836404351517558, 0.0010033906437456608, 0.0010231408523395658, 0.0010428910609334707, 0.0010626413859426975, 0.0010823915945366025, 0.0011021418031305075]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 4.0, 7.0, 8.0, 9.0, 12.0, 12.0, 17.0, 14.0, 19.0, 19.0, 27.0, 26.0, 32.0, 52.0, 36.0, 33.0, 42.0, 31.0, 43.0, 51.0, 42.0, 47.0, 38.0, 52.0, 35.0, 34.0, 45.0, 26.0, 26.0, 28.0, 18.0, 17.0, 18.0, 16.0, 14.0, 14.0, 13.0, 9.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.781122207641602e-05, -9.447243064641953e-05, -9.113363921642303e-05, -8.779484778642654e-05, -8.445605635643005e-05, -8.111726492643356e-05, -7.777847349643707e-05, -7.443968206644058e-05, -7.110089063644409e-05, -6.77620992064476e-05, -6.442330777645111e-05, -6.108451634645462e-05, -5.774572491645813e-05, -5.440693348646164e-05, -5.106814205646515e-05, -4.772935062646866e-05, -4.439055919647217e-05, -4.105176776647568e-05, -3.771297633647919e-05, -3.4374184906482697e-05, -3.1035393476486206e-05, -2.7696602046489716e-05, -2.4357810616493225e-05, -2.1019019186496735e-05, -1.7680227756500244e-05, -1.4341436326503754e-05, -1.1002644896507263e-05, -7.663853466510773e-06, -4.325062036514282e-06, -9.862706065177917e-07, 2.3525208234786987e-06, 5.691312253475189e-06, 9.03010368347168e-06, 1.236889511346817e-05, 1.570768654346466e-05, 1.904647797346115e-05, 2.238526940345764e-05, 2.5724060833454132e-05, 2.9062852263450623e-05, 3.240164369344711e-05, 3.5740435123443604e-05, 3.9079226553440094e-05, 4.2418017983436584e-05, 4.5756809413433075e-05, 4.9095600843429565e-05, 5.2434392273426056e-05, 5.5773183703422546e-05, 5.911197513341904e-05, 6.245076656341553e-05, 6.578955799341202e-05, 6.912834942340851e-05, 7.2467140853405e-05, 7.580593228340149e-05, 7.914472371339798e-05, 8.248351514339447e-05, 8.582230657339096e-05, 8.916109800338745e-05, 9.249988943338394e-05, 9.583868086338043e-05, 9.917747229337692e-05, 0.00010251626372337341, 0.0001058550551533699, 0.0001091938465833664, 0.00011253263801336288, 0.00011587142944335938]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 4.0, 2.0, 7.0, 5.0, 9.0, 7.0, 23.0, 21.0, 18.0, 12.0, 20.0, 31.0, 29.0, 41.0, 35.0, 44.0, 33.0, 50.0, 50.0, 54.0, 44.0, 45.0, 44.0, 48.0, 43.0, 38.0, 30.0, 37.0, 22.0, 24.0, 16.0, 27.0, 21.0, 15.0, 10.0, 4.0, 8.0, 7.0, 6.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.98828125, -4.8446044921875, -4.700927734375, -4.5572509765625, -4.41357421875, -4.2698974609375, -4.126220703125, -3.9825439453125, -3.8388671875, -3.6951904296875, -3.551513671875, -3.4078369140625, -3.26416015625, -3.1204833984375, -2.976806640625, -2.8331298828125, -2.689453125, -2.5457763671875, -2.402099609375, -2.2584228515625, -2.11474609375, -1.9710693359375, -1.827392578125, -1.6837158203125, -1.5400390625, -1.3963623046875, -1.252685546875, -1.1090087890625, -0.96533203125, -0.8216552734375, -0.677978515625, -0.5343017578125, -0.390625, -0.2469482421875, -0.103271484375, 0.0404052734375, 0.18408203125, 0.3277587890625, 0.471435546875, 0.6151123046875, 0.7587890625, 0.9024658203125, 1.046142578125, 1.1898193359375, 1.33349609375, 1.4771728515625, 1.620849609375, 1.7645263671875, 1.908203125, 2.0518798828125, 2.195556640625, 2.3392333984375, 2.48291015625, 2.6265869140625, 2.770263671875, 2.9139404296875, 3.0576171875, 3.2012939453125, 3.344970703125, 3.4886474609375, 3.63232421875, 3.7760009765625, 3.919677734375, 4.0633544921875, 4.20703125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 5.0, 9.0, 6.0, 13.0, 17.0, 19.0, 22.0, 38.0, 68.0, 86.0, 114.0, 165.0, 214.0, 289.0, 437.0, 634.0, 830.0, 1219.0, 1826.0, 2722.0, 4598.0, 11805.0, 59921.0, 406844.0, 459695.0, 69979.0, 13049.0, 4990.0, 2812.0, 1863.0, 1228.0, 893.0, 607.0, 395.0, 339.0, 212.0, 159.0, 113.0, 72.0, 63.0, 38.0, 38.0, 24.0, 19.0, 15.0, 11.0, 8.0, 14.0, 4.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.80078125, -4.6461181640625, -4.491455078125, -4.3367919921875, -4.18212890625, -4.0274658203125, -3.872802734375, -3.7181396484375, -3.5634765625, -3.4088134765625, -3.254150390625, -3.0994873046875, -2.94482421875, -2.7901611328125, -2.635498046875, -2.4808349609375, -2.326171875, -2.1715087890625, -2.016845703125, -1.8621826171875, -1.70751953125, -1.5528564453125, -1.398193359375, -1.2435302734375, -1.0888671875, -0.9342041015625, -0.779541015625, -0.6248779296875, -0.47021484375, -0.3155517578125, -0.160888671875, -0.0062255859375, 0.1484375, 0.3031005859375, 0.457763671875, 0.6124267578125, 0.76708984375, 0.9217529296875, 1.076416015625, 1.2310791015625, 1.3857421875, 1.5404052734375, 1.695068359375, 1.8497314453125, 2.00439453125, 2.1590576171875, 2.313720703125, 2.4683837890625, 2.623046875, 2.7777099609375, 2.932373046875, 3.0870361328125, 3.24169921875, 3.3963623046875, 3.551025390625, 3.7056884765625, 3.8603515625, 4.0150146484375, 4.169677734375, 4.3243408203125, 4.47900390625, 4.6336669921875, 4.788330078125, 4.9429931640625, 5.09765625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 4.0, 5.0, 9.0, 13.0, 17.0, 23.0, 13.0, 18.0, 28.0, 32.0, 38.0, 36.0, 43.0, 58.0, 62.0, 70.0, 96.0, 1735.0, 257.0, 57.0, 63.0, 58.0, 49.0, 48.0, 32.0, 29.0, 24.0, 25.0, 21.0, 20.0, 15.0, 15.0, 4.0, 8.0, 8.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.796875, -16.213134765625, -15.62939453125, -15.045654296875, -14.4619140625, -13.878173828125, -13.29443359375, -12.710693359375, -12.126953125, -11.543212890625, -10.95947265625, -10.375732421875, -9.7919921875, -9.208251953125, -8.62451171875, -8.040771484375, -7.45703125, -6.873291015625, -6.28955078125, -5.705810546875, -5.1220703125, -4.538330078125, -3.95458984375, -3.370849609375, -2.787109375, -2.203369140625, -1.61962890625, -1.035888671875, -0.4521484375, 0.131591796875, 0.71533203125, 1.299072265625, 1.8828125, 2.466552734375, 3.05029296875, 3.634033203125, 4.2177734375, 4.801513671875, 5.38525390625, 5.968994140625, 6.552734375, 7.136474609375, 7.72021484375, 8.303955078125, 8.8876953125, 9.471435546875, 10.05517578125, 10.638916015625, 11.22265625, 11.806396484375, 12.39013671875, 12.973876953125, 13.5576171875, 14.141357421875, 14.72509765625, 15.308837890625, 15.892578125, 16.476318359375, 17.06005859375, 17.643798828125, 18.2275390625, 18.811279296875, 19.39501953125, 19.978759765625, 20.5625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 13.0, 21.0, 25.0, 35.0, 60.0, 101.0, 218.0, 569.0, 1675.0, 15076.0, 3101025.0, 23599.0, 2161.0, 597.0, 240.0, 117.0, 62.0, 50.0, 26.0, 18.0, 9.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.59375, -45.8671875, -44.140625, -42.4140625, -40.6875, -38.9609375, -37.234375, -35.5078125, -33.78125, -32.0546875, -30.328125, -28.6015625, -26.875, -25.1484375, -23.421875, -21.6953125, -19.96875, -18.2421875, -16.515625, -14.7890625, -13.0625, -11.3359375, -9.609375, -7.8828125, -6.15625, -4.4296875, -2.703125, -0.9765625, 0.75, 2.4765625, 4.203125, 5.9296875, 7.65625, 9.3828125, 11.109375, 12.8359375, 14.5625, 16.2890625, 18.015625, 19.7421875, 21.46875, 23.1953125, 24.921875, 26.6484375, 28.375, 30.1015625, 31.828125, 33.5546875, 35.28125, 37.0078125, 38.734375, 40.4609375, 42.1875, 43.9140625, 45.640625, 47.3671875, 49.09375, 50.8203125, 52.546875, 54.2734375, 56.0, 57.7265625, 59.453125, 61.1796875, 62.90625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 16.0, 810.0, 189.0, 2.0, 2.0, 1.0], "bins": [-646.9931640625, -636.1585693359375, -625.3239135742188, -614.4893188476562, -603.6547241210938, -592.820068359375, -581.9854736328125, -571.15087890625, -560.3162841796875, -549.481689453125, -538.6470336914062, -527.8124389648438, -516.9778442382812, -506.1432189941406, -495.30859375, -484.4739990234375, -473.63934326171875, -462.8047180175781, -451.9701232910156, -441.135498046875, -430.3009033203125, -419.4662780761719, -408.63165283203125, -397.79705810546875, -386.9624328613281, -376.1278076171875, -365.293212890625, -354.4585876464844, -343.62396240234375, -332.78936767578125, -321.9547424316406, -311.1201171875, -300.2854919433594, -289.45086669921875, -278.61627197265625, -267.7816467285156, -256.947021484375, -246.1124267578125, -235.27780151367188, -224.4431915283203, -213.60858154296875, -202.7739715576172, -191.93936157226562, -181.104736328125, -170.27012634277344, -159.43551635742188, -148.60089111328125, -137.7662811279297, -126.93167114257812, -116.09706115722656, -105.26244354248047, -94.42782592773438, -83.59321594238281, -72.75860595703125, -61.923988342285156, -51.08937072753906, -40.2547607421875, -29.420146942138672, -18.585533142089844, -7.750919342041016, 3.0836944580078125, 13.91830825805664, 24.75292205810547, 35.58753967285156, 46.422149658203125]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 2.0, 4.0, 6.0, 8.0, 3.0, 5.0, 10.0, 11.0, 9.0, 13.0, 16.0, 21.0, 18.0, 19.0, 22.0, 20.0, 22.0, 23.0, 38.0, 32.0, 30.0, 32.0, 37.0, 36.0, 41.0, 32.0, 38.0, 28.0, 39.0, 43.0, 34.0, 25.0, 42.0, 38.0, 25.0, 27.0, 18.0, 22.0, 11.0, 18.0, 10.0, 9.0, 13.0, 11.0, 9.0, 8.0, 4.0, 5.0, 10.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-46.1485595703125, -44.679508209228516, -43.210453033447266, -41.74140167236328, -40.27234649658203, -38.80329513549805, -37.33424377441406, -35.86518859863281, -34.39613342285156, -32.92708206176758, -31.458026885986328, -29.988975524902344, -28.519920349121094, -27.05086898803711, -25.581815719604492, -24.112762451171875, -22.64371109008789, -21.174657821655273, -19.705604553222656, -18.236553192138672, -16.767498016357422, -15.298445701599121, -13.82939338684082, -12.360340118408203, -10.891286849975586, -9.422233581542969, -7.95318078994751, -6.484127998352051, -5.015074729919434, -3.5460214614868164, -2.0769691467285156, -0.6079158782958984, 0.8611335754394531, 2.330186605453491, 3.7992396354675293, 5.268292427062988, 6.7373456954956055, 8.206398963928223, 9.675451278686523, 11.14450454711914, 12.613557815551758, 14.082611083984375, 15.551664352416992, 17.02071762084961, 18.489768981933594, 19.958824157714844, 21.427875518798828, 22.896928787231445, 24.365982055664062, 25.83503532409668, 27.304088592529297, 28.77313995361328, 30.24219512939453, 31.711246490478516, 33.1802978515625, 34.64935302734375, 36.118408203125, 37.587459564208984, 39.056514739990234, 40.52556610107422, 41.99462127685547, 43.46367263793945, 44.93272399902344, 46.40177917480469, 47.87083053588867]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 7.0, 4.0, 3.0, 7.0, 5.0, 13.0, 18.0, 16.0, 20.0, 22.0, 14.0, 16.0, 38.0, 29.0, 47.0, 52.0, 37.0, 41.0, 54.0, 49.0, 49.0, 41.0, 41.0, 44.0, 44.0, 36.0, 42.0, 28.0, 34.0, 27.0, 27.0, 21.0, 16.0, 12.0, 10.0, 8.0, 5.0, 5.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2734375, -5.11822509765625, -4.9630126953125, -4.80780029296875, -4.652587890625, -4.49737548828125, -4.3421630859375, -4.18695068359375, -4.03173828125, -3.87652587890625, -3.7213134765625, -3.56610107421875, -3.410888671875, -3.25567626953125, -3.1004638671875, -2.94525146484375, -2.7900390625, -2.63482666015625, -2.4796142578125, -2.32440185546875, -2.169189453125, -2.01397705078125, -1.8587646484375, -1.70355224609375, -1.54833984375, -1.39312744140625, -1.2379150390625, -1.08270263671875, -0.927490234375, -0.77227783203125, -0.6170654296875, -0.46185302734375, -0.306640625, -0.15142822265625, 0.0037841796875, 0.15899658203125, 0.314208984375, 0.46942138671875, 0.6246337890625, 0.77984619140625, 0.93505859375, 1.09027099609375, 1.2454833984375, 1.40069580078125, 1.555908203125, 1.71112060546875, 1.8663330078125, 2.02154541015625, 2.1767578125, 2.33197021484375, 2.4871826171875, 2.64239501953125, 2.797607421875, 2.95281982421875, 3.1080322265625, 3.26324462890625, 3.41845703125, 3.57366943359375, 3.7288818359375, 3.88409423828125, 4.039306640625, 4.19451904296875, 4.3497314453125, 4.50494384765625, 4.66015625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 14.0, 15.0, 19.0, 19.0, 41.0, 44.0, 69.0, 136.0, 238.0, 318.0, 564.0, 947.0, 1766.0, 3385.0, 6371.0, 13043.0, 30565.0, 122735.0, 2230547.0, 1626561.0, 102866.0, 28354.0, 12456.0, 6029.0, 3199.0, 1705.0, 988.0, 514.0, 286.0, 198.0, 106.0, 64.0, 37.0, 19.0, 15.0, 10.0, 10.0, 6.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-15.9453125, -15.513671875, -15.08203125, -14.650390625, -14.21875, -13.787109375, -13.35546875, -12.923828125, -12.4921875, -12.060546875, -11.62890625, -11.197265625, -10.765625, -10.333984375, -9.90234375, -9.470703125, -9.0390625, -8.607421875, -8.17578125, -7.744140625, -7.3125, -6.880859375, -6.44921875, -6.017578125, -5.5859375, -5.154296875, -4.72265625, -4.291015625, -3.859375, -3.427734375, -2.99609375, -2.564453125, -2.1328125, -1.701171875, -1.26953125, -0.837890625, -0.40625, 0.025390625, 0.45703125, 0.888671875, 1.3203125, 1.751953125, 2.18359375, 2.615234375, 3.046875, 3.478515625, 3.91015625, 4.341796875, 4.7734375, 5.205078125, 5.63671875, 6.068359375, 6.5, 6.931640625, 7.36328125, 7.794921875, 8.2265625, 8.658203125, 9.08984375, 9.521484375, 9.953125, 10.384765625, 10.81640625, 11.248046875, 11.6796875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 7.0, 11.0, 13.0, 29.0, 46.0, 41.0, 63.0, 99.0, 170.0, 281.0, 493.0, 838.0, 890.0, 505.0, 209.0, 131.0, 66.0, 45.0, 46.0, 34.0, 18.0, 7.0, 10.0, 6.0, 2.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4609375, -9.9364013671875, -9.411865234375, -8.8873291015625, -8.36279296875, -7.8382568359375, -7.313720703125, -6.7891845703125, -6.2646484375, -5.7401123046875, -5.215576171875, -4.6910400390625, -4.16650390625, -3.6419677734375, -3.117431640625, -2.5928955078125, -2.068359375, -1.5438232421875, -1.019287109375, -0.4947509765625, 0.02978515625, 0.5543212890625, 1.078857421875, 1.6033935546875, 2.1279296875, 2.6524658203125, 3.177001953125, 3.7015380859375, 4.22607421875, 4.7506103515625, 5.275146484375, 5.7996826171875, 6.32421875, 6.8487548828125, 7.373291015625, 7.8978271484375, 8.42236328125, 8.9468994140625, 9.471435546875, 9.9959716796875, 10.5205078125, 11.0450439453125, 11.569580078125, 12.0941162109375, 12.61865234375, 13.1431884765625, 13.667724609375, 14.1922607421875, 14.716796875, 15.2413330078125, 15.765869140625, 16.2904052734375, 16.81494140625, 17.3394775390625, 17.864013671875, 18.3885498046875, 18.9130859375, 19.4376220703125, 19.962158203125, 20.4866943359375, 21.01123046875, 21.5357666015625, 22.060302734375, 22.5848388671875, 23.109375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 2.0, 7.0, 10.0, 11.0, 11.0, 14.0, 43.0, 47.0, 56.0, 126.0, 230.0, 458.0, 791.0, 1721.0, 3832.0, 8869.0, 23981.0, 72591.0, 428616.0, 3221012.0, 331526.0, 63966.0, 21263.0, 8263.0, 3484.0, 1634.0, 763.0, 423.0, 214.0, 121.0, 66.0, 49.0, 24.0, 21.0, 10.0, 9.0, 11.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-25.703125, -25.03466796875, -24.3662109375, -23.69775390625, -23.029296875, -22.36083984375, -21.6923828125, -21.02392578125, -20.35546875, -19.68701171875, -19.0185546875, -18.35009765625, -17.681640625, -17.01318359375, -16.3447265625, -15.67626953125, -15.0078125, -14.33935546875, -13.6708984375, -13.00244140625, -12.333984375, -11.66552734375, -10.9970703125, -10.32861328125, -9.66015625, -8.99169921875, -8.3232421875, -7.65478515625, -6.986328125, -6.31787109375, -5.6494140625, -4.98095703125, -4.3125, -3.64404296875, -2.9755859375, -2.30712890625, -1.638671875, -0.97021484375, -0.3017578125, 0.36669921875, 1.03515625, 1.70361328125, 2.3720703125, 3.04052734375, 3.708984375, 4.37744140625, 5.0458984375, 5.71435546875, 6.3828125, 7.05126953125, 7.7197265625, 8.38818359375, 9.056640625, 9.72509765625, 10.3935546875, 11.06201171875, 11.73046875, 12.39892578125, 13.0673828125, 13.73583984375, 14.404296875, 15.07275390625, 15.7412109375, 16.40966796875, 17.078125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 12.0, 13.0, 16.0, 62.0, 105.0, 182.0, 252.0, 174.0, 105.0, 41.0, 21.0, 9.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.0196533203125, -138.1363067626953, -134.25296020507812, -130.36962890625, -126.48627471923828, -122.60293579101562, -118.71958923339844, -114.83624267578125, -110.9529037475586, -107.0695571899414, -103.18621826171875, -99.30287170410156, -95.41952514648438, -91.53618621826172, -87.65283966064453, -83.76950073242188, -79.88615417480469, -76.0028076171875, -72.11946868896484, -68.23612213134766, -64.35277557373047, -60.46943664550781, -56.586090087890625, -52.7027473449707, -48.81939697265625, -44.93605422973633, -41.05270767211914, -37.16936492919922, -33.2860221862793, -29.402677536010742, -25.519332885742188, -21.635990142822266, -17.752647399902344, -13.869303703308105, -9.985960006713867, -6.1026153564453125, -2.219271659851074, 1.664072036743164, 5.547416687011719, 9.43075942993164, 13.314104080200195, 17.19744873046875, 21.080791473388672, 24.964136123657227, 28.84748077392578, 32.7308235168457, 36.614166259765625, 40.49751281738281, 44.380855560302734, 48.264198303222656, 52.147544860839844, 56.030887603759766, 59.91423034667969, 63.797576904296875, 67.68092346191406, 71.56426239013672, 75.4476089477539, 79.3309555053711, 83.21429443359375, 87.09764099121094, 90.98098754882812, 94.86432647705078, 98.74767303466797, 102.63101196289062, 106.51435852050781]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 7.0, 10.0, 8.0, 10.0, 24.0, 14.0, 25.0, 21.0, 28.0, 22.0, 35.0, 37.0, 37.0, 46.0, 47.0, 59.0, 48.0, 46.0, 51.0, 53.0, 42.0, 52.0, 43.0, 41.0, 28.0, 32.0, 19.0, 35.0, 20.0, 19.0, 6.0, 9.0, 11.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.46049499511719, -48.06324768066406, -46.66600036621094, -45.26875305175781, -43.87150573730469, -42.47425842285156, -41.07701110839844, -39.67976760864258, -38.28252029418945, -36.88527297973633, -35.4880256652832, -34.09077835083008, -32.69353103637695, -31.29628562927246, -29.899038314819336, -28.501792907714844, -27.104543685913086, -25.70729637145996, -24.310049057006836, -22.912803649902344, -21.51555633544922, -20.118309020996094, -18.72106170654297, -17.323814392089844, -15.926568031311035, -14.52932071685791, -13.132074356079102, -11.734827041625977, -10.337579727172852, -8.940333366394043, -7.543086051940918, -6.145839691162109, -4.748592376708984, -3.3513455390930176, -1.9540984630584717, -0.5568513870239258, 0.840395450592041, 2.237642288208008, 3.634889602661133, 5.032135963439941, 6.429383277893066, 7.826630115509033, 9.223876953125, 10.621124267578125, 12.01837158203125, 13.415617942810059, 14.812865257263184, 16.210111618041992, 17.607358932495117, 19.004606246948242, 20.401853561401367, 21.79909896850586, 23.196346282958984, 24.59359359741211, 25.990840911865234, 27.38808822631836, 28.785335540771484, 30.18258285522461, 31.579830169677734, 32.97707748413086, 34.374324798583984, 35.771568298339844, 37.16881561279297, 38.566062927246094, 39.96331024169922]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 3.0, 5.0, 9.0, 7.0, 6.0, 7.0, 8.0, 16.0, 17.0, 14.0, 10.0, 23.0, 24.0, 39.0, 33.0, 35.0, 32.0, 32.0, 43.0, 46.0, 48.0, 48.0, 37.0, 33.0, 45.0, 43.0, 35.0, 30.0, 35.0, 32.0, 33.0, 33.0, 28.0, 16.0, 17.0, 14.0, 12.0, 11.0, 7.0, 7.0, 4.0, 8.0, 8.0, 5.0, 0.0, 1.0, 3.0, 1.0, 3.0], "bins": [-5.2265625, -5.084686279296875, -4.94281005859375, -4.800933837890625, -4.6590576171875, -4.517181396484375, -4.37530517578125, -4.233428955078125, -4.091552734375, -3.949676513671875, -3.80780029296875, -3.665924072265625, -3.5240478515625, -3.382171630859375, -3.24029541015625, -3.098419189453125, -2.95654296875, -2.814666748046875, -2.67279052734375, -2.530914306640625, -2.3890380859375, -2.247161865234375, -2.10528564453125, -1.963409423828125, -1.821533203125, -1.679656982421875, -1.53778076171875, -1.395904541015625, -1.2540283203125, -1.112152099609375, -0.97027587890625, -0.828399658203125, -0.6865234375, -0.544647216796875, -0.40277099609375, -0.260894775390625, -0.1190185546875, 0.022857666015625, 0.16473388671875, 0.306610107421875, 0.448486328125, 0.590362548828125, 0.73223876953125, 0.874114990234375, 1.0159912109375, 1.157867431640625, 1.29974365234375, 1.441619873046875, 1.58349609375, 1.725372314453125, 1.86724853515625, 2.009124755859375, 2.1510009765625, 2.292877197265625, 2.43475341796875, 2.576629638671875, 2.718505859375, 2.860382080078125, 3.00225830078125, 3.144134521484375, 3.2860107421875, 3.427886962890625, 3.56976318359375, 3.711639404296875, 3.853515625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 4.0, 9.0, 8.0, 12.0, 14.0, 19.0, 30.0, 40.0, 50.0, 101.0, 136.0, 190.0, 285.0, 433.0, 656.0, 1017.0, 1503.0, 2344.0, 3727.0, 5727.0, 9282.0, 14688.0, 24444.0, 40896.0, 72008.0, 133755.0, 266930.0, 214884.0, 107377.0, 58795.0, 34236.0, 20567.0, 12577.0, 7773.0, 4966.0, 3122.0, 1994.0, 1278.0, 873.0, 573.0, 386.0, 263.0, 179.0, 123.0, 87.0, 57.0, 44.0, 32.0, 17.0, 18.0, 16.0, 5.0, 5.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.1832275390625, -0.17728424072265625, -0.1713409423828125, -0.16539764404296875, -0.159454345703125, -0.15351104736328125, -0.1475677490234375, -0.14162445068359375, -0.13568115234375, -0.12973785400390625, -0.1237945556640625, -0.11785125732421875, -0.111907958984375, -0.10596466064453125, -0.1000213623046875, -0.09407806396484375, -0.088134765625, -0.08219146728515625, -0.0762481689453125, -0.07030487060546875, -0.064361572265625, -0.05841827392578125, -0.0524749755859375, -0.04653167724609375, -0.04058837890625, -0.03464508056640625, -0.0287017822265625, -0.02275848388671875, -0.016815185546875, -0.01087188720703125, -0.0049285888671875, 0.00101470947265625, 0.0069580078125, 0.01290130615234375, 0.0188446044921875, 0.02478790283203125, 0.030731201171875, 0.03667449951171875, 0.0426177978515625, 0.04856109619140625, 0.05450439453125, 0.06044769287109375, 0.0663909912109375, 0.07233428955078125, 0.078277587890625, 0.08422088623046875, 0.0901641845703125, 0.09610748291015625, 0.10205078125, 0.10799407958984375, 0.1139373779296875, 0.11988067626953125, 0.125823974609375, 0.13176727294921875, 0.1377105712890625, 0.14365386962890625, 0.14959716796875, 0.15554046630859375, 0.1614837646484375, 0.16742706298828125, 0.173370361328125, 0.17931365966796875, 0.1852569580078125, 0.19120025634765625, 0.1971435546875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 4.0, 4.0, 6.0, 4.0, 9.0, 16.0, 11.0, 17.0, 14.0, 13.0, 27.0, 25.0, 26.0, 31.0, 27.0, 39.0, 36.0, 45.0, 28.0, 45.0, 52.0, 1053.0, 53.0, 39.0, 38.0, 39.0, 35.0, 34.0, 25.0, 27.0, 31.0, 24.0, 16.0, 17.0, 15.0, 17.0, 17.0, 16.0, 9.0, 10.0, 7.0, 4.0, 11.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.09765625, -3.003631591796875, -2.90960693359375, -2.815582275390625, -2.7215576171875, -2.627532958984375, -2.53350830078125, -2.439483642578125, -2.345458984375, -2.251434326171875, -2.15740966796875, -2.063385009765625, -1.9693603515625, -1.875335693359375, -1.78131103515625, -1.687286376953125, -1.59326171875, -1.499237060546875, -1.40521240234375, -1.311187744140625, -1.2171630859375, -1.123138427734375, -1.02911376953125, -0.935089111328125, -0.841064453125, -0.747039794921875, -0.65301513671875, -0.558990478515625, -0.4649658203125, -0.370941162109375, -0.27691650390625, -0.182891845703125, -0.0888671875, 0.005157470703125, 0.09918212890625, 0.193206787109375, 0.2872314453125, 0.381256103515625, 0.47528076171875, 0.569305419921875, 0.663330078125, 0.757354736328125, 0.85137939453125, 0.945404052734375, 1.0394287109375, 1.133453369140625, 1.22747802734375, 1.321502685546875, 1.41552734375, 1.509552001953125, 1.60357666015625, 1.697601318359375, 1.7916259765625, 1.885650634765625, 1.97967529296875, 2.073699951171875, 2.167724609375, 2.261749267578125, 2.35577392578125, 2.449798583984375, 2.5438232421875, 2.637847900390625, 2.73187255859375, 2.825897216796875, 2.919921875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 10.0, 10.0, 17.0, 22.0, 29.0, 39.0, 33.0, 61.0, 67.0, 110.0, 173.0, 226.0, 338.0, 422.0, 589.0, 822.0, 1189.0, 1543.0, 2245.0, 3225.0, 4684.0, 6693.0, 10218.0, 15150.0, 22858.0, 34778.0, 53615.0, 83440.0, 130572.0, 1243267.0, 168573.0, 108663.0, 69560.0, 44566.0, 29465.0, 18924.0, 12711.0, 8697.0, 5850.0, 3990.0, 2738.0, 1966.0, 1388.0, 1029.0, 694.0, 501.0, 372.0, 269.0, 192.0, 155.0, 108.0, 92.0, 52.0, 46.0, 32.0, 25.0, 12.0, 10.0, 8.0, 6.0, 2.0, 4.0], "bins": [-0.1121826171875, -0.10865402221679688, -0.10512542724609375, -0.10159683227539062, -0.0980682373046875, -0.09453964233398438, -0.09101104736328125, -0.08748245239257812, -0.083953857421875, -0.08042526245117188, -0.07689666748046875, -0.07336807250976562, -0.0698394775390625, -0.06631088256835938, -0.06278228759765625, -0.059253692626953125, -0.05572509765625, -0.052196502685546875, -0.04866790771484375, -0.045139312744140625, -0.0416107177734375, -0.038082122802734375, -0.03455352783203125, -0.031024932861328125, -0.027496337890625, -0.023967742919921875, -0.02043914794921875, -0.016910552978515625, -0.0133819580078125, -0.009853363037109375, -0.00632476806640625, -0.002796173095703125, 0.000732421875, 0.004261016845703125, 0.00778961181640625, 0.011318206787109375, 0.0148468017578125, 0.018375396728515625, 0.02190399169921875, 0.025432586669921875, 0.028961181640625, 0.032489776611328125, 0.03601837158203125, 0.039546966552734375, 0.0430755615234375, 0.046604156494140625, 0.05013275146484375, 0.053661346435546875, 0.05718994140625, 0.060718536376953125, 0.06424713134765625, 0.06777572631835938, 0.0713043212890625, 0.07483291625976562, 0.07836151123046875, 0.08189010620117188, 0.085418701171875, 0.08894729614257812, 0.09247589111328125, 0.09600448608398438, 0.0995330810546875, 0.10306167602539062, 0.10659027099609375, 0.11011886596679688, 0.1136474609375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 2.0, 8.0, 10.0, 8.0, 11.0, 24.0, 18.0, 24.0, 24.0, 25.0, 22.0, 37.0, 53.0, 58.0, 55.0, 106.0, 106.0, 85.0, 52.0, 38.0, 37.0, 25.0, 13.0, 32.0, 18.0, 14.0, 15.0, 9.0, 9.0, 9.0, 6.0, 8.0, 3.0, 5.0, 3.0, 1.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0001595020294189453, -0.0001546330749988556, -0.00014976412057876587, -0.00014489516615867615, -0.00014002621173858643, -0.0001351572573184967, -0.00013028830289840698, -0.00012541934847831726, -0.00012055039405822754, -0.00011568143963813782, -0.0001108124852180481, -0.00010594353079795837, -0.00010107457637786865, -9.620562195777893e-05, -9.133666753768921e-05, -8.646771311759949e-05, -8.159875869750977e-05, -7.672980427742004e-05, -7.186084985733032e-05, -6.69918954372406e-05, -6.212294101715088e-05, -5.725398659706116e-05, -5.2385032176971436e-05, -4.7516077756881714e-05, -4.264712333679199e-05, -3.777816891670227e-05, -3.290921449661255e-05, -2.8040260076522827e-05, -2.3171305656433105e-05, -1.8302351236343384e-05, -1.3433396816253662e-05, -8.56444239616394e-06, -3.6954879760742188e-06, 1.173466444015503e-06, 6.042420864105225e-06, 1.0911375284194946e-05, 1.5780329704284668e-05, 2.064928412437439e-05, 2.551823854446411e-05, 3.0387192964553833e-05, 3.5256147384643555e-05, 4.0125101804733276e-05, 4.4994056224823e-05, 4.986301064491272e-05, 5.473196506500244e-05, 5.960091948509216e-05, 6.446987390518188e-05, 6.93388283252716e-05, 7.420778274536133e-05, 7.907673716545105e-05, 8.394569158554077e-05, 8.881464600563049e-05, 9.368360042572021e-05, 9.855255484580994e-05, 0.00010342150926589966, 0.00010829046368598938, 0.0001131594181060791, 0.00011802837252616882, 0.00012289732694625854, 0.00012776628136634827, 0.000132635235786438, 0.0001375041902065277, 0.00014237314462661743, 0.00014724209904670715, 0.00015211105346679688]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 5.0, 5.0, 6.0, 10.0, 10.0, 13.0, 9.0, 21.0, 21.0, 39.0, 37.0, 72.0, 93.0, 200.0, 467.0, 1709.0, 10384.0, 185124.0, 821212.0, 24631.0, 3088.0, 736.0, 253.0, 126.0, 71.0, 58.0, 38.0, 19.0, 22.0, 21.0, 18.0, 4.0, 13.0, 4.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002338409423828125, -0.0022634267807006836, -0.002188444137573242, -0.0021134614944458008, -0.0020384788513183594, -0.001963496208190918, -0.0018885135650634766, -0.0018135309219360352, -0.0017385482788085938, -0.0016635656356811523, -0.001588582992553711, -0.0015136003494262695, -0.0014386177062988281, -0.0013636350631713867, -0.0012886524200439453, -0.001213669776916504, -0.0011386871337890625, -0.001063704490661621, -0.0009887218475341797, -0.0009137392044067383, -0.0008387565612792969, -0.0007637739181518555, -0.0006887912750244141, -0.0006138086318969727, -0.0005388259887695312, -0.00046384334564208984, -0.00038886070251464844, -0.00031387805938720703, -0.00023889541625976562, -0.00016391277313232422, -8.893013000488281e-05, -1.3947486877441406e-05, 6.103515625e-05, 0.0001360177993774414, 0.0002110004425048828, 0.0002859830856323242, 0.0003609657287597656, 0.00043594837188720703, 0.0005109310150146484, 0.0005859136581420898, 0.0006608963012695312, 0.0007358789443969727, 0.0008108615875244141, 0.0008858442306518555, 0.0009608268737792969, 0.0010358095169067383, 0.0011107921600341797, 0.001185774803161621, 0.0012607574462890625, 0.001335740089416504, 0.0014107227325439453, 0.0014857053756713867, 0.0015606880187988281, 0.0016356706619262695, 0.001710653305053711, 0.0017856359481811523, 0.0018606185913085938, 0.0019356012344360352, 0.0020105838775634766, 0.002085566520690918, 0.0021605491638183594, 0.0022355318069458008, 0.002310514450073242, 0.0023854970932006836, 0.002460479736328125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 4.0, 16.0, 24.0, 33.0, 73.0, 112.0, 201.0, 217.0, 141.0, 73.0, 46.0, 24.0, 13.0, 13.0, 8.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011385445395717397, -0.00010680659033823758, -9.975873399525881e-05, -9.271087037632242e-05, -8.566300675738603e-05, -7.861515041440725e-05, -7.156728679547086e-05, -6.451942317653447e-05, -5.747156319557689e-05, -5.042370321461931e-05, -4.337583959568292e-05, -3.6327979614725336e-05, -2.928011781477835e-05, -2.2232256014831364e-05, -1.5184396033873782e-05, -8.136532414937392e-06, -1.0886724339798093e-06, 5.959188911219826e-06, 1.3007050256419461e-05, 2.0054911146871746e-05, 2.7102772946818732e-05, 3.415063474676572e-05, 4.11984947277233e-05, 4.824635834665969e-05, 5.529421832761727e-05, 6.234207830857486e-05, 6.938994192751125e-05, 7.643780554644763e-05, 8.348566188942641e-05, 9.05335255083628e-05, 9.758138912729919e-05, 0.00010462924547027797, 0.00011167711636517197, 0.00011872497998410836, 0.00012577284360304475, 0.00013282069994602352, 0.0001398685562890023, 0.0001469164271838963, 0.00015396428352687508, 0.00016101213986985385, 0.00016806001076474786, 0.00017510786710772663, 0.00018215573800262064, 0.0001892035943455994, 0.0001962514506885782, 0.0002032993215834722, 0.00021034717792645097, 0.00021739504882134497, 0.00022444289061240852, 0.0002314907469553873, 0.0002385386178502813, 0.0002455864741932601, 0.0002526343450881541, 0.0002596821868792176, 0.00026673005777411163, 0.00027377792866900563, 0.00028082579956389964, 0.00028787367045879364, 0.0002949215122498572, 0.0003019693831447512, 0.0003090172540396452, 0.00031606509583070874, 0.00032311296672560275, 0.00033016083762049675, 0.0003372086794115603]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 3.0, 10.0, 13.0, 11.0, 6.0, 18.0, 11.0, 25.0, 17.0, 22.0, 32.0, 21.0, 38.0, 40.0, 28.0, 37.0, 41.0, 49.0, 32.0, 52.0, 53.0, 40.0, 41.0, 35.0, 35.0, 36.0, 33.0, 18.0, 26.0, 28.0, 27.0, 12.0, 24.0, 10.0, 12.0, 10.0, 18.0, 4.0, 8.0, 4.0, 4.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-7.528066635131836e-05, -7.275864481925964e-05, -7.023662328720093e-05, -6.771460175514221e-05, -6.51925802230835e-05, -6.267055869102478e-05, -6.0148537158966064e-05, -5.762651562690735e-05, -5.510449409484863e-05, -5.258247256278992e-05, -5.00604510307312e-05, -4.7538429498672485e-05, -4.501640796661377e-05, -4.2494386434555054e-05, -3.997236490249634e-05, -3.745034337043762e-05, -3.4928321838378906e-05, -3.240630030632019e-05, -2.9884278774261475e-05, -2.736225724220276e-05, -2.4840235710144043e-05, -2.2318214178085327e-05, -1.979619264602661e-05, -1.7274171113967896e-05, -1.475214958190918e-05, -1.2230128049850464e-05, -9.708106517791748e-06, -7.186084985733032e-06, -4.664063453674316e-06, -2.1420419216156006e-06, 3.7997961044311523e-07, 2.902001142501831e-06, 5.424022674560547e-06, 7.946044206619263e-06, 1.0468065738677979e-05, 1.2990087270736694e-05, 1.551210880279541e-05, 1.8034130334854126e-05, 2.0556151866912842e-05, 2.3078173398971558e-05, 2.5600194931030273e-05, 2.812221646308899e-05, 3.0644237995147705e-05, 3.316625952720642e-05, 3.568828105926514e-05, 3.821030259132385e-05, 4.073232412338257e-05, 4.3254345655441284e-05, 4.57763671875e-05, 4.8298388719558716e-05, 5.082041025161743e-05, 5.334243178367615e-05, 5.586445331573486e-05, 5.838647484779358e-05, 6.0908496379852295e-05, 6.343051791191101e-05, 6.595253944396973e-05, 6.847456097602844e-05, 7.099658250808716e-05, 7.351860404014587e-05, 7.604062557220459e-05, 7.85626471042633e-05, 8.108466863632202e-05, 8.360669016838074e-05, 8.612871170043945e-05]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 3.0, 5.0, 9.0, 7.0, 6.0, 7.0, 8.0, 16.0, 17.0, 14.0, 10.0, 23.0, 24.0, 39.0, 33.0, 35.0, 32.0, 32.0, 43.0, 46.0, 48.0, 48.0, 37.0, 33.0, 45.0, 43.0, 35.0, 30.0, 35.0, 32.0, 33.0, 33.0, 28.0, 16.0, 17.0, 14.0, 12.0, 11.0, 7.0, 7.0, 4.0, 8.0, 8.0, 5.0, 0.0, 1.0, 3.0, 1.0, 3.0], "bins": [-5.2265625, -5.084686279296875, -4.94281005859375, -4.800933837890625, -4.6590576171875, -4.517181396484375, -4.37530517578125, -4.233428955078125, -4.091552734375, -3.949676513671875, -3.80780029296875, -3.665924072265625, -3.5240478515625, -3.382171630859375, -3.24029541015625, -3.098419189453125, -2.95654296875, -2.814666748046875, -2.67279052734375, -2.530914306640625, -2.3890380859375, -2.247161865234375, -2.10528564453125, -1.963409423828125, -1.821533203125, -1.679656982421875, -1.53778076171875, -1.395904541015625, -1.2540283203125, -1.112152099609375, -0.97027587890625, -0.828399658203125, -0.6865234375, -0.544647216796875, -0.40277099609375, -0.260894775390625, -0.1190185546875, 0.022857666015625, 0.16473388671875, 0.306610107421875, 0.448486328125, 0.590362548828125, 0.73223876953125, 0.874114990234375, 1.0159912109375, 1.157867431640625, 1.29974365234375, 1.441619873046875, 1.58349609375, 1.725372314453125, 1.86724853515625, 2.009124755859375, 2.1510009765625, 2.292877197265625, 2.43475341796875, 2.576629638671875, 2.718505859375, 2.860382080078125, 3.00225830078125, 3.144134521484375, 3.2860107421875, 3.427886962890625, 3.56976318359375, 3.711639404296875, 3.853515625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 5.0, 3.0, 11.0, 14.0, 18.0, 28.0, 38.0, 37.0, 58.0, 92.0, 128.0, 187.0, 257.0, 402.0, 496.0, 707.0, 1014.0, 1462.0, 2046.0, 2997.0, 4598.0, 7960.0, 16416.0, 48710.0, 229572.0, 569385.0, 104650.0, 27810.0, 11354.0, 6037.0, 3722.0, 2462.0, 1676.0, 1198.0, 877.0, 592.0, 446.0, 306.0, 211.0, 170.0, 114.0, 76.0, 67.0, 38.0, 39.0, 20.0, 16.0, 13.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.5859375, -5.39508056640625, -5.2042236328125, -5.01336669921875, -4.822509765625, -4.63165283203125, -4.4407958984375, -4.24993896484375, -4.05908203125, -3.86822509765625, -3.6773681640625, -3.48651123046875, -3.295654296875, -3.10479736328125, -2.9139404296875, -2.72308349609375, -2.5322265625, -2.34136962890625, -2.1505126953125, -1.95965576171875, -1.768798828125, -1.57794189453125, -1.3870849609375, -1.19622802734375, -1.00537109375, -0.81451416015625, -0.6236572265625, -0.43280029296875, -0.241943359375, -0.05108642578125, 0.1397705078125, 0.33062744140625, 0.521484375, 0.71234130859375, 0.9031982421875, 1.09405517578125, 1.284912109375, 1.47576904296875, 1.6666259765625, 1.85748291015625, 2.04833984375, 2.23919677734375, 2.4300537109375, 2.62091064453125, 2.811767578125, 3.00262451171875, 3.1934814453125, 3.38433837890625, 3.5751953125, 3.76605224609375, 3.9569091796875, 4.14776611328125, 4.338623046875, 4.52947998046875, 4.7203369140625, 4.91119384765625, 5.10205078125, 5.29290771484375, 5.4837646484375, 5.67462158203125, 5.865478515625, 6.05633544921875, 6.2471923828125, 6.43804931640625, 6.62890625]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 6.0, 3.0, 7.0, 8.0, 10.0, 12.0, 11.0, 15.0, 19.0, 25.0, 15.0, 19.0, 27.0, 36.0, 17.0, 28.0, 38.0, 38.0, 42.0, 54.0, 109.0, 403.0, 1526.0, 113.0, 59.0, 52.0, 42.0, 39.0, 38.0, 35.0, 26.0, 21.0, 25.0, 25.0, 22.0, 12.0, 7.0, 10.0, 14.0, 6.0, 8.0, 7.0, 6.0, 5.0, 4.0, 0.0, 6.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.8515625, -14.3880615234375, -13.924560546875, -13.4610595703125, -12.99755859375, -12.5340576171875, -12.070556640625, -11.6070556640625, -11.1435546875, -10.6800537109375, -10.216552734375, -9.7530517578125, -9.28955078125, -8.8260498046875, -8.362548828125, -7.8990478515625, -7.435546875, -6.9720458984375, -6.508544921875, -6.0450439453125, -5.58154296875, -5.1180419921875, -4.654541015625, -4.1910400390625, -3.7275390625, -3.2640380859375, -2.800537109375, -2.3370361328125, -1.87353515625, -1.4100341796875, -0.946533203125, -0.4830322265625, -0.01953125, 0.4439697265625, 0.907470703125, 1.3709716796875, 1.83447265625, 2.2979736328125, 2.761474609375, 3.2249755859375, 3.6884765625, 4.1519775390625, 4.615478515625, 5.0789794921875, 5.54248046875, 6.0059814453125, 6.469482421875, 6.9329833984375, 7.396484375, 7.8599853515625, 8.323486328125, 8.7869873046875, 9.25048828125, 9.7139892578125, 10.177490234375, 10.6409912109375, 11.1044921875, 11.5679931640625, 12.031494140625, 12.4949951171875, 12.95849609375, 13.4219970703125, 13.885498046875, 14.3489990234375, 14.8125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 6.0, 8.0, 10.0, 13.0, 7.0, 18.0, 19.0, 17.0, 28.0, 51.0, 75.0, 75.0, 145.0, 245.0, 584.0, 1842.0, 9979.0, 2141678.0, 979225.0, 8748.0, 1647.0, 564.0, 240.0, 136.0, 105.0, 47.0, 54.0, 38.0, 24.0, 19.0, 15.0, 12.0, 9.0, 7.0, 1.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.625, -37.5205078125, -36.416015625, -35.3115234375, -34.20703125, -33.1025390625, -31.998046875, -30.8935546875, -29.7890625, -28.6845703125, -27.580078125, -26.4755859375, -25.37109375, -24.2666015625, -23.162109375, -22.0576171875, -20.953125, -19.8486328125, -18.744140625, -17.6396484375, -16.53515625, -15.4306640625, -14.326171875, -13.2216796875, -12.1171875, -11.0126953125, -9.908203125, -8.8037109375, -7.69921875, -6.5947265625, -5.490234375, -4.3857421875, -3.28125, -2.1767578125, -1.072265625, 0.0322265625, 1.13671875, 2.2412109375, 3.345703125, 4.4501953125, 5.5546875, 6.6591796875, 7.763671875, 8.8681640625, 9.97265625, 11.0771484375, 12.181640625, 13.2861328125, 14.390625, 15.4951171875, 16.599609375, 17.7041015625, 18.80859375, 19.9130859375, 21.017578125, 22.1220703125, 23.2265625, 24.3310546875, 25.435546875, 26.5400390625, 27.64453125, 28.7490234375, 29.853515625, 30.9580078125, 32.0625]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 111.0, 459.0, 369.0, 61.0, 10.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.85890197753906, -134.0025634765625, -131.14620971679688, -128.28985595703125, -125.43351745605469, -122.5771713256836, -119.7208251953125, -116.8644790649414, -114.00813293457031, -111.15178680419922, -108.29544067382812, -105.43909454345703, -102.58274841308594, -99.72640228271484, -96.87005615234375, -94.01371002197266, -91.15736389160156, -88.30101776123047, -85.44467163085938, -82.58832550048828, -79.73197937011719, -76.8756332397461, -74.019287109375, -71.1629409790039, -68.30659484863281, -65.45024871826172, -62.593902587890625, -59.73755645751953, -56.88121032714844, -54.024864196777344, -51.16851806640625, -48.312171936035156, -45.4558219909668, -42.5994758605957, -39.74312973022461, -36.886783599853516, -34.03043746948242, -31.174091339111328, -28.317745208740234, -25.46139907836914, -22.605052947998047, -19.748706817626953, -16.89236068725586, -14.036014556884766, -11.179668426513672, -8.323322296142578, -5.466976165771484, -2.6106300354003906, 0.24571609497070312, 3.102062225341797, 5.958408355712891, 8.814754486083984, 11.671100616455078, 14.527446746826172, 17.383792877197266, 20.24013900756836, 23.096485137939453, 25.952831268310547, 28.80917739868164, 31.665523529052734, 34.52186965942383, 37.37821578979492, 40.234561920166016, 43.09090805053711, 45.9472541809082]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 4.0, 6.0, 2.0, 8.0, 12.0, 10.0, 12.0, 15.0, 22.0, 29.0, 33.0, 25.0, 32.0, 39.0, 44.0, 38.0, 35.0, 43.0, 57.0, 48.0, 39.0, 39.0, 36.0, 39.0, 45.0, 29.0, 40.0, 33.0, 23.0, 22.0, 17.0, 19.0, 26.0, 19.0, 9.0, 8.0, 6.0, 8.0, 7.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-48.24293899536133, -46.78824996948242, -45.33356475830078, -43.878875732421875, -42.42418670654297, -40.96949768066406, -39.514808654785156, -38.060123443603516, -36.60543441772461, -35.1507453918457, -33.69606018066406, -32.241371154785156, -30.78668212890625, -29.331993103027344, -27.87730598449707, -26.422618865966797, -24.96792984008789, -23.513240814208984, -22.05855369567871, -20.603866577148438, -19.14917755126953, -17.694488525390625, -16.23980140686035, -14.785113334655762, -13.330425262451172, -11.875737190246582, -10.421049118041992, -8.966361045837402, -7.5116729736328125, -6.056984901428223, -4.602296829223633, -3.147608757019043, -1.6929168701171875, -0.23822879791259766, 1.2164592742919922, 2.671147346496582, 4.125835418701172, 5.580523490905762, 7.035211563110352, 8.489899635314941, 9.944587707519531, 11.399275779724121, 12.853963851928711, 14.3086519241333, 15.76333999633789, 17.218029022216797, 18.67271614074707, 20.127403259277344, 21.58209228515625, 23.036781311035156, 24.49146842956543, 25.946155548095703, 27.40084457397461, 28.855533599853516, 30.31022071838379, 31.764907836914062, 33.21959686279297, 34.674285888671875, 36.12897491455078, 37.58366012573242, 39.03834915161133, 40.493038177490234, 41.947723388671875, 43.40241241455078, 44.85710144042969]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 7.0, 8.0, 7.0, 5.0, 10.0, 16.0, 14.0, 14.0, 20.0, 22.0, 30.0, 38.0, 28.0, 36.0, 31.0, 45.0, 44.0, 42.0, 45.0, 46.0, 36.0, 47.0, 39.0, 33.0, 36.0, 38.0, 37.0, 25.0, 38.0, 31.0, 23.0, 17.0, 15.0, 14.0, 13.0, 7.0, 8.0, 8.0, 6.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0], "bins": [-5.5546875, -5.40655517578125, -5.2584228515625, -5.11029052734375, -4.962158203125, -4.81402587890625, -4.6658935546875, -4.51776123046875, -4.36962890625, -4.22149658203125, -4.0733642578125, -3.92523193359375, -3.777099609375, -3.62896728515625, -3.4808349609375, -3.33270263671875, -3.1845703125, -3.03643798828125, -2.8883056640625, -2.74017333984375, -2.592041015625, -2.44390869140625, -2.2957763671875, -2.14764404296875, -1.99951171875, -1.85137939453125, -1.7032470703125, -1.55511474609375, -1.406982421875, -1.25885009765625, -1.1107177734375, -0.96258544921875, -0.814453125, -0.66632080078125, -0.5181884765625, -0.37005615234375, -0.221923828125, -0.07379150390625, 0.0743408203125, 0.22247314453125, 0.37060546875, 0.51873779296875, 0.6668701171875, 0.81500244140625, 0.963134765625, 1.11126708984375, 1.2593994140625, 1.40753173828125, 1.5556640625, 1.70379638671875, 1.8519287109375, 2.00006103515625, 2.148193359375, 2.29632568359375, 2.4444580078125, 2.59259033203125, 2.74072265625, 2.88885498046875, 3.0369873046875, 3.18511962890625, 3.333251953125, 3.48138427734375, 3.6295166015625, 3.77764892578125, 3.92578125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 6.0, 6.0, 10.0, 24.0, 22.0, 39.0, 50.0, 68.0, 74.0, 130.0, 226.0, 252.0, 402.0, 567.0, 845.0, 1317.0, 1963.0, 3028.0, 4859.0, 8149.0, 14453.0, 27759.0, 82219.0, 655214.0, 2616167.0, 623517.0, 86876.0, 29310.0, 14692.0, 8432.0, 4958.0, 2996.0, 1974.0, 1249.0, 813.0, 508.0, 380.0, 228.0, 177.0, 98.0, 73.0, 48.0, 33.0, 29.0, 17.0, 8.0, 7.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-10.4765625, -10.1728515625, -9.869140625, -9.5654296875, -9.26171875, -8.9580078125, -8.654296875, -8.3505859375, -8.046875, -7.7431640625, -7.439453125, -7.1357421875, -6.83203125, -6.5283203125, -6.224609375, -5.9208984375, -5.6171875, -5.3134765625, -5.009765625, -4.7060546875, -4.40234375, -4.0986328125, -3.794921875, -3.4912109375, -3.1875, -2.8837890625, -2.580078125, -2.2763671875, -1.97265625, -1.6689453125, -1.365234375, -1.0615234375, -0.7578125, -0.4541015625, -0.150390625, 0.1533203125, 0.45703125, 0.7607421875, 1.064453125, 1.3681640625, 1.671875, 1.9755859375, 2.279296875, 2.5830078125, 2.88671875, 3.1904296875, 3.494140625, 3.7978515625, 4.1015625, 4.4052734375, 4.708984375, 5.0126953125, 5.31640625, 5.6201171875, 5.923828125, 6.2275390625, 6.53125, 6.8349609375, 7.138671875, 7.4423828125, 7.74609375, 8.0498046875, 8.353515625, 8.6572265625, 8.9609375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 1.0, 4.0, 7.0, 8.0, 18.0, 10.0, 26.0, 23.0, 34.0, 46.0, 78.0, 122.0, 189.0, 385.0, 674.0, 885.0, 663.0, 364.0, 175.0, 119.0, 57.0, 53.0, 40.0, 29.0, 12.0, 7.0, 8.0, 11.0, 7.0, 4.0, 8.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.15625, -15.673583984375, -15.19091796875, -14.708251953125, -14.2255859375, -13.742919921875, -13.26025390625, -12.777587890625, -12.294921875, -11.812255859375, -11.32958984375, -10.846923828125, -10.3642578125, -9.881591796875, -9.39892578125, -8.916259765625, -8.43359375, -7.950927734375, -7.46826171875, -6.985595703125, -6.5029296875, -6.020263671875, -5.53759765625, -5.054931640625, -4.572265625, -4.089599609375, -3.60693359375, -3.124267578125, -2.6416015625, -2.158935546875, -1.67626953125, -1.193603515625, -0.7109375, -0.228271484375, 0.25439453125, 0.737060546875, 1.2197265625, 1.702392578125, 2.18505859375, 2.667724609375, 3.150390625, 3.633056640625, 4.11572265625, 4.598388671875, 5.0810546875, 5.563720703125, 6.04638671875, 6.529052734375, 7.01171875, 7.494384765625, 7.97705078125, 8.459716796875, 8.9423828125, 9.425048828125, 9.90771484375, 10.390380859375, 10.873046875, 11.355712890625, 11.83837890625, 12.321044921875, 12.8037109375, 13.286376953125, 13.76904296875, 14.251708984375, 14.734375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 8.0, 15.0, 17.0, 37.0, 39.0, 77.0, 96.0, 145.0, 250.0, 373.0, 576.0, 998.0, 1809.0, 3325.0, 6784.0, 14456.0, 34091.0, 104524.0, 947880.0, 2747835.0, 235758.0, 54315.0, 21090.0, 9483.0, 4603.0, 2446.0, 1284.0, 726.0, 427.0, 283.0, 172.0, 118.0, 78.0, 49.0, 36.0, 28.0, 17.0, 12.0, 5.0, 4.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.1875, -16.63720703125, -16.0869140625, -15.53662109375, -14.986328125, -14.43603515625, -13.8857421875, -13.33544921875, -12.78515625, -12.23486328125, -11.6845703125, -11.13427734375, -10.583984375, -10.03369140625, -9.4833984375, -8.93310546875, -8.3828125, -7.83251953125, -7.2822265625, -6.73193359375, -6.181640625, -5.63134765625, -5.0810546875, -4.53076171875, -3.98046875, -3.43017578125, -2.8798828125, -2.32958984375, -1.779296875, -1.22900390625, -0.6787109375, -0.12841796875, 0.421875, 0.97216796875, 1.5224609375, 2.07275390625, 2.623046875, 3.17333984375, 3.7236328125, 4.27392578125, 4.82421875, 5.37451171875, 5.9248046875, 6.47509765625, 7.025390625, 7.57568359375, 8.1259765625, 8.67626953125, 9.2265625, 9.77685546875, 10.3271484375, 10.87744140625, 11.427734375, 11.97802734375, 12.5283203125, 13.07861328125, 13.62890625, 14.17919921875, 14.7294921875, 15.27978515625, 15.830078125, 16.38037109375, 16.9306640625, 17.48095703125, 18.03125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 13.0, 28.0, 44.0, 73.0, 108.0, 156.0, 153.0, 147.0, 96.0, 71.0, 37.0, 28.0, 13.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.43875885009766, -69.81275177001953, -67.1867446899414, -64.56074523925781, -61.93473815917969, -59.30873107910156, -56.68272399902344, -54.05671691894531, -51.43071365356445, -48.80470657348633, -46.17870330810547, -43.552696228027344, -40.92668914794922, -38.30068588256836, -35.674678802490234, -33.048675537109375, -30.42266845703125, -27.796663284301758, -25.170658111572266, -22.54465103149414, -19.91864585876465, -17.292640686035156, -14.666634559631348, -12.040628433227539, -9.414623260498047, -6.7886176109313965, -4.162611961364746, -1.5366063117980957, 1.0893993377685547, 3.715404510498047, 6.3414106369018555, 8.967416763305664, 11.593429565429688, 14.21943473815918, 16.845439910888672, 19.471446990966797, 22.09745216369629, 24.72345733642578, 27.349464416503906, 29.9754695892334, 32.60147476196289, 35.227481842041016, 37.853485107421875, 40.4794921875, 43.105499267578125, 45.731502532958984, 48.35750961303711, 50.98351287841797, 53.609519958496094, 56.23552703857422, 58.86153030395508, 61.4875373840332, 64.11354064941406, 66.73954772949219, 69.36555480957031, 71.99156188964844, 74.61756896972656, 77.24357604980469, 79.86958312988281, 82.4955825805664, 85.12158966064453, 87.74759674072266, 90.37360382080078, 92.9996109008789, 95.6256103515625]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 7.0, 16.0, 14.0, 7.0, 15.0, 20.0, 22.0, 22.0, 32.0, 28.0, 48.0, 37.0, 45.0, 42.0, 35.0, 51.0, 48.0, 49.0, 58.0, 55.0, 33.0, 39.0, 26.0, 31.0, 28.0, 29.0, 24.0, 18.0, 11.0, 17.0, 13.0, 14.0, 13.0, 12.0, 12.0, 4.0, 2.0, 4.0, 5.0, 0.0, 1.0, 2.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.66984939575195, -37.38703918457031, -36.104225158691406, -34.821414947509766, -33.538604736328125, -32.25579071044922, -30.972980499267578, -29.690168380737305, -28.40735626220703, -27.124544143676758, -25.841732025146484, -24.558921813964844, -23.27610969543457, -21.993297576904297, -20.710487365722656, -19.427675247192383, -18.14486312866211, -16.862051010131836, -15.579239845275879, -14.296428680419922, -13.013616561889648, -11.730804443359375, -10.447993278503418, -9.165182113647461, -7.8823699951171875, -6.599558353424072, -5.316746711730957, -4.033935070037842, -2.7511234283447266, -1.4683117866516113, -0.1855001449584961, 1.097311019897461, 2.3801231384277344, 3.6629347801208496, 4.945746421813965, 6.22855806350708, 7.511369705200195, 8.794181823730469, 10.076992988586426, 11.359804153442383, 12.642616271972656, 13.92542839050293, 15.208239555358887, 16.491050720214844, 17.773862838745117, 19.05667495727539, 20.33948516845703, 21.622297286987305, 22.905109405517578, 24.18792152404785, 25.470733642578125, 26.753543853759766, 28.03635597229004, 29.319168090820312, 30.601978302001953, 31.884790420532227, 33.1676025390625, 34.45041275024414, 35.73322677612305, 37.01603698730469, 38.298851013183594, 39.581661224365234, 40.864471435546875, 42.14728546142578, 43.43009567260742]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 3.0, 3.0, 9.0, 8.0, 13.0, 12.0, 18.0, 24.0, 20.0, 21.0, 26.0, 34.0, 33.0, 37.0, 39.0, 45.0, 41.0, 50.0, 56.0, 37.0, 40.0, 39.0, 30.0, 45.0, 45.0, 36.0, 35.0, 23.0, 25.0, 22.0, 20.0, 16.0, 15.0, 18.0, 17.0, 13.0, 8.0, 10.0, 1.0, 0.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.5, -5.34844970703125, -5.1968994140625, -5.04534912109375, -4.893798828125, -4.74224853515625, -4.5906982421875, -4.43914794921875, -4.28759765625, -4.13604736328125, -3.9844970703125, -3.83294677734375, -3.681396484375, -3.52984619140625, -3.3782958984375, -3.22674560546875, -3.0751953125, -2.92364501953125, -2.7720947265625, -2.62054443359375, -2.468994140625, -2.31744384765625, -2.1658935546875, -2.01434326171875, -1.86279296875, -1.71124267578125, -1.5596923828125, -1.40814208984375, -1.256591796875, -1.10504150390625, -0.9534912109375, -0.80194091796875, -0.650390625, -0.49884033203125, -0.3472900390625, -0.19573974609375, -0.044189453125, 0.10736083984375, 0.2589111328125, 0.41046142578125, 0.56201171875, 0.71356201171875, 0.8651123046875, 1.01666259765625, 1.168212890625, 1.31976318359375, 1.4713134765625, 1.62286376953125, 1.7744140625, 1.92596435546875, 2.0775146484375, 2.22906494140625, 2.380615234375, 2.53216552734375, 2.6837158203125, 2.83526611328125, 2.98681640625, 3.13836669921875, 3.2899169921875, 3.44146728515625, 3.593017578125, 3.74456787109375, 3.8961181640625, 4.04766845703125, 4.19921875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 8.0, 7.0, 22.0, 19.0, 39.0, 47.0, 65.0, 111.0, 173.0, 232.0, 389.0, 608.0, 995.0, 1521.0, 2522.0, 4318.0, 7422.0, 12510.0, 22622.0, 40966.0, 79414.0, 170181.0, 338660.0, 182454.0, 84024.0, 43518.0, 23395.0, 13175.0, 7536.0, 4441.0, 2701.0, 1604.0, 1028.0, 644.0, 408.0, 265.0, 160.0, 103.0, 75.0, 61.0, 32.0, 20.0, 21.0, 10.0, 6.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.229736328125, -0.2222137451171875, -0.214691162109375, -0.2071685791015625, -0.19964599609375, -0.1921234130859375, -0.184600830078125, -0.1770782470703125, -0.1695556640625, -0.1620330810546875, -0.154510498046875, -0.1469879150390625, -0.13946533203125, -0.1319427490234375, -0.124420166015625, -0.1168975830078125, -0.109375, -0.1018524169921875, -0.094329833984375, -0.0868072509765625, -0.07928466796875, -0.0717620849609375, -0.064239501953125, -0.0567169189453125, -0.0491943359375, -0.0416717529296875, -0.034149169921875, -0.0266265869140625, -0.01910400390625, -0.0115814208984375, -0.004058837890625, 0.0034637451171875, 0.010986328125, 0.0185089111328125, 0.026031494140625, 0.0335540771484375, 0.04107666015625, 0.0485992431640625, 0.056121826171875, 0.0636444091796875, 0.0711669921875, 0.0786895751953125, 0.086212158203125, 0.0937347412109375, 0.10125732421875, 0.1087799072265625, 0.116302490234375, 0.1238250732421875, 0.13134765625, 0.1388702392578125, 0.146392822265625, 0.1539154052734375, 0.16143798828125, 0.1689605712890625, 0.176483154296875, 0.1840057373046875, 0.1915283203125, 0.1990509033203125, 0.206573486328125, 0.2140960693359375, 0.22161865234375, 0.2291412353515625, 0.236663818359375, 0.2441864013671875, 0.251708984375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 7.0, 3.0, 7.0, 6.0, 7.0, 9.0, 11.0, 13.0, 22.0, 25.0, 29.0, 24.0, 22.0, 30.0, 31.0, 31.0, 41.0, 43.0, 43.0, 43.0, 32.0, 1063.0, 41.0, 46.0, 30.0, 40.0, 22.0, 35.0, 28.0, 35.0, 32.0, 24.0, 26.0, 18.0, 24.0, 9.0, 14.0, 14.0, 8.0, 8.0, 5.0, 4.0, 4.0, 7.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.580078125, -2.489288330078125, -2.39849853515625, -2.307708740234375, -2.2169189453125, -2.126129150390625, -2.03533935546875, -1.944549560546875, -1.853759765625, -1.762969970703125, -1.67218017578125, -1.581390380859375, -1.4906005859375, -1.399810791015625, -1.30902099609375, -1.218231201171875, -1.12744140625, -1.036651611328125, -0.94586181640625, -0.855072021484375, -0.7642822265625, -0.673492431640625, -0.58270263671875, -0.491912841796875, -0.401123046875, -0.310333251953125, -0.21954345703125, -0.128753662109375, -0.0379638671875, 0.052825927734375, 0.14361572265625, 0.234405517578125, 0.3251953125, 0.415985107421875, 0.50677490234375, 0.597564697265625, 0.6883544921875, 0.779144287109375, 0.86993408203125, 0.960723876953125, 1.051513671875, 1.142303466796875, 1.23309326171875, 1.323883056640625, 1.4146728515625, 1.505462646484375, 1.59625244140625, 1.687042236328125, 1.77783203125, 1.868621826171875, 1.95941162109375, 2.050201416015625, 2.1409912109375, 2.231781005859375, 2.32257080078125, 2.413360595703125, 2.504150390625, 2.594940185546875, 2.68572998046875, 2.776519775390625, 2.8673095703125, 2.958099365234375, 3.04888916015625, 3.139678955078125, 3.23046875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 7.0, 7.0, 5.0, 10.0, 19.0, 18.0, 33.0, 36.0, 50.0, 100.0, 131.0, 179.0, 252.0, 337.0, 518.0, 666.0, 946.0, 1212.0, 1779.0, 2682.0, 3664.0, 5303.0, 7799.0, 11208.0, 16565.0, 24573.0, 37098.0, 56673.0, 88701.0, 140867.0, 1254215.0, 155745.0, 97783.0, 62169.0, 40836.0, 27021.0, 18216.0, 12063.0, 8351.0, 5729.0, 3947.0, 2734.0, 1948.0, 1392.0, 992.0, 730.0, 499.0, 387.0, 238.0, 203.0, 153.0, 81.0, 70.0, 51.0, 31.0, 41.0, 25.0, 15.0, 19.0, 7.0, 7.0, 10.0], "bins": [-0.11602783203125, -0.11246967315673828, -0.10891151428222656, -0.10535335540771484, -0.10179519653320312, -0.0982370376586914, -0.09467887878417969, -0.09112071990966797, -0.08756256103515625, -0.08400440216064453, -0.08044624328613281, -0.0768880844116211, -0.07332992553710938, -0.06977176666259766, -0.06621360778808594, -0.06265544891357422, -0.0590972900390625, -0.05553913116455078, -0.05198097229003906, -0.048422813415527344, -0.044864654541015625, -0.041306495666503906, -0.03774833679199219, -0.03419017791748047, -0.03063201904296875, -0.02707386016845703, -0.023515701293945312, -0.019957542419433594, -0.016399383544921875, -0.012841224670410156, -0.009283065795898438, -0.005724906921386719, -0.002166748046875, 0.0013914108276367188, 0.0049495697021484375, 0.008507728576660156, 0.012065887451171875, 0.015624046325683594, 0.019182205200195312, 0.02274036407470703, 0.02629852294921875, 0.02985668182373047, 0.03341484069824219, 0.036972999572753906, 0.040531158447265625, 0.044089317321777344, 0.04764747619628906, 0.05120563507080078, 0.0547637939453125, 0.05832195281982422, 0.06188011169433594, 0.06543827056884766, 0.06899642944335938, 0.0725545883178711, 0.07611274719238281, 0.07967090606689453, 0.08322906494140625, 0.08678722381591797, 0.09034538269042969, 0.0939035415649414, 0.09746170043945312, 0.10101985931396484, 0.10457801818847656, 0.10813617706298828, 0.1116943359375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 3.0, 6.0, 5.0, 6.0, 4.0, 6.0, 10.0, 11.0, 8.0, 17.0, 11.0, 12.0, 16.0, 26.0, 28.0, 35.0, 57.0, 70.0, 89.0, 106.0, 80.0, 86.0, 59.0, 48.0, 43.0, 29.0, 27.0, 20.0, 13.0, 20.0, 11.0, 5.0, 7.0, 4.0, 8.0, 5.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00020623207092285156, -0.00019990280270576477, -0.00019357353448867798, -0.0001872442662715912, -0.0001809149980545044, -0.0001745857298374176, -0.0001682564616203308, -0.00016192719340324402, -0.00015559792518615723, -0.00014926865696907043, -0.00014293938875198364, -0.00013661012053489685, -0.00013028085231781006, -0.00012395158410072327, -0.00011762231588363647, -0.00011129304766654968, -0.00010496377944946289, -9.86345112323761e-05, -9.23052430152893e-05, -8.597597479820251e-05, -7.964670658111572e-05, -7.331743836402893e-05, -6.698817014694214e-05, -6.065890192985535e-05, -5.4329633712768555e-05, -4.800036549568176e-05, -4.167109727859497e-05, -3.534182906150818e-05, -2.9012560844421387e-05, -2.2683292627334595e-05, -1.6354024410247803e-05, -1.002475619316101e-05, -3.6954879760742188e-06, 2.6337802410125732e-06, 8.963048458099365e-06, 1.5292316675186157e-05, 2.162158489227295e-05, 2.795085310935974e-05, 3.428012132644653e-05, 4.0609389543533325e-05, 4.693865776062012e-05, 5.326792597770691e-05, 5.95971941947937e-05, 6.592646241188049e-05, 7.225573062896729e-05, 7.858499884605408e-05, 8.491426706314087e-05, 9.124353528022766e-05, 9.757280349731445e-05, 0.00010390207171440125, 0.00011023133993148804, 0.00011656060814857483, 0.00012288987636566162, 0.0001292191445827484, 0.0001355484127998352, 0.000141877681016922, 0.0001482069492340088, 0.00015453621745109558, 0.00016086548566818237, 0.00016719475388526917, 0.00017352402210235596, 0.00017985329031944275, 0.00018618255853652954, 0.00019251182675361633, 0.00019884109497070312]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 6.0, 3.0, 8.0, 6.0, 7.0, 14.0, 11.0, 27.0, 27.0, 34.0, 51.0, 58.0, 104.0, 144.0, 351.0, 1018.0, 4537.0, 36434.0, 851626.0, 140527.0, 10604.0, 1842.0, 517.0, 214.0, 89.0, 67.0, 55.0, 40.0, 20.0, 20.0, 20.0, 17.0, 18.0, 7.0, 7.0, 4.0, 4.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024585723876953125, -0.0023729801177978516, -0.0022873878479003906, -0.0022017955780029297, -0.0021162033081054688, -0.002030611038208008, -0.0019450187683105469, -0.001859426498413086, -0.001773834228515625, -0.001688241958618164, -0.0016026496887207031, -0.0015170574188232422, -0.0014314651489257812, -0.0013458728790283203, -0.0012602806091308594, -0.0011746883392333984, -0.0010890960693359375, -0.0010035037994384766, -0.0009179115295410156, -0.0008323192596435547, -0.0007467269897460938, -0.0006611347198486328, -0.0005755424499511719, -0.0004899501800537109, -0.00040435791015625, -0.00031876564025878906, -0.00023317337036132812, -0.0001475811004638672, -6.198883056640625e-05, 2.3603439331054688e-05, 0.00010919570922851562, 0.00019478797912597656, 0.0002803802490234375, 0.00036597251892089844, 0.0004515647888183594, 0.0005371570587158203, 0.0006227493286132812, 0.0007083415985107422, 0.0007939338684082031, 0.0008795261383056641, 0.000965118408203125, 0.001050710678100586, 0.0011363029479980469, 0.0012218952178955078, 0.0013074874877929688, 0.0013930797576904297, 0.0014786720275878906, 0.0015642642974853516, 0.0016498565673828125, 0.0017354488372802734, 0.0018210411071777344, 0.0019066333770751953, 0.0019922256469726562, 0.002077817916870117, 0.002163410186767578, 0.002249002456665039, 0.0023345947265625, 0.002420186996459961, 0.002505779266357422, 0.002591371536254883, 0.0026769638061523438, 0.0027625560760498047, 0.0028481483459472656, 0.0029337406158447266, 0.0030193328857421875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 9.0, 9.0, 23.0, 37.0, 57.0, 97.0, 151.0, 180.0, 173.0, 104.0, 60.0, 33.0, 29.0, 13.0, 8.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011117279791506007, -0.00010345063492422923, -9.57284719333984e-05, -8.800631621852517e-05, -8.028415322769433e-05, -7.25619902368635e-05, -6.483982724603266e-05, -5.7117664255201817e-05, -4.939550126437098e-05, -4.167333827354014e-05, -3.39511752827093e-05, -2.622901592985727e-05, -1.850685293902643e-05, -1.0784689948195592e-05, -3.06253059534356e-06, 4.659632395487279e-06, 1.2381795386318117e-05, 2.0103958377148956e-05, 2.782611954899039e-05, 3.5548280720831826e-05, 4.3270443711662665e-05, 5.0992606702493504e-05, 5.8714766055345535e-05, 6.643692904617637e-05, 7.415909203700721e-05, 8.188125502783805e-05, 8.960341801866889e-05, 9.732558100949973e-05, 0.00010504774400033057, 0.0001127699069911614, 0.00012049206270603463, 0.00012821421842090786, 0.00013593639596365392, 0.00014365855895448476, 0.0001513807219453156, 0.00015910288493614644, 0.00016682504792697728, 0.00017454721091780812, 0.00018226937390863895, 0.00018999152234755456, 0.00019771369989030063, 0.00020543586288113147, 0.0002131580258719623, 0.00022088018886279315, 0.00022860235185362399, 0.00023632451484445482, 0.00024404667783528566, 0.0002517688262742013, 0.0002594909747131169, 0.0002672131231520325, 0.00027493530069477856, 0.00028265744913369417, 0.00029037962667644024, 0.00029810177511535585, 0.0003058239526581019, 0.0003135461010970175, 0.0003212682786397636, 0.0003289904270786792, 0.00033671260462142527, 0.0003444347530603409, 0.00035215693060308695, 0.00035987907904200256, 0.0003676012565847486, 0.00037532340502366424, 0.0003830455825664103]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 5.0, 8.0, 9.0, 12.0, 10.0, 16.0, 15.0, 12.0, 9.0, 17.0, 19.0, 28.0, 18.0, 28.0, 30.0, 34.0, 31.0, 30.0, 35.0, 43.0, 39.0, 34.0, 39.0, 39.0, 33.0, 31.0, 30.0, 30.0, 42.0, 31.0, 24.0, 28.0, 22.0, 21.0, 13.0, 24.0, 13.0, 17.0, 11.0, 6.0, 8.0, 8.0, 14.0, 7.0, 7.0, 4.0, 2.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-8.422136306762695e-05, -8.152052760124207e-05, -7.881969213485718e-05, -7.611885666847229e-05, -7.34180212020874e-05, -7.071718573570251e-05, -6.801635026931763e-05, -6.531551480293274e-05, -6.261467933654785e-05, -5.9913843870162964e-05, -5.7213008403778076e-05, -5.451217293739319e-05, -5.18113374710083e-05, -4.911050200462341e-05, -4.6409666538238525e-05, -4.370883107185364e-05, -4.100799560546875e-05, -3.830716013908386e-05, -3.5606324672698975e-05, -3.290548920631409e-05, -3.02046537399292e-05, -2.750381827354431e-05, -2.4802982807159424e-05, -2.2102147340774536e-05, -1.940131187438965e-05, -1.670047640800476e-05, -1.3999640941619873e-05, -1.1298805475234985e-05, -8.597970008850098e-06, -5.89713454246521e-06, -3.1962990760803223e-06, -4.954636096954346e-07, 2.205371856689453e-06, 4.906207323074341e-06, 7.6070427894592285e-06, 1.0307878255844116e-05, 1.3008713722229004e-05, 1.570954918861389e-05, 1.841038465499878e-05, 2.1111220121383667e-05, 2.3812055587768555e-05, 2.6512891054153442e-05, 2.921372652053833e-05, 3.191456198692322e-05, 3.4615397453308105e-05, 3.731623291969299e-05, 4.001706838607788e-05, 4.271790385246277e-05, 4.5418739318847656e-05, 4.8119574785232544e-05, 5.082041025161743e-05, 5.352124571800232e-05, 5.622208118438721e-05, 5.8922916650772095e-05, 6.162375211715698e-05, 6.432458758354187e-05, 6.702542304992676e-05, 6.972625851631165e-05, 7.242709398269653e-05, 7.512792944908142e-05, 7.782876491546631e-05, 8.05296003818512e-05, 8.323043584823608e-05, 8.593127131462097e-05, 8.863210678100586e-05]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 3.0, 3.0, 9.0, 8.0, 13.0, 12.0, 18.0, 24.0, 20.0, 21.0, 26.0, 34.0, 33.0, 37.0, 39.0, 45.0, 41.0, 50.0, 56.0, 37.0, 40.0, 39.0, 30.0, 45.0, 45.0, 36.0, 35.0, 23.0, 25.0, 22.0, 20.0, 16.0, 15.0, 18.0, 17.0, 13.0, 8.0, 10.0, 1.0, 0.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.5, -5.34844970703125, -5.1968994140625, -5.04534912109375, -4.893798828125, -4.74224853515625, -4.5906982421875, -4.43914794921875, -4.28759765625, -4.13604736328125, -3.9844970703125, -3.83294677734375, -3.681396484375, -3.52984619140625, -3.3782958984375, -3.22674560546875, -3.0751953125, -2.92364501953125, -2.7720947265625, -2.62054443359375, -2.468994140625, -2.31744384765625, -2.1658935546875, -2.01434326171875, -1.86279296875, -1.71124267578125, -1.5596923828125, -1.40814208984375, -1.256591796875, -1.10504150390625, -0.9534912109375, -0.80194091796875, -0.650390625, -0.49884033203125, -0.3472900390625, -0.19573974609375, -0.044189453125, 0.10736083984375, 0.2589111328125, 0.41046142578125, 0.56201171875, 0.71356201171875, 0.8651123046875, 1.01666259765625, 1.168212890625, 1.31976318359375, 1.4713134765625, 1.62286376953125, 1.7744140625, 1.92596435546875, 2.0775146484375, 2.22906494140625, 2.380615234375, 2.53216552734375, 2.6837158203125, 2.83526611328125, 2.98681640625, 3.13836669921875, 3.2899169921875, 3.44146728515625, 3.593017578125, 3.74456787109375, 3.8961181640625, 4.04766845703125, 4.19921875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 4.0, 14.0, 7.0, 21.0, 27.0, 33.0, 54.0, 65.0, 101.0, 118.0, 183.0, 270.0, 435.0, 635.0, 958.0, 1493.0, 2309.0, 4046.0, 8348.0, 22472.0, 114273.0, 722021.0, 127106.0, 23632.0, 8685.0, 4359.0, 2453.0, 1471.0, 907.0, 636.0, 448.0, 282.0, 209.0, 158.0, 111.0, 50.0, 65.0, 27.0, 22.0, 23.0, 8.0, 5.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.6749267578125, -8.381103515625, -8.0872802734375, -7.79345703125, -7.4996337890625, -7.205810546875, -6.9119873046875, -6.6181640625, -6.3243408203125, -6.030517578125, -5.7366943359375, -5.44287109375, -5.1490478515625, -4.855224609375, -4.5614013671875, -4.267578125, -3.9737548828125, -3.679931640625, -3.3861083984375, -3.09228515625, -2.7984619140625, -2.504638671875, -2.2108154296875, -1.9169921875, -1.6231689453125, -1.329345703125, -1.0355224609375, -0.74169921875, -0.4478759765625, -0.154052734375, 0.1397705078125, 0.43359375, 0.7274169921875, 1.021240234375, 1.3150634765625, 1.60888671875, 1.9027099609375, 2.196533203125, 2.4903564453125, 2.7841796875, 3.0780029296875, 3.371826171875, 3.6656494140625, 3.95947265625, 4.2532958984375, 4.547119140625, 4.8409423828125, 5.134765625, 5.4285888671875, 5.722412109375, 6.0162353515625, 6.31005859375, 6.6038818359375, 6.897705078125, 7.1915283203125, 7.4853515625, 7.7791748046875, 8.072998046875, 8.3668212890625, 8.66064453125, 8.9544677734375, 9.248291015625, 9.5421142578125, 9.8359375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 10.0, 2.0, 10.0, 11.0, 10.0, 15.0, 24.0, 28.0, 22.0, 37.0, 31.0, 44.0, 45.0, 47.0, 71.0, 105.0, 293.0, 1600.0, 168.0, 86.0, 43.0, 41.0, 46.0, 35.0, 33.0, 31.0, 27.0, 30.0, 20.0, 15.0, 17.0, 16.0, 7.0, 6.0, 2.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -19.14453125, -18.5703125, -17.99609375, -17.421875, -16.84765625, -16.2734375, -15.69921875, -15.125, -14.55078125, -13.9765625, -13.40234375, -12.828125, -12.25390625, -11.6796875, -11.10546875, -10.53125, -9.95703125, -9.3828125, -8.80859375, -8.234375, -7.66015625, -7.0859375, -6.51171875, -5.9375, -5.36328125, -4.7890625, -4.21484375, -3.640625, -3.06640625, -2.4921875, -1.91796875, -1.34375, -0.76953125, -0.1953125, 0.37890625, 0.953125, 1.52734375, 2.1015625, 2.67578125, 3.25, 3.82421875, 4.3984375, 4.97265625, 5.546875, 6.12109375, 6.6953125, 7.26953125, 7.84375, 8.41796875, 8.9921875, 9.56640625, 10.140625, 10.71484375, 11.2890625, 11.86328125, 12.4375, 13.01171875, 13.5859375, 14.16015625, 14.734375, 15.30859375, 15.8828125, 16.45703125, 17.03125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 11.0, 9.0, 9.0, 22.0, 34.0, 35.0, 37.0, 81.0, 95.0, 203.0, 417.0, 1422.0, 11061.0, 3020396.0, 106573.0, 3826.0, 753.0, 282.0, 151.0, 74.0, 64.0, 45.0, 26.0, 20.0, 14.0, 14.0, 12.0, 8.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.75, -31.1728515625, -29.595703125, -28.0185546875, -26.44140625, -24.8642578125, -23.287109375, -21.7099609375, -20.1328125, -18.5556640625, -16.978515625, -15.4013671875, -13.82421875, -12.2470703125, -10.669921875, -9.0927734375, -7.515625, -5.9384765625, -4.361328125, -2.7841796875, -1.20703125, 0.3701171875, 1.947265625, 3.5244140625, 5.1015625, 6.6787109375, 8.255859375, 9.8330078125, 11.41015625, 12.9873046875, 14.564453125, 16.1416015625, 17.71875, 19.2958984375, 20.873046875, 22.4501953125, 24.02734375, 25.6044921875, 27.181640625, 28.7587890625, 30.3359375, 31.9130859375, 33.490234375, 35.0673828125, 36.64453125, 38.2216796875, 39.798828125, 41.3759765625, 42.953125, 44.5302734375, 46.107421875, 47.6845703125, 49.26171875, 50.8388671875, 52.416015625, 53.9931640625, 55.5703125, 57.1474609375, 58.724609375, 60.3017578125, 61.87890625, 63.4560546875, 65.033203125, 66.6103515625, 68.1875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 78.0, 305.0, 432.0, 169.0, 23.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.01662254333496, -21.103092193603516, -18.189563751220703, -15.276033401489258, -12.362503051757812, -9.448972702026367, -6.535444259643555, -3.6219139099121094, -0.7083835601806641, 2.205146312713623, 5.11867618560791, 8.032205581665039, 10.945735931396484, 13.85926628112793, 16.772794723510742, 19.686325073242188, 22.599855422973633, 25.513385772705078, 28.42691421508789, 31.340444564819336, 34.25397491455078, 37.167503356933594, 40.081031799316406, 42.994564056396484, 45.90809631347656, 48.821624755859375, 51.73515701293945, 54.648685455322266, 57.562217712402344, 60.475746154785156, 63.38927459716797, 66.30280303955078, 69.21633911132812, 72.12986755371094, 75.04339599609375, 77.95692443847656, 80.8704605102539, 83.78398895263672, 86.69751739501953, 89.61104583740234, 92.52458190917969, 95.4381103515625, 98.35163879394531, 101.26516723632812, 104.17870330810547, 107.09223175048828, 110.0057601928711, 112.9192886352539, 115.83281707763672, 118.74634552001953, 121.65987396240234, 124.57341003417969, 127.4869384765625, 130.4004669189453, 133.31399536132812, 136.22752380371094, 139.14105224609375, 142.05458068847656, 144.96810913085938, 147.8816375732422, 150.795166015625, 153.70870971679688, 156.62222290039062, 159.5357666015625, 162.4492950439453]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 5.0, 11.0, 6.0, 13.0, 13.0, 21.0, 16.0, 17.0, 17.0, 29.0, 23.0, 28.0, 35.0, 37.0, 45.0, 40.0, 29.0, 39.0, 42.0, 32.0, 38.0, 38.0, 35.0, 43.0, 28.0, 42.0, 32.0, 28.0, 22.0, 28.0, 25.0, 24.0, 15.0, 11.0, 9.0, 14.0, 19.0, 8.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 3.0, 5.0, 1.0, 0.0, 1.0], "bins": [-42.793819427490234, -41.54755401611328, -40.301292419433594, -39.05502700805664, -37.80876159667969, -36.5625, -35.31623458862305, -34.069969177246094, -32.823707580566406, -31.577444076538086, -30.331180572509766, -29.084915161132812, -27.838651657104492, -26.592388153076172, -25.34612274169922, -24.0998592376709, -22.853595733642578, -21.607332229614258, -20.361068725585938, -19.114803314208984, -17.868539810180664, -16.622276306152344, -15.376011848449707, -14.12974739074707, -12.88348388671875, -11.63722038269043, -10.390955924987793, -9.144691467285156, -7.898427963256836, -6.652163982391357, -5.405900001525879, -4.159635543823242, -2.9133758544921875, -1.667111873626709, -0.42084789276123047, 0.825416088104248, 2.0716800689697266, 3.317944049835205, 4.564208030700684, 5.81047248840332, 7.056735992431641, 8.302999496459961, 9.549263954162598, 10.795528411865234, 12.041791915893555, 13.288055419921875, 14.534319877624512, 15.780584335327148, 17.02684783935547, 18.27311134338379, 19.51937484741211, 20.765640258789062, 22.011903762817383, 23.258167266845703, 24.504432678222656, 25.750696182250977, 26.996959686279297, 28.243223190307617, 29.489486694335938, 30.73575210571289, 31.98201560974121, 33.22827911376953, 34.474544525146484, 35.72080993652344, 36.967071533203125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 4.0, 10.0, 8.0, 5.0, 20.0, 24.0, 17.0, 21.0, 21.0, 29.0, 26.0, 29.0, 52.0, 51.0, 45.0, 43.0, 50.0, 52.0, 37.0, 31.0, 38.0, 47.0, 56.0, 35.0, 31.0, 23.0, 32.0, 29.0, 14.0, 21.0, 15.0, 14.0, 14.0, 19.0, 10.0, 5.0, 6.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.67578125, -5.5133056640625, -5.350830078125, -5.1883544921875, -5.02587890625, -4.8634033203125, -4.700927734375, -4.5384521484375, -4.3759765625, -4.2135009765625, -4.051025390625, -3.8885498046875, -3.72607421875, -3.5635986328125, -3.401123046875, -3.2386474609375, -3.076171875, -2.9136962890625, -2.751220703125, -2.5887451171875, -2.42626953125, -2.2637939453125, -2.101318359375, -1.9388427734375, -1.7763671875, -1.6138916015625, -1.451416015625, -1.2889404296875, -1.12646484375, -0.9639892578125, -0.801513671875, -0.6390380859375, -0.4765625, -0.3140869140625, -0.151611328125, 0.0108642578125, 0.17333984375, 0.3358154296875, 0.498291015625, 0.6607666015625, 0.8232421875, 0.9857177734375, 1.148193359375, 1.3106689453125, 1.47314453125, 1.6356201171875, 1.798095703125, 1.9605712890625, 2.123046875, 2.2855224609375, 2.447998046875, 2.6104736328125, 2.77294921875, 2.9354248046875, 3.097900390625, 3.2603759765625, 3.4228515625, 3.5853271484375, 3.747802734375, 3.9102783203125, 4.07275390625, 4.2352294921875, 4.397705078125, 4.5601806640625, 4.72265625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 9.0, 3.0, 10.0, 10.0, 15.0, 20.0, 17.0, 30.0, 45.0, 64.0, 69.0, 123.0, 262.0, 482.0, 1051.0, 2702.0, 8056.0, 29472.0, 382297.0, 3608882.0, 130013.0, 20948.0, 5995.0, 2022.0, 798.0, 346.0, 182.0, 95.0, 67.0, 46.0, 41.0, 25.0, 31.0, 17.0, 14.0, 5.0, 4.0, 6.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.921875, -25.208984375, -24.49609375, -23.783203125, -23.0703125, -22.357421875, -21.64453125, -20.931640625, -20.21875, -19.505859375, -18.79296875, -18.080078125, -17.3671875, -16.654296875, -15.94140625, -15.228515625, -14.515625, -13.802734375, -13.08984375, -12.376953125, -11.6640625, -10.951171875, -10.23828125, -9.525390625, -8.8125, -8.099609375, -7.38671875, -6.673828125, -5.9609375, -5.248046875, -4.53515625, -3.822265625, -3.109375, -2.396484375, -1.68359375, -0.970703125, -0.2578125, 0.455078125, 1.16796875, 1.880859375, 2.59375, 3.306640625, 4.01953125, 4.732421875, 5.4453125, 6.158203125, 6.87109375, 7.583984375, 8.296875, 9.009765625, 9.72265625, 10.435546875, 11.1484375, 11.861328125, 12.57421875, 13.287109375, 14.0, 14.712890625, 15.42578125, 16.138671875, 16.8515625, 17.564453125, 18.27734375, 18.990234375, 19.703125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 10.0, 9.0, 15.0, 22.0, 26.0, 42.0, 71.0, 142.0, 266.0, 559.0, 1058.0, 966.0, 441.0, 199.0, 80.0, 49.0, 46.0, 25.0, 12.0, 13.0, 9.0, 2.0, 6.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.34375, -26.6734619140625, -26.003173828125, -25.3328857421875, -24.66259765625, -23.9923095703125, -23.322021484375, -22.6517333984375, -21.9814453125, -21.3111572265625, -20.640869140625, -19.9705810546875, -19.30029296875, -18.6300048828125, -17.959716796875, -17.2894287109375, -16.619140625, -15.9488525390625, -15.278564453125, -14.6082763671875, -13.93798828125, -13.2677001953125, -12.597412109375, -11.9271240234375, -11.2568359375, -10.5865478515625, -9.916259765625, -9.2459716796875, -8.57568359375, -7.9053955078125, -7.235107421875, -6.5648193359375, -5.89453125, -5.2242431640625, -4.553955078125, -3.8836669921875, -3.21337890625, -2.5430908203125, -1.872802734375, -1.2025146484375, -0.5322265625, 0.1380615234375, 0.808349609375, 1.4786376953125, 2.14892578125, 2.8192138671875, 3.489501953125, 4.1597900390625, 4.830078125, 5.5003662109375, 6.170654296875, 6.8409423828125, 7.51123046875, 8.1815185546875, 8.851806640625, 9.5220947265625, 10.1923828125, 10.8626708984375, 11.532958984375, 12.2032470703125, 12.87353515625, 13.5438232421875, 14.214111328125, 14.8843994140625, 15.5546875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 8.0, 15.0, 20.0, 24.0, 52.0, 79.0, 153.0, 438.0, 1930.0, 11649.0, 174196.0, 3930130.0, 66967.0, 6745.0, 1230.0, 355.0, 129.0, 55.0, 50.0, 23.0, 14.0, 8.0, 12.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.96875, -36.27099609375, -34.5732421875, -32.87548828125, -31.177734375, -29.47998046875, -27.7822265625, -26.08447265625, -24.38671875, -22.68896484375, -20.9912109375, -19.29345703125, -17.595703125, -15.89794921875, -14.2001953125, -12.50244140625, -10.8046875, -9.10693359375, -7.4091796875, -5.71142578125, -4.013671875, -2.31591796875, -0.6181640625, 1.07958984375, 2.77734375, 4.47509765625, 6.1728515625, 7.87060546875, 9.568359375, 11.26611328125, 12.9638671875, 14.66162109375, 16.359375, 18.05712890625, 19.7548828125, 21.45263671875, 23.150390625, 24.84814453125, 26.5458984375, 28.24365234375, 29.94140625, 31.63916015625, 33.3369140625, 35.03466796875, 36.732421875, 38.43017578125, 40.1279296875, 41.82568359375, 43.5234375, 45.22119140625, 46.9189453125, 48.61669921875, 50.314453125, 52.01220703125, 53.7099609375, 55.40771484375, 57.10546875, 58.80322265625, 60.5009765625, 62.19873046875, 63.896484375, 65.59423828125, 67.2919921875, 68.98974609375, 70.6875]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 6.0, 8.0, 8.0, 8.0, 13.0, 9.0, 22.0, 25.0, 30.0, 43.0, 57.0, 71.0, 90.0, 111.0, 113.0, 90.0, 91.0, 54.0, 41.0, 31.0, 20.0, 15.0, 23.0, 19.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.74475860595703, -42.00543212890625, -40.26610565185547, -38.52677536010742, -36.78744888305664, -35.04812240600586, -33.30879592895508, -31.569467544555664, -29.83013916015625, -28.09081268310547, -26.351484298706055, -24.612157821655273, -22.87282943725586, -21.133502960205078, -19.394176483154297, -17.654848098754883, -15.915521621704102, -14.176194190979004, -12.436866760253906, -10.697540283203125, -8.958211898803711, -7.21888542175293, -5.479557991027832, -3.7402305603027344, -2.0009031295776367, -0.2615758180618286, 1.4777514934539795, 3.217078685760498, 4.956406116485596, 6.695733070373535, 8.435060501098633, 10.17438793182373, 11.913715362548828, 13.653042793273926, 15.392370223999023, 17.131696701049805, 18.87102508544922, 20.6103515625, 22.34967803955078, 24.089006423950195, 25.82833480834961, 27.56766128540039, 29.306989669799805, 31.046316146850586, 32.78564453125, 34.52497100830078, 36.26429748535156, 38.003623962402344, 39.742950439453125, 41.482276916503906, 43.22160339355469, 44.960933685302734, 46.700260162353516, 48.4395866394043, 50.17891311645508, 51.918243408203125, 53.657569885253906, 55.39689636230469, 57.13622283935547, 58.875553131103516, 60.6148796081543, 62.35420608520508, 64.09353637695312, 65.8328628540039, 67.57218933105469]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 2.0, 5.0, 3.0, 8.0, 8.0, 5.0, 16.0, 9.0, 11.0, 19.0, 29.0, 18.0, 19.0, 34.0, 31.0, 34.0, 36.0, 36.0, 36.0, 32.0, 49.0, 34.0, 43.0, 50.0, 36.0, 35.0, 43.0, 37.0, 20.0, 34.0, 27.0, 38.0, 16.0, 19.0, 17.0, 19.0, 16.0, 24.0, 13.0, 10.0, 5.0, 8.0, 4.0, 3.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-41.2381706237793, -40.04390335083008, -38.84963607788086, -37.65536880493164, -36.46110534667969, -35.26683807373047, -34.07257080078125, -32.87830352783203, -31.684036254882812, -30.489768981933594, -29.295501708984375, -28.10123634338379, -26.90696907043457, -25.71270179748535, -24.518436431884766, -23.324169158935547, -22.129901885986328, -20.93563461303711, -19.74136734008789, -18.547101974487305, -17.352834701538086, -16.158567428588867, -14.964301109313965, -13.770034790039062, -12.575767517089844, -11.381500244140625, -10.187233924865723, -8.99296760559082, -7.798700332641602, -6.604433536529541, -5.4101667404174805, -4.215900421142578, -3.021636962890625, -1.8273701667785645, -0.6331033706665039, 0.5611634254455566, 1.7554302215576172, 2.9496970176696777, 4.143963813781738, 5.338230133056641, 6.532497406005859, 7.72676420211792, 8.92103099822998, 10.115297317504883, 11.309564590454102, 12.50383186340332, 13.698098182678223, 14.892364501953125, 16.086631774902344, 17.280899047851562, 18.47516632080078, 19.669431686401367, 20.863698959350586, 22.057966232299805, 23.25223159790039, 24.44649887084961, 25.640766143798828, 26.835033416748047, 28.029300689697266, 29.22356605529785, 30.41783332824707, 31.61210060119629, 32.806365966796875, 34.000633239746094, 35.19490051269531]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 6.0, 10.0, 10.0, 10.0, 9.0, 23.0, 18.0, 25.0, 26.0, 24.0, 35.0, 43.0, 45.0, 42.0, 37.0, 42.0, 43.0, 39.0, 34.0, 52.0, 44.0, 37.0, 45.0, 33.0, 42.0, 32.0, 23.0, 21.0, 16.0, 20.0, 28.0, 14.0, 13.0, 13.0, 7.0, 3.0, 12.0, 7.0, 6.0, 4.0, 4.0, 1.0, 3.0], "bins": [-6.1953125, -6.03692626953125, -5.8785400390625, -5.72015380859375, -5.561767578125, -5.40338134765625, -5.2449951171875, -5.08660888671875, -4.92822265625, -4.76983642578125, -4.6114501953125, -4.45306396484375, -4.294677734375, -4.13629150390625, -3.9779052734375, -3.81951904296875, -3.6611328125, -3.50274658203125, -3.3443603515625, -3.18597412109375, -3.027587890625, -2.86920166015625, -2.7108154296875, -2.55242919921875, -2.39404296875, -2.23565673828125, -2.0772705078125, -1.91888427734375, -1.760498046875, -1.60211181640625, -1.4437255859375, -1.28533935546875, -1.126953125, -0.96856689453125, -0.8101806640625, -0.65179443359375, -0.493408203125, -0.33502197265625, -0.1766357421875, -0.01824951171875, 0.14013671875, 0.29852294921875, 0.4569091796875, 0.61529541015625, 0.773681640625, 0.93206787109375, 1.0904541015625, 1.24884033203125, 1.4072265625, 1.56561279296875, 1.7239990234375, 1.88238525390625, 2.040771484375, 2.19915771484375, 2.3575439453125, 2.51593017578125, 2.67431640625, 2.83270263671875, 2.9910888671875, 3.14947509765625, 3.307861328125, 3.46624755859375, 3.6246337890625, 3.78302001953125, 3.94140625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 8.0, 20.0, 24.0, 29.0, 50.0, 71.0, 104.0, 164.0, 254.0, 425.0, 640.0, 1058.0, 1653.0, 2706.0, 4235.0, 6865.0, 11258.0, 19158.0, 32801.0, 59991.0, 116925.0, 242424.0, 266236.0, 128537.0, 65607.0, 35467.0, 20391.0, 11862.0, 7301.0, 4562.0, 2784.0, 1862.0, 1147.0, 672.0, 465.0, 275.0, 189.0, 104.0, 74.0, 34.0, 33.0, 31.0, 20.0, 11.0, 3.0, 8.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.22021484375, -0.212890625, -0.20556640625, -0.1982421875, -0.19091796875, -0.18359375, -0.17626953125, -0.1689453125, -0.16162109375, -0.154296875, -0.14697265625, -0.1396484375, -0.13232421875, -0.125, -0.11767578125, -0.1103515625, -0.10302734375, -0.095703125, -0.08837890625, -0.0810546875, -0.07373046875, -0.06640625, -0.05908203125, -0.0517578125, -0.04443359375, -0.037109375, -0.02978515625, -0.0224609375, -0.01513671875, -0.0078125, -0.00048828125, 0.0068359375, 0.01416015625, 0.021484375, 0.02880859375, 0.0361328125, 0.04345703125, 0.05078125, 0.05810546875, 0.0654296875, 0.07275390625, 0.080078125, 0.08740234375, 0.0947265625, 0.10205078125, 0.109375, 0.11669921875, 0.1240234375, 0.13134765625, 0.138671875, 0.14599609375, 0.1533203125, 0.16064453125, 0.16796875, 0.17529296875, 0.1826171875, 0.18994140625, 0.197265625, 0.20458984375, 0.2119140625, 0.21923828125, 0.2265625, 0.23388671875, 0.2412109375, 0.24853515625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 5.0, 4.0, 3.0, 3.0, 7.0, 8.0, 15.0, 18.0, 16.0, 19.0, 12.0, 26.0, 22.0, 17.0, 31.0, 22.0, 26.0, 40.0, 34.0, 33.0, 34.0, 41.0, 50.0, 1068.0, 56.0, 42.0, 33.0, 33.0, 36.0, 35.0, 27.0, 35.0, 20.0, 25.0, 15.0, 18.0, 23.0, 14.0, 18.0, 15.0, 8.0, 6.0, 5.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.92578125, -2.82659912109375, -2.7274169921875, -2.62823486328125, -2.529052734375, -2.42987060546875, -2.3306884765625, -2.23150634765625, -2.13232421875, -2.03314208984375, -1.9339599609375, -1.83477783203125, -1.735595703125, -1.63641357421875, -1.5372314453125, -1.43804931640625, -1.3388671875, -1.23968505859375, -1.1405029296875, -1.04132080078125, -0.942138671875, -0.84295654296875, -0.7437744140625, -0.64459228515625, -0.54541015625, -0.44622802734375, -0.3470458984375, -0.24786376953125, -0.148681640625, -0.04949951171875, 0.0496826171875, 0.14886474609375, 0.248046875, 0.34722900390625, 0.4464111328125, 0.54559326171875, 0.644775390625, 0.74395751953125, 0.8431396484375, 0.94232177734375, 1.04150390625, 1.14068603515625, 1.2398681640625, 1.33905029296875, 1.438232421875, 1.53741455078125, 1.6365966796875, 1.73577880859375, 1.8349609375, 1.93414306640625, 2.0333251953125, 2.13250732421875, 2.231689453125, 2.33087158203125, 2.4300537109375, 2.52923583984375, 2.62841796875, 2.72760009765625, 2.8267822265625, 2.92596435546875, 3.025146484375, 3.12432861328125, 3.2235107421875, 3.32269287109375, 3.421875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 9.0, 8.0, 7.0, 16.0, 31.0, 47.0, 83.0, 95.0, 140.0, 218.0, 309.0, 451.0, 648.0, 940.0, 1459.0, 2352.0, 3558.0, 5496.0, 8870.0, 14441.0, 23602.0, 40237.0, 69133.0, 119904.0, 219176.0, 1276391.0, 127539.0, 73053.0, 42656.0, 25163.0, 15367.0, 9294.0, 5736.0, 3590.0, 2431.0, 1568.0, 1016.0, 659.0, 433.0, 359.0, 214.0, 137.0, 98.0, 62.0, 40.0, 29.0, 20.0, 14.0, 10.0, 7.0, 6.0, 6.0, 4.0, 1.0, 3.0, 0.0, 3.0], "bins": [-0.15234375, -0.14759063720703125, -0.1428375244140625, -0.13808441162109375, -0.133331298828125, -0.12857818603515625, -0.1238250732421875, -0.11907196044921875, -0.11431884765625, -0.10956573486328125, -0.1048126220703125, -0.10005950927734375, -0.095306396484375, -0.09055328369140625, -0.0858001708984375, -0.08104705810546875, -0.0762939453125, -0.07154083251953125, -0.0667877197265625, -0.06203460693359375, -0.057281494140625, -0.05252838134765625, -0.0477752685546875, -0.04302215576171875, -0.03826904296875, -0.03351593017578125, -0.0287628173828125, -0.02400970458984375, -0.019256591796875, -0.01450347900390625, -0.0097503662109375, -0.00499725341796875, -0.000244140625, 0.00450897216796875, 0.0092620849609375, 0.01401519775390625, 0.018768310546875, 0.02352142333984375, 0.0282745361328125, 0.03302764892578125, 0.03778076171875, 0.04253387451171875, 0.0472869873046875, 0.05204010009765625, 0.056793212890625, 0.06154632568359375, 0.0662994384765625, 0.07105255126953125, 0.0758056640625, 0.08055877685546875, 0.0853118896484375, 0.09006500244140625, 0.094818115234375, 0.09957122802734375, 0.1043243408203125, 0.10907745361328125, 0.11383056640625, 0.11858367919921875, 0.1233367919921875, 0.12808990478515625, 0.132843017578125, 0.13759613037109375, 0.1423492431640625, 0.14710235595703125, 0.15185546875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 9.0, 9.0, 4.0, 9.0, 15.0, 14.0, 12.0, 22.0, 17.0, 29.0, 46.0, 72.0, 149.0, 140.0, 125.0, 89.0, 57.0, 29.0, 27.0, 26.0, 7.0, 10.0, 4.0, 9.0, 8.0, 8.0, 6.0, 5.0, 4.0, 2.0, 4.0, 4.0, 2.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00022780895233154297, -0.00022038258612155914, -0.00021295621991157532, -0.0002055298537015915, -0.00019810348749160767, -0.00019067712128162384, -0.00018325075507164001, -0.0001758243888616562, -0.00016839802265167236, -0.00016097165644168854, -0.0001535452902317047, -0.00014611892402172089, -0.00013869255781173706, -0.00013126619160175323, -0.0001238398253917694, -0.00011641345918178558, -0.00010898709297180176, -0.00010156072676181793, -9.41343605518341e-05, -8.670799434185028e-05, -7.928162813186646e-05, -7.185526192188263e-05, -6.44288957118988e-05, -5.700252950191498e-05, -4.957616329193115e-05, -4.214979708194733e-05, -3.47234308719635e-05, -2.7297064661979675e-05, -1.987069845199585e-05, -1.2444332242012024e-05, -5.017966032028198e-06, 2.4084001779556274e-06, 9.834766387939453e-06, 1.726113259792328e-05, 2.4687498807907104e-05, 3.211386501789093e-05, 3.9540231227874756e-05, 4.696659743785858e-05, 5.439296364784241e-05, 6.181932985782623e-05, 6.924569606781006e-05, 7.667206227779388e-05, 8.409842848777771e-05, 9.152479469776154e-05, 9.895116090774536e-05, 0.00010637752711772919, 0.00011380389332771301, 0.00012123025953769684, 0.00012865662574768066, 0.0001360829919576645, 0.00014350935816764832, 0.00015093572437763214, 0.00015836209058761597, 0.0001657884567975998, 0.00017321482300758362, 0.00018064118921756744, 0.00018806755542755127, 0.0001954939216375351, 0.00020292028784751892, 0.00021034665405750275, 0.00021777302026748657, 0.0002251993864774704, 0.00023262575268745422, 0.00024005211889743805, 0.0002474784851074219]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 3.0, 8.0, 6.0, 10.0, 12.0, 19.0, 20.0, 17.0, 24.0, 45.0, 71.0, 107.0, 307.0, 1128.0, 10871.0, 787902.0, 240465.0, 6141.0, 802.0, 206.0, 133.0, 52.0, 47.0, 41.0, 26.0, 12.0, 13.0, 14.0, 8.0, 9.0, 4.0, 3.0, 4.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004001617431640625, -0.0038799643516540527, -0.0037583112716674805, -0.003636658191680908, -0.003515005111694336, -0.0033933520317077637, -0.0032716989517211914, -0.003150045871734619, -0.003028392791748047, -0.0029067397117614746, -0.0027850866317749023, -0.00266343355178833, -0.002541780471801758, -0.0024201273918151855, -0.0022984743118286133, -0.002176821231842041, -0.0020551681518554688, -0.0019335150718688965, -0.0018118619918823242, -0.001690208911895752, -0.0015685558319091797, -0.0014469027519226074, -0.0013252496719360352, -0.0012035965919494629, -0.0010819435119628906, -0.0009602904319763184, -0.0008386373519897461, -0.0007169842720031738, -0.0005953311920166016, -0.0004736781120300293, -0.00035202503204345703, -0.00023037195205688477, -0.0001087188720703125, 1.2934207916259766e-05, 0.00013458728790283203, 0.0002562403678894043, 0.00037789344787597656, 0.0004995465278625488, 0.0006211996078491211, 0.0007428526878356934, 0.0008645057678222656, 0.0009861588478088379, 0.0011078119277954102, 0.0012294650077819824, 0.0013511180877685547, 0.001472771167755127, 0.0015944242477416992, 0.0017160773277282715, 0.0018377304077148438, 0.001959383487701416, 0.0020810365676879883, 0.0022026896476745605, 0.002324342727661133, 0.002445995807647705, 0.0025676488876342773, 0.0026893019676208496, 0.002810955047607422, 0.002932608127593994, 0.0030542612075805664, 0.0031759142875671387, 0.003297567367553711, 0.003419220447540283, 0.0035408735275268555, 0.0036625266075134277, 0.0037841796875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 27.0, 39.0, 98.0, 277.0, 307.0, 150.0, 58.0, 30.0, 11.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002455570502206683, -0.0002312363649252802, -0.00021691566507797688, -0.00020259497978258878, -0.00018827427993528545, -0.00017395359463989735, -0.00015963290934450924, -0.00014531222404912114, -0.0001309915242018178, -0.0001166708316304721, -0.00010235013905912638, -8.802945376373827e-05, -7.370876119239256e-05, -5.938806862104684e-05, -4.506738332565874e-05, -3.074669075431302e-05, -1.6425998182967305e-05, -2.105307430610992e-06, 1.2215383321745321e-05, 2.653607225511223e-05, 4.085676482645795e-05, 5.5177457397803664e-05, 6.949814269319177e-05, 8.381883526453748e-05, 9.81395278358832e-05, 0.00011246022040722892, 0.00012678091297857463, 0.00014110159827396274, 0.00015542228356935084, 0.00016974298341665417, 0.00018406366871204227, 0.0001983843685593456, 0.0002127050538547337, 0.0002270257391501218, 0.00024134643899742514, 0.00025566713884472847, 0.00026998782414011657, 0.0002843085094355047, 0.0002986291947308928, 0.0003129498800262809, 0.00032727059442549944, 0.00034159127972088754, 0.00035591196501627564, 0.0003702326794154942, 0.0003845533647108823, 0.0003988740500062704, 0.0004131947353016585, 0.0004275154205970466, 0.0004418361058924347, 0.0004561567911878228, 0.0004704774764832109, 0.000484798161778599, 0.0004991188761778176, 0.0005134395323693752, 0.0005277602467685938, 0.0005420809611678123, 0.00055640161735937, 0.0005707223317585886, 0.0005850429879501462, 0.0005993637023493648, 0.0006136843585409224, 0.000628005072940141, 0.0006423257291316986, 0.0006566464435309172, 0.0006709671579301357]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 8.0, 7.0, 3.0, 3.0, 15.0, 17.0, 11.0, 12.0, 8.0, 27.0, 15.0, 18.0, 31.0, 29.0, 46.0, 36.0, 35.0, 32.0, 38.0, 53.0, 43.0, 36.0, 39.0, 29.0, 37.0, 31.0, 45.0, 35.0, 28.0, 32.0, 29.0, 21.0, 26.0, 15.0, 15.0, 13.0, 14.0, 7.0, 14.0, 11.0, 8.0, 10.0, 8.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.071826934814453e-05, -8.761603385210037e-05, -8.451379835605621e-05, -8.141156286001205e-05, -7.83093273639679e-05, -7.520709186792374e-05, -7.210485637187958e-05, -6.900262087583542e-05, -6.590038537979126e-05, -6.27981498837471e-05, -5.969591438770294e-05, -5.659367889165878e-05, -5.3491443395614624e-05, -5.0389207899570465e-05, -4.7286972403526306e-05, -4.418473690748215e-05, -4.108250141143799e-05, -3.798026591539383e-05, -3.487803041934967e-05, -3.177579492330551e-05, -2.8673559427261353e-05, -2.5571323931217194e-05, -2.2469088435173035e-05, -1.9366852939128876e-05, -1.6264617443084717e-05, -1.3162381947040558e-05, -1.0060146450996399e-05, -6.95791095495224e-06, -3.855675458908081e-06, -7.534399628639221e-07, 2.348795533180237e-06, 5.451031029224396e-06, 8.553266525268555e-06, 1.1655502021312714e-05, 1.4757737517356873e-05, 1.785997301340103e-05, 2.096220850944519e-05, 2.406444400548935e-05, 2.7166679501533508e-05, 3.0268914997577667e-05, 3.3371150493621826e-05, 3.6473385989665985e-05, 3.9575621485710144e-05, 4.26778569817543e-05, 4.578009247779846e-05, 4.888232797384262e-05, 5.198456346988678e-05, 5.508679896593094e-05, 5.81890344619751e-05, 6.129126995801926e-05, 6.439350545406342e-05, 6.749574095010757e-05, 7.059797644615173e-05, 7.370021194219589e-05, 7.680244743824005e-05, 7.990468293428421e-05, 8.300691843032837e-05, 8.610915392637253e-05, 8.921138942241669e-05, 9.231362491846085e-05, 9.5415860414505e-05, 9.851809591054916e-05, 0.00010162033140659332, 0.00010472256690263748, 0.00010782480239868164]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 6.0, 10.0, 11.0, 9.0, 9.0, 23.0, 18.0, 25.0, 26.0, 24.0, 35.0, 43.0, 45.0, 42.0, 37.0, 42.0, 43.0, 39.0, 34.0, 52.0, 44.0, 37.0, 45.0, 33.0, 42.0, 32.0, 23.0, 21.0, 16.0, 20.0, 28.0, 14.0, 13.0, 13.0, 7.0, 3.0, 12.0, 7.0, 6.0, 4.0, 4.0, 1.0, 3.0], "bins": [-6.1953125, -6.03692626953125, -5.8785400390625, -5.72015380859375, -5.561767578125, -5.40338134765625, -5.2449951171875, -5.08660888671875, -4.92822265625, -4.76983642578125, -4.6114501953125, -4.45306396484375, -4.294677734375, -4.13629150390625, -3.9779052734375, -3.81951904296875, -3.6611328125, -3.50274658203125, -3.3443603515625, -3.18597412109375, -3.027587890625, -2.86920166015625, -2.7108154296875, -2.55242919921875, -2.39404296875, -2.23565673828125, -2.0772705078125, -1.91888427734375, -1.760498046875, -1.60211181640625, -1.4437255859375, -1.28533935546875, -1.126953125, -0.96856689453125, -0.8101806640625, -0.65179443359375, -0.493408203125, -0.33502197265625, -0.1766357421875, -0.01824951171875, 0.14013671875, 0.29852294921875, 0.4569091796875, 0.61529541015625, 0.773681640625, 0.93206787109375, 1.0904541015625, 1.24884033203125, 1.4072265625, 1.56561279296875, 1.7239990234375, 1.88238525390625, 2.040771484375, 2.19915771484375, 2.3575439453125, 2.51593017578125, 2.67431640625, 2.83270263671875, 2.9910888671875, 3.14947509765625, 3.307861328125, 3.46624755859375, 3.6246337890625, 3.78302001953125, 3.94140625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 3.0, 2.0, 5.0, 4.0, 8.0, 11.0, 14.0, 14.0, 33.0, 42.0, 67.0, 73.0, 114.0, 134.0, 209.0, 286.0, 370.0, 507.0, 601.0, 820.0, 1082.0, 1392.0, 1836.0, 2648.0, 4260.0, 7782.0, 18129.0, 54260.0, 233401.0, 524242.0, 129270.0, 35439.0, 12969.0, 5977.0, 3423.0, 2277.0, 1642.0, 1277.0, 925.0, 751.0, 549.0, 449.0, 331.0, 265.0, 185.0, 135.0, 105.0, 66.0, 46.0, 40.0, 23.0, 27.0, 13.0, 15.0, 4.0, 5.0, 7.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.203125, -5.0421142578125, -4.881103515625, -4.7200927734375, -4.55908203125, -4.3980712890625, -4.237060546875, -4.0760498046875, -3.9150390625, -3.7540283203125, -3.593017578125, -3.4320068359375, -3.27099609375, -3.1099853515625, -2.948974609375, -2.7879638671875, -2.626953125, -2.4659423828125, -2.304931640625, -2.1439208984375, -1.98291015625, -1.8218994140625, -1.660888671875, -1.4998779296875, -1.3388671875, -1.1778564453125, -1.016845703125, -0.8558349609375, -0.69482421875, -0.5338134765625, -0.372802734375, -0.2117919921875, -0.05078125, 0.1102294921875, 0.271240234375, 0.4322509765625, 0.59326171875, 0.7542724609375, 0.915283203125, 1.0762939453125, 1.2373046875, 1.3983154296875, 1.559326171875, 1.7203369140625, 1.88134765625, 2.0423583984375, 2.203369140625, 2.3643798828125, 2.525390625, 2.6864013671875, 2.847412109375, 3.0084228515625, 3.16943359375, 3.3304443359375, 3.491455078125, 3.6524658203125, 3.8134765625, 3.9744873046875, 4.135498046875, 4.2965087890625, 4.45751953125, 4.6185302734375, 4.779541015625, 4.9405517578125, 5.1015625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 8.0, 8.0, 10.0, 21.0, 14.0, 19.0, 18.0, 23.0, 26.0, 40.0, 40.0, 55.0, 47.0, 57.0, 72.0, 85.0, 300.0, 1506.0, 168.0, 74.0, 62.0, 43.0, 45.0, 44.0, 33.0, 30.0, 28.0, 35.0, 18.0, 18.0, 12.0, 20.0, 13.0, 13.0, 8.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.82958984375, -15.2685546875, -14.70751953125, -14.146484375, -13.58544921875, -13.0244140625, -12.46337890625, -11.90234375, -11.34130859375, -10.7802734375, -10.21923828125, -9.658203125, -9.09716796875, -8.5361328125, -7.97509765625, -7.4140625, -6.85302734375, -6.2919921875, -5.73095703125, -5.169921875, -4.60888671875, -4.0478515625, -3.48681640625, -2.92578125, -2.36474609375, -1.8037109375, -1.24267578125, -0.681640625, -0.12060546875, 0.4404296875, 1.00146484375, 1.5625, 2.12353515625, 2.6845703125, 3.24560546875, 3.806640625, 4.36767578125, 4.9287109375, 5.48974609375, 6.05078125, 6.61181640625, 7.1728515625, 7.73388671875, 8.294921875, 8.85595703125, 9.4169921875, 9.97802734375, 10.5390625, 11.10009765625, 11.6611328125, 12.22216796875, 12.783203125, 13.34423828125, 13.9052734375, 14.46630859375, 15.02734375, 15.58837890625, 16.1494140625, 16.71044921875, 17.271484375, 17.83251953125, 18.3935546875, 18.95458984375, 19.515625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 7.0, 15.0, 19.0, 38.0, 69.0, 105.0, 223.0, 638.0, 4764.0, 3120020.0, 18358.0, 875.0, 289.0, 135.0, 70.0, 26.0, 21.0, 16.0, 8.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-130.5, -127.4404296875, -124.380859375, -121.3212890625, -118.26171875, -115.2021484375, -112.142578125, -109.0830078125, -106.0234375, -102.9638671875, -99.904296875, -96.8447265625, -93.78515625, -90.7255859375, -87.666015625, -84.6064453125, -81.546875, -78.4873046875, -75.427734375, -72.3681640625, -69.30859375, -66.2490234375, -63.189453125, -60.1298828125, -57.0703125, -54.0107421875, -50.951171875, -47.8916015625, -44.83203125, -41.7724609375, -38.712890625, -35.6533203125, -32.59375, -29.5341796875, -26.474609375, -23.4150390625, -20.35546875, -17.2958984375, -14.236328125, -11.1767578125, -8.1171875, -5.0576171875, -1.998046875, 1.0615234375, 4.12109375, 7.1806640625, 10.240234375, 13.2998046875, 16.359375, 19.4189453125, 22.478515625, 25.5380859375, 28.59765625, 31.6572265625, 34.716796875, 37.7763671875, 40.8359375, 43.8955078125, 46.955078125, 50.0146484375, 53.07421875, 56.1337890625, 59.193359375, 62.2529296875, 65.3125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 10.0, 115.0, 702.0, 185.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.335866928100586, -19.8385009765625, -14.341134071350098, -8.843767166137695, -3.3464012145996094, 2.1509647369384766, 7.648332595825195, 13.145696640014648, 18.643064498901367, 24.140430450439453, 29.637798309326172, 35.135162353515625, 40.632530212402344, 46.12989807128906, 51.62726593017578, 57.12462615966797, 62.62199401855469, 68.1193618774414, 73.61672973632812, 79.11408996582031, 84.61145782470703, 90.10882568359375, 95.60619354248047, 101.10356140136719, 106.6009292602539, 112.09829711914062, 117.59566497802734, 123.09303283691406, 128.59039306640625, 134.0877685546875, 139.5851287841797, 145.08248901367188, 150.57984924316406, 156.07720947265625, 161.5745849609375, 167.0719451904297, 172.56932067871094, 178.06668090820312, 183.56405639648438, 189.06141662597656, 194.55877685546875, 200.05613708496094, 205.5535125732422, 211.05087280273438, 216.54824829101562, 222.0456085205078, 227.54296875, 233.04034423828125, 238.5377197265625, 244.0350799560547, 249.53245544433594, 255.02981567382812, 260.5271911621094, 266.0245361328125, 271.52191162109375, 277.019287109375, 282.5166320800781, 288.0140075683594, 293.5113525390625, 299.00872802734375, 304.506103515625, 310.00347900390625, 315.5008239746094, 320.9981994628906, 326.4955749511719]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 9.0, 4.0, 8.0, 3.0, 7.0, 14.0, 21.0, 21.0, 18.0, 24.0, 29.0, 38.0, 24.0, 34.0, 45.0, 48.0, 39.0, 39.0, 38.0, 43.0, 39.0, 42.0, 51.0, 30.0, 35.0, 36.0, 36.0, 29.0, 35.0, 36.0, 16.0, 13.0, 23.0, 20.0, 15.0, 11.0, 8.0, 3.0, 8.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-59.065223693847656, -57.421199798583984, -55.77717590332031, -54.133148193359375, -52.4891242980957, -50.84510040283203, -49.20107650756836, -47.55705261230469, -45.91302490234375, -44.26900100708008, -42.624977111816406, -40.98094940185547, -39.3369255065918, -37.692901611328125, -36.04887771606445, -34.40485382080078, -32.76082992553711, -31.116806030273438, -29.472780227661133, -27.82875633239746, -26.184730529785156, -24.540706634521484, -22.896682739257812, -21.25265884399414, -19.608633041381836, -17.964609146118164, -16.32058334350586, -14.676559448242188, -13.0325345993042, -11.388509750366211, -9.744485855102539, -8.10046100616455, -6.456439971923828, -4.81241512298584, -3.1683907508850098, -1.5243663787841797, 0.1196584701538086, 1.7636833190917969, 3.4077072143554688, 5.051732063293457, 6.695756912231445, 8.339781761169434, 9.983806610107422, 11.627830505371094, 13.271855354309082, 14.91588020324707, 16.559904098510742, 18.203929901123047, 19.84795379638672, 21.49197769165039, 23.136003494262695, 24.780027389526367, 26.424053192138672, 28.068077087402344, 29.712100982666016, 31.356124877929688, 33.000152587890625, 34.6441764831543, 36.28820037841797, 37.932228088378906, 39.57625198364258, 41.22027587890625, 42.86429977416992, 44.508323669433594, 46.152347564697266]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 7.0, 14.0, 7.0, 15.0, 20.0, 18.0, 19.0, 29.0, 36.0, 26.0, 32.0, 38.0, 42.0, 49.0, 46.0, 42.0, 36.0, 50.0, 43.0, 35.0, 35.0, 44.0, 32.0, 32.0, 26.0, 34.0, 24.0, 20.0, 18.0, 17.0, 20.0, 17.0, 8.0, 10.0, 13.0, 4.0, 5.0, 7.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-5.80859375, -5.6475830078125, -5.486572265625, -5.3255615234375, -5.16455078125, -5.0035400390625, -4.842529296875, -4.6815185546875, -4.5205078125, -4.3594970703125, -4.198486328125, -4.0374755859375, -3.87646484375, -3.7154541015625, -3.554443359375, -3.3934326171875, -3.232421875, -3.0714111328125, -2.910400390625, -2.7493896484375, -2.58837890625, -2.4273681640625, -2.266357421875, -2.1053466796875, -1.9443359375, -1.7833251953125, -1.622314453125, -1.4613037109375, -1.30029296875, -1.1392822265625, -0.978271484375, -0.8172607421875, -0.65625, -0.4952392578125, -0.334228515625, -0.1732177734375, -0.01220703125, 0.1488037109375, 0.309814453125, 0.4708251953125, 0.6318359375, 0.7928466796875, 0.953857421875, 1.1148681640625, 1.27587890625, 1.4368896484375, 1.597900390625, 1.7589111328125, 1.919921875, 2.0809326171875, 2.241943359375, 2.4029541015625, 2.56396484375, 2.7249755859375, 2.885986328125, 3.0469970703125, 3.2080078125, 3.3690185546875, 3.530029296875, 3.6910400390625, 3.85205078125, 4.0130615234375, 4.174072265625, 4.3350830078125, 4.49609375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 8.0, 5.0, 12.0, 22.0, 21.0, 31.0, 41.0, 64.0, 80.0, 128.0, 174.0, 247.0, 432.0, 693.0, 1218.0, 1999.0, 3469.0, 6152.0, 12369.0, 28056.0, 128047.0, 1286075.0, 2336097.0, 306298.0, 46138.0, 17010.0, 8497.0, 4519.0, 2632.0, 1504.0, 842.0, 525.0, 288.0, 202.0, 105.0, 84.0, 48.0, 35.0, 38.0, 19.0, 12.0, 14.0, 7.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-11.09375, -10.7491455078125, -10.404541015625, -10.0599365234375, -9.71533203125, -9.3707275390625, -9.026123046875, -8.6815185546875, -8.3369140625, -7.9923095703125, -7.647705078125, -7.3031005859375, -6.95849609375, -6.6138916015625, -6.269287109375, -5.9246826171875, -5.580078125, -5.2354736328125, -4.890869140625, -4.5462646484375, -4.20166015625, -3.8570556640625, -3.512451171875, -3.1678466796875, -2.8232421875, -2.4786376953125, -2.134033203125, -1.7894287109375, -1.44482421875, -1.1002197265625, -0.755615234375, -0.4110107421875, -0.06640625, 0.2781982421875, 0.622802734375, 0.9674072265625, 1.31201171875, 1.6566162109375, 2.001220703125, 2.3458251953125, 2.6904296875, 3.0350341796875, 3.379638671875, 3.7242431640625, 4.06884765625, 4.4134521484375, 4.758056640625, 5.1026611328125, 5.447265625, 5.7918701171875, 6.136474609375, 6.4810791015625, 6.82568359375, 7.1702880859375, 7.514892578125, 7.8594970703125, 8.2041015625, 8.5487060546875, 8.893310546875, 9.2379150390625, 9.58251953125, 9.9271240234375, 10.271728515625, 10.6163330078125, 10.9609375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 10.0, 3.0, 5.0, 6.0, 8.0, 16.0, 18.0, 29.0, 25.0, 38.0, 52.0, 86.0, 74.0, 124.0, 211.0, 292.0, 402.0, 605.0, 551.0, 422.0, 325.0, 224.0, 141.0, 107.0, 58.0, 53.0, 29.0, 34.0, 23.0, 26.0, 13.0, 15.0, 6.0, 3.0, 6.0, 9.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8671875, -10.5172119140625, -10.167236328125, -9.8172607421875, -9.46728515625, -9.1173095703125, -8.767333984375, -8.4173583984375, -8.0673828125, -7.7174072265625, -7.367431640625, -7.0174560546875, -6.66748046875, -6.3175048828125, -5.967529296875, -5.6175537109375, -5.267578125, -4.9176025390625, -4.567626953125, -4.2176513671875, -3.86767578125, -3.5177001953125, -3.167724609375, -2.8177490234375, -2.4677734375, -2.1177978515625, -1.767822265625, -1.4178466796875, -1.06787109375, -0.7178955078125, -0.367919921875, -0.0179443359375, 0.33203125, 0.6820068359375, 1.031982421875, 1.3819580078125, 1.73193359375, 2.0819091796875, 2.431884765625, 2.7818603515625, 3.1318359375, 3.4818115234375, 3.831787109375, 4.1817626953125, 4.53173828125, 4.8817138671875, 5.231689453125, 5.5816650390625, 5.931640625, 6.2816162109375, 6.631591796875, 6.9815673828125, 7.33154296875, 7.6815185546875, 8.031494140625, 8.3814697265625, 8.7314453125, 9.0814208984375, 9.431396484375, 9.7813720703125, 10.13134765625, 10.4813232421875, 10.831298828125, 11.1812744140625, 11.53125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 9.0, 10.0, 11.0, 7.0, 19.0, 20.0, 28.0, 50.0, 61.0, 102.0, 234.0, 449.0, 933.0, 1982.0, 4529.0, 12012.0, 37308.0, 175480.0, 2620716.0, 1198573.0, 99832.0, 26223.0, 9008.0, 3499.0, 1518.0, 785.0, 379.0, 185.0, 113.0, 70.0, 37.0, 24.0, 22.0, 12.0, 9.0, 6.0, 5.0, 6.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-21.609375, -20.9892578125, -20.369140625, -19.7490234375, -19.12890625, -18.5087890625, -17.888671875, -17.2685546875, -16.6484375, -16.0283203125, -15.408203125, -14.7880859375, -14.16796875, -13.5478515625, -12.927734375, -12.3076171875, -11.6875, -11.0673828125, -10.447265625, -9.8271484375, -9.20703125, -8.5869140625, -7.966796875, -7.3466796875, -6.7265625, -6.1064453125, -5.486328125, -4.8662109375, -4.24609375, -3.6259765625, -3.005859375, -2.3857421875, -1.765625, -1.1455078125, -0.525390625, 0.0947265625, 0.71484375, 1.3349609375, 1.955078125, 2.5751953125, 3.1953125, 3.8154296875, 4.435546875, 5.0556640625, 5.67578125, 6.2958984375, 6.916015625, 7.5361328125, 8.15625, 8.7763671875, 9.396484375, 10.0166015625, 10.63671875, 11.2568359375, 11.876953125, 12.4970703125, 13.1171875, 13.7373046875, 14.357421875, 14.9775390625, 15.59765625, 16.2177734375, 16.837890625, 17.4580078125, 18.078125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 17.0, 37.0, 79.0, 143.0, 235.0, 209.0, 136.0, 71.0, 29.0, 23.0, 10.0, 4.0, 2.0, 5.0, 2.0, 1.0], "bins": [-184.7446746826172, -181.25218200683594, -177.7596893310547, -174.26719665527344, -170.7747039794922, -167.28221130371094, -163.7897186279297, -160.2972412109375, -156.80474853515625, -153.312255859375, -149.81976318359375, -146.3272705078125, -142.83477783203125, -139.34228515625, -135.84979248046875, -132.3572998046875, -128.86480712890625, -125.372314453125, -121.87982177734375, -118.3873291015625, -114.89483642578125, -111.40234375, -107.90985870361328, -104.41736602783203, -100.92487335205078, -97.43238067626953, -93.93988800048828, -90.44739532470703, -86.95491027832031, -83.46241760253906, -79.96992492675781, -76.47743225097656, -72.98493957519531, -69.49244689941406, -65.99995422363281, -62.50746536254883, -59.01497268676758, -55.52248001098633, -52.029991149902344, -48.537498474121094, -45.04500198364258, -41.55250930786133, -38.060020446777344, -34.567527770996094, -31.075035095214844, -27.582542419433594, -24.090051651000977, -20.59756088256836, -17.10506820678711, -13.612576484680176, -10.120084762573242, -6.627593040466309, -3.135101318359375, 0.357391357421875, 3.849882125854492, 7.342372894287109, 10.83486557006836, 14.327357292175293, 17.819849014282227, 21.312339782714844, 24.804832458496094, 28.297325134277344, 31.78981590270996, 35.28230667114258, 38.77479934692383]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 9.0, 8.0, 7.0, 13.0, 16.0, 14.0, 12.0, 15.0, 24.0, 24.0, 29.0, 32.0, 33.0, 38.0, 46.0, 32.0, 47.0, 32.0, 49.0, 37.0, 43.0, 31.0, 47.0, 41.0, 28.0, 31.0, 34.0, 18.0, 27.0, 19.0, 22.0, 18.0, 21.0, 23.0, 12.0, 17.0, 8.0, 6.0, 8.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.559051513671875, -36.393348693847656, -35.2276496887207, -34.061946868896484, -32.896244049072266, -31.73054313659668, -30.564842224121094, -29.399139404296875, -28.23343849182129, -27.067737579345703, -25.902034759521484, -24.7363338470459, -23.570632934570312, -22.404930114746094, -21.239229202270508, -20.073528289794922, -18.907825469970703, -17.742124557495117, -16.5764217376709, -15.410720825195312, -14.24501895904541, -13.079317092895508, -11.913616180419922, -10.74791431427002, -9.582212448120117, -8.416510581970215, -7.250809192657471, -6.085107803344727, -4.919405937194824, -3.753704071044922, -2.5880026817321777, -1.4223012924194336, -0.2565956115722656, 0.9091060161590576, 2.074807643890381, 3.240509271621704, 4.406210899353027, 5.57191276550293, 6.737614154815674, 7.903315544128418, 9.06901741027832, 10.234719276428223, 11.400421142578125, 12.566122055053711, 13.731823921203613, 14.897525787353516, 16.0632266998291, 17.228927612304688, 18.394630432128906, 19.560331344604492, 20.72603416442871, 21.891735076904297, 23.057437896728516, 24.2231388092041, 25.388839721679688, 26.554542541503906, 27.720243453979492, 28.885944366455078, 30.051647186279297, 31.217348098754883, 32.38304901123047, 33.54875183105469, 34.714454650878906, 35.88015365600586, 37.04585647583008]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 2.0, 5.0, 9.0, 3.0, 12.0, 12.0, 11.0, 10.0, 19.0, 17.0, 19.0, 22.0, 25.0, 28.0, 31.0, 27.0, 28.0, 34.0, 37.0, 48.0, 40.0, 35.0, 45.0, 49.0, 31.0, 31.0, 45.0, 38.0, 29.0, 27.0, 30.0, 23.0, 28.0, 21.0, 20.0, 17.0, 15.0, 11.0, 5.0, 8.0, 11.0, 4.0, 5.0, 5.0, 5.0, 7.0, 3.0, 4.0, 1.0, 3.0], "bins": [-5.28515625, -5.1380615234375, -4.990966796875, -4.8438720703125, -4.69677734375, -4.5496826171875, -4.402587890625, -4.2554931640625, -4.1083984375, -3.9613037109375, -3.814208984375, -3.6671142578125, -3.52001953125, -3.3729248046875, -3.225830078125, -3.0787353515625, -2.931640625, -2.7845458984375, -2.637451171875, -2.4903564453125, -2.34326171875, -2.1961669921875, -2.049072265625, -1.9019775390625, -1.7548828125, -1.6077880859375, -1.460693359375, -1.3135986328125, -1.16650390625, -1.0194091796875, -0.872314453125, -0.7252197265625, -0.578125, -0.4310302734375, -0.283935546875, -0.1368408203125, 0.01025390625, 0.1573486328125, 0.304443359375, 0.4515380859375, 0.5986328125, 0.7457275390625, 0.892822265625, 1.0399169921875, 1.18701171875, 1.3341064453125, 1.481201171875, 1.6282958984375, 1.775390625, 1.9224853515625, 2.069580078125, 2.2166748046875, 2.36376953125, 2.5108642578125, 2.657958984375, 2.8050537109375, 2.9521484375, 3.0992431640625, 3.246337890625, 3.3934326171875, 3.54052734375, 3.6876220703125, 3.834716796875, 3.9818115234375, 4.12890625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 11.0, 11.0, 15.0, 21.0, 37.0, 42.0, 79.0, 102.0, 169.0, 232.0, 356.0, 526.0, 801.0, 1194.0, 1800.0, 2705.0, 4136.0, 6257.0, 9622.0, 15167.0, 24159.0, 38024.0, 63540.0, 111522.0, 213159.0, 239972.0, 127398.0, 70947.0, 42724.0, 25973.0, 16767.0, 10840.0, 7121.0, 4463.0, 2863.0, 1891.0, 1277.0, 865.0, 556.0, 383.0, 256.0, 176.0, 112.0, 88.0, 51.0, 51.0, 21.0, 25.0, 16.0, 13.0, 7.0, 12.0, 2.0, 3.0], "bins": [-0.2193603515625, -0.21311187744140625, -0.2068634033203125, -0.20061492919921875, -0.194366455078125, -0.18811798095703125, -0.1818695068359375, -0.17562103271484375, -0.16937255859375, -0.16312408447265625, -0.1568756103515625, -0.15062713623046875, -0.144378662109375, -0.13813018798828125, -0.1318817138671875, -0.12563323974609375, -0.119384765625, -0.11313629150390625, -0.1068878173828125, -0.10063934326171875, -0.094390869140625, -0.08814239501953125, -0.0818939208984375, -0.07564544677734375, -0.06939697265625, -0.06314849853515625, -0.0569000244140625, -0.05065155029296875, -0.044403076171875, -0.03815460205078125, -0.0319061279296875, -0.02565765380859375, -0.0194091796875, -0.01316070556640625, -0.0069122314453125, -0.00066375732421875, 0.005584716796875, 0.01183319091796875, 0.0180816650390625, 0.02433013916015625, 0.03057861328125, 0.03682708740234375, 0.0430755615234375, 0.04932403564453125, 0.055572509765625, 0.06182098388671875, 0.0680694580078125, 0.07431793212890625, 0.08056640625, 0.08681488037109375, 0.0930633544921875, 0.09931182861328125, 0.105560302734375, 0.11180877685546875, 0.1180572509765625, 0.12430572509765625, 0.13055419921875, 0.13680267333984375, 0.1430511474609375, 0.14929962158203125, 0.155548095703125, 0.16179656982421875, 0.1680450439453125, 0.17429351806640625, 0.1805419921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 6.0, 8.0, 1.0, 6.0, 6.0, 11.0, 16.0, 24.0, 25.0, 20.0, 23.0, 34.0, 30.0, 33.0, 48.0, 45.0, 35.0, 46.0, 42.0, 1065.0, 39.0, 42.0, 56.0, 56.0, 50.0, 41.0, 31.0, 36.0, 25.0, 24.0, 20.0, 18.0, 10.0, 20.0, 13.0, 4.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 2.0], "bins": [-4.875, -4.754425048828125, -4.63385009765625, -4.513275146484375, -4.3927001953125, -4.272125244140625, -4.15155029296875, -4.030975341796875, -3.910400390625, -3.789825439453125, -3.66925048828125, -3.548675537109375, -3.4281005859375, -3.307525634765625, -3.18695068359375, -3.066375732421875, -2.94580078125, -2.825225830078125, -2.70465087890625, -2.584075927734375, -2.4635009765625, -2.342926025390625, -2.22235107421875, -2.101776123046875, -1.981201171875, -1.860626220703125, -1.74005126953125, -1.619476318359375, -1.4989013671875, -1.378326416015625, -1.25775146484375, -1.137176513671875, -1.0166015625, -0.896026611328125, -0.77545166015625, -0.654876708984375, -0.5343017578125, -0.413726806640625, -0.29315185546875, -0.172576904296875, -0.052001953125, 0.068572998046875, 0.18914794921875, 0.309722900390625, 0.4302978515625, 0.550872802734375, 0.67144775390625, 0.792022705078125, 0.91259765625, 1.033172607421875, 1.15374755859375, 1.274322509765625, 1.3948974609375, 1.515472412109375, 1.63604736328125, 1.756622314453125, 1.877197265625, 1.997772216796875, 2.11834716796875, 2.238922119140625, 2.3594970703125, 2.480072021484375, 2.60064697265625, 2.721221923828125, 2.841796875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 9.0, 4.0, 7.0, 13.0, 17.0, 29.0, 50.0, 78.0, 106.0, 163.0, 234.0, 315.0, 527.0, 783.0, 1087.0, 1690.0, 2607.0, 3915.0, 6134.0, 9869.0, 15997.0, 26937.0, 45851.0, 80982.0, 148291.0, 1298643.0, 196710.0, 107327.0, 59694.0, 34228.0, 20467.0, 12401.0, 7753.0, 4880.0, 3203.0, 2074.0, 1366.0, 872.0, 610.0, 382.0, 297.0, 184.0, 132.0, 88.0, 41.0, 32.0, 19.0, 14.0, 9.0, 4.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1612548828125, -0.1561737060546875, -0.151092529296875, -0.1460113525390625, -0.14093017578125, -0.1358489990234375, -0.130767822265625, -0.1256866455078125, -0.12060546875, -0.1155242919921875, -0.110443115234375, -0.1053619384765625, -0.10028076171875, -0.0951995849609375, -0.090118408203125, -0.0850372314453125, -0.0799560546875, -0.0748748779296875, -0.069793701171875, -0.0647125244140625, -0.05963134765625, -0.0545501708984375, -0.049468994140625, -0.0443878173828125, -0.039306640625, -0.0342254638671875, -0.029144287109375, -0.0240631103515625, -0.01898193359375, -0.0139007568359375, -0.008819580078125, -0.0037384033203125, 0.0013427734375, 0.0064239501953125, 0.011505126953125, 0.0165863037109375, 0.02166748046875, 0.0267486572265625, 0.031829833984375, 0.0369110107421875, 0.0419921875, 0.0470733642578125, 0.052154541015625, 0.0572357177734375, 0.06231689453125, 0.0673980712890625, 0.072479248046875, 0.0775604248046875, 0.0826416015625, 0.0877227783203125, 0.092803955078125, 0.0978851318359375, 0.10296630859375, 0.1080474853515625, 0.113128662109375, 0.1182098388671875, 0.123291015625, 0.1283721923828125, 0.133453369140625, 0.1385345458984375, 0.14361572265625, 0.1486968994140625, 0.153778076171875, 0.1588592529296875, 0.1639404296875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 3.0, 5.0, 10.0, 12.0, 25.0, 31.0, 41.0, 51.0, 108.0, 132.0, 167.0, 138.0, 83.0, 59.0, 31.0, 24.0, 18.0, 14.0, 5.0, 6.0, 6.0, 5.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.0002617835998535156, -0.0002547726035118103, -0.000247761607170105, -0.00024075061082839966, -0.00023373961448669434, -0.00022672861814498901, -0.0002197176218032837, -0.00021270662546157837, -0.00020569562911987305, -0.00019868463277816772, -0.0001916736364364624, -0.00018466264009475708, -0.00017765164375305176, -0.00017064064741134644, -0.0001636296510696411, -0.0001566186547279358, -0.00014960765838623047, -0.00014259666204452515, -0.00013558566570281982, -0.0001285746693611145, -0.00012156367301940918, -0.00011455267667770386, -0.00010754168033599854, -0.00010053068399429321, -9.351968765258789e-05, -8.650869131088257e-05, -7.949769496917725e-05, -7.248669862747192e-05, -6.54757022857666e-05, -5.846470594406128e-05, -5.145370960235596e-05, -4.4442713260650635e-05, -3.743171691894531e-05, -3.042072057723999e-05, -2.3409724235534668e-05, -1.6398727893829346e-05, -9.387731552124023e-06, -2.376735210418701e-06, 4.634261131286621e-06, 1.1645257472991943e-05, 1.8656253814697266e-05, 2.5667250156402588e-05, 3.267824649810791e-05, 3.968924283981323e-05, 4.6700239181518555e-05, 5.371123552322388e-05, 6.07222318649292e-05, 6.773322820663452e-05, 7.474422454833984e-05, 8.175522089004517e-05, 8.876621723175049e-05, 9.577721357345581e-05, 0.00010278820991516113, 0.00010979920625686646, 0.00011681020259857178, 0.0001238211989402771, 0.00013083219528198242, 0.00013784319162368774, 0.00014485418796539307, 0.0001518651843070984, 0.0001588761806488037, 0.00016588717699050903, 0.00017289817333221436, 0.00017990916967391968, 0.000186920166015625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 9.0, 7.0, 15.0, 13.0, 18.0, 29.0, 41.0, 55.0, 126.0, 243.0, 1031.0, 24858.0, 996105.0, 24453.0, 971.0, 231.0, 120.0, 52.0, 48.0, 34.0, 19.0, 18.0, 11.0, 7.0, 7.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0031185150146484375, -0.0030008256435394287, -0.00288313627243042, -0.002765446901321411, -0.0026477575302124023, -0.0025300681591033936, -0.0024123787879943848, -0.002294689416885376, -0.002177000045776367, -0.0020593106746673584, -0.0019416213035583496, -0.0018239319324493408, -0.001706242561340332, -0.0015885531902313232, -0.0014708638191223145, -0.0013531744480133057, -0.0012354850769042969, -0.001117795705795288, -0.0010001063346862793, -0.0008824169635772705, -0.0007647275924682617, -0.0006470382213592529, -0.0005293488502502441, -0.00041165947914123535, -0.00029397010803222656, -0.00017628073692321777, -5.8591365814208984e-05, 5.9098005294799805e-05, 0.0001767873764038086, 0.0002944767475128174, 0.00041216611862182617, 0.000529855489730835, 0.0006475448608398438, 0.0007652342319488525, 0.0008829236030578613, 0.0010006129741668701, 0.001118302345275879, 0.0012359917163848877, 0.0013536810874938965, 0.0014713704586029053, 0.001589059829711914, 0.0017067492008209229, 0.0018244385719299316, 0.0019421279430389404, 0.0020598173141479492, 0.002177506685256958, 0.002295196056365967, 0.0024128854274749756, 0.0025305747985839844, 0.002648264169692993, 0.002765953540802002, 0.0028836429119110107, 0.0030013322830200195, 0.0031190216541290283, 0.003236711025238037, 0.003354400396347046, 0.0034720897674560547, 0.0035897791385650635, 0.0037074685096740723, 0.003825157880783081, 0.00394284725189209, 0.004060536623001099, 0.004178225994110107, 0.004295915365219116, 0.004413604736328125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 10.0, 73.0, 585.0, 316.0, 31.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012557857553474605, -9.938875155057758e-05, -7.319892756640911e-05, -4.700910358224064e-05, -2.081927959807217e-05, 5.370544386096299e-06, 3.156036837026477e-05, 5.775019235443324e-05, 8.394001633860171e-05, 0.00011012984032277018, 0.00013631966430693865, 0.00016250948829110712, 0.0001886993122752756, 0.00021488913625944406, 0.00024107896024361253, 0.0002672687987796962, 0.00029345860821194947, 0.0003196484176442027, 0.0003458382561802864, 0.0003720280947163701, 0.00039821790414862335, 0.0004244077135808766, 0.0004505975521169603, 0.000476787390653044, 0.0005029771709814668, 0.0005291670095175505, 0.0005553568480536342, 0.000581546628382057, 0.0006077364669181406, 0.0006339263054542243, 0.0006601160857826471, 0.0006863059243187308, 0.0007124957628548145, 0.0007386856013908982, 0.0007648754399269819, 0.0007910652202554047, 0.0008172550587914884, 0.0008434448973275721, 0.0008696346776559949, 0.0008958245161920786, 0.0009220143547281623, 0.000948204193264246, 0.0009743940318003297, 0.0010005838703364134, 0.0010267735924571753, 0.001052963430993259, 0.0010791532695293427, 0.0011053431080654263, 0.00113153294660151, 0.0011577227851375937, 0.0011839126236736774, 0.0012101024622097611, 0.0012362923007458448, 0.0012624820228666067, 0.0012886718614026904, 0.0013148616999387741, 0.0013410515384748578, 0.0013672413770109415, 0.0013934312155470252, 0.001419621054083109, 0.0014458107762038708, 0.0014720006147399545, 0.0014981904532760382, 0.0015243802918121219, 0.0015505701303482056]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 2.0, 7.0, 10.0, 14.0, 11.0, 19.0, 23.0, 26.0, 29.0, 36.0, 35.0, 40.0, 39.0, 32.0, 34.0, 53.0, 47.0, 48.0, 60.0, 42.0, 55.0, 57.0, 46.0, 38.0, 38.0, 41.0, 28.0, 27.0, 14.0, 19.0, 10.0, 10.0, 10.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.906291961669922e-05, -9.575486183166504e-05, -9.244680404663086e-05, -8.913874626159668e-05, -8.58306884765625e-05, -8.252263069152832e-05, -7.921457290649414e-05, -7.590651512145996e-05, -7.259845733642578e-05, -6.92903995513916e-05, -6.598234176635742e-05, -6.267428398132324e-05, -5.936622619628906e-05, -5.605816841125488e-05, -5.27501106262207e-05, -4.9442052841186523e-05, -4.6133995056152344e-05, -4.2825937271118164e-05, -3.9517879486083984e-05, -3.6209821701049805e-05, -3.2901763916015625e-05, -2.9593706130981445e-05, -2.6285648345947266e-05, -2.2977590560913086e-05, -1.9669532775878906e-05, -1.6361474990844727e-05, -1.3053417205810547e-05, -9.745359420776367e-06, -6.4373016357421875e-06, -3.129243850708008e-06, 1.7881393432617188e-07, 3.4868717193603516e-06, 6.794929504394531e-06, 1.0102987289428711e-05, 1.341104507446289e-05, 1.671910285949707e-05, 2.002716064453125e-05, 2.333521842956543e-05, 2.664327621459961e-05, 2.995133399963379e-05, 3.325939178466797e-05, 3.656744956970215e-05, 3.987550735473633e-05, 4.318356513977051e-05, 4.649162292480469e-05, 4.979968070983887e-05, 5.310773849487305e-05, 5.6415796279907227e-05, 5.9723854064941406e-05, 6.303191184997559e-05, 6.633996963500977e-05, 6.964802742004395e-05, 7.295608520507812e-05, 7.62641429901123e-05, 7.957220077514648e-05, 8.288025856018066e-05, 8.618831634521484e-05, 8.949637413024902e-05, 9.28044319152832e-05, 9.611248970031738e-05, 9.942054748535156e-05, 0.00010272860527038574, 0.00010603666305541992, 0.0001093447208404541, 0.00011265277862548828]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 2.0, 5.0, 9.0, 3.0, 12.0, 12.0, 11.0, 10.0, 19.0, 17.0, 19.0, 22.0, 25.0, 28.0, 31.0, 27.0, 28.0, 34.0, 37.0, 48.0, 40.0, 35.0, 45.0, 49.0, 31.0, 31.0, 45.0, 38.0, 29.0, 27.0, 30.0, 23.0, 28.0, 21.0, 20.0, 17.0, 15.0, 11.0, 5.0, 8.0, 11.0, 4.0, 5.0, 5.0, 5.0, 7.0, 3.0, 4.0, 1.0, 3.0], "bins": [-5.28515625, -5.1380615234375, -4.990966796875, -4.8438720703125, -4.69677734375, -4.5496826171875, -4.402587890625, -4.2554931640625, -4.1083984375, -3.9613037109375, -3.814208984375, -3.6671142578125, -3.52001953125, -3.3729248046875, -3.225830078125, -3.0787353515625, -2.931640625, -2.7845458984375, -2.637451171875, -2.4903564453125, -2.34326171875, -2.1961669921875, -2.049072265625, -1.9019775390625, -1.7548828125, -1.6077880859375, -1.460693359375, -1.3135986328125, -1.16650390625, -1.0194091796875, -0.872314453125, -0.7252197265625, -0.578125, -0.4310302734375, -0.283935546875, -0.1368408203125, 0.01025390625, 0.1573486328125, 0.304443359375, 0.4515380859375, 0.5986328125, 0.7457275390625, 0.892822265625, 1.0399169921875, 1.18701171875, 1.3341064453125, 1.481201171875, 1.6282958984375, 1.775390625, 1.9224853515625, 2.069580078125, 2.2166748046875, 2.36376953125, 2.5108642578125, 2.657958984375, 2.8050537109375, 2.9521484375, 3.0992431640625, 3.246337890625, 3.3934326171875, 3.54052734375, 3.6876220703125, 3.834716796875, 3.9818115234375, 4.12890625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 7.0, 3.0, 4.0, 10.0, 9.0, 7.0, 19.0, 15.0, 27.0, 49.0, 61.0, 109.0, 178.0, 347.0, 621.0, 1136.0, 1990.0, 3747.0, 7852.0, 20973.0, 84973.0, 518478.0, 325726.0, 53687.0, 15313.0, 6250.0, 3096.0, 1674.0, 925.0, 495.0, 286.0, 165.0, 120.0, 58.0, 32.0, 43.0, 11.0, 12.0, 11.0, 11.0, 10.0, 13.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.3203125, -9.05291748046875, -8.7855224609375, -8.51812744140625, -8.250732421875, -7.98333740234375, -7.7159423828125, -7.44854736328125, -7.18115234375, -6.91375732421875, -6.6463623046875, -6.37896728515625, -6.111572265625, -5.84417724609375, -5.5767822265625, -5.30938720703125, -5.0419921875, -4.77459716796875, -4.5072021484375, -4.23980712890625, -3.972412109375, -3.70501708984375, -3.4376220703125, -3.17022705078125, -2.90283203125, -2.63543701171875, -2.3680419921875, -2.10064697265625, -1.833251953125, -1.56585693359375, -1.2984619140625, -1.03106689453125, -0.763671875, -0.49627685546875, -0.2288818359375, 0.03851318359375, 0.305908203125, 0.57330322265625, 0.8406982421875, 1.10809326171875, 1.37548828125, 1.64288330078125, 1.9102783203125, 2.17767333984375, 2.445068359375, 2.71246337890625, 2.9798583984375, 3.24725341796875, 3.5146484375, 3.78204345703125, 4.0494384765625, 4.31683349609375, 4.584228515625, 4.85162353515625, 5.1190185546875, 5.38641357421875, 5.65380859375, 5.92120361328125, 6.1885986328125, 6.45599365234375, 6.723388671875, 6.99078369140625, 7.2581787109375, 7.52557373046875, 7.79296875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 5.0, 12.0, 14.0, 13.0, 22.0, 13.0, 18.0, 29.0, 35.0, 37.0, 44.0, 48.0, 63.0, 79.0, 140.0, 390.0, 1444.0, 173.0, 88.0, 54.0, 56.0, 38.0, 34.0, 37.0, 32.0, 28.0, 20.0, 15.0, 12.0, 17.0, 3.0, 5.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0], "bins": [-24.890625, -24.236083984375, -23.58154296875, -22.927001953125, -22.2724609375, -21.617919921875, -20.96337890625, -20.308837890625, -19.654296875, -18.999755859375, -18.34521484375, -17.690673828125, -17.0361328125, -16.381591796875, -15.72705078125, -15.072509765625, -14.41796875, -13.763427734375, -13.10888671875, -12.454345703125, -11.7998046875, -11.145263671875, -10.49072265625, -9.836181640625, -9.181640625, -8.527099609375, -7.87255859375, -7.218017578125, -6.5634765625, -5.908935546875, -5.25439453125, -4.599853515625, -3.9453125, -3.290771484375, -2.63623046875, -1.981689453125, -1.3271484375, -0.672607421875, -0.01806640625, 0.636474609375, 1.291015625, 1.945556640625, 2.60009765625, 3.254638671875, 3.9091796875, 4.563720703125, 5.21826171875, 5.872802734375, 6.52734375, 7.181884765625, 7.83642578125, 8.490966796875, 9.1455078125, 9.800048828125, 10.45458984375, 11.109130859375, 11.763671875, 12.418212890625, 13.07275390625, 13.727294921875, 14.3818359375, 15.036376953125, 15.69091796875, 16.345458984375, 17.0]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 9.0, 5.0, 3.0, 4.0, 9.0, 10.0, 7.0, 17.0, 23.0, 31.0, 44.0, 55.0, 59.0, 101.0, 152.0, 224.0, 372.0, 892.0, 6559.0, 1615961.0, 1512765.0, 6454.0, 893.0, 353.0, 198.0, 150.0, 94.0, 64.0, 54.0, 28.0, 35.0, 19.0, 14.0, 13.0, 11.0, 9.0, 8.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.15625, -35.60791015625, -34.0595703125, -32.51123046875, -30.962890625, -29.41455078125, -27.8662109375, -26.31787109375, -24.76953125, -23.22119140625, -21.6728515625, -20.12451171875, -18.576171875, -17.02783203125, -15.4794921875, -13.93115234375, -12.3828125, -10.83447265625, -9.2861328125, -7.73779296875, -6.189453125, -4.64111328125, -3.0927734375, -1.54443359375, 0.00390625, 1.55224609375, 3.1005859375, 4.64892578125, 6.197265625, 7.74560546875, 9.2939453125, 10.84228515625, 12.390625, 13.93896484375, 15.4873046875, 17.03564453125, 18.583984375, 20.13232421875, 21.6806640625, 23.22900390625, 24.77734375, 26.32568359375, 27.8740234375, 29.42236328125, 30.970703125, 32.51904296875, 34.0673828125, 35.61572265625, 37.1640625, 38.71240234375, 40.2607421875, 41.80908203125, 43.357421875, 44.90576171875, 46.4541015625, 48.00244140625, 49.55078125, 51.09912109375, 52.6474609375, 54.19580078125, 55.744140625, 57.29248046875, 58.8408203125, 60.38916015625, 61.9375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 88.0, 734.0, 187.0, 6.0], "bins": [-352.61859130859375, -346.8965759277344, -341.174560546875, -335.4525146484375, -329.7304992675781, -324.00848388671875, -318.2864685058594, -312.564453125, -306.8424072265625, -301.1203918457031, -295.39837646484375, -289.67633056640625, -283.9543151855469, -278.2322998046875, -272.5102844238281, -266.78826904296875, -261.0662536621094, -255.34423828125, -249.62220764160156, -243.9001922607422, -238.17816162109375, -232.45614624023438, -226.734130859375, -221.01210021972656, -215.29006958007812, -209.56805419921875, -203.8460235595703, -198.12400817871094, -192.4019775390625, -186.67996215820312, -180.95794677734375, -175.2359161376953, -169.51390075683594, -163.79188537597656, -158.06985473632812, -152.34783935546875, -146.6258087158203, -140.90379333496094, -135.1817626953125, -129.45974731445312, -123.73772430419922, -118.01570129394531, -112.2936782836914, -106.5716552734375, -100.84963989257812, -95.12761688232422, -89.40559387207031, -83.68357849121094, -77.9615478515625, -72.2395248413086, -66.51750183105469, -60.79548263549805, -55.073463439941406, -49.3514404296875, -43.629417419433594, -37.90739822387695, -32.18537521362305, -26.463354110717773, -20.7413330078125, -15.019309997558594, -9.29728889465332, -3.575267791748047, 2.1467552185058594, 7.8687744140625, 13.59079647064209]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 5.0, 11.0, 8.0, 23.0, 11.0, 14.0, 17.0, 17.0, 21.0, 34.0, 23.0, 23.0, 34.0, 26.0, 29.0, 44.0, 55.0, 43.0, 38.0, 43.0, 51.0, 45.0, 36.0, 39.0, 37.0, 38.0, 41.0, 41.0, 24.0, 25.0, 22.0, 13.0, 21.0, 18.0, 10.0, 6.0, 6.0, 6.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-52.89966583251953, -51.41289520263672, -49.926124572753906, -48.439353942871094, -46.95258712768555, -45.465816497802734, -43.97904586791992, -42.49227523803711, -41.0055046081543, -39.518733978271484, -38.03196334838867, -36.545196533203125, -35.05842590332031, -33.5716552734375, -32.08488464355469, -30.598114013671875, -29.111345291137695, -27.624574661254883, -26.137805938720703, -24.65103530883789, -23.164264678955078, -21.677494049072266, -20.190725326538086, -18.703954696655273, -17.217185974121094, -15.730416297912598, -14.243645668029785, -12.756875991821289, -11.270105361938477, -9.78333568572998, -8.296566009521484, -6.809795379638672, -5.323024749755859, -3.836254596710205, -2.34948468208313, -0.8627147674560547, 0.6240553855895996, 2.110825538635254, 3.59759521484375, 5.0843658447265625, 6.571135520935059, 8.057905197143555, 9.544675827026367, 11.031445503234863, 12.51821517944336, 14.004985809326172, 15.491755485534668, 16.978527069091797, 18.465295791625977, 19.95206642150879, 21.43883514404297, 22.92560577392578, 24.412376403808594, 25.899147033691406, 27.385915756225586, 28.8726863861084, 30.359455108642578, 31.84622573852539, 33.3329963684082, 34.81976318359375, 36.30653381347656, 37.793304443359375, 39.28007507324219, 40.766845703125, 42.25361633300781]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 6.0, 6.0, 7.0, 7.0, 22.0, 9.0, 8.0, 22.0, 22.0, 12.0, 22.0, 28.0, 31.0, 27.0, 25.0, 26.0, 40.0, 39.0, 51.0, 36.0, 42.0, 48.0, 39.0, 37.0, 35.0, 38.0, 21.0, 32.0, 29.0, 34.0, 27.0, 18.0, 30.0, 15.0, 12.0, 13.0, 12.0, 10.0, 7.0, 7.0, 8.0, 8.0, 4.0, 6.0, 5.0, 1.0, 1.0, 5.0, 3.0], "bins": [-5.55078125, -5.39544677734375, -5.2401123046875, -5.08477783203125, -4.929443359375, -4.77410888671875, -4.6187744140625, -4.46343994140625, -4.30810546875, -4.15277099609375, -3.9974365234375, -3.84210205078125, -3.686767578125, -3.53143310546875, -3.3760986328125, -3.22076416015625, -3.0654296875, -2.91009521484375, -2.7547607421875, -2.59942626953125, -2.444091796875, -2.28875732421875, -2.1334228515625, -1.97808837890625, -1.82275390625, -1.66741943359375, -1.5120849609375, -1.35675048828125, -1.201416015625, -1.04608154296875, -0.8907470703125, -0.73541259765625, -0.580078125, -0.42474365234375, -0.2694091796875, -0.11407470703125, 0.041259765625, 0.19659423828125, 0.3519287109375, 0.50726318359375, 0.66259765625, 0.81793212890625, 0.9732666015625, 1.12860107421875, 1.283935546875, 1.43927001953125, 1.5946044921875, 1.74993896484375, 1.9052734375, 2.06060791015625, 2.2159423828125, 2.37127685546875, 2.526611328125, 2.68194580078125, 2.8372802734375, 2.99261474609375, 3.14794921875, 3.30328369140625, 3.4586181640625, 3.61395263671875, 3.769287109375, 3.92462158203125, 4.0799560546875, 4.23529052734375, 4.390625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 3.0, 5.0, 4.0, 5.0, 4.0, 6.0, 6.0, 14.0, 18.0, 23.0, 21.0, 26.0, 39.0, 58.0, 85.0, 186.0, 378.0, 807.0, 1846.0, 4540.0, 12566.0, 49740.0, 1125193.0, 2839130.0, 127165.0, 20221.0, 6907.0, 2847.0, 1156.0, 574.0, 267.0, 139.0, 78.0, 50.0, 33.0, 27.0, 16.0, 21.0, 20.0, 10.0, 6.0, 5.0, 12.0, 7.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-20.765625, -20.175537109375, -19.58544921875, -18.995361328125, -18.4052734375, -17.815185546875, -17.22509765625, -16.635009765625, -16.044921875, -15.454833984375, -14.86474609375, -14.274658203125, -13.6845703125, -13.094482421875, -12.50439453125, -11.914306640625, -11.32421875, -10.734130859375, -10.14404296875, -9.553955078125, -8.9638671875, -8.373779296875, -7.78369140625, -7.193603515625, -6.603515625, -6.013427734375, -5.42333984375, -4.833251953125, -4.2431640625, -3.653076171875, -3.06298828125, -2.472900390625, -1.8828125, -1.292724609375, -0.70263671875, -0.112548828125, 0.4775390625, 1.067626953125, 1.65771484375, 2.247802734375, 2.837890625, 3.427978515625, 4.01806640625, 4.608154296875, 5.1982421875, 5.788330078125, 6.37841796875, 6.968505859375, 7.55859375, 8.148681640625, 8.73876953125, 9.328857421875, 9.9189453125, 10.509033203125, 11.09912109375, 11.689208984375, 12.279296875, 12.869384765625, 13.45947265625, 14.049560546875, 14.6396484375, 15.229736328125, 15.81982421875, 16.409912109375, 17.0]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 11.0, 9.0, 14.0, 11.0, 16.0, 20.0, 26.0, 38.0, 50.0, 73.0, 112.0, 154.0, 225.0, 399.0, 502.0, 616.0, 562.0, 378.0, 259.0, 160.0, 112.0, 75.0, 61.0, 50.0, 38.0, 27.0, 15.0, 10.0, 12.0, 9.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.78125, -12.38916015625, -11.9970703125, -11.60498046875, -11.212890625, -10.82080078125, -10.4287109375, -10.03662109375, -9.64453125, -9.25244140625, -8.8603515625, -8.46826171875, -8.076171875, -7.68408203125, -7.2919921875, -6.89990234375, -6.5078125, -6.11572265625, -5.7236328125, -5.33154296875, -4.939453125, -4.54736328125, -4.1552734375, -3.76318359375, -3.37109375, -2.97900390625, -2.5869140625, -2.19482421875, -1.802734375, -1.41064453125, -1.0185546875, -0.62646484375, -0.234375, 0.15771484375, 0.5498046875, 0.94189453125, 1.333984375, 1.72607421875, 2.1181640625, 2.51025390625, 2.90234375, 3.29443359375, 3.6865234375, 4.07861328125, 4.470703125, 4.86279296875, 5.2548828125, 5.64697265625, 6.0390625, 6.43115234375, 6.8232421875, 7.21533203125, 7.607421875, 7.99951171875, 8.3916015625, 8.78369140625, 9.17578125, 9.56787109375, 9.9599609375, 10.35205078125, 10.744140625, 11.13623046875, 11.5283203125, 11.92041015625, 12.3125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 6.0, 13.0, 7.0, 6.0, 11.0, 21.0, 27.0, 32.0, 76.0, 139.0, 205.0, 476.0, 1178.0, 3665.0, 13774.0, 77229.0, 2116612.0, 1889613.0, 72433.0, 13200.0, 3394.0, 1127.0, 499.0, 206.0, 129.0, 59.0, 35.0, 31.0, 19.0, 19.0, 13.0, 11.0, 6.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.03125, -25.1630859375, -24.294921875, -23.4267578125, -22.55859375, -21.6904296875, -20.822265625, -19.9541015625, -19.0859375, -18.2177734375, -17.349609375, -16.4814453125, -15.61328125, -14.7451171875, -13.876953125, -13.0087890625, -12.140625, -11.2724609375, -10.404296875, -9.5361328125, -8.66796875, -7.7998046875, -6.931640625, -6.0634765625, -5.1953125, -4.3271484375, -3.458984375, -2.5908203125, -1.72265625, -0.8544921875, 0.013671875, 0.8818359375, 1.75, 2.6181640625, 3.486328125, 4.3544921875, 5.22265625, 6.0908203125, 6.958984375, 7.8271484375, 8.6953125, 9.5634765625, 10.431640625, 11.2998046875, 12.16796875, 13.0361328125, 13.904296875, 14.7724609375, 15.640625, 16.5087890625, 17.376953125, 18.2451171875, 19.11328125, 19.9814453125, 20.849609375, 21.7177734375, 22.5859375, 23.4541015625, 24.322265625, 25.1904296875, 26.05859375, 26.9267578125, 27.794921875, 28.6630859375, 29.53125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 13.0, 24.0, 33.0, 58.0, 103.0, 145.0, 184.0, 171.0, 117.0, 65.0, 36.0, 20.0, 11.0, 4.0, 13.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.35810089111328, -81.84437561035156, -79.33065795898438, -76.81693267822266, -74.30321502685547, -71.78948974609375, -69.27577209472656, -66.76204681396484, -64.24832153320312, -61.73460006713867, -59.22087860107422, -56.7071533203125, -54.19343185424805, -51.679710388183594, -49.16598892211914, -46.65226745605469, -44.138545989990234, -41.62482452392578, -39.11110305786133, -36.597381591796875, -34.083656311035156, -31.569934844970703, -29.05621337890625, -26.542490005493164, -24.02876853942871, -21.515047073364258, -19.001323699951172, -16.48760223388672, -13.97387981414795, -11.46015739440918, -8.946435928344727, -6.432712554931641, -3.9189910888671875, -1.405268907546997, 1.1084532737731934, 3.6221752166748047, 6.135897636413574, 8.649620056152344, 11.163341522216797, 13.677064895629883, 16.190786361694336, 18.70450782775879, 21.218231201171875, 23.731952667236328, 26.24567413330078, 28.759397506713867, 31.27311897277832, 33.786842346191406, 36.30056381225586, 38.81428527832031, 41.328006744384766, 43.84172821044922, 46.35545349121094, 48.86917495727539, 51.382896423339844, 53.89662170410156, 56.41033935546875, 58.9240608215332, 61.437782287597656, 63.951507568359375, 66.46522521972656, 68.97895050048828, 71.49267578125, 74.00639343261719, 76.5201187133789]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 6.0, 11.0, 7.0, 5.0, 12.0, 20.0, 15.0, 20.0, 23.0, 21.0, 21.0, 31.0, 42.0, 37.0, 30.0, 37.0, 28.0, 41.0, 45.0, 37.0, 48.0, 33.0, 43.0, 34.0, 40.0, 39.0, 34.0, 26.0, 27.0, 34.0, 25.0, 28.0, 15.0, 17.0, 14.0, 9.0, 5.0, 11.0, 9.0, 5.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0], "bins": [-41.67401123046875, -40.541015625, -39.408016204833984, -38.275020599365234, -37.14202117919922, -36.00902557373047, -34.87602615356445, -33.7430305480957, -32.61003112792969, -31.477033615112305, -30.344036102294922, -29.21103858947754, -28.078041076660156, -26.945043563842773, -25.81204605102539, -24.67905044555664, -23.546052932739258, -22.413055419921875, -21.280057907104492, -20.14706039428711, -19.014062881469727, -17.881065368652344, -16.748069763183594, -15.615071296691895, -14.482073783874512, -13.349076271057129, -12.216078758239746, -11.08308219909668, -9.950084686279297, -8.817087173461914, -7.684089660644531, -6.551092147827148, -5.418092727661133, -4.28509521484375, -3.1520979404449463, -2.0191006660461426, -0.8861031532287598, 0.24689435958862305, 1.3798913955688477, 2.5128889083862305, 3.6458864212036133, 4.778883934020996, 5.911881446838379, 7.0448784828186035, 8.177875518798828, 9.310873031616211, 10.443870544433594, 11.576868057250977, 12.70986557006836, 13.842863082885742, 14.975860595703125, 16.108858108520508, 17.24185562133789, 18.374853134155273, 19.507850646972656, 20.640846252441406, 21.773845672607422, 22.906843185424805, 24.039840698242188, 25.17283821105957, 26.305835723876953, 27.438833236694336, 28.57183074951172, 29.70482635498047, 30.83782386779785]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 3.0, 5.0, 6.0, 11.0, 16.0, 6.0, 14.0, 24.0, 18.0, 17.0, 26.0, 22.0, 31.0, 37.0, 31.0, 34.0, 43.0, 28.0, 49.0, 32.0, 35.0, 40.0, 34.0, 48.0, 37.0, 34.0, 33.0, 37.0, 27.0, 33.0, 25.0, 19.0, 20.0, 25.0, 13.0, 9.0, 9.0, 7.0, 12.0, 8.0, 9.0, 0.0, 4.0, 4.0, 7.0, 2.0, 4.0, 3.0, 0.0, 2.0], "bins": [-5.43359375, -5.27667236328125, -5.1197509765625, -4.96282958984375, -4.805908203125, -4.64898681640625, -4.4920654296875, -4.33514404296875, -4.17822265625, -4.02130126953125, -3.8643798828125, -3.70745849609375, -3.550537109375, -3.39361572265625, -3.2366943359375, -3.07977294921875, -2.9228515625, -2.76593017578125, -2.6090087890625, -2.45208740234375, -2.295166015625, -2.13824462890625, -1.9813232421875, -1.82440185546875, -1.66748046875, -1.51055908203125, -1.3536376953125, -1.19671630859375, -1.039794921875, -0.88287353515625, -0.7259521484375, -0.56903076171875, -0.412109375, -0.25518798828125, -0.0982666015625, 0.05865478515625, 0.215576171875, 0.37249755859375, 0.5294189453125, 0.68634033203125, 0.84326171875, 1.00018310546875, 1.1571044921875, 1.31402587890625, 1.470947265625, 1.62786865234375, 1.7847900390625, 1.94171142578125, 2.0986328125, 2.25555419921875, 2.4124755859375, 2.56939697265625, 2.726318359375, 2.88323974609375, 3.0401611328125, 3.19708251953125, 3.35400390625, 3.51092529296875, 3.6678466796875, 3.82476806640625, 3.981689453125, 4.13861083984375, 4.2955322265625, 4.45245361328125, 4.609375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 4.0, 8.0, 5.0, 13.0, 19.0, 32.0, 29.0, 63.0, 85.0, 113.0, 182.0, 234.0, 405.0, 588.0, 840.0, 1161.0, 1739.0, 2427.0, 3531.0, 5485.0, 8137.0, 12325.0, 19110.0, 31255.0, 51668.0, 91629.0, 172938.0, 259907.0, 163654.0, 86595.0, 49567.0, 29839.0, 18568.0, 11943.0, 8087.0, 5258.0, 3604.0, 2382.0, 1694.0, 1117.0, 743.0, 499.0, 379.0, 201.0, 147.0, 119.0, 79.0, 46.0, 39.0, 23.0, 11.0, 15.0, 10.0, 4.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.213623046875, -0.20637130737304688, -0.19911956787109375, -0.19186782836914062, -0.1846160888671875, -0.17736434936523438, -0.17011260986328125, -0.16286087036132812, -0.155609130859375, -0.14835739135742188, -0.14110565185546875, -0.13385391235351562, -0.1266021728515625, -0.11935043334960938, -0.11209869384765625, -0.10484695434570312, -0.09759521484375, -0.09034347534179688, -0.08309173583984375, -0.07583999633789062, -0.0685882568359375, -0.061336517333984375, -0.05408477783203125, -0.046833038330078125, -0.039581298828125, -0.032329559326171875, -0.02507781982421875, -0.017826080322265625, -0.0105743408203125, -0.003322601318359375, 0.00392913818359375, 0.011180877685546875, 0.0184326171875, 0.025684356689453125, 0.03293609619140625, 0.040187835693359375, 0.0474395751953125, 0.054691314697265625, 0.06194305419921875, 0.06919479370117188, 0.076446533203125, 0.08369827270507812, 0.09095001220703125, 0.09820175170898438, 0.1054534912109375, 0.11270523071289062, 0.11995697021484375, 0.12720870971679688, 0.13446044921875, 0.14171218872070312, 0.14896392822265625, 0.15621566772460938, 0.1634674072265625, 0.17071914672851562, 0.17797088623046875, 0.18522262573242188, 0.192474365234375, 0.19972610473632812, 0.20697784423828125, 0.21422958374023438, 0.2214813232421875, 0.22873306274414062, 0.23598480224609375, 0.24323654174804688, 0.25048828125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 8.0, 13.0, 8.0, 6.0, 10.0, 7.0, 9.0, 21.0, 27.0, 27.0, 28.0, 25.0, 31.0, 36.0, 44.0, 33.0, 41.0, 30.0, 47.0, 39.0, 1053.0, 46.0, 40.0, 35.0, 41.0, 39.0, 35.0, 20.0, 21.0, 21.0, 15.0, 26.0, 23.0, 16.0, 11.0, 14.0, 12.0, 12.0, 8.0, 7.0, 11.0, 4.0, 6.0, 0.0, 5.0, 2.0, 4.0, 5.0, 4.0, 1.0, 3.0], "bins": [-3.345703125, -3.246337890625, -3.14697265625, -3.047607421875, -2.9482421875, -2.848876953125, -2.74951171875, -2.650146484375, -2.55078125, -2.451416015625, -2.35205078125, -2.252685546875, -2.1533203125, -2.053955078125, -1.95458984375, -1.855224609375, -1.755859375, -1.656494140625, -1.55712890625, -1.457763671875, -1.3583984375, -1.259033203125, -1.15966796875, -1.060302734375, -0.9609375, -0.861572265625, -0.76220703125, -0.662841796875, -0.5634765625, -0.464111328125, -0.36474609375, -0.265380859375, -0.166015625, -0.066650390625, 0.03271484375, 0.132080078125, 0.2314453125, 0.330810546875, 0.43017578125, 0.529541015625, 0.62890625, 0.728271484375, 0.82763671875, 0.927001953125, 1.0263671875, 1.125732421875, 1.22509765625, 1.324462890625, 1.423828125, 1.523193359375, 1.62255859375, 1.721923828125, 1.8212890625, 1.920654296875, 2.02001953125, 2.119384765625, 2.21875, 2.318115234375, 2.41748046875, 2.516845703125, 2.6162109375, 2.715576171875, 2.81494140625, 2.914306640625, 3.013671875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 13.0, 21.0, 33.0, 51.0, 69.0, 74.0, 119.0, 142.0, 223.0, 295.0, 405.0, 583.0, 789.0, 1103.0, 1566.0, 2249.0, 3185.0, 4541.0, 6935.0, 10453.0, 15613.0, 24554.0, 39381.0, 63588.0, 104622.0, 174453.0, 1270041.0, 141192.0, 85356.0, 51594.0, 32360.0, 20428.0, 13262.0, 8582.0, 5871.0, 3928.0, 2775.0, 1885.0, 1331.0, 958.0, 692.0, 500.0, 352.0, 275.0, 201.0, 144.0, 96.0, 83.0, 42.0, 40.0, 25.0, 14.0, 17.0, 8.0, 11.0, 4.0, 2.0, 3.0], "bins": [-0.147705078125, -0.14313125610351562, -0.13855743408203125, -0.13398361206054688, -0.1294097900390625, -0.12483596801757812, -0.12026214599609375, -0.11568832397460938, -0.111114501953125, -0.10654067993164062, -0.10196685791015625, -0.09739303588867188, -0.0928192138671875, -0.08824539184570312, -0.08367156982421875, -0.07909774780273438, -0.07452392578125, -0.06995010375976562, -0.06537628173828125, -0.060802459716796875, -0.0562286376953125, -0.051654815673828125, -0.04708099365234375, -0.042507171630859375, -0.037933349609375, -0.033359527587890625, -0.02878570556640625, -0.024211883544921875, -0.0196380615234375, -0.015064239501953125, -0.01049041748046875, -0.005916595458984375, -0.0013427734375, 0.003231048583984375, 0.00780487060546875, 0.012378692626953125, 0.0169525146484375, 0.021526336669921875, 0.02610015869140625, 0.030673980712890625, 0.035247802734375, 0.039821624755859375, 0.04439544677734375, 0.048969268798828125, 0.0535430908203125, 0.058116912841796875, 0.06269073486328125, 0.06726455688476562, 0.07183837890625, 0.07641220092773438, 0.08098602294921875, 0.08555984497070312, 0.0901336669921875, 0.09470748901367188, 0.09928131103515625, 0.10385513305664062, 0.108428955078125, 0.11300277709960938, 0.11757659912109375, 0.12215042114257812, 0.1267242431640625, 0.13129806518554688, 0.13587188720703125, 0.14044570922851562, 0.14501953125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 2.0, 6.0, 8.0, 6.0, 10.0, 7.0, 16.0, 26.0, 27.0, 37.0, 49.0, 51.0, 100.0, 122.0, 133.0, 113.0, 71.0, 51.0, 29.0, 25.0, 19.0, 17.0, 14.0, 16.0, 10.0, 4.0, 9.0, 8.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026345252990722656, -0.000254753977060318, -0.0002460554242134094, -0.00023735687136650085, -0.00022865831851959229, -0.00021995976567268372, -0.00021126121282577515, -0.00020256265997886658, -0.000193864107131958, -0.00018516555428504944, -0.00017646700143814087, -0.0001677684485912323, -0.00015906989574432373, -0.00015037134289741516, -0.0001416727900505066, -0.00013297423720359802, -0.00012427568435668945, -0.00011557713150978088, -0.00010687857866287231, -9.818002581596375e-05, -8.948147296905518e-05, -8.07829201221466e-05, -7.208436727523804e-05, -6.338581442832947e-05, -5.46872615814209e-05, -4.598870873451233e-05, -3.729015588760376e-05, -2.859160304069519e-05, -1.989305019378662e-05, -1.1194497346878052e-05, -2.4959444999694824e-06, 6.202608346939087e-06, 1.4901161193847656e-05, 2.3599714040756226e-05, 3.2298266887664795e-05, 4.0996819734573364e-05, 4.9695372581481934e-05, 5.83939254283905e-05, 6.709247827529907e-05, 7.579103112220764e-05, 8.448958396911621e-05, 9.318813681602478e-05, 0.00010188668966293335, 0.00011058524250984192, 0.00011928379535675049, 0.00012798234820365906, 0.00013668090105056763, 0.0001453794538974762, 0.00015407800674438477, 0.00016277655959129333, 0.0001714751124382019, 0.00018017366528511047, 0.00018887221813201904, 0.0001975707709789276, 0.00020626932382583618, 0.00021496787667274475, 0.00022366642951965332, 0.0002323649823665619, 0.00024106353521347046, 0.00024976208806037903, 0.0002584606409072876, 0.00026715919375419617, 0.00027585774660110474, 0.0002845562994480133, 0.0002932548522949219]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 6.0, 12.0, 11.0, 14.0, 28.0, 21.0, 41.0, 59.0, 75.0, 141.0, 307.0, 1922.0, 137163.0, 902379.0, 5391.0, 460.0, 172.0, 96.0, 66.0, 54.0, 27.0, 29.0, 11.0, 22.0, 6.0, 5.0, 6.0, 8.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00543975830078125, -0.005285024642944336, -0.005130290985107422, -0.004975557327270508, -0.004820823669433594, -0.00466609001159668, -0.004511356353759766, -0.0043566226959228516, -0.0042018890380859375, -0.0040471553802490234, -0.0038924217224121094, -0.0037376880645751953, -0.0035829544067382812, -0.003428220748901367, -0.003273487091064453, -0.003118753433227539, -0.002964019775390625, -0.002809286117553711, -0.002654552459716797, -0.002499818801879883, -0.0023450851440429688, -0.0021903514862060547, -0.0020356178283691406, -0.0018808841705322266, -0.0017261505126953125, -0.0015714168548583984, -0.0014166831970214844, -0.0012619495391845703, -0.0011072158813476562, -0.0009524822235107422, -0.0007977485656738281, -0.0006430149078369141, -0.00048828125, -0.00033354759216308594, -0.00017881393432617188, -2.4080276489257812e-05, 0.00013065338134765625, 0.0002853870391845703, 0.0004401206970214844, 0.0005948543548583984, 0.0007495880126953125, 0.0009043216705322266, 0.0010590553283691406, 0.0012137889862060547, 0.0013685226440429688, 0.0015232563018798828, 0.0016779899597167969, 0.001832723617553711, 0.001987457275390625, 0.002142190933227539, 0.002296924591064453, 0.002451658248901367, 0.0026063919067382812, 0.0027611255645751953, 0.0029158592224121094, 0.0030705928802490234, 0.0032253265380859375, 0.0033800601959228516, 0.0035347938537597656, 0.0036895275115966797, 0.0038442611694335938, 0.003998994827270508, 0.004153728485107422, 0.004308462142944336, 0.00446319580078125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 16.0, 43.0, 99.0, 201.0, 316.0, 187.0, 89.0, 40.0, 12.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00045145832700654864, -0.0004383531922940165, -0.0004252480575814843, -0.0004121429519727826, -0.00039903781726025045, -0.0003859326825477183, -0.0003728275478351861, -0.00035972241312265396, -0.00034661730751395226, -0.0003335121728014201, -0.00032040703808888793, -0.0003073019324801862, -0.00029419679776765406, -0.0002810916630551219, -0.00026798652834258974, -0.0002548813936300576, -0.0002417762589175254, -0.00022867112420499325, -0.00021556600404437631, -0.00020246086933184415, -0.00018935574917122722, -0.00017625061445869505, -0.0001631454797461629, -0.00015004034503363073, -0.0001369352248730138, -0.00012383009016048163, -0.0001107249699998647, -9.761983528733253e-05, -8.451470785075799e-05, -7.140958041418344e-05, -5.8304445701651275e-05, -4.519931826507673e-05, -3.209416172467172e-05, -1.898903246910777e-05, -5.883903213543817e-06, 7.221227861009538e-06, 2.0326355297584087e-05, 3.3431482734158635e-05, 4.65366174466908e-05, 5.9641744883265346e-05, 7.27468723198399e-05, 8.585199975641444e-05, 9.895712719298899e-05, 0.00011206226190552115, 0.00012516739661805332, 0.00013827251677867025, 0.00015137765149120241, 0.00016448277165181935, 0.0001775879063643515, 0.00019069304107688367, 0.0002037981612375006, 0.00021690329595003277, 0.0002300084161106497, 0.00024311355082318187, 0.00025621868553571403, 0.0002693238202482462, 0.0002824289258569479, 0.00029553406056948006, 0.0003086391952820122, 0.00032174430089071393, 0.0003348494356032461, 0.00034795457031577826, 0.0003610597050283104, 0.0003741648397408426, 0.00038726997445337474]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 0.0, 0.0, 3.0, 4.0, 8.0, 6.0, 6.0, 6.0, 10.0, 8.0, 18.0, 12.0, 20.0, 16.0, 26.0, 17.0, 35.0, 24.0, 26.0, 30.0, 31.0, 38.0, 36.0, 32.0, 41.0, 36.0, 34.0, 34.0, 40.0, 31.0, 37.0, 30.0, 27.0, 29.0, 29.0, 18.0, 28.0, 32.0, 26.0, 17.0, 16.0, 16.0, 15.0, 10.0, 5.0, 11.0, 5.0, 5.0, 2.0, 4.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0], "bins": [-9.5367431640625e-05, -9.240582585334778e-05, -8.944422006607056e-05, -8.648261427879333e-05, -8.352100849151611e-05, -8.055940270423889e-05, -7.759779691696167e-05, -7.463619112968445e-05, -7.167458534240723e-05, -6.871297955513e-05, -6.575137376785278e-05, -6.278976798057556e-05, -5.982816219329834e-05, -5.686655640602112e-05, -5.3904950618743896e-05, -5.0943344831466675e-05, -4.798173904418945e-05, -4.502013325691223e-05, -4.205852746963501e-05, -3.909692168235779e-05, -3.6135315895080566e-05, -3.3173710107803345e-05, -3.0212104320526123e-05, -2.72504985332489e-05, -2.428889274597168e-05, -2.1327286958694458e-05, -1.8365681171417236e-05, -1.5404075384140015e-05, -1.2442469596862793e-05, -9.480863809585571e-06, -6.51925802230835e-06, -3.557652235031128e-06, -5.960464477539062e-07, 2.3655593395233154e-06, 5.327165126800537e-06, 8.288770914077759e-06, 1.125037670135498e-05, 1.4211982488632202e-05, 1.7173588275909424e-05, 2.0135194063186646e-05, 2.3096799850463867e-05, 2.605840563774109e-05, 2.902001142501831e-05, 3.198161721229553e-05, 3.4943222999572754e-05, 3.7904828786849976e-05, 4.08664345741272e-05, 4.382804036140442e-05, 4.678964614868164e-05, 4.975125193595886e-05, 5.2712857723236084e-05, 5.5674463510513306e-05, 5.863606929779053e-05, 6.159767508506775e-05, 6.455928087234497e-05, 6.752088665962219e-05, 7.048249244689941e-05, 7.344409823417664e-05, 7.640570402145386e-05, 7.936730980873108e-05, 8.23289155960083e-05, 8.529052138328552e-05, 8.825212717056274e-05, 9.121373295783997e-05, 9.417533874511719e-05]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 2.0, 8.0, 3.0, 5.0, 6.0, 11.0, 16.0, 6.0, 14.0, 24.0, 18.0, 17.0, 26.0, 22.0, 31.0, 37.0, 31.0, 34.0, 43.0, 28.0, 49.0, 32.0, 35.0, 40.0, 34.0, 48.0, 37.0, 34.0, 33.0, 37.0, 27.0, 33.0, 25.0, 19.0, 20.0, 25.0, 13.0, 9.0, 9.0, 7.0, 12.0, 8.0, 9.0, 0.0, 4.0, 4.0, 7.0, 2.0, 4.0, 3.0, 0.0, 2.0], "bins": [-5.43359375, -5.27667236328125, -5.1197509765625, -4.96282958984375, -4.805908203125, -4.64898681640625, -4.4920654296875, -4.33514404296875, -4.17822265625, -4.02130126953125, -3.8643798828125, -3.70745849609375, -3.550537109375, -3.39361572265625, -3.2366943359375, -3.07977294921875, -2.9228515625, -2.76593017578125, -2.6090087890625, -2.45208740234375, -2.295166015625, -2.13824462890625, -1.9813232421875, -1.82440185546875, -1.66748046875, -1.51055908203125, -1.3536376953125, -1.19671630859375, -1.039794921875, -0.88287353515625, -0.7259521484375, -0.56903076171875, -0.412109375, -0.25518798828125, -0.0982666015625, 0.05865478515625, 0.215576171875, 0.37249755859375, 0.5294189453125, 0.68634033203125, 0.84326171875, 1.00018310546875, 1.1571044921875, 1.31402587890625, 1.470947265625, 1.62786865234375, 1.7847900390625, 1.94171142578125, 2.0986328125, 2.25555419921875, 2.4124755859375, 2.56939697265625, 2.726318359375, 2.88323974609375, 3.0401611328125, 3.19708251953125, 3.35400390625, 3.51092529296875, 3.6678466796875, 3.82476806640625, 3.981689453125, 4.13861083984375, 4.2955322265625, 4.45245361328125, 4.609375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 6.0, 7.0, 13.0, 16.0, 15.0, 32.0, 38.0, 72.0, 112.0, 178.0, 357.0, 645.0, 1195.0, 2636.0, 5807.0, 13843.0, 37781.0, 130268.0, 514531.0, 244439.0, 60692.0, 20409.0, 8318.0, 3592.0, 1657.0, 790.0, 467.0, 222.0, 158.0, 87.0, 43.0, 43.0, 29.0, 12.0, 14.0, 7.0, 7.0, 8.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.4609375, -10.16796875, -9.875, -9.58203125, -9.2890625, -8.99609375, -8.703125, -8.41015625, -8.1171875, -7.82421875, -7.53125, -7.23828125, -6.9453125, -6.65234375, -6.359375, -6.06640625, -5.7734375, -5.48046875, -5.1875, -4.89453125, -4.6015625, -4.30859375, -4.015625, -3.72265625, -3.4296875, -3.13671875, -2.84375, -2.55078125, -2.2578125, -1.96484375, -1.671875, -1.37890625, -1.0859375, -0.79296875, -0.5, -0.20703125, 0.0859375, 0.37890625, 0.671875, 0.96484375, 1.2578125, 1.55078125, 1.84375, 2.13671875, 2.4296875, 2.72265625, 3.015625, 3.30859375, 3.6015625, 3.89453125, 4.1875, 4.48046875, 4.7734375, 5.06640625, 5.359375, 5.65234375, 5.9453125, 6.23828125, 6.53125, 6.82421875, 7.1171875, 7.41015625, 7.703125, 7.99609375, 8.2890625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 9.0, 3.0, 5.0, 6.0, 5.0, 12.0, 17.0, 15.0, 17.0, 24.0, 23.0, 36.0, 38.0, 57.0, 53.0, 61.0, 80.0, 143.0, 1432.0, 391.0, 162.0, 80.0, 59.0, 38.0, 41.0, 38.0, 32.0, 21.0, 25.0, 27.0, 20.0, 25.0, 11.0, 7.0, 8.0, 4.0, 11.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.984375, -21.356201171875, -20.72802734375, -20.099853515625, -19.4716796875, -18.843505859375, -18.21533203125, -17.587158203125, -16.958984375, -16.330810546875, -15.70263671875, -15.074462890625, -14.4462890625, -13.818115234375, -13.18994140625, -12.561767578125, -11.93359375, -11.305419921875, -10.67724609375, -10.049072265625, -9.4208984375, -8.792724609375, -8.16455078125, -7.536376953125, -6.908203125, -6.280029296875, -5.65185546875, -5.023681640625, -4.3955078125, -3.767333984375, -3.13916015625, -2.510986328125, -1.8828125, -1.254638671875, -0.62646484375, 0.001708984375, 0.6298828125, 1.258056640625, 1.88623046875, 2.514404296875, 3.142578125, 3.770751953125, 4.39892578125, 5.027099609375, 5.6552734375, 6.283447265625, 6.91162109375, 7.539794921875, 8.16796875, 8.796142578125, 9.42431640625, 10.052490234375, 10.6806640625, 11.308837890625, 11.93701171875, 12.565185546875, 13.193359375, 13.821533203125, 14.44970703125, 15.077880859375, 15.7060546875, 16.334228515625, 16.96240234375, 17.590576171875, 18.21875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 15.0, 16.0, 18.0, 24.0, 31.0, 49.0, 73.0, 114.0, 146.0, 280.0, 507.0, 1514.0, 11975.0, 2929617.0, 194892.0, 4427.0, 968.0, 421.0, 214.0, 128.0, 73.0, 46.0, 39.0, 31.0, 24.0, 22.0, 12.0, 11.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.6875, -62.7744140625, -60.861328125, -58.9482421875, -57.03515625, -55.1220703125, -53.208984375, -51.2958984375, -49.3828125, -47.4697265625, -45.556640625, -43.6435546875, -41.73046875, -39.8173828125, -37.904296875, -35.9912109375, -34.078125, -32.1650390625, -30.251953125, -28.3388671875, -26.42578125, -24.5126953125, -22.599609375, -20.6865234375, -18.7734375, -16.8603515625, -14.947265625, -13.0341796875, -11.12109375, -9.2080078125, -7.294921875, -5.3818359375, -3.46875, -1.5556640625, 0.357421875, 2.2705078125, 4.18359375, 6.0966796875, 8.009765625, 9.9228515625, 11.8359375, 13.7490234375, 15.662109375, 17.5751953125, 19.48828125, 21.4013671875, 23.314453125, 25.2275390625, 27.140625, 29.0537109375, 30.966796875, 32.8798828125, 34.79296875, 36.7060546875, 38.619140625, 40.5322265625, 42.4453125, 44.3583984375, 46.271484375, 48.1845703125, 50.09765625, 52.0107421875, 53.923828125, 55.8369140625, 57.75]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 56.0, 909.0, 54.0], "bins": [-819.0232543945312, -805.9126586914062, -792.8020629882812, -779.69140625, -766.580810546875, -753.47021484375, -740.359619140625, -727.2490234375, -714.138427734375, -701.02783203125, -687.917236328125, -674.806640625, -661.6959838867188, -648.5853881835938, -635.4747924804688, -622.3641967773438, -609.2535400390625, -596.1429443359375, -583.0323486328125, -569.9217529296875, -556.8110961914062, -543.7005004882812, -530.5899047851562, -517.4793090820312, -504.36871337890625, -491.25811767578125, -478.1474914550781, -465.0368957519531, -451.9263000488281, -438.815673828125, -425.705078125, -412.594482421875, -399.4838562011719, -386.3732604980469, -373.26263427734375, -360.15203857421875, -347.04144287109375, -333.9308166503906, -320.8202209472656, -307.7095947265625, -294.5990295410156, -281.4884338378906, -268.3778076171875, -255.2672119140625, -242.15660095214844, -229.04598999023438, -215.93539428710938, -202.8247833251953, -189.71417236328125, -176.6035614013672, -163.4929656982422, -150.38235473632812, -137.27174377441406, -124.16114044189453, -111.050537109375, -97.93992614746094, -84.82931518554688, -71.71871185302734, -58.60810089111328, -45.49749755859375, -32.38689041137695, -19.276283264160156, -6.165679931640625, 6.9449310302734375, 20.055532455444336]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 4.0, 8.0, 7.0, 9.0, 13.0, 21.0, 18.0, 21.0, 27.0, 22.0, 21.0, 25.0, 24.0, 34.0, 30.0, 36.0, 30.0, 45.0, 47.0, 36.0, 48.0, 28.0, 45.0, 33.0, 33.0, 47.0, 24.0, 36.0, 28.0, 25.0, 34.0, 17.0, 30.0, 12.0, 13.0, 8.0, 5.0, 12.0, 11.0, 10.0, 6.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.331886291503906, -39.768226623535156, -38.20457077026367, -36.64091110229492, -35.07725524902344, -33.51359558105469, -31.94993782043457, -30.386280059814453, -28.822620391845703, -27.258962631225586, -25.69530487060547, -24.13164520263672, -22.5679874420166, -21.004329681396484, -19.440671920776367, -17.87701416015625, -16.313356399536133, -14.749698638916016, -13.186039924621582, -11.622382164001465, -10.058723449707031, -8.495065689086914, -6.931407928466797, -5.367749214172363, -3.804091453552246, -2.2404332160949707, -0.6767752170562744, 0.8868827819824219, 2.4505410194396973, 4.014199256896973, 5.57785701751709, 7.141515731811523, 8.70517349243164, 10.268831253051758, 11.832489967346191, 13.396147727966309, 14.959806442260742, 16.52346420288086, 18.087121963500977, 19.650779724121094, 21.214439392089844, 22.77809715270996, 24.341754913330078, 25.905414581298828, 27.469072341918945, 29.032730102539062, 30.59638786315918, 32.1600456237793, 33.72370147705078, 35.28736114501953, 36.851016998291016, 38.414676666259766, 39.97833251953125, 41.5419921875, 43.10565185546875, 44.669307708740234, 46.232967376708984, 47.796627044677734, 49.36028289794922, 50.92394256591797, 52.48759841918945, 54.0512580871582, 55.61491394042969, 57.17857360839844, 58.74223327636719]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 3.0, 4.0, 6.0, 12.0, 3.0, 12.0, 8.0, 10.0, 18.0, 26.0, 21.0, 16.0, 26.0, 32.0, 35.0, 30.0, 39.0, 35.0, 37.0, 35.0, 42.0, 45.0, 33.0, 33.0, 40.0, 31.0, 41.0, 44.0, 27.0, 34.0, 25.0, 27.0, 24.0, 19.0, 17.0, 20.0, 11.0, 12.0, 11.0, 8.0, 7.0, 9.0, 5.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.6640625, -5.48779296875, -5.3115234375, -5.13525390625, -4.958984375, -4.78271484375, -4.6064453125, -4.43017578125, -4.25390625, -4.07763671875, -3.9013671875, -3.72509765625, -3.548828125, -3.37255859375, -3.1962890625, -3.02001953125, -2.84375, -2.66748046875, -2.4912109375, -2.31494140625, -2.138671875, -1.96240234375, -1.7861328125, -1.60986328125, -1.43359375, -1.25732421875, -1.0810546875, -0.90478515625, -0.728515625, -0.55224609375, -0.3759765625, -0.19970703125, -0.0234375, 0.15283203125, 0.3291015625, 0.50537109375, 0.681640625, 0.85791015625, 1.0341796875, 1.21044921875, 1.38671875, 1.56298828125, 1.7392578125, 1.91552734375, 2.091796875, 2.26806640625, 2.4443359375, 2.62060546875, 2.796875, 2.97314453125, 3.1494140625, 3.32568359375, 3.501953125, 3.67822265625, 3.8544921875, 4.03076171875, 4.20703125, 4.38330078125, 4.5595703125, 4.73583984375, 4.912109375, 5.08837890625, 5.2646484375, 5.44091796875, 5.6171875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 7.0, 8.0, 8.0, 13.0, 17.0, 23.0, 35.0, 40.0, 71.0, 100.0, 129.0, 220.0, 390.0, 723.0, 1413.0, 3109.0, 8342.0, 26932.0, 240383.0, 2953489.0, 885046.0, 51883.0, 13278.0, 4496.0, 1909.0, 950.0, 487.0, 236.0, 169.0, 105.0, 69.0, 49.0, 30.0, 19.0, 17.0, 11.0, 21.0, 6.0, 11.0, 7.0, 7.0, 5.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.046875, -18.481689453125, -17.91650390625, -17.351318359375, -16.7861328125, -16.220947265625, -15.65576171875, -15.090576171875, -14.525390625, -13.960205078125, -13.39501953125, -12.829833984375, -12.2646484375, -11.699462890625, -11.13427734375, -10.569091796875, -10.00390625, -9.438720703125, -8.87353515625, -8.308349609375, -7.7431640625, -7.177978515625, -6.61279296875, -6.047607421875, -5.482421875, -4.917236328125, -4.35205078125, -3.786865234375, -3.2216796875, -2.656494140625, -2.09130859375, -1.526123046875, -0.9609375, -0.395751953125, 0.16943359375, 0.734619140625, 1.2998046875, 1.864990234375, 2.43017578125, 2.995361328125, 3.560546875, 4.125732421875, 4.69091796875, 5.256103515625, 5.8212890625, 6.386474609375, 6.95166015625, 7.516845703125, 8.08203125, 8.647216796875, 9.21240234375, 9.777587890625, 10.3427734375, 10.907958984375, 11.47314453125, 12.038330078125, 12.603515625, 13.168701171875, 13.73388671875, 14.299072265625, 14.8642578125, 15.429443359375, 15.99462890625, 16.559814453125, 17.125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 11.0, 11.0, 19.0, 29.0, 37.0, 50.0, 68.0, 99.0, 191.0, 305.0, 521.0, 736.0, 695.0, 457.0, 323.0, 147.0, 121.0, 69.0, 46.0, 27.0, 28.0, 21.0, 17.0, 12.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.015625, -13.47607421875, -12.9365234375, -12.39697265625, -11.857421875, -11.31787109375, -10.7783203125, -10.23876953125, -9.69921875, -9.15966796875, -8.6201171875, -8.08056640625, -7.541015625, -7.00146484375, -6.4619140625, -5.92236328125, -5.3828125, -4.84326171875, -4.3037109375, -3.76416015625, -3.224609375, -2.68505859375, -2.1455078125, -1.60595703125, -1.06640625, -0.52685546875, 0.0126953125, 0.55224609375, 1.091796875, 1.63134765625, 2.1708984375, 2.71044921875, 3.25, 3.78955078125, 4.3291015625, 4.86865234375, 5.408203125, 5.94775390625, 6.4873046875, 7.02685546875, 7.56640625, 8.10595703125, 8.6455078125, 9.18505859375, 9.724609375, 10.26416015625, 10.8037109375, 11.34326171875, 11.8828125, 12.42236328125, 12.9619140625, 13.50146484375, 14.041015625, 14.58056640625, 15.1201171875, 15.65966796875, 16.19921875, 16.73876953125, 17.2783203125, 17.81787109375, 18.357421875, 18.89697265625, 19.4365234375, 19.97607421875, 20.515625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 6.0, 15.0, 13.0, 26.0, 34.0, 36.0, 64.0, 122.0, 253.0, 667.0, 3677.0, 52307.0, 3961992.0, 166717.0, 6567.0, 1029.0, 350.0, 150.0, 83.0, 42.0, 41.0, 29.0, 15.0, 11.0, 9.0, 1.0, 6.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-69.375, -67.57958984375, -65.7841796875, -63.98876953125, -62.193359375, -60.39794921875, -58.6025390625, -56.80712890625, -55.01171875, -53.21630859375, -51.4208984375, -49.62548828125, -47.830078125, -46.03466796875, -44.2392578125, -42.44384765625, -40.6484375, -38.85302734375, -37.0576171875, -35.26220703125, -33.466796875, -31.67138671875, -29.8759765625, -28.08056640625, -26.28515625, -24.48974609375, -22.6943359375, -20.89892578125, -19.103515625, -17.30810546875, -15.5126953125, -13.71728515625, -11.921875, -10.12646484375, -8.3310546875, -6.53564453125, -4.740234375, -2.94482421875, -1.1494140625, 0.64599609375, 2.44140625, 4.23681640625, 6.0322265625, 7.82763671875, 9.623046875, 11.41845703125, 13.2138671875, 15.00927734375, 16.8046875, 18.60009765625, 20.3955078125, 22.19091796875, 23.986328125, 25.78173828125, 27.5771484375, 29.37255859375, 31.16796875, 32.96337890625, 34.7587890625, 36.55419921875, 38.349609375, 40.14501953125, 41.9404296875, 43.73583984375, 45.53125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 11.0, 25.0, 50.0, 64.0, 141.0, 202.0, 206.0, 149.0, 90.0, 47.0, 9.0, 9.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.82642364501953, -76.34666442871094, -72.86690521240234, -69.38714599609375, -65.90738677978516, -62.42762756347656, -58.947872161865234, -55.46811294555664, -51.98835372924805, -48.50859451293945, -45.02883529663086, -41.54907989501953, -38.06932067871094, -34.589561462402344, -31.10980224609375, -27.630043029785156, -24.150283813476562, -20.67052459716797, -17.190765380859375, -13.711008071899414, -10.23124885559082, -6.751489639282227, -3.2717323303222656, 0.20802688598632812, 3.687786102294922, 7.167544841766357, 10.647303581237793, 14.12706184387207, 17.606821060180664, 21.086580276489258, 24.56633758544922, 28.046096801757812, 31.525863647460938, 35.00562286376953, 38.485382080078125, 41.96514129638672, 45.44490051269531, 48.924659729003906, 52.404415130615234, 55.88417434692383, 59.36393356323242, 62.843692779541016, 66.32344818115234, 69.80320739746094, 73.28296661376953, 76.76272583007812, 80.24248504638672, 83.72224426269531, 87.2020034790039, 90.6817626953125, 94.1615219116211, 97.64128112792969, 101.12104034423828, 104.60079956054688, 108.08055114746094, 111.56031799316406, 115.04006958007812, 118.51982879638672, 121.99958801269531, 125.4793472290039, 128.9591064453125, 132.43885803222656, 135.9186248779297, 139.39837646484375, 142.87814331054688]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 1.0, 2.0, 2.0, 5.0, 9.0, 13.0, 10.0, 11.0, 8.0, 14.0, 17.0, 16.0, 22.0, 29.0, 19.0, 28.0, 23.0, 33.0, 31.0, 45.0, 31.0, 36.0, 39.0, 36.0, 51.0, 35.0, 46.0, 47.0, 24.0, 18.0, 35.0, 25.0, 23.0, 30.0, 23.0, 28.0, 19.0, 17.0, 19.0, 15.0, 12.0, 10.0, 15.0, 9.0, 3.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.98271560668945, -35.75434875488281, -34.525978088378906, -33.297611236572266, -32.069244384765625, -30.84087371826172, -29.612506866455078, -28.384138107299805, -27.15576934814453, -25.927400588989258, -24.699033737182617, -23.470664978027344, -22.24229621887207, -21.013927459716797, -19.785560607910156, -18.557191848754883, -17.328824996948242, -16.10045623779297, -14.872088432312012, -13.643720626831055, -12.415351867675781, -11.186984062194824, -9.958616256713867, -8.730247497558594, -7.501879692077637, -6.2735114097595215, -5.045143127441406, -3.816775321960449, -2.588407039642334, -1.3600387573242188, -0.13167095184326172, 1.0966978073120117, 2.3250656127929688, 3.553433895111084, 4.781802177429199, 6.010169982910156, 7.2385382652282715, 8.466906547546387, 9.695274353027344, 10.923643112182617, 12.152010917663574, 13.380378723144531, 14.608747482299805, 15.837115287780762, 17.06548309326172, 18.293851852416992, 19.522220611572266, 20.750587463378906, 21.97895622253418, 23.207324981689453, 24.435691833496094, 25.664060592651367, 26.89242935180664, 28.12079620361328, 29.349164962768555, 30.577533721923828, 31.80590057373047, 33.03426742553711, 34.262638092041016, 35.491004943847656, 36.7193717956543, 37.9477424621582, 39.176109313964844, 40.40447998046875, 41.63284683227539]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 9.0, 6.0, 17.0, 13.0, 19.0, 17.0, 17.0, 23.0, 25.0, 28.0, 34.0, 31.0, 40.0, 54.0, 55.0, 47.0, 51.0, 52.0, 46.0, 57.0, 32.0, 37.0, 35.0, 41.0, 39.0, 21.0, 27.0, 23.0, 22.0, 15.0, 17.0, 8.0, 3.0, 14.0, 2.0, 7.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.3299560546875, -6.120849609375, -5.9117431640625, -5.70263671875, -5.4935302734375, -5.284423828125, -5.0753173828125, -4.8662109375, -4.6571044921875, -4.447998046875, -4.2388916015625, -4.02978515625, -3.8206787109375, -3.611572265625, -3.4024658203125, -3.193359375, -2.9842529296875, -2.775146484375, -2.5660400390625, -2.35693359375, -2.1478271484375, -1.938720703125, -1.7296142578125, -1.5205078125, -1.3114013671875, -1.102294921875, -0.8931884765625, -0.68408203125, -0.4749755859375, -0.265869140625, -0.0567626953125, 0.15234375, 0.3614501953125, 0.570556640625, 0.7796630859375, 0.98876953125, 1.1978759765625, 1.406982421875, 1.6160888671875, 1.8251953125, 2.0343017578125, 2.243408203125, 2.4525146484375, 2.66162109375, 2.8707275390625, 3.079833984375, 3.2889404296875, 3.498046875, 3.7071533203125, 3.916259765625, 4.1253662109375, 4.33447265625, 4.5435791015625, 4.752685546875, 4.9617919921875, 5.1708984375, 5.3800048828125, 5.589111328125, 5.7982177734375, 6.00732421875, 6.2164306640625, 6.425537109375, 6.6346435546875, 6.84375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 6.0, 10.0, 15.0, 27.0, 27.0, 40.0, 88.0, 139.0, 216.0, 340.0, 556.0, 960.0, 1525.0, 2656.0, 4511.0, 7780.0, 13707.0, 24668.0, 44747.0, 88104.0, 204865.0, 339651.0, 156695.0, 70828.0, 37687.0, 20722.0, 11627.0, 6723.0, 4026.0, 2237.0, 1286.0, 788.0, 513.0, 286.0, 175.0, 105.0, 75.0, 49.0, 34.0, 23.0, 18.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.345703125, -0.3353385925292969, -0.32497406005859375, -0.3146095275878906, -0.3042449951171875, -0.2938804626464844, -0.28351593017578125, -0.2731513977050781, -0.262786865234375, -0.2524223327636719, -0.24205780029296875, -0.23169326782226562, -0.2213287353515625, -0.21096420288085938, -0.20059967041015625, -0.19023513793945312, -0.17987060546875, -0.16950607299804688, -0.15914154052734375, -0.14877700805664062, -0.1384124755859375, -0.12804794311523438, -0.11768341064453125, -0.10731887817382812, -0.096954345703125, -0.08658981323242188, -0.07622528076171875, -0.06586074829101562, -0.0554962158203125, -0.045131683349609375, -0.03476715087890625, -0.024402618408203125, -0.0140380859375, -0.003673553466796875, 0.00669097900390625, 0.017055511474609375, 0.0274200439453125, 0.037784576416015625, 0.04814910888671875, 0.058513641357421875, 0.068878173828125, 0.07924270629882812, 0.08960723876953125, 0.09997177124023438, 0.1103363037109375, 0.12070083618164062, 0.13106536865234375, 0.14142990112304688, 0.15179443359375, 0.16215896606445312, 0.17252349853515625, 0.18288803100585938, 0.1932525634765625, 0.20361709594726562, 0.21398162841796875, 0.22434616088867188, 0.234710693359375, 0.24507522583007812, 0.25543975830078125, 0.2658042907714844, 0.2761688232421875, 0.2865333557128906, 0.29689788818359375, 0.3072624206542969, 0.317626953125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 9.0, 5.0, 4.0, 4.0, 4.0, 17.0, 12.0, 14.0, 18.0, 18.0, 15.0, 23.0, 26.0, 25.0, 30.0, 25.0, 28.0, 27.0, 40.0, 37.0, 44.0, 43.0, 1070.0, 31.0, 36.0, 34.0, 38.0, 39.0, 48.0, 25.0, 30.0, 32.0, 25.0, 28.0, 26.0, 26.0, 11.0, 14.0, 9.0, 9.0, 13.0, 9.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-4.06640625, -3.95172119140625, -3.8370361328125, -3.72235107421875, -3.607666015625, -3.49298095703125, -3.3782958984375, -3.26361083984375, -3.14892578125, -3.03424072265625, -2.9195556640625, -2.80487060546875, -2.690185546875, -2.57550048828125, -2.4608154296875, -2.34613037109375, -2.2314453125, -2.11676025390625, -2.0020751953125, -1.88739013671875, -1.772705078125, -1.65802001953125, -1.5433349609375, -1.42864990234375, -1.31396484375, -1.19927978515625, -1.0845947265625, -0.96990966796875, -0.855224609375, -0.74053955078125, -0.6258544921875, -0.51116943359375, -0.396484375, -0.28179931640625, -0.1671142578125, -0.05242919921875, 0.062255859375, 0.17694091796875, 0.2916259765625, 0.40631103515625, 0.52099609375, 0.63568115234375, 0.7503662109375, 0.86505126953125, 0.979736328125, 1.09442138671875, 1.2091064453125, 1.32379150390625, 1.4384765625, 1.55316162109375, 1.6678466796875, 1.78253173828125, 1.897216796875, 2.01190185546875, 2.1265869140625, 2.24127197265625, 2.35595703125, 2.47064208984375, 2.5853271484375, 2.70001220703125, 2.814697265625, 2.92938232421875, 3.0440673828125, 3.15875244140625, 3.2734375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 8.0, 6.0, 21.0, 25.0, 42.0, 58.0, 73.0, 109.0, 160.0, 221.0, 360.0, 537.0, 744.0, 1010.0, 1377.0, 2181.0, 3177.0, 4634.0, 6843.0, 10871.0, 16520.0, 25858.0, 41124.0, 66861.0, 109907.0, 182691.0, 1265740.0, 134915.0, 80872.0, 50217.0, 31663.0, 20182.0, 12752.0, 8190.0, 5606.0, 3628.0, 2430.0, 1724.0, 1175.0, 800.0, 528.0, 388.0, 289.0, 214.0, 136.0, 98.0, 52.0, 33.0, 29.0, 18.0, 12.0, 10.0, 7.0, 7.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.1632080078125, -0.1581401824951172, -0.15307235717773438, -0.14800453186035156, -0.14293670654296875, -0.13786888122558594, -0.13280105590820312, -0.1277332305908203, -0.1226654052734375, -0.11759757995605469, -0.11252975463867188, -0.10746192932128906, -0.10239410400390625, -0.09732627868652344, -0.09225845336914062, -0.08719062805175781, -0.082122802734375, -0.07705497741699219, -0.07198715209960938, -0.06691932678222656, -0.06185150146484375, -0.05678367614746094, -0.051715850830078125, -0.04664802551269531, -0.0415802001953125, -0.03651237487792969, -0.031444549560546875, -0.026376724243164062, -0.02130889892578125, -0.016241073608398438, -0.011173248291015625, -0.0061054229736328125, -0.00103759765625, 0.0040302276611328125, 0.009098052978515625, 0.014165878295898438, 0.01923370361328125, 0.024301528930664062, 0.029369354248046875, 0.03443717956542969, 0.0395050048828125, 0.04457283020019531, 0.049640655517578125, 0.05470848083496094, 0.05977630615234375, 0.06484413146972656, 0.06991195678710938, 0.07497978210449219, 0.080047607421875, 0.08511543273925781, 0.09018325805664062, 0.09525108337402344, 0.10031890869140625, 0.10538673400878906, 0.11045455932617188, 0.11552238464355469, 0.1205902099609375, 0.1256580352783203, 0.13072586059570312, 0.13579368591308594, 0.14086151123046875, 0.14592933654785156, 0.15099716186523438, 0.1560649871826172, 0.1611328125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 6.0, 7.0, 6.0, 6.0, 11.0, 21.0, 13.0, 34.0, 37.0, 56.0, 89.0, 109.0, 115.0, 124.0, 91.0, 65.0, 44.0, 39.0, 29.0, 15.0, 11.0, 15.0, 13.0, 12.0, 7.0, 5.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002167224884033203, -0.00020942464470863342, -0.00020212680101394653, -0.00019482895731925964, -0.00018753111362457275, -0.00018023326992988586, -0.00017293542623519897, -0.00016563758254051208, -0.0001583397388458252, -0.0001510418951511383, -0.00014374405145645142, -0.00013644620776176453, -0.00012914836406707764, -0.00012185052037239075, -0.00011455267667770386, -0.00010725483298301697, -9.995698928833008e-05, -9.265914559364319e-05, -8.53613018989563e-05, -7.806345820426941e-05, -7.076561450958252e-05, -6.346777081489563e-05, -5.616992712020874e-05, -4.887208342552185e-05, -4.157423973083496e-05, -3.427639603614807e-05, -2.697855234146118e-05, -1.9680708646774292e-05, -1.2382864952087402e-05, -5.085021257400513e-06, 2.212822437286377e-06, 9.510666131973267e-06, 1.6808509826660156e-05, 2.4106353521347046e-05, 3.1404197216033936e-05, 3.8702040910720825e-05, 4.5999884605407715e-05, 5.3297728300094604e-05, 6.0595571994781494e-05, 6.789341568946838e-05, 7.519125938415527e-05, 8.248910307884216e-05, 8.978694677352905e-05, 9.708479046821594e-05, 0.00010438263416290283, 0.00011168047785758972, 0.00011897832155227661, 0.0001262761652469635, 0.0001335740089416504, 0.00014087185263633728, 0.00014816969633102417, 0.00015546754002571106, 0.00016276538372039795, 0.00017006322741508484, 0.00017736107110977173, 0.00018465891480445862, 0.0001919567584991455, 0.0001992546021938324, 0.0002065524458885193, 0.00021385028958320618, 0.00022114813327789307, 0.00022844597697257996, 0.00023574382066726685, 0.00024304166436195374, 0.0002503395080566406]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 7.0, 9.0, 17.0, 14.0, 17.0, 17.0, 41.0, 43.0, 73.0, 124.0, 264.0, 1170.0, 54006.0, 981968.0, 9695.0, 587.0, 207.0, 113.0, 65.0, 37.0, 22.0, 16.0, 7.0, 7.0, 9.0, 6.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.005214691162109375, -0.005062758922576904, -0.004910826683044434, -0.004758894443511963, -0.004606962203979492, -0.0044550299644470215, -0.004303097724914551, -0.00415116548538208, -0.003999233245849609, -0.0038473010063171387, -0.003695368766784668, -0.0035434365272521973, -0.0033915042877197266, -0.003239572048187256, -0.003087639808654785, -0.0029357075691223145, -0.0027837753295898438, -0.002631843090057373, -0.0024799108505249023, -0.0023279786109924316, -0.002176046371459961, -0.0020241141319274902, -0.0018721818923950195, -0.0017202496528625488, -0.0015683174133300781, -0.0014163851737976074, -0.0012644529342651367, -0.001112520694732666, -0.0009605884552001953, -0.0008086562156677246, -0.0006567239761352539, -0.0005047917366027832, -0.0003528594970703125, -0.0002009272575378418, -4.8995018005371094e-05, 0.00010293722152709961, 0.0002548694610595703, 0.000406801700592041, 0.0005587339401245117, 0.0007106661796569824, 0.0008625984191894531, 0.0010145306587219238, 0.0011664628982543945, 0.0013183951377868652, 0.001470327377319336, 0.0016222596168518066, 0.0017741918563842773, 0.001926124095916748, 0.0020780563354492188, 0.0022299885749816895, 0.00238192081451416, 0.002533853054046631, 0.0026857852935791016, 0.0028377175331115723, 0.002989649772644043, 0.0031415820121765137, 0.0032935142517089844, 0.003445446491241455, 0.0035973787307739258, 0.0037493109703063965, 0.003901243209838867, 0.004053175449371338, 0.004205107688903809, 0.004357039928436279, 0.00450897216796875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 12.0, 38.0, 171.0, 514.0, 223.0, 43.0, 14.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008655885467305779, -0.0008419420919381082, -0.0008182956953532994, -0.0007946492405608296, -0.0007710028439760208, -0.0007473563891835511, -0.0007237099343910813, -0.0007000635378062725, -0.0006764171412214637, -0.0006527706864289939, -0.0006291242898441851, -0.0006054778350517154, -0.0005818314384669065, -0.0005581849836744368, -0.0005345385288819671, -0.0005108921322971582, -0.0004872456775046885, -0.0004635992518160492, -0.00043995282612740993, -0.0004163063713349402, -0.00039265997475013137, -0.00036901351995766163, -0.00034536709426902235, -0.00032172066858038306, -0.0002980742428917438, -0.0002744278172031045, -0.0002507813915144652, -0.0002271349512739107, -0.00020348852558527142, -0.00017984209989663213, -0.00015619565965607762, -0.00013254923396743834, -0.00010890280827879906, -8.525638259015977e-05, -6.160994962556288e-05, -3.796351666096598e-05, -1.4317090972326696e-05, 9.329334716312587e-06, 3.29757749568671e-05, 5.662220064550638e-05, 8.026862633414567e-05, 0.00010391505202278495, 0.00012756147771142423, 0.00015120791795197874, 0.00017485434364061803, 0.0001985007693292573, 0.00022214720956981182, 0.0002457936352584511, 0.0002694400609470904, 0.00029308648663572967, 0.00031673291232436895, 0.0003403793671168387, 0.0003640257637016475, 0.00038767221849411726, 0.00041131864418275654, 0.0004349650698713958, 0.0004586114955600351, 0.0004822579212486744, 0.0005059043760411441, 0.000529550772625953, 0.0005531972274184227, 0.0005768436240032315, 0.0006004900787957013, 0.000624136533588171, 0.0006477829301729798]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 2.0, 7.0, 10.0, 8.0, 8.0, 13.0, 22.0, 14.0, 19.0, 20.0, 29.0, 26.0, 33.0, 30.0, 29.0, 30.0, 36.0, 31.0, 33.0, 38.0, 39.0, 36.0, 39.0, 40.0, 43.0, 30.0, 40.0, 31.0, 35.0, 22.0, 25.0, 21.0, 29.0, 23.0, 15.0, 8.0, 14.0, 18.0, 8.0, 8.0, 8.0, 11.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.308887481689453e-05, -8.052308112382889e-05, -7.795728743076324e-05, -7.53914937376976e-05, -7.282570004463196e-05, -7.025990635156631e-05, -6.769411265850067e-05, -6.512831896543503e-05, -6.256252527236938e-05, -5.999673157930374e-05, -5.74309378862381e-05, -5.4865144193172455e-05, -5.229935050010681e-05, -4.973355680704117e-05, -4.7167763113975525e-05, -4.460196942090988e-05, -4.203617572784424e-05, -3.9470382034778595e-05, -3.690458834171295e-05, -3.433879464864731e-05, -3.1773000955581665e-05, -2.9207207262516022e-05, -2.664141356945038e-05, -2.4075619876384735e-05, -2.1509826183319092e-05, -1.894403249025345e-05, -1.6378238797187805e-05, -1.3812445104122162e-05, -1.1246651411056519e-05, -8.680857717990875e-06, -6.115064024925232e-06, -3.5492703318595886e-06, -9.834766387939453e-07, 1.582317054271698e-06, 4.148110747337341e-06, 6.713904440402985e-06, 9.279698133468628e-06, 1.1845491826534271e-05, 1.4411285519599915e-05, 1.6977079212665558e-05, 1.95428729057312e-05, 2.2108666598796844e-05, 2.4674460291862488e-05, 2.724025398492813e-05, 2.9806047677993774e-05, 3.237184137105942e-05, 3.493763506412506e-05, 3.7503428757190704e-05, 4.006922245025635e-05, 4.263501614332199e-05, 4.5200809836387634e-05, 4.776660352945328e-05, 5.033239722251892e-05, 5.2898190915584564e-05, 5.546398460865021e-05, 5.802977830171585e-05, 6.0595571994781494e-05, 6.316136568784714e-05, 6.572715938091278e-05, 6.829295307397842e-05, 7.085874676704407e-05, 7.342454046010971e-05, 7.599033415317535e-05, 7.8556127846241e-05, 8.112192153930664e-05]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 9.0, 6.0, 17.0, 13.0, 19.0, 17.0, 17.0, 23.0, 25.0, 28.0, 34.0, 31.0, 40.0, 54.0, 55.0, 47.0, 51.0, 52.0, 46.0, 57.0, 32.0, 37.0, 35.0, 41.0, 39.0, 21.0, 27.0, 23.0, 22.0, 15.0, 17.0, 8.0, 3.0, 14.0, 2.0, 7.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.3299560546875, -6.120849609375, -5.9117431640625, -5.70263671875, -5.4935302734375, -5.284423828125, -5.0753173828125, -4.8662109375, -4.6571044921875, -4.447998046875, -4.2388916015625, -4.02978515625, -3.8206787109375, -3.611572265625, -3.4024658203125, -3.193359375, -2.9842529296875, -2.775146484375, -2.5660400390625, -2.35693359375, -2.1478271484375, -1.938720703125, -1.7296142578125, -1.5205078125, -1.3114013671875, -1.102294921875, -0.8931884765625, -0.68408203125, -0.4749755859375, -0.265869140625, -0.0567626953125, 0.15234375, 0.3614501953125, 0.570556640625, 0.7796630859375, 0.98876953125, 1.1978759765625, 1.406982421875, 1.6160888671875, 1.8251953125, 2.0343017578125, 2.243408203125, 2.4525146484375, 2.66162109375, 2.8707275390625, 3.079833984375, 3.2889404296875, 3.498046875, 3.7071533203125, 3.916259765625, 4.1253662109375, 4.33447265625, 4.5435791015625, 4.752685546875, 4.9617919921875, 5.1708984375, 5.3800048828125, 5.589111328125, 5.7982177734375, 6.00732421875, 6.2164306640625, 6.425537109375, 6.6346435546875, 6.84375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 3.0, 8.0, 15.0, 17.0, 29.0, 43.0, 75.0, 84.0, 196.0, 277.0, 526.0, 858.0, 1570.0, 2837.0, 5482.0, 11350.0, 28818.0, 127624.0, 595910.0, 205293.0, 39513.0, 13838.0, 6624.0, 3336.0, 1806.0, 1002.0, 549.0, 322.0, 212.0, 125.0, 67.0, 47.0, 36.0, 19.0, 21.0, 7.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1875, -9.875244140625, -9.56298828125, -9.250732421875, -8.9384765625, -8.626220703125, -8.31396484375, -8.001708984375, -7.689453125, -7.377197265625, -7.06494140625, -6.752685546875, -6.4404296875, -6.128173828125, -5.81591796875, -5.503662109375, -5.19140625, -4.879150390625, -4.56689453125, -4.254638671875, -3.9423828125, -3.630126953125, -3.31787109375, -3.005615234375, -2.693359375, -2.381103515625, -2.06884765625, -1.756591796875, -1.4443359375, -1.132080078125, -0.81982421875, -0.507568359375, -0.1953125, 0.116943359375, 0.42919921875, 0.741455078125, 1.0537109375, 1.365966796875, 1.67822265625, 1.990478515625, 2.302734375, 2.614990234375, 2.92724609375, 3.239501953125, 3.5517578125, 3.864013671875, 4.17626953125, 4.488525390625, 4.80078125, 5.113037109375, 5.42529296875, 5.737548828125, 6.0498046875, 6.362060546875, 6.67431640625, 6.986572265625, 7.298828125, 7.611083984375, 7.92333984375, 8.235595703125, 8.5478515625, 8.860107421875, 9.17236328125, 9.484619140625, 9.796875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 9.0, 8.0, 10.0, 20.0, 11.0, 12.0, 19.0, 19.0, 30.0, 35.0, 34.0, 30.0, 55.0, 45.0, 40.0, 70.0, 177.0, 1573.0, 294.0, 92.0, 61.0, 40.0, 57.0, 39.0, 43.0, 31.0, 36.0, 25.0, 29.0, 19.0, 18.0, 12.0, 9.0, 9.0, 8.0, 4.0, 7.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.6875, -19.001708984375, -18.31591796875, -17.630126953125, -16.9443359375, -16.258544921875, -15.57275390625, -14.886962890625, -14.201171875, -13.515380859375, -12.82958984375, -12.143798828125, -11.4580078125, -10.772216796875, -10.08642578125, -9.400634765625, -8.71484375, -8.029052734375, -7.34326171875, -6.657470703125, -5.9716796875, -5.285888671875, -4.60009765625, -3.914306640625, -3.228515625, -2.542724609375, -1.85693359375, -1.171142578125, -0.4853515625, 0.200439453125, 0.88623046875, 1.572021484375, 2.2578125, 2.943603515625, 3.62939453125, 4.315185546875, 5.0009765625, 5.686767578125, 6.37255859375, 7.058349609375, 7.744140625, 8.429931640625, 9.11572265625, 9.801513671875, 10.4873046875, 11.173095703125, 11.85888671875, 12.544677734375, 13.23046875, 13.916259765625, 14.60205078125, 15.287841796875, 15.9736328125, 16.659423828125, 17.34521484375, 18.031005859375, 18.716796875, 19.402587890625, 20.08837890625, 20.774169921875, 21.4599609375, 22.145751953125, 22.83154296875, 23.517333984375, 24.203125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 5.0, 8.0, 5.0, 4.0, 9.0, 13.0, 26.0, 38.0, 60.0, 85.0, 166.0, 331.0, 881.0, 14759.0, 3118041.0, 9884.0, 727.0, 278.0, 159.0, 80.0, 52.0, 30.0, 12.0, 9.0, 7.0, 15.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.375, -114.939453125, -111.50390625, -108.068359375, -104.6328125, -101.197265625, -97.76171875, -94.326171875, -90.890625, -87.455078125, -84.01953125, -80.583984375, -77.1484375, -73.712890625, -70.27734375, -66.841796875, -63.40625, -59.970703125, -56.53515625, -53.099609375, -49.6640625, -46.228515625, -42.79296875, -39.357421875, -35.921875, -32.486328125, -29.05078125, -25.615234375, -22.1796875, -18.744140625, -15.30859375, -11.873046875, -8.4375, -5.001953125, -1.56640625, 1.869140625, 5.3046875, 8.740234375, 12.17578125, 15.611328125, 19.046875, 22.482421875, 25.91796875, 29.353515625, 32.7890625, 36.224609375, 39.66015625, 43.095703125, 46.53125, 49.966796875, 53.40234375, 56.837890625, 60.2734375, 63.708984375, 67.14453125, 70.580078125, 74.015625, 77.451171875, 80.88671875, 84.322265625, 87.7578125, 91.193359375, 94.62890625, 98.064453125, 101.5]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 127.0, 881.0, 10.0], "bins": [-911.3828735351562, -896.7440795898438, -882.105224609375, -867.4664306640625, -852.82763671875, -838.1888427734375, -823.5499877929688, -808.9111938476562, -794.2723999023438, -779.6336059570312, -764.9947509765625, -750.35595703125, -735.7171630859375, -721.078369140625, -706.4395141601562, -691.8007202148438, -677.1619262695312, -662.5231323242188, -647.88427734375, -633.2454833984375, -618.606689453125, -603.9678955078125, -589.3290405273438, -574.6902465820312, -560.0514526367188, -545.4126586914062, -530.7738037109375, -516.135009765625, -501.4962158203125, -486.8573913574219, -472.2185974121094, -457.57977294921875, -442.94091796875, -428.3020935058594, -413.6632995605469, -399.02447509765625, -384.38568115234375, -369.7468566894531, -355.1080627441406, -340.46923828125, -325.8304443359375, -311.1916198730469, -296.5528259277344, -281.91400146484375, -267.27520751953125, -252.63638305664062, -237.99758911132812, -223.3587646484375, -208.719970703125, -194.08116149902344, -179.44235229492188, -164.8035430908203, -150.16473388671875, -135.52590942382812, -120.8871078491211, -106.24829864501953, -91.60948181152344, -76.97067260742188, -62.33186340332031, -47.693050384521484, -33.05424118041992, -18.415428161621094, -3.7766189575195312, 10.862190246582031, 25.500995635986328]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 10.0, 7.0, 6.0, 4.0, 11.0, 5.0, 22.0, 12.0, 18.0, 23.0, 17.0, 16.0, 31.0, 28.0, 40.0, 33.0, 32.0, 28.0, 33.0, 43.0, 43.0, 46.0, 44.0, 49.0, 44.0, 34.0, 42.0, 35.0, 39.0, 33.0, 30.0, 19.0, 28.0, 10.0, 14.0, 17.0, 7.0, 10.0, 8.0, 6.0, 7.0, 9.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.141475677490234, -52.46421813964844, -50.786964416503906, -49.10970687866211, -47.43244934082031, -45.75519561767578, -44.077938079833984, -42.40068054199219, -40.723426818847656, -39.04616928100586, -37.36891555786133, -35.69165802001953, -34.014400482177734, -32.33714294433594, -30.659889221191406, -28.98263168334961, -27.305374145507812, -25.62811851501465, -23.95086097717285, -22.273605346679688, -20.59634780883789, -18.919092178344727, -17.241836547851562, -15.564579963684082, -13.887323379516602, -12.210066795349121, -10.53281021118164, -8.855554580688477, -7.178297996520996, -5.501041412353516, -3.8237857818603516, -2.146529197692871, -0.46927642822265625, 1.2079799175262451, 2.8852362632751465, 4.562492370605469, 6.239748954772949, 7.91700553894043, 9.594261169433594, 11.271517753601074, 12.948774337768555, 14.626030921936035, 16.303287506103516, 17.98054313659668, 19.657798767089844, 21.33505630493164, 23.012311935424805, 24.68956756591797, 26.366825103759766, 28.04408073425293, 29.721338272094727, 31.39859390258789, 33.07585144042969, 34.75310516357422, 36.430362701416016, 38.10762023925781, 39.784873962402344, 41.46213150024414, 43.13938522338867, 44.81664276123047, 46.493900299072266, 48.17115783691406, 49.848411560058594, 51.52566909790039, 53.20292663574219]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 8.0, 6.0, 7.0, 5.0, 13.0, 12.0, 13.0, 14.0, 14.0, 30.0, 24.0, 29.0, 32.0, 30.0, 44.0, 53.0, 47.0, 46.0, 34.0, 48.0, 45.0, 50.0, 41.0, 40.0, 35.0, 38.0, 31.0, 29.0, 32.0, 25.0, 25.0, 18.0, 18.0, 8.0, 14.0, 11.0, 7.0, 11.0, 3.0, 4.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.5625, -7.3397216796875, -7.116943359375, -6.8941650390625, -6.67138671875, -6.4486083984375, -6.225830078125, -6.0030517578125, -5.7802734375, -5.5574951171875, -5.334716796875, -5.1119384765625, -4.88916015625, -4.6663818359375, -4.443603515625, -4.2208251953125, -3.998046875, -3.7752685546875, -3.552490234375, -3.3297119140625, -3.10693359375, -2.8841552734375, -2.661376953125, -2.4385986328125, -2.2158203125, -1.9930419921875, -1.770263671875, -1.5474853515625, -1.32470703125, -1.1019287109375, -0.879150390625, -0.6563720703125, -0.43359375, -0.2108154296875, 0.011962890625, 0.2347412109375, 0.45751953125, 0.6802978515625, 0.903076171875, 1.1258544921875, 1.3486328125, 1.5714111328125, 1.794189453125, 2.0169677734375, 2.23974609375, 2.4625244140625, 2.685302734375, 2.9080810546875, 3.130859375, 3.3536376953125, 3.576416015625, 3.7991943359375, 4.02197265625, 4.2447509765625, 4.467529296875, 4.6903076171875, 4.9130859375, 5.1358642578125, 5.358642578125, 5.5814208984375, 5.80419921875, 6.0269775390625, 6.249755859375, 6.4725341796875, 6.6953125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 8.0, 18.0, 15.0, 18.0, 25.0, 41.0, 69.0, 85.0, 125.0, 215.0, 271.0, 477.0, 694.0, 1224.0, 2318.0, 4806.0, 13244.0, 65542.0, 842786.0, 2700254.0, 497851.0, 44110.0, 10921.0, 4323.0, 1974.0, 1006.0, 694.0, 366.0, 240.0, 164.0, 130.0, 73.0, 60.0, 35.0, 32.0, 18.0, 11.0, 15.0, 5.0, 5.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-15.875, -15.426513671875, -14.97802734375, -14.529541015625, -14.0810546875, -13.632568359375, -13.18408203125, -12.735595703125, -12.287109375, -11.838623046875, -11.39013671875, -10.941650390625, -10.4931640625, -10.044677734375, -9.59619140625, -9.147705078125, -8.69921875, -8.250732421875, -7.80224609375, -7.353759765625, -6.9052734375, -6.456787109375, -6.00830078125, -5.559814453125, -5.111328125, -4.662841796875, -4.21435546875, -3.765869140625, -3.3173828125, -2.868896484375, -2.42041015625, -1.971923828125, -1.5234375, -1.074951171875, -0.62646484375, -0.177978515625, 0.2705078125, 0.718994140625, 1.16748046875, 1.615966796875, 2.064453125, 2.512939453125, 2.96142578125, 3.409912109375, 3.8583984375, 4.306884765625, 4.75537109375, 5.203857421875, 5.65234375, 6.100830078125, 6.54931640625, 6.997802734375, 7.4462890625, 7.894775390625, 8.34326171875, 8.791748046875, 9.240234375, 9.688720703125, 10.13720703125, 10.585693359375, 11.0341796875, 11.482666015625, 11.93115234375, 12.379638671875, 12.828125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 8.0, 9.0, 9.0, 8.0, 24.0, 16.0, 28.0, 42.0, 54.0, 87.0, 95.0, 135.0, 225.0, 396.0, 532.0, 707.0, 554.0, 375.0, 257.0, 147.0, 97.0, 71.0, 51.0, 43.0, 26.0, 24.0, 14.0, 12.0, 3.0, 8.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.40625, -12.951904296875, -12.49755859375, -12.043212890625, -11.5888671875, -11.134521484375, -10.68017578125, -10.225830078125, -9.771484375, -9.317138671875, -8.86279296875, -8.408447265625, -7.9541015625, -7.499755859375, -7.04541015625, -6.591064453125, -6.13671875, -5.682373046875, -5.22802734375, -4.773681640625, -4.3193359375, -3.864990234375, -3.41064453125, -2.956298828125, -2.501953125, -2.047607421875, -1.59326171875, -1.138916015625, -0.6845703125, -0.230224609375, 0.22412109375, 0.678466796875, 1.1328125, 1.587158203125, 2.04150390625, 2.495849609375, 2.9501953125, 3.404541015625, 3.85888671875, 4.313232421875, 4.767578125, 5.221923828125, 5.67626953125, 6.130615234375, 6.5849609375, 7.039306640625, 7.49365234375, 7.947998046875, 8.40234375, 8.856689453125, 9.31103515625, 9.765380859375, 10.2197265625, 10.674072265625, 11.12841796875, 11.582763671875, 12.037109375, 12.491455078125, 12.94580078125, 13.400146484375, 13.8544921875, 14.308837890625, 14.76318359375, 15.217529296875, 15.671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 5.0, 7.0, 14.0, 24.0, 22.0, 33.0, 61.0, 81.0, 143.0, 236.0, 515.0, 2346.0, 23430.0, 2878115.0, 1270843.0, 15637.0, 1692.0, 469.0, 192.0, 113.0, 95.0, 52.0, 35.0, 29.0, 15.0, 25.0, 9.0, 9.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-54.0, -52.4541015625, -50.908203125, -49.3623046875, -47.81640625, -46.2705078125, -44.724609375, -43.1787109375, -41.6328125, -40.0869140625, -38.541015625, -36.9951171875, -35.44921875, -33.9033203125, -32.357421875, -30.8115234375, -29.265625, -27.7197265625, -26.173828125, -24.6279296875, -23.08203125, -21.5361328125, -19.990234375, -18.4443359375, -16.8984375, -15.3525390625, -13.806640625, -12.2607421875, -10.71484375, -9.1689453125, -7.623046875, -6.0771484375, -4.53125, -2.9853515625, -1.439453125, 0.1064453125, 1.65234375, 3.1982421875, 4.744140625, 6.2900390625, 7.8359375, 9.3818359375, 10.927734375, 12.4736328125, 14.01953125, 15.5654296875, 17.111328125, 18.6572265625, 20.203125, 21.7490234375, 23.294921875, 24.8408203125, 26.38671875, 27.9326171875, 29.478515625, 31.0244140625, 32.5703125, 34.1162109375, 35.662109375, 37.2080078125, 38.75390625, 40.2998046875, 41.845703125, 43.3916015625, 44.9375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 18.0, 36.0, 86.0, 180.0, 208.0, 200.0, 129.0, 85.0, 36.0, 13.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.62261962890625, -160.40814208984375, -157.19366455078125, -153.97918701171875, -150.76470947265625, -147.55023193359375, -144.3357696533203, -141.1212921142578, -137.9068145751953, -134.6923370361328, -131.4778594970703, -128.2633819580078, -125.04891204833984, -121.83443450927734, -118.61995697021484, -115.40548706054688, -112.19100952148438, -108.97653198242188, -105.76205444335938, -102.5475845336914, -99.3331069946289, -96.1186294555664, -92.9041519165039, -89.68968200683594, -86.4751968383789, -83.2607192993164, -80.0462417602539, -76.83177185058594, -73.61729431152344, -70.40281677246094, -67.18833923339844, -63.9738655090332, -60.759395599365234, -57.544918060302734, -54.3304443359375, -51.115966796875, -47.901493072509766, -44.687015533447266, -41.47254180908203, -38.25806427001953, -35.04358673095703, -31.829111099243164, -28.614635467529297, -25.400157928466797, -22.185684204101562, -18.971206665039062, -15.756731033325195, -12.542255401611328, -9.327781677246094, -6.113306045532227, -2.898829936981201, 0.3156461715698242, 3.5301218032836914, 6.744598388671875, 9.959074020385742, 13.17354965209961, 16.388025283813477, 19.602500915527344, 22.81697654724121, 26.031452178955078, 29.245929718017578, 32.46040344238281, 35.67488098144531, 38.88935852050781, 42.10383224487305]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 7.0, 14.0, 10.0, 8.0, 17.0, 15.0, 18.0, 20.0, 20.0, 24.0, 35.0, 33.0, 26.0, 41.0, 36.0, 30.0, 45.0, 46.0, 41.0, 36.0, 35.0, 42.0, 33.0, 42.0, 30.0, 43.0, 36.0, 42.0, 29.0, 29.0, 16.0, 13.0, 18.0, 9.0, 13.0, 10.0, 6.0, 5.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.07271194458008, -33.81715774536133, -32.56160354614258, -31.306047439575195, -30.050491333007812, -28.794937133789062, -27.539382934570312, -26.28382682800293, -25.028270721435547, -23.772716522216797, -22.517160415649414, -21.261606216430664, -20.00605010986328, -18.75049591064453, -17.49494171142578, -16.2393856048584, -14.983831405639648, -13.728276252746582, -12.472721099853516, -11.217166900634766, -9.961610794067383, -8.706056594848633, -7.450501441955566, -6.1949462890625, -4.939391136169434, -3.683835983276367, -2.42828106880188, -1.1727261543273926, 0.08282899856567383, 1.3383841514587402, 2.5939388275146484, 3.849493980407715, 5.105049133300781, 6.360604286193848, 7.616159439086914, 8.871713638305664, 10.127269744873047, 11.382823944091797, 12.638379096984863, 13.89393424987793, 15.149489402770996, 16.405044555664062, 17.660598754882812, 18.916154861450195, 20.171709060668945, 21.427265167236328, 22.682819366455078, 23.938373565673828, 25.19392967224121, 26.44948387145996, 27.705039978027344, 28.960594177246094, 30.216150283813477, 31.471704483032227, 32.72726058959961, 33.98281478881836, 35.23836898803711, 36.49392318725586, 37.74947738647461, 39.005035400390625, 40.260589599609375, 41.516143798828125, 42.771697998046875, 44.027252197265625, 45.28281021118164]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 8.0, 16.0, 7.0, 11.0, 14.0, 11.0, 20.0, 20.0, 23.0, 32.0, 21.0, 37.0, 44.0, 47.0, 45.0, 52.0, 40.0, 45.0, 33.0, 46.0, 40.0, 35.0, 51.0, 34.0, 33.0, 26.0, 34.0, 23.0, 23.0, 19.0, 12.0, 9.0, 17.0, 16.0, 11.0, 7.0, 9.0, 7.0, 2.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.4852294921875, -6.282958984375, -6.0806884765625, -5.87841796875, -5.6761474609375, -5.473876953125, -5.2716064453125, -5.0693359375, -4.8670654296875, -4.664794921875, -4.4625244140625, -4.26025390625, -4.0579833984375, -3.855712890625, -3.6534423828125, -3.451171875, -3.2489013671875, -3.046630859375, -2.8443603515625, -2.64208984375, -2.4398193359375, -2.237548828125, -2.0352783203125, -1.8330078125, -1.6307373046875, -1.428466796875, -1.2261962890625, -1.02392578125, -0.8216552734375, -0.619384765625, -0.4171142578125, -0.21484375, -0.0125732421875, 0.189697265625, 0.3919677734375, 0.59423828125, 0.7965087890625, 0.998779296875, 1.2010498046875, 1.4033203125, 1.6055908203125, 1.807861328125, 2.0101318359375, 2.21240234375, 2.4146728515625, 2.616943359375, 2.8192138671875, 3.021484375, 3.2237548828125, 3.426025390625, 3.6282958984375, 3.83056640625, 4.0328369140625, 4.235107421875, 4.4373779296875, 4.6396484375, 4.8419189453125, 5.044189453125, 5.2464599609375, 5.44873046875, 5.6510009765625, 5.853271484375, 6.0555419921875, 6.2578125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 4.0, 7.0, 13.0, 10.0, 14.0, 38.0, 47.0, 59.0, 88.0, 115.0, 151.0, 204.0, 332.0, 451.0, 640.0, 924.0, 1257.0, 1881.0, 2681.0, 4020.0, 5983.0, 8657.0, 12933.0, 19853.0, 31616.0, 52753.0, 93197.0, 177639.0, 266353.0, 153158.0, 81764.0, 47400.0, 29122.0, 18149.0, 12003.0, 7743.0, 5172.0, 3653.0, 2533.0, 1762.0, 1196.0, 867.0, 643.0, 442.0, 300.0, 232.0, 164.0, 98.0, 74.0, 59.0, 32.0, 30.0, 16.0, 14.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.2529296875, -0.244873046875, -0.23681640625, -0.228759765625, -0.220703125, -0.212646484375, -0.20458984375, -0.196533203125, -0.1884765625, -0.180419921875, -0.17236328125, -0.164306640625, -0.15625, -0.148193359375, -0.14013671875, -0.132080078125, -0.1240234375, -0.115966796875, -0.10791015625, -0.099853515625, -0.091796875, -0.083740234375, -0.07568359375, -0.067626953125, -0.0595703125, -0.051513671875, -0.04345703125, -0.035400390625, -0.02734375, -0.019287109375, -0.01123046875, -0.003173828125, 0.0048828125, 0.012939453125, 0.02099609375, 0.029052734375, 0.037109375, 0.045166015625, 0.05322265625, 0.061279296875, 0.0693359375, 0.077392578125, 0.08544921875, 0.093505859375, 0.1015625, 0.109619140625, 0.11767578125, 0.125732421875, 0.1337890625, 0.141845703125, 0.14990234375, 0.157958984375, 0.166015625, 0.174072265625, 0.18212890625, 0.190185546875, 0.1982421875, 0.206298828125, 0.21435546875, 0.222412109375, 0.23046875, 0.238525390625, 0.24658203125, 0.254638671875, 0.2626953125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 2.0, 9.0, 4.0, 8.0, 7.0, 13.0, 10.0, 10.0, 13.0, 25.0, 25.0, 21.0, 30.0, 36.0, 42.0, 38.0, 38.0, 50.0, 45.0, 35.0, 1057.0, 54.0, 49.0, 44.0, 42.0, 38.0, 31.0, 33.0, 41.0, 27.0, 22.0, 22.0, 12.0, 11.0, 16.0, 20.0, 13.0, 14.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.07720947265625, -3.9473876953125, -3.81756591796875, -3.687744140625, -3.55792236328125, -3.4281005859375, -3.29827880859375, -3.16845703125, -3.03863525390625, -2.9088134765625, -2.77899169921875, -2.649169921875, -2.51934814453125, -2.3895263671875, -2.25970458984375, -2.1298828125, -2.00006103515625, -1.8702392578125, -1.74041748046875, -1.610595703125, -1.48077392578125, -1.3509521484375, -1.22113037109375, -1.09130859375, -0.96148681640625, -0.8316650390625, -0.70184326171875, -0.572021484375, -0.44219970703125, -0.3123779296875, -0.18255615234375, -0.052734375, 0.07708740234375, 0.2069091796875, 0.33673095703125, 0.466552734375, 0.59637451171875, 0.7261962890625, 0.85601806640625, 0.98583984375, 1.11566162109375, 1.2454833984375, 1.37530517578125, 1.505126953125, 1.63494873046875, 1.7647705078125, 1.89459228515625, 2.0244140625, 2.15423583984375, 2.2840576171875, 2.41387939453125, 2.543701171875, 2.67352294921875, 2.8033447265625, 2.93316650390625, 3.06298828125, 3.19281005859375, 3.3226318359375, 3.45245361328125, 3.582275390625, 3.71209716796875, 3.8419189453125, 3.97174072265625, 4.1015625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 10.0, 27.0, 31.0, 58.0, 66.0, 111.0, 133.0, 212.0, 336.0, 493.0, 716.0, 1076.0, 1640.0, 2488.0, 3794.0, 5936.0, 9315.0, 14942.0, 24893.0, 41446.0, 72332.0, 133492.0, 1293290.0, 216159.0, 114863.0, 63230.0, 36825.0, 21618.0, 13533.0, 8380.0, 5392.0, 3522.0, 2174.0, 1506.0, 1015.0, 700.0, 466.0, 299.0, 186.0, 147.0, 90.0, 64.0, 39.0, 27.0, 21.0, 7.0, 11.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.198486328125, -0.1922607421875, -0.18603515625, -0.1798095703125, -0.173583984375, -0.1673583984375, -0.1611328125, -0.1549072265625, -0.148681640625, -0.1424560546875, -0.13623046875, -0.1300048828125, -0.123779296875, -0.1175537109375, -0.111328125, -0.1051025390625, -0.098876953125, -0.0926513671875, -0.08642578125, -0.0802001953125, -0.073974609375, -0.0677490234375, -0.0615234375, -0.0552978515625, -0.049072265625, -0.0428466796875, -0.03662109375, -0.0303955078125, -0.024169921875, -0.0179443359375, -0.01171875, -0.0054931640625, 0.000732421875, 0.0069580078125, 0.01318359375, 0.0194091796875, 0.025634765625, 0.0318603515625, 0.0380859375, 0.0443115234375, 0.050537109375, 0.0567626953125, 0.06298828125, 0.0692138671875, 0.075439453125, 0.0816650390625, 0.087890625, 0.0941162109375, 0.100341796875, 0.1065673828125, 0.11279296875, 0.1190185546875, 0.125244140625, 0.1314697265625, 0.1376953125, 0.1439208984375, 0.150146484375, 0.1563720703125, 0.16259765625, 0.1688232421875, 0.175048828125, 0.1812744140625, 0.1875, 0.1937255859375, 0.199951171875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 6.0, 2.0, 11.0, 9.0, 14.0, 16.0, 15.0, 14.0, 23.0, 23.0, 30.0, 39.0, 53.0, 88.0, 81.0, 85.0, 119.0, 83.0, 62.0, 36.0, 44.0, 25.0, 17.0, 12.0, 4.0, 14.0, 10.0, 9.0, 3.0, 4.0, 3.0, 4.0, 2.0, 6.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.0001875162124633789, -0.0001815836876630783, -0.0001756511628627777, -0.0001697186380624771, -0.00016378611326217651, -0.00015785358846187592, -0.00015192106366157532, -0.00014598853886127472, -0.00014005601406097412, -0.00013412348926067352, -0.00012819096446037292, -0.00012225843966007233, -0.00011632591485977173, -0.00011039339005947113, -0.00010446086525917053, -9.852834045886993e-05, -9.259581565856934e-05, -8.666329085826874e-05, -8.073076605796814e-05, -7.479824125766754e-05, -6.886571645736694e-05, -6.293319165706635e-05, -5.700066685676575e-05, -5.106814205646515e-05, -4.513561725616455e-05, -3.920309245586395e-05, -3.3270567655563354e-05, -2.7338042855262756e-05, -2.1405518054962158e-05, -1.547299325466156e-05, -9.540468454360962e-06, -3.6079436540603638e-06, 2.3245811462402344e-06, 8.257105946540833e-06, 1.418963074684143e-05, 2.012215554714203e-05, 2.6054680347442627e-05, 3.1987205147743225e-05, 3.791972994804382e-05, 4.385225474834442e-05, 4.978477954864502e-05, 5.571730434894562e-05, 6.164982914924622e-05, 6.758235394954681e-05, 7.351487874984741e-05, 7.944740355014801e-05, 8.537992835044861e-05, 9.13124531507492e-05, 9.72449779510498e-05, 0.0001031775027513504, 0.000109110027551651, 0.0001150425523519516, 0.0001209750771522522, 0.0001269076019525528, 0.0001328401267528534, 0.000138772651553154, 0.0001447051763534546, 0.0001506377011537552, 0.00015657022595405579, 0.00016250275075435638, 0.00016843527555465698, 0.00017436780035495758, 0.00018030032515525818, 0.00018623284995555878, 0.00019216537475585938]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 6.0, 3.0, 4.0, 3.0, 9.0, 12.0, 4.0, 7.0, 12.0, 10.0, 12.0, 16.0, 26.0, 24.0, 24.0, 29.0, 53.0, 86.0, 141.0, 275.0, 787.0, 4570.0, 58321.0, 945719.0, 33783.0, 3268.0, 635.0, 225.0, 118.0, 82.0, 51.0, 40.0, 39.0, 23.0, 17.0, 20.0, 22.0, 12.0, 15.0, 16.0, 6.0, 7.0, 1.0, 3.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.003570556640625, -0.0034637153148651123, -0.0033568739891052246, -0.003250032663345337, -0.0031431913375854492, -0.0030363500118255615, -0.002929508686065674, -0.002822667360305786, -0.0027158260345458984, -0.0026089847087860107, -0.002502143383026123, -0.0023953020572662354, -0.0022884607315063477, -0.00218161940574646, -0.0020747780799865723, -0.0019679367542266846, -0.0018610954284667969, -0.0017542541027069092, -0.0016474127769470215, -0.0015405714511871338, -0.001433730125427246, -0.0013268887996673584, -0.0012200474739074707, -0.001113206148147583, -0.0010063648223876953, -0.0008995234966278076, -0.0007926821708679199, -0.0006858408451080322, -0.0005789995193481445, -0.00047215819358825684, -0.00036531686782836914, -0.00025847554206848145, -0.00015163421630859375, -4.4792890548706055e-05, 6.204843521118164e-05, 0.00016888976097106934, 0.00027573108673095703, 0.0003825724124908447, 0.0004894137382507324, 0.0005962550640106201, 0.0007030963897705078, 0.0008099377155303955, 0.0009167790412902832, 0.001023620367050171, 0.0011304616928100586, 0.0012373030185699463, 0.001344144344329834, 0.0014509856700897217, 0.0015578269958496094, 0.001664668321609497, 0.0017715096473693848, 0.0018783509731292725, 0.00198519229888916, 0.002092033624649048, 0.0021988749504089355, 0.0023057162761688232, 0.002412557601928711, 0.0025193989276885986, 0.0026262402534484863, 0.002733081579208374, 0.0028399229049682617, 0.0029467642307281494, 0.003053605556488037, 0.003160446882247925, 0.0032672882080078125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 7.0, 50.0, 301.0, 532.0, 103.0, 18.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004028836265206337, -0.0003723732952494174, -0.0003418629930820316, -0.00031135266181081533, -0.0002808423596434295, -0.00025033202837221324, -0.0002198217116529122, -0.00018931139493361115, -0.0001588010782143101, -0.00012829076149500906, -9.778044477570802e-05, -6.727012078044936e-05, -3.6759804061148316e-05, -6.2494800658896565e-06, 2.426083665341139e-05, 5.477115337271243e-05, 8.528147009201348e-05, 0.00011579178681131452, 0.00014630210353061557, 0.00017681243480183184, 0.00020732273696921766, 0.00023783306824043393, 0.00026834337040781975, 0.000298853701679036, 0.0003293640329502523, 0.00035987436422146857, 0.0003903846663888544, 0.00042089499766007066, 0.0004514052998274565, 0.00048191563109867275, 0.000512425962369889, 0.0005429362645372748, 0.0005734465667046607, 0.0006039568688720465, 0.0006344672292470932, 0.000664977531414479, 0.0006954878335818648, 0.0007259981939569116, 0.0007565084961242974, 0.0007870187982916832, 0.000817529100459069, 0.0008480394026264548, 0.0008785497630015016, 0.0009090600651688874, 0.0009395703673362732, 0.0009700807277113199, 0.0010005909716710448, 0.0010311013320460916, 0.0010616116924211383, 0.001092122052796185, 0.00112263229675591, 0.0011531426571309566, 0.0011836530175060034, 0.0012141632614657283, 0.001244673621840775, 0.0012751838658005, 0.0013056942261755466, 0.0013362045865505934, 0.0013667148305103183, 0.001397225190885365, 0.0014277355512604117, 0.0014582457952201366, 0.0014887561555951834, 0.00151926651597023, 0.001549776759929955]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 9.0, 2.0, 6.0, 11.0, 14.0, 14.0, 21.0, 22.0, 31.0, 31.0, 23.0, 42.0, 29.0, 37.0, 38.0, 36.0, 37.0, 40.0, 57.0, 45.0, 40.0, 40.0, 45.0, 43.0, 30.0, 28.0, 40.0, 30.0, 22.0, 26.0, 18.0, 20.0, 21.0, 8.0, 10.0, 8.0, 11.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00011587142944335938, -0.0001124255359172821, -0.00010897964239120483, -0.00010553374886512756, -0.00010208785533905029, -9.864196181297302e-05, -9.519606828689575e-05, -9.175017476081848e-05, -8.830428123474121e-05, -8.485838770866394e-05, -8.141249418258667e-05, -7.79666006565094e-05, -7.452070713043213e-05, -7.107481360435486e-05, -6.762892007827759e-05, -6.418302655220032e-05, -6.073713302612305e-05, -5.7291239500045776e-05, -5.3845345973968506e-05, -5.0399452447891235e-05, -4.6953558921813965e-05, -4.3507665395736694e-05, -4.0061771869659424e-05, -3.661587834358215e-05, -3.316998481750488e-05, -2.9724091291427612e-05, -2.6278197765350342e-05, -2.283230423927307e-05, -1.93864107131958e-05, -1.594051718711853e-05, -1.249462366104126e-05, -9.04873013496399e-06, -5.602836608886719e-06, -2.1569430828094482e-06, 1.2889504432678223e-06, 4.734843969345093e-06, 8.180737495422363e-06, 1.1626631021499634e-05, 1.5072524547576904e-05, 1.8518418073654175e-05, 2.1964311599731445e-05, 2.5410205125808716e-05, 2.8856098651885986e-05, 3.230199217796326e-05, 3.574788570404053e-05, 3.91937792301178e-05, 4.263967275619507e-05, 4.608556628227234e-05, 4.953145980834961e-05, 5.297735333442688e-05, 5.642324686050415e-05, 5.986914038658142e-05, 6.331503391265869e-05, 6.676092743873596e-05, 7.020682096481323e-05, 7.36527144908905e-05, 7.709860801696777e-05, 8.054450154304504e-05, 8.399039506912231e-05, 8.743628859519958e-05, 9.088218212127686e-05, 9.432807564735413e-05, 9.77739691734314e-05, 0.00010121986269950867, 0.00010466575622558594]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 8.0, 16.0, 7.0, 11.0, 14.0, 11.0, 20.0, 20.0, 23.0, 32.0, 21.0, 37.0, 44.0, 47.0, 45.0, 52.0, 40.0, 45.0, 33.0, 46.0, 40.0, 35.0, 51.0, 34.0, 33.0, 26.0, 34.0, 23.0, 23.0, 19.0, 12.0, 9.0, 17.0, 16.0, 11.0, 7.0, 9.0, 7.0, 2.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.4852294921875, -6.282958984375, -6.0806884765625, -5.87841796875, -5.6761474609375, -5.473876953125, -5.2716064453125, -5.0693359375, -4.8670654296875, -4.664794921875, -4.4625244140625, -4.26025390625, -4.0579833984375, -3.855712890625, -3.6534423828125, -3.451171875, -3.2489013671875, -3.046630859375, -2.8443603515625, -2.64208984375, -2.4398193359375, -2.237548828125, -2.0352783203125, -1.8330078125, -1.6307373046875, -1.428466796875, -1.2261962890625, -1.02392578125, -0.8216552734375, -0.619384765625, -0.4171142578125, -0.21484375, -0.0125732421875, 0.189697265625, 0.3919677734375, 0.59423828125, 0.7965087890625, 0.998779296875, 1.2010498046875, 1.4033203125, 1.6055908203125, 1.807861328125, 2.0101318359375, 2.21240234375, 2.4146728515625, 2.616943359375, 2.8192138671875, 3.021484375, 3.2237548828125, 3.426025390625, 3.6282958984375, 3.83056640625, 4.0328369140625, 4.235107421875, 4.4373779296875, 4.6396484375, 4.8419189453125, 5.044189453125, 5.2464599609375, 5.44873046875, 5.6510009765625, 5.853271484375, 6.0555419921875, 6.2578125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 9.0, 12.0, 18.0, 19.0, 27.0, 32.0, 55.0, 81.0, 94.0, 140.0, 180.0, 260.0, 353.0, 519.0, 721.0, 1028.0, 1620.0, 2571.0, 4441.0, 8581.0, 20786.0, 63486.0, 220317.0, 472582.0, 166261.0, 49214.0, 16902.0, 7312.0, 3798.0, 2314.0, 1495.0, 953.0, 678.0, 490.0, 326.0, 232.0, 167.0, 132.0, 105.0, 71.0, 49.0, 40.0, 22.0, 24.0, 9.0, 15.0, 10.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.80078125, -6.59710693359375, -6.3934326171875, -6.18975830078125, -5.986083984375, -5.78240966796875, -5.5787353515625, -5.37506103515625, -5.17138671875, -4.96771240234375, -4.7640380859375, -4.56036376953125, -4.356689453125, -4.15301513671875, -3.9493408203125, -3.74566650390625, -3.5419921875, -3.33831787109375, -3.1346435546875, -2.93096923828125, -2.727294921875, -2.52362060546875, -2.3199462890625, -2.11627197265625, -1.91259765625, -1.70892333984375, -1.5052490234375, -1.30157470703125, -1.097900390625, -0.89422607421875, -0.6905517578125, -0.48687744140625, -0.283203125, -0.07952880859375, 0.1241455078125, 0.32781982421875, 0.531494140625, 0.73516845703125, 0.9388427734375, 1.14251708984375, 1.34619140625, 1.54986572265625, 1.7535400390625, 1.95721435546875, 2.160888671875, 2.36456298828125, 2.5682373046875, 2.77191162109375, 2.9755859375, 3.17926025390625, 3.3829345703125, 3.58660888671875, 3.790283203125, 3.99395751953125, 4.1976318359375, 4.40130615234375, 4.60498046875, 4.80865478515625, 5.0123291015625, 5.21600341796875, 5.419677734375, 5.62335205078125, 5.8270263671875, 6.03070068359375, 6.234375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 4.0, 4.0, 6.0, 9.0, 6.0, 14.0, 11.0, 12.0, 18.0, 28.0, 28.0, 24.0, 21.0, 38.0, 38.0, 44.0, 44.0, 51.0, 75.0, 232.0, 1540.0, 281.0, 75.0, 47.0, 45.0, 48.0, 39.0, 37.0, 32.0, 33.0, 23.0, 16.0, 26.0, 22.0, 19.0, 13.0, 14.0, 4.0, 5.0, 2.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.5, -19.851318359375, -19.20263671875, -18.553955078125, -17.9052734375, -17.256591796875, -16.60791015625, -15.959228515625, -15.310546875, -14.661865234375, -14.01318359375, -13.364501953125, -12.7158203125, -12.067138671875, -11.41845703125, -10.769775390625, -10.12109375, -9.472412109375, -8.82373046875, -8.175048828125, -7.5263671875, -6.877685546875, -6.22900390625, -5.580322265625, -4.931640625, -4.282958984375, -3.63427734375, -2.985595703125, -2.3369140625, -1.688232421875, -1.03955078125, -0.390869140625, 0.2578125, 0.906494140625, 1.55517578125, 2.203857421875, 2.8525390625, 3.501220703125, 4.14990234375, 4.798583984375, 5.447265625, 6.095947265625, 6.74462890625, 7.393310546875, 8.0419921875, 8.690673828125, 9.33935546875, 9.988037109375, 10.63671875, 11.285400390625, 11.93408203125, 12.582763671875, 13.2314453125, 13.880126953125, 14.52880859375, 15.177490234375, 15.826171875, 16.474853515625, 17.12353515625, 17.772216796875, 18.4208984375, 19.069580078125, 19.71826171875, 20.366943359375, 21.015625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 5.0, 10.0, 13.0, 21.0, 27.0, 40.0, 78.0, 116.0, 188.0, 392.0, 1198.0, 60445.0, 3079378.0, 2694.0, 502.0, 234.0, 127.0, 95.0, 56.0, 33.0, 23.0, 14.0, 16.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.1875, -105.197265625, -102.20703125, -99.216796875, -96.2265625, -93.236328125, -90.24609375, -87.255859375, -84.265625, -81.275390625, -78.28515625, -75.294921875, -72.3046875, -69.314453125, -66.32421875, -63.333984375, -60.34375, -57.353515625, -54.36328125, -51.373046875, -48.3828125, -45.392578125, -42.40234375, -39.412109375, -36.421875, -33.431640625, -30.44140625, -27.451171875, -24.4609375, -21.470703125, -18.48046875, -15.490234375, -12.5, -9.509765625, -6.51953125, -3.529296875, -0.5390625, 2.451171875, 5.44140625, 8.431640625, 11.421875, 14.412109375, 17.40234375, 20.392578125, 23.3828125, 26.373046875, 29.36328125, 32.353515625, 35.34375, 38.333984375, 41.32421875, 44.314453125, 47.3046875, 50.294921875, 53.28515625, 56.275390625, 59.265625, 62.255859375, 65.24609375, 68.236328125, 71.2265625, 74.216796875, 77.20703125, 80.197265625, 83.1875]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 20.0, 283.0, 590.0, 109.0, 16.0, 0.0, 1.0, 0.0, 1.0], "bins": [-237.1805419921875, -233.03941345214844, -228.89828491210938, -224.75714111328125, -220.6160125732422, -216.47488403320312, -212.33375549316406, -208.192626953125, -204.05148315429688, -199.9103546142578, -195.76922607421875, -191.62808227539062, -187.48695373535156, -183.3458251953125, -179.20469665527344, -175.06356811523438, -170.9224395751953, -166.78131103515625, -162.6401824951172, -158.49903869628906, -154.35791015625, -150.21678161621094, -146.07565307617188, -141.9345245361328, -137.79339599609375, -133.6522674560547, -129.51113891601562, -125.37000274658203, -121.22886657714844, -117.08773803710938, -112.94660949707031, -108.80548095703125, -104.66434478759766, -100.5232162475586, -96.382080078125, -92.24095153808594, -88.09982299804688, -83.95868682861328, -79.81755828857422, -75.67642211914062, -71.53529357910156, -67.3941650390625, -63.253028869628906, -59.111900329589844, -54.970767974853516, -50.82963562011719, -46.688507080078125, -42.5473747253418, -38.40624237060547, -34.26511001586914, -30.123979568481445, -25.98284912109375, -21.841716766357422, -17.700584411621094, -13.559453964233398, -9.418323516845703, -5.277189254760742, -1.1360578536987305, 3.0050735473632812, 7.146204948425293, 11.287336349487305, 15.428468704223633, 19.569599151611328, 23.710729598999023, 27.85186195373535]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 8.0, 16.0, 10.0, 14.0, 11.0, 14.0, 26.0, 23.0, 12.0, 29.0, 25.0, 38.0, 32.0, 36.0, 27.0, 41.0, 35.0, 39.0, 47.0, 37.0, 42.0, 38.0, 41.0, 55.0, 38.0, 42.0, 26.0, 28.0, 34.0, 13.0, 33.0, 18.0, 15.0, 13.0, 7.0, 10.0, 7.0, 3.0, 4.0, 6.0, 3.0, 1.0, 3.0, 3.0, 2.0, 2.0], "bins": [-61.30418395996094, -59.64155578613281, -57.97892761230469, -56.3162956237793, -54.65366744995117, -52.99103927612305, -51.328407287597656, -49.66577911376953, -48.003150939941406, -46.34052276611328, -44.677894592285156, -43.015262603759766, -41.35263442993164, -39.690006256103516, -38.027374267578125, -36.36474609375, -34.702117919921875, -33.03948974609375, -31.376859664916992, -29.714229583740234, -28.05160140991211, -26.388973236083984, -24.726343154907227, -23.06371307373047, -21.401084899902344, -19.73845672607422, -18.07582664489746, -16.413196563720703, -14.750568389892578, -13.087939262390137, -11.425310134887695, -9.762681007385254, -8.100048065185547, -6.4374189376831055, -4.774789810180664, -3.1121606826782227, -1.4495315551757812, 0.21309757232666016, 1.8757266998291016, 3.538355827331543, 5.200984954833984, 6.863614082336426, 8.526243209838867, 10.188872337341309, 11.85150146484375, 13.514130592346191, 15.176759719848633, 16.83938980102539, 18.502017974853516, 20.16464614868164, 21.8272762298584, 23.489906311035156, 25.15253448486328, 26.815162658691406, 28.477792739868164, 30.140422821044922, 31.803050994873047, 33.46567916870117, 35.12831115722656, 36.79093933105469, 38.45356750488281, 40.11619567871094, 41.77882385253906, 43.44145584106445, 45.10408401489258]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 9.0, 13.0, 10.0, 12.0, 12.0, 12.0, 12.0, 22.0, 27.0, 26.0, 30.0, 40.0, 40.0, 45.0, 42.0, 53.0, 45.0, 39.0, 46.0, 44.0, 45.0, 37.0, 47.0, 35.0, 30.0, 41.0, 35.0, 23.0, 21.0, 19.0, 14.0, 13.0, 13.0, 10.0, 15.0, 7.0, 8.0, 2.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.68359375, -7.45257568359375, -7.2215576171875, -6.99053955078125, -6.759521484375, -6.52850341796875, -6.2974853515625, -6.06646728515625, -5.83544921875, -5.60443115234375, -5.3734130859375, -5.14239501953125, -4.911376953125, -4.68035888671875, -4.4493408203125, -4.21832275390625, -3.9873046875, -3.75628662109375, -3.5252685546875, -3.29425048828125, -3.063232421875, -2.83221435546875, -2.6011962890625, -2.37017822265625, -2.13916015625, -1.90814208984375, -1.6771240234375, -1.44610595703125, -1.215087890625, -0.98406982421875, -0.7530517578125, -0.52203369140625, -0.291015625, -0.05999755859375, 0.1710205078125, 0.40203857421875, 0.633056640625, 0.86407470703125, 1.0950927734375, 1.32611083984375, 1.55712890625, 1.78814697265625, 2.0191650390625, 2.25018310546875, 2.481201171875, 2.71221923828125, 2.9432373046875, 3.17425537109375, 3.4052734375, 3.63629150390625, 3.8673095703125, 4.09832763671875, 4.329345703125, 4.56036376953125, 4.7913818359375, 5.02239990234375, 5.25341796875, 5.48443603515625, 5.7154541015625, 5.94647216796875, 6.177490234375, 6.40850830078125, 6.6395263671875, 6.87054443359375, 7.1015625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 6.0, 8.0, 8.0, 11.0, 15.0, 20.0, 29.0, 36.0, 50.0, 69.0, 92.0, 128.0, 195.0, 284.0, 473.0, 910.0, 1955.0, 4862.0, 14553.0, 100522.0, 1443921.0, 2358644.0, 232494.0, 23075.0, 6581.0, 2550.0, 1141.0, 582.0, 379.0, 198.0, 128.0, 96.0, 72.0, 48.0, 34.0, 25.0, 20.0, 22.0, 18.0, 8.0, 11.0, 6.0, 2.0, 0.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.4375, -15.9561767578125, -15.474853515625, -14.9935302734375, -14.51220703125, -14.0308837890625, -13.549560546875, -13.0682373046875, -12.5869140625, -12.1055908203125, -11.624267578125, -11.1429443359375, -10.66162109375, -10.1802978515625, -9.698974609375, -9.2176513671875, -8.736328125, -8.2550048828125, -7.773681640625, -7.2923583984375, -6.81103515625, -6.3297119140625, -5.848388671875, -5.3670654296875, -4.8857421875, -4.4044189453125, -3.923095703125, -3.4417724609375, -2.96044921875, -2.4791259765625, -1.997802734375, -1.5164794921875, -1.03515625, -0.5538330078125, -0.072509765625, 0.4088134765625, 0.89013671875, 1.3714599609375, 1.852783203125, 2.3341064453125, 2.8154296875, 3.2967529296875, 3.778076171875, 4.2593994140625, 4.74072265625, 5.2220458984375, 5.703369140625, 6.1846923828125, 6.666015625, 7.1473388671875, 7.628662109375, 8.1099853515625, 8.59130859375, 9.0726318359375, 9.553955078125, 10.0352783203125, 10.5166015625, 10.9979248046875, 11.479248046875, 11.9605712890625, 12.44189453125, 12.9232177734375, 13.404541015625, 13.8858642578125, 14.3671875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 9.0, 11.0, 13.0, 15.0, 24.0, 24.0, 37.0, 44.0, 71.0, 67.0, 108.0, 171.0, 220.0, 334.0, 478.0, 557.0, 551.0, 441.0, 252.0, 162.0, 114.0, 93.0, 62.0, 57.0, 33.0, 21.0, 17.0, 12.0, 10.0, 10.0, 11.0, 4.0, 2.0, 8.0, 2.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.109375, -11.7142333984375, -11.319091796875, -10.9239501953125, -10.52880859375, -10.1336669921875, -9.738525390625, -9.3433837890625, -8.9482421875, -8.5531005859375, -8.157958984375, -7.7628173828125, -7.36767578125, -6.9725341796875, -6.577392578125, -6.1822509765625, -5.787109375, -5.3919677734375, -4.996826171875, -4.6016845703125, -4.20654296875, -3.8114013671875, -3.416259765625, -3.0211181640625, -2.6259765625, -2.2308349609375, -1.835693359375, -1.4405517578125, -1.04541015625, -0.6502685546875, -0.255126953125, 0.1400146484375, 0.53515625, 0.9302978515625, 1.325439453125, 1.7205810546875, 2.11572265625, 2.5108642578125, 2.906005859375, 3.3011474609375, 3.6962890625, 4.0914306640625, 4.486572265625, 4.8817138671875, 5.27685546875, 5.6719970703125, 6.067138671875, 6.4622802734375, 6.857421875, 7.2525634765625, 7.647705078125, 8.0428466796875, 8.43798828125, 8.8331298828125, 9.228271484375, 9.6234130859375, 10.0185546875, 10.4136962890625, 10.808837890625, 11.2039794921875, 11.59912109375, 11.9942626953125, 12.389404296875, 12.7845458984375, 13.1796875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 4.0, 3.0, 5.0, 6.0, 6.0, 13.0, 11.0, 13.0, 20.0, 22.0, 31.0, 64.0, 69.0, 93.0, 144.0, 259.0, 687.0, 4842.0, 183604.0, 3968652.0, 32396.0, 2142.0, 462.0, 236.0, 124.0, 90.0, 69.0, 53.0, 33.0, 27.0, 24.0, 13.0, 15.0, 9.0, 10.0, 9.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-59.28125, -57.44677734375, -55.6123046875, -53.77783203125, -51.943359375, -50.10888671875, -48.2744140625, -46.43994140625, -44.60546875, -42.77099609375, -40.9365234375, -39.10205078125, -37.267578125, -35.43310546875, -33.5986328125, -31.76416015625, -29.9296875, -28.09521484375, -26.2607421875, -24.42626953125, -22.591796875, -20.75732421875, -18.9228515625, -17.08837890625, -15.25390625, -13.41943359375, -11.5849609375, -9.75048828125, -7.916015625, -6.08154296875, -4.2470703125, -2.41259765625, -0.578125, 1.25634765625, 3.0908203125, 4.92529296875, 6.759765625, 8.59423828125, 10.4287109375, 12.26318359375, 14.09765625, 15.93212890625, 17.7666015625, 19.60107421875, 21.435546875, 23.27001953125, 25.1044921875, 26.93896484375, 28.7734375, 30.60791015625, 32.4423828125, 34.27685546875, 36.111328125, 37.94580078125, 39.7802734375, 41.61474609375, 43.44921875, 45.28369140625, 47.1181640625, 48.95263671875, 50.787109375, 52.62158203125, 54.4560546875, 56.29052734375, 58.125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 18.0, 47.0, 236.0, 465.0, 191.0, 48.0, 9.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-340.7276306152344, -334.5817565917969, -328.43585205078125, -322.28997802734375, -316.1440734863281, -309.9981994628906, -303.8523254394531, -297.7064208984375, -291.560546875, -285.4146728515625, -279.2687683105469, -273.1228942871094, -266.97698974609375, -260.83111572265625, -254.6852264404297, -248.53933715820312, -242.39346313476562, -236.24757385253906, -230.1016845703125, -223.955810546875, -217.80992126464844, -211.66403198242188, -205.5181427001953, -199.37225341796875, -193.2263641357422, -187.08047485351562, -180.93458557128906, -174.78871154785156, -168.642822265625, -162.49693298339844, -156.35104370117188, -150.20516967773438, -144.05926513671875, -137.9133758544922, -131.76748657226562, -125.6216049194336, -119.47572326660156, -113.329833984375, -107.18394470214844, -101.0380630493164, -94.89218139648438, -88.74629211425781, -82.60041046142578, -76.45452117919922, -70.30863952636719, -64.16275024414062, -58.01686477661133, -51.87097930908203, -45.725093841552734, -39.57920837402344, -33.43332290649414, -27.28743553161621, -21.141550064086914, -14.995664596557617, -8.849777221679688, -2.7038917541503906, 3.4419937133789062, 9.587879180908203, 15.733765602111816, 21.87965202331543, 28.025537490844727, 34.171424865722656, 40.31731033325195, 46.46319580078125, 52.60908126831055]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 4.0, 3.0, 7.0, 8.0, 8.0, 11.0, 15.0, 20.0, 25.0, 23.0, 25.0, 24.0, 27.0, 39.0, 33.0, 37.0, 49.0, 33.0, 45.0, 41.0, 45.0, 55.0, 43.0, 43.0, 46.0, 34.0, 32.0, 40.0, 25.0, 32.0, 20.0, 20.0, 11.0, 20.0, 14.0, 9.0, 7.0, 5.0, 10.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.86748123168945, -48.42293930053711, -46.9783935546875, -45.533851623535156, -44.08930969238281, -42.64476776123047, -41.20022201538086, -39.755680084228516, -38.311134338378906, -36.86659240722656, -35.42204666137695, -33.97750473022461, -32.532962799072266, -31.08841896057129, -29.643875122070312, -28.19933319091797, -26.754791259765625, -25.31024742126465, -23.865705490112305, -22.421161651611328, -20.976619720458984, -19.532075881958008, -18.08753204345703, -16.642990112304688, -15.198446273803711, -13.75390338897705, -12.30936050415039, -10.864816665649414, -9.420273780822754, -7.975730895996094, -6.531187057495117, -5.086644172668457, -3.6421051025390625, -2.1975619792938232, -0.753018856048584, 0.6915245056152344, 2.1360673904418945, 3.5806102752685547, 5.025154113769531, 6.469696998596191, 7.914239883422852, 9.358782768249512, 10.803325653076172, 12.247869491577148, 13.692412376403809, 15.136955261230469, 16.581499099731445, 18.026042938232422, 19.470584869384766, 20.915128707885742, 22.359670639038086, 23.804214477539062, 25.248756408691406, 26.693300247192383, 28.13784408569336, 29.582386016845703, 31.02692985534668, 32.471473693847656, 33.916015625, 35.360557556152344, 36.80510330200195, 38.2496452331543, 39.694190979003906, 41.13873291015625, 42.583274841308594]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 4.0, 4.0, 2.0, 8.0, 5.0, 11.0, 9.0, 13.0, 14.0, 24.0, 20.0, 28.0, 26.0, 28.0, 28.0, 49.0, 46.0, 41.0, 39.0, 59.0, 47.0, 46.0, 45.0, 40.0, 45.0, 33.0, 41.0, 38.0, 29.0, 32.0, 26.0, 21.0, 19.0, 20.0, 15.0, 8.0, 20.0, 9.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.2308349609375, -7.012451171875, -6.7940673828125, -6.57568359375, -6.3572998046875, -6.138916015625, -5.9205322265625, -5.7021484375, -5.4837646484375, -5.265380859375, -5.0469970703125, -4.82861328125, -4.6102294921875, -4.391845703125, -4.1734619140625, -3.955078125, -3.7366943359375, -3.518310546875, -3.2999267578125, -3.08154296875, -2.8631591796875, -2.644775390625, -2.4263916015625, -2.2080078125, -1.9896240234375, -1.771240234375, -1.5528564453125, -1.33447265625, -1.1160888671875, -0.897705078125, -0.6793212890625, -0.4609375, -0.2425537109375, -0.024169921875, 0.1942138671875, 0.41259765625, 0.6309814453125, 0.849365234375, 1.0677490234375, 1.2861328125, 1.5045166015625, 1.722900390625, 1.9412841796875, 2.15966796875, 2.3780517578125, 2.596435546875, 2.8148193359375, 3.033203125, 3.2515869140625, 3.469970703125, 3.6883544921875, 3.90673828125, 4.1251220703125, 4.343505859375, 4.5618896484375, 4.7802734375, 4.9986572265625, 5.217041015625, 5.4354248046875, 5.65380859375, 5.8721923828125, 6.090576171875, 6.3089599609375, 6.52734375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 17.0, 26.0, 26.0, 60.0, 78.0, 110.0, 168.0, 230.0, 302.0, 492.0, 727.0, 1129.0, 1649.0, 2479.0, 3806.0, 5837.0, 9091.0, 14947.0, 25042.0, 44702.0, 85542.0, 173083.0, 307265.0, 174944.0, 85521.0, 44635.0, 25243.0, 14911.0, 9268.0, 5838.0, 3811.0, 2568.0, 1632.0, 1080.0, 793.0, 472.0, 326.0, 233.0, 153.0, 103.0, 81.0, 46.0, 22.0, 26.0, 15.0, 7.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.322509765625, -0.3125877380371094, -0.30266571044921875, -0.2927436828613281, -0.2828216552734375, -0.2728996276855469, -0.26297760009765625, -0.2530555725097656, -0.243133544921875, -0.23321151733398438, -0.22328948974609375, -0.21336746215820312, -0.2034454345703125, -0.19352340698242188, -0.18360137939453125, -0.17367935180664062, -0.16375732421875, -0.15383529663085938, -0.14391326904296875, -0.13399124145507812, -0.1240692138671875, -0.11414718627929688, -0.10422515869140625, -0.09430313110351562, -0.084381103515625, -0.07445907592773438, -0.06453704833984375, -0.054615020751953125, -0.0446929931640625, -0.034770965576171875, -0.02484893798828125, -0.014926910400390625, -0.0050048828125, 0.004917144775390625, 0.01483917236328125, 0.024761199951171875, 0.0346832275390625, 0.044605255126953125, 0.05452728271484375, 0.06444931030273438, 0.074371337890625, 0.08429336547851562, 0.09421539306640625, 0.10413742065429688, 0.1140594482421875, 0.12398147583007812, 0.13390350341796875, 0.14382553100585938, 0.15374755859375, 0.16366958618164062, 0.17359161376953125, 0.18351364135742188, 0.1934356689453125, 0.20335769653320312, 0.21327972412109375, 0.22320175170898438, 0.233123779296875, 0.24304580688476562, 0.25296783447265625, 0.2628898620605469, 0.2728118896484375, 0.2827339172363281, 0.29265594482421875, 0.3025779724121094, 0.3125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 1.0, 1.0, 9.0, 12.0, 12.0, 20.0, 13.0, 10.0, 17.0, 22.0, 25.0, 29.0, 25.0, 26.0, 34.0, 32.0, 55.0, 38.0, 38.0, 41.0, 1061.0, 30.0, 52.0, 40.0, 36.0, 45.0, 44.0, 32.0, 33.0, 32.0, 27.0, 26.0, 20.0, 19.0, 15.0, 9.0, 7.0, 16.0, 5.0, 6.0, 8.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.1292724609375, -3.996826171875, -3.8643798828125, -3.73193359375, -3.5994873046875, -3.467041015625, -3.3345947265625, -3.2021484375, -3.0697021484375, -2.937255859375, -2.8048095703125, -2.67236328125, -2.5399169921875, -2.407470703125, -2.2750244140625, -2.142578125, -2.0101318359375, -1.877685546875, -1.7452392578125, -1.61279296875, -1.4803466796875, -1.347900390625, -1.2154541015625, -1.0830078125, -0.9505615234375, -0.818115234375, -0.6856689453125, -0.55322265625, -0.4207763671875, -0.288330078125, -0.1558837890625, -0.0234375, 0.1090087890625, 0.241455078125, 0.3739013671875, 0.50634765625, 0.6387939453125, 0.771240234375, 0.9036865234375, 1.0361328125, 1.1685791015625, 1.301025390625, 1.4334716796875, 1.56591796875, 1.6983642578125, 1.830810546875, 1.9632568359375, 2.095703125, 2.2281494140625, 2.360595703125, 2.4930419921875, 2.62548828125, 2.7579345703125, 2.890380859375, 3.0228271484375, 3.1552734375, 3.2877197265625, 3.420166015625, 3.5526123046875, 3.68505859375, 3.8175048828125, 3.949951171875, 4.0823974609375, 4.21484375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 7.0, 3.0, 9.0, 10.0, 15.0, 31.0, 46.0, 49.0, 101.0, 110.0, 154.0, 202.0, 305.0, 397.0, 599.0, 832.0, 1152.0, 1615.0, 2255.0, 3186.0, 4572.0, 6679.0, 9756.0, 14368.0, 22057.0, 34122.0, 53373.0, 86476.0, 142469.0, 1267709.0, 166447.0, 100575.0, 60982.0, 38603.0, 25166.0, 16594.0, 10874.0, 7511.0, 5220.0, 3568.0, 2533.0, 1855.0, 1308.0, 938.0, 675.0, 472.0, 361.0, 227.0, 150.0, 132.0, 77.0, 72.0, 50.0, 39.0, 20.0, 16.0, 9.0, 4.0, 7.0, 3.0, 3.0], "bins": [-0.174072265625, -0.16874122619628906, -0.16341018676757812, -0.1580791473388672, -0.15274810791015625, -0.1474170684814453, -0.14208602905273438, -0.13675498962402344, -0.1314239501953125, -0.12609291076660156, -0.12076187133789062, -0.11543083190917969, -0.11009979248046875, -0.10476875305175781, -0.09943771362304688, -0.09410667419433594, -0.088775634765625, -0.08344459533691406, -0.07811355590820312, -0.07278251647949219, -0.06745147705078125, -0.06212043762207031, -0.056789398193359375, -0.05145835876464844, -0.0461273193359375, -0.04079627990722656, -0.035465240478515625, -0.030134201049804688, -0.02480316162109375, -0.019472122192382812, -0.014141082763671875, -0.008810043334960938, -0.00347900390625, 0.0018520355224609375, 0.007183074951171875, 0.012514114379882812, 0.01784515380859375, 0.023176193237304688, 0.028507232666015625, 0.03383827209472656, 0.0391693115234375, 0.04450035095214844, 0.049831390380859375, 0.05516242980957031, 0.06049346923828125, 0.06582450866699219, 0.07115554809570312, 0.07648658752441406, 0.081817626953125, 0.08714866638183594, 0.09247970581054688, 0.09781074523925781, 0.10314178466796875, 0.10847282409667969, 0.11380386352539062, 0.11913490295410156, 0.1244659423828125, 0.12979698181152344, 0.13512802124023438, 0.1404590606689453, 0.14579010009765625, 0.1511211395263672, 0.15645217895507812, 0.16178321838378906, 0.1671142578125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 10.0, 11.0, 9.0, 16.0, 14.0, 15.0, 11.0, 15.0, 31.0, 25.0, 46.0, 55.0, 52.0, 67.0, 67.0, 66.0, 84.0, 63.0, 59.0, 62.0, 31.0, 20.0, 24.0, 19.0, 13.0, 13.0, 15.0, 8.0, 7.0, 14.0, 9.0, 5.0, 10.0, 3.0, 4.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0003161430358886719, -0.00030638277530670166, -0.00029662251472473145, -0.00028686225414276123, -0.000277101993560791, -0.0002673417329788208, -0.0002575814723968506, -0.00024782121181488037, -0.00023806095123291016, -0.00022830069065093994, -0.00021854043006896973, -0.0002087801694869995, -0.0001990199089050293, -0.00018925964832305908, -0.00017949938774108887, -0.00016973912715911865, -0.00015997886657714844, -0.00015021860599517822, -0.000140458345413208, -0.0001306980848312378, -0.00012093782424926758, -0.00011117756366729736, -0.00010141730308532715, -9.165704250335693e-05, -8.189678192138672e-05, -7.21365213394165e-05, -6.237626075744629e-05, -5.2616000175476074e-05, -4.285573959350586e-05, -3.3095479011535645e-05, -2.333521842956543e-05, -1.3574957847595215e-05, -3.814697265625e-06, 5.945563316345215e-06, 1.570582389831543e-05, 2.5466084480285645e-05, 3.522634506225586e-05, 4.4986605644226074e-05, 5.474686622619629e-05, 6.45071268081665e-05, 7.426738739013672e-05, 8.402764797210693e-05, 9.378790855407715e-05, 0.00010354816913604736, 0.00011330842971801758, 0.0001230686902999878, 0.000132828950881958, 0.00014258921146392822, 0.00015234947204589844, 0.00016210973262786865, 0.00017186999320983887, 0.00018163025379180908, 0.0001913905143737793, 0.0002011507749557495, 0.00021091103553771973, 0.00022067129611968994, 0.00023043155670166016, 0.00024019181728363037, 0.0002499520778656006, 0.0002597123384475708, 0.000269472599029541, 0.00027923285961151123, 0.00028899312019348145, 0.00029875338077545166, 0.0003085136413574219]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 7.0, 8.0, 9.0, 11.0, 15.0, 17.0, 16.0, 19.0, 38.0, 33.0, 46.0, 57.0, 85.0, 111.0, 193.0, 484.0, 3201.0, 213018.0, 824054.0, 5769.0, 604.0, 226.0, 137.0, 70.0, 78.0, 56.0, 36.0, 33.0, 20.0, 25.0, 14.0, 17.0, 5.0, 8.0, 6.0, 8.0, 9.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00635528564453125, -0.006157279014587402, -0.005959272384643555, -0.005761265754699707, -0.005563259124755859, -0.005365252494812012, -0.005167245864868164, -0.004969239234924316, -0.004771232604980469, -0.004573225975036621, -0.0043752193450927734, -0.004177212715148926, -0.003979206085205078, -0.0037811994552612305, -0.003583192825317383, -0.003385186195373535, -0.0031871795654296875, -0.00298917293548584, -0.002791166305541992, -0.0025931596755981445, -0.002395153045654297, -0.0021971464157104492, -0.0019991397857666016, -0.001801133155822754, -0.0016031265258789062, -0.0014051198959350586, -0.001207113265991211, -0.0010091066360473633, -0.0008111000061035156, -0.000613093376159668, -0.0004150867462158203, -0.00021708011627197266, -1.9073486328125e-05, 0.00017893314361572266, 0.0003769397735595703, 0.000574946403503418, 0.0007729530334472656, 0.0009709596633911133, 0.001168966293334961, 0.0013669729232788086, 0.0015649795532226562, 0.001762986183166504, 0.0019609928131103516, 0.0021589994430541992, 0.002357006072998047, 0.0025550127029418945, 0.002753019332885742, 0.00295102596282959, 0.0031490325927734375, 0.003347039222717285, 0.003545045852661133, 0.0037430524826049805, 0.003941059112548828, 0.004139065742492676, 0.0043370723724365234, 0.004535079002380371, 0.004733085632324219, 0.004931092262268066, 0.005129098892211914, 0.005327105522155762, 0.005525112152099609, 0.005723118782043457, 0.005921125411987305, 0.006119132041931152, 0.006317138671875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 14.0, 963.0, 39.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00035580756957642734, -0.00021655917225871235, -7.731077494099736e-05, 6.193763692863286e-05, 0.00020118601969443262, 0.0003404344024602324, 0.00047968284343369305, 0.0006189312553033233, 0.0007581795798614621, 0.0008974279626272619, 0.0010366763453930616, 0.0011759247863665223, 0.001315173227339983, 0.0014544215518981218, 0.0015936699928715825, 0.0017329184338450432, 0.001872166758403182, 0.002011415082961321, 0.0021506636403501034, 0.0022899119649082422, 0.002429160289466381, 0.0025684088468551636, 0.0027076571714133024, 0.0028469054959714413, 0.0029861540533602238, 0.0031254023779183626, 0.003264650935307145, 0.003403899259865284, 0.003543147584423423, 0.0036823959089815617, 0.003821644466370344, 0.003960893023759127, 0.004100141581147909, 0.004239390138536692, 0.004378638230264187, 0.004517886787652969, 0.004657135345041752, 0.004796383436769247, 0.0049356319941580296, 0.005074880551546812, 0.005214128643274307, 0.00535337720066309, 0.005492625292390585, 0.0056318738497793674, 0.00577112240716815, 0.005910370498895645, 0.006049619056284428, 0.00618886761367321, 0.006328116171061993, 0.006467364728450775, 0.00660661282017827, 0.006745861377567053, 0.006885109934955835, 0.0070243580266833305, 0.007163606584072113, 0.0073028551414608955, 0.007442103233188391, 0.007581351790577173, 0.007720599882304668, 0.007859848439693451, 0.007999096997082233, 0.008138345554471016, 0.008277593180537224, 0.008416841737926006, 0.008556090295314789]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 9.0, 1.0, 9.0, 11.0, 25.0, 16.0, 34.0, 45.0, 56.0, 59.0, 69.0, 51.0, 65.0, 61.0, 69.0, 69.0, 68.0, 67.0, 50.0, 44.0, 34.0, 27.0, 14.0, 22.0, 9.0, 9.0, 8.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00045931339263916016, -0.00044902414083480835, -0.00043873488903045654, -0.00042844563722610474, -0.00041815638542175293, -0.0004078671336174011, -0.0003975778818130493, -0.0003872886300086975, -0.0003769993782043457, -0.0003667101263999939, -0.0003564208745956421, -0.0003461316227912903, -0.0003358423709869385, -0.00032555311918258667, -0.00031526386737823486, -0.00030497461557388306, -0.00029468536376953125, -0.00028439611196517944, -0.00027410686016082764, -0.00026381760835647583, -0.000253528356552124, -0.00024323910474777222, -0.0002329498529434204, -0.0002226606011390686, -0.0002123713493347168, -0.000202082097530365, -0.00019179284572601318, -0.00018150359392166138, -0.00017121434211730957, -0.00016092509031295776, -0.00015063583850860596, -0.00014034658670425415, -0.00013005733489990234, -0.00011976808309555054, -0.00010947883129119873, -9.918957948684692e-05, -8.890032768249512e-05, -7.861107587814331e-05, -6.83218240737915e-05, -5.80325722694397e-05, -4.774332046508789e-05, -3.7454068660736084e-05, -2.7164816856384277e-05, -1.687556505203247e-05, -6.586313247680664e-06, 3.7029385566711426e-06, 1.399219036102295e-05, 2.4281442165374756e-05, 3.457069396972656e-05, 4.485994577407837e-05, 5.5149197578430176e-05, 6.543844938278198e-05, 7.572770118713379e-05, 8.60169529914856e-05, 9.63062047958374e-05, 0.00010659545660018921, 0.00011688470840454102, 0.00012717396020889282, 0.00013746321201324463, 0.00014775246381759644, 0.00015804171562194824, 0.00016833096742630005, 0.00017862021923065186, 0.00018890947103500366, 0.00019919872283935547]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 1.0, 4.0, 4.0, 2.0, 8.0, 5.0, 11.0, 9.0, 13.0, 14.0, 24.0, 20.0, 28.0, 26.0, 28.0, 28.0, 49.0, 46.0, 41.0, 39.0, 59.0, 47.0, 46.0, 45.0, 40.0, 45.0, 33.0, 40.0, 39.0, 29.0, 32.0, 26.0, 21.0, 19.0, 20.0, 15.0, 8.0, 20.0, 9.0, 4.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.2308349609375, -7.012451171875, -6.7940673828125, -6.57568359375, -6.3572998046875, -6.138916015625, -5.9205322265625, -5.7021484375, -5.4837646484375, -5.265380859375, -5.0469970703125, -4.82861328125, -4.6102294921875, -4.391845703125, -4.1734619140625, -3.955078125, -3.7366943359375, -3.518310546875, -3.2999267578125, -3.08154296875, -2.8631591796875, -2.644775390625, -2.4263916015625, -2.2080078125, -1.9896240234375, -1.771240234375, -1.5528564453125, -1.33447265625, -1.1160888671875, -0.897705078125, -0.6793212890625, -0.4609375, -0.2425537109375, -0.024169921875, 0.1942138671875, 0.41259765625, 0.6309814453125, 0.849365234375, 1.0677490234375, 1.2861328125, 1.5045166015625, 1.722900390625, 1.9412841796875, 2.15966796875, 2.3780517578125, 2.596435546875, 2.8148193359375, 3.033203125, 3.2515869140625, 3.469970703125, 3.6883544921875, 3.90673828125, 4.1251220703125, 4.343505859375, 4.5618896484375, 4.7802734375, 4.9986572265625, 5.217041015625, 5.4354248046875, 5.65380859375, 5.8721923828125, 6.090576171875, 6.3089599609375, 6.52734375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 5.0, 7.0, 10.0, 13.0, 20.0, 32.0, 38.0, 60.0, 65.0, 138.0, 178.0, 280.0, 452.0, 712.0, 1145.0, 1970.0, 3531.0, 6509.0, 13157.0, 29261.0, 74564.0, 241758.0, 440463.0, 143041.0, 49195.0, 20531.0, 9720.0, 4927.0, 2680.0, 1517.0, 937.0, 531.0, 373.0, 230.0, 158.0, 119.0, 68.0, 47.0, 44.0, 21.0, 19.0, 10.0, 10.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.3515625, -6.15484619140625, -5.9581298828125, -5.76141357421875, -5.564697265625, -5.36798095703125, -5.1712646484375, -4.97454833984375, -4.77783203125, -4.58111572265625, -4.3843994140625, -4.18768310546875, -3.990966796875, -3.79425048828125, -3.5975341796875, -3.40081787109375, -3.2041015625, -3.00738525390625, -2.8106689453125, -2.61395263671875, -2.417236328125, -2.22052001953125, -2.0238037109375, -1.82708740234375, -1.63037109375, -1.43365478515625, -1.2369384765625, -1.04022216796875, -0.843505859375, -0.64678955078125, -0.4500732421875, -0.25335693359375, -0.056640625, 0.14007568359375, 0.3367919921875, 0.53350830078125, 0.730224609375, 0.92694091796875, 1.1236572265625, 1.32037353515625, 1.51708984375, 1.71380615234375, 1.9105224609375, 2.10723876953125, 2.303955078125, 2.50067138671875, 2.6973876953125, 2.89410400390625, 3.0908203125, 3.28753662109375, 3.4842529296875, 3.68096923828125, 3.877685546875, 4.07440185546875, 4.2711181640625, 4.46783447265625, 4.66455078125, 4.86126708984375, 5.0579833984375, 5.25469970703125, 5.451416015625, 5.64813232421875, 5.8448486328125, 6.04156494140625, 6.23828125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 4.0, 1.0, 4.0, 6.0, 8.0, 8.0, 9.0, 11.0, 13.0, 23.0, 20.0, 20.0, 30.0, 26.0, 28.0, 43.0, 45.0, 45.0, 55.0, 82.0, 210.0, 1576.0, 252.0, 97.0, 58.0, 42.0, 42.0, 39.0, 40.0, 39.0, 31.0, 28.0, 23.0, 21.0, 17.0, 12.0, 5.0, 1.0, 9.0, 9.0, 7.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.125, -18.454833984375, -17.78466796875, -17.114501953125, -16.4443359375, -15.774169921875, -15.10400390625, -14.433837890625, -13.763671875, -13.093505859375, -12.42333984375, -11.753173828125, -11.0830078125, -10.412841796875, -9.74267578125, -9.072509765625, -8.40234375, -7.732177734375, -7.06201171875, -6.391845703125, -5.7216796875, -5.051513671875, -4.38134765625, -3.711181640625, -3.041015625, -2.370849609375, -1.70068359375, -1.030517578125, -0.3603515625, 0.309814453125, 0.97998046875, 1.650146484375, 2.3203125, 2.990478515625, 3.66064453125, 4.330810546875, 5.0009765625, 5.671142578125, 6.34130859375, 7.011474609375, 7.681640625, 8.351806640625, 9.02197265625, 9.692138671875, 10.3623046875, 11.032470703125, 11.70263671875, 12.372802734375, 13.04296875, 13.713134765625, 14.38330078125, 15.053466796875, 15.7236328125, 16.393798828125, 17.06396484375, 17.734130859375, 18.404296875, 19.074462890625, 19.74462890625, 20.414794921875, 21.0849609375, 21.755126953125, 22.42529296875, 23.095458984375, 23.765625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 1.0, 2.0, 5.0, 12.0, 8.0, 10.0, 11.0, 17.0, 21.0, 30.0, 52.0, 49.0, 75.0, 86.0, 104.0, 180.0, 207.0, 335.0, 687.0, 3803.0, 718440.0, 2413963.0, 5637.0, 801.0, 304.0, 213.0, 166.0, 123.0, 64.0, 67.0, 48.0, 39.0, 37.0, 26.0, 17.0, 9.0, 14.0, 8.0, 8.0, 4.0, 4.0, 4.0, 10.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-54.5625, -53.00634765625, -51.4501953125, -49.89404296875, -48.337890625, -46.78173828125, -45.2255859375, -43.66943359375, -42.11328125, -40.55712890625, -39.0009765625, -37.44482421875, -35.888671875, -34.33251953125, -32.7763671875, -31.22021484375, -29.6640625, -28.10791015625, -26.5517578125, -24.99560546875, -23.439453125, -21.88330078125, -20.3271484375, -18.77099609375, -17.21484375, -15.65869140625, -14.1025390625, -12.54638671875, -10.990234375, -9.43408203125, -7.8779296875, -6.32177734375, -4.765625, -3.20947265625, -1.6533203125, -0.09716796875, 1.458984375, 3.01513671875, 4.5712890625, 6.12744140625, 7.68359375, 9.23974609375, 10.7958984375, 12.35205078125, 13.908203125, 15.46435546875, 17.0205078125, 18.57666015625, 20.1328125, 21.68896484375, 23.2451171875, 24.80126953125, 26.357421875, 27.91357421875, 29.4697265625, 31.02587890625, 32.58203125, 34.13818359375, 35.6943359375, 37.25048828125, 38.806640625, 40.36279296875, 41.9189453125, 43.47509765625, 45.03125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 117.0, 520.0, 324.0, 45.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.345001220703125, -42.9844856262207, -39.62397384643555, -36.263458251953125, -32.90294647216797, -29.542430877685547, -26.181915283203125, -22.821401596069336, -19.460887908935547, -16.100374221801758, -12.739859580993652, -9.379344940185547, -6.018831253051758, -2.6583175659179688, 0.7021980285644531, 4.062711715698242, 7.423225402832031, 10.78373908996582, 14.144253730773926, 17.50476837158203, 20.86528205871582, 24.22579574584961, 27.58631134033203, 30.94682502746582, 34.30733871459961, 37.66785430908203, 41.02836608886719, 44.38888168334961, 47.74939727783203, 51.10990905761719, 54.47042465209961, 57.83094024658203, 61.19145202636719, 64.55196380615234, 67.91248321533203, 71.27299499511719, 74.63350677490234, 77.9940185546875, 81.35453796386719, 84.71504974365234, 88.0755615234375, 91.43607330322266, 94.79659271240234, 98.1571044921875, 101.51761627197266, 104.87812805175781, 108.2386474609375, 111.59915924072266, 114.95967864990234, 118.3201904296875, 121.68070983886719, 125.04122161865234, 128.4017333984375, 131.7622528076172, 135.12277221679688, 138.4832763671875, 141.8437957763672, 145.20431518554688, 148.5648193359375, 151.9253387451172, 155.28585815429688, 158.6463623046875, 162.0068817138672, 165.36740112304688, 168.7279052734375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 10.0, 11.0, 6.0, 7.0, 9.0, 19.0, 14.0, 11.0, 20.0, 23.0, 30.0, 29.0, 19.0, 31.0, 29.0, 38.0, 38.0, 45.0, 42.0, 45.0, 48.0, 34.0, 36.0, 38.0, 34.0, 39.0, 37.0, 29.0, 26.0, 35.0, 27.0, 16.0, 11.0, 22.0, 16.0, 11.0, 15.0, 6.0, 6.0, 9.0, 9.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-52.46171569824219, -50.881256103515625, -49.30079650878906, -47.7203369140625, -46.13987731933594, -44.55941390991211, -42.97895431518555, -41.398494720458984, -39.81803512573242, -38.23757553100586, -36.6571159362793, -35.076656341552734, -33.496192932128906, -31.915735244750977, -30.33527374267578, -28.75481414794922, -27.174354553222656, -25.593894958496094, -24.01343536376953, -22.432973861694336, -20.852514266967773, -19.27205467224121, -17.691593170166016, -16.111133575439453, -14.53067398071289, -12.950214385986328, -11.36975383758545, -9.78929328918457, -8.208833694458008, -6.628373622894287, -5.047913551330566, -3.4674530029296875, -1.886993408203125, -0.3065333366394043, 1.2739267349243164, 2.854386806488037, 4.434846878051758, 6.0153069496154785, 7.595767021179199, 9.176227569580078, 10.75668716430664, 12.337146759033203, 13.917607307434082, 15.498067855834961, 17.078527450561523, 18.658987045288086, 20.23944854736328, 21.819908142089844, 23.400367736816406, 24.98082733154297, 26.56128692626953, 28.141748428344727, 29.72220802307129, 31.30266761779785, 32.88312911987305, 34.46358871459961, 36.04404830932617, 37.624507904052734, 39.2049674987793, 40.78542709350586, 42.36589050292969, 43.94635009765625, 45.52680969238281, 47.107269287109375, 48.68772888183594]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 7.0, 0.0, 6.0, 5.0, 7.0, 15.0, 10.0, 12.0, 16.0, 16.0, 22.0, 23.0, 31.0, 22.0, 30.0, 41.0, 43.0, 36.0, 35.0, 50.0, 50.0, 56.0, 41.0, 52.0, 30.0, 23.0, 34.0, 38.0, 36.0, 31.0, 26.0, 33.0, 19.0, 17.0, 14.0, 10.0, 19.0, 9.0, 12.0, 5.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.38671875, -7.17340087890625, -6.9600830078125, -6.74676513671875, -6.533447265625, -6.32012939453125, -6.1068115234375, -5.89349365234375, -5.68017578125, -5.46685791015625, -5.2535400390625, -5.04022216796875, -4.826904296875, -4.61358642578125, -4.4002685546875, -4.18695068359375, -3.9736328125, -3.76031494140625, -3.5469970703125, -3.33367919921875, -3.120361328125, -2.90704345703125, -2.6937255859375, -2.48040771484375, -2.26708984375, -2.05377197265625, -1.8404541015625, -1.62713623046875, -1.413818359375, -1.20050048828125, -0.9871826171875, -0.77386474609375, -0.560546875, -0.34722900390625, -0.1339111328125, 0.07940673828125, 0.292724609375, 0.50604248046875, 0.7193603515625, 0.93267822265625, 1.14599609375, 1.35931396484375, 1.5726318359375, 1.78594970703125, 1.999267578125, 2.21258544921875, 2.4259033203125, 2.63922119140625, 2.8525390625, 3.06585693359375, 3.2791748046875, 3.49249267578125, 3.705810546875, 3.91912841796875, 4.1324462890625, 4.34576416015625, 4.55908203125, 4.77239990234375, 4.9857177734375, 5.19903564453125, 5.412353515625, 5.62567138671875, 5.8389892578125, 6.05230712890625, 6.265625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 5.0, 7.0, 1.0, 10.0, 7.0, 7.0, 12.0, 8.0, 27.0, 27.0, 33.0, 47.0, 59.0, 96.0, 134.0, 254.0, 414.0, 801.0, 1851.0, 4839.0, 19209.0, 287128.0, 3087101.0, 745288.0, 35075.0, 6999.0, 2483.0, 981.0, 530.0, 280.0, 167.0, 121.0, 68.0, 51.0, 29.0, 32.0, 23.0, 16.0, 8.0, 16.0, 9.0, 10.0, 8.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-20.375, -19.786865234375, -19.19873046875, -18.610595703125, -18.0224609375, -17.434326171875, -16.84619140625, -16.258056640625, -15.669921875, -15.081787109375, -14.49365234375, -13.905517578125, -13.3173828125, -12.729248046875, -12.14111328125, -11.552978515625, -10.96484375, -10.376708984375, -9.78857421875, -9.200439453125, -8.6123046875, -8.024169921875, -7.43603515625, -6.847900390625, -6.259765625, -5.671630859375, -5.08349609375, -4.495361328125, -3.9072265625, -3.319091796875, -2.73095703125, -2.142822265625, -1.5546875, -0.966552734375, -0.37841796875, 0.209716796875, 0.7978515625, 1.385986328125, 1.97412109375, 2.562255859375, 3.150390625, 3.738525390625, 4.32666015625, 4.914794921875, 5.5029296875, 6.091064453125, 6.67919921875, 7.267333984375, 7.85546875, 8.443603515625, 9.03173828125, 9.619873046875, 10.2080078125, 10.796142578125, 11.38427734375, 11.972412109375, 12.560546875, 13.148681640625, 13.73681640625, 14.324951171875, 14.9130859375, 15.501220703125, 16.08935546875, 16.677490234375, 17.265625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 7.0, 13.0, 14.0, 25.0, 29.0, 36.0, 50.0, 82.0, 122.0, 191.0, 284.0, 500.0, 677.0, 650.0, 542.0, 328.0, 162.0, 107.0, 71.0, 57.0, 41.0, 19.0, 13.0, 15.0, 7.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.6875, -18.2086181640625, -17.729736328125, -17.2508544921875, -16.77197265625, -16.2930908203125, -15.814208984375, -15.3353271484375, -14.8564453125, -14.3775634765625, -13.898681640625, -13.4197998046875, -12.94091796875, -12.4620361328125, -11.983154296875, -11.5042724609375, -11.025390625, -10.5465087890625, -10.067626953125, -9.5887451171875, -9.10986328125, -8.6309814453125, -8.152099609375, -7.6732177734375, -7.1943359375, -6.7154541015625, -6.236572265625, -5.7576904296875, -5.27880859375, -4.7999267578125, -4.321044921875, -3.8421630859375, -3.36328125, -2.8843994140625, -2.405517578125, -1.9266357421875, -1.44775390625, -0.9688720703125, -0.489990234375, -0.0111083984375, 0.4677734375, 0.9466552734375, 1.425537109375, 1.9044189453125, 2.38330078125, 2.8621826171875, 3.341064453125, 3.8199462890625, 4.298828125, 4.7777099609375, 5.256591796875, 5.7354736328125, 6.21435546875, 6.6932373046875, 7.172119140625, 7.6510009765625, 8.1298828125, 8.6087646484375, 9.087646484375, 9.5665283203125, 10.04541015625, 10.5242919921875, 11.003173828125, 11.4820556640625, 11.9609375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 5.0, 4.0, 3.0, 7.0, 10.0, 14.0, 10.0, 26.0, 21.0, 59.0, 68.0, 130.0, 200.0, 536.0, 3089.0, 315759.0, 3863527.0, 9167.0, 882.0, 299.0, 170.0, 97.0, 64.0, 33.0, 30.0, 32.0, 12.0, 13.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.40625, -55.12646484375, -52.8466796875, -50.56689453125, -48.287109375, -46.00732421875, -43.7275390625, -41.44775390625, -39.16796875, -36.88818359375, -34.6083984375, -32.32861328125, -30.048828125, -27.76904296875, -25.4892578125, -23.20947265625, -20.9296875, -18.64990234375, -16.3701171875, -14.09033203125, -11.810546875, -9.53076171875, -7.2509765625, -4.97119140625, -2.69140625, -0.41162109375, 1.8681640625, 4.14794921875, 6.427734375, 8.70751953125, 10.9873046875, 13.26708984375, 15.546875, 17.82666015625, 20.1064453125, 22.38623046875, 24.666015625, 26.94580078125, 29.2255859375, 31.50537109375, 33.78515625, 36.06494140625, 38.3447265625, 40.62451171875, 42.904296875, 45.18408203125, 47.4638671875, 49.74365234375, 52.0234375, 54.30322265625, 56.5830078125, 58.86279296875, 61.142578125, 63.42236328125, 65.7021484375, 67.98193359375, 70.26171875, 72.54150390625, 74.8212890625, 77.10107421875, 79.380859375, 81.66064453125, 83.9404296875, 86.22021484375, 88.5]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 15.0, 28.0, 80.0, 157.0, 280.0, 275.0, 121.0, 44.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.33062744140625, -188.61984252929688, -184.90904235839844, -181.19825744628906, -177.48745727539062, -173.77667236328125, -170.0658721923828, -166.35508728027344, -162.644287109375, -158.93350219726562, -155.2227020263672, -151.5119171142578, -147.80111694335938, -144.09033203125, -140.37953186035156, -136.6687469482422, -132.9579620361328, -129.24717712402344, -125.536376953125, -121.8255844116211, -118.11479187011719, -114.40400695800781, -110.69320678710938, -106.982421875, -103.27162170410156, -99.56082916259766, -95.85003662109375, -92.13924407958984, -88.42845153808594, -84.71766662597656, -81.00686645507812, -77.29608154296875, -73.58528137207031, -69.8744888305664, -66.1636962890625, -62.452903747558594, -58.74211502075195, -55.03132247924805, -51.32052993774414, -47.6097412109375, -43.898948669433594, -40.18815612792969, -36.47736358642578, -32.766571044921875, -29.055782318115234, -25.344989776611328, -21.634197235107422, -17.92340660095215, -14.212615966796875, -10.501824378967285, -6.791032314300537, -3.080240249633789, 0.6305513381958008, 4.341342926025391, 8.052135467529297, 11.76292610168457, 15.473718643188477, 19.184511184692383, 22.895301818847656, 26.606094360351562, 30.31688690185547, 34.027679443359375, 37.73847198486328, 41.44926071166992, 45.16005325317383]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 5.0, 3.0, 14.0, 7.0, 10.0, 8.0, 14.0, 8.0, 12.0, 25.0, 29.0, 28.0, 19.0, 27.0, 32.0, 34.0, 32.0, 35.0, 46.0, 45.0, 55.0, 49.0, 40.0, 45.0, 52.0, 40.0, 26.0, 40.0, 35.0, 24.0, 19.0, 26.0, 18.0, 16.0, 9.0, 19.0, 15.0, 10.0, 8.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-44.25641632080078, -43.02717590332031, -41.79793930053711, -40.56869888305664, -39.33946228027344, -38.11022186279297, -36.8809814453125, -35.6517448425293, -34.42250442504883, -33.19326400756836, -31.964027404785156, -30.734786987304688, -29.50554847717285, -28.276309967041016, -27.04707145690918, -25.817832946777344, -24.588594436645508, -23.359355926513672, -22.130117416381836, -20.90087890625, -19.67163848876953, -18.442399978637695, -17.21316146850586, -15.983922004699707, -14.754683494567871, -13.525444984436035, -12.296205520629883, -11.066967010498047, -9.837728500366211, -8.608489036560059, -7.379250526428223, -6.15001106262207, -4.920772552490234, -3.6915335655212402, -2.462294816970825, -1.2330560684204102, -0.0038170814514160156, 1.2254219055175781, 2.454660415649414, 3.6838998794555664, 4.913138389587402, 6.1423773765563965, 7.371616363525391, 8.600854873657227, 9.830093383789062, 11.059332847595215, 12.28857135772705, 13.517810821533203, 14.747049331665039, 15.976287841796875, 17.20552635192871, 18.434764862060547, 19.664005279541016, 20.89324378967285, 22.122482299804688, 23.351722717285156, 24.58095932006836, 25.810197830200195, 27.03943634033203, 28.2686767578125, 29.497915267944336, 30.727153778076172, 31.956392288208008, 33.185630798339844, 34.41487121582031]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 4.0, 9.0, 11.0, 11.0, 12.0, 16.0, 18.0, 17.0, 30.0, 22.0, 18.0, 27.0, 43.0, 38.0, 35.0, 39.0, 46.0, 40.0, 46.0, 36.0, 47.0, 44.0, 37.0, 31.0, 45.0, 28.0, 35.0, 28.0, 21.0, 29.0, 18.0, 21.0, 15.0, 13.0, 12.0, 10.0, 14.0, 7.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.546875, -6.34478759765625, -6.1427001953125, -5.94061279296875, -5.738525390625, -5.53643798828125, -5.3343505859375, -5.13226318359375, -4.93017578125, -4.72808837890625, -4.5260009765625, -4.32391357421875, -4.121826171875, -3.91973876953125, -3.7176513671875, -3.51556396484375, -3.3134765625, -3.11138916015625, -2.9093017578125, -2.70721435546875, -2.505126953125, -2.30303955078125, -2.1009521484375, -1.89886474609375, -1.69677734375, -1.49468994140625, -1.2926025390625, -1.09051513671875, -0.888427734375, -0.68634033203125, -0.4842529296875, -0.28216552734375, -0.080078125, 0.12200927734375, 0.3240966796875, 0.52618408203125, 0.728271484375, 0.93035888671875, 1.1324462890625, 1.33453369140625, 1.53662109375, 1.73870849609375, 1.9407958984375, 2.14288330078125, 2.344970703125, 2.54705810546875, 2.7491455078125, 2.95123291015625, 3.1533203125, 3.35540771484375, 3.5574951171875, 3.75958251953125, 3.961669921875, 4.16375732421875, 4.3658447265625, 4.56793212890625, 4.77001953125, 4.97210693359375, 5.1741943359375, 5.37628173828125, 5.578369140625, 5.78045654296875, 5.9825439453125, 6.18463134765625, 6.38671875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 8.0, 7.0, 8.0, 27.0, 27.0, 56.0, 54.0, 78.0, 150.0, 188.0, 264.0, 446.0, 627.0, 978.0, 1390.0, 2111.0, 2992.0, 4606.0, 6934.0, 10357.0, 16059.0, 25309.0, 40384.0, 67371.0, 118673.0, 232063.0, 225701.0, 115107.0, 65868.0, 39655.0, 24694.0, 15749.0, 10135.0, 6759.0, 4370.0, 3048.0, 2099.0, 1388.0, 906.0, 662.0, 388.0, 280.0, 210.0, 118.0, 94.0, 60.0, 38.0, 12.0, 13.0, 23.0, 9.0, 2.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.258544921875, -0.2501983642578125, -0.241851806640625, -0.2335052490234375, -0.22515869140625, -0.2168121337890625, -0.208465576171875, -0.2001190185546875, -0.1917724609375, -0.1834259033203125, -0.175079345703125, -0.1667327880859375, -0.15838623046875, -0.1500396728515625, -0.141693115234375, -0.1333465576171875, -0.125, -0.1166534423828125, -0.108306884765625, -0.0999603271484375, -0.09161376953125, -0.0832672119140625, -0.074920654296875, -0.0665740966796875, -0.0582275390625, -0.0498809814453125, -0.041534423828125, -0.0331878662109375, -0.02484130859375, -0.0164947509765625, -0.008148193359375, 0.0001983642578125, 0.008544921875, 0.0168914794921875, 0.025238037109375, 0.0335845947265625, 0.04193115234375, 0.0502777099609375, 0.058624267578125, 0.0669708251953125, 0.0753173828125, 0.0836639404296875, 0.092010498046875, 0.1003570556640625, 0.10870361328125, 0.1170501708984375, 0.125396728515625, 0.1337432861328125, 0.14208984375, 0.1504364013671875, 0.158782958984375, 0.1671295166015625, 0.17547607421875, 0.1838226318359375, 0.192169189453125, 0.2005157470703125, 0.2088623046875, 0.2172088623046875, 0.225555419921875, 0.2339019775390625, 0.24224853515625, 0.2505950927734375, 0.258941650390625, 0.2672882080078125, 0.275634765625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 13.0, 8.0, 15.0, 8.0, 15.0, 11.0, 9.0, 21.0, 22.0, 27.0, 22.0, 32.0, 37.0, 31.0, 43.0, 38.0, 45.0, 34.0, 38.0, 1070.0, 32.0, 33.0, 45.0, 36.0, 39.0, 42.0, 30.0, 38.0, 30.0, 35.0, 22.0, 14.0, 19.0, 13.0, 11.0, 13.0, 11.0, 5.0, 8.0, 3.0, 4.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.880859375, -3.749542236328125, -3.61822509765625, -3.486907958984375, -3.3555908203125, -3.224273681640625, -3.09295654296875, -2.961639404296875, -2.830322265625, -2.699005126953125, -2.56768798828125, -2.436370849609375, -2.3050537109375, -2.173736572265625, -2.04241943359375, -1.911102294921875, -1.77978515625, -1.648468017578125, -1.51715087890625, -1.385833740234375, -1.2545166015625, -1.123199462890625, -0.99188232421875, -0.860565185546875, -0.729248046875, -0.597930908203125, -0.46661376953125, -0.335296630859375, -0.2039794921875, -0.072662353515625, 0.05865478515625, 0.189971923828125, 0.3212890625, 0.452606201171875, 0.58392333984375, 0.715240478515625, 0.8465576171875, 0.977874755859375, 1.10919189453125, 1.240509033203125, 1.371826171875, 1.503143310546875, 1.63446044921875, 1.765777587890625, 1.8970947265625, 2.028411865234375, 2.15972900390625, 2.291046142578125, 2.42236328125, 2.553680419921875, 2.68499755859375, 2.816314697265625, 2.9476318359375, 3.078948974609375, 3.21026611328125, 3.341583251953125, 3.472900390625, 3.604217529296875, 3.73553466796875, 3.866851806640625, 3.9981689453125, 4.129486083984375, 4.26080322265625, 4.392120361328125, 4.5234375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 5.0, 17.0, 15.0, 31.0, 37.0, 40.0, 74.0, 108.0, 165.0, 227.0, 314.0, 406.0, 619.0, 874.0, 1296.0, 1896.0, 2665.0, 3941.0, 5839.0, 8934.0, 13638.0, 21314.0, 33515.0, 55443.0, 93210.0, 161362.0, 1290687.0, 158965.0, 91432.0, 54719.0, 33577.0, 21188.0, 13518.0, 8781.0, 5663.0, 3953.0, 2632.0, 1795.0, 1238.0, 866.0, 609.0, 450.0, 297.0, 234.0, 164.0, 109.0, 89.0, 54.0, 34.0, 28.0, 23.0, 10.0, 14.0, 5.0, 9.0, 4.0, 2.0, 2.0], "bins": [-0.19091796875, -0.1850414276123047, -0.17916488647460938, -0.17328834533691406, -0.16741180419921875, -0.16153526306152344, -0.15565872192382812, -0.1497821807861328, -0.1439056396484375, -0.1380290985107422, -0.13215255737304688, -0.12627601623535156, -0.12039947509765625, -0.11452293395996094, -0.10864639282226562, -0.10276985168457031, -0.096893310546875, -0.09101676940917969, -0.08514022827148438, -0.07926368713378906, -0.07338714599609375, -0.06751060485839844, -0.061634063720703125, -0.05575752258300781, -0.0498809814453125, -0.04400444030761719, -0.038127899169921875, -0.03225135803222656, -0.02637481689453125, -0.020498275756835938, -0.014621734619140625, -0.008745193481445312, -0.00286865234375, 0.0030078887939453125, 0.008884429931640625, 0.014760971069335938, 0.02063751220703125, 0.026514053344726562, 0.032390594482421875, 0.03826713562011719, 0.0441436767578125, 0.05002021789550781, 0.055896759033203125, 0.06177330017089844, 0.06764984130859375, 0.07352638244628906, 0.07940292358398438, 0.08527946472167969, 0.091156005859375, 0.09703254699707031, 0.10290908813476562, 0.10878562927246094, 0.11466217041015625, 0.12053871154785156, 0.12641525268554688, 0.1322917938232422, 0.1381683349609375, 0.1440448760986328, 0.14992141723632812, 0.15579795837402344, 0.16167449951171875, 0.16755104064941406, 0.17342758178710938, 0.1793041229248047, 0.1851806640625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 6.0, 9.0, 11.0, 10.0, 13.0, 18.0, 25.0, 28.0, 34.0, 37.0, 35.0, 79.0, 108.0, 140.0, 112.0, 83.0, 52.0, 41.0, 30.0, 22.0, 16.0, 17.0, 10.0, 16.0, 6.0, 7.0, 7.0, 4.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003261566162109375, -0.00031606853008270264, -0.0003059804439544678, -0.0002958923578262329, -0.00028580427169799805, -0.0002757161855697632, -0.0002656280994415283, -0.00025554001331329346, -0.0002454519271850586, -0.00023536384105682373, -0.00022527575492858887, -0.000215187668800354, -0.00020509958267211914, -0.00019501149654388428, -0.00018492341041564941, -0.00017483532428741455, -0.0001647472381591797, -0.00015465915203094482, -0.00014457106590270996, -0.0001344829797744751, -0.00012439489364624023, -0.00011430680751800537, -0.00010421872138977051, -9.413063526153564e-05, -8.404254913330078e-05, -7.395446300506592e-05, -6.386637687683105e-05, -5.377829074859619e-05, -4.369020462036133e-05, -3.3602118492126465e-05, -2.35140323638916e-05, -1.3425946235656738e-05, -3.337860107421875e-06, 6.750226020812988e-06, 1.683831214904785e-05, 2.6926398277282715e-05, 3.701448440551758e-05, 4.710257053375244e-05, 5.7190656661987305e-05, 6.727874279022217e-05, 7.736682891845703e-05, 8.74549150466919e-05, 9.754300117492676e-05, 0.00010763108730316162, 0.00011771917343139648, 0.00012780725955963135, 0.0001378953456878662, 0.00014798343181610107, 0.00015807151794433594, 0.0001681596040725708, 0.00017824769020080566, 0.00018833577632904053, 0.0001984238624572754, 0.00020851194858551025, 0.00021860003471374512, 0.00022868812084197998, 0.00023877620697021484, 0.0002488642930984497, 0.00025895237922668457, 0.00026904046535491943, 0.0002791285514831543, 0.00028921663761138916, 0.000299304723739624, 0.0003093928098678589, 0.00031948089599609375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 9.0, 6.0, 14.0, 9.0, 12.0, 20.0, 25.0, 35.0, 35.0, 62.0, 99.0, 131.0, 249.0, 679.0, 16097.0, 1023624.0, 6272.0, 509.0, 195.0, 119.0, 90.0, 67.0, 47.0, 31.0, 24.0, 17.0, 16.0, 9.0, 9.0, 12.0, 7.0, 2.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006137847900390625, -0.0059424638748168945, -0.005747079849243164, -0.005551695823669434, -0.005356311798095703, -0.005160927772521973, -0.004965543746948242, -0.004770159721374512, -0.004574775695800781, -0.004379391670227051, -0.00418400764465332, -0.00398862361907959, -0.0037932395935058594, -0.003597855567932129, -0.0034024715423583984, -0.003207087516784668, -0.0030117034912109375, -0.002816319465637207, -0.0026209354400634766, -0.002425551414489746, -0.0022301673889160156, -0.002034783363342285, -0.0018393993377685547, -0.0016440153121948242, -0.0014486312866210938, -0.0012532472610473633, -0.0010578632354736328, -0.0008624792098999023, -0.0006670951843261719, -0.0004717111587524414, -0.00027632713317871094, -8.094310760498047e-05, 0.00011444091796875, 0.00030982494354248047, 0.0005052089691162109, 0.0007005929946899414, 0.0008959770202636719, 0.0010913610458374023, 0.0012867450714111328, 0.0014821290969848633, 0.0016775131225585938, 0.0018728971481323242, 0.0020682811737060547, 0.002263665199279785, 0.0024590492248535156, 0.002654433250427246, 0.0028498172760009766, 0.003045201301574707, 0.0032405853271484375, 0.003435969352722168, 0.0036313533782958984, 0.003826737403869629, 0.004022121429443359, 0.00421750545501709, 0.00441288948059082, 0.004608273506164551, 0.004803657531738281, 0.004999041557312012, 0.005194425582885742, 0.005389809608459473, 0.005585193634033203, 0.005780577659606934, 0.005975961685180664, 0.0061713457107543945, 0.006366729736328125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 201.0, 762.0, 42.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000331379531417042, -0.00028601803933270276, -0.00024065653269644827, -0.00019529502606019378, -0.00014993353397585452, -0.00010457204189151525, -5.921052070334554e-05, -1.3849028619006276e-05, 3.1512463465332985e-05, 7.687396282562986e-05, 0.00012223546218592674, 0.00016759696882218122, 0.00021295846090652049, 0.00025831995299085975, 0.00030368147417902946, 0.0003490429662633687, 0.000394404458347708, 0.00043976595043204725, 0.0004851274425163865, 0.0005304889637045562, 0.0005758504848927259, 0.0006212119478732347, 0.0006665734690614045, 0.0007119349902495742, 0.000757296453230083, 0.0008026579744182527, 0.0008480194373987615, 0.0008933809585869312, 0.00093874242156744, 0.0009841038845479488, 0.0010294654639437795, 0.0010748269269242883, 0.001120188506320119, 0.0011655499693006277, 0.0012109115486964583, 0.0012562730116769671, 0.001301634474657476, 0.0013469960540533066, 0.0013923575170338154, 0.0014377189800143242, 0.001483080442994833, 0.0015284419059753418, 0.0015738034853711724, 0.0016191649483516812, 0.00166452641133219, 0.0017098879907280207, 0.0017552494537085295, 0.0018006109166890383, 0.001845972496084869, 0.0018913339590653777, 0.0019366955384612083, 0.001982057001441717, 0.002027418464422226, 0.0020727799274027348, 0.0021181413903832436, 0.002163503086194396, 0.002208864549174905, 0.0022542260121554136, 0.0022995874751359224, 0.002344949170947075, 0.0023903106339275837, 0.0024356720969080925, 0.0024810335598886013, 0.00252639502286911, 0.002571756485849619]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 7.0, 3.0, 3.0, 8.0, 5.0, 9.0, 10.0, 13.0, 14.0, 15.0, 24.0, 15.0, 26.0, 24.0, 30.0, 36.0, 32.0, 29.0, 39.0, 45.0, 41.0, 38.0, 37.0, 54.0, 33.0, 50.0, 38.0, 41.0, 47.0, 37.0, 37.0, 28.0, 23.0, 19.0, 11.0, 18.0, 16.0, 18.0, 5.0, 4.0, 11.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00016635656356811523, -0.0001615956425666809, -0.00015683472156524658, -0.00015207380056381226, -0.00014731287956237793, -0.0001425519585609436, -0.00013779103755950928, -0.00013303011655807495, -0.00012826919555664062, -0.0001235082745552063, -0.00011874735355377197, -0.00011398643255233765, -0.00010922551155090332, -0.000104464590549469, -9.970366954803467e-05, -9.494274854660034e-05, -9.018182754516602e-05, -8.542090654373169e-05, -8.065998554229736e-05, -7.589906454086304e-05, -7.113814353942871e-05, -6.637722253799438e-05, -6.161630153656006e-05, -5.685538053512573e-05, -5.2094459533691406e-05, -4.733353853225708e-05, -4.2572617530822754e-05, -3.781169652938843e-05, -3.30507755279541e-05, -2.8289854526519775e-05, -2.352893352508545e-05, -1.8768012523651123e-05, -1.4007091522216797e-05, -9.24617052078247e-06, -4.4852495193481445e-06, 2.7567148208618164e-07, 5.036592483520508e-06, 9.797513484954834e-06, 1.455843448638916e-05, 1.9319355487823486e-05, 2.4080276489257812e-05, 2.884119749069214e-05, 3.3602118492126465e-05, 3.836303949356079e-05, 4.312396049499512e-05, 4.788488149642944e-05, 5.264580249786377e-05, 5.7406723499298096e-05, 6.216764450073242e-05, 6.692856550216675e-05, 7.168948650360107e-05, 7.64504075050354e-05, 8.121132850646973e-05, 8.597224950790405e-05, 9.073317050933838e-05, 9.54940915107727e-05, 0.00010025501251220703, 0.00010501593351364136, 0.00010977685451507568, 0.00011453777551651001, 0.00011929869651794434, 0.00012405961751937866, 0.000128820538520813, 0.00013358145952224731, 0.00013834238052368164]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 6.0, 4.0, 9.0, 11.0, 11.0, 12.0, 16.0, 18.0, 17.0, 30.0, 22.0, 18.0, 27.0, 43.0, 38.0, 35.0, 39.0, 46.0, 40.0, 46.0, 36.0, 47.0, 44.0, 37.0, 31.0, 45.0, 28.0, 35.0, 28.0, 21.0, 29.0, 18.0, 21.0, 15.0, 13.0, 12.0, 10.0, 14.0, 7.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.546875, -6.34478759765625, -6.1427001953125, -5.94061279296875, -5.738525390625, -5.53643798828125, -5.3343505859375, -5.13226318359375, -4.93017578125, -4.72808837890625, -4.5260009765625, -4.32391357421875, -4.121826171875, -3.91973876953125, -3.7176513671875, -3.51556396484375, -3.3134765625, -3.11138916015625, -2.9093017578125, -2.70721435546875, -2.505126953125, -2.30303955078125, -2.1009521484375, -1.89886474609375, -1.69677734375, -1.49468994140625, -1.2926025390625, -1.09051513671875, -0.888427734375, -0.68634033203125, -0.4842529296875, -0.28216552734375, -0.080078125, 0.12200927734375, 0.3240966796875, 0.52618408203125, 0.728271484375, 0.93035888671875, 1.1324462890625, 1.33453369140625, 1.53662109375, 1.73870849609375, 1.9407958984375, 2.14288330078125, 2.344970703125, 2.54705810546875, 2.7491455078125, 2.95123291015625, 3.1533203125, 3.35540771484375, 3.5574951171875, 3.75958251953125, 3.961669921875, 4.16375732421875, 4.3658447265625, 4.56793212890625, 4.77001953125, 4.97210693359375, 5.1741943359375, 5.37628173828125, 5.578369140625, 5.78045654296875, 5.9825439453125, 6.18463134765625, 6.38671875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 5.0, 22.0, 12.0, 31.0, 24.0, 48.0, 63.0, 83.0, 92.0, 162.0, 231.0, 373.0, 507.0, 893.0, 1557.0, 2876.0, 5482.0, 11961.0, 29042.0, 80595.0, 236563.0, 430414.0, 155295.0, 53545.0, 20083.0, 8813.0, 4151.0, 2202.0, 1230.0, 723.0, 456.0, 298.0, 206.0, 150.0, 86.0, 81.0, 45.0, 47.0, 29.0, 17.0, 22.0, 11.0, 8.0, 9.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-6.81640625, -6.60540771484375, -6.3944091796875, -6.18341064453125, -5.972412109375, -5.76141357421875, -5.5504150390625, -5.33941650390625, -5.12841796875, -4.91741943359375, -4.7064208984375, -4.49542236328125, -4.284423828125, -4.07342529296875, -3.8624267578125, -3.65142822265625, -3.4404296875, -3.22943115234375, -3.0184326171875, -2.80743408203125, -2.596435546875, -2.38543701171875, -2.1744384765625, -1.96343994140625, -1.75244140625, -1.54144287109375, -1.3304443359375, -1.11944580078125, -0.908447265625, -0.69744873046875, -0.4864501953125, -0.27545166015625, -0.064453125, 0.14654541015625, 0.3575439453125, 0.56854248046875, 0.779541015625, 0.99053955078125, 1.2015380859375, 1.41253662109375, 1.62353515625, 1.83453369140625, 2.0455322265625, 2.25653076171875, 2.467529296875, 2.67852783203125, 2.8895263671875, 3.10052490234375, 3.3115234375, 3.52252197265625, 3.7335205078125, 3.94451904296875, 4.155517578125, 4.36651611328125, 4.5775146484375, 4.78851318359375, 4.99951171875, 5.21051025390625, 5.4215087890625, 5.63250732421875, 5.843505859375, 6.05450439453125, 6.2655029296875, 6.47650146484375, 6.6875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 6.0, 4.0, 3.0, 3.0, 9.0, 14.0, 4.0, 12.0, 8.0, 20.0, 19.0, 25.0, 24.0, 30.0, 22.0, 28.0, 28.0, 29.0, 37.0, 66.0, 86.0, 179.0, 1512.0, 308.0, 107.0, 69.0, 44.0, 37.0, 37.0, 40.0, 43.0, 22.0, 33.0, 29.0, 23.0, 15.0, 14.0, 9.0, 12.0, 9.0, 15.0, 6.0, 6.0, 3.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.28125, -17.739013671875, -17.19677734375, -16.654541015625, -16.1123046875, -15.570068359375, -15.02783203125, -14.485595703125, -13.943359375, -13.401123046875, -12.85888671875, -12.316650390625, -11.7744140625, -11.232177734375, -10.68994140625, -10.147705078125, -9.60546875, -9.063232421875, -8.52099609375, -7.978759765625, -7.4365234375, -6.894287109375, -6.35205078125, -5.809814453125, -5.267578125, -4.725341796875, -4.18310546875, -3.640869140625, -3.0986328125, -2.556396484375, -2.01416015625, -1.471923828125, -0.9296875, -0.387451171875, 0.15478515625, 0.697021484375, 1.2392578125, 1.781494140625, 2.32373046875, 2.865966796875, 3.408203125, 3.950439453125, 4.49267578125, 5.034912109375, 5.5771484375, 6.119384765625, 6.66162109375, 7.203857421875, 7.74609375, 8.288330078125, 8.83056640625, 9.372802734375, 9.9150390625, 10.457275390625, 10.99951171875, 11.541748046875, 12.083984375, 12.626220703125, 13.16845703125, 13.710693359375, 14.2529296875, 14.795166015625, 15.33740234375, 15.879638671875, 16.421875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 5.0, 5.0, 6.0, 14.0, 12.0, 12.0, 16.0, 25.0, 36.0, 29.0, 48.0, 62.0, 78.0, 105.0, 135.0, 237.0, 432.0, 915.0, 3873.0, 322805.0, 2806583.0, 7814.0, 1111.0, 425.0, 250.0, 175.0, 132.0, 89.0, 73.0, 42.0, 42.0, 28.0, 21.0, 16.0, 13.0, 10.0, 11.0, 8.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.75, -43.26513671875, -41.7802734375, -40.29541015625, -38.810546875, -37.32568359375, -35.8408203125, -34.35595703125, -32.87109375, -31.38623046875, -29.9013671875, -28.41650390625, -26.931640625, -25.44677734375, -23.9619140625, -22.47705078125, -20.9921875, -19.50732421875, -18.0224609375, -16.53759765625, -15.052734375, -13.56787109375, -12.0830078125, -10.59814453125, -9.11328125, -7.62841796875, -6.1435546875, -4.65869140625, -3.173828125, -1.68896484375, -0.2041015625, 1.28076171875, 2.765625, 4.25048828125, 5.7353515625, 7.22021484375, 8.705078125, 10.18994140625, 11.6748046875, 13.15966796875, 14.64453125, 16.12939453125, 17.6142578125, 19.09912109375, 20.583984375, 22.06884765625, 23.5537109375, 25.03857421875, 26.5234375, 28.00830078125, 29.4931640625, 30.97802734375, 32.462890625, 33.94775390625, 35.4326171875, 36.91748046875, 38.40234375, 39.88720703125, 41.3720703125, 42.85693359375, 44.341796875, 45.82666015625, 47.3115234375, 48.79638671875, 50.28125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 111.0, 524.0, 345.0, 33.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-204.02435302734375, -200.29823303222656, -196.57211303710938, -192.84597778320312, -189.11985778808594, -185.39373779296875, -181.66761779785156, -177.94149780273438, -174.21536254882812, -170.48924255371094, -166.76312255859375, -163.0369873046875, -159.3108673095703, -155.58474731445312, -151.85862731933594, -148.13250732421875, -144.40638732910156, -140.68026733398438, -136.9541473388672, -133.22801208496094, -129.50189208984375, -125.77577209472656, -122.04965209960938, -118.32352447509766, -114.59739685058594, -110.87127685546875, -107.14514923095703, -103.41902923583984, -99.69290161132812, -95.96678161621094, -92.24066162109375, -88.51453399658203, -84.78840637207031, -81.06228637695312, -77.3361587524414, -73.61003875732422, -69.8839111328125, -66.15779113769531, -62.43166732788086, -58.705543518066406, -54.97942352294922, -51.253299713134766, -47.52717590332031, -43.801055908203125, -40.07493209838867, -36.34880828857422, -32.622684478759766, -28.896562576293945, -25.170440673828125, -21.444316864013672, -17.71819496154785, -13.992071151733398, -10.265948295593262, -6.539825439453125, -2.813701629638672, 0.9124202728271484, 4.638544082641602, 8.364666938781738, 12.090789794921875, 15.816913604736328, 19.54303741455078, 23.2691593170166, 26.995283126831055, 30.721405029296875, 34.44752883911133]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 6.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 6.0, 12.0, 18.0, 17.0, 21.0, 16.0, 25.0, 23.0, 19.0, 25.0, 32.0, 26.0, 33.0, 44.0, 37.0, 42.0, 44.0, 52.0, 45.0, 40.0, 33.0, 35.0, 21.0, 36.0, 41.0, 45.0, 34.0, 26.0, 29.0, 17.0, 15.0, 16.0, 15.0, 8.0, 10.0, 9.0, 5.0, 3.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.30317687988281, -39.91122055053711, -38.51926803588867, -37.12731170654297, -35.735355377197266, -34.34339904785156, -32.951446533203125, -31.559490203857422, -30.16753578186035, -28.77558135986328, -27.383625030517578, -25.991670608520508, -24.599716186523438, -23.207759857177734, -21.815805435180664, -20.423851013183594, -19.03189468383789, -17.63994026184082, -16.247983932495117, -14.856029510498047, -13.46407413482666, -12.072118759155273, -10.680164337158203, -9.288208961486816, -7.89625358581543, -6.504298210144043, -5.1123433113098145, -3.720388412475586, -2.328433036804199, -0.9364776611328125, 0.4554767608642578, 1.8474321365356445, 3.239391326904297, 4.631346702575684, 6.023301601409912, 7.415256500244141, 8.807211875915527, 10.199167251586914, 11.591121673583984, 12.983077049255371, 14.375032424926758, 15.766987800598145, 17.15894317626953, 18.5508975982666, 19.942852020263672, 21.334808349609375, 22.726762771606445, 24.118717193603516, 25.51067352294922, 26.90262794494629, 28.294584274291992, 29.686538696289062, 31.078495025634766, 32.47045135498047, 33.862403869628906, 35.25436019897461, 36.64631652832031, 38.038272857666016, 39.43022537231445, 40.822181701660156, 42.21413803100586, 43.60609436035156, 44.998046875, 46.3900032043457, 47.78195571899414]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 7.0, 4.0, 9.0, 10.0, 12.0, 15.0, 22.0, 22.0, 22.0, 20.0, 19.0, 23.0, 24.0, 46.0, 34.0, 42.0, 54.0, 46.0, 34.0, 44.0, 42.0, 41.0, 43.0, 30.0, 45.0, 33.0, 26.0, 32.0, 37.0, 28.0, 16.0, 19.0, 16.0, 14.0, 15.0, 8.0, 8.0, 10.0, 11.0, 10.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.0, -6.7862548828125, -6.572509765625, -6.3587646484375, -6.14501953125, -5.9312744140625, -5.717529296875, -5.5037841796875, -5.2900390625, -5.0762939453125, -4.862548828125, -4.6488037109375, -4.43505859375, -4.2213134765625, -4.007568359375, -3.7938232421875, -3.580078125, -3.3663330078125, -3.152587890625, -2.9388427734375, -2.72509765625, -2.5113525390625, -2.297607421875, -2.0838623046875, -1.8701171875, -1.6563720703125, -1.442626953125, -1.2288818359375, -1.01513671875, -0.8013916015625, -0.587646484375, -0.3739013671875, -0.16015625, 0.0535888671875, 0.267333984375, 0.4810791015625, 0.69482421875, 0.9085693359375, 1.122314453125, 1.3360595703125, 1.5498046875, 1.7635498046875, 1.977294921875, 2.1910400390625, 2.40478515625, 2.6185302734375, 2.832275390625, 3.0460205078125, 3.259765625, 3.4735107421875, 3.687255859375, 3.9010009765625, 4.11474609375, 4.3284912109375, 4.542236328125, 4.7559814453125, 4.9697265625, 5.1834716796875, 5.397216796875, 5.6109619140625, 5.82470703125, 6.0384521484375, 6.252197265625, 6.4659423828125, 6.6796875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 2.0, 11.0, 10.0, 8.0, 10.0, 14.0, 18.0, 19.0, 35.0, 33.0, 54.0, 66.0, 80.0, 162.0, 336.0, 866.0, 2372.0, 9401.0, 96906.0, 2905599.0, 1138901.0, 31322.0, 5229.0, 1524.0, 554.0, 270.0, 139.0, 78.0, 58.0, 39.0, 35.0, 16.0, 21.0, 16.0, 14.0, 11.0, 15.0, 5.0, 11.0, 6.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.453125, -22.759521484375, -22.06591796875, -21.372314453125, -20.6787109375, -19.985107421875, -19.29150390625, -18.597900390625, -17.904296875, -17.210693359375, -16.51708984375, -15.823486328125, -15.1298828125, -14.436279296875, -13.74267578125, -13.049072265625, -12.35546875, -11.661865234375, -10.96826171875, -10.274658203125, -9.5810546875, -8.887451171875, -8.19384765625, -7.500244140625, -6.806640625, -6.113037109375, -5.41943359375, -4.725830078125, -4.0322265625, -3.338623046875, -2.64501953125, -1.951416015625, -1.2578125, -0.564208984375, 0.12939453125, 0.822998046875, 1.5166015625, 2.210205078125, 2.90380859375, 3.597412109375, 4.291015625, 4.984619140625, 5.67822265625, 6.371826171875, 7.0654296875, 7.759033203125, 8.45263671875, 9.146240234375, 9.83984375, 10.533447265625, 11.22705078125, 11.920654296875, 12.6142578125, 13.307861328125, 14.00146484375, 14.695068359375, 15.388671875, 16.082275390625, 16.77587890625, 17.469482421875, 18.1630859375, 18.856689453125, 19.55029296875, 20.243896484375, 20.9375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 3.0, 7.0, 2.0, 2.0, 8.0, 10.0, 19.0, 17.0, 20.0, 38.0, 37.0, 46.0, 59.0, 76.0, 142.0, 204.0, 297.0, 418.0, 519.0, 530.0, 485.0, 352.0, 232.0, 158.0, 110.0, 72.0, 48.0, 28.0, 20.0, 22.0, 17.0, 17.0, 15.0, 11.0, 8.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2109375, -11.8538818359375, -11.496826171875, -11.1397705078125, -10.78271484375, -10.4256591796875, -10.068603515625, -9.7115478515625, -9.3544921875, -8.9974365234375, -8.640380859375, -8.2833251953125, -7.92626953125, -7.5692138671875, -7.212158203125, -6.8551025390625, -6.498046875, -6.1409912109375, -5.783935546875, -5.4268798828125, -5.06982421875, -4.7127685546875, -4.355712890625, -3.9986572265625, -3.6416015625, -3.2845458984375, -2.927490234375, -2.5704345703125, -2.21337890625, -1.8563232421875, -1.499267578125, -1.1422119140625, -0.78515625, -0.4281005859375, -0.071044921875, 0.2860107421875, 0.64306640625, 1.0001220703125, 1.357177734375, 1.7142333984375, 2.0712890625, 2.4283447265625, 2.785400390625, 3.1424560546875, 3.49951171875, 3.8565673828125, 4.213623046875, 4.5706787109375, 4.927734375, 5.2847900390625, 5.641845703125, 5.9989013671875, 6.35595703125, 6.7130126953125, 7.070068359375, 7.4271240234375, 7.7841796875, 8.1412353515625, 8.498291015625, 8.8553466796875, 9.21240234375, 9.5694580078125, 9.926513671875, 10.2835693359375, 10.640625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 9.0, 3.0, 5.0, 9.0, 12.0, 9.0, 20.0, 19.0, 17.0, 20.0, 24.0, 55.0, 58.0, 94.0, 164.0, 254.0, 505.0, 2381.0, 78636.0, 4068334.0, 40659.0, 1782.0, 466.0, 234.0, 151.0, 83.0, 60.0, 45.0, 43.0, 30.0, 25.0, 14.0, 18.0, 17.0, 6.0, 2.0, 2.0, 7.0, 4.0, 0.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.875, -53.9765625, -52.078125, -50.1796875, -48.28125, -46.3828125, -44.484375, -42.5859375, -40.6875, -38.7890625, -36.890625, -34.9921875, -33.09375, -31.1953125, -29.296875, -27.3984375, -25.5, -23.6015625, -21.703125, -19.8046875, -17.90625, -16.0078125, -14.109375, -12.2109375, -10.3125, -8.4140625, -6.515625, -4.6171875, -2.71875, -0.8203125, 1.078125, 2.9765625, 4.875, 6.7734375, 8.671875, 10.5703125, 12.46875, 14.3671875, 16.265625, 18.1640625, 20.0625, 21.9609375, 23.859375, 25.7578125, 27.65625, 29.5546875, 31.453125, 33.3515625, 35.25, 37.1484375, 39.046875, 40.9453125, 42.84375, 44.7421875, 46.640625, 48.5390625, 50.4375, 52.3359375, 54.234375, 56.1328125, 58.03125, 59.9296875, 61.828125, 63.7265625, 65.625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 17.0, 97.0, 297.0, 399.0, 160.0, 34.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.88795471191406, -38.234310150146484, -33.580665588378906, -28.927021026611328, -24.27337646484375, -19.619731903076172, -14.966087341308594, -10.312442779541016, -5.6587982177734375, -1.0051536560058594, 3.6484909057617188, 8.302135467529297, 12.955780029296875, 17.609424591064453, 22.26306915283203, 26.91671371459961, 31.570358276367188, 36.224002838134766, 40.877647399902344, 45.53129196166992, 50.1849365234375, 54.83858108520508, 59.492225646972656, 64.1458740234375, 68.79951477050781, 73.45315551757812, 78.10680389404297, 82.76045227050781, 87.41409301757812, 92.06773376464844, 96.72138214111328, 101.37503051757812, 106.02867126464844, 110.68231201171875, 115.3359603881836, 119.98960876464844, 124.64324951171875, 129.29689025878906, 133.95053100585938, 138.60418701171875, 143.25782775878906, 147.91146850585938, 152.56512451171875, 157.21876525878906, 161.87240600585938, 166.5260467529297, 171.1796875, 175.83334350585938, 180.4869842529297, 185.140625, 189.79428100585938, 194.4479217529297, 199.1015625, 203.7552032470703, 208.40884399414062, 213.0625, 217.7161407470703, 222.36978149414062, 227.0234375, 231.6770782470703, 236.33071899414062, 240.98435974121094, 245.63800048828125, 250.29165649414062, 254.94529724121094]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 9.0, 6.0, 8.0, 8.0, 15.0, 14.0, 21.0, 19.0, 23.0, 29.0, 30.0, 29.0, 31.0, 49.0, 29.0, 32.0, 44.0, 46.0, 41.0, 42.0, 41.0, 35.0, 45.0, 34.0, 33.0, 34.0, 30.0, 28.0, 26.0, 22.0, 18.0, 13.0, 18.0, 16.0, 15.0, 7.0, 12.0, 5.0, 7.0, 10.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-33.48048782348633, -32.41051483154297, -31.34054183959961, -30.27056884765625, -29.20059585571289, -28.13062286376953, -27.060651779174805, -25.990678787231445, -24.920705795288086, -23.850732803344727, -22.780759811401367, -21.710786819458008, -20.64081573486328, -19.570842742919922, -18.500869750976562, -17.430896759033203, -16.360923767089844, -15.290950775146484, -14.220977783203125, -13.151005744934082, -12.081032752990723, -11.011059761047363, -9.94108772277832, -8.871114730834961, -7.801141738891602, -6.731168746948242, -5.661196231842041, -4.59122371673584, -3.5212507247924805, -2.451277732849121, -1.38130521774292, -0.31133270263671875, 0.758636474609375, 1.8286092281341553, 2.8985819816589355, 3.968554735183716, 5.038527488708496, 6.1085004806518555, 7.178472995758057, 8.248445510864258, 9.318418502807617, 10.388391494750977, 11.458364486694336, 12.528336524963379, 13.598309516906738, 14.668282508850098, 15.73825454711914, 16.8082275390625, 17.87820053100586, 18.94817352294922, 20.018146514892578, 21.088119506835938, 22.158092498779297, 23.228065490722656, 24.298036575317383, 25.368009567260742, 26.4379825592041, 27.50795555114746, 28.57792854309082, 29.64790153503418, 30.717872619628906, 31.787845611572266, 32.857818603515625, 33.927791595458984, 34.997764587402344]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 8.0, 4.0, 14.0, 12.0, 12.0, 20.0, 13.0, 23.0, 19.0, 18.0, 22.0, 37.0, 21.0, 33.0, 27.0, 41.0, 43.0, 47.0, 53.0, 35.0, 46.0, 36.0, 39.0, 36.0, 32.0, 22.0, 25.0, 39.0, 36.0, 26.0, 24.0, 24.0, 9.0, 15.0, 11.0, 15.0, 14.0, 7.0, 8.0, 8.0, 4.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9296875, -5.73681640625, -5.5439453125, -5.35107421875, -5.158203125, -4.96533203125, -4.7724609375, -4.57958984375, -4.38671875, -4.19384765625, -4.0009765625, -3.80810546875, -3.615234375, -3.42236328125, -3.2294921875, -3.03662109375, -2.84375, -2.65087890625, -2.4580078125, -2.26513671875, -2.072265625, -1.87939453125, -1.6865234375, -1.49365234375, -1.30078125, -1.10791015625, -0.9150390625, -0.72216796875, -0.529296875, -0.33642578125, -0.1435546875, 0.04931640625, 0.2421875, 0.43505859375, 0.6279296875, 0.82080078125, 1.013671875, 1.20654296875, 1.3994140625, 1.59228515625, 1.78515625, 1.97802734375, 2.1708984375, 2.36376953125, 2.556640625, 2.74951171875, 2.9423828125, 3.13525390625, 3.328125, 3.52099609375, 3.7138671875, 3.90673828125, 4.099609375, 4.29248046875, 4.4853515625, 4.67822265625, 4.87109375, 5.06396484375, 5.2568359375, 5.44970703125, 5.642578125, 5.83544921875, 6.0283203125, 6.22119140625, 6.4140625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 1.0, 2.0, 3.0, 5.0, 10.0, 6.0, 25.0, 18.0, 30.0, 44.0, 76.0, 105.0, 149.0, 211.0, 322.0, 462.0, 711.0, 869.0, 1333.0, 1890.0, 2655.0, 3837.0, 5356.0, 7714.0, 11215.0, 15740.0, 22848.0, 34712.0, 54040.0, 91650.0, 171407.0, 250851.0, 144417.0, 78467.0, 47596.0, 31069.0, 20973.0, 14189.0, 9968.0, 7011.0, 4901.0, 3401.0, 2486.0, 1766.0, 1216.0, 877.0, 627.0, 420.0, 284.0, 202.0, 141.0, 94.0, 56.0, 42.0, 30.0, 20.0, 8.0, 9.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.271240234375, -0.2631111145019531, -0.25498199462890625, -0.24685287475585938, -0.2387237548828125, -0.23059463500976562, -0.22246551513671875, -0.21433639526367188, -0.206207275390625, -0.19807815551757812, -0.18994903564453125, -0.18181991577148438, -0.1736907958984375, -0.16556167602539062, -0.15743255615234375, -0.14930343627929688, -0.14117431640625, -0.13304519653320312, -0.12491607666015625, -0.11678695678710938, -0.1086578369140625, -0.10052871704101562, -0.09239959716796875, -0.08427047729492188, -0.076141357421875, -0.06801223754882812, -0.05988311767578125, -0.051753997802734375, -0.0436248779296875, -0.035495758056640625, -0.02736663818359375, -0.019237518310546875, -0.0111083984375, -0.002979278564453125, 0.00514984130859375, 0.013278961181640625, 0.0214080810546875, 0.029537200927734375, 0.03766632080078125, 0.045795440673828125, 0.053924560546875, 0.062053680419921875, 0.07018280029296875, 0.07831192016601562, 0.0864410400390625, 0.09457015991210938, 0.10269927978515625, 0.11082839965820312, 0.11895751953125, 0.12708663940429688, 0.13521575927734375, 0.14334487915039062, 0.1514739990234375, 0.15960311889648438, 0.16773223876953125, 0.17586135864257812, 0.183990478515625, 0.19211959838867188, 0.20024871826171875, 0.20837783813476562, 0.2165069580078125, 0.22463607788085938, 0.23276519775390625, 0.24089431762695312, 0.2490234375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 9.0, 9.0, 12.0, 20.0, 11.0, 12.0, 21.0, 27.0, 21.0, 26.0, 34.0, 42.0, 39.0, 32.0, 37.0, 42.0, 52.0, 36.0, 1071.0, 44.0, 49.0, 49.0, 33.0, 57.0, 26.0, 32.0, 26.0, 27.0, 20.0, 16.0, 19.0, 10.0, 14.0, 8.0, 8.0, 8.0, 6.0, 7.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.36328125, -4.2230224609375, -4.082763671875, -3.9425048828125, -3.80224609375, -3.6619873046875, -3.521728515625, -3.3814697265625, -3.2412109375, -3.1009521484375, -2.960693359375, -2.8204345703125, -2.68017578125, -2.5399169921875, -2.399658203125, -2.2593994140625, -2.119140625, -1.9788818359375, -1.838623046875, -1.6983642578125, -1.55810546875, -1.4178466796875, -1.277587890625, -1.1373291015625, -0.9970703125, -0.8568115234375, -0.716552734375, -0.5762939453125, -0.43603515625, -0.2957763671875, -0.155517578125, -0.0152587890625, 0.125, 0.2652587890625, 0.405517578125, 0.5457763671875, 0.68603515625, 0.8262939453125, 0.966552734375, 1.1068115234375, 1.2470703125, 1.3873291015625, 1.527587890625, 1.6678466796875, 1.80810546875, 1.9483642578125, 2.088623046875, 2.2288818359375, 2.369140625, 2.5093994140625, 2.649658203125, 2.7899169921875, 2.93017578125, 3.0704345703125, 3.210693359375, 3.3509521484375, 3.4912109375, 3.6314697265625, 3.771728515625, 3.9119873046875, 4.05224609375, 4.1925048828125, 4.332763671875, 4.4730224609375, 4.61328125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 11.0, 12.0, 17.0, 34.0, 47.0, 79.0, 106.0, 163.0, 209.0, 299.0, 439.0, 680.0, 939.0, 1345.0, 1942.0, 2970.0, 4371.0, 6571.0, 9849.0, 15448.0, 24789.0, 40028.0, 65291.0, 113333.0, 208472.0, 1279433.0, 127252.0, 72797.0, 43475.0, 27261.0, 16775.0, 10925.0, 7041.0, 4811.0, 3128.0, 2102.0, 1475.0, 998.0, 698.0, 443.0, 354.0, 236.0, 151.0, 105.0, 68.0, 49.0, 32.0, 27.0, 20.0, 10.0, 8.0, 7.0, 5.0, 2.0, 3.0, 0.0, 3.0], "bins": [-0.203369140625, -0.19703292846679688, -0.19069671630859375, -0.18436050415039062, -0.1780242919921875, -0.17168807983398438, -0.16535186767578125, -0.15901565551757812, -0.152679443359375, -0.14634323120117188, -0.14000701904296875, -0.13367080688476562, -0.1273345947265625, -0.12099838256835938, -0.11466217041015625, -0.10832595825195312, -0.10198974609375, -0.09565353393554688, -0.08931732177734375, -0.08298110961914062, -0.0766448974609375, -0.07030868530273438, -0.06397247314453125, -0.057636260986328125, -0.051300048828125, -0.044963836669921875, -0.03862762451171875, -0.032291412353515625, -0.0259552001953125, -0.019618988037109375, -0.01328277587890625, -0.006946563720703125, -0.0006103515625, 0.005725860595703125, 0.01206207275390625, 0.018398284912109375, 0.0247344970703125, 0.031070709228515625, 0.03740692138671875, 0.043743133544921875, 0.050079345703125, 0.056415557861328125, 0.06275177001953125, 0.06908798217773438, 0.0754241943359375, 0.08176040649414062, 0.08809661865234375, 0.09443283081054688, 0.10076904296875, 0.10710525512695312, 0.11344146728515625, 0.11977767944335938, 0.1261138916015625, 0.13245010375976562, 0.13878631591796875, 0.14512252807617188, 0.151458740234375, 0.15779495239257812, 0.16413116455078125, 0.17046737670898438, 0.1768035888671875, 0.18313980102539062, 0.18947601318359375, 0.19581222534179688, 0.2021484375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 19.0, 16.0, 31.0, 46.0, 68.0, 106.0, 174.0, 191.0, 114.0, 71.0, 48.0, 38.0, 21.0, 16.0, 6.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024962425231933594, -0.00023877620697021484, -0.00022792816162109375, -0.00021708011627197266, -0.00020623207092285156, -0.00019538402557373047, -0.00018453598022460938, -0.00017368793487548828, -0.0001628398895263672, -0.0001519918441772461, -0.000141143798828125, -0.0001302957534790039, -0.00011944770812988281, -0.00010859966278076172, -9.775161743164062e-05, -8.690357208251953e-05, -7.605552673339844e-05, -6.520748138427734e-05, -5.435943603515625e-05, -4.3511390686035156e-05, -3.266334533691406e-05, -2.181529998779297e-05, -1.0967254638671875e-05, -1.1920928955078125e-07, 1.0728836059570312e-05, 2.1576881408691406e-05, 3.24249267578125e-05, 4.3272972106933594e-05, 5.412101745605469e-05, 6.496906280517578e-05, 7.581710815429688e-05, 8.666515350341797e-05, 9.751319885253906e-05, 0.00010836124420166016, 0.00011920928955078125, 0.00013005733489990234, 0.00014090538024902344, 0.00015175342559814453, 0.00016260147094726562, 0.00017344951629638672, 0.0001842975616455078, 0.0001951456069946289, 0.00020599365234375, 0.0002168416976928711, 0.0002276897430419922, 0.00023853778839111328, 0.0002493858337402344, 0.00026023387908935547, 0.00027108192443847656, 0.00028192996978759766, 0.00029277801513671875, 0.00030362606048583984, 0.00031447410583496094, 0.00032532215118408203, 0.0003361701965332031, 0.0003470182418823242, 0.0003578662872314453, 0.0003687143325805664, 0.0003795623779296875, 0.0003904104232788086, 0.0004012584686279297, 0.0004121065139770508, 0.0004229545593261719, 0.00043380260467529297, 0.00044465065002441406]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 8.0, 13.0, 12.0, 10.0, 27.0, 41.0, 80.0, 118.0, 355.0, 1662.0, 568968.0, 475003.0, 1593.0, 351.0, 136.0, 67.0, 31.0, 27.0, 12.0, 10.0, 7.0, 7.0, 3.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00909423828125, -0.008872389793395996, -0.008650541305541992, -0.008428692817687988, -0.008206844329833984, -0.00798499584197998, -0.0077631473541259766, -0.007541298866271973, -0.007319450378417969, -0.007097601890563965, -0.006875753402709961, -0.006653904914855957, -0.006432056427001953, -0.006210207939147949, -0.005988359451293945, -0.005766510963439941, -0.0055446624755859375, -0.005322813987731934, -0.00510096549987793, -0.004879117012023926, -0.004657268524169922, -0.004435420036315918, -0.004213571548461914, -0.00399172306060791, -0.0037698745727539062, -0.0035480260848999023, -0.0033261775970458984, -0.0031043291091918945, -0.0028824806213378906, -0.0026606321334838867, -0.002438783645629883, -0.002216935157775879, -0.001995086669921875, -0.001773238182067871, -0.0015513896942138672, -0.0013295412063598633, -0.0011076927185058594, -0.0008858442306518555, -0.0006639957427978516, -0.00044214725494384766, -0.00022029876708984375, 1.5497207641601562e-06, 0.00022339820861816406, 0.00044524669647216797, 0.0006670951843261719, 0.0008889436721801758, 0.0011107921600341797, 0.0013326406478881836, 0.0015544891357421875, 0.0017763376235961914, 0.0019981861114501953, 0.0022200345993041992, 0.002441883087158203, 0.002663731575012207, 0.002885580062866211, 0.003107428550720215, 0.0033292770385742188, 0.0035511255264282227, 0.0037729740142822266, 0.0039948225021362305, 0.004216670989990234, 0.004438519477844238, 0.004660367965698242, 0.004882216453552246, 0.00510406494140625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 16.0, 12.0, 37.0, 87.0, 168.0, 243.0, 216.0, 116.0, 60.0, 32.0, 11.0, 3.0, 3.0, 5.0], "bins": [-0.0006774240173399448, -0.0006652597221545875, -0.0006530954269692302, -0.0006409311899915338, -0.0006287668948061764, -0.0006166025996208191, -0.0006044383044354618, -0.0005922740092501044, -0.000580109772272408, -0.0005679454770870507, -0.0005557811819016933, -0.0005436169449239969, -0.0005314526497386396, -0.0005192883545532823, -0.0005071240593679249, -0.0004949597641825676, -0.00048279546899721026, -0.00047063117381185293, -0.00045846690773032606, -0.0004463026125449687, -0.00043413834646344185, -0.0004219740512780845, -0.0004098097560927272, -0.0003976454900112003, -0.00038548122392967343, -0.0003733169287443161, -0.0003611526626627892, -0.0003489883674774319, -0.000336824101395905, -0.0003246598062105477, -0.00031249551102519035, -0.0003003312449436635, -0.00028816694975830615, -0.0002760026545729488, -0.00026383838849142194, -0.0002516740933060646, -0.0002395098126726225, -0.0002273455320391804, -0.0002151812514057383, -0.0002030169707722962, -0.00019085267558693886, -0.00017868839495349675, -0.00016652411432005465, -0.00015435981913469732, -0.00014219553850125521, -0.0001300312578678131, -0.000117866977234371, -0.00010570268932497129, -9.35384159674868e-05, -8.13741353340447e-05, -6.920984742464498e-05, -5.704556679120287e-05, -4.488128251978196e-05, -3.271699824836105e-05, -2.0552717614918947e-05, -8.38842970551923e-06, 3.7758509279228747e-06, 1.5940135199343786e-05, 2.8104417651775293e-05, 4.02687001042068e-05, 5.243298437562771e-05, 6.459726864704862e-05, 7.676154928049073e-05, 8.892583718989044e-05, 0.00010109011782333255]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 4.0, 4.0, 6.0, 7.0, 8.0, 15.0, 12.0, 13.0, 17.0, 24.0, 36.0, 23.0, 30.0, 38.0, 31.0, 35.0, 35.0, 43.0, 34.0, 40.0, 42.0, 48.0, 54.0, 38.0, 40.0, 48.0, 38.0, 36.0, 31.0, 28.0, 20.0, 27.0, 17.0, 17.0, 10.0, 12.0, 11.0, 6.0, 6.0, 4.0, 2.0, 2.0, 4.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001068115234375, -0.00010351184755563736, -0.00010021217167377472, -9.691249579191208e-05, -9.361281991004944e-05, -9.03131440281868e-05, -8.701346814632416e-05, -8.371379226446152e-05, -8.041411638259888e-05, -7.711444050073624e-05, -7.38147646188736e-05, -7.051508873701096e-05, -6.721541285514832e-05, -6.391573697328568e-05, -6.0616061091423035e-05, -5.7316385209560394e-05, -5.4016709327697754e-05, -5.0717033445835114e-05, -4.741735756397247e-05, -4.411768168210983e-05, -4.081800580024719e-05, -3.751832991838455e-05, -3.421865403652191e-05, -3.091897815465927e-05, -2.761930227279663e-05, -2.431962639093399e-05, -2.101995050907135e-05, -1.772027462720871e-05, -1.442059874534607e-05, -1.1120922863483429e-05, -7.821246981620789e-06, -4.521571099758148e-06, -1.2218952178955078e-06, 2.0777806639671326e-06, 5.377456545829773e-06, 8.677132427692413e-06, 1.1976808309555054e-05, 1.5276484191417694e-05, 1.8576160073280334e-05, 2.1875835955142975e-05, 2.5175511837005615e-05, 2.8475187718868256e-05, 3.1774863600730896e-05, 3.5074539482593536e-05, 3.837421536445618e-05, 4.167389124631882e-05, 4.497356712818146e-05, 4.82732430100441e-05, 5.157291889190674e-05, 5.487259477376938e-05, 5.817227065563202e-05, 6.147194653749466e-05, 6.47716224193573e-05, 6.807129830121994e-05, 7.137097418308258e-05, 7.467065006494522e-05, 7.797032594680786e-05, 8.12700018286705e-05, 8.456967771053314e-05, 8.786935359239578e-05, 9.116902947425842e-05, 9.446870535612106e-05, 9.77683812379837e-05, 0.00010106805711984634, 0.00010436773300170898]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 8.0, 4.0, 14.0, 12.0, 12.0, 20.0, 13.0, 23.0, 19.0, 18.0, 22.0, 37.0, 21.0, 33.0, 27.0, 41.0, 43.0, 47.0, 53.0, 35.0, 46.0, 36.0, 39.0, 36.0, 32.0, 22.0, 25.0, 39.0, 36.0, 26.0, 24.0, 24.0, 9.0, 15.0, 11.0, 15.0, 14.0, 7.0, 8.0, 8.0, 4.0, 4.0, 1.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9296875, -5.73681640625, -5.5439453125, -5.35107421875, -5.158203125, -4.96533203125, -4.7724609375, -4.57958984375, -4.38671875, -4.19384765625, -4.0009765625, -3.80810546875, -3.615234375, -3.42236328125, -3.2294921875, -3.03662109375, -2.84375, -2.65087890625, -2.4580078125, -2.26513671875, -2.072265625, -1.87939453125, -1.6865234375, -1.49365234375, -1.30078125, -1.10791015625, -0.9150390625, -0.72216796875, -0.529296875, -0.33642578125, -0.1435546875, 0.04931640625, 0.2421875, 0.43505859375, 0.6279296875, 0.82080078125, 1.013671875, 1.20654296875, 1.3994140625, 1.59228515625, 1.78515625, 1.97802734375, 2.1708984375, 2.36376953125, 2.556640625, 2.74951171875, 2.9423828125, 3.13525390625, 3.328125, 3.52099609375, 3.7138671875, 3.90673828125, 4.099609375, 4.29248046875, 4.4853515625, 4.67822265625, 4.87109375, 5.06396484375, 5.2568359375, 5.44970703125, 5.642578125, 5.83544921875, 6.0283203125, 6.22119140625, 6.4140625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 6.0, 11.0, 15.0, 6.0, 19.0, 19.0, 28.0, 33.0, 44.0, 49.0, 90.0, 113.0, 145.0, 295.0, 486.0, 1061.0, 2248.0, 6058.0, 22651.0, 133918.0, 702383.0, 143688.0, 24202.0, 6207.0, 2252.0, 1073.0, 537.0, 303.0, 164.0, 119.0, 89.0, 56.0, 43.0, 24.0, 26.0, 16.0, 19.0, 14.0, 8.0, 10.0, 7.0, 1.0, 3.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.7421875, -11.36962890625, -10.9970703125, -10.62451171875, -10.251953125, -9.87939453125, -9.5068359375, -9.13427734375, -8.76171875, -8.38916015625, -8.0166015625, -7.64404296875, -7.271484375, -6.89892578125, -6.5263671875, -6.15380859375, -5.78125, -5.40869140625, -5.0361328125, -4.66357421875, -4.291015625, -3.91845703125, -3.5458984375, -3.17333984375, -2.80078125, -2.42822265625, -2.0556640625, -1.68310546875, -1.310546875, -0.93798828125, -0.5654296875, -0.19287109375, 0.1796875, 0.55224609375, 0.9248046875, 1.29736328125, 1.669921875, 2.04248046875, 2.4150390625, 2.78759765625, 3.16015625, 3.53271484375, 3.9052734375, 4.27783203125, 4.650390625, 5.02294921875, 5.3955078125, 5.76806640625, 6.140625, 6.51318359375, 6.8857421875, 7.25830078125, 7.630859375, 8.00341796875, 8.3759765625, 8.74853515625, 9.12109375, 9.49365234375, 9.8662109375, 10.23876953125, 10.611328125, 10.98388671875, 11.3564453125, 11.72900390625, 12.1015625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 2.0, 6.0, 5.0, 13.0, 13.0, 10.0, 13.0, 16.0, 14.0, 21.0, 42.0, 27.0, 26.0, 24.0, 29.0, 49.0, 46.0, 48.0, 106.0, 185.0, 1531.0, 243.0, 99.0, 73.0, 54.0, 39.0, 36.0, 45.0, 30.0, 28.0, 23.0, 26.0, 19.0, 20.0, 11.0, 15.0, 13.0, 9.0, 4.0, 14.0, 5.0, 2.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.0625, -17.510498046875, -16.95849609375, -16.406494140625, -15.8544921875, -15.302490234375, -14.75048828125, -14.198486328125, -13.646484375, -13.094482421875, -12.54248046875, -11.990478515625, -11.4384765625, -10.886474609375, -10.33447265625, -9.782470703125, -9.23046875, -8.678466796875, -8.12646484375, -7.574462890625, -7.0224609375, -6.470458984375, -5.91845703125, -5.366455078125, -4.814453125, -4.262451171875, -3.71044921875, -3.158447265625, -2.6064453125, -2.054443359375, -1.50244140625, -0.950439453125, -0.3984375, 0.153564453125, 0.70556640625, 1.257568359375, 1.8095703125, 2.361572265625, 2.91357421875, 3.465576171875, 4.017578125, 4.569580078125, 5.12158203125, 5.673583984375, 6.2255859375, 6.777587890625, 7.32958984375, 7.881591796875, 8.43359375, 8.985595703125, 9.53759765625, 10.089599609375, 10.6416015625, 11.193603515625, 11.74560546875, 12.297607421875, 12.849609375, 13.401611328125, 13.95361328125, 14.505615234375, 15.0576171875, 15.609619140625, 16.16162109375, 16.713623046875, 17.265625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 8.0, 8.0, 17.0, 15.0, 18.0, 25.0, 26.0, 26.0, 39.0, 34.0, 62.0, 84.0, 86.0, 137.0, 314.0, 621.0, 2213.0, 74032.0, 3054895.0, 10563.0, 1242.0, 458.0, 242.0, 135.0, 75.0, 64.0, 44.0, 43.0, 43.0, 26.0, 15.0, 19.0, 8.0, 13.0, 11.0, 12.0, 6.0, 5.0, 8.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.0625, -48.41064453125, -46.7587890625, -45.10693359375, -43.455078125, -41.80322265625, -40.1513671875, -38.49951171875, -36.84765625, -35.19580078125, -33.5439453125, -31.89208984375, -30.240234375, -28.58837890625, -26.9365234375, -25.28466796875, -23.6328125, -21.98095703125, -20.3291015625, -18.67724609375, -17.025390625, -15.37353515625, -13.7216796875, -12.06982421875, -10.41796875, -8.76611328125, -7.1142578125, -5.46240234375, -3.810546875, -2.15869140625, -0.5068359375, 1.14501953125, 2.796875, 4.44873046875, 6.1005859375, 7.75244140625, 9.404296875, 11.05615234375, 12.7080078125, 14.35986328125, 16.01171875, 17.66357421875, 19.3154296875, 20.96728515625, 22.619140625, 24.27099609375, 25.9228515625, 27.57470703125, 29.2265625, 30.87841796875, 32.5302734375, 34.18212890625, 35.833984375, 37.48583984375, 39.1376953125, 40.78955078125, 42.44140625, 44.09326171875, 45.7451171875, 47.39697265625, 49.048828125, 50.70068359375, 52.3525390625, 54.00439453125, 55.65625]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 15.0, 40.0, 96.0, 201.0, 288.0, 210.0, 116.0, 31.0, 19.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.84120559692383, -32.39612579345703, -30.951047897338867, -29.505970001220703, -28.060890197753906, -26.615812301635742, -25.170734405517578, -23.72565460205078, -22.280576705932617, -20.835498809814453, -19.390419006347656, -17.945341110229492, -16.500263214111328, -15.055183410644531, -13.610105514526367, -12.165026664733887, -10.719947814941406, -9.274868965148926, -7.8297905921936035, -6.384712219238281, -4.939633369445801, -3.4945545196533203, -2.0494766235351562, -0.6043977737426758, 0.8406810760498047, 2.285759687423706, 3.7308382987976074, 5.17591667175293, 6.62099552154541, 8.06607437133789, 9.511152267456055, 10.956231117248535, 12.40130615234375, 13.84638500213623, 15.291463851928711, 16.736541748046875, 18.181621551513672, 19.626699447631836, 21.07177734375, 22.516857147216797, 23.96193504333496, 25.407012939453125, 26.852092742919922, 28.297170639038086, 29.74224853515625, 31.187328338623047, 32.632408142089844, 34.077484130859375, 35.52256393432617, 36.96764373779297, 38.4127197265625, 39.8577995300293, 41.302879333496094, 42.747955322265625, 44.19303512573242, 45.63811492919922, 47.08319091796875, 48.52827072143555, 49.97334671020508, 51.418426513671875, 52.86350631713867, 54.30858612060547, 55.753662109375, 57.1987419128418, 58.643821716308594]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 6.0, 8.0, 8.0, 15.0, 15.0, 17.0, 23.0, 18.0, 21.0, 36.0, 27.0, 27.0, 28.0, 37.0, 34.0, 42.0, 50.0, 49.0, 42.0, 43.0, 47.0, 29.0, 44.0, 39.0, 28.0, 34.0, 30.0, 32.0, 39.0, 16.0, 17.0, 14.0, 19.0, 7.0, 7.0, 6.0, 10.0, 6.0, 8.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.48288345336914, -47.91722106933594, -46.35155487060547, -44.785892486572266, -43.22023010253906, -41.654563903808594, -40.08890151977539, -38.52323913574219, -36.95757293701172, -35.391910552978516, -33.82624435424805, -32.260581970214844, -30.694917678833008, -29.129253387451172, -27.56359100341797, -25.997926712036133, -24.432262420654297, -22.86659812927246, -21.300933837890625, -19.735271453857422, -18.169607162475586, -16.60394287109375, -15.03827953338623, -13.472616195678711, -11.906951904296875, -10.341287612915039, -8.77562427520752, -7.209960460662842, -5.644296646118164, -4.078632831573486, -2.5129690170288086, -0.9473056793212891, 0.6183547973632812, 2.184018611907959, 3.7496824264526367, 5.3153462409973145, 6.881010055541992, 8.446674346923828, 10.012337684631348, 11.578001022338867, 13.143665313720703, 14.709329605102539, 16.274993896484375, 17.840656280517578, 19.406320571899414, 20.97198486328125, 22.537647247314453, 24.10331153869629, 25.668975830078125, 27.23464012145996, 28.800304412841797, 30.365966796875, 31.931631088256836, 33.49729537963867, 35.062957763671875, 36.628623962402344, 38.19428634643555, 39.75994873046875, 41.32561492919922, 42.89127731323242, 44.456939697265625, 46.022605895996094, 47.5882682800293, 49.1539306640625, 50.71959686279297]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 9.0, 8.0, 10.0, 6.0, 9.0, 16.0, 20.0, 12.0, 24.0, 12.0, 16.0, 26.0, 30.0, 31.0, 34.0, 31.0, 33.0, 42.0, 43.0, 33.0, 50.0, 48.0, 37.0, 53.0, 25.0, 26.0, 37.0, 22.0, 30.0, 30.0, 34.0, 28.0, 16.0, 19.0, 17.0, 16.0, 14.0, 9.0, 11.0, 13.0, 3.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.57421875, -6.36981201171875, -6.1654052734375, -5.96099853515625, -5.756591796875, -5.55218505859375, -5.3477783203125, -5.14337158203125, -4.93896484375, -4.73455810546875, -4.5301513671875, -4.32574462890625, -4.121337890625, -3.91693115234375, -3.7125244140625, -3.50811767578125, -3.3037109375, -3.09930419921875, -2.8948974609375, -2.69049072265625, -2.486083984375, -2.28167724609375, -2.0772705078125, -1.87286376953125, -1.66845703125, -1.46405029296875, -1.2596435546875, -1.05523681640625, -0.850830078125, -0.64642333984375, -0.4420166015625, -0.23760986328125, -0.033203125, 0.17120361328125, 0.3756103515625, 0.58001708984375, 0.784423828125, 0.98883056640625, 1.1932373046875, 1.39764404296875, 1.60205078125, 1.80645751953125, 2.0108642578125, 2.21527099609375, 2.419677734375, 2.62408447265625, 2.8284912109375, 3.03289794921875, 3.2373046875, 3.44171142578125, 3.6461181640625, 3.85052490234375, 4.054931640625, 4.25933837890625, 4.4637451171875, 4.66815185546875, 4.87255859375, 5.07696533203125, 5.2813720703125, 5.48577880859375, 5.690185546875, 5.89459228515625, 6.0989990234375, 6.30340576171875, 6.5078125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 4.0, 3.0, 7.0, 9.0, 17.0, 20.0, 36.0, 38.0, 62.0, 90.0, 136.0, 202.0, 246.0, 355.0, 575.0, 1016.0, 1834.0, 3374.0, 7121.0, 18088.0, 68283.0, 336425.0, 1239735.0, 1704808.0, 629566.0, 131729.0, 29604.0, 10282.0, 4614.0, 2423.0, 1317.0, 755.0, 483.0, 295.0, 211.0, 140.0, 111.0, 94.0, 49.0, 37.0, 26.0, 14.0, 18.0, 8.0, 14.0, 7.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.78125, -9.50347900390625, -9.2257080078125, -8.94793701171875, -8.670166015625, -8.39239501953125, -8.1146240234375, -7.83685302734375, -7.55908203125, -7.28131103515625, -7.0035400390625, -6.72576904296875, -6.447998046875, -6.17022705078125, -5.8924560546875, -5.61468505859375, -5.3369140625, -5.05914306640625, -4.7813720703125, -4.50360107421875, -4.225830078125, -3.94805908203125, -3.6702880859375, -3.39251708984375, -3.11474609375, -2.83697509765625, -2.5592041015625, -2.28143310546875, -2.003662109375, -1.72589111328125, -1.4481201171875, -1.17034912109375, -0.892578125, -0.61480712890625, -0.3370361328125, -0.05926513671875, 0.218505859375, 0.49627685546875, 0.7740478515625, 1.05181884765625, 1.32958984375, 1.60736083984375, 1.8851318359375, 2.16290283203125, 2.440673828125, 2.71844482421875, 2.9962158203125, 3.27398681640625, 3.5517578125, 3.82952880859375, 4.1072998046875, 4.38507080078125, 4.662841796875, 4.94061279296875, 5.2183837890625, 5.49615478515625, 5.77392578125, 6.05169677734375, 6.3294677734375, 6.60723876953125, 6.885009765625, 7.16278076171875, 7.4405517578125, 7.71832275390625, 7.99609375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 7.0, 6.0, 8.0, 10.0, 15.0, 15.0, 18.0, 17.0, 31.0, 27.0, 49.0, 45.0, 68.0, 95.0, 122.0, 172.0, 254.0, 348.0, 373.0, 501.0, 441.0, 341.0, 285.0, 193.0, 146.0, 118.0, 73.0, 62.0, 43.0, 28.0, 28.0, 32.0, 24.0, 19.0, 15.0, 8.0, 5.0, 4.0, 10.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0], "bins": [-11.1796875, -10.8673095703125, -10.554931640625, -10.2425537109375, -9.93017578125, -9.6177978515625, -9.305419921875, -8.9930419921875, -8.6806640625, -8.3682861328125, -8.055908203125, -7.7435302734375, -7.43115234375, -7.1187744140625, -6.806396484375, -6.4940185546875, -6.181640625, -5.8692626953125, -5.556884765625, -5.2445068359375, -4.93212890625, -4.6197509765625, -4.307373046875, -3.9949951171875, -3.6826171875, -3.3702392578125, -3.057861328125, -2.7454833984375, -2.43310546875, -2.1207275390625, -1.808349609375, -1.4959716796875, -1.18359375, -0.8712158203125, -0.558837890625, -0.2464599609375, 0.06591796875, 0.3782958984375, 0.690673828125, 1.0030517578125, 1.3154296875, 1.6278076171875, 1.940185546875, 2.2525634765625, 2.56494140625, 2.8773193359375, 3.189697265625, 3.5020751953125, 3.814453125, 4.1268310546875, 4.439208984375, 4.7515869140625, 5.06396484375, 5.3763427734375, 5.688720703125, 6.0010986328125, 6.3134765625, 6.6258544921875, 6.938232421875, 7.2506103515625, 7.56298828125, 7.8753662109375, 8.187744140625, 8.5001220703125, 8.8125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 0.0, 4.0, 3.0, 1.0, 4.0, 11.0, 4.0, 7.0, 8.0, 19.0, 13.0, 26.0, 30.0, 35.0, 38.0, 47.0, 76.0, 130.0, 188.0, 255.0, 512.0, 1245.0, 5342.0, 70054.0, 3714986.0, 384466.0, 12720.0, 2170.0, 748.0, 410.0, 225.0, 137.0, 91.0, 61.0, 48.0, 40.0, 27.0, 24.0, 11.0, 18.0, 15.0, 5.0, 11.0, 8.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.9375, -31.7900390625, -30.642578125, -29.4951171875, -28.34765625, -27.2001953125, -26.052734375, -24.9052734375, -23.7578125, -22.6103515625, -21.462890625, -20.3154296875, -19.16796875, -18.0205078125, -16.873046875, -15.7255859375, -14.578125, -13.4306640625, -12.283203125, -11.1357421875, -9.98828125, -8.8408203125, -7.693359375, -6.5458984375, -5.3984375, -4.2509765625, -3.103515625, -1.9560546875, -0.80859375, 0.3388671875, 1.486328125, 2.6337890625, 3.78125, 4.9287109375, 6.076171875, 7.2236328125, 8.37109375, 9.5185546875, 10.666015625, 11.8134765625, 12.9609375, 14.1083984375, 15.255859375, 16.4033203125, 17.55078125, 18.6982421875, 19.845703125, 20.9931640625, 22.140625, 23.2880859375, 24.435546875, 25.5830078125, 26.73046875, 27.8779296875, 29.025390625, 30.1728515625, 31.3203125, 32.4677734375, 33.615234375, 34.7626953125, 35.91015625, 37.0576171875, 38.205078125, 39.3525390625, 40.5]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 17.0, 23.0, 73.0, 171.0, 218.0, 226.0, 140.0, 82.0, 40.0, 11.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.88778305053711, -42.240169525146484, -39.592552185058594, -36.94493865966797, -34.297325134277344, -31.649709701538086, -29.002094268798828, -26.354480743408203, -23.706865310668945, -21.059249877929688, -18.411636352539062, -15.764020919799805, -13.116406440734863, -10.468791961669922, -7.821176528930664, -5.173563003540039, -2.5259475708007812, 0.12166714668273926, 2.7692818641662598, 5.416896820068359, 8.0645112991333, 10.712125778198242, 13.3597412109375, 16.007354736328125, 18.654970169067383, 21.30258560180664, 23.950199127197266, 26.597814559936523, 29.24542999267578, 31.893043518066406, 34.54065704345703, 37.188270568847656, 39.83589172363281, 42.48350524902344, 45.13112258911133, 47.77873611450195, 50.42634963989258, 53.07396697998047, 55.721580505371094, 58.36919403076172, 61.016807556152344, 63.66442108154297, 66.3120346069336, 68.95965576171875, 71.60726928710938, 74.2548828125, 76.90249633789062, 79.55010986328125, 82.19772338867188, 84.8453369140625, 87.49295043945312, 90.14056396484375, 92.7881851196289, 95.43579864501953, 98.08341217041016, 100.73102569580078, 103.37864685058594, 106.02626037597656, 108.67387390136719, 111.32148742675781, 113.96910858154297, 116.6167221069336, 119.26433563232422, 121.91194915771484, 124.55956268310547]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 5.0, 5.0, 8.0, 7.0, 7.0, 12.0, 21.0, 21.0, 18.0, 21.0, 22.0, 26.0, 40.0, 35.0, 34.0, 39.0, 48.0, 48.0, 52.0, 33.0, 42.0, 51.0, 39.0, 47.0, 41.0, 29.0, 33.0, 27.0, 30.0, 23.0, 19.0, 13.0, 13.0, 21.0, 7.0, 19.0, 13.0, 7.0, 10.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-43.8133659362793, -42.58719253540039, -41.36101531982422, -40.13484191894531, -38.908668518066406, -37.682491302490234, -36.45631790161133, -35.230140686035156, -34.00396728515625, -32.777793884277344, -31.551616668701172, -30.325443267822266, -29.099267959594727, -27.873092651367188, -26.64691925048828, -25.420743942260742, -24.194568634033203, -22.968393325805664, -21.742218017578125, -20.51604461669922, -19.28986930847168, -18.06369400024414, -16.837520599365234, -15.611345291137695, -14.385169982910156, -13.158994674682617, -11.932820320129395, -10.706645965576172, -9.480470657348633, -8.254295349121094, -7.028120994567871, -5.801946640014648, -4.575767517089844, -3.349592685699463, -2.123417854309082, -0.8972430229187012, 0.3289318084716797, 1.5551066398620605, 2.7812814712524414, 4.007455825805664, 5.233631134033203, 6.459805965423584, 7.685980796813965, 8.912155151367188, 10.138330459594727, 11.364505767822266, 12.590680122375488, 13.816854476928711, 15.04302978515625, 16.26920509338379, 17.495380401611328, 18.721553802490234, 19.947729110717773, 21.173904418945312, 22.40007781982422, 23.626253128051758, 24.852428436279297, 26.078603744506836, 27.304779052734375, 28.53095245361328, 29.75712776184082, 30.98330307006836, 32.209476470947266, 33.43565368652344, 34.661827087402344]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 6.0, 4.0, 4.0, 5.0, 3.0, 8.0, 13.0, 6.0, 13.0, 12.0, 17.0, 15.0, 13.0, 19.0, 22.0, 34.0, 20.0, 34.0, 32.0, 37.0, 29.0, 35.0, 34.0, 41.0, 37.0, 45.0, 30.0, 37.0, 27.0, 34.0, 39.0, 36.0, 35.0, 26.0, 23.0, 22.0, 18.0, 15.0, 25.0, 13.0, 16.0, 12.0, 14.0, 7.0, 8.0, 6.0, 10.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.40625, -5.22894287109375, -5.0516357421875, -4.87432861328125, -4.697021484375, -4.51971435546875, -4.3424072265625, -4.16510009765625, -3.98779296875, -3.81048583984375, -3.6331787109375, -3.45587158203125, -3.278564453125, -3.10125732421875, -2.9239501953125, -2.74664306640625, -2.5693359375, -2.39202880859375, -2.2147216796875, -2.03741455078125, -1.860107421875, -1.68280029296875, -1.5054931640625, -1.32818603515625, -1.15087890625, -0.97357177734375, -0.7962646484375, -0.61895751953125, -0.441650390625, -0.26434326171875, -0.0870361328125, 0.09027099609375, 0.267578125, 0.44488525390625, 0.6221923828125, 0.79949951171875, 0.976806640625, 1.15411376953125, 1.3314208984375, 1.50872802734375, 1.68603515625, 1.86334228515625, 2.0406494140625, 2.21795654296875, 2.395263671875, 2.57257080078125, 2.7498779296875, 2.92718505859375, 3.1044921875, 3.28179931640625, 3.4591064453125, 3.63641357421875, 3.813720703125, 3.99102783203125, 4.1683349609375, 4.34564208984375, 4.52294921875, 4.70025634765625, 4.8775634765625, 5.05487060546875, 5.232177734375, 5.40948486328125, 5.5867919921875, 5.76409912109375, 5.94140625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 6.0, 6.0, 9.0, 12.0, 33.0, 49.0, 85.0, 86.0, 164.0, 226.0, 353.0, 587.0, 868.0, 1218.0, 2111.0, 3129.0, 5006.0, 8183.0, 12913.0, 21867.0, 38254.0, 69455.0, 136670.0, 295442.0, 218328.0, 102582.0, 54157.0, 30415.0, 17526.0, 10533.0, 6599.0, 4212.0, 2526.0, 1730.0, 1136.0, 687.0, 447.0, 308.0, 225.0, 146.0, 74.0, 58.0, 44.0, 30.0, 20.0, 21.0, 9.0, 8.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.3330078125, -0.3231544494628906, -0.31330108642578125, -0.3034477233886719, -0.2935943603515625, -0.2837409973144531, -0.27388763427734375, -0.2640342712402344, -0.254180908203125, -0.24432754516601562, -0.23447418212890625, -0.22462081909179688, -0.2147674560546875, -0.20491409301757812, -0.19506072998046875, -0.18520736694335938, -0.17535400390625, -0.16550064086914062, -0.15564727783203125, -0.14579391479492188, -0.1359405517578125, -0.12608718872070312, -0.11623382568359375, -0.10638046264648438, -0.096527099609375, -0.08667373657226562, -0.07682037353515625, -0.06696701049804688, -0.0571136474609375, -0.047260284423828125, -0.03740692138671875, -0.027553558349609375, -0.0177001953125, -0.007846832275390625, 0.00200653076171875, 0.011859893798828125, 0.0217132568359375, 0.031566619873046875, 0.04141998291015625, 0.051273345947265625, 0.061126708984375, 0.07098007202148438, 0.08083343505859375, 0.09068679809570312, 0.1005401611328125, 0.11039352416992188, 0.12024688720703125, 0.13010025024414062, 0.13995361328125, 0.14980697631835938, 0.15966033935546875, 0.16951370239257812, 0.1793670654296875, 0.18922042846679688, 0.19907379150390625, 0.20892715454101562, 0.218780517578125, 0.22863388061523438, 0.23848724365234375, 0.24834060668945312, 0.2581939697265625, 0.2680473327636719, 0.27790069580078125, 0.2877540588378906, 0.297607421875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 1.0, 3.0, 3.0, 7.0, 6.0, 8.0, 4.0, 10.0, 9.0, 5.0, 12.0, 16.0, 12.0, 8.0, 21.0, 20.0, 18.0, 24.0, 22.0, 30.0, 20.0, 39.0, 20.0, 39.0, 28.0, 31.0, 39.0, 1058.0, 33.0, 23.0, 37.0, 38.0, 27.0, 35.0, 29.0, 36.0, 24.0, 29.0, 27.0, 17.0, 24.0, 23.0, 22.0, 12.0, 12.0, 13.0, 8.0, 7.0, 12.0, 11.0, 10.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-3.685546875, -3.579833984375, -3.47412109375, -3.368408203125, -3.2626953125, -3.156982421875, -3.05126953125, -2.945556640625, -2.83984375, -2.734130859375, -2.62841796875, -2.522705078125, -2.4169921875, -2.311279296875, -2.20556640625, -2.099853515625, -1.994140625, -1.888427734375, -1.78271484375, -1.677001953125, -1.5712890625, -1.465576171875, -1.35986328125, -1.254150390625, -1.1484375, -1.042724609375, -0.93701171875, -0.831298828125, -0.7255859375, -0.619873046875, -0.51416015625, -0.408447265625, -0.302734375, -0.197021484375, -0.09130859375, 0.014404296875, 0.1201171875, 0.225830078125, 0.33154296875, 0.437255859375, 0.54296875, 0.648681640625, 0.75439453125, 0.860107421875, 0.9658203125, 1.071533203125, 1.17724609375, 1.282958984375, 1.388671875, 1.494384765625, 1.60009765625, 1.705810546875, 1.8115234375, 1.917236328125, 2.02294921875, 2.128662109375, 2.234375, 2.340087890625, 2.44580078125, 2.551513671875, 2.6572265625, 2.762939453125, 2.86865234375, 2.974365234375, 3.080078125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [7.0, 7.0, 14.0, 17.0, 23.0, 34.0, 28.0, 47.0, 66.0, 81.0, 123.0, 182.0, 272.0, 356.0, 501.0, 612.0, 893.0, 1107.0, 1570.0, 2169.0, 2903.0, 4188.0, 5687.0, 7902.0, 11348.0, 16307.0, 23831.0, 35077.0, 53301.0, 84798.0, 137819.0, 1250855.0, 161791.0, 99567.0, 62448.0, 40494.0, 26914.0, 18570.0, 12682.0, 9019.0, 6425.0, 4626.0, 3386.0, 2415.0, 1802.0, 1293.0, 976.0, 700.0, 536.0, 376.0, 294.0, 187.0, 164.0, 117.0, 70.0, 52.0, 45.0, 28.0, 16.0, 12.0, 8.0, 6.0, 4.0, 4.0], "bins": [-0.15869140625, -0.15368080139160156, -0.14867019653320312, -0.1436595916748047, -0.13864898681640625, -0.1336383819580078, -0.12862777709960938, -0.12361717224121094, -0.1186065673828125, -0.11359596252441406, -0.10858535766601562, -0.10357475280761719, -0.09856414794921875, -0.09355354309082031, -0.08854293823242188, -0.08353233337402344, -0.078521728515625, -0.07351112365722656, -0.06850051879882812, -0.06348991394042969, -0.05847930908203125, -0.05346870422363281, -0.048458099365234375, -0.04344749450683594, -0.0384368896484375, -0.03342628479003906, -0.028415679931640625, -0.023405075073242188, -0.01839447021484375, -0.013383865356445312, -0.008373260498046875, -0.0033626556396484375, 0.00164794921875, 0.0066585540771484375, 0.011669158935546875, 0.016679763793945312, 0.02169036865234375, 0.026700973510742188, 0.031711578369140625, 0.03672218322753906, 0.0417327880859375, 0.04674339294433594, 0.051753997802734375, 0.05676460266113281, 0.06177520751953125, 0.06678581237792969, 0.07179641723632812, 0.07680702209472656, 0.081817626953125, 0.08682823181152344, 0.09183883666992188, 0.09684944152832031, 0.10186004638671875, 0.10687065124511719, 0.11188125610351562, 0.11689186096191406, 0.1219024658203125, 0.12691307067871094, 0.13192367553710938, 0.1369342803955078, 0.14194488525390625, 0.1469554901123047, 0.15196609497070312, 0.15697669982910156, 0.1619873046875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 10.0, 3.0, 4.0, 1.0, 10.0, 5.0, 9.0, 4.0, 12.0, 20.0, 21.0, 39.0, 54.0, 95.0, 122.0, 139.0, 155.0, 97.0, 48.0, 45.0, 21.0, 23.0, 8.0, 14.0, 18.0, 6.0, 9.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00030350685119628906, -0.00029393285512924194, -0.0002843588590621948, -0.0002747848629951477, -0.0002652108669281006, -0.00025563687086105347, -0.00024606287479400635, -0.00023648887872695923, -0.0002269148826599121, -0.000217340886592865, -0.00020776689052581787, -0.00019819289445877075, -0.00018861889839172363, -0.00017904490232467651, -0.0001694709062576294, -0.00015989691019058228, -0.00015032291412353516, -0.00014074891805648804, -0.00013117492198944092, -0.0001216009259223938, -0.00011202692985534668, -0.00010245293378829956, -9.287893772125244e-05, -8.330494165420532e-05, -7.37309455871582e-05, -6.415694952011108e-05, -5.4582953453063965e-05, -4.5008957386016846e-05, -3.5434961318969727e-05, -2.5860965251922607e-05, -1.6286969184875488e-05, -6.712973117828369e-06, 2.86102294921875e-06, 1.2435019016265869e-05, 2.2009015083312988e-05, 3.158301115036011e-05, 4.1157007217407227e-05, 5.0731003284454346e-05, 6.0304999351501465e-05, 6.987899541854858e-05, 7.94529914855957e-05, 8.902698755264282e-05, 9.860098361968994e-05, 0.00010817497968673706, 0.00011774897575378418, 0.0001273229718208313, 0.00013689696788787842, 0.00014647096395492554, 0.00015604496002197266, 0.00016561895608901978, 0.0001751929521560669, 0.00018476694822311401, 0.00019434094429016113, 0.00020391494035720825, 0.00021348893642425537, 0.0002230629324913025, 0.0002326369285583496, 0.00024221092462539673, 0.00025178492069244385, 0.00026135891675949097, 0.0002709329128265381, 0.0002805069088935852, 0.0002900809049606323, 0.00029965490102767944, 0.00030922889709472656]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 4.0, 1.0, 5.0, 6.0, 13.0, 10.0, 19.0, 22.0, 27.0, 54.0, 77.0, 120.0, 234.0, 723.0, 10962.0, 1028055.0, 7004.0, 634.0, 248.0, 110.0, 60.0, 54.0, 24.0, 18.0, 20.0, 8.0, 15.0, 2.0, 7.0, 4.0, 5.0, 7.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006572723388671875, -0.006370186805725098, -0.00616765022277832, -0.005965113639831543, -0.005762577056884766, -0.005560040473937988, -0.005357503890991211, -0.005154967308044434, -0.004952430725097656, -0.004749894142150879, -0.0045473575592041016, -0.004344820976257324, -0.004142284393310547, -0.0039397478103637695, -0.003737211227416992, -0.003534674644470215, -0.0033321380615234375, -0.00312960147857666, -0.002927064895629883, -0.0027245283126831055, -0.002521991729736328, -0.0023194551467895508, -0.0021169185638427734, -0.001914381980895996, -0.0017118453979492188, -0.0015093088150024414, -0.001306772232055664, -0.0011042356491088867, -0.0009016990661621094, -0.000699162483215332, -0.0004966259002685547, -0.00029408931732177734, -9.1552734375e-05, 0.00011098384857177734, 0.0003135204315185547, 0.000516057014465332, 0.0007185935974121094, 0.0009211301803588867, 0.001123666763305664, 0.0013262033462524414, 0.0015287399291992188, 0.001731276512145996, 0.0019338130950927734, 0.0021363496780395508, 0.002338886260986328, 0.0025414228439331055, 0.002743959426879883, 0.00294649600982666, 0.0031490325927734375, 0.003351569175720215, 0.003554105758666992, 0.0037566423416137695, 0.003959178924560547, 0.004161715507507324, 0.0043642520904541016, 0.004566788673400879, 0.004769325256347656, 0.004971861839294434, 0.005174398422241211, 0.005376935005187988, 0.005579471588134766, 0.005782008171081543, 0.00598454475402832, 0.006187081336975098, 0.006389617919921875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 176.0, 809.0, 30.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013096180919092149, -7.412311970256269e-05, -1.7284430214203894e-05, 3.95542592741549e-05, 9.63929487625137e-05, 0.00015323162369895726, 0.0002100703277392313, 0.0002669090172275901, 0.00032374769216403365, 0.0003805863671004772, 0.00043742507114075124, 0.0004942637751810253, 0.0005511024501174688, 0.0006079411250539124, 0.000664779799990356, 0.0007216185331344604, 0.000778457208070904, 0.0008352958830073476, 0.0008921346161514521, 0.0009489732910878956, 0.0010058119660243392, 0.0010626506991684437, 0.0011194893158972263, 0.0011763280490413308, 0.0012331667821854353, 0.0012900055153295398, 0.0013468441320583224, 0.001403682865202427, 0.0014605214819312096, 0.001517360215075314, 0.0015741989482194185, 0.0016310375649482012, 0.0016878761816769838, 0.0017447149148210883, 0.001801553531549871, 0.0018583922646939754, 0.001915230881422758, 0.0019720694981515408, 0.002028908347710967, 0.0020857469644397497, 0.002142585813999176, 0.0021994244307279587, 0.002256263280287385, 0.0023131018970161676, 0.0023699405137449503, 0.0024267793633043766, 0.0024836179800331593, 0.002540456596761942, 0.0025972952134907246, 0.0026541338302195072, 0.0027109726797789335, 0.002767811296507716, 0.002824649913236499, 0.002881488762795925, 0.002938327379524708, 0.0029951659962534904, 0.003052004612982273, 0.0031088432297110558, 0.003165682079270482, 0.0032225206959992647, 0.0032793593127280474, 0.0033361981622874737, 0.0033930367790162563, 0.003449875395745039, 0.0035067142453044653]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 4.0, 4.0, 8.0, 7.0, 8.0, 19.0, 17.0, 22.0, 26.0, 34.0, 28.0, 44.0, 45.0, 44.0, 40.0, 48.0, 42.0, 58.0, 43.0, 54.0, 50.0, 40.0, 44.0, 44.0, 36.0, 34.0, 28.0, 29.0, 19.0, 18.0, 16.0, 16.0, 13.0, 8.0, 0.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0001665949821472168, -0.00016227364540100098, -0.00015795230865478516, -0.00015363097190856934, -0.00014930963516235352, -0.0001449882984161377, -0.00014066696166992188, -0.00013634562492370605, -0.00013202428817749023, -0.00012770295143127441, -0.0001233816146850586, -0.00011906027793884277, -0.00011473894119262695, -0.00011041760444641113, -0.00010609626770019531, -0.00010177493095397949, -9.745359420776367e-05, -9.313225746154785e-05, -8.881092071533203e-05, -8.448958396911621e-05, -8.016824722290039e-05, -7.584691047668457e-05, -7.152557373046875e-05, -6.720423698425293e-05, -6.288290023803711e-05, -5.856156349182129e-05, -5.424022674560547e-05, -4.991888999938965e-05, -4.559755325317383e-05, -4.127621650695801e-05, -3.695487976074219e-05, -3.263354301452637e-05, -2.8312206268310547e-05, -2.3990869522094727e-05, -1.9669532775878906e-05, -1.5348196029663086e-05, -1.1026859283447266e-05, -6.705522537231445e-06, -2.384185791015625e-06, 1.9371509552001953e-06, 6.258487701416016e-06, 1.0579824447631836e-05, 1.4901161193847656e-05, 1.9222497940063477e-05, 2.3543834686279297e-05, 2.7865171432495117e-05, 3.218650817871094e-05, 3.650784492492676e-05, 4.082918167114258e-05, 4.51505184173584e-05, 4.947185516357422e-05, 5.379319190979004e-05, 5.811452865600586e-05, 6.243586540222168e-05, 6.67572021484375e-05, 7.107853889465332e-05, 7.539987564086914e-05, 7.972121238708496e-05, 8.404254913330078e-05, 8.83638858795166e-05, 9.268522262573242e-05, 9.700655937194824e-05, 0.00010132789611816406, 0.00010564923286437988, 0.0001099705696105957]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 6.0, 4.0, 4.0, 5.0, 3.0, 8.0, 13.0, 6.0, 13.0, 12.0, 17.0, 15.0, 13.0, 19.0, 22.0, 34.0, 20.0, 34.0, 32.0, 37.0, 29.0, 35.0, 34.0, 41.0, 37.0, 45.0, 30.0, 37.0, 27.0, 34.0, 38.0, 37.0, 35.0, 26.0, 23.0, 22.0, 18.0, 15.0, 25.0, 13.0, 16.0, 12.0, 14.0, 7.0, 8.0, 6.0, 10.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-5.40625, -5.22894287109375, -5.0516357421875, -4.87432861328125, -4.697021484375, -4.51971435546875, -4.3424072265625, -4.16510009765625, -3.98779296875, -3.81048583984375, -3.6331787109375, -3.45587158203125, -3.278564453125, -3.10125732421875, -2.9239501953125, -2.74664306640625, -2.5693359375, -2.39202880859375, -2.2147216796875, -2.03741455078125, -1.860107421875, -1.68280029296875, -1.5054931640625, -1.32818603515625, -1.15087890625, -0.97357177734375, -0.7962646484375, -0.61895751953125, -0.441650390625, -0.26434326171875, -0.0870361328125, 0.09027099609375, 0.267578125, 0.44488525390625, 0.6221923828125, 0.79949951171875, 0.976806640625, 1.15411376953125, 1.3314208984375, 1.50872802734375, 1.68603515625, 1.86334228515625, 2.0406494140625, 2.21795654296875, 2.395263671875, 2.57257080078125, 2.7498779296875, 2.92718505859375, 3.1044921875, 3.28179931640625, 3.4591064453125, 3.63641357421875, 3.813720703125, 3.99102783203125, 4.1683349609375, 4.34564208984375, 4.52294921875, 4.70025634765625, 4.8775634765625, 5.05487060546875, 5.232177734375, 5.40948486328125, 5.5867919921875, 5.76409912109375, 5.94140625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 3.0, 7.0, 8.0, 8.0, 17.0, 22.0, 29.0, 44.0, 54.0, 72.0, 98.0, 146.0, 283.0, 407.0, 715.0, 1380.0, 2661.0, 4745.0, 9418.0, 18887.0, 39266.0, 88066.0, 228736.0, 368858.0, 158495.0, 65807.0, 30121.0, 14416.0, 7253.0, 3723.0, 2047.0, 1116.0, 553.0, 368.0, 213.0, 138.0, 124.0, 71.0, 48.0, 28.0, 25.0, 15.0, 12.0, 15.0, 11.0, 2.0, 9.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-5.95703125, -5.76055908203125, -5.5640869140625, -5.36761474609375, -5.171142578125, -4.97467041015625, -4.7781982421875, -4.58172607421875, -4.38525390625, -4.18878173828125, -3.9923095703125, -3.79583740234375, -3.599365234375, -3.40289306640625, -3.2064208984375, -3.00994873046875, -2.8134765625, -2.61700439453125, -2.4205322265625, -2.22406005859375, -2.027587890625, -1.83111572265625, -1.6346435546875, -1.43817138671875, -1.24169921875, -1.04522705078125, -0.8487548828125, -0.65228271484375, -0.455810546875, -0.25933837890625, -0.0628662109375, 0.13360595703125, 0.330078125, 0.52655029296875, 0.7230224609375, 0.91949462890625, 1.115966796875, 1.31243896484375, 1.5089111328125, 1.70538330078125, 1.90185546875, 2.09832763671875, 2.2947998046875, 2.49127197265625, 2.687744140625, 2.88421630859375, 3.0806884765625, 3.27716064453125, 3.4736328125, 3.67010498046875, 3.8665771484375, 4.06304931640625, 4.259521484375, 4.45599365234375, 4.6524658203125, 4.84893798828125, 5.04541015625, 5.24188232421875, 5.4383544921875, 5.63482666015625, 5.831298828125, 6.02777099609375, 6.2242431640625, 6.42071533203125, 6.6171875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 4.0, 4.0, 12.0, 5.0, 18.0, 15.0, 19.0, 23.0, 24.0, 36.0, 45.0, 37.0, 37.0, 48.0, 73.0, 87.0, 166.0, 1486.0, 317.0, 110.0, 77.0, 49.0, 49.0, 33.0, 35.0, 34.0, 36.0, 31.0, 21.0, 30.0, 15.0, 10.0, 13.0, 9.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-20.75, -20.1533203125, -19.556640625, -18.9599609375, -18.36328125, -17.7666015625, -17.169921875, -16.5732421875, -15.9765625, -15.3798828125, -14.783203125, -14.1865234375, -13.58984375, -12.9931640625, -12.396484375, -11.7998046875, -11.203125, -10.6064453125, -10.009765625, -9.4130859375, -8.81640625, -8.2197265625, -7.623046875, -7.0263671875, -6.4296875, -5.8330078125, -5.236328125, -4.6396484375, -4.04296875, -3.4462890625, -2.849609375, -2.2529296875, -1.65625, -1.0595703125, -0.462890625, 0.1337890625, 0.73046875, 1.3271484375, 1.923828125, 2.5205078125, 3.1171875, 3.7138671875, 4.310546875, 4.9072265625, 5.50390625, 6.1005859375, 6.697265625, 7.2939453125, 7.890625, 8.4873046875, 9.083984375, 9.6806640625, 10.27734375, 10.8740234375, 11.470703125, 12.0673828125, 12.6640625, 13.2607421875, 13.857421875, 14.4541015625, 15.05078125, 15.6474609375, 16.244140625, 16.8408203125, 17.4375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 1.0, 5.0, 9.0, 8.0, 16.0, 14.0, 23.0, 27.0, 30.0, 45.0, 52.0, 78.0, 122.0, 139.0, 206.0, 367.0, 896.0, 5832.0, 312002.0, 2801132.0, 21786.0, 1581.0, 470.0, 256.0, 172.0, 116.0, 75.0, 56.0, 51.0, 38.0, 28.0, 18.0, 8.0, 15.0, 5.0, 5.0, 8.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.34375, -39.19775390625, -38.0517578125, -36.90576171875, -35.759765625, -34.61376953125, -33.4677734375, -32.32177734375, -31.17578125, -30.02978515625, -28.8837890625, -27.73779296875, -26.591796875, -25.44580078125, -24.2998046875, -23.15380859375, -22.0078125, -20.86181640625, -19.7158203125, -18.56982421875, -17.423828125, -16.27783203125, -15.1318359375, -13.98583984375, -12.83984375, -11.69384765625, -10.5478515625, -9.40185546875, -8.255859375, -7.10986328125, -5.9638671875, -4.81787109375, -3.671875, -2.52587890625, -1.3798828125, -0.23388671875, 0.912109375, 2.05810546875, 3.2041015625, 4.35009765625, 5.49609375, 6.64208984375, 7.7880859375, 8.93408203125, 10.080078125, 11.22607421875, 12.3720703125, 13.51806640625, 14.6640625, 15.81005859375, 16.9560546875, 18.10205078125, 19.248046875, 20.39404296875, 21.5400390625, 22.68603515625, 23.83203125, 24.97802734375, 26.1240234375, 27.27001953125, 28.416015625, 29.56201171875, 30.7080078125, 31.85400390625, 33.0]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 257.0, 737.0, 25.0], "bins": [-478.84661865234375, -471.14825439453125, -463.4499206542969, -455.7515563964844, -448.05322265625, -440.3548583984375, -432.656494140625, -424.9581604003906, -417.2597961425781, -409.5614318847656, -401.86309814453125, -394.16473388671875, -386.4664001464844, -378.7680358886719, -371.0697021484375, -363.371337890625, -355.6729736328125, -347.974609375, -340.2762756347656, -332.5779113769531, -324.87957763671875, -317.18121337890625, -309.48284912109375, -301.7845153808594, -294.086181640625, -286.3878173828125, -278.6894836425781, -270.9911193847656, -263.29278564453125, -255.59442138671875, -247.8960723876953, -240.19772338867188, -232.49935913085938, -224.80101013183594, -217.1026611328125, -209.404296875, -201.70594787597656, -194.00759887695312, -186.3092498779297, -178.61090087890625, -170.91253662109375, -163.2141876220703, -155.51583862304688, -147.81747436523438, -140.11912536621094, -132.4207763671875, -124.72242736816406, -117.02407836914062, -109.32572937011719, -101.62738037109375, -93.92902374267578, -86.23067474365234, -78.53231811523438, -70.83396911621094, -63.1356201171875, -55.4372673034668, -47.738914489746094, -40.04056167602539, -32.34220886230469, -24.64385986328125, -16.945507049560547, -9.247154235839844, -1.5488052368164062, 6.149547576904297, 13.847900390625]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 5.0, 7.0, 7.0, 6.0, 18.0, 13.0, 11.0, 16.0, 20.0, 19.0, 26.0, 23.0, 20.0, 32.0, 35.0, 32.0, 43.0, 55.0, 36.0, 30.0, 42.0, 56.0, 42.0, 39.0, 29.0, 37.0, 41.0, 30.0, 27.0, 37.0, 23.0, 21.0, 21.0, 15.0, 13.0, 11.0, 11.0, 9.0, 11.0, 5.0, 3.0, 4.0, 7.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-42.76203536987305, -41.372535705566406, -39.98303985595703, -38.593544006347656, -37.204044342041016, -35.814544677734375, -34.425048828125, -33.035552978515625, -31.646053314208984, -30.256555557250977, -28.86705780029297, -27.47756004333496, -26.088062286376953, -24.698564529418945, -23.309066772460938, -21.91956901550293, -20.530071258544922, -19.140573501586914, -17.751075744628906, -16.3615779876709, -14.97208023071289, -13.582582473754883, -12.193084716796875, -10.803586959838867, -9.41408920288086, -8.024591445922852, -6.635093688964844, -5.245595932006836, -3.856098175048828, -2.4666004180908203, -1.0771026611328125, 0.3123950958251953, 1.7018966674804688, 3.0913944244384766, 4.480892181396484, 5.870389938354492, 7.2598876953125, 8.649385452270508, 10.038883209228516, 11.428380966186523, 12.817878723144531, 14.207376480102539, 15.596874237060547, 16.986371994018555, 18.375869750976562, 19.76536750793457, 21.154865264892578, 22.544363021850586, 23.933860778808594, 25.3233585357666, 26.71285629272461, 28.102354049682617, 29.491851806640625, 30.881349563598633, 32.27084732055664, 33.66034698486328, 35.049842834472656, 36.43933868408203, 37.82883834838867, 39.21833801269531, 40.60783386230469, 41.99732971191406, 43.3868293762207, 44.776329040527344, 46.16582489013672]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 3.0, 17.0, 15.0, 12.0, 15.0, 18.0, 15.0, 19.0, 16.0, 31.0, 24.0, 31.0, 31.0, 31.0, 31.0, 37.0, 42.0, 39.0, 41.0, 43.0, 33.0, 33.0, 38.0, 40.0, 29.0, 33.0, 38.0, 32.0, 30.0, 18.0, 19.0, 16.0, 22.0, 25.0, 9.0, 12.0, 12.0, 7.0, 10.0, 6.0, 2.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.69921875, -5.506103515625, -5.31298828125, -5.119873046875, -4.9267578125, -4.733642578125, -4.54052734375, -4.347412109375, -4.154296875, -3.961181640625, -3.76806640625, -3.574951171875, -3.3818359375, -3.188720703125, -2.99560546875, -2.802490234375, -2.609375, -2.416259765625, -2.22314453125, -2.030029296875, -1.8369140625, -1.643798828125, -1.45068359375, -1.257568359375, -1.064453125, -0.871337890625, -0.67822265625, -0.485107421875, -0.2919921875, -0.098876953125, 0.09423828125, 0.287353515625, 0.48046875, 0.673583984375, 0.86669921875, 1.059814453125, 1.2529296875, 1.446044921875, 1.63916015625, 1.832275390625, 2.025390625, 2.218505859375, 2.41162109375, 2.604736328125, 2.7978515625, 2.990966796875, 3.18408203125, 3.377197265625, 3.5703125, 3.763427734375, 3.95654296875, 4.149658203125, 4.3427734375, 4.535888671875, 4.72900390625, 4.922119140625, 5.115234375, 5.308349609375, 5.50146484375, 5.694580078125, 5.8876953125, 6.080810546875, 6.27392578125, 6.467041015625, 6.66015625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 4.0, 6.0, 5.0, 12.0, 16.0, 12.0, 19.0, 19.0, 18.0, 31.0, 30.0, 50.0, 55.0, 111.0, 206.0, 408.0, 1025.0, 2956.0, 13624.0, 209392.0, 3180894.0, 748721.0, 28928.0, 4808.0, 1534.0, 617.0, 300.0, 163.0, 80.0, 43.0, 35.0, 31.0, 25.0, 14.0, 16.0, 10.0, 8.0, 15.0, 5.0, 5.0, 9.0, 8.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.1875, -18.581787109375, -17.97607421875, -17.370361328125, -16.7646484375, -16.158935546875, -15.55322265625, -14.947509765625, -14.341796875, -13.736083984375, -13.13037109375, -12.524658203125, -11.9189453125, -11.313232421875, -10.70751953125, -10.101806640625, -9.49609375, -8.890380859375, -8.28466796875, -7.678955078125, -7.0732421875, -6.467529296875, -5.86181640625, -5.256103515625, -4.650390625, -4.044677734375, -3.43896484375, -2.833251953125, -2.2275390625, -1.621826171875, -1.01611328125, -0.410400390625, 0.1953125, 0.801025390625, 1.40673828125, 2.012451171875, 2.6181640625, 3.223876953125, 3.82958984375, 4.435302734375, 5.041015625, 5.646728515625, 6.25244140625, 6.858154296875, 7.4638671875, 8.069580078125, 8.67529296875, 9.281005859375, 9.88671875, 10.492431640625, 11.09814453125, 11.703857421875, 12.3095703125, 12.915283203125, 13.52099609375, 14.126708984375, 14.732421875, 15.338134765625, 15.94384765625, 16.549560546875, 17.1552734375, 17.760986328125, 18.36669921875, 18.972412109375, 19.578125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 9.0, 12.0, 2.0, 5.0, 8.0, 14.0, 17.0, 31.0, 26.0, 42.0, 57.0, 62.0, 75.0, 124.0, 184.0, 284.0, 392.0, 496.0, 570.0, 462.0, 331.0, 265.0, 163.0, 100.0, 70.0, 63.0, 40.0, 45.0, 23.0, 20.0, 11.0, 13.0, 11.0, 9.0, 9.0, 9.0, 1.0, 5.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.046875, -8.7279052734375, -8.408935546875, -8.0899658203125, -7.77099609375, -7.4520263671875, -7.133056640625, -6.8140869140625, -6.4951171875, -6.1761474609375, -5.857177734375, -5.5382080078125, -5.21923828125, -4.9002685546875, -4.581298828125, -4.2623291015625, -3.943359375, -3.6243896484375, -3.305419921875, -2.9864501953125, -2.66748046875, -2.3485107421875, -2.029541015625, -1.7105712890625, -1.3916015625, -1.0726318359375, -0.753662109375, -0.4346923828125, -0.11572265625, 0.2032470703125, 0.522216796875, 0.8411865234375, 1.16015625, 1.4791259765625, 1.798095703125, 2.1170654296875, 2.43603515625, 2.7550048828125, 3.073974609375, 3.3929443359375, 3.7119140625, 4.0308837890625, 4.349853515625, 4.6688232421875, 4.98779296875, 5.3067626953125, 5.625732421875, 5.9447021484375, 6.263671875, 6.5826416015625, 6.901611328125, 7.2205810546875, 7.53955078125, 7.8585205078125, 8.177490234375, 8.4964599609375, 8.8154296875, 9.1343994140625, 9.453369140625, 9.7723388671875, 10.09130859375, 10.4102783203125, 10.729248046875, 11.0482177734375, 11.3671875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 7.0, 6.0, 8.0, 7.0, 12.0, 17.0, 13.0, 20.0, 21.0, 34.0, 50.0, 47.0, 81.0, 116.0, 156.0, 262.0, 520.0, 1660.0, 9640.0, 169759.0, 3871619.0, 128818.0, 8443.0, 1514.0, 560.0, 276.0, 164.0, 107.0, 93.0, 65.0, 48.0, 45.0, 26.0, 14.0, 10.0, 4.0, 8.0, 11.0, 5.0, 4.0, 8.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-40.625, -39.4794921875, -38.333984375, -37.1884765625, -36.04296875, -34.8974609375, -33.751953125, -32.6064453125, -31.4609375, -30.3154296875, -29.169921875, -28.0244140625, -26.87890625, -25.7333984375, -24.587890625, -23.4423828125, -22.296875, -21.1513671875, -20.005859375, -18.8603515625, -17.71484375, -16.5693359375, -15.423828125, -14.2783203125, -13.1328125, -11.9873046875, -10.841796875, -9.6962890625, -8.55078125, -7.4052734375, -6.259765625, -5.1142578125, -3.96875, -2.8232421875, -1.677734375, -0.5322265625, 0.61328125, 1.7587890625, 2.904296875, 4.0498046875, 5.1953125, 6.3408203125, 7.486328125, 8.6318359375, 9.77734375, 10.9228515625, 12.068359375, 13.2138671875, 14.359375, 15.5048828125, 16.650390625, 17.7958984375, 18.94140625, 20.0869140625, 21.232421875, 22.3779296875, 23.5234375, 24.6689453125, 25.814453125, 26.9599609375, 28.10546875, 29.2509765625, 30.396484375, 31.5419921875, 32.6875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 18.0, 276.0, 553.0, 155.0, 15.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.67435455322266, -101.0995101928711, -94.52466583251953, -87.9498291015625, -81.37498474121094, -74.80014038085938, -68.22529602050781, -61.65045166015625, -55.07560729980469, -48.500762939453125, -41.92591857910156, -35.351078033447266, -28.776233673095703, -22.20138931274414, -15.626548767089844, -9.051704406738281, -2.4768600463867188, 4.097983360290527, 10.672826766967773, 17.247669219970703, 23.822513580322266, 30.397357940673828, 36.972198486328125, 43.54704284667969, 50.12188720703125, 56.69673156738281, 63.271575927734375, 69.84642028808594, 76.4212646484375, 82.99610900878906, 89.5709457397461, 96.14579010009766, 102.72064208984375, 109.29548645019531, 115.87033081054688, 122.44517517089844, 129.02001953125, 135.59486389160156, 142.16970825195312, 148.74453735351562, 155.31939697265625, 161.8942413330078, 168.46908569335938, 175.04393005371094, 181.6187744140625, 188.19361877441406, 194.76846313476562, 201.34329223632812, 207.9181365966797, 214.49298095703125, 221.0678253173828, 227.64266967773438, 234.21751403808594, 240.7923583984375, 247.3671875, 253.94204711914062, 260.5168762207031, 267.0917053222656, 273.66656494140625, 280.24139404296875, 286.8162536621094, 293.3910827636719, 299.9659423828125, 306.540771484375, 313.1156311035156]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 9.0, 11.0, 5.0, 10.0, 11.0, 16.0, 15.0, 16.0, 22.0, 21.0, 21.0, 36.0, 26.0, 51.0, 27.0, 34.0, 35.0, 30.0, 35.0, 41.0, 40.0, 40.0, 45.0, 40.0, 52.0, 36.0, 34.0, 29.0, 24.0, 27.0, 27.0, 14.0, 22.0, 14.0, 26.0, 12.0, 11.0, 10.0, 5.0, 9.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-36.977989196777344, -35.93315505981445, -34.88832092285156, -33.843482971191406, -32.798648834228516, -31.753814697265625, -30.708980560302734, -29.664146423339844, -28.61931037902832, -27.57447624206543, -26.529640197753906, -25.484806060791016, -24.439971923828125, -23.3951358795166, -22.35030174255371, -21.305465698242188, -20.260631561279297, -19.215797424316406, -18.170961380004883, -17.126127243041992, -16.08129119873047, -15.036457061767578, -13.991622924804688, -12.94678783416748, -11.901952743530273, -10.857117652893066, -9.81228256225586, -8.767448425292969, -7.722613334655762, -6.677778244018555, -5.632943630218506, -4.588109016418457, -3.543275833129883, -2.498440980911255, -1.453606128692627, -0.408771276473999, 0.6360635757446289, 1.680898666381836, 2.7257332801818848, 3.7705678939819336, 4.815402984619141, 5.860238075256348, 6.9050726890563965, 7.949907302856445, 8.994742393493652, 10.03957748413086, 11.08441162109375, 12.129246711730957, 13.174081802368164, 14.218916893005371, 15.263751983642578, 16.30858612060547, 17.35342025756836, 18.398256301879883, 19.443090438842773, 20.487926483154297, 21.532760620117188, 22.577594757080078, 23.6224308013916, 24.667264938354492, 25.712100982666016, 26.756935119628906, 27.801769256591797, 28.846603393554688, 29.89143943786621]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 8.0, 5.0, 12.0, 12.0, 30.0, 26.0, 29.0, 35.0, 32.0, 38.0, 37.0, 41.0, 55.0, 62.0, 61.0, 40.0, 45.0, 53.0, 70.0, 47.0, 38.0, 35.0, 29.0, 28.0, 23.0, 28.0, 24.0, 11.0, 13.0, 6.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.671875, -9.4132080078125, -9.154541015625, -8.8958740234375, -8.63720703125, -8.3785400390625, -8.119873046875, -7.8612060546875, -7.6025390625, -7.3438720703125, -7.085205078125, -6.8265380859375, -6.56787109375, -6.3092041015625, -6.050537109375, -5.7918701171875, -5.533203125, -5.2745361328125, -5.015869140625, -4.7572021484375, -4.49853515625, -4.2398681640625, -3.981201171875, -3.7225341796875, -3.4638671875, -3.2052001953125, -2.946533203125, -2.6878662109375, -2.42919921875, -2.1705322265625, -1.911865234375, -1.6531982421875, -1.39453125, -1.1358642578125, -0.877197265625, -0.6185302734375, -0.35986328125, -0.1011962890625, 0.157470703125, 0.4161376953125, 0.6748046875, 0.9334716796875, 1.192138671875, 1.4508056640625, 1.70947265625, 1.9681396484375, 2.226806640625, 2.4854736328125, 2.744140625, 3.0028076171875, 3.261474609375, 3.5201416015625, 3.77880859375, 4.0374755859375, 4.296142578125, 4.5548095703125, 4.8134765625, 5.0721435546875, 5.330810546875, 5.5894775390625, 5.84814453125, 6.1068115234375, 6.365478515625, 6.6241455078125, 6.8828125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 8.0, 13.0, 12.0, 16.0, 32.0, 41.0, 71.0, 107.0, 167.0, 297.0, 466.0, 766.0, 1244.0, 2195.0, 3899.0, 7108.0, 12478.0, 23348.0, 44054.0, 90613.0, 220050.0, 351102.0, 149046.0, 66795.0, 33864.0, 17873.0, 9837.0, 5339.0, 3144.0, 1867.0, 1050.0, 621.0, 395.0, 228.0, 149.0, 76.0, 53.0, 44.0, 25.0, 19.0, 10.0, 8.0, 6.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3857421875, -0.3737983703613281, -0.36185455322265625, -0.3499107360839844, -0.3379669189453125, -0.3260231018066406, -0.31407928466796875, -0.3021354675292969, -0.290191650390625, -0.2782478332519531, -0.26630401611328125, -0.2543601989746094, -0.2424163818359375, -0.23047256469726562, -0.21852874755859375, -0.20658493041992188, -0.19464111328125, -0.18269729614257812, -0.17075347900390625, -0.15880966186523438, -0.1468658447265625, -0.13492202758789062, -0.12297821044921875, -0.11103439331054688, -0.099090576171875, -0.08714675903320312, -0.07520294189453125, -0.06325912475585938, -0.0513153076171875, -0.039371490478515625, -0.02742767333984375, -0.015483856201171875, -0.0035400390625, 0.008403778076171875, 0.02034759521484375, 0.032291412353515625, 0.0442352294921875, 0.056179046630859375, 0.06812286376953125, 0.08006668090820312, 0.092010498046875, 0.10395431518554688, 0.11589813232421875, 0.12784194946289062, 0.1397857666015625, 0.15172958374023438, 0.16367340087890625, 0.17561721801757812, 0.18756103515625, 0.19950485229492188, 0.21144866943359375, 0.22339248657226562, 0.2353363037109375, 0.24728012084960938, 0.25922393798828125, 0.2711677551269531, 0.283111572265625, 0.2950553894042969, 0.30699920654296875, 0.3189430236816406, 0.3308868408203125, 0.3428306579589844, 0.35477447509765625, 0.3667182922363281, 0.378662109375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 9.0, 15.0, 13.0, 18.0, 19.0, 30.0, 26.0, 35.0, 25.0, 28.0, 39.0, 44.0, 40.0, 43.0, 43.0, 41.0, 1077.0, 44.0, 48.0, 43.0, 29.0, 39.0, 48.0, 36.0, 30.0, 32.0, 23.0, 16.0, 13.0, 16.0, 13.0, 9.0, 4.0, 6.0, 7.0, 8.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.813079833984375, -3.66717529296875, -3.521270751953125, -3.3753662109375, -3.229461669921875, -3.08355712890625, -2.937652587890625, -2.791748046875, -2.645843505859375, -2.49993896484375, -2.354034423828125, -2.2081298828125, -2.062225341796875, -1.91632080078125, -1.770416259765625, -1.62451171875, -1.478607177734375, -1.33270263671875, -1.186798095703125, -1.0408935546875, -0.894989013671875, -0.74908447265625, -0.603179931640625, -0.457275390625, -0.311370849609375, -0.16546630859375, -0.019561767578125, 0.1263427734375, 0.272247314453125, 0.41815185546875, 0.564056396484375, 0.7099609375, 0.855865478515625, 1.00177001953125, 1.147674560546875, 1.2935791015625, 1.439483642578125, 1.58538818359375, 1.731292724609375, 1.877197265625, 2.023101806640625, 2.16900634765625, 2.314910888671875, 2.4608154296875, 2.606719970703125, 2.75262451171875, 2.898529052734375, 3.04443359375, 3.190338134765625, 3.33624267578125, 3.482147216796875, 3.6280517578125, 3.773956298828125, 3.91986083984375, 4.065765380859375, 4.211669921875, 4.357574462890625, 4.50347900390625, 4.649383544921875, 4.7952880859375, 4.941192626953125, 5.08709716796875, 5.233001708984375, 5.37890625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 11.0, 16.0, 18.0, 41.0, 62.0, 104.0, 151.0, 252.0, 342.0, 540.0, 870.0, 1298.0, 1950.0, 3113.0, 4732.0, 7664.0, 12241.0, 20008.0, 34014.0, 58725.0, 107812.0, 209151.0, 1314363.0, 138802.0, 74045.0, 42241.0, 24648.0, 14790.0, 9021.0, 5775.0, 3664.0, 2367.0, 1438.0, 991.0, 620.0, 447.0, 270.0, 208.0, 107.0, 61.0, 48.0, 28.0, 29.0, 19.0, 10.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.2293701171875, -0.2222461700439453, -0.21512222290039062, -0.20799827575683594, -0.20087432861328125, -0.19375038146972656, -0.18662643432617188, -0.1795024871826172, -0.1723785400390625, -0.1652545928955078, -0.15813064575195312, -0.15100669860839844, -0.14388275146484375, -0.13675880432128906, -0.12963485717773438, -0.12251091003417969, -0.115386962890625, -0.10826301574707031, -0.10113906860351562, -0.09401512145996094, -0.08689117431640625, -0.07976722717285156, -0.07264328002929688, -0.06551933288574219, -0.0583953857421875, -0.05127143859863281, -0.044147491455078125, -0.03702354431152344, -0.02989959716796875, -0.022775650024414062, -0.015651702880859375, -0.008527755737304688, -0.00140380859375, 0.0057201385498046875, 0.012844085693359375, 0.019968032836914062, 0.02709197998046875, 0.03421592712402344, 0.041339874267578125, 0.04846382141113281, 0.0555877685546875, 0.06271171569824219, 0.06983566284179688, 0.07695960998535156, 0.08408355712890625, 0.09120750427246094, 0.09833145141601562, 0.10545539855957031, 0.112579345703125, 0.11970329284667969, 0.12682723999023438, 0.13395118713378906, 0.14107513427734375, 0.14819908142089844, 0.15532302856445312, 0.1624469757080078, 0.1695709228515625, 0.1766948699951172, 0.18381881713867188, 0.19094276428222656, 0.19806671142578125, 0.20519065856933594, 0.21231460571289062, 0.2194385528564453, 0.2265625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 5.0, 9.0, 10.0, 13.0, 8.0, 8.0, 18.0, 26.0, 33.0, 34.0, 44.0, 47.0, 65.0, 56.0, 59.0, 82.0, 75.0, 61.0, 58.0, 53.0, 50.0, 33.0, 34.0, 21.0, 15.0, 22.0, 7.0, 10.0, 11.0, 6.0, 4.0, 5.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003516674041748047, -0.00034119561314582825, -0.0003307238221168518, -0.00032025203108787537, -0.0003097802400588989, -0.0002993084490299225, -0.00028883665800094604, -0.0002783648669719696, -0.00026789307594299316, -0.0002574212849140167, -0.0002469494938850403, -0.00023647770285606384, -0.0002260059118270874, -0.00021553412079811096, -0.00020506232976913452, -0.00019459053874015808, -0.00018411874771118164, -0.0001736469566822052, -0.00016317516565322876, -0.00015270337462425232, -0.00014223158359527588, -0.00013175979256629944, -0.000121288001537323, -0.00011081621050834656, -0.00010034441947937012, -8.987262845039368e-05, -7.940083742141724e-05, -6.89290463924408e-05, -5.8457255363464355e-05, -4.7985464334487915e-05, -3.7513673305511475e-05, -2.7041882276535034e-05, -1.6570091247558594e-05, -6.098300218582153e-06, 4.373490810394287e-06, 1.4845281839370728e-05, 2.5317072868347168e-05, 3.578886389732361e-05, 4.626065492630005e-05, 5.673244595527649e-05, 6.720423698425293e-05, 7.767602801322937e-05, 8.814781904220581e-05, 9.861961007118225e-05, 0.00010909140110015869, 0.00011956319212913513, 0.00013003498315811157, 0.000140506774187088, 0.00015097856521606445, 0.0001614503562450409, 0.00017192214727401733, 0.00018239393830299377, 0.00019286572933197021, 0.00020333752036094666, 0.0002138093113899231, 0.00022428110241889954, 0.00023475289344787598, 0.0002452246844768524, 0.00025569647550582886, 0.0002661682665348053, 0.00027664005756378174, 0.0002871118485927582, 0.0002975836396217346, 0.00030805543065071106, 0.0003185272216796875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 4.0, 5.0, 2.0, 5.0, 7.0, 8.0, 14.0, 15.0, 20.0, 24.0, 27.0, 46.0, 42.0, 74.0, 123.0, 169.0, 324.0, 867.0, 20678.0, 1019646.0, 5108.0, 570.0, 242.0, 159.0, 101.0, 65.0, 56.0, 43.0, 28.0, 15.0, 6.0, 11.0, 14.0, 10.0, 5.0, 8.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00695037841796875, -0.006721436977386475, -0.006492495536804199, -0.006263554096221924, -0.0060346126556396484, -0.005805671215057373, -0.005576729774475098, -0.005347788333892822, -0.005118846893310547, -0.0048899054527282715, -0.004660964012145996, -0.004432022571563721, -0.004203081130981445, -0.00397413969039917, -0.0037451982498168945, -0.003516256809234619, -0.0032873153686523438, -0.0030583739280700684, -0.002829432487487793, -0.0026004910469055176, -0.002371549606323242, -0.002142608165740967, -0.0019136667251586914, -0.001684725284576416, -0.0014557838439941406, -0.0012268424034118652, -0.0009979009628295898, -0.0007689595222473145, -0.0005400180816650391, -0.00031107664108276367, -8.213520050048828e-05, 0.0001468062400817871, 0.0003757476806640625, 0.0006046891212463379, 0.0008336305618286133, 0.0010625720024108887, 0.001291513442993164, 0.0015204548835754395, 0.0017493963241577148, 0.0019783377647399902, 0.0022072792053222656, 0.002436220645904541, 0.0026651620864868164, 0.002894103527069092, 0.003123044967651367, 0.0033519864082336426, 0.003580927848815918, 0.0038098692893981934, 0.004038810729980469, 0.004267752170562744, 0.0044966936111450195, 0.004725635051727295, 0.00495457649230957, 0.005183517932891846, 0.005412459373474121, 0.0056414008140563965, 0.005870342254638672, 0.006099283695220947, 0.006328225135803223, 0.006557166576385498, 0.0067861080169677734, 0.007015049457550049, 0.007243990898132324, 0.0074729323387146, 0.007701873779296875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 796.0, 220.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020801069331355393, -9.725535346660763e-05, 1.3499986380338669e-05, 0.0001242553407792002, 0.00023501066607423127, 0.00034576599136926234, 0.0004565213748719543, 0.0005672767292708158, 0.0006780320545658469, 0.000788787379860878, 0.0008995427051559091, 0.0010102980304509401, 0.001121053472161293, 0.0012318086810410023, 0.0013425641227513552, 0.0014533194480463862, 0.0015640747733414173, 0.0016748300986364484, 0.0017855854239314795, 0.0018963408656418324, 0.0020070960745215416, 0.0021178515162318945, 0.0022286069579422474, 0.0023393621668219566, 0.002450117375701666, 0.0025608728174120188, 0.002671628026291728, 0.002782383468002081, 0.00289313867688179, 0.003003894118592143, 0.003114649560302496, 0.003225404769182205, 0.0033361599780619144, 0.0034469154197722673, 0.0035576706286519766, 0.0036684260703623295, 0.0037791812792420387, 0.0038899367209523916, 0.0040006921626627445, 0.004111447371542454, 0.004222202580422163, 0.004332957789301872, 0.004443713463842869, 0.004554468672722578, 0.004665223881602287, 0.0047759790904819965, 0.004886734765022993, 0.004997489973902702, 0.005108245648443699, 0.005219000857323408, 0.005329756531864405, 0.005440511740744114, 0.005551266949623823, 0.005662022158503532, 0.005772777833044529, 0.005883533041924238, 0.0059942882508039474, 0.006105043459683657, 0.006215799134224653, 0.0063265543431043625, 0.006437309551984072, 0.006548064760863781, 0.0066588204354047775, 0.006769575644284487, 0.006880330853164196]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 5.0, 3.0, 2.0, 7.0, 10.0, 14.0, 16.0, 17.0, 24.0, 29.0, 23.0, 44.0, 36.0, 38.0, 44.0, 56.0, 48.0, 49.0, 70.0, 60.0, 55.0, 53.0, 47.0, 33.0, 33.0, 39.0, 31.0, 26.0, 21.0, 22.0, 12.0, 19.0, 9.0, 6.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.00030040740966796875, -0.0002930592745542526, -0.0002857111394405365, -0.0002783630043268204, -0.00027101486921310425, -0.0002636667340993881, -0.000256318598985672, -0.00024897046387195587, -0.00024162232875823975, -0.00023427419364452362, -0.0002269260585308075, -0.00021957792341709137, -0.00021222978830337524, -0.00020488165318965912, -0.000197533518075943, -0.00019018538296222687, -0.00018283724784851074, -0.00017548911273479462, -0.0001681409776210785, -0.00016079284250736237, -0.00015344470739364624, -0.00014609657227993011, -0.000138748437166214, -0.00013140030205249786, -0.00012405216693878174, -0.00011670403182506561, -0.00010935589671134949, -0.00010200776159763336, -9.465962648391724e-05, -8.731149137020111e-05, -7.996335625648499e-05, -7.261522114276886e-05, -6.526708602905273e-05, -5.791895091533661e-05, -5.0570815801620483e-05, -4.322268068790436e-05, -3.587454557418823e-05, -2.8526410460472107e-05, -2.117827534675598e-05, -1.3830140233039856e-05, -6.4820051193237305e-06, 8.66129994392395e-07, 8.21426510810852e-06, 1.5562400221824646e-05, 2.291053533554077e-05, 3.0258670449256897e-05, 3.760680556297302e-05, 4.495494067668915e-05, 5.2303075790405273e-05, 5.96512109041214e-05, 6.699934601783752e-05, 7.434748113155365e-05, 8.169561624526978e-05, 8.90437513589859e-05, 9.639188647270203e-05, 0.00010374002158641815, 0.00011108815670013428, 0.0001184362918138504, 0.00012578442692756653, 0.00013313256204128265, 0.00014048069715499878, 0.0001478288322687149, 0.00015517696738243103, 0.00016252510249614716, 0.00016987323760986328]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 8.0, 5.0, 12.0, 12.0, 30.0, 26.0, 29.0, 35.0, 32.0, 38.0, 37.0, 41.0, 55.0, 62.0, 61.0, 40.0, 45.0, 53.0, 70.0, 47.0, 38.0, 35.0, 29.0, 28.0, 23.0, 28.0, 24.0, 11.0, 13.0, 6.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.671875, -9.4132080078125, -9.154541015625, -8.8958740234375, -8.63720703125, -8.3785400390625, -8.119873046875, -7.8612060546875, -7.6025390625, -7.3438720703125, -7.085205078125, -6.8265380859375, -6.56787109375, -6.3092041015625, -6.050537109375, -5.7918701171875, -5.533203125, -5.2745361328125, -5.015869140625, -4.7572021484375, -4.49853515625, -4.2398681640625, -3.981201171875, -3.7225341796875, -3.4638671875, -3.2052001953125, -2.946533203125, -2.6878662109375, -2.42919921875, -2.1705322265625, -1.911865234375, -1.6531982421875, -1.39453125, -1.1358642578125, -0.877197265625, -0.6185302734375, -0.35986328125, -0.1011962890625, 0.157470703125, 0.4161376953125, 0.6748046875, 0.9334716796875, 1.192138671875, 1.4508056640625, 1.70947265625, 1.9681396484375, 2.226806640625, 2.4854736328125, 2.744140625, 3.0028076171875, 3.261474609375, 3.5201416015625, 3.77880859375, 4.0374755859375, 4.296142578125, 4.5548095703125, 4.8134765625, 5.0721435546875, 5.330810546875, 5.5894775390625, 5.84814453125, 6.1068115234375, 6.365478515625, 6.6241455078125, 6.8828125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 10.0, 11.0, 22.0, 34.0, 51.0, 78.0, 107.0, 171.0, 311.0, 519.0, 956.0, 2042.0, 4615.0, 14015.0, 82677.0, 816673.0, 101197.0, 15533.0, 4961.0, 2095.0, 1099.0, 554.0, 336.0, 182.0, 96.0, 70.0, 54.0, 31.0, 14.0, 15.0, 7.0, 8.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.921875, -18.3740234375, -17.826171875, -17.2783203125, -16.73046875, -16.1826171875, -15.634765625, -15.0869140625, -14.5390625, -13.9912109375, -13.443359375, -12.8955078125, -12.34765625, -11.7998046875, -11.251953125, -10.7041015625, -10.15625, -9.6083984375, -9.060546875, -8.5126953125, -7.96484375, -7.4169921875, -6.869140625, -6.3212890625, -5.7734375, -5.2255859375, -4.677734375, -4.1298828125, -3.58203125, -3.0341796875, -2.486328125, -1.9384765625, -1.390625, -0.8427734375, -0.294921875, 0.2529296875, 0.80078125, 1.3486328125, 1.896484375, 2.4443359375, 2.9921875, 3.5400390625, 4.087890625, 4.6357421875, 5.18359375, 5.7314453125, 6.279296875, 6.8271484375, 7.375, 7.9228515625, 8.470703125, 9.0185546875, 9.56640625, 10.1142578125, 10.662109375, 11.2099609375, 11.7578125, 12.3056640625, 12.853515625, 13.4013671875, 13.94921875, 14.4970703125, 15.044921875, 15.5927734375, 16.140625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 5.0, 3.0, 3.0, 4.0, 4.0, 12.0, 12.0, 10.0, 15.0, 25.0, 12.0, 21.0, 16.0, 31.0, 25.0, 29.0, 32.0, 41.0, 38.0, 51.0, 63.0, 121.0, 273.0, 1468.0, 201.0, 84.0, 72.0, 37.0, 38.0, 43.0, 33.0, 40.0, 26.0, 22.0, 23.0, 14.0, 17.0, 14.0, 13.0, 10.0, 8.0, 6.0, 8.0, 6.0, 8.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-17.4375, -16.943603515625, -16.44970703125, -15.955810546875, -15.4619140625, -14.968017578125, -14.47412109375, -13.980224609375, -13.486328125, -12.992431640625, -12.49853515625, -12.004638671875, -11.5107421875, -11.016845703125, -10.52294921875, -10.029052734375, -9.53515625, -9.041259765625, -8.54736328125, -8.053466796875, -7.5595703125, -7.065673828125, -6.57177734375, -6.077880859375, -5.583984375, -5.090087890625, -4.59619140625, -4.102294921875, -3.6083984375, -3.114501953125, -2.62060546875, -2.126708984375, -1.6328125, -1.138916015625, -0.64501953125, -0.151123046875, 0.3427734375, 0.836669921875, 1.33056640625, 1.824462890625, 2.318359375, 2.812255859375, 3.30615234375, 3.800048828125, 4.2939453125, 4.787841796875, 5.28173828125, 5.775634765625, 6.26953125, 6.763427734375, 7.25732421875, 7.751220703125, 8.2451171875, 8.739013671875, 9.23291015625, 9.726806640625, 10.220703125, 10.714599609375, 11.20849609375, 11.702392578125, 12.1962890625, 12.690185546875, 13.18408203125, 13.677978515625, 14.171875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 8.0, 9.0, 11.0, 15.0, 16.0, 25.0, 29.0, 34.0, 41.0, 65.0, 107.0, 133.0, 294.0, 896.0, 10446.0, 3063431.0, 67284.0, 1860.0, 432.0, 186.0, 113.0, 73.0, 49.0, 40.0, 36.0, 25.0, 23.0, 9.0, 7.0, 6.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.1875, -50.4306640625, -48.673828125, -46.9169921875, -45.16015625, -43.4033203125, -41.646484375, -39.8896484375, -38.1328125, -36.3759765625, -34.619140625, -32.8623046875, -31.10546875, -29.3486328125, -27.591796875, -25.8349609375, -24.078125, -22.3212890625, -20.564453125, -18.8076171875, -17.05078125, -15.2939453125, -13.537109375, -11.7802734375, -10.0234375, -8.2666015625, -6.509765625, -4.7529296875, -2.99609375, -1.2392578125, 0.517578125, 2.2744140625, 4.03125, 5.7880859375, 7.544921875, 9.3017578125, 11.05859375, 12.8154296875, 14.572265625, 16.3291015625, 18.0859375, 19.8427734375, 21.599609375, 23.3564453125, 25.11328125, 26.8701171875, 28.626953125, 30.3837890625, 32.140625, 33.8974609375, 35.654296875, 37.4111328125, 39.16796875, 40.9248046875, 42.681640625, 44.4384765625, 46.1953125, 47.9521484375, 49.708984375, 51.4658203125, 53.22265625, 54.9794921875, 56.736328125, 58.4931640625, 60.25]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 165.0, 641.0, 191.0, 12.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.22120666503906, -87.34039306640625, -83.45957946777344, -79.5787582397461, -75.69794464111328, -71.81713104248047, -67.93631744384766, -64.05549621582031, -60.1746826171875, -56.29386901855469, -52.41305160522461, -48.5322380065918, -44.65142059326172, -40.770606994628906, -36.889793395996094, -33.008975982666016, -29.128162384033203, -25.247346878051758, -21.366531372070312, -17.4857177734375, -13.604901313781738, -9.72408676147461, -5.843271255493164, -1.9624557495117188, 1.9183597564697266, 5.799175262451172, 9.679990768432617, 13.560805320739746, 17.441619873046875, 21.32243537902832, 25.203250885009766, 29.08406639099121, 32.964881896972656, 36.84569549560547, 40.72651290893555, 44.60732650756836, 48.48814392089844, 52.36895751953125, 56.24977111816406, 60.13058853149414, 64.01140594482422, 67.89221954345703, 71.77303314208984, 75.65385437011719, 79.53466796875, 83.41548156738281, 87.29629516601562, 91.17710876464844, 95.05792236328125, 98.93873596191406, 102.81954956054688, 106.70037078857422, 110.58118438720703, 114.46199798583984, 118.34281158447266, 122.2236328125, 126.10444641113281, 129.98526000976562, 133.86607360839844, 137.74688720703125, 141.62770080566406, 145.50851440429688, 149.38934326171875, 153.27015686035156, 157.15097045898438]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 5.0, 0.0, 0.0, 7.0, 9.0, 4.0, 8.0, 8.0, 8.0, 16.0, 15.0, 11.0, 14.0, 22.0, 24.0, 22.0, 27.0, 31.0, 36.0, 33.0, 40.0, 34.0, 32.0, 45.0, 39.0, 41.0, 53.0, 43.0, 42.0, 43.0, 30.0, 40.0, 36.0, 26.0, 26.0, 26.0, 20.0, 20.0, 19.0, 9.0, 6.0, 7.0, 8.0, 6.0, 6.0, 6.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.70075607299805, -41.321895599365234, -39.94303512573242, -38.564178466796875, -37.18531799316406, -35.80645751953125, -34.42759704589844, -33.048736572265625, -31.669878005981445, -30.291017532348633, -28.912158966064453, -27.53329849243164, -26.154438018798828, -24.77557945251465, -23.396718978881836, -22.017860412597656, -20.638999938964844, -19.26013946533203, -17.88128089904785, -16.50242042541504, -15.123560905456543, -13.744701385498047, -12.365840911865234, -10.986981391906738, -9.608121871948242, -8.229262351989746, -6.850402355194092, -5.4715423583984375, -4.092682838439941, -2.7138233184814453, -1.3349628448486328, 0.04389667510986328, 1.422760009765625, 2.8016197681427, 4.180479526519775, 5.55933952331543, 6.938199043273926, 8.317058563232422, 9.695919036865234, 11.07477855682373, 12.453638076782227, 13.832497596740723, 15.211357116699219, 16.59021759033203, 17.969078063964844, 19.347936630249023, 20.726797103881836, 22.105655670166016, 23.484516143798828, 24.86337661743164, 26.24223518371582, 27.621095657348633, 28.999954223632812, 30.378814697265625, 31.757675170898438, 33.13653564453125, 34.51539611816406, 35.894256591796875, 37.27311706542969, 38.6519775390625, 40.03083419799805, 41.40969467163086, 42.78855514526367, 44.167415618896484, 45.54627227783203]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 0.0, 6.0, 14.0, 5.0, 12.0, 11.0, 31.0, 23.0, 23.0, 27.0, 35.0, 36.0, 46.0, 44.0, 47.0, 52.0, 39.0, 53.0, 62.0, 52.0, 41.0, 42.0, 45.0, 41.0, 39.0, 26.0, 34.0, 25.0, 23.0, 10.0, 12.0, 10.0, 9.0, 13.0, 4.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-9.9296875, -9.6739501953125, -9.418212890625, -9.1624755859375, -8.90673828125, -8.6510009765625, -8.395263671875, -8.1395263671875, -7.8837890625, -7.6280517578125, -7.372314453125, -7.1165771484375, -6.86083984375, -6.6051025390625, -6.349365234375, -6.0936279296875, -5.837890625, -5.5821533203125, -5.326416015625, -5.0706787109375, -4.81494140625, -4.5592041015625, -4.303466796875, -4.0477294921875, -3.7919921875, -3.5362548828125, -3.280517578125, -3.0247802734375, -2.76904296875, -2.5133056640625, -2.257568359375, -2.0018310546875, -1.74609375, -1.4903564453125, -1.234619140625, -0.9788818359375, -0.72314453125, -0.4674072265625, -0.211669921875, 0.0440673828125, 0.2998046875, 0.5555419921875, 0.811279296875, 1.0670166015625, 1.32275390625, 1.5784912109375, 1.834228515625, 2.0899658203125, 2.345703125, 2.6014404296875, 2.857177734375, 3.1129150390625, 3.36865234375, 3.6243896484375, 3.880126953125, 4.1358642578125, 4.3916015625, 4.6473388671875, 4.903076171875, 5.1588134765625, 5.41455078125, 5.6702880859375, 5.926025390625, 6.1817626953125, 6.4375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 8.0, 9.0, 15.0, 15.0, 28.0, 32.0, 55.0, 65.0, 89.0, 162.0, 265.0, 567.0, 1202.0, 3521.0, 15535.0, 231300.0, 2960020.0, 930848.0, 40300.0, 6629.0, 1903.0, 758.0, 373.0, 221.0, 110.0, 75.0, 42.0, 37.0, 25.0, 13.0, 12.0, 13.0, 9.0, 9.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.984375, -20.427978515625, -19.87158203125, -19.315185546875, -18.7587890625, -18.202392578125, -17.64599609375, -17.089599609375, -16.533203125, -15.976806640625, -15.42041015625, -14.864013671875, -14.3076171875, -13.751220703125, -13.19482421875, -12.638427734375, -12.08203125, -11.525634765625, -10.96923828125, -10.412841796875, -9.8564453125, -9.300048828125, -8.74365234375, -8.187255859375, -7.630859375, -7.074462890625, -6.51806640625, -5.961669921875, -5.4052734375, -4.848876953125, -4.29248046875, -3.736083984375, -3.1796875, -2.623291015625, -2.06689453125, -1.510498046875, -0.9541015625, -0.397705078125, 0.15869140625, 0.715087890625, 1.271484375, 1.827880859375, 2.38427734375, 2.940673828125, 3.4970703125, 4.053466796875, 4.60986328125, 5.166259765625, 5.72265625, 6.279052734375, 6.83544921875, 7.391845703125, 7.9482421875, 8.504638671875, 9.06103515625, 9.617431640625, 10.173828125, 10.730224609375, 11.28662109375, 11.843017578125, 12.3994140625, 12.955810546875, 13.51220703125, 14.068603515625, 14.625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 7.0, 5.0, 2.0, 3.0, 9.0, 18.0, 16.0, 20.0, 26.0, 36.0, 53.0, 67.0, 93.0, 136.0, 198.0, 323.0, 477.0, 553.0, 553.0, 444.0, 330.0, 213.0, 157.0, 97.0, 53.0, 46.0, 36.0, 25.0, 11.0, 13.0, 11.0, 9.0, 12.0, 3.0, 4.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.015625, -10.69189453125, -10.3681640625, -10.04443359375, -9.720703125, -9.39697265625, -9.0732421875, -8.74951171875, -8.42578125, -8.10205078125, -7.7783203125, -7.45458984375, -7.130859375, -6.80712890625, -6.4833984375, -6.15966796875, -5.8359375, -5.51220703125, -5.1884765625, -4.86474609375, -4.541015625, -4.21728515625, -3.8935546875, -3.56982421875, -3.24609375, -2.92236328125, -2.5986328125, -2.27490234375, -1.951171875, -1.62744140625, -1.3037109375, -0.97998046875, -0.65625, -0.33251953125, -0.0087890625, 0.31494140625, 0.638671875, 0.96240234375, 1.2861328125, 1.60986328125, 1.93359375, 2.25732421875, 2.5810546875, 2.90478515625, 3.228515625, 3.55224609375, 3.8759765625, 4.19970703125, 4.5234375, 4.84716796875, 5.1708984375, 5.49462890625, 5.818359375, 6.14208984375, 6.4658203125, 6.78955078125, 7.11328125, 7.43701171875, 7.7607421875, 8.08447265625, 8.408203125, 8.73193359375, 9.0556640625, 9.37939453125, 9.703125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 3.0, 3.0, 15.0, 18.0, 15.0, 23.0, 26.0, 52.0, 68.0, 91.0, 158.0, 218.0, 415.0, 880.0, 2593.0, 12131.0, 131558.0, 3616194.0, 401799.0, 21501.0, 3915.0, 1201.0, 514.0, 287.0, 163.0, 126.0, 80.0, 54.0, 56.0, 27.0, 27.0, 22.0, 9.0, 6.0, 6.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.125, -24.277587890625, -23.43017578125, -22.582763671875, -21.7353515625, -20.887939453125, -20.04052734375, -19.193115234375, -18.345703125, -17.498291015625, -16.65087890625, -15.803466796875, -14.9560546875, -14.108642578125, -13.26123046875, -12.413818359375, -11.56640625, -10.718994140625, -9.87158203125, -9.024169921875, -8.1767578125, -7.329345703125, -6.48193359375, -5.634521484375, -4.787109375, -3.939697265625, -3.09228515625, -2.244873046875, -1.3974609375, -0.550048828125, 0.29736328125, 1.144775390625, 1.9921875, 2.839599609375, 3.68701171875, 4.534423828125, 5.3818359375, 6.229248046875, 7.07666015625, 7.924072265625, 8.771484375, 9.618896484375, 10.46630859375, 11.313720703125, 12.1611328125, 13.008544921875, 13.85595703125, 14.703369140625, 15.55078125, 16.398193359375, 17.24560546875, 18.093017578125, 18.9404296875, 19.787841796875, 20.63525390625, 21.482666015625, 22.330078125, 23.177490234375, 24.02490234375, 24.872314453125, 25.7197265625, 26.567138671875, 27.41455078125, 28.261962890625, 29.109375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 17.0, 76.0, 197.0, 322.0, 247.0, 102.0, 33.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.93488121032715, -28.945446014404297, -25.956010818481445, -22.966575622558594, -19.97713851928711, -16.98770523071289, -13.998268127441406, -11.008832931518555, -8.019397735595703, -5.029962539672852, -2.040526866912842, 0.948908805847168, 3.9383440017700195, 6.927779197692871, 9.917215347290039, 12.90665054321289, 15.896085739135742, 18.885520935058594, 21.874956130981445, 24.864391326904297, 27.85382843017578, 30.84326171875, 33.832698822021484, 36.82213592529297, 39.81156921386719, 42.80100631713867, 45.79043960571289, 48.779876708984375, 51.769309997558594, 54.75874710083008, 57.74818420410156, 60.73761749267578, 63.72705841064453, 66.71649169921875, 69.7059326171875, 72.69536590576172, 75.68479919433594, 78.67423248291016, 81.6636734008789, 84.65310668945312, 87.64253997802734, 90.63197326660156, 93.62141418457031, 96.61084747314453, 99.60028076171875, 102.58971405029297, 105.57915496826172, 108.56858825683594, 111.55802917480469, 114.5474624633789, 117.53690338134766, 120.52633666992188, 123.5157699584961, 126.50520324707031, 129.49464416503906, 132.48406982421875, 135.4735107421875, 138.46295166015625, 141.45237731933594, 144.4418182373047, 147.43125915527344, 150.42068481445312, 153.41012573242188, 156.39956665039062, 159.3889923095703]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 9.0, 6.0, 10.0, 8.0, 17.0, 15.0, 15.0, 26.0, 26.0, 24.0, 24.0, 23.0, 30.0, 29.0, 31.0, 37.0, 38.0, 40.0, 34.0, 41.0, 29.0, 41.0, 33.0, 44.0, 36.0, 29.0, 42.0, 21.0, 41.0, 27.0, 30.0, 20.0, 22.0, 12.0, 17.0, 10.0, 8.0, 9.0, 11.0, 8.0, 4.0, 7.0, 4.0, 1.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.238014221191406, -24.36113739013672, -23.48426055908203, -22.60738182067871, -21.730504989624023, -20.853628158569336, -19.976749420166016, -19.099872589111328, -18.22299575805664, -17.346118927001953, -16.469242095947266, -15.592363357543945, -14.715486526489258, -13.83860969543457, -12.961731910705566, -12.084854125976562, -11.207977294921875, -10.331100463867188, -9.454222679138184, -8.57734489440918, -7.700468063354492, -6.8235907554626465, -5.946713447570801, -5.069836139678955, -4.192958831787109, -3.3160815238952637, -2.439204216003418, -1.5623269081115723, -0.6854496002197266, 0.19142770767211914, 1.0683050155639648, 1.9451823234558105, 2.8220577239990234, 3.698935031890869, 4.575812339782715, 5.4526896476745605, 6.329566955566406, 7.206444263458252, 8.083321571350098, 8.960199356079102, 9.837076187133789, 10.713953018188477, 11.59083080291748, 12.467708587646484, 13.344585418701172, 14.22146224975586, 15.098340034484863, 15.975217819213867, 16.852094650268555, 17.728971481323242, 18.605850219726562, 19.48272705078125, 20.359603881835938, 21.236480712890625, 22.113357543945312, 22.990236282348633, 23.86711311340332, 24.743989944458008, 25.620868682861328, 26.497745513916016, 27.374622344970703, 28.25149917602539, 29.128376007080078, 30.0052547454834, 30.882131576538086]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 5.0, 7.0, 5.0, 8.0, 10.0, 17.0, 20.0, 14.0, 19.0, 17.0, 30.0, 26.0, 22.0, 26.0, 29.0, 42.0, 30.0, 46.0, 40.0, 52.0, 35.0, 38.0, 29.0, 34.0, 34.0, 38.0, 31.0, 40.0, 28.0, 24.0, 31.0, 21.0, 19.0, 19.0, 14.0, 14.0, 10.0, 12.0, 9.0, 12.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.84375, -5.65521240234375, -5.4666748046875, -5.27813720703125, -5.089599609375, -4.90106201171875, -4.7125244140625, -4.52398681640625, -4.33544921875, -4.14691162109375, -3.9583740234375, -3.76983642578125, -3.581298828125, -3.39276123046875, -3.2042236328125, -3.01568603515625, -2.8271484375, -2.63861083984375, -2.4500732421875, -2.26153564453125, -2.072998046875, -1.88446044921875, -1.6959228515625, -1.50738525390625, -1.31884765625, -1.13031005859375, -0.9417724609375, -0.75323486328125, -0.564697265625, -0.37615966796875, -0.1876220703125, 0.00091552734375, 0.189453125, 0.37799072265625, 0.5665283203125, 0.75506591796875, 0.943603515625, 1.13214111328125, 1.3206787109375, 1.50921630859375, 1.69775390625, 1.88629150390625, 2.0748291015625, 2.26336669921875, 2.451904296875, 2.64044189453125, 2.8289794921875, 3.01751708984375, 3.2060546875, 3.39459228515625, 3.5831298828125, 3.77166748046875, 3.960205078125, 4.14874267578125, 4.3372802734375, 4.52581787109375, 4.71435546875, 4.90289306640625, 5.0914306640625, 5.27996826171875, 5.468505859375, 5.65704345703125, 5.8455810546875, 6.03411865234375, 6.22265625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 6.0, 8.0, 9.0, 15.0, 14.0, 30.0, 42.0, 75.0, 135.0, 177.0, 248.0, 407.0, 579.0, 1011.0, 1480.0, 2231.0, 3385.0, 5242.0, 8063.0, 13327.0, 22180.0, 37596.0, 69155.0, 143328.0, 303455.0, 214169.0, 97224.0, 50420.0, 28531.0, 16940.0, 10431.0, 6532.0, 4226.0, 2714.0, 1849.0, 1170.0, 734.0, 493.0, 310.0, 224.0, 146.0, 90.0, 57.0, 36.0, 19.0, 19.0, 7.0, 7.0, 6.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.302978515625, -0.2924385070800781, -0.28189849853515625, -0.2713584899902344, -0.2608184814453125, -0.2502784729003906, -0.23973846435546875, -0.22919845581054688, -0.218658447265625, -0.20811843872070312, -0.19757843017578125, -0.18703842163085938, -0.1764984130859375, -0.16595840454101562, -0.15541839599609375, -0.14487838745117188, -0.13433837890625, -0.12379837036132812, -0.11325836181640625, -0.10271835327148438, -0.0921783447265625, -0.08163833618164062, -0.07109832763671875, -0.060558319091796875, -0.050018310546875, -0.039478302001953125, -0.02893829345703125, -0.018398284912109375, -0.0078582763671875, 0.002681732177734375, 0.01322174072265625, 0.023761749267578125, 0.0343017578125, 0.044841766357421875, 0.05538177490234375, 0.06592178344726562, 0.0764617919921875, 0.08700180053710938, 0.09754180908203125, 0.10808181762695312, 0.118621826171875, 0.12916183471679688, 0.13970184326171875, 0.15024185180664062, 0.1607818603515625, 0.17132186889648438, 0.18186187744140625, 0.19240188598632812, 0.20294189453125, 0.21348190307617188, 0.22402191162109375, 0.23456192016601562, 0.2451019287109375, 0.2556419372558594, 0.26618194580078125, 0.2767219543457031, 0.287261962890625, 0.2978019714355469, 0.30834197998046875, 0.3188819885253906, 0.3294219970703125, 0.3399620056152344, 0.35050201416015625, 0.3610420227050781, 0.37158203125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 7.0, 3.0, 9.0, 8.0, 12.0, 8.0, 15.0, 22.0, 18.0, 18.0, 24.0, 22.0, 22.0, 37.0, 38.0, 38.0, 43.0, 30.0, 56.0, 47.0, 1060.0, 52.0, 42.0, 35.0, 37.0, 39.0, 38.0, 28.0, 37.0, 31.0, 25.0, 16.0, 22.0, 18.0, 17.0, 7.0, 10.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.51953125, -4.3863525390625, -4.253173828125, -4.1199951171875, -3.98681640625, -3.8536376953125, -3.720458984375, -3.5872802734375, -3.4541015625, -3.3209228515625, -3.187744140625, -3.0545654296875, -2.92138671875, -2.7882080078125, -2.655029296875, -2.5218505859375, -2.388671875, -2.2554931640625, -2.122314453125, -1.9891357421875, -1.85595703125, -1.7227783203125, -1.589599609375, -1.4564208984375, -1.3232421875, -1.1900634765625, -1.056884765625, -0.9237060546875, -0.79052734375, -0.6573486328125, -0.524169921875, -0.3909912109375, -0.2578125, -0.1246337890625, 0.008544921875, 0.1417236328125, 0.27490234375, 0.4080810546875, 0.541259765625, 0.6744384765625, 0.8076171875, 0.9407958984375, 1.073974609375, 1.2071533203125, 1.34033203125, 1.4735107421875, 1.606689453125, 1.7398681640625, 1.873046875, 2.0062255859375, 2.139404296875, 2.2725830078125, 2.40576171875, 2.5389404296875, 2.672119140625, 2.8052978515625, 2.9384765625, 3.0716552734375, 3.204833984375, 3.3380126953125, 3.47119140625, 3.6043701171875, 3.737548828125, 3.8707275390625, 4.00390625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 4.0, 6.0, 22.0, 25.0, 29.0, 32.0, 40.0, 80.0, 104.0, 155.0, 176.0, 271.0, 349.0, 444.0, 639.0, 899.0, 1279.0, 1740.0, 2401.0, 3596.0, 5064.0, 7300.0, 10776.0, 16064.0, 25047.0, 39144.0, 62357.0, 102925.0, 181339.0, 1275706.0, 136549.0, 79553.0, 49312.0, 30865.0, 20138.0, 13349.0, 8818.0, 6169.0, 4164.0, 2912.0, 2052.0, 1455.0, 983.0, 773.0, 586.0, 418.0, 302.0, 207.0, 128.0, 99.0, 87.0, 59.0, 35.0, 35.0, 27.0, 17.0, 11.0, 10.0, 9.0, 3.0, 3.0], "bins": [-0.1895751953125, -0.18369674682617188, -0.17781829833984375, -0.17193984985351562, -0.1660614013671875, -0.16018295288085938, -0.15430450439453125, -0.14842605590820312, -0.142547607421875, -0.13666915893554688, -0.13079071044921875, -0.12491226196289062, -0.1190338134765625, -0.11315536499023438, -0.10727691650390625, -0.10139846801757812, -0.09552001953125, -0.08964157104492188, -0.08376312255859375, -0.07788467407226562, -0.0720062255859375, -0.06612777709960938, -0.06024932861328125, -0.054370880126953125, -0.048492431640625, -0.042613983154296875, -0.03673553466796875, -0.030857086181640625, -0.0249786376953125, -0.019100189208984375, -0.01322174072265625, -0.007343292236328125, -0.00146484375, 0.004413604736328125, 0.01029205322265625, 0.016170501708984375, 0.0220489501953125, 0.027927398681640625, 0.03380584716796875, 0.039684295654296875, 0.045562744140625, 0.051441192626953125, 0.05731964111328125, 0.06319808959960938, 0.0690765380859375, 0.07495498657226562, 0.08083343505859375, 0.08671188354492188, 0.09259033203125, 0.09846878051757812, 0.10434722900390625, 0.11022567749023438, 0.1161041259765625, 0.12198257446289062, 0.12786102294921875, 0.13373947143554688, 0.139617919921875, 0.14549636840820312, 0.15137481689453125, 0.15725326538085938, 0.1631317138671875, 0.16901016235351562, 0.17488861083984375, 0.18076705932617188, 0.1866455078125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 10.0, 6.0, 13.0, 20.0, 23.0, 23.0, 38.0, 40.0, 63.0, 60.0, 77.0, 110.0, 86.0, 86.0, 57.0, 50.0, 53.0, 46.0, 29.0, 24.0, 17.0, 19.0, 11.0, 7.0, 3.0, 7.0, 4.0, 6.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00016629695892333984, -0.00016037747263908386, -0.00015445798635482788, -0.0001485385000705719, -0.00014261901378631592, -0.00013669952750205994, -0.00013078004121780396, -0.00012486055493354797, -0.00011894106864929199, -0.00011302158236503601, -0.00010710209608078003, -0.00010118260979652405, -9.526312351226807e-05, -8.934363722801208e-05, -8.34241509437561e-05, -7.750466465950012e-05, -7.158517837524414e-05, -6.566569209098816e-05, -5.974620580673218e-05, -5.3826719522476196e-05, -4.7907233238220215e-05, -4.1987746953964233e-05, -3.606826066970825e-05, -3.014877438545227e-05, -2.422928810119629e-05, -1.8309801816940308e-05, -1.2390315532684326e-05, -6.470829248428345e-06, -5.513429641723633e-07, 5.368143320083618e-06, 1.12876296043396e-05, 1.720711588859558e-05, 2.3126602172851562e-05, 2.9046088457107544e-05, 3.4965574741363525e-05, 4.088506102561951e-05, 4.680454730987549e-05, 5.272403359413147e-05, 5.864351987838745e-05, 6.456300616264343e-05, 7.048249244689941e-05, 7.64019787311554e-05, 8.232146501541138e-05, 8.824095129966736e-05, 9.416043758392334e-05, 0.00010007992386817932, 0.0001059994101524353, 0.00011191889643669128, 0.00011783838272094727, 0.00012375786900520325, 0.00012967735528945923, 0.0001355968415737152, 0.0001415163278579712, 0.00014743581414222717, 0.00015335530042648315, 0.00015927478671073914, 0.00016519427299499512, 0.0001711137592792511, 0.00017703324556350708, 0.00018295273184776306, 0.00018887221813201904, 0.00019479170441627502, 0.000200711190700531, 0.000206630676984787, 0.00021255016326904297]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 7.0, 4.0, 9.0, 9.0, 20.0, 18.0, 21.0, 24.0, 30.0, 35.0, 57.0, 105.0, 172.0, 303.0, 527.0, 2102.0, 132420.0, 904750.0, 6270.0, 790.0, 323.0, 189.0, 110.0, 85.0, 49.0, 25.0, 30.0, 19.0, 7.0, 13.0, 7.0, 11.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.004146575927734375, -0.004031956195831299, -0.003917336463928223, -0.0038027167320251465, -0.0036880970001220703, -0.003573477268218994, -0.003458857536315918, -0.003344237804412842, -0.0032296180725097656, -0.0031149983406066895, -0.0030003786087036133, -0.002885758876800537, -0.002771139144897461, -0.0026565194129943848, -0.0025418996810913086, -0.0024272799491882324, -0.0023126602172851562, -0.00219804048538208, -0.002083420753479004, -0.0019688010215759277, -0.0018541812896728516, -0.0017395615577697754, -0.0016249418258666992, -0.001510322093963623, -0.0013957023620605469, -0.0012810826301574707, -0.0011664628982543945, -0.0010518431663513184, -0.0009372234344482422, -0.000822603702545166, -0.0007079839706420898, -0.0005933642387390137, -0.0004787445068359375, -0.00036412477493286133, -0.00024950504302978516, -0.00013488531112670898, -2.0265579223632812e-05, 9.435415267944336e-05, 0.00020897388458251953, 0.0003235936164855957, 0.0004382133483886719, 0.000552833080291748, 0.0006674528121948242, 0.0007820725440979004, 0.0008966922760009766, 0.0010113120079040527, 0.001125931739807129, 0.001240551471710205, 0.0013551712036132812, 0.0014697909355163574, 0.0015844106674194336, 0.0016990303993225098, 0.001813650131225586, 0.0019282698631286621, 0.0020428895950317383, 0.0021575093269348145, 0.0022721290588378906, 0.002386748790740967, 0.002501368522644043, 0.002615988254547119, 0.0027306079864501953, 0.0028452277183532715, 0.0029598474502563477, 0.003074467182159424, 0.0031890869140625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 9.0, 43.0, 124.0, 290.0, 307.0, 157.0, 59.0, 14.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003818266559392214, -0.0003699302324093878, -0.00035803383798338473, -0.0003461374144535512, -0.0003342409909237176, -0.0003223445964977145, -0.00031044817296788096, -0.0002985517494380474, -0.00028665532590821385, -0.0002747589023783803, -0.0002628625079523772, -0.00025096608442254364, -0.0002390696608927101, -0.00022717325191479176, -0.00021527684293687344, -0.00020338041940703988, -0.00019148402498103678, -0.00017958761600311846, -0.0001676911924732849, -0.00015579478349536657, -0.00014389835996553302, -0.0001320019509876147, -0.00012010554200969636, -0.00010820912575582042, -9.631270950194448e-05, -8.441629324806854e-05, -7.25198769941926e-05, -6.0623468016274273e-05, -4.872705176239833e-05, -3.683063550852239e-05, -2.4934226530604064e-05, -1.3037810276728123e-05, -1.1413649190217257e-06, 1.0755049515864812e-05, 2.265146395075135e-05, 3.454787656664848e-05, 4.6444292820524424e-05, 5.8340709074400365e-05, 7.023711805231869e-05, 8.213353430619463e-05, 9.402995056007057e-05, 0.00010592636681394652, 0.00011782278306782246, 0.00012971919204574078, 0.0001416156010236591, 0.00015351202455349267, 0.000165408433531411, 0.00017730484250932932, 0.00018920126603916287, 0.0002010976750170812, 0.00021299409854691476, 0.00022489050752483308, 0.00023678693105466664, 0.00024868332548066974, 0.0002605797490105033, 0.00027247617254033685, 0.0002843725960701704, 0.00029626901960000396, 0.00030816541402600706, 0.0003200618375558406, 0.00033195826108567417, 0.00034385465551167727, 0.0003557510790415108, 0.0003676475025713444, 0.0003795438969973475]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 5.0, 5.0, 5.0, 8.0, 12.0, 8.0, 16.0, 16.0, 19.0, 15.0, 22.0, 26.0, 27.0, 26.0, 46.0, 34.0, 29.0, 30.0, 44.0, 38.0, 45.0, 50.0, 34.0, 54.0, 27.0, 40.0, 34.0, 21.0, 35.0, 34.0, 37.0, 21.0, 31.0, 18.0, 14.0, 11.0, 16.0, 13.0, 8.0, 8.0, 8.0, 4.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.450580596923828e-05, -7.209181785583496e-05, -6.967782974243164e-05, -6.726384162902832e-05, -6.4849853515625e-05, -6.243586540222168e-05, -6.002187728881836e-05, -5.760788917541504e-05, -5.519390106201172e-05, -5.27799129486084e-05, -5.036592483520508e-05, -4.795193672180176e-05, -4.553794860839844e-05, -4.312396049499512e-05, -4.07099723815918e-05, -3.8295984268188477e-05, -3.5881996154785156e-05, -3.3468008041381836e-05, -3.1054019927978516e-05, -2.8640031814575195e-05, -2.6226043701171875e-05, -2.3812055587768555e-05, -2.1398067474365234e-05, -1.8984079360961914e-05, -1.6570091247558594e-05, -1.4156103134155273e-05, -1.1742115020751953e-05, -9.328126907348633e-06, -6.9141387939453125e-06, -4.500150680541992e-06, -2.086162567138672e-06, 3.2782554626464844e-07, 2.7418136596679688e-06, 5.155801773071289e-06, 7.569789886474609e-06, 9.98377799987793e-06, 1.239776611328125e-05, 1.481175422668457e-05, 1.722574234008789e-05, 1.963973045349121e-05, 2.205371856689453e-05, 2.446770668029785e-05, 2.6881694793701172e-05, 2.9295682907104492e-05, 3.170967102050781e-05, 3.412365913391113e-05, 3.653764724731445e-05, 3.8951635360717773e-05, 4.1365623474121094e-05, 4.3779611587524414e-05, 4.6193599700927734e-05, 4.8607587814331055e-05, 5.1021575927734375e-05, 5.3435564041137695e-05, 5.5849552154541016e-05, 5.8263540267944336e-05, 6.0677528381347656e-05, 6.309151649475098e-05, 6.55055046081543e-05, 6.791949272155762e-05, 7.033348083496094e-05, 7.274746894836426e-05, 7.516145706176758e-05, 7.75754451751709e-05, 7.998943328857422e-05]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 5.0, 7.0, 5.0, 8.0, 10.0, 17.0, 20.0, 14.0, 19.0, 17.0, 30.0, 26.0, 22.0, 26.0, 29.0, 42.0, 30.0, 46.0, 40.0, 52.0, 35.0, 38.0, 29.0, 34.0, 34.0, 38.0, 31.0, 40.0, 28.0, 24.0, 31.0, 21.0, 19.0, 19.0, 14.0, 14.0, 10.0, 12.0, 9.0, 12.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.84375, -5.65521240234375, -5.4666748046875, -5.27813720703125, -5.089599609375, -4.90106201171875, -4.7125244140625, -4.52398681640625, -4.33544921875, -4.14691162109375, -3.9583740234375, -3.76983642578125, -3.581298828125, -3.39276123046875, -3.2042236328125, -3.01568603515625, -2.8271484375, -2.63861083984375, -2.4500732421875, -2.26153564453125, -2.072998046875, -1.88446044921875, -1.6959228515625, -1.50738525390625, -1.31884765625, -1.13031005859375, -0.9417724609375, -0.75323486328125, -0.564697265625, -0.37615966796875, -0.1876220703125, 0.00091552734375, 0.189453125, 0.37799072265625, 0.5665283203125, 0.75506591796875, 0.943603515625, 1.13214111328125, 1.3206787109375, 1.50921630859375, 1.69775390625, 1.88629150390625, 2.0748291015625, 2.26336669921875, 2.451904296875, 2.64044189453125, 2.8289794921875, 3.01751708984375, 3.2060546875, 3.39459228515625, 3.5831298828125, 3.77166748046875, 3.960205078125, 4.14874267578125, 4.3372802734375, 4.52581787109375, 4.71435546875, 4.90289306640625, 5.0914306640625, 5.27996826171875, 5.468505859375, 5.65704345703125, 5.8455810546875, 6.03411865234375, 6.22265625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 4.0, 4.0, 6.0, 10.0, 10.0, 17.0, 14.0, 11.0, 28.0, 35.0, 47.0, 77.0, 81.0, 87.0, 132.0, 199.0, 203.0, 312.0, 431.0, 747.0, 1473.0, 3521.0, 10122.0, 32845.0, 216667.0, 690389.0, 63908.0, 16595.0, 5537.0, 2086.0, 959.0, 555.0, 357.0, 257.0, 170.0, 152.0, 118.0, 90.0, 78.0, 45.0, 44.0, 35.0, 19.0, 20.0, 15.0, 11.0, 11.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-14.4140625, -13.952392578125, -13.49072265625, -13.029052734375, -12.5673828125, -12.105712890625, -11.64404296875, -11.182373046875, -10.720703125, -10.259033203125, -9.79736328125, -9.335693359375, -8.8740234375, -8.412353515625, -7.95068359375, -7.489013671875, -7.02734375, -6.565673828125, -6.10400390625, -5.642333984375, -5.1806640625, -4.718994140625, -4.25732421875, -3.795654296875, -3.333984375, -2.872314453125, -2.41064453125, -1.948974609375, -1.4873046875, -1.025634765625, -0.56396484375, -0.102294921875, 0.359375, 0.821044921875, 1.28271484375, 1.744384765625, 2.2060546875, 2.667724609375, 3.12939453125, 3.591064453125, 4.052734375, 4.514404296875, 4.97607421875, 5.437744140625, 5.8994140625, 6.361083984375, 6.82275390625, 7.284423828125, 7.74609375, 8.207763671875, 8.66943359375, 9.131103515625, 9.5927734375, 10.054443359375, 10.51611328125, 10.977783203125, 11.439453125, 11.901123046875, 12.36279296875, 12.824462890625, 13.2861328125, 13.747802734375, 14.20947265625, 14.671142578125, 15.1328125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 5.0, 10.0, 6.0, 17.0, 21.0, 12.0, 30.0, 27.0, 28.0, 39.0, 43.0, 38.0, 48.0, 58.0, 70.0, 135.0, 347.0, 1502.0, 136.0, 83.0, 60.0, 40.0, 48.0, 39.0, 29.0, 25.0, 32.0, 23.0, 19.0, 10.0, 11.0, 4.0, 14.0, 10.0, 5.0, 8.0, 5.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.4375, -17.863037109375, -17.28857421875, -16.714111328125, -16.1396484375, -15.565185546875, -14.99072265625, -14.416259765625, -13.841796875, -13.267333984375, -12.69287109375, -12.118408203125, -11.5439453125, -10.969482421875, -10.39501953125, -9.820556640625, -9.24609375, -8.671630859375, -8.09716796875, -7.522705078125, -6.9482421875, -6.373779296875, -5.79931640625, -5.224853515625, -4.650390625, -4.075927734375, -3.50146484375, -2.927001953125, -2.3525390625, -1.778076171875, -1.20361328125, -0.629150390625, -0.0546875, 0.519775390625, 1.09423828125, 1.668701171875, 2.2431640625, 2.817626953125, 3.39208984375, 3.966552734375, 4.541015625, 5.115478515625, 5.68994140625, 6.264404296875, 6.8388671875, 7.413330078125, 7.98779296875, 8.562255859375, 9.13671875, 9.711181640625, 10.28564453125, 10.860107421875, 11.4345703125, 12.009033203125, 12.58349609375, 13.157958984375, 13.732421875, 14.306884765625, 14.88134765625, 15.455810546875, 16.0302734375, 16.604736328125, 17.17919921875, 17.753662109375, 18.328125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 9.0, 8.0, 7.0, 14.0, 21.0, 6.0, 9.0, 18.0, 28.0, 33.0, 40.0, 45.0, 51.0, 79.0, 146.0, 234.0, 592.0, 2202.0, 24798.0, 3049652.0, 62907.0, 3203.0, 757.0, 280.0, 128.0, 97.0, 70.0, 55.0, 40.0, 38.0, 35.0, 21.0, 23.0, 9.0, 16.0, 12.0, 2.0, 3.0, 6.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-46.71875, -45.24072265625, -43.7626953125, -42.28466796875, -40.806640625, -39.32861328125, -37.8505859375, -36.37255859375, -34.89453125, -33.41650390625, -31.9384765625, -30.46044921875, -28.982421875, -27.50439453125, -26.0263671875, -24.54833984375, -23.0703125, -21.59228515625, -20.1142578125, -18.63623046875, -17.158203125, -15.68017578125, -14.2021484375, -12.72412109375, -11.24609375, -9.76806640625, -8.2900390625, -6.81201171875, -5.333984375, -3.85595703125, -2.3779296875, -0.89990234375, 0.578125, 2.05615234375, 3.5341796875, 5.01220703125, 6.490234375, 7.96826171875, 9.4462890625, 10.92431640625, 12.40234375, 13.88037109375, 15.3583984375, 16.83642578125, 18.314453125, 19.79248046875, 21.2705078125, 22.74853515625, 24.2265625, 25.70458984375, 27.1826171875, 28.66064453125, 30.138671875, 31.61669921875, 33.0947265625, 34.57275390625, 36.05078125, 37.52880859375, 39.0068359375, 40.48486328125, 41.962890625, 43.44091796875, 44.9189453125, 46.39697265625, 47.875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 18.0, 93.0, 266.0, 357.0, 181.0, 76.0, 16.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.84257125854492, -34.94148635864258, -33.040401458740234, -31.13931655883789, -29.238231658935547, -27.337146759033203, -25.436059951782227, -23.534975051879883, -21.63389015197754, -19.732805252075195, -17.83172035217285, -15.930634498596191, -14.029549598693848, -12.128464698791504, -10.227378845214844, -8.3262939453125, -6.425209045410156, -4.5241241455078125, -2.6230387687683105, -0.7219533920288086, 1.1791315078735352, 3.080216407775879, 4.981302261352539, 6.882387161254883, 8.783472061157227, 10.68455696105957, 12.585641860961914, 14.486727714538574, 16.387813568115234, 18.288898468017578, 20.189983367919922, 22.091068267822266, 23.992156982421875, 25.89324188232422, 27.794326782226562, 29.695411682128906, 31.59649658203125, 33.497581481933594, 35.39866638183594, 37.29975128173828, 39.200836181640625, 41.10192108154297, 43.00300598144531, 44.904090881347656, 46.80517578125, 48.706260681152344, 50.60734558105469, 52.50843048095703, 54.40951919555664, 56.310604095458984, 58.21168899536133, 60.11277389526367, 62.013858795166016, 63.91494369506836, 65.81603240966797, 67.71711730957031, 69.61820220947266, 71.519287109375, 73.42037200927734, 75.32145690917969, 77.22254180908203, 79.12362670898438, 81.02471160888672, 82.92579650878906, 84.8268814086914]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 4.0, 4.0, 6.0, 9.0, 9.0, 14.0, 12.0, 15.0, 19.0, 18.0, 31.0, 35.0, 30.0, 33.0, 28.0, 26.0, 35.0, 47.0, 45.0, 40.0, 60.0, 37.0, 36.0, 44.0, 43.0, 30.0, 34.0, 39.0, 37.0, 25.0, 28.0, 21.0, 17.0, 21.0, 11.0, 5.0, 17.0, 8.0, 8.0, 4.0, 5.0, 0.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-47.06272506713867, -45.744659423828125, -44.42658996582031, -43.108524322509766, -41.79045486450195, -40.472389221191406, -39.154319763183594, -37.83625411987305, -36.5181884765625, -35.20012283325195, -33.88205337524414, -32.563987731933594, -31.24591827392578, -29.927852630615234, -28.609785079956055, -27.291717529296875, -25.973648071289062, -24.655580520629883, -23.337512969970703, -22.019445419311523, -20.701377868652344, -19.383312225341797, -18.065244674682617, -16.747177124023438, -15.429109573364258, -14.111042022705078, -12.792974472045898, -11.474907875061035, -10.156840324401855, -8.838772773742676, -7.520705699920654, -6.202638626098633, -4.884574890136719, -3.566507577896118, -2.2484402656555176, -0.930372953414917, 0.3876943588256836, 1.7057619094848633, 3.0238289833068848, 4.341896057128906, 5.659963607788086, 6.978031158447266, 8.296098709106445, 9.614165306091309, 10.932232856750488, 12.250300407409668, 13.568367004394531, 14.886434555053711, 16.20450210571289, 17.52256965637207, 18.84063720703125, 20.15870475769043, 21.47677230834961, 22.794837951660156, 24.112905502319336, 25.430973052978516, 26.749040603637695, 28.067108154296875, 29.385175704956055, 30.703243255615234, 32.02130889892578, 33.339378356933594, 34.65744400024414, 35.97550964355469, 37.2935791015625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 8.0, 8.0, 4.0, 11.0, 14.0, 10.0, 18.0, 22.0, 17.0, 19.0, 24.0, 38.0, 21.0, 34.0, 32.0, 44.0, 29.0, 47.0, 34.0, 38.0, 38.0, 46.0, 51.0, 31.0, 30.0, 34.0, 32.0, 32.0, 25.0, 26.0, 25.0, 32.0, 21.0, 19.0, 14.0, 11.0, 8.0, 7.0, 10.0, 5.0, 3.0, 4.0, 5.0, 2.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.66015625, -5.4608154296875, -5.261474609375, -5.0621337890625, -4.86279296875, -4.6634521484375, -4.464111328125, -4.2647705078125, -4.0654296875, -3.8660888671875, -3.666748046875, -3.4674072265625, -3.26806640625, -3.0687255859375, -2.869384765625, -2.6700439453125, -2.470703125, -2.2713623046875, -2.072021484375, -1.8726806640625, -1.67333984375, -1.4739990234375, -1.274658203125, -1.0753173828125, -0.8759765625, -0.6766357421875, -0.477294921875, -0.2779541015625, -0.07861328125, 0.1207275390625, 0.320068359375, 0.5194091796875, 0.71875, 0.9180908203125, 1.117431640625, 1.3167724609375, 1.51611328125, 1.7154541015625, 1.914794921875, 2.1141357421875, 2.3134765625, 2.5128173828125, 2.712158203125, 2.9114990234375, 3.11083984375, 3.3101806640625, 3.509521484375, 3.7088623046875, 3.908203125, 4.1075439453125, 4.306884765625, 4.5062255859375, 4.70556640625, 4.9049072265625, 5.104248046875, 5.3035888671875, 5.5029296875, 5.7022705078125, 5.901611328125, 6.1009521484375, 6.30029296875, 6.4996337890625, 6.698974609375, 6.8983154296875, 7.09765625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 3.0, 17.0, 10.0, 15.0, 38.0, 42.0, 53.0, 69.0, 114.0, 132.0, 210.0, 297.0, 509.0, 948.0, 1623.0, 3432.0, 8155.0, 30882.0, 199027.0, 1352154.0, 2096572.0, 422061.0, 55816.0, 12366.0, 4674.0, 2142.0, 1102.0, 651.0, 379.0, 229.0, 153.0, 100.0, 95.0, 39.0, 45.0, 29.0, 21.0, 19.0, 13.0, 8.0, 10.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.7265625, -10.382568359375, -10.03857421875, -9.694580078125, -9.3505859375, -9.006591796875, -8.66259765625, -8.318603515625, -7.974609375, -7.630615234375, -7.28662109375, -6.942626953125, -6.5986328125, -6.254638671875, -5.91064453125, -5.566650390625, -5.22265625, -4.878662109375, -4.53466796875, -4.190673828125, -3.8466796875, -3.502685546875, -3.15869140625, -2.814697265625, -2.470703125, -2.126708984375, -1.78271484375, -1.438720703125, -1.0947265625, -0.750732421875, -0.40673828125, -0.062744140625, 0.28125, 0.625244140625, 0.96923828125, 1.313232421875, 1.6572265625, 2.001220703125, 2.34521484375, 2.689208984375, 3.033203125, 3.377197265625, 3.72119140625, 4.065185546875, 4.4091796875, 4.753173828125, 5.09716796875, 5.441162109375, 5.78515625, 6.129150390625, 6.47314453125, 6.817138671875, 7.1611328125, 7.505126953125, 7.84912109375, 8.193115234375, 8.537109375, 8.881103515625, 9.22509765625, 9.569091796875, 9.9130859375, 10.257080078125, 10.60107421875, 10.945068359375, 11.2890625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 3.0, 8.0, 12.0, 17.0, 8.0, 24.0, 23.0, 43.0, 44.0, 50.0, 104.0, 155.0, 198.0, 281.0, 415.0, 512.0, 549.0, 492.0, 352.0, 224.0, 154.0, 116.0, 73.0, 50.0, 50.0, 27.0, 19.0, 8.0, 14.0, 18.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6953125, -9.384521484375, -9.07373046875, -8.762939453125, -8.4521484375, -8.141357421875, -7.83056640625, -7.519775390625, -7.208984375, -6.898193359375, -6.58740234375, -6.276611328125, -5.9658203125, -5.655029296875, -5.34423828125, -5.033447265625, -4.72265625, -4.411865234375, -4.10107421875, -3.790283203125, -3.4794921875, -3.168701171875, -2.85791015625, -2.547119140625, -2.236328125, -1.925537109375, -1.61474609375, -1.303955078125, -0.9931640625, -0.682373046875, -0.37158203125, -0.060791015625, 0.25, 0.560791015625, 0.87158203125, 1.182373046875, 1.4931640625, 1.803955078125, 2.11474609375, 2.425537109375, 2.736328125, 3.047119140625, 3.35791015625, 3.668701171875, 3.9794921875, 4.290283203125, 4.60107421875, 4.911865234375, 5.22265625, 5.533447265625, 5.84423828125, 6.155029296875, 6.4658203125, 6.776611328125, 7.08740234375, 7.398193359375, 7.708984375, 8.019775390625, 8.33056640625, 8.641357421875, 8.9521484375, 9.262939453125, 9.57373046875, 9.884521484375, 10.1953125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 10.0, 14.0, 24.0, 25.0, 27.0, 42.0, 61.0, 118.0, 167.0, 281.0, 618.0, 1569.0, 6320.0, 58548.0, 2953365.0, 1135582.0, 30646.0, 4320.0, 1211.0, 532.0, 280.0, 168.0, 104.0, 64.0, 57.0, 32.0, 17.0, 21.0, 12.0, 14.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.71875, -27.81787109375, -26.9169921875, -26.01611328125, -25.115234375, -24.21435546875, -23.3134765625, -22.41259765625, -21.51171875, -20.61083984375, -19.7099609375, -18.80908203125, -17.908203125, -17.00732421875, -16.1064453125, -15.20556640625, -14.3046875, -13.40380859375, -12.5029296875, -11.60205078125, -10.701171875, -9.80029296875, -8.8994140625, -7.99853515625, -7.09765625, -6.19677734375, -5.2958984375, -4.39501953125, -3.494140625, -2.59326171875, -1.6923828125, -0.79150390625, 0.109375, 1.01025390625, 1.9111328125, 2.81201171875, 3.712890625, 4.61376953125, 5.5146484375, 6.41552734375, 7.31640625, 8.21728515625, 9.1181640625, 10.01904296875, 10.919921875, 11.82080078125, 12.7216796875, 13.62255859375, 14.5234375, 15.42431640625, 16.3251953125, 17.22607421875, 18.126953125, 19.02783203125, 19.9287109375, 20.82958984375, 21.73046875, 22.63134765625, 23.5322265625, 24.43310546875, 25.333984375, 26.23486328125, 27.1357421875, 28.03662109375, 28.9375]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 6.0, 42.0, 240.0, 436.0, 247.0, 36.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.63336181640625, -74.14485931396484, -69.65635681152344, -65.1678466796875, -60.679344177246094, -56.19084167480469, -51.702335357666016, -47.213829040527344, -42.72532653808594, -38.23682403564453, -33.74831771850586, -29.25981330871582, -24.77130889892578, -20.282804489135742, -15.794300079345703, -11.305795669555664, -6.817291259765625, -2.328786849975586, 2.159717559814453, 6.648221969604492, 11.136726379394531, 15.62523078918457, 20.11373519897461, 24.60223960876465, 29.090744018554688, 33.579246520996094, 38.067752838134766, 42.55625915527344, 47.044761657714844, 51.53326416015625, 56.02177047729492, 60.510276794433594, 64.99876403808594, 69.48726654052734, 73.97576904296875, 78.46427917480469, 82.9527816772461, 87.4412841796875, 91.92979431152344, 96.41829681396484, 100.90679931640625, 105.39530181884766, 109.88380432128906, 114.372314453125, 118.8608169555664, 123.34931945800781, 127.83782958984375, 132.32632446289062, 136.81483459472656, 141.3033447265625, 145.79183959960938, 150.2803497314453, 154.76885986328125, 159.25735473632812, 163.74586486816406, 168.23435974121094, 172.72286987304688, 177.2113800048828, 181.6998748779297, 186.18838500976562, 190.6768798828125, 195.16539001464844, 199.65390014648438, 204.14239501953125, 208.6309051513672]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 9.0, 8.0, 9.0, 7.0, 10.0, 20.0, 17.0, 27.0, 29.0, 29.0, 17.0, 25.0, 24.0, 42.0, 50.0, 35.0, 49.0, 41.0, 43.0, 45.0, 37.0, 50.0, 36.0, 37.0, 44.0, 31.0, 31.0, 21.0, 26.0, 29.0, 19.0, 19.0, 12.0, 14.0, 11.0, 6.0, 7.0, 16.0, 6.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-34.675350189208984, -33.692710876464844, -32.71007537841797, -31.727436065673828, -30.744796752929688, -29.76215934753418, -28.779521942138672, -27.79688262939453, -26.814245223999023, -25.831607818603516, -24.848968505859375, -23.866331100463867, -22.88369369506836, -21.90105438232422, -20.91841697692871, -19.935779571533203, -18.953140258789062, -17.970502853393555, -16.987863540649414, -16.005226135253906, -15.022587776184082, -14.039949417114258, -13.05731201171875, -12.074673652648926, -11.092035293579102, -10.109396934509277, -9.126758575439453, -8.144121170043945, -7.161482810974121, -6.178844451904297, -5.196206569671631, -4.213568687438965, -3.2309322357177734, -2.2482941150665283, -1.2656559944152832, -0.2830178737640381, 0.699620246887207, 1.6822586059570312, 2.6648964881896973, 3.6475343704223633, 4.6301727294921875, 5.612811088562012, 6.595448970794678, 7.578086853027344, 8.560725212097168, 9.543363571166992, 10.5260009765625, 11.508639335632324, 12.491277694702148, 13.473916053771973, 14.456554412841797, 15.439191818237305, 16.421829223632812, 17.404468536376953, 18.38710594177246, 19.36974334716797, 20.35238265991211, 21.335020065307617, 22.317659378051758, 23.300296783447266, 24.282936096191406, 25.265573501586914, 26.248210906982422, 27.230850219726562, 28.21348762512207]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 1.0, 7.0, 8.0, 13.0, 9.0, 14.0, 15.0, 18.0, 16.0, 17.0, 26.0, 26.0, 22.0, 29.0, 36.0, 41.0, 35.0, 43.0, 52.0, 37.0, 43.0, 34.0, 48.0, 36.0, 47.0, 38.0, 32.0, 37.0, 32.0, 21.0, 22.0, 17.0, 14.0, 24.0, 13.0, 16.0, 12.0, 8.0, 7.0, 3.0, 7.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.05859375, -5.8546142578125, -5.650634765625, -5.4466552734375, -5.24267578125, -5.0386962890625, -4.834716796875, -4.6307373046875, -4.4267578125, -4.2227783203125, -4.018798828125, -3.8148193359375, -3.61083984375, -3.4068603515625, -3.202880859375, -2.9989013671875, -2.794921875, -2.5909423828125, -2.386962890625, -2.1829833984375, -1.97900390625, -1.7750244140625, -1.571044921875, -1.3670654296875, -1.1630859375, -0.9591064453125, -0.755126953125, -0.5511474609375, -0.34716796875, -0.1431884765625, 0.060791015625, 0.2647705078125, 0.46875, 0.6727294921875, 0.876708984375, 1.0806884765625, 1.28466796875, 1.4886474609375, 1.692626953125, 1.8966064453125, 2.1005859375, 2.3045654296875, 2.508544921875, 2.7125244140625, 2.91650390625, 3.1204833984375, 3.324462890625, 3.5284423828125, 3.732421875, 3.9364013671875, 4.140380859375, 4.3443603515625, 4.54833984375, 4.7523193359375, 4.956298828125, 5.1602783203125, 5.3642578125, 5.5682373046875, 5.772216796875, 5.9761962890625, 6.18017578125, 6.3841552734375, 6.588134765625, 6.7921142578125, 6.99609375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 12.0, 9.0, 15.0, 19.0, 36.0, 43.0, 77.0, 113.0, 171.0, 294.0, 445.0, 739.0, 1135.0, 1911.0, 3259.0, 5631.0, 9732.0, 17207.0, 30775.0, 56782.0, 113389.0, 258475.0, 285659.0, 123748.0, 61829.0, 33259.0, 18618.0, 10440.0, 5883.0, 3438.0, 2063.0, 1284.0, 756.0, 484.0, 288.0, 175.0, 108.0, 76.0, 63.0, 39.0, 31.0, 15.0, 17.0, 6.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.35546875, -0.344024658203125, -0.33258056640625, -0.321136474609375, -0.3096923828125, -0.298248291015625, -0.28680419921875, -0.275360107421875, -0.263916015625, -0.252471923828125, -0.24102783203125, -0.229583740234375, -0.2181396484375, -0.206695556640625, -0.19525146484375, -0.183807373046875, -0.17236328125, -0.160919189453125, -0.14947509765625, -0.138031005859375, -0.1265869140625, -0.115142822265625, -0.10369873046875, -0.092254638671875, -0.080810546875, -0.069366455078125, -0.05792236328125, -0.046478271484375, -0.0350341796875, -0.023590087890625, -0.01214599609375, -0.000701904296875, 0.0107421875, 0.022186279296875, 0.03363037109375, 0.045074462890625, 0.0565185546875, 0.067962646484375, 0.07940673828125, 0.090850830078125, 0.102294921875, 0.113739013671875, 0.12518310546875, 0.136627197265625, 0.1480712890625, 0.159515380859375, 0.17095947265625, 0.182403564453125, 0.19384765625, 0.205291748046875, 0.21673583984375, 0.228179931640625, 0.2396240234375, 0.251068115234375, 0.26251220703125, 0.273956298828125, 0.285400390625, 0.296844482421875, 0.30828857421875, 0.319732666015625, 0.3311767578125, 0.342620849609375, 0.35406494140625, 0.365509033203125, 0.376953125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 5.0, 3.0, 3.0, 3.0, 9.0, 8.0, 5.0, 18.0, 13.0, 6.0, 13.0, 19.0, 25.0, 22.0, 24.0, 21.0, 35.0, 30.0, 35.0, 42.0, 22.0, 31.0, 38.0, 44.0, 35.0, 1066.0, 39.0, 31.0, 44.0, 31.0, 23.0, 42.0, 33.0, 37.0, 18.0, 21.0, 19.0, 21.0, 13.0, 16.0, 11.0, 14.0, 11.0, 9.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 1.0, 0.0, 1.0], "bins": [-3.974609375, -3.850677490234375, -3.72674560546875, -3.602813720703125, -3.4788818359375, -3.354949951171875, -3.23101806640625, -3.107086181640625, -2.983154296875, -2.859222412109375, -2.73529052734375, -2.611358642578125, -2.4874267578125, -2.363494873046875, -2.23956298828125, -2.115631103515625, -1.99169921875, -1.867767333984375, -1.74383544921875, -1.619903564453125, -1.4959716796875, -1.372039794921875, -1.24810791015625, -1.124176025390625, -1.000244140625, -0.876312255859375, -0.75238037109375, -0.628448486328125, -0.5045166015625, -0.380584716796875, -0.25665283203125, -0.132720947265625, -0.0087890625, 0.115142822265625, 0.23907470703125, 0.363006591796875, 0.4869384765625, 0.610870361328125, 0.73480224609375, 0.858734130859375, 0.982666015625, 1.106597900390625, 1.23052978515625, 1.354461669921875, 1.4783935546875, 1.602325439453125, 1.72625732421875, 1.850189208984375, 1.97412109375, 2.098052978515625, 2.22198486328125, 2.345916748046875, 2.4698486328125, 2.593780517578125, 2.71771240234375, 2.841644287109375, 2.965576171875, 3.089508056640625, 3.21343994140625, 3.337371826171875, 3.4613037109375, 3.585235595703125, 3.70916748046875, 3.833099365234375, 3.95703125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 12.0, 9.0, 23.0, 28.0, 55.0, 52.0, 83.0, 99.0, 135.0, 207.0, 343.0, 514.0, 664.0, 951.0, 1376.0, 2080.0, 3185.0, 4587.0, 6982.0, 11056.0, 16971.0, 27667.0, 45905.0, 77461.0, 135318.0, 1292015.0, 196389.0, 108482.0, 62532.0, 37726.0, 22690.0, 14345.0, 9189.0, 5954.0, 3859.0, 2555.0, 1764.0, 1228.0, 771.0, 567.0, 370.0, 276.0, 190.0, 156.0, 91.0, 60.0, 45.0, 37.0, 18.0, 18.0, 13.0, 13.0, 8.0, 5.0, 6.0, 3.0, 3.0], "bins": [-0.219970703125, -0.21326446533203125, -0.2065582275390625, -0.19985198974609375, -0.193145751953125, -0.18643951416015625, -0.1797332763671875, -0.17302703857421875, -0.16632080078125, -0.15961456298828125, -0.1529083251953125, -0.14620208740234375, -0.139495849609375, -0.13278961181640625, -0.1260833740234375, -0.11937713623046875, -0.1126708984375, -0.10596466064453125, -0.0992584228515625, -0.09255218505859375, -0.085845947265625, -0.07913970947265625, -0.0724334716796875, -0.06572723388671875, -0.05902099609375, -0.05231475830078125, -0.0456085205078125, -0.03890228271484375, -0.032196044921875, -0.02548980712890625, -0.0187835693359375, -0.01207733154296875, -0.00537109375, 0.00133514404296875, 0.0080413818359375, 0.01474761962890625, 0.021453857421875, 0.02816009521484375, 0.0348663330078125, 0.04157257080078125, 0.04827880859375, 0.05498504638671875, 0.0616912841796875, 0.06839752197265625, 0.075103759765625, 0.08180999755859375, 0.0885162353515625, 0.09522247314453125, 0.1019287109375, 0.10863494873046875, 0.1153411865234375, 0.12204742431640625, 0.128753662109375, 0.13545989990234375, 0.1421661376953125, 0.14887237548828125, 0.15557861328125, 0.16228485107421875, 0.1689910888671875, 0.17569732666015625, 0.182403564453125, 0.18910980224609375, 0.1958160400390625, 0.20252227783203125, 0.209228515625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 7.0, 4.0, 11.0, 9.0, 15.0, 21.0, 17.0, 18.0, 21.0, 29.0, 32.0, 39.0, 48.0, 63.0, 91.0, 97.0, 90.0, 67.0, 52.0, 62.0, 40.0, 26.0, 21.0, 13.0, 19.0, 14.0, 18.0, 10.0, 8.0, 9.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.00022935867309570312, -0.00022295117378234863, -0.00021654367446899414, -0.00021013617515563965, -0.00020372867584228516, -0.00019732117652893066, -0.00019091367721557617, -0.00018450617790222168, -0.0001780986785888672, -0.0001716911792755127, -0.0001652836799621582, -0.0001588761806488037, -0.00015246868133544922, -0.00014606118202209473, -0.00013965368270874023, -0.00013324618339538574, -0.00012683868408203125, -0.00012043118476867676, -0.00011402368545532227, -0.00010761618614196777, -0.00010120868682861328, -9.480118751525879e-05, -8.83936882019043e-05, -8.19861888885498e-05, -7.557868957519531e-05, -6.917119026184082e-05, -6.276369094848633e-05, -5.6356191635131836e-05, -4.9948692321777344e-05, -4.354119300842285e-05, -3.713369369506836e-05, -3.072619438171387e-05, -2.4318695068359375e-05, -1.7911195755004883e-05, -1.150369644165039e-05, -5.0961971282958984e-06, 1.3113021850585938e-06, 7.718801498413086e-06, 1.4126300811767578e-05, 2.053380012512207e-05, 2.6941299438476562e-05, 3.3348798751831055e-05, 3.975629806518555e-05, 4.616379737854004e-05, 5.257129669189453e-05, 5.8978796005249023e-05, 6.538629531860352e-05, 7.179379463195801e-05, 7.82012939453125e-05, 8.460879325866699e-05, 9.101629257202148e-05, 9.742379188537598e-05, 0.00010383129119873047, 0.00011023879051208496, 0.00011664628982543945, 0.00012305378913879395, 0.00012946128845214844, 0.00013586878776550293, 0.00014227628707885742, 0.00014868378639221191, 0.0001550912857055664, 0.0001614987850189209, 0.0001679062843322754, 0.00017431378364562988, 0.00018072128295898438]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 6.0, 4.0, 8.0, 10.0, 8.0, 10.0, 17.0, 25.0, 39.0, 39.0, 43.0, 67.0, 103.0, 153.0, 291.0, 714.0, 4782.0, 944448.0, 94874.0, 1709.0, 457.0, 215.0, 141.0, 81.0, 71.0, 44.0, 46.0, 26.0, 31.0, 25.0, 16.0, 11.0, 5.0, 6.0, 5.0, 5.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0043182373046875, -0.00418245792388916, -0.00404667854309082, -0.0039108991622924805, -0.0037751197814941406, -0.0036393404006958008, -0.003503561019897461, -0.003367781639099121, -0.0032320022583007812, -0.0030962228775024414, -0.0029604434967041016, -0.0028246641159057617, -0.002688884735107422, -0.002553105354309082, -0.002417325973510742, -0.0022815465927124023, -0.0021457672119140625, -0.0020099878311157227, -0.0018742084503173828, -0.001738429069519043, -0.0016026496887207031, -0.0014668703079223633, -0.0013310909271240234, -0.0011953115463256836, -0.0010595321655273438, -0.0009237527847290039, -0.0007879734039306641, -0.0006521940231323242, -0.0005164146423339844, -0.00038063526153564453, -0.0002448558807373047, -0.00010907649993896484, 2.6702880859375e-05, 0.00016248226165771484, 0.0002982616424560547, 0.00043404102325439453, 0.0005698204040527344, 0.0007055997848510742, 0.0008413791656494141, 0.000977158546447754, 0.0011129379272460938, 0.0012487173080444336, 0.0013844966888427734, 0.0015202760696411133, 0.0016560554504394531, 0.001791834831237793, 0.0019276142120361328, 0.0020633935928344727, 0.0021991729736328125, 0.0023349523544311523, 0.002470731735229492, 0.002606511116027832, 0.002742290496826172, 0.0028780698776245117, 0.0030138492584228516, 0.0031496286392211914, 0.0032854080200195312, 0.003421187400817871, 0.003556966781616211, 0.0036927461624145508, 0.0038285255432128906, 0.0039643049240112305, 0.00410008430480957, 0.00423586368560791, 0.00437164306640625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 19.0, 62.0, 261.0, 376.0, 215.0, 62.0, 10.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002169082290492952, -0.00020182506705168635, -0.0001867419050540775, -0.00017165874305646867, -0.00015657558105885983, -0.00014149240450933576, -0.00012640925706364214, -0.00011132608779007569, -9.624292579246685e-05, -8.115976379485801e-05, -6.607660179724917e-05, -5.099343616166152e-05, -3.591027416405268e-05, -2.0827108528465033e-05, -5.743946530856192e-06, 9.339215466752648e-06, 2.442237746436149e-05, 3.950553946197033e-05, 5.458870145957917e-05, 6.967186345718801e-05, 8.475502545479685e-05, 9.98381947283633e-05, 0.00011492135672597215, 0.00013000451144762337, 0.00014508768799714744, 0.00016017084999475628, 0.00017525401199236512, 0.00019033717398997396, 0.0002054203359875828, 0.00022050351253710687, 0.00023558665998280048, 0.00025066983653232455, 0.00026575298397801816, 0.00028083616052754223, 0.00029591930797323585, 0.0003110024845227599, 0.0003260856319684535, 0.0003411688085179776, 0.0003562519559636712, 0.0003713351325131953, 0.0003864182799588889, 0.00040150145650841296, 0.00041658460395410657, 0.00043166778050363064, 0.00044675092794932425, 0.0004618341044988483, 0.00047691725194454193, 0.000492000428494066, 0.0005070836050435901, 0.0005221667815931141, 0.0005372499581426382, 0.0005523330764845014, 0.0005674162530340254, 0.0005824994295835495, 0.0005975826061330736, 0.0006126657244749367, 0.0006277489010244608, 0.0006428320775739849, 0.0006579152541235089, 0.0006729983724653721, 0.0006880815490148962, 0.0007031647255644202, 0.0007182479021139443, 0.0007333310204558074, 0.0007484141970053315]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 6.0, 4.0, 7.0, 2.0, 5.0, 12.0, 13.0, 16.0, 18.0, 16.0, 15.0, 25.0, 21.0, 27.0, 22.0, 30.0, 36.0, 35.0, 38.0, 55.0, 55.0, 47.0, 47.0, 46.0, 38.0, 42.0, 40.0, 31.0, 35.0, 35.0, 24.0, 24.0, 23.0, 20.0, 19.0, 15.0, 11.0, 9.0, 8.0, 8.0, 6.0, 1.0, 7.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00011020898818969727, -0.00010703317821025848, -0.0001038573682308197, -0.00010068155825138092, -9.750574827194214e-05, -9.432993829250336e-05, -9.115412831306458e-05, -8.79783183336258e-05, -8.480250835418701e-05, -8.162669837474823e-05, -7.845088839530945e-05, -7.527507841587067e-05, -7.209926843643188e-05, -6.89234584569931e-05, -6.574764847755432e-05, -6.257183849811554e-05, -5.939602851867676e-05, -5.6220218539237976e-05, -5.3044408559799194e-05, -4.986859858036041e-05, -4.669278860092163e-05, -4.351697862148285e-05, -4.034116864204407e-05, -3.7165358662605286e-05, -3.3989548683166504e-05, -3.081373870372772e-05, -2.763792872428894e-05, -2.446211874485016e-05, -2.1286308765411377e-05, -1.8110498785972595e-05, -1.4934688806533813e-05, -1.1758878827095032e-05, -8.58306884765625e-06, -5.407258868217468e-06, -2.2314488887786865e-06, 9.443610906600952e-07, 4.120171070098877e-06, 7.295981049537659e-06, 1.047179102897644e-05, 1.3647601008415222e-05, 1.6823410987854004e-05, 1.9999220967292786e-05, 2.3175030946731567e-05, 2.635084092617035e-05, 2.952665090560913e-05, 3.270246088504791e-05, 3.5878270864486694e-05, 3.9054080843925476e-05, 4.222989082336426e-05, 4.540570080280304e-05, 4.858151078224182e-05, 5.17573207616806e-05, 5.4933130741119385e-05, 5.8108940720558167e-05, 6.128475069999695e-05, 6.446056067943573e-05, 6.763637065887451e-05, 7.08121806383133e-05, 7.398799061775208e-05, 7.716380059719086e-05, 8.033961057662964e-05, 8.351542055606842e-05, 8.66912305355072e-05, 8.986704051494598e-05, 9.304285049438477e-05]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 1.0, 7.0, 8.0, 13.0, 9.0, 14.0, 15.0, 18.0, 16.0, 17.0, 26.0, 26.0, 22.0, 29.0, 36.0, 41.0, 36.0, 42.0, 52.0, 37.0, 43.0, 34.0, 48.0, 36.0, 47.0, 38.0, 32.0, 37.0, 32.0, 21.0, 22.0, 17.0, 14.0, 24.0, 13.0, 16.0, 12.0, 8.0, 7.0, 3.0, 7.0, 5.0, 4.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.05859375, -5.8546142578125, -5.650634765625, -5.4466552734375, -5.24267578125, -5.0386962890625, -4.834716796875, -4.6307373046875, -4.4267578125, -4.2227783203125, -4.018798828125, -3.8148193359375, -3.61083984375, -3.4068603515625, -3.202880859375, -2.9989013671875, -2.794921875, -2.5909423828125, -2.386962890625, -2.1829833984375, -1.97900390625, -1.7750244140625, -1.571044921875, -1.3670654296875, -1.1630859375, -0.9591064453125, -0.755126953125, -0.5511474609375, -0.34716796875, -0.1431884765625, 0.060791015625, 0.2647705078125, 0.46875, 0.6727294921875, 0.876708984375, 1.0806884765625, 1.28466796875, 1.4886474609375, 1.692626953125, 1.8966064453125, 2.1005859375, 2.3045654296875, 2.508544921875, 2.7125244140625, 2.91650390625, 3.1204833984375, 3.324462890625, 3.5284423828125, 3.732421875, 3.9364013671875, 4.140380859375, 4.3443603515625, 4.54833984375, 4.7523193359375, 4.956298828125, 5.1602783203125, 5.3642578125, 5.5682373046875, 5.772216796875, 5.9761962890625, 6.18017578125, 6.3841552734375, 6.588134765625, 6.7921142578125, 6.99609375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 3.0, 7.0, 6.0, 5.0, 10.0, 22.0, 24.0, 22.0, 39.0, 63.0, 83.0, 99.0, 153.0, 188.0, 294.0, 427.0, 647.0, 1077.0, 1788.0, 3308.0, 6428.0, 12836.0, 27325.0, 62595.0, 159004.0, 382407.0, 231709.0, 86157.0, 36889.0, 16574.0, 8294.0, 4136.0, 2243.0, 1335.0, 761.0, 486.0, 326.0, 225.0, 164.0, 114.0, 72.0, 56.0, 36.0, 30.0, 26.0, 20.0, 18.0, 8.0, 6.0, 8.0, 4.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.546875, -7.2926025390625, -7.038330078125, -6.7840576171875, -6.52978515625, -6.2755126953125, -6.021240234375, -5.7669677734375, -5.5126953125, -5.2584228515625, -5.004150390625, -4.7498779296875, -4.49560546875, -4.2413330078125, -3.987060546875, -3.7327880859375, -3.478515625, -3.2242431640625, -2.969970703125, -2.7156982421875, -2.46142578125, -2.2071533203125, -1.952880859375, -1.6986083984375, -1.4443359375, -1.1900634765625, -0.935791015625, -0.6815185546875, -0.42724609375, -0.1729736328125, 0.081298828125, 0.3355712890625, 0.58984375, 0.8441162109375, 1.098388671875, 1.3526611328125, 1.60693359375, 1.8612060546875, 2.115478515625, 2.3697509765625, 2.6240234375, 2.8782958984375, 3.132568359375, 3.3868408203125, 3.64111328125, 3.8953857421875, 4.149658203125, 4.4039306640625, 4.658203125, 4.9124755859375, 5.166748046875, 5.4210205078125, 5.67529296875, 5.9295654296875, 6.183837890625, 6.4381103515625, 6.6923828125, 6.9466552734375, 7.200927734375, 7.4552001953125, 7.70947265625, 7.9637451171875, 8.218017578125, 8.4722900390625, 8.7265625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 4.0, 6.0, 6.0, 4.0, 6.0, 12.0, 16.0, 18.0, 19.0, 22.0, 35.0, 26.0, 46.0, 36.0, 50.0, 50.0, 65.0, 74.0, 179.0, 1438.0, 352.0, 163.0, 68.0, 52.0, 43.0, 35.0, 32.0, 25.0, 21.0, 35.0, 27.0, 13.0, 16.0, 12.0, 7.0, 10.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-19.875, -19.30419921875, -18.7333984375, -18.16259765625, -17.591796875, -17.02099609375, -16.4501953125, -15.87939453125, -15.30859375, -14.73779296875, -14.1669921875, -13.59619140625, -13.025390625, -12.45458984375, -11.8837890625, -11.31298828125, -10.7421875, -10.17138671875, -9.6005859375, -9.02978515625, -8.458984375, -7.88818359375, -7.3173828125, -6.74658203125, -6.17578125, -5.60498046875, -5.0341796875, -4.46337890625, -3.892578125, -3.32177734375, -2.7509765625, -2.18017578125, -1.609375, -1.03857421875, -0.4677734375, 0.10302734375, 0.673828125, 1.24462890625, 1.8154296875, 2.38623046875, 2.95703125, 3.52783203125, 4.0986328125, 4.66943359375, 5.240234375, 5.81103515625, 6.3818359375, 6.95263671875, 7.5234375, 8.09423828125, 8.6650390625, 9.23583984375, 9.806640625, 10.37744140625, 10.9482421875, 11.51904296875, 12.08984375, 12.66064453125, 13.2314453125, 13.80224609375, 14.373046875, 14.94384765625, 15.5146484375, 16.08544921875, 16.65625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 5.0, 4.0, 9.0, 8.0, 17.0, 16.0, 32.0, 46.0, 41.0, 74.0, 109.0, 175.0, 289.0, 523.0, 1373.0, 12487.0, 553706.0, 2542521.0, 30320.0, 2305.0, 641.0, 369.0, 199.0, 160.0, 71.0, 61.0, 26.0, 26.0, 24.0, 17.0, 14.0, 7.0, 6.0, 5.0, 2.0, 2.0, 8.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.59375, -25.64892578125, -24.7041015625, -23.75927734375, -22.814453125, -21.86962890625, -20.9248046875, -19.97998046875, -19.03515625, -18.09033203125, -17.1455078125, -16.20068359375, -15.255859375, -14.31103515625, -13.3662109375, -12.42138671875, -11.4765625, -10.53173828125, -9.5869140625, -8.64208984375, -7.697265625, -6.75244140625, -5.8076171875, -4.86279296875, -3.91796875, -2.97314453125, -2.0283203125, -1.08349609375, -0.138671875, 0.80615234375, 1.7509765625, 2.69580078125, 3.640625, 4.58544921875, 5.5302734375, 6.47509765625, 7.419921875, 8.36474609375, 9.3095703125, 10.25439453125, 11.19921875, 12.14404296875, 13.0888671875, 14.03369140625, 14.978515625, 15.92333984375, 16.8681640625, 17.81298828125, 18.7578125, 19.70263671875, 20.6474609375, 21.59228515625, 22.537109375, 23.48193359375, 24.4267578125, 25.37158203125, 26.31640625, 27.26123046875, 28.2060546875, 29.15087890625, 30.095703125, 31.04052734375, 31.9853515625, 32.93017578125, 33.875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 10.0, 768.0, 238.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-362.8045959472656, -353.2045593261719, -343.6045227050781, -334.0044860839844, -324.4044494628906, -314.804443359375, -305.20440673828125, -295.6043701171875, -286.00433349609375, -276.404296875, -266.80426025390625, -257.2042236328125, -247.6042022705078, -238.00416564941406, -228.4041290283203, -218.80410766601562, -209.2040557861328, -199.60401916503906, -190.0039825439453, -180.40396118164062, -170.80392456054688, -161.20388793945312, -151.60385131835938, -142.00381469726562, -132.40377807617188, -122.80374145507812, -113.2037124633789, -103.60367584228516, -94.00364685058594, -84.40361022949219, -74.80357360839844, -65.20354461669922, -55.60353088378906, -46.00349807739258, -36.403465270996094, -26.803428649902344, -17.20339584350586, -7.603363037109375, 1.996673583984375, 11.596702575683594, 21.196739196777344, 30.796772003173828, 40.39680480957031, 49.99684143066406, 59.59687423706055, 69.19690704345703, 78.79694366455078, 88.39697265625, 97.99700927734375, 107.5970458984375, 117.19707489013672, 126.79711151123047, 136.3971405029297, 145.99717712402344, 155.5972137451172, 165.19723510742188, 174.79727172851562, 184.39730834960938, 193.99734497070312, 203.59738159179688, 213.19740295410156, 222.7974395751953, 232.39747619628906, 241.99749755859375, 251.59754943847656]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 1.0, 7.0, 7.0, 8.0, 4.0, 9.0, 8.0, 14.0, 18.0, 12.0, 28.0, 17.0, 26.0, 26.0, 25.0, 29.0, 32.0, 35.0, 46.0, 32.0, 41.0, 49.0, 43.0, 38.0, 39.0, 37.0, 34.0, 29.0, 30.0, 26.0, 35.0, 34.0, 34.0, 18.0, 18.0, 17.0, 14.0, 12.0, 14.0, 7.0, 14.0, 11.0, 4.0, 4.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 3.0], "bins": [-35.90821838378906, -34.79539489746094, -33.68257141113281, -32.56974792480469, -31.456926345825195, -30.34410285949707, -29.231281280517578, -28.118457794189453, -27.005634307861328, -25.892810821533203, -24.779987335205078, -23.667165756225586, -22.55434226989746, -21.441518783569336, -20.328697204589844, -19.21587371826172, -18.103050231933594, -16.99022674560547, -15.87740421295166, -14.764581680297852, -13.651758193969727, -12.538934707641602, -11.426112174987793, -10.313289642333984, -9.20046615600586, -8.087642669677734, -6.974820137023926, -5.861997127532959, -4.749174118041992, -3.6363511085510254, -2.5235280990600586, -1.4107050895690918, -0.297882080078125, 0.8149409294128418, 1.9277639389038086, 3.0405869483947754, 4.153409957885742, 5.266232967376709, 6.379055976867676, 7.491878986358643, 8.60470199584961, 9.717525482177734, 10.830348014831543, 11.943170547485352, 13.055994033813477, 14.168817520141602, 15.28164005279541, 16.39446258544922, 17.507286071777344, 18.62010955810547, 19.732933044433594, 20.845754623413086, 21.95857810974121, 23.071401596069336, 24.184223175048828, 25.297046661376953, 26.409870147705078, 27.522693634033203, 28.635517120361328, 29.74833869934082, 30.861162185668945, 31.97398567199707, 33.08680725097656, 34.19963073730469, 35.31245422363281]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 2.0, 3.0, 4.0, 4.0, 7.0, 5.0, 17.0, 13.0, 15.0, 13.0, 13.0, 20.0, 19.0, 26.0, 25.0, 29.0, 36.0, 31.0, 38.0, 43.0, 46.0, 43.0, 38.0, 42.0, 47.0, 50.0, 33.0, 43.0, 36.0, 37.0, 29.0, 27.0, 20.0, 15.0, 22.0, 9.0, 24.0, 19.0, 10.0, 13.0, 8.0, 4.0, 6.0, 4.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1171875, -5.9072265625, -5.697265625, -5.4873046875, -5.27734375, -5.0673828125, -4.857421875, -4.6474609375, -4.4375, -4.2275390625, -4.017578125, -3.8076171875, -3.59765625, -3.3876953125, -3.177734375, -2.9677734375, -2.7578125, -2.5478515625, -2.337890625, -2.1279296875, -1.91796875, -1.7080078125, -1.498046875, -1.2880859375, -1.078125, -0.8681640625, -0.658203125, -0.4482421875, -0.23828125, -0.0283203125, 0.181640625, 0.3916015625, 0.6015625, 0.8115234375, 1.021484375, 1.2314453125, 1.44140625, 1.6513671875, 1.861328125, 2.0712890625, 2.28125, 2.4912109375, 2.701171875, 2.9111328125, 3.12109375, 3.3310546875, 3.541015625, 3.7509765625, 3.9609375, 4.1708984375, 4.380859375, 4.5908203125, 4.80078125, 5.0107421875, 5.220703125, 5.4306640625, 5.640625, 5.8505859375, 6.060546875, 6.2705078125, 6.48046875, 6.6904296875, 6.900390625, 7.1103515625, 7.3203125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 8.0, 7.0, 7.0, 10.0, 19.0, 18.0, 29.0, 34.0, 54.0, 68.0, 75.0, 121.0, 174.0, 284.0, 384.0, 644.0, 1080.0, 1883.0, 3429.0, 7264.0, 19712.0, 77012.0, 370679.0, 1434643.0, 1660833.0, 477064.0, 98234.0, 23270.0, 8293.0, 3799.0, 2024.0, 1105.0, 658.0, 416.0, 285.0, 189.0, 143.0, 95.0, 60.0, 40.0, 42.0, 28.0, 14.0, 21.0, 14.0, 5.0, 9.0, 2.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-8.703125, -8.44775390625, -8.1923828125, -7.93701171875, -7.681640625, -7.42626953125, -7.1708984375, -6.91552734375, -6.66015625, -6.40478515625, -6.1494140625, -5.89404296875, -5.638671875, -5.38330078125, -5.1279296875, -4.87255859375, -4.6171875, -4.36181640625, -4.1064453125, -3.85107421875, -3.595703125, -3.34033203125, -3.0849609375, -2.82958984375, -2.57421875, -2.31884765625, -2.0634765625, -1.80810546875, -1.552734375, -1.29736328125, -1.0419921875, -0.78662109375, -0.53125, -0.27587890625, -0.0205078125, 0.23486328125, 0.490234375, 0.74560546875, 1.0009765625, 1.25634765625, 1.51171875, 1.76708984375, 2.0224609375, 2.27783203125, 2.533203125, 2.78857421875, 3.0439453125, 3.29931640625, 3.5546875, 3.81005859375, 4.0654296875, 4.32080078125, 4.576171875, 4.83154296875, 5.0869140625, 5.34228515625, 5.59765625, 5.85302734375, 6.1083984375, 6.36376953125, 6.619140625, 6.87451171875, 7.1298828125, 7.38525390625, 7.640625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 4.0, 7.0, 9.0, 17.0, 22.0, 17.0, 18.0, 61.0, 56.0, 69.0, 135.0, 223.0, 314.0, 557.0, 727.0, 651.0, 407.0, 259.0, 188.0, 95.0, 72.0, 36.0, 21.0, 25.0, 18.0, 11.0, 13.0, 9.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.65625, -10.3087158203125, -9.961181640625, -9.6136474609375, -9.26611328125, -8.9185791015625, -8.571044921875, -8.2235107421875, -7.8759765625, -7.5284423828125, -7.180908203125, -6.8333740234375, -6.48583984375, -6.1383056640625, -5.790771484375, -5.4432373046875, -5.095703125, -4.7481689453125, -4.400634765625, -4.0531005859375, -3.70556640625, -3.3580322265625, -3.010498046875, -2.6629638671875, -2.3154296875, -1.9678955078125, -1.620361328125, -1.2728271484375, -0.92529296875, -0.5777587890625, -0.230224609375, 0.1173095703125, 0.46484375, 0.8123779296875, 1.159912109375, 1.5074462890625, 1.85498046875, 2.2025146484375, 2.550048828125, 2.8975830078125, 3.2451171875, 3.5926513671875, 3.940185546875, 4.2877197265625, 4.63525390625, 4.9827880859375, 5.330322265625, 5.6778564453125, 6.025390625, 6.3729248046875, 6.720458984375, 7.0679931640625, 7.41552734375, 7.7630615234375, 8.110595703125, 8.4581298828125, 8.8056640625, 9.1531982421875, 9.500732421875, 9.8482666015625, 10.19580078125, 10.5433349609375, 10.890869140625, 11.2384033203125, 11.5859375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 9.0, 3.0, 9.0, 16.0, 35.0, 41.0, 42.0, 79.0, 120.0, 212.0, 311.0, 710.0, 1500.0, 3634.0, 11162.0, 43019.0, 333421.0, 3208993.0, 515509.0, 54512.0, 13068.0, 4342.0, 1670.0, 771.0, 409.0, 246.0, 151.0, 100.0, 58.0, 34.0, 29.0, 16.0, 16.0, 11.0, 9.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.578125, -17.0545654296875, -16.531005859375, -16.0074462890625, -15.48388671875, -14.9603271484375, -14.436767578125, -13.9132080078125, -13.3896484375, -12.8660888671875, -12.342529296875, -11.8189697265625, -11.29541015625, -10.7718505859375, -10.248291015625, -9.7247314453125, -9.201171875, -8.6776123046875, -8.154052734375, -7.6304931640625, -7.10693359375, -6.5833740234375, -6.059814453125, -5.5362548828125, -5.0126953125, -4.4891357421875, -3.965576171875, -3.4420166015625, -2.91845703125, -2.3948974609375, -1.871337890625, -1.3477783203125, -0.82421875, -0.3006591796875, 0.222900390625, 0.7464599609375, 1.27001953125, 1.7935791015625, 2.317138671875, 2.8406982421875, 3.3642578125, 3.8878173828125, 4.411376953125, 4.9349365234375, 5.45849609375, 5.9820556640625, 6.505615234375, 7.0291748046875, 7.552734375, 8.0762939453125, 8.599853515625, 9.1234130859375, 9.64697265625, 10.1705322265625, 10.694091796875, 11.2176513671875, 11.7412109375, 12.2647705078125, 12.788330078125, 13.3118896484375, 13.83544921875, 14.3590087890625, 14.882568359375, 15.4061279296875, 15.9296875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 11.0, 37.0, 107.0, 266.0, 276.0, 185.0, 87.0, 30.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.15627670288086, -19.474689483642578, -16.793102264404297, -14.111513137817383, -11.429925918579102, -8.74833869934082, -6.066749572753906, -3.385162353515625, -0.7035751342773438, 1.9780125617980957, 4.659600257873535, 7.341188430786133, 10.022775650024414, 12.704362869262695, 15.38595199584961, 18.06753921508789, 20.749126434326172, 23.430713653564453, 26.112300872802734, 28.79388999938965, 31.47547721862793, 34.157066345214844, 36.838653564453125, 39.520240783691406, 42.20182800292969, 44.88341522216797, 47.56500244140625, 50.24658966064453, 52.92817687988281, 55.609764099121094, 58.29135513305664, 60.97294235229492, 63.65452575683594, 66.33611297607422, 69.0177001953125, 71.69928741455078, 74.38087463378906, 77.06246185302734, 79.74404907226562, 82.42564392089844, 85.10722351074219, 87.78881072998047, 90.47039794921875, 93.15198516845703, 95.83357238769531, 98.5151596069336, 101.19674682617188, 103.87834167480469, 106.55992889404297, 109.24151611328125, 111.92310333251953, 114.60469055175781, 117.2862777709961, 119.96786499023438, 122.64945983886719, 125.33103942871094, 128.01263427734375, 130.69422912597656, 133.3758087158203, 136.05740356445312, 138.73898315429688, 141.4205780029297, 144.10215759277344, 146.78375244140625, 149.46533203125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 7.0, 7.0, 9.0, 10.0, 5.0, 12.0, 5.0, 16.0, 6.0, 24.0, 21.0, 32.0, 22.0, 32.0, 27.0, 28.0, 29.0, 36.0, 34.0, 52.0, 40.0, 32.0, 38.0, 48.0, 47.0, 39.0, 51.0, 31.0, 33.0, 32.0, 37.0, 33.0, 22.0, 12.0, 22.0, 15.0, 12.0, 9.0, 9.0, 8.0, 3.0, 7.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-31.46980857849121, -30.543197631835938, -29.61658477783203, -28.689973831176758, -27.76336097717285, -26.836750030517578, -25.910137176513672, -24.9835262298584, -24.056915283203125, -23.13030433654785, -22.203691482543945, -21.277080535888672, -20.350467681884766, -19.423856735229492, -18.49724578857422, -17.570632934570312, -16.644020080566406, -15.717408180236816, -14.790796279907227, -13.864185333251953, -12.937572479248047, -12.010961532592773, -11.084349632263184, -10.157737731933594, -9.231125831604004, -8.304513931274414, -7.377902030944824, -6.451290607452393, -5.524678707122803, -4.598066806793213, -3.6714553833007812, -2.7448434829711914, -1.8182296752929688, -0.8916178941726685, 0.034993886947631836, 0.9616055488586426, 1.8882174491882324, 2.8148293495178223, 3.741440773010254, 4.668052673339844, 5.594664573669434, 6.521276473999023, 7.447888374328613, 8.374500274658203, 9.301111221313477, 10.227724075317383, 11.154335021972656, 12.080946922302246, 13.007558822631836, 13.934170722961426, 14.860782623291016, 15.787393569946289, 16.714006423950195, 17.64061737060547, 18.567230224609375, 19.49384117126465, 20.420452117919922, 21.347063064575195, 22.2736759185791, 23.200286865234375, 24.12689971923828, 25.053510665893555, 25.980121612548828, 26.906734466552734, 27.83334732055664]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 5.0, 3.0, 8.0, 5.0, 7.0, 9.0, 8.0, 9.0, 12.0, 18.0, 21.0, 23.0, 28.0, 33.0, 23.0, 40.0, 33.0, 39.0, 36.0, 52.0, 39.0, 38.0, 42.0, 57.0, 33.0, 36.0, 31.0, 32.0, 29.0, 28.0, 29.0, 34.0, 19.0, 20.0, 19.0, 15.0, 18.0, 10.0, 8.0, 10.0, 10.0, 10.0, 5.0, 5.0, 1.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.61328125, -6.40802001953125, -6.2027587890625, -5.99749755859375, -5.792236328125, -5.58697509765625, -5.3817138671875, -5.17645263671875, -4.97119140625, -4.76593017578125, -4.5606689453125, -4.35540771484375, -4.150146484375, -3.94488525390625, -3.7396240234375, -3.53436279296875, -3.3291015625, -3.12384033203125, -2.9185791015625, -2.71331787109375, -2.508056640625, -2.30279541015625, -2.0975341796875, -1.89227294921875, -1.68701171875, -1.48175048828125, -1.2764892578125, -1.07122802734375, -0.865966796875, -0.66070556640625, -0.4554443359375, -0.25018310546875, -0.044921875, 0.16033935546875, 0.3656005859375, 0.57086181640625, 0.776123046875, 0.98138427734375, 1.1866455078125, 1.39190673828125, 1.59716796875, 1.80242919921875, 2.0076904296875, 2.21295166015625, 2.418212890625, 2.62347412109375, 2.8287353515625, 3.03399658203125, 3.2392578125, 3.44451904296875, 3.6497802734375, 3.85504150390625, 4.060302734375, 4.26556396484375, 4.4708251953125, 4.67608642578125, 4.88134765625, 5.08660888671875, 5.2918701171875, 5.49713134765625, 5.702392578125, 5.90765380859375, 6.1129150390625, 6.31817626953125, 6.5234375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 12.0, 12.0, 18.0, 42.0, 65.0, 92.0, 161.0, 251.0, 357.0, 580.0, 895.0, 1178.0, 1956.0, 3026.0, 4539.0, 7349.0, 11501.0, 18434.0, 30857.0, 53748.0, 98229.0, 196597.0, 284532.0, 147429.0, 76829.0, 42438.0, 25047.0, 15401.0, 9587.0, 6129.0, 3891.0, 2480.0, 1702.0, 1106.0, 777.0, 463.0, 277.0, 223.0, 130.0, 73.0, 44.0, 29.0, 22.0, 18.0, 9.0, 3.0, 1.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.30306243896484375, -0.2933807373046875, -0.28369903564453125, -0.274017333984375, -0.26433563232421875, -0.2546539306640625, -0.24497222900390625, -0.23529052734375, -0.22560882568359375, -0.2159271240234375, -0.20624542236328125, -0.196563720703125, -0.18688201904296875, -0.1772003173828125, -0.16751861572265625, -0.1578369140625, -0.14815521240234375, -0.1384735107421875, -0.12879180908203125, -0.119110107421875, -0.10942840576171875, -0.0997467041015625, -0.09006500244140625, -0.08038330078125, -0.07070159912109375, -0.0610198974609375, -0.05133819580078125, -0.041656494140625, -0.03197479248046875, -0.0222930908203125, -0.01261138916015625, -0.0029296875, 0.00675201416015625, 0.0164337158203125, 0.02611541748046875, 0.035797119140625, 0.04547882080078125, 0.0551605224609375, 0.06484222412109375, 0.07452392578125, 0.08420562744140625, 0.0938873291015625, 0.10356903076171875, 0.113250732421875, 0.12293243408203125, 0.1326141357421875, 0.14229583740234375, 0.1519775390625, 0.16165924072265625, 0.1713409423828125, 0.18102264404296875, 0.190704345703125, 0.20038604736328125, 0.2100677490234375, 0.21974945068359375, 0.22943115234375, 0.23911285400390625, 0.2487945556640625, 0.25847625732421875, 0.268157958984375, 0.27783966064453125, 0.2875213623046875, 0.29720306396484375, 0.306884765625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 4.0, 5.0, 8.0, 10.0, 8.0, 11.0, 5.0, 21.0, 18.0, 30.0, 31.0, 30.0, 31.0, 37.0, 49.0, 44.0, 63.0, 55.0, 1058.0, 44.0, 49.0, 46.0, 46.0, 45.0, 35.0, 28.0, 37.0, 27.0, 32.0, 20.0, 21.0, 20.0, 8.0, 10.0, 9.0, 9.0, 5.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.53515625, -5.37103271484375, -5.2069091796875, -5.04278564453125, -4.878662109375, -4.71453857421875, -4.5504150390625, -4.38629150390625, -4.22216796875, -4.05804443359375, -3.8939208984375, -3.72979736328125, -3.565673828125, -3.40155029296875, -3.2374267578125, -3.07330322265625, -2.9091796875, -2.74505615234375, -2.5809326171875, -2.41680908203125, -2.252685546875, -2.08856201171875, -1.9244384765625, -1.76031494140625, -1.59619140625, -1.43206787109375, -1.2679443359375, -1.10382080078125, -0.939697265625, -0.77557373046875, -0.6114501953125, -0.44732666015625, -0.283203125, -0.11907958984375, 0.0450439453125, 0.20916748046875, 0.373291015625, 0.53741455078125, 0.7015380859375, 0.86566162109375, 1.02978515625, 1.19390869140625, 1.3580322265625, 1.52215576171875, 1.686279296875, 1.85040283203125, 2.0145263671875, 2.17864990234375, 2.3427734375, 2.50689697265625, 2.6710205078125, 2.83514404296875, 2.999267578125, 3.16339111328125, 3.3275146484375, 3.49163818359375, 3.65576171875, 3.81988525390625, 3.9840087890625, 4.14813232421875, 4.312255859375, 4.47637939453125, 4.6405029296875, 4.80462646484375, 4.96875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 16.0, 9.0, 25.0, 22.0, 29.0, 35.0, 49.0, 76.0, 73.0, 133.0, 186.0, 243.0, 324.0, 492.0, 654.0, 879.0, 1226.0, 1667.0, 2456.0, 3574.0, 4955.0, 7081.0, 10610.0, 15706.0, 23857.0, 36767.0, 58570.0, 97580.0, 169920.0, 1281235.0, 144426.0, 84053.0, 50971.0, 32588.0, 20965.0, 13941.0, 9440.0, 6619.0, 4530.0, 3150.0, 2239.0, 1613.0, 1129.0, 817.0, 580.0, 458.0, 360.0, 238.0, 162.0, 110.0, 78.0, 67.0, 37.0, 35.0, 23.0, 27.0, 14.0, 12.0, 10.0, 1.0, 3.0], "bins": [-0.1976318359375, -0.19152450561523438, -0.18541717529296875, -0.17930984497070312, -0.1732025146484375, -0.16709518432617188, -0.16098785400390625, -0.15488052368164062, -0.148773193359375, -0.14266586303710938, -0.13655853271484375, -0.13045120239257812, -0.1243438720703125, -0.11823654174804688, -0.11212921142578125, -0.10602188110351562, -0.09991455078125, -0.09380722045898438, -0.08769989013671875, -0.08159255981445312, -0.0754852294921875, -0.06937789916992188, -0.06327056884765625, -0.057163238525390625, -0.051055908203125, -0.044948577880859375, -0.03884124755859375, -0.032733917236328125, -0.0266265869140625, -0.020519256591796875, -0.01441192626953125, -0.008304595947265625, -0.002197265625, 0.003910064697265625, 0.01001739501953125, 0.016124725341796875, 0.0222320556640625, 0.028339385986328125, 0.03444671630859375, 0.040554046630859375, 0.046661376953125, 0.052768707275390625, 0.05887603759765625, 0.06498336791992188, 0.0710906982421875, 0.07719802856445312, 0.08330535888671875, 0.08941268920898438, 0.09552001953125, 0.10162734985351562, 0.10773468017578125, 0.11384201049804688, 0.1199493408203125, 0.12605667114257812, 0.13216400146484375, 0.13827133178710938, 0.144378662109375, 0.15048599243164062, 0.15659332275390625, 0.16270065307617188, 0.1688079833984375, 0.17491531372070312, 0.18102264404296875, 0.18712997436523438, 0.1932373046875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 11.0, 9.0, 11.0, 10.0, 15.0, 15.0, 31.0, 39.0, 58.0, 57.0, 90.0, 83.0, 109.0, 81.0, 70.0, 58.0, 41.0, 45.0, 34.0, 19.0, 21.0, 15.0, 13.0, 16.0, 5.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.0004286766052246094, -0.00041804462671279907, -0.00040741264820098877, -0.00039678066968917847, -0.00038614869117736816, -0.00037551671266555786, -0.00036488473415374756, -0.00035425275564193726, -0.00034362077713012695, -0.00033298879861831665, -0.00032235682010650635, -0.00031172484159469604, -0.00030109286308288574, -0.00029046088457107544, -0.00027982890605926514, -0.00026919692754745483, -0.00025856494903564453, -0.00024793297052383423, -0.00023730099201202393, -0.00022666901350021362, -0.00021603703498840332, -0.00020540505647659302, -0.00019477307796478271, -0.0001841410994529724, -0.0001735091209411621, -0.0001628771424293518, -0.0001522451639175415, -0.0001416131854057312, -0.0001309812068939209, -0.0001203492283821106, -0.00010971724987030029, -9.908527135848999e-05, -8.845329284667969e-05, -7.782131433486938e-05, -6.718933582305908e-05, -5.655735731124878e-05, -4.5925378799438477e-05, -3.5293400287628174e-05, -2.466142177581787e-05, -1.4029443264007568e-05, -3.3974647521972656e-06, 7.234513759613037e-06, 1.786649227142334e-05, 2.8498470783233643e-05, 3.9130449295043945e-05, 4.976242780685425e-05, 6.039440631866455e-05, 7.102638483047485e-05, 8.165836334228516e-05, 9.229034185409546e-05, 0.00010292232036590576, 0.00011355429887771606, 0.00012418627738952637, 0.00013481825590133667, 0.00014545023441314697, 0.00015608221292495728, 0.00016671419143676758, 0.00017734616994857788, 0.00018797814846038818, 0.00019861012697219849, 0.0002092421054840088, 0.0002198740839958191, 0.0002305060625076294, 0.0002411380410194397, 0.00025177001953125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 4.0, 6.0, 8.0, 10.0, 16.0, 14.0, 22.0, 22.0, 32.0, 49.0, 62.0, 88.0, 146.0, 176.0, 359.0, 706.0, 5878.0, 1024920.0, 14185.0, 805.0, 369.0, 229.0, 146.0, 89.0, 38.0, 39.0, 25.0, 21.0, 26.0, 17.0, 13.0, 9.0, 11.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004779815673828125, -0.0045771002769470215, -0.004374384880065918, -0.0041716694831848145, -0.003968954086303711, -0.0037662386894226074, -0.003563523292541504, -0.0033608078956604004, -0.003158092498779297, -0.0029553771018981934, -0.00275266170501709, -0.0025499463081359863, -0.002347230911254883, -0.0021445155143737793, -0.0019418001174926758, -0.0017390847206115723, -0.0015363693237304688, -0.0013336539268493652, -0.0011309385299682617, -0.0009282231330871582, -0.0007255077362060547, -0.0005227923393249512, -0.00032007694244384766, -0.00011736154556274414, 8.535385131835938e-05, 0.0002880692481994629, 0.0004907846450805664, 0.0006935000419616699, 0.0008962154388427734, 0.001098930835723877, 0.0013016462326049805, 0.001504361629486084, 0.0017070770263671875, 0.001909792423248291, 0.0021125078201293945, 0.002315223217010498, 0.0025179386138916016, 0.002720654010772705, 0.0029233694076538086, 0.003126084804534912, 0.0033288002014160156, 0.003531515598297119, 0.0037342309951782227, 0.003936946392059326, 0.00413966178894043, 0.004342377185821533, 0.004545092582702637, 0.00474780797958374, 0.004950523376464844, 0.005153238773345947, 0.005355954170227051, 0.005558669567108154, 0.005761384963989258, 0.005964100360870361, 0.006166815757751465, 0.006369531154632568, 0.006572246551513672, 0.006774961948394775, 0.006977677345275879, 0.007180392742156982, 0.007383108139038086, 0.0075858235359191895, 0.007788538932800293, 0.007991254329681396, 0.0081939697265625]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 15.0, 90.0, 472.0, 358.0, 63.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013327023480087519, -0.0013069864362478256, -0.0012812705244868994, -0.0012555544963106513, -0.001229838584549725, -0.0012041226727887988, -0.0011784066446125507, -0.0011526907328516245, -0.0011269748210906982, -0.001101258909329772, -0.0010755429975688457, -0.0010498269693925977, -0.0010241110576316714, -0.0009983951458707452, -0.000972679175902158, -0.0009469632059335709, -0.0009212472941726446, -0.0008955313824117184, -0.0008698154124431312, -0.000844099442474544, -0.0008183835307136178, -0.0007926676189526916, -0.0007669516489841044, -0.0007412356790155172, -0.000715519767254591, -0.0006898038554936647, -0.0006640878855250776, -0.0006383719155564904, -0.0006126560037955642, -0.0005869400920346379, -0.0005612241220660508, -0.0005355081520974636, -0.0005097922403365374, -0.00048407629947178066, -0.00045836035860702395, -0.00043264441774226725, -0.00040692847687751055, -0.00038121253601275384, -0.00035549659514799714, -0.00032978065428324044, -0.0003040646843146533, -0.0002783487434498966, -0.00025263280258513987, -0.00022691686172038317, -0.00020120092085562646, -0.00017548497999086976, -0.00014976903912611306, -0.00012405309826135635, -9.833715739659965e-05, -7.262121653184295e-05, -4.6905275667086244e-05, -2.118933480232954e-05, 4.526606062427163e-06, 3.0242546927183867e-05, 5.595848779194057e-05, 8.167442865669727e-05, 0.00010739036952145398, 0.00013310631038621068, 0.00015882225125096738, 0.0001845381921157241, 0.0002102541329804808, 0.0002359700738452375, 0.0002616860147099942, 0.0002874019555747509, 0.0003131178964395076]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 6.0, 7.0, 13.0, 14.0, 8.0, 14.0, 10.0, 21.0, 21.0, 21.0, 25.0, 33.0, 29.0, 38.0, 33.0, 47.0, 44.0, 34.0, 37.0, 35.0, 50.0, 33.0, 31.0, 33.0, 34.0, 39.0, 36.0, 39.0, 29.0, 22.0, 33.0, 23.0, 23.0, 16.0, 14.0, 9.0, 5.0, 10.0, 8.0, 10.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00014925003051757812, -0.0001447303220629692, -0.0001402106136083603, -0.00013569090515375137, -0.00013117119669914246, -0.00012665148824453354, -0.00012213177978992462, -0.0001176120713353157, -0.00011309236288070679, -0.00010857265442609787, -0.00010405294597148895, -9.953323751688004e-05, -9.501352906227112e-05, -9.04938206076622e-05, -8.597411215305328e-05, -8.145440369844437e-05, -7.693469524383545e-05, -7.241498678922653e-05, -6.789527833461761e-05, -6.33755698800087e-05, -5.885586142539978e-05, -5.433615297079086e-05, -4.9816444516181946e-05, -4.529673606157303e-05, -4.077702760696411e-05, -3.6257319152355194e-05, -3.173761069774628e-05, -2.721790224313736e-05, -2.2698193788528442e-05, -1.8178485333919525e-05, -1.3658776879310608e-05, -9.13906842470169e-06, -4.6193599700927734e-06, -9.96515154838562e-08, 4.420056939125061e-06, 8.939765393733978e-06, 1.3459473848342896e-05, 1.7979182302951813e-05, 2.249889075756073e-05, 2.7018599212169647e-05, 3.1538307666778564e-05, 3.605801612138748e-05, 4.05777245759964e-05, 4.5097433030605316e-05, 4.9617141485214233e-05, 5.413684993982315e-05, 5.865655839443207e-05, 6.317626684904099e-05, 6.76959753036499e-05, 7.221568375825882e-05, 7.673539221286774e-05, 8.125510066747665e-05, 8.577480912208557e-05, 9.029451757669449e-05, 9.48142260313034e-05, 9.933393448591232e-05, 0.00010385364294052124, 0.00010837335139513016, 0.00011289305984973907, 0.00011741276830434799, 0.00012193247675895691, 0.00012645218521356583, 0.00013097189366817474, 0.00013549160212278366, 0.00014001131057739258]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 3.0, 2.0, 5.0, 3.0, 8.0, 5.0, 7.0, 9.0, 8.0, 9.0, 12.0, 18.0, 21.0, 23.0, 28.0, 33.0, 23.0, 40.0, 33.0, 39.0, 36.0, 52.0, 39.0, 38.0, 42.0, 57.0, 33.0, 36.0, 31.0, 32.0, 29.0, 28.0, 29.0, 34.0, 19.0, 20.0, 19.0, 15.0, 18.0, 10.0, 8.0, 10.0, 10.0, 10.0, 5.0, 5.0, 1.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.61328125, -6.40802001953125, -6.2027587890625, -5.99749755859375, -5.792236328125, -5.58697509765625, -5.3817138671875, -5.17645263671875, -4.97119140625, -4.76593017578125, -4.5606689453125, -4.35540771484375, -4.150146484375, -3.94488525390625, -3.7396240234375, -3.53436279296875, -3.3291015625, -3.12384033203125, -2.9185791015625, -2.71331787109375, -2.508056640625, -2.30279541015625, -2.0975341796875, -1.89227294921875, -1.68701171875, -1.48175048828125, -1.2764892578125, -1.07122802734375, -0.865966796875, -0.66070556640625, -0.4554443359375, -0.25018310546875, -0.044921875, 0.16033935546875, 0.3656005859375, 0.57086181640625, 0.776123046875, 0.98138427734375, 1.1866455078125, 1.39190673828125, 1.59716796875, 1.80242919921875, 2.0076904296875, 2.21295166015625, 2.418212890625, 2.62347412109375, 2.8287353515625, 3.03399658203125, 3.2392578125, 3.44451904296875, 3.6497802734375, 3.85504150390625, 4.060302734375, 4.26556396484375, 4.4708251953125, 4.67608642578125, 4.88134765625, 5.08660888671875, 5.2918701171875, 5.49713134765625, 5.702392578125, 5.90765380859375, 6.1129150390625, 6.31817626953125, 6.5234375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 10.0, 12.0, 20.0, 23.0, 29.0, 34.0, 45.0, 65.0, 85.0, 140.0, 161.0, 247.0, 369.0, 581.0, 962.0, 1657.0, 3050.0, 6055.0, 13413.0, 33891.0, 96368.0, 270738.0, 379119.0, 151718.0, 52094.0, 19640.0, 8421.0, 4090.0, 2122.0, 1167.0, 706.0, 467.0, 295.0, 218.0, 157.0, 110.0, 64.0, 54.0, 39.0, 27.0, 24.0, 12.0, 17.0, 11.0, 7.0, 3.0, 9.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.6796875, -8.401611328125, -8.12353515625, -7.845458984375, -7.5673828125, -7.289306640625, -7.01123046875, -6.733154296875, -6.455078125, -6.177001953125, -5.89892578125, -5.620849609375, -5.3427734375, -5.064697265625, -4.78662109375, -4.508544921875, -4.23046875, -3.952392578125, -3.67431640625, -3.396240234375, -3.1181640625, -2.840087890625, -2.56201171875, -2.283935546875, -2.005859375, -1.727783203125, -1.44970703125, -1.171630859375, -0.8935546875, -0.615478515625, -0.33740234375, -0.059326171875, 0.21875, 0.496826171875, 0.77490234375, 1.052978515625, 1.3310546875, 1.609130859375, 1.88720703125, 2.165283203125, 2.443359375, 2.721435546875, 2.99951171875, 3.277587890625, 3.5556640625, 3.833740234375, 4.11181640625, 4.389892578125, 4.66796875, 4.946044921875, 5.22412109375, 5.502197265625, 5.7802734375, 6.058349609375, 6.33642578125, 6.614501953125, 6.892578125, 7.170654296875, 7.44873046875, 7.726806640625, 8.0048828125, 8.282958984375, 8.56103515625, 8.839111328125, 9.1171875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 10.0, 6.0, 8.0, 10.0, 11.0, 15.0, 20.0, 23.0, 21.0, 29.0, 36.0, 39.0, 47.0, 52.0, 62.0, 89.0, 194.0, 1377.0, 374.0, 167.0, 91.0, 49.0, 63.0, 51.0, 57.0, 31.0, 32.0, 26.0, 17.0, 11.0, 7.0, 8.0, 3.0, 4.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.796875, -16.19677734375, -15.5966796875, -14.99658203125, -14.396484375, -13.79638671875, -13.1962890625, -12.59619140625, -11.99609375, -11.39599609375, -10.7958984375, -10.19580078125, -9.595703125, -8.99560546875, -8.3955078125, -7.79541015625, -7.1953125, -6.59521484375, -5.9951171875, -5.39501953125, -4.794921875, -4.19482421875, -3.5947265625, -2.99462890625, -2.39453125, -1.79443359375, -1.1943359375, -0.59423828125, 0.005859375, 0.60595703125, 1.2060546875, 1.80615234375, 2.40625, 3.00634765625, 3.6064453125, 4.20654296875, 4.806640625, 5.40673828125, 6.0068359375, 6.60693359375, 7.20703125, 7.80712890625, 8.4072265625, 9.00732421875, 9.607421875, 10.20751953125, 10.8076171875, 11.40771484375, 12.0078125, 12.60791015625, 13.2080078125, 13.80810546875, 14.408203125, 15.00830078125, 15.6083984375, 16.20849609375, 16.80859375, 17.40869140625, 18.0087890625, 18.60888671875, 19.208984375, 19.80908203125, 20.4091796875, 21.00927734375, 21.609375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 9.0, 5.0, 17.0, 9.0, 19.0, 24.0, 26.0, 49.0, 60.0, 90.0, 135.0, 187.0, 298.0, 514.0, 1081.0, 5032.0, 143675.0, 2925395.0, 63500.0, 3221.0, 927.0, 461.0, 278.0, 207.0, 125.0, 98.0, 63.0, 36.0, 38.0, 30.0, 22.0, 14.0, 14.0, 6.0, 4.0, 7.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.109375, -25.190185546875, -24.27099609375, -23.351806640625, -22.4326171875, -21.513427734375, -20.59423828125, -19.675048828125, -18.755859375, -17.836669921875, -16.91748046875, -15.998291015625, -15.0791015625, -14.159912109375, -13.24072265625, -12.321533203125, -11.40234375, -10.483154296875, -9.56396484375, -8.644775390625, -7.7255859375, -6.806396484375, -5.88720703125, -4.968017578125, -4.048828125, -3.129638671875, -2.21044921875, -1.291259765625, -0.3720703125, 0.547119140625, 1.46630859375, 2.385498046875, 3.3046875, 4.223876953125, 5.14306640625, 6.062255859375, 6.9814453125, 7.900634765625, 8.81982421875, 9.739013671875, 10.658203125, 11.577392578125, 12.49658203125, 13.415771484375, 14.3349609375, 15.254150390625, 16.17333984375, 17.092529296875, 18.01171875, 18.930908203125, 19.85009765625, 20.769287109375, 21.6884765625, 22.607666015625, 23.52685546875, 24.446044921875, 25.365234375, 26.284423828125, 27.20361328125, 28.122802734375, 29.0419921875, 29.961181640625, 30.88037109375, 31.799560546875, 32.71875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 915.0, 104.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-437.2157897949219, -422.03289794921875, -406.8500061035156, -391.6671142578125, -376.4842224121094, -361.30133056640625, -346.1184387207031, -330.935546875, -315.7526550292969, -300.56976318359375, -285.3868713378906, -270.2039794921875, -255.02108764648438, -239.83819580078125, -224.65530395507812, -209.472412109375, -194.28952026367188, -179.10662841796875, -163.92373657226562, -148.7408447265625, -133.55795288085938, -118.37506103515625, -103.19216918945312, -88.00927734375, -72.82638549804688, -57.64349365234375, -42.460601806640625, -27.2777099609375, -12.094818115234375, 3.08807373046875, 18.270965576171875, 33.453857421875, 48.63671875, 63.819610595703125, 79.00250244140625, 94.18539428710938, 109.3682861328125, 124.55117797851562, 139.73406982421875, 154.91696166992188, 170.099853515625, 185.28274536132812, 200.46563720703125, 215.64852905273438, 230.8314208984375, 246.01431274414062, 261.19720458984375, 276.3800964355469, 291.56298828125, 306.7458801269531, 321.92877197265625, 337.1116638183594, 352.2945556640625, 367.4774475097656, 382.66033935546875, 397.8432312011719, 413.026123046875, 428.2090148925781, 443.39190673828125, 458.5747985839844, 473.7576904296875, 488.9405822753906, 504.12347412109375, 519.306396484375, 534.4892578125]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 11.0, 8.0, 15.0, 9.0, 6.0, 22.0, 21.0, 21.0, 39.0, 32.0, 33.0, 48.0, 28.0, 39.0, 47.0, 30.0, 48.0, 44.0, 54.0, 45.0, 44.0, 34.0, 34.0, 36.0, 43.0, 32.0, 26.0, 24.0, 22.0, 18.0, 13.0, 9.0, 17.0, 12.0, 12.0, 5.0, 6.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-47.79768753051758, -46.52851486206055, -45.259342193603516, -43.990169525146484, -42.72099685668945, -41.45182800292969, -40.182655334472656, -38.913482666015625, -37.644309997558594, -36.37513732910156, -35.10596466064453, -33.8367919921875, -32.56761932373047, -31.29844856262207, -30.02927589416504, -28.76010513305664, -27.490930557250977, -26.221757888793945, -24.952585220336914, -23.683414459228516, -22.414241790771484, -21.145069122314453, -19.875896453857422, -18.60672378540039, -17.33755111694336, -16.068378448486328, -14.799206733703613, -13.530034065246582, -12.260862350463867, -10.991689682006836, -9.722517013549805, -8.45334529876709, -7.184173583984375, -5.915001392364502, -4.645829200744629, -3.3766565322875977, -2.1074843406677246, -0.8383121490478516, 0.4308605194091797, 1.7000322341918945, 2.969204902648926, 4.238377094268799, 5.507549285888672, 6.776721954345703, 8.045894622802734, 9.31506633758545, 10.58423900604248, 11.853410720825195, 13.122583389282227, 14.391756057739258, 15.660927772521973, 16.930099487304688, 18.19927215576172, 19.46844482421875, 20.73761749267578, 22.006790161132812, 23.275962829589844, 24.545135498046875, 25.814308166503906, 27.083480834960938, 28.352651596069336, 29.621824264526367, 30.8909969329834, 32.1601676940918, 33.42934036254883]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 4.0, 3.0, 3.0, 2.0, 4.0, 5.0, 7.0, 6.0, 5.0, 12.0, 13.0, 10.0, 12.0, 18.0, 22.0, 26.0, 30.0, 39.0, 31.0, 29.0, 32.0, 38.0, 37.0, 24.0, 46.0, 35.0, 33.0, 42.0, 29.0, 39.0, 33.0, 27.0, 27.0, 27.0, 32.0, 25.0, 27.0, 26.0, 26.0, 16.0, 15.0, 13.0, 11.0, 11.0, 8.0, 5.0, 8.0, 3.0, 5.0, 8.0, 5.0, 1.0, 4.0, 4.0, 1.0, 3.0], "bins": [-6.42578125, -6.23797607421875, -6.0501708984375, -5.86236572265625, -5.674560546875, -5.48675537109375, -5.2989501953125, -5.11114501953125, -4.92333984375, -4.73553466796875, -4.5477294921875, -4.35992431640625, -4.172119140625, -3.98431396484375, -3.7965087890625, -3.60870361328125, -3.4208984375, -3.23309326171875, -3.0452880859375, -2.85748291015625, -2.669677734375, -2.48187255859375, -2.2940673828125, -2.10626220703125, -1.91845703125, -1.73065185546875, -1.5428466796875, -1.35504150390625, -1.167236328125, -0.97943115234375, -0.7916259765625, -0.60382080078125, -0.416015625, -0.22821044921875, -0.0404052734375, 0.14739990234375, 0.335205078125, 0.52301025390625, 0.7108154296875, 0.89862060546875, 1.08642578125, 1.27423095703125, 1.4620361328125, 1.64984130859375, 1.837646484375, 2.02545166015625, 2.2132568359375, 2.40106201171875, 2.5888671875, 2.77667236328125, 2.9644775390625, 3.15228271484375, 3.340087890625, 3.52789306640625, 3.7156982421875, 3.90350341796875, 4.09130859375, 4.27911376953125, 4.4669189453125, 4.65472412109375, 4.842529296875, 5.03033447265625, 5.2181396484375, 5.40594482421875, 5.59375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 0.0, 2.0, 4.0, 3.0, 11.0, 13.0, 22.0, 14.0, 24.0, 22.0, 20.0, 33.0, 48.0, 59.0, 60.0, 94.0, 116.0, 164.0, 224.0, 327.0, 459.0, 1894.0, 47737.0, 4122540.0, 17479.0, 1274.0, 417.0, 302.0, 216.0, 156.0, 121.0, 91.0, 63.0, 43.0, 41.0, 36.0, 33.0, 22.0, 21.0, 16.0, 10.0, 13.0, 8.0, 9.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.0, -62.02490234375, -60.0498046875, -58.07470703125, -56.099609375, -54.12451171875, -52.1494140625, -50.17431640625, -48.19921875, -46.22412109375, -44.2490234375, -42.27392578125, -40.298828125, -38.32373046875, -36.3486328125, -34.37353515625, -32.3984375, -30.42333984375, -28.4482421875, -26.47314453125, -24.498046875, -22.52294921875, -20.5478515625, -18.57275390625, -16.59765625, -14.62255859375, -12.6474609375, -10.67236328125, -8.697265625, -6.72216796875, -4.7470703125, -2.77197265625, -0.796875, 1.17822265625, 3.1533203125, 5.12841796875, 7.103515625, 9.07861328125, 11.0537109375, 13.02880859375, 15.00390625, 16.97900390625, 18.9541015625, 20.92919921875, 22.904296875, 24.87939453125, 26.8544921875, 28.82958984375, 30.8046875, 32.77978515625, 34.7548828125, 36.72998046875, 38.705078125, 40.68017578125, 42.6552734375, 44.63037109375, 46.60546875, 48.58056640625, 50.5556640625, 52.53076171875, 54.505859375, 56.48095703125, 58.4560546875, 60.43115234375, 62.40625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 6.0, 3.0, 4.0, 5.0, 8.0, 9.0, 7.0, 7.0, 12.0, 11.0, 14.0, 19.0, 21.0, 38.0, 47.0, 51.0, 68.0, 98.0, 149.0, 232.0, 352.0, 494.0, 565.0, 549.0, 395.0, 257.0, 187.0, 114.0, 74.0, 71.0, 40.0, 29.0, 30.0, 24.0, 17.0, 20.0, 15.0, 7.0, 7.0, 8.0, 6.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.28125, -10.98138427734375, -10.6815185546875, -10.38165283203125, -10.081787109375, -9.78192138671875, -9.4820556640625, -9.18218994140625, -8.88232421875, -8.58245849609375, -8.2825927734375, -7.98272705078125, -7.682861328125, -7.38299560546875, -7.0831298828125, -6.78326416015625, -6.4833984375, -6.18353271484375, -5.8836669921875, -5.58380126953125, -5.283935546875, -4.98406982421875, -4.6842041015625, -4.38433837890625, -4.08447265625, -3.78460693359375, -3.4847412109375, -3.18487548828125, -2.885009765625, -2.58514404296875, -2.2852783203125, -1.98541259765625, -1.685546875, -1.38568115234375, -1.0858154296875, -0.78594970703125, -0.486083984375, -0.18621826171875, 0.1136474609375, 0.41351318359375, 0.71337890625, 1.01324462890625, 1.3131103515625, 1.61297607421875, 1.912841796875, 2.21270751953125, 2.5125732421875, 2.81243896484375, 3.1123046875, 3.41217041015625, 3.7120361328125, 4.01190185546875, 4.311767578125, 4.61163330078125, 4.9114990234375, 5.21136474609375, 5.51123046875, 5.81109619140625, 6.1109619140625, 6.41082763671875, 6.710693359375, 7.01055908203125, 7.3104248046875, 7.61029052734375, 7.91015625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 12.0, 10.0, 16.0, 25.0, 22.0, 41.0, 57.0, 98.0, 284.0, 1011.0, 7152.0, 221403.0, 3916352.0, 43917.0, 2894.0, 516.0, 164.0, 96.0, 56.0, 42.0, 27.0, 24.0, 20.0, 11.0, 14.0, 3.0, 6.0, 3.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.46875, -35.98828125, -34.5078125, -33.02734375, -31.546875, -30.06640625, -28.5859375, -27.10546875, -25.625, -24.14453125, -22.6640625, -21.18359375, -19.703125, -18.22265625, -16.7421875, -15.26171875, -13.78125, -12.30078125, -10.8203125, -9.33984375, -7.859375, -6.37890625, -4.8984375, -3.41796875, -1.9375, -0.45703125, 1.0234375, 2.50390625, 3.984375, 5.46484375, 6.9453125, 8.42578125, 9.90625, 11.38671875, 12.8671875, 14.34765625, 15.828125, 17.30859375, 18.7890625, 20.26953125, 21.75, 23.23046875, 24.7109375, 26.19140625, 27.671875, 29.15234375, 30.6328125, 32.11328125, 33.59375, 35.07421875, 36.5546875, 38.03515625, 39.515625, 40.99609375, 42.4765625, 43.95703125, 45.4375, 46.91796875, 48.3984375, 49.87890625, 51.359375, 52.83984375, 54.3203125, 55.80078125, 57.28125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 9.0, 25.0, 111.0, 258.0, 328.0, 197.0, 63.0, 16.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.01484680175781, -89.48133850097656, -85.94783782958984, -82.4143295288086, -78.88082885742188, -75.34732055664062, -71.81381225585938, -68.28031158447266, -64.74681091308594, -61.21330642700195, -57.67980194091797, -54.14629364013672, -50.61279296875, -47.07928466796875, -43.545780181884766, -40.01227569580078, -36.47876739501953, -32.94526290893555, -29.411758422851562, -25.878252029418945, -22.34474754333496, -18.811243057250977, -15.27773666381836, -11.744232177734375, -8.21072769165039, -4.677222728729248, -1.1437177658081055, 2.3897876739501953, 5.92329216003418, 9.456796646118164, 12.990303039550781, 16.523807525634766, 20.05731201171875, 23.590816497802734, 27.12432098388672, 30.657827377319336, 34.19132995605469, 37.72483825683594, 41.25834274291992, 44.791847229003906, 48.32535171508789, 51.858856201171875, 55.39236068725586, 58.925865173339844, 62.459373474121094, 65.99287414550781, 69.52638244628906, 73.05989074707031, 76.59339141845703, 80.12689971923828, 83.660400390625, 87.19390869140625, 90.72740936279297, 94.26091766357422, 97.79441833496094, 101.32792663574219, 104.86143493652344, 108.39494323730469, 111.9284439086914, 115.46195220947266, 118.99545288085938, 122.52896118164062, 126.06246948242188, 129.59597778320312, 133.1294708251953]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 4.0, 5.0, 5.0, 12.0, 16.0, 18.0, 12.0, 22.0, 11.0, 37.0, 39.0, 30.0, 46.0, 51.0, 45.0, 51.0, 55.0, 50.0, 50.0, 46.0, 48.0, 41.0, 46.0, 44.0, 25.0, 37.0, 31.0, 23.0, 17.0, 17.0, 10.0, 13.0, 11.0, 7.0, 5.0, 2.0, 2.0, 8.0, 3.0, 1.0, 3.0, 3.0, 3.0], "bins": [-45.58680725097656, -44.40829849243164, -43.22978973388672, -42.0512809753418, -40.872772216796875, -39.69426727294922, -38.5157585144043, -37.337249755859375, -36.15874099731445, -34.98023223876953, -33.80172348022461, -32.62321472167969, -31.4447078704834, -30.266199111938477, -29.087692260742188, -27.909183502197266, -26.730674743652344, -25.552165985107422, -24.3736572265625, -23.19515037536621, -22.01664161682129, -20.838132858276367, -19.659626007080078, -18.481117248535156, -17.302608489990234, -16.124099731445312, -14.945591926574707, -13.767084121704102, -12.58857536315918, -11.410066604614258, -10.231558799743652, -9.053050994873047, -7.874546051025391, -6.696037769317627, -5.517529487609863, -4.3390212059021, -3.160512924194336, -1.9820046424865723, -0.8034963607788086, 0.3750114440917969, 1.5535202026367188, 2.7320284843444824, 3.910536766052246, 5.08904504776001, 6.267553329467773, 7.446061611175537, 8.6245698928833, 9.803077697753906, 10.981586456298828, 12.16009521484375, 13.338603019714355, 14.517110824584961, 15.695619583129883, 16.874128341674805, 18.052635192871094, 19.231143951416016, 20.409652709960938, 21.58816146850586, 22.76667022705078, 23.94517707824707, 25.123685836791992, 26.302194595336914, 27.480701446533203, 28.659210205078125, 29.837718963623047]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 3.0, 2.0, 6.0, 7.0, 5.0, 15.0, 17.0, 17.0, 17.0, 25.0, 25.0, 27.0, 34.0, 24.0, 37.0, 45.0, 37.0, 42.0, 62.0, 48.0, 36.0, 30.0, 44.0, 46.0, 38.0, 38.0, 34.0, 33.0, 25.0, 27.0, 30.0, 17.0, 24.0, 15.0, 8.0, 16.0, 9.0, 9.0, 7.0, 2.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3515625, -7.1251220703125, -6.898681640625, -6.6722412109375, -6.44580078125, -6.2193603515625, -5.992919921875, -5.7664794921875, -5.5400390625, -5.3135986328125, -5.087158203125, -4.8607177734375, -4.63427734375, -4.4078369140625, -4.181396484375, -3.9549560546875, -3.728515625, -3.5020751953125, -3.275634765625, -3.0491943359375, -2.82275390625, -2.5963134765625, -2.369873046875, -2.1434326171875, -1.9169921875, -1.6905517578125, -1.464111328125, -1.2376708984375, -1.01123046875, -0.7847900390625, -0.558349609375, -0.3319091796875, -0.10546875, 0.1209716796875, 0.347412109375, 0.5738525390625, 0.80029296875, 1.0267333984375, 1.253173828125, 1.4796142578125, 1.7060546875, 1.9324951171875, 2.158935546875, 2.3853759765625, 2.61181640625, 2.8382568359375, 3.064697265625, 3.2911376953125, 3.517578125, 3.7440185546875, 3.970458984375, 4.1968994140625, 4.42333984375, 4.6497802734375, 4.876220703125, 5.1026611328125, 5.3291015625, 5.5555419921875, 5.781982421875, 6.0084228515625, 6.23486328125, 6.4613037109375, 6.687744140625, 6.9141845703125, 7.140625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 8.0, 16.0, 12.0, 20.0, 45.0, 71.0, 103.0, 167.0, 267.0, 413.0, 742.0, 1181.0, 1842.0, 3172.0, 5289.0, 9030.0, 15720.0, 27608.0, 52424.0, 108969.0, 247205.0, 303896.0, 131809.0, 62713.0, 32477.0, 18010.0, 10241.0, 5990.0, 3566.0, 2148.0, 1335.0, 778.0, 489.0, 298.0, 166.0, 110.0, 70.0, 54.0, 34.0, 18.0, 17.0, 12.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368896484375, -0.3570442199707031, -0.34519195556640625, -0.3333396911621094, -0.3214874267578125, -0.3096351623535156, -0.29778289794921875, -0.2859306335449219, -0.274078369140625, -0.2622261047363281, -0.25037384033203125, -0.23852157592773438, -0.2266693115234375, -0.21481704711914062, -0.20296478271484375, -0.19111251831054688, -0.17926025390625, -0.16740798950195312, -0.15555572509765625, -0.14370346069335938, -0.1318511962890625, -0.11999893188476562, -0.10814666748046875, -0.09629440307617188, -0.084442138671875, -0.07258987426757812, -0.06073760986328125, -0.048885345458984375, -0.0370330810546875, -0.025180816650390625, -0.01332855224609375, -0.001476287841796875, 0.0103759765625, 0.022228240966796875, 0.03408050537109375, 0.045932769775390625, 0.0577850341796875, 0.06963729858398438, 0.08148956298828125, 0.09334182739257812, 0.105194091796875, 0.11704635620117188, 0.12889862060546875, 0.14075088500976562, 0.1526031494140625, 0.16445541381835938, 0.17630767822265625, 0.18815994262695312, 0.20001220703125, 0.21186447143554688, 0.22371673583984375, 0.23556900024414062, 0.2474212646484375, 0.2592735290527344, 0.27112579345703125, 0.2829780578613281, 0.294830322265625, 0.3066825866699219, 0.31853485107421875, 0.3303871154785156, 0.3422393798828125, 0.3540916442871094, 0.36594390869140625, 0.3777961730957031, 0.3896484375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 9.0, 7.0, 11.0, 12.0, 18.0, 12.0, 19.0, 16.0, 30.0, 25.0, 25.0, 38.0, 29.0, 33.0, 46.0, 32.0, 37.0, 53.0, 1059.0, 35.0, 40.0, 38.0, 40.0, 39.0, 35.0, 29.0, 19.0, 26.0, 24.0, 20.0, 26.0, 18.0, 19.0, 15.0, 13.0, 13.0, 15.0, 10.0, 7.0, 7.0, 1.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.150390625, -4.01953125, -3.888671875, -3.7578125, -3.626953125, -3.49609375, -3.365234375, -3.234375, -3.103515625, -2.97265625, -2.841796875, -2.7109375, -2.580078125, -2.44921875, -2.318359375, -2.1875, -2.056640625, -1.92578125, -1.794921875, -1.6640625, -1.533203125, -1.40234375, -1.271484375, -1.140625, -1.009765625, -0.87890625, -0.748046875, -0.6171875, -0.486328125, -0.35546875, -0.224609375, -0.09375, 0.037109375, 0.16796875, 0.298828125, 0.4296875, 0.560546875, 0.69140625, 0.822265625, 0.953125, 1.083984375, 1.21484375, 1.345703125, 1.4765625, 1.607421875, 1.73828125, 1.869140625, 2.0, 2.130859375, 2.26171875, 2.392578125, 2.5234375, 2.654296875, 2.78515625, 2.916015625, 3.046875, 3.177734375, 3.30859375, 3.439453125, 3.5703125, 3.701171875, 3.83203125, 3.962890625, 4.09375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 10.0, 15.0, 18.0, 30.0, 36.0, 55.0, 83.0, 116.0, 168.0, 237.0, 338.0, 480.0, 692.0, 997.0, 1491.0, 2174.0, 3024.0, 4617.0, 7161.0, 10724.0, 16889.0, 26563.0, 43106.0, 70313.0, 121128.0, 1269629.0, 217216.0, 117080.0, 67680.0, 41148.0, 25819.0, 16144.0, 10572.0, 6864.0, 4661.0, 3089.0, 2069.0, 1451.0, 975.0, 728.0, 469.0, 326.0, 223.0, 163.0, 106.0, 90.0, 52.0, 36.0, 19.0, 21.0, 11.0, 12.0, 7.0, 6.0, 4.0, 4.0, 3.0], "bins": [-0.2186279296875, -0.21199607849121094, -0.20536422729492188, -0.1987323760986328, -0.19210052490234375, -0.1854686737060547, -0.17883682250976562, -0.17220497131347656, -0.1655731201171875, -0.15894126892089844, -0.15230941772460938, -0.1456775665283203, -0.13904571533203125, -0.1324138641357422, -0.12578201293945312, -0.11915016174316406, -0.112518310546875, -0.10588645935058594, -0.09925460815429688, -0.09262275695800781, -0.08599090576171875, -0.07935905456542969, -0.07272720336914062, -0.06609535217285156, -0.0594635009765625, -0.05283164978027344, -0.046199798583984375, -0.03956794738769531, -0.03293609619140625, -0.026304244995117188, -0.019672393798828125, -0.013040542602539062, -0.00640869140625, 0.0002231597900390625, 0.006855010986328125, 0.013486862182617188, 0.02011871337890625, 0.026750564575195312, 0.033382415771484375, 0.04001426696777344, 0.0466461181640625, 0.05327796936035156, 0.059909820556640625, 0.06654167175292969, 0.07317352294921875, 0.07980537414550781, 0.08643722534179688, 0.09306907653808594, 0.099700927734375, 0.10633277893066406, 0.11296463012695312, 0.11959648132324219, 0.12622833251953125, 0.1328601837158203, 0.13949203491210938, 0.14612388610839844, 0.1527557373046875, 0.15938758850097656, 0.16601943969726562, 0.1726512908935547, 0.17928314208984375, 0.1859149932861328, 0.19254684448242188, 0.19917869567871094, 0.205810546875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 8.0, 15.0, 19.0, 39.0, 56.0, 91.0, 115.0, 156.0, 140.0, 112.0, 79.0, 56.0, 33.0, 19.0, 12.0, 11.0, 2.0, 7.0, 4.0, 2.0, 1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036978721618652344, -0.0003594718873500824, -0.00034915655851364136, -0.0003388412296772003, -0.0003285259008407593, -0.00031821057200431824, -0.0003078952431678772, -0.00029757991433143616, -0.0002872645854949951, -0.0002769492566585541, -0.00026663392782211304, -0.000256318598985672, -0.00024600327014923096, -0.00023568794131278992, -0.00022537261247634888, -0.00021505728363990784, -0.0002047419548034668, -0.00019442662596702576, -0.00018411129713058472, -0.00017379596829414368, -0.00016348063945770264, -0.0001531653106212616, -0.00014284998178482056, -0.00013253465294837952, -0.00012221932411193848, -0.00011190399527549744, -0.0001015886664390564, -9.127333760261536e-05, -8.095800876617432e-05, -7.064267992973328e-05, -6.0327351093292236e-05, -5.0012022256851196e-05, -3.9696693420410156e-05, -2.9381364583969116e-05, -1.9066035747528076e-05, -8.750706911087036e-06, 1.564621925354004e-06, 1.1879950761795044e-05, 2.2195279598236084e-05, 3.2510608434677124e-05, 4.2825937271118164e-05, 5.3141266107559204e-05, 6.345659494400024e-05, 7.377192378044128e-05, 8.408725261688232e-05, 9.440258145332336e-05, 0.0001047179102897644, 0.00011503323912620544, 0.00012534856796264648, 0.00013566389679908752, 0.00014597922563552856, 0.0001562945544719696, 0.00016660988330841064, 0.00017692521214485168, 0.00018724054098129272, 0.00019755586981773376, 0.0002078711986541748, 0.00021818652749061584, 0.00022850185632705688, 0.00023881718516349792, 0.00024913251399993896, 0.00025944784283638, 0.00026976317167282104, 0.0002800785005092621, 0.0002903938293457031]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 2.0, 4.0, 4.0, 1.0, 2.0, 9.0, 2.0, 4.0, 10.0, 16.0, 14.0, 30.0, 31.0, 59.0, 86.0, 167.0, 371.0, 949.0, 120268.0, 924132.0, 1533.0, 401.0, 182.0, 96.0, 60.0, 30.0, 22.0, 15.0, 10.0, 6.0, 9.0, 6.0, 3.0, 11.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005306243896484375, -0.005117475986480713, -0.004928708076477051, -0.004739940166473389, -0.0045511722564697266, -0.0043624043464660645, -0.004173636436462402, -0.00398486852645874, -0.003796100616455078, -0.003607332706451416, -0.003418564796447754, -0.003229796886444092, -0.0030410289764404297, -0.0028522610664367676, -0.0026634931564331055, -0.0024747252464294434, -0.0022859573364257812, -0.002097189426422119, -0.001908421516418457, -0.001719653606414795, -0.0015308856964111328, -0.0013421177864074707, -0.0011533498764038086, -0.0009645819664001465, -0.0007758140563964844, -0.0005870461463928223, -0.00039827823638916016, -0.00020951032638549805, -2.0742416381835938e-05, 0.00016802549362182617, 0.0003567934036254883, 0.0005455613136291504, 0.0007343292236328125, 0.0009230971336364746, 0.0011118650436401367, 0.0013006329536437988, 0.001489400863647461, 0.001678168773651123, 0.0018669366836547852, 0.0020557045936584473, 0.0022444725036621094, 0.0024332404136657715, 0.0026220083236694336, 0.0028107762336730957, 0.002999544143676758, 0.00318831205368042, 0.003377079963684082, 0.003565847873687744, 0.0037546157836914062, 0.003943383693695068, 0.0041321516036987305, 0.004320919513702393, 0.004509687423706055, 0.004698455333709717, 0.004887223243713379, 0.005075991153717041, 0.005264759063720703, 0.005453526973724365, 0.005642294883728027, 0.0058310627937316895, 0.0060198307037353516, 0.006208598613739014, 0.006397366523742676, 0.006586134433746338, 0.00677490234375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 9.0, 18.0, 22.0, 33.0, 54.0, 76.0, 113.0, 128.0, 144.0, 112.0, 93.0, 70.0, 49.0, 26.0, 17.0, 13.0, 11.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00020413870515767485, -0.0001996419596252963, -0.00019514521409291774, -0.00019064845400862396, -0.0001861517084762454, -0.00018165496294386685, -0.0001771582174114883, -0.00017266147187910974, -0.00016816472634673119, -0.00016366798081435263, -0.00015917123528197408, -0.0001546744751976803, -0.00015017772966530174, -0.00014568098413292319, -0.00014118423860054463, -0.00013668749306816608, -0.0001321907329838723, -0.00012769398745149374, -0.00012319724191911519, -0.00011870048911077902, -0.00011420373630244285, -0.0001097069907700643, -0.00010521024523768574, -0.00010071349970530719, -9.621674689697102e-05, -9.172000136459246e-05, -8.72232485562563e-05, -8.272650302387774e-05, -7.822975749149919e-05, -7.373300468316302e-05, -6.923625915078446e-05, -6.47395063424483e-05, -6.024277536198497e-05, -5.574602619162761e-05, -5.1249277021270245e-05, -4.675253148889169e-05, -4.225578231853433e-05, -3.775903314817697e-05, -3.3262287615798414e-05, -2.8765538445441052e-05, -2.426878927508369e-05, -1.977204010472633e-05, -1.527529275335837e-05, -1.0778544492495712e-05, -6.281796231633052e-06, -1.7850470612756908e-06, 2.711700290092267e-06, 7.208447641460225e-06, 1.1705196811817586e-05, 1.6201945982174948e-05, 2.0698693333542906e-05, 2.5195440684910864e-05, 2.9692189855268225e-05, 3.4188939025625587e-05, 3.868568455800414e-05, 4.31824337283615e-05, 4.7679182898718864e-05, 5.2175932069076225e-05, 5.6672681239433587e-05, 6.116942677181214e-05, 6.56661723041907e-05, 7.016292511252686e-05, 7.465967064490542e-05, 7.915642345324159e-05, 8.365316898562014e-05]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 3.0, 6.0, 9.0, 9.0, 9.0, 14.0, 15.0, 12.0, 10.0, 22.0, 22.0, 32.0, 31.0, 30.0, 31.0, 30.0, 39.0, 40.0, 35.0, 32.0, 29.0, 37.0, 34.0, 33.0, 44.0, 39.0, 35.0, 33.0, 32.0, 29.0, 31.0, 27.0, 27.0, 20.0, 17.0, 16.0, 17.0, 8.0, 12.0, 9.0, 8.0, 12.0, 7.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.161233901977539e-05, -8.865073323249817e-05, -8.568912744522095e-05, -8.272752165794373e-05, -7.97659158706665e-05, -7.680431008338928e-05, -7.384270429611206e-05, -7.088109850883484e-05, -6.791949272155762e-05, -6.49578869342804e-05, -6.199628114700317e-05, -5.903467535972595e-05, -5.607306957244873e-05, -5.311146378517151e-05, -5.014985799789429e-05, -4.7188252210617065e-05, -4.4226646423339844e-05, -4.126504063606262e-05, -3.83034348487854e-05, -3.534182906150818e-05, -3.238022327423096e-05, -2.9418617486953735e-05, -2.6457011699676514e-05, -2.3495405912399292e-05, -2.053380012512207e-05, -1.757219433784485e-05, -1.4610588550567627e-05, -1.1648982763290405e-05, -8.687376976013184e-06, -5.725771188735962e-06, -2.7641654014587402e-06, 1.9744038581848145e-07, 3.159046173095703e-06, 6.120651960372925e-06, 9.082257747650146e-06, 1.2043863534927368e-05, 1.500546932220459e-05, 1.796707510948181e-05, 2.0928680896759033e-05, 2.3890286684036255e-05, 2.6851892471313477e-05, 2.9813498258590698e-05, 3.277510404586792e-05, 3.573670983314514e-05, 3.869831562042236e-05, 4.1659921407699585e-05, 4.462152719497681e-05, 4.758313298225403e-05, 5.054473876953125e-05, 5.350634455680847e-05, 5.646795034408569e-05, 5.9429556131362915e-05, 6.239116191864014e-05, 6.535276770591736e-05, 6.831437349319458e-05, 7.12759792804718e-05, 7.423758506774902e-05, 7.719919085502625e-05, 8.016079664230347e-05, 8.312240242958069e-05, 8.608400821685791e-05, 8.904561400413513e-05, 9.200721979141235e-05, 9.496882557868958e-05, 9.79304313659668e-05]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 6.0, 3.0, 2.0, 6.0, 7.0, 5.0, 15.0, 17.0, 17.0, 17.0, 25.0, 25.0, 27.0, 34.0, 24.0, 37.0, 45.0, 37.0, 42.0, 62.0, 48.0, 36.0, 30.0, 44.0, 46.0, 38.0, 38.0, 34.0, 33.0, 25.0, 27.0, 30.0, 17.0, 24.0, 15.0, 8.0, 16.0, 9.0, 9.0, 7.0, 2.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3515625, -7.1251220703125, -6.898681640625, -6.6722412109375, -6.44580078125, -6.2193603515625, -5.992919921875, -5.7664794921875, -5.5400390625, -5.3135986328125, -5.087158203125, -4.8607177734375, -4.63427734375, -4.4078369140625, -4.181396484375, -3.9549560546875, -3.728515625, -3.5020751953125, -3.275634765625, -3.0491943359375, -2.82275390625, -2.5963134765625, -2.369873046875, -2.1434326171875, -1.9169921875, -1.6905517578125, -1.464111328125, -1.2376708984375, -1.01123046875, -0.7847900390625, -0.558349609375, -0.3319091796875, -0.10546875, 0.1209716796875, 0.347412109375, 0.5738525390625, 0.80029296875, 1.0267333984375, 1.253173828125, 1.4796142578125, 1.7060546875, 1.9324951171875, 2.158935546875, 2.3853759765625, 2.61181640625, 2.8382568359375, 3.064697265625, 3.2911376953125, 3.517578125, 3.7440185546875, 3.970458984375, 4.1968994140625, 4.42333984375, 4.6497802734375, 4.876220703125, 5.1026611328125, 5.3291015625, 5.5555419921875, 5.781982421875, 6.0084228515625, 6.23486328125, 6.4613037109375, 6.687744140625, 6.9141845703125, 7.140625]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 5.0, 4.0, 9.0, 12.0, 15.0, 24.0, 17.0, 39.0, 41.0, 81.0, 114.0, 152.0, 209.0, 293.0, 400.0, 632.0, 881.0, 1436.0, 3082.0, 9379.0, 45160.0, 280564.0, 552357.0, 121644.0, 20951.0, 5372.0, 2087.0, 1135.0, 765.0, 508.0, 340.0, 230.0, 156.0, 140.0, 94.0, 59.0, 50.0, 34.0, 17.0, 21.0, 17.0, 6.0, 10.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.9453125, -14.482177734375, -14.01904296875, -13.555908203125, -13.0927734375, -12.629638671875, -12.16650390625, -11.703369140625, -11.240234375, -10.777099609375, -10.31396484375, -9.850830078125, -9.3876953125, -8.924560546875, -8.46142578125, -7.998291015625, -7.53515625, -7.072021484375, -6.60888671875, -6.145751953125, -5.6826171875, -5.219482421875, -4.75634765625, -4.293212890625, -3.830078125, -3.366943359375, -2.90380859375, -2.440673828125, -1.9775390625, -1.514404296875, -1.05126953125, -0.588134765625, -0.125, 0.338134765625, 0.80126953125, 1.264404296875, 1.7275390625, 2.190673828125, 2.65380859375, 3.116943359375, 3.580078125, 4.043212890625, 4.50634765625, 4.969482421875, 5.4326171875, 5.895751953125, 6.35888671875, 6.822021484375, 7.28515625, 7.748291015625, 8.21142578125, 8.674560546875, 9.1376953125, 9.600830078125, 10.06396484375, 10.527099609375, 10.990234375, 11.453369140625, 11.91650390625, 12.379638671875, 12.8427734375, 13.305908203125, 13.76904296875, 14.232177734375, 14.6953125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 4.0, 0.0, 7.0, 5.0, 10.0, 11.0, 12.0, 7.0, 17.0, 23.0, 32.0, 25.0, 34.0, 35.0, 64.0, 54.0, 72.0, 147.0, 313.0, 1469.0, 220.0, 104.0, 64.0, 53.0, 52.0, 28.0, 34.0, 34.0, 20.0, 23.0, 13.0, 13.0, 10.0, 13.0, 7.0, 8.0, 5.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.90625, -16.348876953125, -15.79150390625, -15.234130859375, -14.6767578125, -14.119384765625, -13.56201171875, -13.004638671875, -12.447265625, -11.889892578125, -11.33251953125, -10.775146484375, -10.2177734375, -9.660400390625, -9.10302734375, -8.545654296875, -7.98828125, -7.430908203125, -6.87353515625, -6.316162109375, -5.7587890625, -5.201416015625, -4.64404296875, -4.086669921875, -3.529296875, -2.971923828125, -2.41455078125, -1.857177734375, -1.2998046875, -0.742431640625, -0.18505859375, 0.372314453125, 0.9296875, 1.487060546875, 2.04443359375, 2.601806640625, 3.1591796875, 3.716552734375, 4.27392578125, 4.831298828125, 5.388671875, 5.946044921875, 6.50341796875, 7.060791015625, 7.6181640625, 8.175537109375, 8.73291015625, 9.290283203125, 9.84765625, 10.405029296875, 10.96240234375, 11.519775390625, 12.0771484375, 12.634521484375, 13.19189453125, 13.749267578125, 14.306640625, 14.864013671875, 15.42138671875, 15.978759765625, 16.5361328125, 17.093505859375, 17.65087890625, 18.208251953125, 18.765625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 1.0, 4.0, 7.0, 8.0, 20.0, 15.0, 15.0, 20.0, 41.0, 47.0, 77.0, 120.0, 203.0, 368.0, 687.0, 1953.0, 2818998.0, 319889.0, 1678.0, 681.0, 362.0, 191.0, 90.0, 72.0, 41.0, 29.0, 18.0, 14.0, 15.0, 7.0, 10.0, 11.0, 1.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-82.3125, -79.8125, -77.3125, -74.8125, -72.3125, -69.8125, -67.3125, -64.8125, -62.3125, -59.8125, -57.3125, -54.8125, -52.3125, -49.8125, -47.3125, -44.8125, -42.3125, -39.8125, -37.3125, -34.8125, -32.3125, -29.8125, -27.3125, -24.8125, -22.3125, -19.8125, -17.3125, -14.8125, -12.3125, -9.8125, -7.3125, -4.8125, -2.3125, 0.1875, 2.6875, 5.1875, 7.6875, 10.1875, 12.6875, 15.1875, 17.6875, 20.1875, 22.6875, 25.1875, 27.6875, 30.1875, 32.6875, 35.1875, 37.6875, 40.1875, 42.6875, 45.1875, 47.6875, 50.1875, 52.6875, 55.1875, 57.6875, 60.1875, 62.6875, 65.1875, 67.6875, 70.1875, 72.6875, 75.1875, 77.6875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 177.0, 634.0, 186.0, 10.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.6464385986328, -137.5465850830078, -131.44671630859375, -125.34686279296875, -119.24700164794922, -113.14714050292969, -107.04728698730469, -100.94742584228516, -94.84756469726562, -88.7477035522461, -82.64784240722656, -76.54798889160156, -70.44812774658203, -64.3482666015625, -58.248409271240234, -52.14855194091797, -46.04869079589844, -39.948829650878906, -33.84897232055664, -27.749113082885742, -21.649253845214844, -15.549394607543945, -9.449535369873047, -3.3496780395507812, 2.75018310546875, 8.850042343139648, 14.949901580810547, 21.049760818481445, 27.149620056152344, 33.249481201171875, 39.34933853149414, 45.449195861816406, 51.54905700683594, 57.64891815185547, 63.748775482177734, 69.8486328125, 75.94849395751953, 82.04835510253906, 88.14820861816406, 94.2480697631836, 100.34793090820312, 106.44779205322266, 112.54765319824219, 118.64750671386719, 124.74736785888672, 130.84722900390625, 136.94708251953125, 143.04693603515625, 149.1468048095703, 155.2466583251953, 161.34652709960938, 167.44638061523438, 173.54623413085938, 179.64610290527344, 185.74595642089844, 191.8458251953125, 197.9456787109375, 204.0455322265625, 210.14540100097656, 216.24525451660156, 222.34512329101562, 228.44497680664062, 234.54483032226562, 240.64468383789062, 246.7445526123047]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 5.0, 6.0, 11.0, 9.0, 6.0, 6.0, 10.0, 9.0, 9.0, 17.0, 19.0, 19.0, 25.0, 26.0, 26.0, 36.0, 34.0, 36.0, 33.0, 32.0, 47.0, 41.0, 44.0, 47.0, 45.0, 49.0, 39.0, 36.0, 26.0, 31.0, 24.0, 35.0, 20.0, 23.0, 19.0, 12.0, 13.0, 19.0, 9.0, 10.0, 6.0, 1.0, 10.0, 5.0, 6.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-47.49513244628906, -46.16862869262695, -44.842124938964844, -43.515625, -42.18912124633789, -40.86261749267578, -39.53611373901367, -38.20960998535156, -36.88310623168945, -35.556602478027344, -34.230098724365234, -32.903594970703125, -31.57709312438965, -30.250591278076172, -28.924087524414062, -27.597583770751953, -26.271081924438477, -24.944578170776367, -23.61807632446289, -22.29157257080078, -20.965068817138672, -19.638565063476562, -18.312063217163086, -16.985559463500977, -15.659056663513184, -14.33255386352539, -13.006050109863281, -11.679547309875488, -10.353044509887695, -9.026540756225586, -7.700037956237793, -6.373534202575684, -5.047031402587891, -3.7205281257629395, -2.3940250873565674, -1.0675220489501953, 0.25898122787475586, 1.585484504699707, 2.9119873046875, 4.238491058349609, 5.564993858337402, 6.8914971351623535, 8.218000411987305, 9.544503211975098, 10.87100601196289, 12.197509765625, 13.524012565612793, 14.850516319274902, 16.177019119262695, 17.503522872924805, 18.83002471923828, 20.15652847290039, 21.4830322265625, 22.80953598022461, 24.136037826538086, 25.462541580200195, 26.789043426513672, 28.11554718017578, 29.442049026489258, 30.768552780151367, 32.095054626464844, 33.42155838012695, 34.74806213378906, 36.07456588745117, 37.40106964111328]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 9.0, 6.0, 10.0, 9.0, 14.0, 12.0, 12.0, 21.0, 23.0, 35.0, 25.0, 33.0, 28.0, 26.0, 37.0, 39.0, 34.0, 56.0, 34.0, 42.0, 40.0, 40.0, 43.0, 39.0, 38.0, 35.0, 29.0, 34.0, 37.0, 15.0, 23.0, 24.0, 18.0, 10.0, 16.0, 6.0, 5.0, 6.0, 7.0, 8.0, 4.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5234375, -6.30291748046875, -6.0823974609375, -5.86187744140625, -5.641357421875, -5.42083740234375, -5.2003173828125, -4.97979736328125, -4.75927734375, -4.53875732421875, -4.3182373046875, -4.09771728515625, -3.877197265625, -3.65667724609375, -3.4361572265625, -3.21563720703125, -2.9951171875, -2.77459716796875, -2.5540771484375, -2.33355712890625, -2.113037109375, -1.89251708984375, -1.6719970703125, -1.45147705078125, -1.23095703125, -1.01043701171875, -0.7899169921875, -0.56939697265625, -0.348876953125, -0.12835693359375, 0.0921630859375, 0.31268310546875, 0.533203125, 0.75372314453125, 0.9742431640625, 1.19476318359375, 1.415283203125, 1.63580322265625, 1.8563232421875, 2.07684326171875, 2.29736328125, 2.51788330078125, 2.7384033203125, 2.95892333984375, 3.179443359375, 3.39996337890625, 3.6204833984375, 3.84100341796875, 4.0615234375, 4.28204345703125, 4.5025634765625, 4.72308349609375, 4.943603515625, 5.16412353515625, 5.3846435546875, 5.60516357421875, 5.82568359375, 6.04620361328125, 6.2667236328125, 6.48724365234375, 6.707763671875, 6.92828369140625, 7.1488037109375, 7.36932373046875, 7.58984375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 5.0, 7.0, 11.0, 11.0, 18.0, 26.0, 30.0, 76.0, 68.0, 138.0, 148.0, 197.0, 309.0, 438.0, 639.0, 1006.0, 1665.0, 3426.0, 8617.0, 29884.0, 195266.0, 1706759.0, 1959980.0, 233557.0, 33713.0, 9515.0, 3662.0, 1873.0, 1081.0, 669.0, 410.0, 313.0, 243.0, 160.0, 96.0, 81.0, 57.0, 42.0, 27.0, 19.0, 14.0, 7.0, 8.0, 1.0, 7.0, 5.0, 2.0], "bins": [-18.453125, -17.98046875, -17.5078125, -17.03515625, -16.5625, -16.08984375, -15.6171875, -15.14453125, -14.671875, -14.19921875, -13.7265625, -13.25390625, -12.78125, -12.30859375, -11.8359375, -11.36328125, -10.890625, -10.41796875, -9.9453125, -9.47265625, -9.0, -8.52734375, -8.0546875, -7.58203125, -7.109375, -6.63671875, -6.1640625, -5.69140625, -5.21875, -4.74609375, -4.2734375, -3.80078125, -3.328125, -2.85546875, -2.3828125, -1.91015625, -1.4375, -0.96484375, -0.4921875, -0.01953125, 0.453125, 0.92578125, 1.3984375, 1.87109375, 2.34375, 2.81640625, 3.2890625, 3.76171875, 4.234375, 4.70703125, 5.1796875, 5.65234375, 6.125, 6.59765625, 7.0703125, 7.54296875, 8.015625, 8.48828125, 8.9609375, 9.43359375, 9.90625, 10.37890625, 10.8515625, 11.32421875, 11.796875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 15.0, 11.0, 25.0, 31.0, 50.0, 69.0, 79.0, 133.0, 205.0, 347.0, 636.0, 836.0, 601.0, 338.0, 220.0, 150.0, 107.0, 73.0, 54.0, 27.0, 28.0, 17.0, 10.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8359375, -9.2735595703125, -8.711181640625, -8.1488037109375, -7.58642578125, -7.0240478515625, -6.461669921875, -5.8992919921875, -5.3369140625, -4.7745361328125, -4.212158203125, -3.6497802734375, -3.08740234375, -2.5250244140625, -1.962646484375, -1.4002685546875, -0.837890625, -0.2755126953125, 0.286865234375, 0.8492431640625, 1.41162109375, 1.9739990234375, 2.536376953125, 3.0987548828125, 3.6611328125, 4.2235107421875, 4.785888671875, 5.3482666015625, 5.91064453125, 6.4730224609375, 7.035400390625, 7.5977783203125, 8.16015625, 8.7225341796875, 9.284912109375, 9.8472900390625, 10.40966796875, 10.9720458984375, 11.534423828125, 12.0968017578125, 12.6591796875, 13.2215576171875, 13.783935546875, 14.3463134765625, 14.90869140625, 15.4710693359375, 16.033447265625, 16.5958251953125, 17.158203125, 17.7205810546875, 18.282958984375, 18.8453369140625, 19.40771484375, 19.9700927734375, 20.532470703125, 21.0948486328125, 21.6572265625, 22.2196044921875, 22.781982421875, 23.3443603515625, 23.90673828125, 24.4691162109375, 25.031494140625, 25.5938720703125, 26.15625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 9.0, 9.0, 16.0, 17.0, 24.0, 23.0, 47.0, 95.0, 114.0, 231.0, 523.0, 1222.0, 4202.0, 25103.0, 384727.0, 3580564.0, 176849.0, 15691.0, 2938.0, 948.0, 406.0, 202.0, 107.0, 78.0, 46.0, 30.0, 14.0, 11.0, 9.0, 11.0, 7.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.203125, -28.241943359375, -27.28076171875, -26.319580078125, -25.3583984375, -24.397216796875, -23.43603515625, -22.474853515625, -21.513671875, -20.552490234375, -19.59130859375, -18.630126953125, -17.6689453125, -16.707763671875, -15.74658203125, -14.785400390625, -13.82421875, -12.863037109375, -11.90185546875, -10.940673828125, -9.9794921875, -9.018310546875, -8.05712890625, -7.095947265625, -6.134765625, -5.173583984375, -4.21240234375, -3.251220703125, -2.2900390625, -1.328857421875, -0.36767578125, 0.593505859375, 1.5546875, 2.515869140625, 3.47705078125, 4.438232421875, 5.3994140625, 6.360595703125, 7.32177734375, 8.282958984375, 9.244140625, 10.205322265625, 11.16650390625, 12.127685546875, 13.0888671875, 14.050048828125, 15.01123046875, 15.972412109375, 16.93359375, 17.894775390625, 18.85595703125, 19.817138671875, 20.7783203125, 21.739501953125, 22.70068359375, 23.661865234375, 24.623046875, 25.584228515625, 26.54541015625, 27.506591796875, 28.4677734375, 29.428955078125, 30.39013671875, 31.351318359375, 32.3125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 56.0, 821.0, 135.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-681.2179565429688, -663.0795288085938, -644.9411010742188, -626.8026733398438, -608.6642456054688, -590.5258178710938, -572.3873901367188, -554.2490234375, -536.110595703125, -517.97216796875, -499.833740234375, -481.6953125, -463.556884765625, -445.41845703125, -427.2800598144531, -409.1416320800781, -391.003173828125, -372.86474609375, -354.726318359375, -336.587890625, -318.449462890625, -300.31103515625, -282.1726379394531, -264.0342102050781, -245.89578247070312, -227.75735473632812, -209.61892700195312, -191.4805145263672, -173.3420867919922, -155.2036590576172, -137.06524658203125, -118.92681884765625, -100.78842163085938, -82.64999389648438, -64.5115737915039, -46.37314987182617, -28.234725952148438, -10.096298217773438, 8.042121887207031, 26.1805419921875, 44.3189697265625, 62.457393646240234, 80.59581756591797, 98.73423767089844, 116.87266540527344, 135.01109313964844, 153.14950561523438, 171.28793334960938, 189.42636108398438, 207.56478881835938, 225.70321655273438, 243.8416290283203, 261.98004150390625, 280.11846923828125, 298.25689697265625, 316.39532470703125, 334.53375244140625, 352.67218017578125, 370.81060791015625, 388.94903564453125, 407.08746337890625, 425.22589111328125, 443.3642883300781, 461.5027160644531, 479.6411437988281]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 10.0, 13.0, 12.0, 16.0, 12.0, 23.0, 14.0, 23.0, 18.0, 29.0, 35.0, 35.0, 38.0, 34.0, 40.0, 44.0, 49.0, 48.0, 38.0, 46.0, 44.0, 44.0, 42.0, 42.0, 29.0, 28.0, 26.0, 30.0, 17.0, 21.0, 15.0, 14.0, 13.0, 17.0, 4.0, 8.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.875518798828125, -46.12812042236328, -44.38072204589844, -42.633323669433594, -40.88592529296875, -39.138526916503906, -37.39112854003906, -35.64373016357422, -33.896331787109375, -32.14893341064453, -30.401535034179688, -28.654136657714844, -26.90673828125, -25.159339904785156, -23.411941528320312, -21.66454315185547, -19.917144775390625, -18.16974639892578, -16.422348022460938, -14.674949645996094, -12.92755126953125, -11.180152893066406, -9.432754516601562, -7.685356140136719, -5.937957763671875, -4.190559387207031, -2.4431610107421875, -0.6957626342773438, 1.0516357421875, 2.7990341186523438, 4.5464324951171875, 6.293830871582031, 8.041229248046875, 9.788627624511719, 11.536026000976562, 13.283424377441406, 15.03082275390625, 16.778221130371094, 18.525619506835938, 20.27301788330078, 22.020416259765625, 23.76781463623047, 25.515213012695312, 27.262611389160156, 29.010009765625, 30.757408142089844, 32.50480651855469, 34.25220489501953, 35.999603271484375, 37.74700164794922, 39.49440002441406, 41.241798400878906, 42.98919677734375, 44.736595153808594, 46.48399353027344, 48.23139190673828, 49.978790283203125, 51.72618865966797, 53.47358703613281, 55.220985412597656, 56.9683837890625, 58.715782165527344, 60.46318054199219, 62.21057891845703, 63.957977294921875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 4.0, 2.0, 5.0, 2.0, 3.0, 5.0, 8.0, 14.0, 24.0, 20.0, 22.0, 28.0, 27.0, 29.0, 35.0, 35.0, 53.0, 40.0, 31.0, 59.0, 48.0, 58.0, 37.0, 40.0, 31.0, 56.0, 34.0, 51.0, 28.0, 30.0, 25.0, 19.0, 23.0, 14.0, 19.0, 5.0, 6.0, 9.0, 5.0, 1.0, 7.0, 9.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0390625, -6.8204345703125, -6.601806640625, -6.3831787109375, -6.16455078125, -5.9459228515625, -5.727294921875, -5.5086669921875, -5.2900390625, -5.0714111328125, -4.852783203125, -4.6341552734375, -4.41552734375, -4.1968994140625, -3.978271484375, -3.7596435546875, -3.541015625, -3.3223876953125, -3.103759765625, -2.8851318359375, -2.66650390625, -2.4478759765625, -2.229248046875, -2.0106201171875, -1.7919921875, -1.5733642578125, -1.354736328125, -1.1361083984375, -0.91748046875, -0.6988525390625, -0.480224609375, -0.2615966796875, -0.04296875, 0.1756591796875, 0.394287109375, 0.6129150390625, 0.83154296875, 1.0501708984375, 1.268798828125, 1.4874267578125, 1.7060546875, 1.9246826171875, 2.143310546875, 2.3619384765625, 2.58056640625, 2.7991943359375, 3.017822265625, 3.2364501953125, 3.455078125, 3.6737060546875, 3.892333984375, 4.1109619140625, 4.32958984375, 4.5482177734375, 4.766845703125, 4.9854736328125, 5.2041015625, 5.4227294921875, 5.641357421875, 5.8599853515625, 6.07861328125, 6.2972412109375, 6.515869140625, 6.7344970703125, 6.953125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 26.0, 22.0, 37.0, 69.0, 84.0, 112.0, 192.0, 238.0, 403.0, 525.0, 845.0, 1150.0, 1829.0, 2803.0, 4170.0, 6552.0, 10267.0, 16707.0, 28188.0, 48480.0, 90425.0, 185873.0, 310203.0, 153485.0, 77248.0, 42682.0, 24531.0, 14969.0, 9338.0, 5829.0, 3784.0, 2472.0, 1607.0, 1082.0, 744.0, 503.0, 341.0, 204.0, 195.0, 93.0, 83.0, 38.0, 40.0, 18.0, 15.0, 13.0, 8.0, 5.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.291748046875, -0.28273773193359375, -0.2737274169921875, -0.26471710205078125, -0.255706787109375, -0.24669647216796875, -0.2376861572265625, -0.22867584228515625, -0.21966552734375, -0.21065521240234375, -0.2016448974609375, -0.19263458251953125, -0.183624267578125, -0.17461395263671875, -0.1656036376953125, -0.15659332275390625, -0.1475830078125, -0.13857269287109375, -0.1295623779296875, -0.12055206298828125, -0.111541748046875, -0.10253143310546875, -0.0935211181640625, -0.08451080322265625, -0.07550048828125, -0.06649017333984375, -0.0574798583984375, -0.04846954345703125, -0.039459228515625, -0.03044891357421875, -0.0214385986328125, -0.01242828369140625, -0.00341796875, 0.00559234619140625, 0.0146026611328125, 0.02361297607421875, 0.032623291015625, 0.04163360595703125, 0.0506439208984375, 0.05965423583984375, 0.06866455078125, 0.07767486572265625, 0.0866851806640625, 0.09569549560546875, 0.104705810546875, 0.11371612548828125, 0.1227264404296875, 0.13173675537109375, 0.1407470703125, 0.14975738525390625, 0.1587677001953125, 0.16777801513671875, 0.176788330078125, 0.18579864501953125, 0.1948089599609375, 0.20381927490234375, 0.21282958984375, 0.22183990478515625, 0.2308502197265625, 0.23986053466796875, 0.248870849609375, 0.25788116455078125, 0.2668914794921875, 0.27590179443359375, 0.284912109375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 4.0, 8.0, 8.0, 7.0, 9.0, 21.0, 25.0, 22.0, 23.0, 20.0, 30.0, 26.0, 33.0, 32.0, 35.0, 39.0, 44.0, 43.0, 48.0, 1070.0, 37.0, 38.0, 41.0, 40.0, 35.0, 29.0, 36.0, 26.0, 30.0, 23.0, 15.0, 16.0, 17.0, 18.0, 13.0, 13.0, 3.0, 5.0, 6.0, 4.0, 9.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.4296875, -4.29766845703125, -4.1656494140625, -4.03363037109375, -3.901611328125, -3.76959228515625, -3.6375732421875, -3.50555419921875, -3.37353515625, -3.24151611328125, -3.1094970703125, -2.97747802734375, -2.845458984375, -2.71343994140625, -2.5814208984375, -2.44940185546875, -2.3173828125, -2.18536376953125, -2.0533447265625, -1.92132568359375, -1.789306640625, -1.65728759765625, -1.5252685546875, -1.39324951171875, -1.26123046875, -1.12921142578125, -0.9971923828125, -0.86517333984375, -0.733154296875, -0.60113525390625, -0.4691162109375, -0.33709716796875, -0.205078125, -0.07305908203125, 0.0589599609375, 0.19097900390625, 0.322998046875, 0.45501708984375, 0.5870361328125, 0.71905517578125, 0.85107421875, 0.98309326171875, 1.1151123046875, 1.24713134765625, 1.379150390625, 1.51116943359375, 1.6431884765625, 1.77520751953125, 1.9072265625, 2.03924560546875, 2.1712646484375, 2.30328369140625, 2.435302734375, 2.56732177734375, 2.6993408203125, 2.83135986328125, 2.96337890625, 3.09539794921875, 3.2274169921875, 3.35943603515625, 3.491455078125, 3.62347412109375, 3.7554931640625, 3.88751220703125, 4.01953125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 4.0, 3.0, 13.0, 30.0, 34.0, 59.0, 100.0, 130.0, 167.0, 231.0, 382.0, 503.0, 743.0, 988.0, 1511.0, 2276.0, 3170.0, 4605.0, 7087.0, 10905.0, 16619.0, 26677.0, 43204.0, 71334.0, 124210.0, 1281843.0, 212140.0, 112676.0, 65409.0, 39698.0, 24215.0, 15533.0, 9782.0, 6648.0, 4418.0, 2981.0, 2011.0, 1531.0, 1014.0, 672.0, 457.0, 345.0, 265.0, 167.0, 127.0, 79.0, 40.0, 38.0, 18.0, 21.0, 7.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2044677734375, -0.1980609893798828, -0.19165420532226562, -0.18524742126464844, -0.17884063720703125, -0.17243385314941406, -0.16602706909179688, -0.1596202850341797, -0.1532135009765625, -0.1468067169189453, -0.14039993286132812, -0.13399314880371094, -0.12758636474609375, -0.12117958068847656, -0.11477279663085938, -0.10836601257324219, -0.101959228515625, -0.09555244445800781, -0.08914566040039062, -0.08273887634277344, -0.07633209228515625, -0.06992530822753906, -0.06351852416992188, -0.05711174011230469, -0.0507049560546875, -0.04429817199707031, -0.037891387939453125, -0.03148460388183594, -0.02507781982421875, -0.018671035766601562, -0.012264251708984375, -0.0058574676513671875, 0.00054931640625, 0.0069561004638671875, 0.013362884521484375, 0.019769668579101562, 0.02617645263671875, 0.03258323669433594, 0.038990020751953125, 0.04539680480957031, 0.0518035888671875, 0.05821037292480469, 0.06461715698242188, 0.07102394104003906, 0.07743072509765625, 0.08383750915527344, 0.09024429321289062, 0.09665107727050781, 0.103057861328125, 0.10946464538574219, 0.11587142944335938, 0.12227821350097656, 0.12868499755859375, 0.13509178161621094, 0.14149856567382812, 0.1479053497314453, 0.1543121337890625, 0.1607189178466797, 0.16712570190429688, 0.17353248596191406, 0.17993927001953125, 0.18634605407714844, 0.19275283813476562, 0.1991596221923828, 0.20556640625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 6.0, 1.0, 6.0, 4.0, 0.0, 8.0, 6.0, 5.0, 7.0, 5.0, 11.0, 10.0, 11.0, 19.0, 14.0, 20.0, 29.0, 30.0, 47.0, 78.0, 168.0, 148.0, 94.0, 60.0, 43.0, 38.0, 28.0, 27.0, 14.0, 12.0, 9.0, 11.0, 6.0, 4.0, 4.0, 6.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.00025463104248046875, -0.0002467148005962372, -0.00023879855871200562, -0.00023088231682777405, -0.00022296607494354248, -0.0002150498330593109, -0.00020713359117507935, -0.00019921734929084778, -0.0001913011074066162, -0.00018338486552238464, -0.00017546862363815308, -0.0001675523817539215, -0.00015963613986968994, -0.00015171989798545837, -0.0001438036561012268, -0.00013588741421699524, -0.00012797117233276367, -0.0001200549304485321, -0.00011213868856430054, -0.00010422244668006897, -9.63062047958374e-05, -8.838996291160583e-05, -8.047372102737427e-05, -7.25574791431427e-05, -6.464123725891113e-05, -5.6724995374679565e-05, -4.8808753490448e-05, -4.089251160621643e-05, -3.297626972198486e-05, -2.5060027837753296e-05, -1.714378595352173e-05, -9.227544069290161e-06, -1.3113021850585938e-06, 6.604939699172974e-06, 1.4521181583404541e-05, 2.243742346763611e-05, 3.0353665351867676e-05, 3.826990723609924e-05, 4.618614912033081e-05, 5.410239100456238e-05, 6.201863288879395e-05, 6.993487477302551e-05, 7.785111665725708e-05, 8.576735854148865e-05, 9.368360042572021e-05, 0.00010159984230995178, 0.00010951608419418335, 0.00011743232607841492, 0.00012534856796264648, 0.00013326480984687805, 0.00014118105173110962, 0.0001490972936153412, 0.00015701353549957275, 0.00016492977738380432, 0.0001728460192680359, 0.00018076226115226746, 0.00018867850303649902, 0.0001965947449207306, 0.00020451098680496216, 0.00021242722868919373, 0.0002203434705734253, 0.00022825971245765686, 0.00023617595434188843, 0.00024409219622612, 0.00025200843811035156]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 10.0, 7.0, 10.0, 8.0, 16.0, 20.0, 23.0, 29.0, 29.0, 39.0, 76.0, 90.0, 171.0, 262.0, 540.0, 3356.0, 982615.0, 59155.0, 1029.0, 386.0, 174.0, 138.0, 82.0, 51.0, 49.0, 32.0, 23.0, 22.0, 18.0, 14.0, 10.0, 7.0, 7.0, 8.0, 17.0, 7.0, 5.0, 6.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00449371337890625, -0.004352271556854248, -0.004210829734802246, -0.004069387912750244, -0.003927946090698242, -0.0037865042686462402, -0.0036450624465942383, -0.0035036206245422363, -0.0033621788024902344, -0.0032207369804382324, -0.0030792951583862305, -0.0029378533363342285, -0.0027964115142822266, -0.0026549696922302246, -0.0025135278701782227, -0.0023720860481262207, -0.0022306442260742188, -0.002089202404022217, -0.0019477605819702148, -0.0018063187599182129, -0.001664876937866211, -0.001523435115814209, -0.001381993293762207, -0.001240551471710205, -0.0010991096496582031, -0.0009576678276062012, -0.0008162260055541992, -0.0006747841835021973, -0.0005333423614501953, -0.00039190053939819336, -0.0002504587173461914, -0.00010901689529418945, 3.24249267578125e-05, 0.00017386674880981445, 0.0003153085708618164, 0.00045675039291381836, 0.0005981922149658203, 0.0007396340370178223, 0.0008810758590698242, 0.0010225176811218262, 0.0011639595031738281, 0.00130540132522583, 0.001446843147277832, 0.001588284969329834, 0.001729726791381836, 0.0018711686134338379, 0.00201261043548584, 0.002154052257537842, 0.0022954940795898438, 0.0024369359016418457, 0.0025783777236938477, 0.0027198195457458496, 0.0028612613677978516, 0.0030027031898498535, 0.0031441450119018555, 0.0032855868339538574, 0.0034270286560058594, 0.0035684704780578613, 0.0037099123001098633, 0.0038513541221618652, 0.003992795944213867, 0.004134237766265869, 0.004275679588317871, 0.004417121410369873, 0.004558563232421875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 23.0, 461.0, 495.0, 31.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002590591611806303, -0.00023027369752526283, -0.00020148824842181057, -0.00017270278476644307, -0.0001439173356629908, -0.00011513187200762331, -8.634640835225582e-05, -5.7560959248803556e-05, -2.8775495593436062e-05, 9.962604963220656e-09, 2.8795420803362504e-05, 5.758088082075119e-05, 8.636633720016107e-05, 0.00011515179357957095, 0.00014393725723493844, 0.0001727227063383907, 0.0002015081699937582, 0.0002302936336491257, 0.0002590790973044932, 0.0002878645318560302, 0.0003166499955113977, 0.0003454354591667652, 0.0003742209228221327, 0.0004030063864775002, 0.00043179182102903724, 0.00046057728468440473, 0.0004893627483397722, 0.0005181481828913093, 0.0005469336756505072, 0.0005757191102020442, 0.0006045046029612422, 0.0006332900375127792, 0.0006620755302719772, 0.0006908609648235142, 0.0007196464575827122, 0.0007484318921342492, 0.0007772173848934472, 0.0008060028194449842, 0.0008347883122041821, 0.0008635737467557192, 0.0008923591813072562, 0.0009211446158587933, 0.0009499301086179912, 0.0009787156013771892, 0.0010075010359287262, 0.0010362864704802632, 0.0010650719050318003, 0.0010938573395833373, 0.0011226428905501962, 0.0011514283251017332, 0.0011802137596532702, 0.0012089993106201291, 0.0012377847451716661, 0.0012665701797232032, 0.0012953556142747402, 0.0013241410488262773, 0.0013529264833778143, 0.0013817119179293513, 0.0014104973524808884, 0.0014392829034477472, 0.0014680683379992843, 0.0014968537725508213, 0.0015256392071023583, 0.0015544246416538954, 0.0015832101926207542]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 9.0, 7.0, 10.0, 17.0, 14.0, 19.0, 25.0, 15.0, 25.0, 25.0, 29.0, 37.0, 36.0, 29.0, 41.0, 49.0, 41.0, 30.0, 42.0, 47.0, 45.0, 37.0, 38.0, 31.0, 34.0, 33.0, 31.0, 33.0, 22.0, 20.0, 18.0, 25.0, 19.0, 11.0, 11.0, 12.0, 3.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.0001271367073059082, -0.00012324098497629166, -0.00011934526264667511, -0.00011544954031705856, -0.00011155381798744202, -0.00010765809565782547, -0.00010376237332820892, -9.986665099859238e-05, -9.597092866897583e-05, -9.207520633935928e-05, -8.817948400974274e-05, -8.428376168012619e-05, -8.038803935050964e-05, -7.64923170208931e-05, -7.259659469127655e-05, -6.870087236166e-05, -6.480515003204346e-05, -6.090942770242691e-05, -5.7013705372810364e-05, -5.311798304319382e-05, -4.922226071357727e-05, -4.5326538383960724e-05, -4.143081605434418e-05, -3.753509372472763e-05, -3.3639371395111084e-05, -2.9743649065494537e-05, -2.584792673587799e-05, -2.1952204406261444e-05, -1.8056482076644897e-05, -1.416075974702835e-05, -1.0265037417411804e-05, -6.3693150877952576e-06, -2.473592758178711e-06, 1.4221295714378357e-06, 5.317851901054382e-06, 9.213574230670929e-06, 1.3109296560287476e-05, 1.7005018889904022e-05, 2.090074121952057e-05, 2.4796463549137115e-05, 2.8692185878753662e-05, 3.258790820837021e-05, 3.6483630537986755e-05, 4.03793528676033e-05, 4.427507519721985e-05, 4.8170797526836395e-05, 5.206651985645294e-05, 5.596224218606949e-05, 5.9857964515686035e-05, 6.375368684530258e-05, 6.764940917491913e-05, 7.154513150453568e-05, 7.544085383415222e-05, 7.933657616376877e-05, 8.323229849338531e-05, 8.712802082300186e-05, 9.102374315261841e-05, 9.491946548223495e-05, 9.88151878118515e-05, 0.00010271091014146805, 0.0001066066324710846, 0.00011050235480070114, 0.00011439807713031769, 0.00011829379945993423, 0.00012218952178955078]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 4.0, 2.0, 5.0, 2.0, 3.0, 5.0, 8.0, 14.0, 24.0, 20.0, 22.0, 28.0, 27.0, 29.0, 35.0, 35.0, 53.0, 40.0, 31.0, 59.0, 47.0, 59.0, 37.0, 40.0, 31.0, 56.0, 34.0, 51.0, 28.0, 30.0, 25.0, 19.0, 23.0, 14.0, 19.0, 5.0, 6.0, 9.0, 5.0, 1.0, 7.0, 9.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0390625, -6.8204345703125, -6.601806640625, -6.3831787109375, -6.16455078125, -5.9459228515625, -5.727294921875, -5.5086669921875, -5.2900390625, -5.0714111328125, -4.852783203125, -4.6341552734375, -4.41552734375, -4.1968994140625, -3.978271484375, -3.7596435546875, -3.541015625, -3.3223876953125, -3.103759765625, -2.8851318359375, -2.66650390625, -2.4478759765625, -2.229248046875, -2.0106201171875, -1.7919921875, -1.5733642578125, -1.354736328125, -1.1361083984375, -0.91748046875, -0.6988525390625, -0.480224609375, -0.2615966796875, -0.04296875, 0.1756591796875, 0.394287109375, 0.6129150390625, 0.83154296875, 1.0501708984375, 1.268798828125, 1.4874267578125, 1.7060546875, 1.9246826171875, 2.143310546875, 2.3619384765625, 2.58056640625, 2.7991943359375, 3.017822265625, 3.2364501953125, 3.455078125, 3.6737060546875, 3.892333984375, 4.1109619140625, 4.32958984375, 4.5482177734375, 4.766845703125, 4.9854736328125, 5.2041015625, 5.4227294921875, 5.641357421875, 5.8599853515625, 6.07861328125, 6.2972412109375, 6.515869140625, 6.7344970703125, 6.953125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 6.0, 9.0, 10.0, 23.0, 23.0, 37.0, 49.0, 49.0, 77.0, 101.0, 155.0, 250.0, 312.0, 460.0, 691.0, 1175.0, 2081.0, 4041.0, 9836.0, 38024.0, 420594.0, 506787.0, 43125.0, 10761.0, 4207.0, 2044.0, 1212.0, 766.0, 488.0, 331.0, 256.0, 176.0, 112.0, 79.0, 61.0, 42.0, 32.0, 23.0, 9.0, 9.0, 7.0, 8.0, 6.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.421875, -18.833984375, -18.24609375, -17.658203125, -17.0703125, -16.482421875, -15.89453125, -15.306640625, -14.71875, -14.130859375, -13.54296875, -12.955078125, -12.3671875, -11.779296875, -11.19140625, -10.603515625, -10.015625, -9.427734375, -8.83984375, -8.251953125, -7.6640625, -7.076171875, -6.48828125, -5.900390625, -5.3125, -4.724609375, -4.13671875, -3.548828125, -2.9609375, -2.373046875, -1.78515625, -1.197265625, -0.609375, -0.021484375, 0.56640625, 1.154296875, 1.7421875, 2.330078125, 2.91796875, 3.505859375, 4.09375, 4.681640625, 5.26953125, 5.857421875, 6.4453125, 7.033203125, 7.62109375, 8.208984375, 8.796875, 9.384765625, 9.97265625, 10.560546875, 11.1484375, 11.736328125, 12.32421875, 12.912109375, 13.5, 14.087890625, 14.67578125, 15.263671875, 15.8515625, 16.439453125, 17.02734375, 17.615234375, 18.203125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 0.0, 3.0, 4.0, 11.0, 6.0, 11.0, 11.0, 24.0, 13.0, 16.0, 28.0, 23.0, 27.0, 32.0, 42.0, 47.0, 72.0, 101.0, 268.0, 1521.0, 252.0, 104.0, 74.0, 58.0, 50.0, 40.0, 30.0, 26.0, 25.0, 25.0, 14.0, 15.0, 15.0, 13.0, 11.0, 9.0, 1.0, 3.0, 8.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0], "bins": [-18.828125, -18.325439453125, -17.82275390625, -17.320068359375, -16.8173828125, -16.314697265625, -15.81201171875, -15.309326171875, -14.806640625, -14.303955078125, -13.80126953125, -13.298583984375, -12.7958984375, -12.293212890625, -11.79052734375, -11.287841796875, -10.78515625, -10.282470703125, -9.77978515625, -9.277099609375, -8.7744140625, -8.271728515625, -7.76904296875, -7.266357421875, -6.763671875, -6.260986328125, -5.75830078125, -5.255615234375, -4.7529296875, -4.250244140625, -3.74755859375, -3.244873046875, -2.7421875, -2.239501953125, -1.73681640625, -1.234130859375, -0.7314453125, -0.228759765625, 0.27392578125, 0.776611328125, 1.279296875, 1.781982421875, 2.28466796875, 2.787353515625, 3.2900390625, 3.792724609375, 4.29541015625, 4.798095703125, 5.30078125, 5.803466796875, 6.30615234375, 6.808837890625, 7.3115234375, 7.814208984375, 8.31689453125, 8.819580078125, 9.322265625, 9.824951171875, 10.32763671875, 10.830322265625, 11.3330078125, 11.835693359375, 12.33837890625, 12.841064453125, 13.34375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 10.0, 8.0, 14.0, 9.0, 16.0, 20.0, 22.0, 35.0, 56.0, 68.0, 94.0, 173.0, 269.0, 458.0, 887.0, 2457.0, 1548124.0, 1588433.0, 2486.0, 860.0, 444.0, 249.0, 158.0, 90.0, 67.0, 55.0, 28.0, 23.0, 22.0, 17.0, 7.0, 13.0, 6.0, 7.0, 7.0, 2.0, 6.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.4375, -46.6435546875, -44.849609375, -43.0556640625, -41.26171875, -39.4677734375, -37.673828125, -35.8798828125, -34.0859375, -32.2919921875, -30.498046875, -28.7041015625, -26.91015625, -25.1162109375, -23.322265625, -21.5283203125, -19.734375, -17.9404296875, -16.146484375, -14.3525390625, -12.55859375, -10.7646484375, -8.970703125, -7.1767578125, -5.3828125, -3.5888671875, -1.794921875, -0.0009765625, 1.79296875, 3.5869140625, 5.380859375, 7.1748046875, 8.96875, 10.7626953125, 12.556640625, 14.3505859375, 16.14453125, 17.9384765625, 19.732421875, 21.5263671875, 23.3203125, 25.1142578125, 26.908203125, 28.7021484375, 30.49609375, 32.2900390625, 34.083984375, 35.8779296875, 37.671875, 39.4658203125, 41.259765625, 43.0537109375, 44.84765625, 46.6416015625, 48.435546875, 50.2294921875, 52.0234375, 53.8173828125, 55.611328125, 57.4052734375, 59.19921875, 60.9931640625, 62.787109375, 64.5810546875, 66.375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 18.0, 120.0, 349.0, 339.0, 143.0, 31.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.62673950195312, -137.43357849121094, -134.24041748046875, -131.04725646972656, -127.85409545898438, -124.66093444824219, -121.4677734375, -118.27461242675781, -115.08145141601562, -111.88829040527344, -108.69512939453125, -105.50196838378906, -102.30880737304688, -99.11564636230469, -95.9224853515625, -92.72932434082031, -89.5361557006836, -86.3429946899414, -83.14983367919922, -79.95667266845703, -76.76351165771484, -73.57035064697266, -70.37718200683594, -67.18402099609375, -63.99086380004883, -60.79770278930664, -57.60454177856445, -54.411376953125, -51.21821594238281, -48.025054931640625, -44.83189392089844, -41.63873291015625, -38.4455680847168, -35.25240707397461, -32.05924606323242, -28.8660831451416, -25.672922134399414, -22.479761123657227, -19.286598205566406, -16.09343719482422, -12.900276184082031, -9.707115173339844, -6.51395320892334, -3.320791244506836, -0.12763023376464844, 3.065530776977539, 6.258693695068359, 9.451854705810547, 12.645015716552734, 15.838176727294922, 19.03133773803711, 22.22450065612793, 25.417661666870117, 28.610822677612305, 31.803985595703125, 34.99714660644531, 38.1903076171875, 41.38346862792969, 44.576629638671875, 47.76979064941406, 50.96295166015625, 54.15611267089844, 57.34927749633789, 60.54243850708008, 63.735599517822266]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 11.0, 10.0, 6.0, 14.0, 11.0, 17.0, 16.0, 16.0, 24.0, 29.0, 27.0, 24.0, 32.0, 34.0, 35.0, 36.0, 36.0, 45.0, 37.0, 43.0, 38.0, 34.0, 38.0, 25.0, 39.0, 28.0, 44.0, 19.0, 30.0, 24.0, 23.0, 25.0, 19.0, 16.0, 19.0, 14.0, 14.0, 10.0, 5.0, 5.0, 6.0, 3.0, 8.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-42.93523406982422, -41.71271896362305, -40.490203857421875, -39.26769256591797, -38.0451774597168, -36.822662353515625, -35.60014724731445, -34.37763214111328, -33.15511703491211, -31.932601928710938, -30.7100887298584, -29.487573623657227, -28.265058517456055, -27.042545318603516, -25.820030212402344, -24.597515106201172, -23.375001907348633, -22.15248680114746, -20.929973602294922, -19.70745849609375, -18.484943389892578, -17.262428283691406, -16.039915084838867, -14.817399978637695, -13.59488582611084, -12.372371673583984, -11.149856567382812, -9.927342414855957, -8.704828262329102, -7.48231315612793, -6.259799003601074, -5.037283897399902, -3.814769744873047, -2.592255115509033, -1.3697407245635986, -0.14722633361816406, 1.0752882957458496, 2.2978029251098633, 3.5203170776367188, 4.742832183837891, 5.965346336364746, 7.18786096572876, 8.410375595092773, 9.632889747619629, 10.855403900146484, 12.077919006347656, 13.300433158874512, 14.522948265075684, 15.745462417602539, 16.96797752380371, 18.19049072265625, 19.413005828857422, 20.635520935058594, 21.858036041259766, 23.080549240112305, 24.303064346313477, 25.525577545166016, 26.748092651367188, 27.970605850219727, 29.1931209564209, 30.41563606262207, 31.63814926147461, 32.86066436767578, 34.08317947387695, 35.305694580078125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 3.0, 11.0, 8.0, 8.0, 9.0, 8.0, 16.0, 18.0, 24.0, 22.0, 28.0, 32.0, 27.0, 25.0, 35.0, 32.0, 39.0, 46.0, 46.0, 54.0, 48.0, 40.0, 47.0, 39.0, 30.0, 38.0, 28.0, 32.0, 33.0, 23.0, 23.0, 17.0, 24.0, 21.0, 9.0, 9.0, 10.0, 11.0, 7.0, 5.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-6.68359375, -6.4759521484375, -6.268310546875, -6.0606689453125, -5.85302734375, -5.6453857421875, -5.437744140625, -5.2301025390625, -5.0224609375, -4.8148193359375, -4.607177734375, -4.3995361328125, -4.19189453125, -3.9842529296875, -3.776611328125, -3.5689697265625, -3.361328125, -3.1536865234375, -2.946044921875, -2.7384033203125, -2.53076171875, -2.3231201171875, -2.115478515625, -1.9078369140625, -1.7001953125, -1.4925537109375, -1.284912109375, -1.0772705078125, -0.86962890625, -0.6619873046875, -0.454345703125, -0.2467041015625, -0.0390625, 0.1685791015625, 0.376220703125, 0.5838623046875, 0.79150390625, 0.9991455078125, 1.206787109375, 1.4144287109375, 1.6220703125, 1.8297119140625, 2.037353515625, 2.2449951171875, 2.45263671875, 2.6602783203125, 2.867919921875, 3.0755615234375, 3.283203125, 3.4908447265625, 3.698486328125, 3.9061279296875, 4.11376953125, 4.3214111328125, 4.529052734375, 4.7366943359375, 4.9443359375, 5.1519775390625, 5.359619140625, 5.5672607421875, 5.77490234375, 5.9825439453125, 6.190185546875, 6.3978271484375, 6.60546875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 6.0, 19.0, 27.0, 28.0, 38.0, 55.0, 67.0, 110.0, 122.0, 172.0, 227.0, 305.0, 453.0, 598.0, 906.0, 1319.0, 2127.0, 3967.0, 8239.0, 20419.0, 70801.0, 460040.0, 2265999.0, 1140421.0, 159300.0, 33431.0, 11763.0, 5222.0, 2781.0, 1643.0, 1068.0, 758.0, 501.0, 356.0, 259.0, 199.0, 146.0, 112.0, 66.0, 54.0, 39.0, 35.0, 20.0, 18.0, 14.0, 6.0, 8.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-14.1484375, -13.7410888671875, -13.333740234375, -12.9263916015625, -12.51904296875, -12.1116943359375, -11.704345703125, -11.2969970703125, -10.8896484375, -10.4822998046875, -10.074951171875, -9.6676025390625, -9.26025390625, -8.8529052734375, -8.445556640625, -8.0382080078125, -7.630859375, -7.2235107421875, -6.816162109375, -6.4088134765625, -6.00146484375, -5.5941162109375, -5.186767578125, -4.7794189453125, -4.3720703125, -3.9647216796875, -3.557373046875, -3.1500244140625, -2.74267578125, -2.3353271484375, -1.927978515625, -1.5206298828125, -1.11328125, -0.7059326171875, -0.298583984375, 0.1087646484375, 0.51611328125, 0.9234619140625, 1.330810546875, 1.7381591796875, 2.1455078125, 2.5528564453125, 2.960205078125, 3.3675537109375, 3.77490234375, 4.1822509765625, 4.589599609375, 4.9969482421875, 5.404296875, 5.8116455078125, 6.218994140625, 6.6263427734375, 7.03369140625, 7.4410400390625, 7.848388671875, 8.2557373046875, 8.6630859375, 9.0704345703125, 9.477783203125, 9.8851318359375, 10.29248046875, 10.6998291015625, 11.107177734375, 11.5145263671875, 11.921875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 11.0, 12.0, 26.0, 47.0, 70.0, 138.0, 244.0, 432.0, 835.0, 972.0, 571.0, 301.0, 168.0, 107.0, 63.0, 41.0, 21.0, 10.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2890625, -12.5938720703125, -11.898681640625, -11.2034912109375, -10.50830078125, -9.8131103515625, -9.117919921875, -8.4227294921875, -7.7275390625, -7.0323486328125, -6.337158203125, -5.6419677734375, -4.94677734375, -4.2515869140625, -3.556396484375, -2.8612060546875, -2.166015625, -1.4708251953125, -0.775634765625, -0.0804443359375, 0.61474609375, 1.3099365234375, 2.005126953125, 2.7003173828125, 3.3955078125, 4.0906982421875, 4.785888671875, 5.4810791015625, 6.17626953125, 6.8714599609375, 7.566650390625, 8.2618408203125, 8.95703125, 9.6522216796875, 10.347412109375, 11.0426025390625, 11.73779296875, 12.4329833984375, 13.128173828125, 13.8233642578125, 14.5185546875, 15.2137451171875, 15.908935546875, 16.6041259765625, 17.29931640625, 17.9945068359375, 18.689697265625, 19.3848876953125, 20.080078125, 20.7752685546875, 21.470458984375, 22.1656494140625, 22.86083984375, 23.5560302734375, 24.251220703125, 24.9464111328125, 25.6416015625, 26.3367919921875, 27.031982421875, 27.7271728515625, 28.42236328125, 29.1175537109375, 29.812744140625, 30.5079345703125, 31.203125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 11.0, 9.0, 10.0, 20.0, 38.0, 59.0, 84.0, 137.0, 241.0, 398.0, 946.0, 3363.0, 31919.0, 3158954.0, 978333.0, 15929.0, 2291.0, 705.0, 319.0, 171.0, 101.0, 73.0, 46.0, 37.0, 21.0, 17.0, 18.0, 7.0, 6.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-41.71875, -40.55615234375, -39.3935546875, -38.23095703125, -37.068359375, -35.90576171875, -34.7431640625, -33.58056640625, -32.41796875, -31.25537109375, -30.0927734375, -28.93017578125, -27.767578125, -26.60498046875, -25.4423828125, -24.27978515625, -23.1171875, -21.95458984375, -20.7919921875, -19.62939453125, -18.466796875, -17.30419921875, -16.1416015625, -14.97900390625, -13.81640625, -12.65380859375, -11.4912109375, -10.32861328125, -9.166015625, -8.00341796875, -6.8408203125, -5.67822265625, -4.515625, -3.35302734375, -2.1904296875, -1.02783203125, 0.134765625, 1.29736328125, 2.4599609375, 3.62255859375, 4.78515625, 5.94775390625, 7.1103515625, 8.27294921875, 9.435546875, 10.59814453125, 11.7607421875, 12.92333984375, 14.0859375, 15.24853515625, 16.4111328125, 17.57373046875, 18.736328125, 19.89892578125, 21.0615234375, 22.22412109375, 23.38671875, 24.54931640625, 25.7119140625, 26.87451171875, 28.037109375, 29.19970703125, 30.3623046875, 31.52490234375, 32.6875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 15.0, 65.0, 301.0, 462.0, 134.0, 32.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.3144760131836, -60.042022705078125, -52.76956558227539, -45.497108459472656, -38.22465515136719, -30.95220184326172, -23.679744720458984, -16.40728759765625, -9.134834289550781, -1.8623790740966797, 5.410076141357422, 12.682531356811523, 19.954986572265625, 27.227439880371094, 34.49989700317383, 41.77235412597656, 49.04480743408203, 56.3172607421875, 63.589717864990234, 70.86217498779297, 78.13462829589844, 85.4070816040039, 92.67953491210938, 99.95199584960938, 107.22444915771484, 114.49690246582031, 121.76936340332031, 129.04180908203125, 136.31427001953125, 143.58673095703125, 150.8591766357422, 158.1316375732422, 165.40408325195312, 172.67654418945312, 179.94898986816406, 187.22145080566406, 194.493896484375, 201.766357421875, 209.038818359375, 216.311279296875, 223.58372497558594, 230.85618591308594, 238.12863159179688, 245.40109252929688, 252.67355346679688, 259.94598388671875, 267.21844482421875, 274.49090576171875, 281.76336669921875, 289.03582763671875, 296.30828857421875, 303.5807189941406, 310.8531799316406, 318.1256408691406, 325.3981018066406, 332.6705627441406, 339.9429931640625, 347.2154541015625, 354.4879150390625, 361.7603454589844, 369.0328063964844, 376.3052673339844, 383.5777282714844, 390.8501892089844, 398.1226501464844]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 9.0, 7.0, 9.0, 9.0, 10.0, 12.0, 16.0, 20.0, 15.0, 16.0, 21.0, 24.0, 34.0, 30.0, 40.0, 33.0, 37.0, 36.0, 42.0, 46.0, 27.0, 38.0, 49.0, 26.0, 41.0, 36.0, 38.0, 35.0, 28.0, 24.0, 29.0, 17.0, 21.0, 25.0, 17.0, 19.0, 14.0, 13.0, 8.0, 5.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.9328727722168, -44.4693717956543, -43.0058708190918, -41.5423698425293, -40.0788688659668, -38.6153678894043, -37.1518669128418, -35.6883659362793, -34.2248649597168, -32.7613639831543, -31.297863006591797, -29.834362030029297, -28.370861053466797, -26.907360076904297, -25.443859100341797, -23.980358123779297, -22.516857147216797, -21.053356170654297, -19.589855194091797, -18.126354217529297, -16.662853240966797, -15.199352264404297, -13.735851287841797, -12.272350311279297, -10.808849334716797, -9.345348358154297, -7.881847381591797, -6.418346405029297, -4.954845428466797, -3.491344451904297, -2.027843475341797, -0.5643424987792969, 0.8991584777832031, 2.362659454345703, 3.826160430908203, 5.289661407470703, 6.753162384033203, 8.216663360595703, 9.680164337158203, 11.143665313720703, 12.607166290283203, 14.070667266845703, 15.534168243408203, 16.997669219970703, 18.461170196533203, 19.924671173095703, 21.388172149658203, 22.851673126220703, 24.315174102783203, 25.778675079345703, 27.242176055908203, 28.705677032470703, 30.169178009033203, 31.632678985595703, 33.0961799621582, 34.5596809387207, 36.0231819152832, 37.4866828918457, 38.9501838684082, 40.4136848449707, 41.8771858215332, 43.3406867980957, 44.8041877746582, 46.2676887512207, 47.7311897277832]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 7.0, 2.0, 11.0, 11.0, 10.0, 11.0, 21.0, 25.0, 28.0, 32.0, 25.0, 44.0, 33.0, 36.0, 49.0, 40.0, 43.0, 50.0, 37.0, 56.0, 43.0, 45.0, 37.0, 30.0, 34.0, 35.0, 35.0, 32.0, 17.0, 17.0, 22.0, 14.0, 10.0, 8.0, 13.0, 10.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.671875, -6.4588623046875, -6.245849609375, -6.0328369140625, -5.81982421875, -5.6068115234375, -5.393798828125, -5.1807861328125, -4.9677734375, -4.7547607421875, -4.541748046875, -4.3287353515625, -4.11572265625, -3.9027099609375, -3.689697265625, -3.4766845703125, -3.263671875, -3.0506591796875, -2.837646484375, -2.6246337890625, -2.41162109375, -2.1986083984375, -1.985595703125, -1.7725830078125, -1.5595703125, -1.3465576171875, -1.133544921875, -0.9205322265625, -0.70751953125, -0.4945068359375, -0.281494140625, -0.0684814453125, 0.14453125, 0.3575439453125, 0.570556640625, 0.7835693359375, 0.99658203125, 1.2095947265625, 1.422607421875, 1.6356201171875, 1.8486328125, 2.0616455078125, 2.274658203125, 2.4876708984375, 2.70068359375, 2.9136962890625, 3.126708984375, 3.3397216796875, 3.552734375, 3.7657470703125, 3.978759765625, 4.1917724609375, 4.40478515625, 4.6177978515625, 4.830810546875, 5.0438232421875, 5.2568359375, 5.4698486328125, 5.682861328125, 5.8958740234375, 6.10888671875, 6.3218994140625, 6.534912109375, 6.7479248046875, 6.9609375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 3.0, 4.0, 3.0, 10.0, 19.0, 15.0, 24.0, 38.0, 65.0, 107.0, 121.0, 182.0, 256.0, 376.0, 563.0, 764.0, 1043.0, 1620.0, 2294.0, 3536.0, 5205.0, 7867.0, 11968.0, 18461.0, 28973.0, 47850.0, 83073.0, 162082.0, 291845.0, 164310.0, 83983.0, 47676.0, 29343.0, 18661.0, 12088.0, 7967.0, 5206.0, 3422.0, 2331.0, 1600.0, 1105.0, 762.0, 484.0, 382.0, 249.0, 194.0, 121.0, 98.0, 72.0, 37.0, 34.0, 24.0, 16.0, 18.0, 10.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0], "bins": [-0.25732421875, -0.24915695190429688, -0.24098968505859375, -0.23282241821289062, -0.2246551513671875, -0.21648788452148438, -0.20832061767578125, -0.20015335083007812, -0.191986083984375, -0.18381881713867188, -0.17565155029296875, -0.16748428344726562, -0.1593170166015625, -0.15114974975585938, -0.14298248291015625, -0.13481521606445312, -0.12664794921875, -0.11848068237304688, -0.11031341552734375, -0.10214614868164062, -0.0939788818359375, -0.08581161499023438, -0.07764434814453125, -0.06947708129882812, -0.061309814453125, -0.053142547607421875, -0.04497528076171875, -0.036808013916015625, -0.0286407470703125, -0.020473480224609375, -0.01230621337890625, -0.004138946533203125, 0.0040283203125, 0.012195587158203125, 0.02036285400390625, 0.028530120849609375, 0.0366973876953125, 0.044864654541015625, 0.05303192138671875, 0.061199188232421875, 0.069366455078125, 0.07753372192382812, 0.08570098876953125, 0.09386825561523438, 0.1020355224609375, 0.11020278930664062, 0.11837005615234375, 0.12653732299804688, 0.13470458984375, 0.14287185668945312, 0.15103912353515625, 0.15920639038085938, 0.1673736572265625, 0.17554092407226562, 0.18370819091796875, 0.19187545776367188, 0.200042724609375, 0.20820999145507812, 0.21637725830078125, 0.22454452514648438, 0.2327117919921875, 0.24087905883789062, 0.24904632568359375, 0.2572135925292969, 0.265380859375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 2.0, 3.0, 10.0, 11.0, 8.0, 17.0, 15.0, 19.0, 27.0, 21.0, 20.0, 20.0, 35.0, 35.0, 30.0, 29.0, 43.0, 37.0, 31.0, 35.0, 1071.0, 45.0, 31.0, 50.0, 39.0, 37.0, 39.0, 46.0, 37.0, 22.0, 17.0, 25.0, 21.0, 17.0, 9.0, 19.0, 13.0, 13.0, 5.0, 9.0, 0.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0], "bins": [-5.09375, -4.95831298828125, -4.8228759765625, -4.68743896484375, -4.552001953125, -4.41656494140625, -4.2811279296875, -4.14569091796875, -4.01025390625, -3.87481689453125, -3.7393798828125, -3.60394287109375, -3.468505859375, -3.33306884765625, -3.1976318359375, -3.06219482421875, -2.9267578125, -2.79132080078125, -2.6558837890625, -2.52044677734375, -2.385009765625, -2.24957275390625, -2.1141357421875, -1.97869873046875, -1.84326171875, -1.70782470703125, -1.5723876953125, -1.43695068359375, -1.301513671875, -1.16607666015625, -1.0306396484375, -0.89520263671875, -0.759765625, -0.62432861328125, -0.4888916015625, -0.35345458984375, -0.218017578125, -0.08258056640625, 0.0528564453125, 0.18829345703125, 0.32373046875, 0.45916748046875, 0.5946044921875, 0.73004150390625, 0.865478515625, 1.00091552734375, 1.1363525390625, 1.27178955078125, 1.4072265625, 1.54266357421875, 1.6781005859375, 1.81353759765625, 1.948974609375, 2.08441162109375, 2.2198486328125, 2.35528564453125, 2.49072265625, 2.62615966796875, 2.7615966796875, 2.89703369140625, 3.032470703125, 3.16790771484375, 3.3033447265625, 3.43878173828125, 3.57421875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 13.0, 17.0, 25.0, 47.0, 57.0, 94.0, 130.0, 168.0, 260.0, 374.0, 536.0, 728.0, 1137.0, 1600.0, 2368.0, 3525.0, 5225.0, 7946.0, 12026.0, 18849.0, 30319.0, 48888.0, 82873.0, 149090.0, 1317241.0, 171968.0, 92922.0, 54981.0, 33350.0, 20686.0, 13363.0, 8633.0, 5790.0, 3798.0, 2501.0, 1695.0, 1235.0, 831.0, 606.0, 401.0, 265.0, 179.0, 120.0, 86.0, 57.0, 48.0, 32.0, 24.0, 9.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.2105712890625, -0.20390892028808594, -0.19724655151367188, -0.1905841827392578, -0.18392181396484375, -0.1772594451904297, -0.17059707641601562, -0.16393470764160156, -0.1572723388671875, -0.15060997009277344, -0.14394760131835938, -0.1372852325439453, -0.13062286376953125, -0.12396049499511719, -0.11729812622070312, -0.11063575744628906, -0.103973388671875, -0.09731101989746094, -0.09064865112304688, -0.08398628234863281, -0.07732391357421875, -0.07066154479980469, -0.06399917602539062, -0.05733680725097656, -0.0506744384765625, -0.04401206970214844, -0.037349700927734375, -0.030687332153320312, -0.02402496337890625, -0.017362594604492188, -0.010700225830078125, -0.0040378570556640625, 0.00262451171875, 0.009286880493164062, 0.015949249267578125, 0.022611618041992188, 0.02927398681640625, 0.03593635559082031, 0.042598724365234375, 0.04926109313964844, 0.0559234619140625, 0.06258583068847656, 0.06924819946289062, 0.07591056823730469, 0.08257293701171875, 0.08923530578613281, 0.09589767456054688, 0.10256004333496094, 0.109222412109375, 0.11588478088378906, 0.12254714965820312, 0.1292095184326172, 0.13587188720703125, 0.1425342559814453, 0.14919662475585938, 0.15585899353027344, 0.1625213623046875, 0.16918373107910156, 0.17584609985351562, 0.1825084686279297, 0.18917083740234375, 0.1958332061767578, 0.20249557495117188, 0.20915794372558594, 0.2158203125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 6.0, 7.0, 12.0, 17.0, 10.0, 14.0, 27.0, 20.0, 25.0, 36.0, 25.0, 42.0, 53.0, 57.0, 58.0, 61.0, 68.0, 64.0, 61.0, 51.0, 43.0, 33.0, 32.0, 34.0, 19.0, 19.0, 21.0, 16.0, 15.0, 8.0, 9.0, 4.0, 5.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011307001113891602, -0.0001094769686460495, -0.00010588392615318298, -0.00010229088366031647, -9.869784116744995e-05, -9.510479867458344e-05, -9.151175618171692e-05, -8.79187136888504e-05, -8.432567119598389e-05, -8.073262870311737e-05, -7.713958621025085e-05, -7.354654371738434e-05, -6.995350122451782e-05, -6.63604587316513e-05, -6.276741623878479e-05, -5.9174373745918274e-05, -5.558133125305176e-05, -5.198828876018524e-05, -4.8395246267318726e-05, -4.480220377445221e-05, -4.120916128158569e-05, -3.761611878871918e-05, -3.402307629585266e-05, -3.0430033802986145e-05, -2.683699131011963e-05, -2.3243948817253113e-05, -1.9650906324386597e-05, -1.605786383152008e-05, -1.2464821338653564e-05, -8.871778845787048e-06, -5.278736352920532e-06, -1.6856938600540161e-06, 1.9073486328125e-06, 5.500391125679016e-06, 9.093433618545532e-06, 1.2686476111412048e-05, 1.6279518604278564e-05, 1.987256109714508e-05, 2.3465603590011597e-05, 2.7058646082878113e-05, 3.065168857574463e-05, 3.4244731068611145e-05, 3.783777356147766e-05, 4.143081605434418e-05, 4.502385854721069e-05, 4.861690104007721e-05, 5.2209943532943726e-05, 5.580298602581024e-05, 5.939602851867676e-05, 6.298907101154327e-05, 6.658211350440979e-05, 7.01751559972763e-05, 7.376819849014282e-05, 7.736124098300934e-05, 8.095428347587585e-05, 8.454732596874237e-05, 8.814036846160889e-05, 9.17334109544754e-05, 9.532645344734192e-05, 9.891949594020844e-05, 0.00010251253843307495, 0.00010610558092594147, 0.00010969862341880798, 0.0001132916659116745, 0.00011688470840454102]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 3.0, 5.0, 10.0, 2.0, 6.0, 7.0, 14.0, 13.0, 22.0, 27.0, 39.0, 33.0, 54.0, 67.0, 75.0, 115.0, 152.0, 215.0, 334.0, 640.0, 2475.0, 81453.0, 945710.0, 14522.0, 1217.0, 410.0, 252.0, 173.0, 110.0, 100.0, 67.0, 53.0, 37.0, 36.0, 22.0, 19.0, 18.0, 7.0, 11.0, 7.0, 3.0, 7.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.002300262451171875, -0.002235099673271179, -0.0021699368953704834, -0.0021047741174697876, -0.002039611339569092, -0.001974448561668396, -0.0019092857837677002, -0.0018441230058670044, -0.0017789602279663086, -0.0017137974500656128, -0.001648634672164917, -0.0015834718942642212, -0.0015183091163635254, -0.0014531463384628296, -0.0013879835605621338, -0.001322820782661438, -0.0012576580047607422, -0.0011924952268600464, -0.0011273324489593506, -0.0010621696710586548, -0.000997006893157959, -0.0009318441152572632, -0.0008666813373565674, -0.0008015185594558716, -0.0007363557815551758, -0.00067119300365448, -0.0006060302257537842, -0.0005408674478530884, -0.0004757046699523926, -0.0004105418920516968, -0.000345379114151001, -0.0002802163362503052, -0.00021505355834960938, -0.00014989078044891357, -8.472800254821777e-05, -1.9565224647521973e-05, 4.559755325317383e-05, 0.00011076033115386963, 0.00017592310905456543, 0.00024108588695526123, 0.00030624866485595703, 0.00037141144275665283, 0.00043657422065734863, 0.0005017369985580444, 0.0005668997764587402, 0.000632062554359436, 0.0006972253322601318, 0.0007623881101608276, 0.0008275508880615234, 0.0008927136659622192, 0.000957876443862915, 0.0010230392217636108, 0.0010882019996643066, 0.0011533647775650024, 0.0012185275554656982, 0.001283690333366394, 0.0013488531112670898, 0.0014140158891677856, 0.0014791786670684814, 0.0015443414449691772, 0.001609504222869873, 0.0016746670007705688, 0.0017398297786712646, 0.0018049925565719604, 0.0018701553344726562]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 12.0, 28.0, 71.0, 158.0, 243.0, 292.0, 122.0, 56.0, 23.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.687364707933739e-05, -4.00920762331225e-05, -3.33105017489288e-05, -2.6528929083724506e-05, -1.9747356418520212e-05, -1.2965785572305322e-05, -6.184211088111624e-06, 5.973633960820735e-07, 7.378934242296964e-06, 1.4160506907501258e-05, 2.0942079572705552e-05, 2.7723652237909846e-05, 3.450522490311414e-05, 4.128679574932903e-05, 4.806837023352273e-05, 5.4849944717716426e-05, 6.163151556393132e-05, 6.84130864101462e-05, 7.519466453231871e-05, 8.19762353785336e-05, 8.875780622474849e-05, 9.553937707096338e-05, 0.00010232094791717827, 0.00010910252603935078, 0.00011588409688556567, 0.00012266567500773817, 0.00012944724585395306, 0.00013622881670016795, 0.00014301038754638284, 0.00014979195839259773, 0.00015657352923881263, 0.00016335511463694274, 0.00017013668548315763, 0.00017691825632937253, 0.00018369982717558742, 0.0001904813980218023, 0.0001972629688680172, 0.0002040445397142321, 0.0002108261251123622, 0.0002176076959585771, 0.000224389266804792, 0.00023117083765100688, 0.00023795240849722177, 0.0002447339938953519, 0.0002515155647415668, 0.00025829713558778167, 0.00026507870643399656, 0.00027186027728021145, 0.00027864184812642634, 0.00028542341897264123, 0.0002922049898188561, 0.000298986560665071, 0.0003057681315112859, 0.0003125497023575008, 0.0003193312732037157, 0.00032611284404993057, 0.0003328944439999759, 0.0003396760148461908, 0.0003464575856924057, 0.0003532391565386206, 0.0003600207273848355, 0.00036680229823105037, 0.00037358386907726526, 0.0003803654690273106, 0.00038714701076969504]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 2.0, 7.0, 6.0, 11.0, 13.0, 17.0, 17.0, 23.0, 17.0, 27.0, 25.0, 31.0, 27.0, 39.0, 28.0, 37.0, 37.0, 36.0, 43.0, 46.0, 37.0, 32.0, 54.0, 36.0, 42.0, 29.0, 40.0, 28.0, 27.0, 23.0, 23.0, 24.0, 21.0, 16.0, 16.0, 11.0, 20.0, 13.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.878376007080078e-05, -6.683450192213058e-05, -6.488524377346039e-05, -6.293598562479019e-05, -6.0986727476119995e-05, -5.90374693274498e-05, -5.70882111787796e-05, -5.5138953030109406e-05, -5.318969488143921e-05, -5.124043673276901e-05, -4.9291178584098816e-05, -4.734192043542862e-05, -4.539266228675842e-05, -4.3443404138088226e-05, -4.149414598941803e-05, -3.954488784074783e-05, -3.759562969207764e-05, -3.564637154340744e-05, -3.3697113394737244e-05, -3.174785524606705e-05, -2.979859709739685e-05, -2.7849338948726654e-05, -2.5900080800056458e-05, -2.395082265138626e-05, -2.2001564502716064e-05, -2.0052306354045868e-05, -1.810304820537567e-05, -1.6153790056705475e-05, -1.4204531908035278e-05, -1.2255273759365082e-05, -1.0306015610694885e-05, -8.356757462024689e-06, -6.407499313354492e-06, -4.458241164684296e-06, -2.508983016014099e-06, -5.597248673439026e-07, 1.389533281326294e-06, 3.3387914299964905e-06, 5.288049578666687e-06, 7.2373077273368835e-06, 9.18656587600708e-06, 1.1135824024677277e-05, 1.3085082173347473e-05, 1.503434032201767e-05, 1.6983598470687866e-05, 1.8932856619358063e-05, 2.088211476802826e-05, 2.2831372916698456e-05, 2.4780631065368652e-05, 2.672988921403885e-05, 2.8679147362709045e-05, 3.062840551137924e-05, 3.257766366004944e-05, 3.4526921808719635e-05, 3.647617995738983e-05, 3.842543810606003e-05, 4.0374696254730225e-05, 4.232395440340042e-05, 4.427321255207062e-05, 4.6222470700740814e-05, 4.817172884941101e-05, 5.012098699808121e-05, 5.2070245146751404e-05, 5.40195032954216e-05, 5.59687614440918e-05]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 7.0, 2.0, 11.0, 11.0, 10.0, 11.0, 21.0, 25.0, 28.0, 32.0, 25.0, 44.0, 33.0, 36.0, 49.0, 40.0, 43.0, 50.0, 37.0, 56.0, 43.0, 45.0, 37.0, 30.0, 34.0, 35.0, 35.0, 32.0, 17.0, 17.0, 22.0, 14.0, 10.0, 8.0, 13.0, 10.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.671875, -6.4588623046875, -6.245849609375, -6.0328369140625, -5.81982421875, -5.6068115234375, -5.393798828125, -5.1807861328125, -4.9677734375, -4.7547607421875, -4.541748046875, -4.3287353515625, -4.11572265625, -3.9027099609375, -3.689697265625, -3.4766845703125, -3.263671875, -3.0506591796875, -2.837646484375, -2.6246337890625, -2.41162109375, -2.1986083984375, -1.985595703125, -1.7725830078125, -1.5595703125, -1.3465576171875, -1.133544921875, -0.9205322265625, -0.70751953125, -0.4945068359375, -0.281494140625, -0.0684814453125, 0.14453125, 0.3575439453125, 0.570556640625, 0.7835693359375, 0.99658203125, 1.2095947265625, 1.422607421875, 1.6356201171875, 1.8486328125, 2.0616455078125, 2.274658203125, 2.4876708984375, 2.70068359375, 2.9136962890625, 3.126708984375, 3.3397216796875, 3.552734375, 3.7657470703125, 3.978759765625, 4.1917724609375, 4.40478515625, 4.6177978515625, 4.830810546875, 5.0438232421875, 5.2568359375, 5.4698486328125, 5.682861328125, 5.8958740234375, 6.10888671875, 6.3218994140625, 6.534912109375, 6.7479248046875, 6.9609375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 11.0, 10.0, 11.0, 21.0, 24.0, 40.0, 37.0, 52.0, 87.0, 133.0, 156.0, 235.0, 338.0, 506.0, 854.0, 1213.0, 2265.0, 4172.0, 9086.0, 23327.0, 84663.0, 468341.0, 353237.0, 63608.0, 19376.0, 7592.0, 3656.0, 2006.0, 1215.0, 707.0, 468.0, 309.0, 209.0, 161.0, 104.0, 81.0, 68.0, 40.0, 33.0, 19.0, 16.0, 16.0, 9.0, 10.0, 8.0, 5.0, 2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.4296875, -11.0474853515625, -10.665283203125, -10.2830810546875, -9.90087890625, -9.5186767578125, -9.136474609375, -8.7542724609375, -8.3720703125, -7.9898681640625, -7.607666015625, -7.2254638671875, -6.84326171875, -6.4610595703125, -6.078857421875, -5.6966552734375, -5.314453125, -4.9322509765625, -4.550048828125, -4.1678466796875, -3.78564453125, -3.4034423828125, -3.021240234375, -2.6390380859375, -2.2568359375, -1.8746337890625, -1.492431640625, -1.1102294921875, -0.72802734375, -0.3458251953125, 0.036376953125, 0.4185791015625, 0.80078125, 1.1829833984375, 1.565185546875, 1.9473876953125, 2.32958984375, 2.7117919921875, 3.093994140625, 3.4761962890625, 3.8583984375, 4.2406005859375, 4.622802734375, 5.0050048828125, 5.38720703125, 5.7694091796875, 6.151611328125, 6.5338134765625, 6.916015625, 7.2982177734375, 7.680419921875, 8.0626220703125, 8.44482421875, 8.8270263671875, 9.209228515625, 9.5914306640625, 9.9736328125, 10.3558349609375, 10.738037109375, 11.1202392578125, 11.50244140625, 11.8846435546875, 12.266845703125, 12.6490478515625, 13.03125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 5.0, 6.0, 7.0, 7.0, 11.0, 17.0, 16.0, 24.0, 24.0, 43.0, 51.0, 47.0, 54.0, 83.0, 152.0, 289.0, 1504.0, 210.0, 123.0, 83.0, 48.0, 40.0, 41.0, 37.0, 29.0, 25.0, 17.0, 10.0, 15.0, 5.0, 4.0, 7.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.84375, -23.12744140625, -22.4111328125, -21.69482421875, -20.978515625, -20.26220703125, -19.5458984375, -18.82958984375, -18.11328125, -17.39697265625, -16.6806640625, -15.96435546875, -15.248046875, -14.53173828125, -13.8154296875, -13.09912109375, -12.3828125, -11.66650390625, -10.9501953125, -10.23388671875, -9.517578125, -8.80126953125, -8.0849609375, -7.36865234375, -6.65234375, -5.93603515625, -5.2197265625, -4.50341796875, -3.787109375, -3.07080078125, -2.3544921875, -1.63818359375, -0.921875, -0.20556640625, 0.5107421875, 1.22705078125, 1.943359375, 2.65966796875, 3.3759765625, 4.09228515625, 4.80859375, 5.52490234375, 6.2412109375, 6.95751953125, 7.673828125, 8.39013671875, 9.1064453125, 9.82275390625, 10.5390625, 11.25537109375, 11.9716796875, 12.68798828125, 13.404296875, 14.12060546875, 14.8369140625, 15.55322265625, 16.26953125, 16.98583984375, 17.7021484375, 18.41845703125, 19.134765625, 19.85107421875, 20.5673828125, 21.28369140625, 22.0]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 2.0, 5.0, 8.0, 15.0, 13.0, 20.0, 18.0, 45.0, 59.0, 100.0, 173.0, 344.0, 940.0, 3480.0, 37244.0, 3042283.0, 54866.0, 4238.0, 989.0, 361.0, 191.0, 104.0, 55.0, 39.0, 29.0, 27.0, 12.0, 10.0, 10.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-51.75, -50.05615234375, -48.3623046875, -46.66845703125, -44.974609375, -43.28076171875, -41.5869140625, -39.89306640625, -38.19921875, -36.50537109375, -34.8115234375, -33.11767578125, -31.423828125, -29.72998046875, -28.0361328125, -26.34228515625, -24.6484375, -22.95458984375, -21.2607421875, -19.56689453125, -17.873046875, -16.17919921875, -14.4853515625, -12.79150390625, -11.09765625, -9.40380859375, -7.7099609375, -6.01611328125, -4.322265625, -2.62841796875, -0.9345703125, 0.75927734375, 2.453125, 4.14697265625, 5.8408203125, 7.53466796875, 9.228515625, 10.92236328125, 12.6162109375, 14.31005859375, 16.00390625, 17.69775390625, 19.3916015625, 21.08544921875, 22.779296875, 24.47314453125, 26.1669921875, 27.86083984375, 29.5546875, 31.24853515625, 32.9423828125, 34.63623046875, 36.330078125, 38.02392578125, 39.7177734375, 41.41162109375, 43.10546875, 44.79931640625, 46.4931640625, 48.18701171875, 49.880859375, 51.57470703125, 53.2685546875, 54.96240234375, 56.65625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 13.0, 73.0, 478.0, 381.0, 45.0, 13.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-419.5840148925781, -410.0306701660156, -400.477294921875, -390.9239501953125, -381.3705749511719, -371.8172302246094, -362.26385498046875, -352.71051025390625, -343.15716552734375, -333.60382080078125, -324.0504455566406, -314.4971008300781, -304.9437255859375, -295.390380859375, -285.8370056152344, -276.2836608886719, -266.73028564453125, -257.17694091796875, -247.62356567382812, -238.07020568847656, -228.516845703125, -218.9635009765625, -209.41014099121094, -199.85678100585938, -190.3034210205078, -180.75006103515625, -171.1967010498047, -161.64334106445312, -152.08999633789062, -142.53662109375, -132.9832763671875, -123.42991638183594, -113.87657165527344, -104.32321166992188, -94.76985168457031, -85.21649932861328, -75.66313934326172, -66.10977935791016, -56.55642318725586, -47.00306701660156, -37.44970703125, -27.89634895324707, -18.34299087524414, -8.789632797241211, 0.7637252807617188, 10.317085266113281, 19.870441436767578, 29.423797607421875, 38.97715759277344, 48.530517578125, 58.0838737487793, 67.6372299194336, 77.19058990478516, 86.74394989013672, 96.29730224609375, 105.85066223144531, 115.40402221679688, 124.95738220214844, 134.5107421875, 144.06410217285156, 153.61746215820312, 163.17080688476562, 172.7241668701172, 182.27752685546875, 191.8308868408203]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 7.0, 9.0, 8.0, 9.0, 9.0, 12.0, 7.0, 23.0, 21.0, 19.0, 24.0, 31.0, 39.0, 31.0, 28.0, 37.0, 41.0, 43.0, 30.0, 31.0, 37.0, 37.0, 29.0, 43.0, 46.0, 36.0, 34.0, 32.0, 45.0, 30.0, 29.0, 21.0, 7.0, 23.0, 16.0, 12.0, 11.0, 8.0, 11.0, 6.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-39.6685676574707, -38.464664459228516, -37.26076126098633, -36.05685806274414, -34.85295486450195, -33.649051666259766, -32.44514846801758, -31.241247177124023, -30.037343978881836, -28.83344078063965, -27.62953758239746, -26.425634384155273, -25.22173309326172, -24.01782989501953, -22.813926696777344, -21.610023498535156, -20.40612030029297, -19.20221710205078, -17.998313903808594, -16.794410705566406, -15.590508460998535, -14.386605262756348, -13.182703018188477, -11.978799819946289, -10.774896621704102, -9.570993423461914, -8.367090225219727, -7.1631879806518555, -5.959284782409668, -4.7553815841674805, -3.551478862762451, -2.347576141357422, -1.1436729431152344, 0.06023001670837402, 1.2641329765319824, 2.468035936355591, 3.671938896179199, 4.875842094421387, 6.079744815826416, 7.283647537231445, 8.487550735473633, 9.69145393371582, 10.895357131958008, 12.099259376525879, 13.303162574768066, 14.507065773010254, 15.710968017578125, 16.914871215820312, 18.1187744140625, 19.322677612304688, 20.526580810546875, 21.730484008789062, 22.93438720703125, 24.138290405273438, 25.342191696166992, 26.54609489440918, 27.749998092651367, 28.953901290893555, 30.157804489135742, 31.36170768737793, 32.565608978271484, 33.76951217651367, 34.97341537475586, 36.17731857299805, 37.381221771240234]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 8.0, 10.0, 6.0, 16.0, 14.0, 15.0, 19.0, 29.0, 18.0, 21.0, 21.0, 34.0, 31.0, 34.0, 36.0, 41.0, 58.0, 47.0, 39.0, 38.0, 38.0, 42.0, 45.0, 34.0, 36.0, 31.0, 25.0, 26.0, 29.0, 18.0, 24.0, 19.0, 20.0, 14.0, 10.0, 8.0, 10.0, 7.0, 7.0, 4.0, 2.0, 1.0, 4.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.2109375, -6.971923828125, -6.73291015625, -6.493896484375, -6.2548828125, -6.015869140625, -5.77685546875, -5.537841796875, -5.298828125, -5.059814453125, -4.82080078125, -4.581787109375, -4.3427734375, -4.103759765625, -3.86474609375, -3.625732421875, -3.38671875, -3.147705078125, -2.90869140625, -2.669677734375, -2.4306640625, -2.191650390625, -1.95263671875, -1.713623046875, -1.474609375, -1.235595703125, -0.99658203125, -0.757568359375, -0.5185546875, -0.279541015625, -0.04052734375, 0.198486328125, 0.4375, 0.676513671875, 0.91552734375, 1.154541015625, 1.3935546875, 1.632568359375, 1.87158203125, 2.110595703125, 2.349609375, 2.588623046875, 2.82763671875, 3.066650390625, 3.3056640625, 3.544677734375, 3.78369140625, 4.022705078125, 4.26171875, 4.500732421875, 4.73974609375, 4.978759765625, 5.2177734375, 5.456787109375, 5.69580078125, 5.934814453125, 6.173828125, 6.412841796875, 6.65185546875, 6.890869140625, 7.1298828125, 7.368896484375, 7.60791015625, 7.846923828125, 8.0859375]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 5.0, 11.0, 21.0, 21.0, 24.0, 34.0, 53.0, 75.0, 117.0, 137.0, 192.0, 255.0, 349.0, 538.0, 937.0, 1953.0, 4646.0, 14872.0, 78215.0, 2272957.0, 1737448.0, 59731.0, 12775.0, 4381.0, 1874.0, 907.0, 518.0, 344.0, 244.0, 183.0, 107.0, 84.0, 70.0, 49.0, 35.0, 27.0, 24.0, 20.0, 7.0, 9.0, 10.0, 6.0, 7.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.90625, -26.87060546875, -25.8349609375, -24.79931640625, -23.763671875, -22.72802734375, -21.6923828125, -20.65673828125, -19.62109375, -18.58544921875, -17.5498046875, -16.51416015625, -15.478515625, -14.44287109375, -13.4072265625, -12.37158203125, -11.3359375, -10.30029296875, -9.2646484375, -8.22900390625, -7.193359375, -6.15771484375, -5.1220703125, -4.08642578125, -3.05078125, -2.01513671875, -0.9794921875, 0.05615234375, 1.091796875, 2.12744140625, 3.1630859375, 4.19873046875, 5.234375, 6.27001953125, 7.3056640625, 8.34130859375, 9.376953125, 10.41259765625, 11.4482421875, 12.48388671875, 13.51953125, 14.55517578125, 15.5908203125, 16.62646484375, 17.662109375, 18.69775390625, 19.7333984375, 20.76904296875, 21.8046875, 22.84033203125, 23.8759765625, 24.91162109375, 25.947265625, 26.98291015625, 28.0185546875, 29.05419921875, 30.08984375, 31.12548828125, 32.1611328125, 33.19677734375, 34.232421875, 35.26806640625, 36.3037109375, 37.33935546875, 38.375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 7.0, 15.0, 17.0, 26.0, 39.0, 66.0, 98.0, 178.0, 348.0, 608.0, 858.0, 753.0, 445.0, 238.0, 156.0, 70.0, 52.0, 28.0, 28.0, 15.0, 4.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-28.171875, -27.5126953125, -26.853515625, -26.1943359375, -25.53515625, -24.8759765625, -24.216796875, -23.5576171875, -22.8984375, -22.2392578125, -21.580078125, -20.9208984375, -20.26171875, -19.6025390625, -18.943359375, -18.2841796875, -17.625, -16.9658203125, -16.306640625, -15.6474609375, -14.98828125, -14.3291015625, -13.669921875, -13.0107421875, -12.3515625, -11.6923828125, -11.033203125, -10.3740234375, -9.71484375, -9.0556640625, -8.396484375, -7.7373046875, -7.078125, -6.4189453125, -5.759765625, -5.1005859375, -4.44140625, -3.7822265625, -3.123046875, -2.4638671875, -1.8046875, -1.1455078125, -0.486328125, 0.1728515625, 0.83203125, 1.4912109375, 2.150390625, 2.8095703125, 3.46875, 4.1279296875, 4.787109375, 5.4462890625, 6.10546875, 6.7646484375, 7.423828125, 8.0830078125, 8.7421875, 9.4013671875, 10.060546875, 10.7197265625, 11.37890625, 12.0380859375, 12.697265625, 13.3564453125, 14.015625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 5.0, 0.0, 2.0, 6.0, 4.0, 9.0, 9.0, 11.0, 9.0, 16.0, 15.0, 27.0, 33.0, 47.0, 63.0, 67.0, 79.0, 119.0, 195.0, 294.0, 489.0, 1024.0, 2788.0, 8131.0, 29659.0, 156763.0, 2441680.0, 1414089.0, 105472.0, 22456.0, 6329.0, 2221.0, 912.0, 480.0, 239.0, 135.0, 127.0, 67.0, 46.0, 36.0, 28.0, 27.0, 22.0, 10.0, 18.0, 12.0, 6.0, 3.0, 7.0, 5.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.828125, -18.21875, -17.609375, -17.0, -16.390625, -15.78125, -15.171875, -14.5625, -13.953125, -13.34375, -12.734375, -12.125, -11.515625, -10.90625, -10.296875, -9.6875, -9.078125, -8.46875, -7.859375, -7.25, -6.640625, -6.03125, -5.421875, -4.8125, -4.203125, -3.59375, -2.984375, -2.375, -1.765625, -1.15625, -0.546875, 0.0625, 0.671875, 1.28125, 1.890625, 2.5, 3.109375, 3.71875, 4.328125, 4.9375, 5.546875, 6.15625, 6.765625, 7.375, 7.984375, 8.59375, 9.203125, 9.8125, 10.421875, 11.03125, 11.640625, 12.25, 12.859375, 13.46875, 14.078125, 14.6875, 15.296875, 15.90625, 16.515625, 17.125, 17.734375, 18.34375, 18.953125, 19.5625, 20.171875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 3.0, 6.0, 9.0, 13.0, 13.0, 16.0, 26.0, 34.0, 26.0, 53.0, 67.0, 76.0, 79.0, 89.0, 80.0, 73.0, 71.0, 49.0, 39.0, 47.0, 28.0, 20.0, 17.0, 13.0, 14.0, 12.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-91.79130554199219, -89.21698760986328, -86.64266204833984, -84.06834411621094, -81.4940185546875, -78.9197006225586, -76.34538269042969, -73.77105712890625, -71.19673919677734, -68.62242126464844, -66.048095703125, -63.473777770996094, -60.89945602416992, -58.32513427734375, -55.75081253051758, -53.176490783691406, -50.602169036865234, -48.02784729003906, -45.45352554321289, -42.87920379638672, -40.30488586425781, -37.73056411743164, -35.15624237060547, -32.58192443847656, -30.007600784301758, -27.433279037475586, -24.858959197998047, -22.284637451171875, -19.710315704345703, -17.135995864868164, -14.561674118041992, -11.987354278564453, -9.413032531738281, -6.838711738586426, -4.264390468597412, -1.6900691986083984, 0.884251594543457, 3.4585723876953125, 6.032894134521484, 8.607213973999023, 11.181535720825195, 13.75585651397705, 16.330177307128906, 18.904499053955078, 21.47882080078125, 24.05314064025879, 26.62746238708496, 29.2017822265625, 31.776103973388672, 34.350425720214844, 36.924747467041016, 39.49906921386719, 42.073387145996094, 44.647708892822266, 47.22203063964844, 49.796348571777344, 52.37067413330078, 54.94499588012695, 57.519317626953125, 60.09363555908203, 62.6679573059082, 65.24227905273438, 67.81660461425781, 70.39092254638672, 72.96524047851562]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 9.0, 6.0, 11.0, 12.0, 18.0, 22.0, 29.0, 22.0, 36.0, 37.0, 49.0, 42.0, 54.0, 53.0, 71.0, 62.0, 61.0, 61.0, 49.0, 44.0, 33.0, 40.0, 29.0, 28.0, 23.0, 20.0, 12.0, 13.0, 11.0, 7.0, 8.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-69.92576599121094, -67.708984375, -65.49220275878906, -63.27542495727539, -61.05864715576172, -58.84186553955078, -56.625083923339844, -54.40830612182617, -52.1915283203125, -49.97474670410156, -47.75796890258789, -45.54118728637695, -43.32440948486328, -41.107627868652344, -38.890846252441406, -36.674068450927734, -34.4572868347168, -32.24050521850586, -30.023727416992188, -27.80694580078125, -25.590167999267578, -23.37338638305664, -21.156606674194336, -18.93982696533203, -16.723047256469727, -14.506267547607422, -12.289487838745117, -10.072707176208496, -7.855927467346191, -5.639147758483887, -3.4223670959472656, -1.205587387084961, 1.0111923217773438, 3.2279722690582275, 5.444752216339111, 7.661532402038574, 9.878312110900879, 12.095091819763184, 14.311872482299805, 16.52865219116211, 18.745431900024414, 20.96221160888672, 23.178991317749023, 25.395771026611328, 27.612552642822266, 29.829330444335938, 32.046112060546875, 34.26289367675781, 36.479671478271484, 38.69645309448242, 40.913230895996094, 43.13001251220703, 45.3467903137207, 47.56357192993164, 49.78034973144531, 51.99713134765625, 54.21391296386719, 56.430694580078125, 58.6474723815918, 60.864253997802734, 63.081031799316406, 65.29781341552734, 67.51459503173828, 69.73136901855469, 71.94815063476562]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 7.0, 4.0, 8.0, 11.0, 12.0, 8.0, 11.0, 14.0, 16.0, 25.0, 40.0, 28.0, 32.0, 42.0, 33.0, 32.0, 41.0, 40.0, 27.0, 43.0, 38.0, 32.0, 56.0, 36.0, 36.0, 48.0, 27.0, 35.0, 36.0, 20.0, 25.0, 23.0, 13.0, 20.0, 12.0, 16.0, 7.0, 7.0, 11.0, 4.0, 4.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-96.0, -93.115234375, -90.23046875, -87.345703125, -84.4609375, -81.576171875, -78.69140625, -75.806640625, -72.921875, -70.037109375, -67.15234375, -64.267578125, -61.3828125, -58.498046875, -55.61328125, -52.728515625, -49.84375, -46.958984375, -44.07421875, -41.189453125, -38.3046875, -35.419921875, -32.53515625, -29.650390625, -26.765625, -23.880859375, -20.99609375, -18.111328125, -15.2265625, -12.341796875, -9.45703125, -6.572265625, -3.6875, -0.802734375, 2.08203125, 4.966796875, 7.8515625, 10.736328125, 13.62109375, 16.505859375, 19.390625, 22.275390625, 25.16015625, 28.044921875, 30.9296875, 33.814453125, 36.69921875, 39.583984375, 42.46875, 45.353515625, 48.23828125, 51.123046875, 54.0078125, 56.892578125, 59.77734375, 62.662109375, 65.546875, 68.431640625, 71.31640625, 74.201171875, 77.0859375, 79.970703125, 82.85546875, 85.740234375, 88.625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 7.0, 6.0, 11.0, 18.0, 19.0, 42.0, 51.0, 84.0, 129.0, 193.0, 271.0, 457.0, 654.0, 943.0, 1435.0, 2162.0, 3188.0, 4928.0, 7651.0, 11372.0, 17390.0, 27254.0, 42984.0, 68931.0, 111789.0, 191741.0, 214021.0, 127683.0, 77426.0, 48398.0, 30406.0, 19762.0, 12552.0, 8386.0, 5444.0, 3663.0, 2400.0, 1595.0, 1008.0, 713.0, 471.0, 302.0, 213.0, 148.0, 86.0, 58.0, 41.0, 25.0, 13.0, 17.0, 10.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.1953125, -3.085601806640625, -2.97589111328125, -2.866180419921875, -2.7564697265625, -2.646759033203125, -2.53704833984375, -2.427337646484375, -2.317626953125, -2.207916259765625, -2.09820556640625, -1.988494873046875, -1.8787841796875, -1.769073486328125, -1.65936279296875, -1.549652099609375, -1.43994140625, -1.330230712890625, -1.22052001953125, -1.110809326171875, -1.0010986328125, -0.891387939453125, -0.78167724609375, -0.671966552734375, -0.562255859375, -0.452545166015625, -0.34283447265625, -0.233123779296875, -0.1234130859375, -0.013702392578125, 0.09600830078125, 0.205718994140625, 0.3154296875, 0.425140380859375, 0.53485107421875, 0.644561767578125, 0.7542724609375, 0.863983154296875, 0.97369384765625, 1.083404541015625, 1.193115234375, 1.302825927734375, 1.41253662109375, 1.522247314453125, 1.6319580078125, 1.741668701171875, 1.85137939453125, 1.961090087890625, 2.07080078125, 2.180511474609375, 2.29022216796875, 2.399932861328125, 2.5096435546875, 2.619354248046875, 2.72906494140625, 2.838775634765625, 2.948486328125, 3.058197021484375, 3.16790771484375, 3.277618408203125, 3.3873291015625, 3.497039794921875, 3.60675048828125, 3.716461181640625, 3.826171875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 8.0, 5.0, 9.0, 14.0, 10.0, 16.0, 22.0, 12.0, 17.0, 15.0, 21.0, 29.0, 29.0, 37.0, 36.0, 28.0, 46.0, 33.0, 53.0, 46.0, 1061.0, 33.0, 46.0, 33.0, 41.0, 30.0, 22.0, 39.0, 36.0, 26.0, 23.0, 19.0, 17.0, 15.0, 12.0, 12.0, 14.0, 16.0, 6.0, 12.0, 8.0, 8.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-59.5625, -57.74853515625, -55.9345703125, -54.12060546875, -52.306640625, -50.49267578125, -48.6787109375, -46.86474609375, -45.05078125, -43.23681640625, -41.4228515625, -39.60888671875, -37.794921875, -35.98095703125, -34.1669921875, -32.35302734375, -30.5390625, -28.72509765625, -26.9111328125, -25.09716796875, -23.283203125, -21.46923828125, -19.6552734375, -17.84130859375, -16.02734375, -14.21337890625, -12.3994140625, -10.58544921875, -8.771484375, -6.95751953125, -5.1435546875, -3.32958984375, -1.515625, 0.29833984375, 2.1123046875, 3.92626953125, 5.740234375, 7.55419921875, 9.3681640625, 11.18212890625, 12.99609375, 14.81005859375, 16.6240234375, 18.43798828125, 20.251953125, 22.06591796875, 23.8798828125, 25.69384765625, 27.5078125, 29.32177734375, 31.1357421875, 32.94970703125, 34.763671875, 36.57763671875, 38.3916015625, 40.20556640625, 42.01953125, 43.83349609375, 45.6474609375, 47.46142578125, 49.275390625, 51.08935546875, 52.9033203125, 54.71728515625, 56.53125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 8.0, 12.0, 11.0, 22.0, 16.0, 22.0, 44.0, 74.0, 108.0, 186.0, 248.0, 326.0, 510.0, 771.0, 1062.0, 1602.0, 2297.0, 3635.0, 5236.0, 8196.0, 12743.0, 20532.0, 32601.0, 53416.0, 91772.0, 167776.0, 1303029.0, 161899.0, 88895.0, 52049.0, 32056.0, 19699.0, 12411.0, 7892.0, 5273.0, 3549.0, 2313.0, 1623.0, 1016.0, 701.0, 477.0, 321.0, 231.0, 161.0, 94.0, 76.0, 40.0, 27.0, 33.0, 15.0, 5.0, 5.0, 5.0, 6.0, 4.0, 4.0, 1.0, 3.0], "bins": [-3.01953125, -2.926544189453125, -2.83355712890625, -2.740570068359375, -2.6475830078125, -2.554595947265625, -2.46160888671875, -2.368621826171875, -2.275634765625, -2.182647705078125, -2.08966064453125, -1.996673583984375, -1.9036865234375, -1.810699462890625, -1.71771240234375, -1.624725341796875, -1.53173828125, -1.438751220703125, -1.34576416015625, -1.252777099609375, -1.1597900390625, -1.066802978515625, -0.97381591796875, -0.880828857421875, -0.787841796875, -0.694854736328125, -0.60186767578125, -0.508880615234375, -0.4158935546875, -0.322906494140625, -0.22991943359375, -0.136932373046875, -0.0439453125, 0.049041748046875, 0.14202880859375, 0.235015869140625, 0.3280029296875, 0.420989990234375, 0.51397705078125, 0.606964111328125, 0.699951171875, 0.792938232421875, 0.88592529296875, 0.978912353515625, 1.0718994140625, 1.164886474609375, 1.25787353515625, 1.350860595703125, 1.44384765625, 1.536834716796875, 1.62982177734375, 1.722808837890625, 1.8157958984375, 1.908782958984375, 2.00177001953125, 2.094757080078125, 2.187744140625, 2.280731201171875, 2.37371826171875, 2.466705322265625, 2.5596923828125, 2.652679443359375, 2.74566650390625, 2.838653564453125, 2.931640625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 7.0, 6.0, 6.0, 7.0, 20.0, 23.0, 13.0, 30.0, 49.0, 106.0, 143.0, 154.0, 123.0, 93.0, 66.0, 36.0, 30.0, 15.0, 12.0, 11.0, 7.0, 6.0, 4.0, 3.0, 6.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.006519317626953125, -0.0063405632972717285, -0.006161808967590332, -0.0059830546379089355, -0.005804300308227539, -0.005625545978546143, -0.005446791648864746, -0.00526803731918335, -0.005089282989501953, -0.004910528659820557, -0.00473177433013916, -0.004553020000457764, -0.004374265670776367, -0.004195511341094971, -0.004016757011413574, -0.0038380026817321777, -0.0036592483520507812, -0.0034804940223693848, -0.0033017396926879883, -0.003122985363006592, -0.0029442310333251953, -0.002765476703643799, -0.0025867223739624023, -0.002407968044281006, -0.0022292137145996094, -0.002050459384918213, -0.0018717050552368164, -0.00169295072555542, -0.0015141963958740234, -0.001335442066192627, -0.0011566877365112305, -0.000977933406829834, -0.0007991790771484375, -0.000620424747467041, -0.00044167041778564453, -0.00026291608810424805, -8.416175842285156e-05, 9.459257125854492e-05, 0.0002733469009399414, 0.0004521012306213379, 0.0006308555603027344, 0.0008096098899841309, 0.0009883642196655273, 0.0011671185493469238, 0.0013458728790283203, 0.0015246272087097168, 0.0017033815383911133, 0.0018821358680725098, 0.0020608901977539062, 0.0022396445274353027, 0.0024183988571166992, 0.0025971531867980957, 0.002775907516479492, 0.0029546618461608887, 0.003133416175842285, 0.0033121705055236816, 0.003490924835205078, 0.0036696791648864746, 0.003848433494567871, 0.004027187824249268, 0.004205942153930664, 0.0043846964836120605, 0.004563450813293457, 0.0047422051429748535, 0.00492095947265625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 2.0, 9.0, 8.0, 9.0, 7.0, 18.0, 18.0, 25.0, 38.0, 61.0, 113.0, 205.0, 403.0, 701.0, 1365.0, 2567.0, 5839.0, 14286.0, 41111.0, 159506.0, 614819.0, 144649.0, 38488.0, 13421.0, 5472.0, 2536.0, 1287.0, 699.0, 371.0, 195.0, 102.0, 64.0, 40.0, 27.0, 20.0, 13.0, 9.0, 8.0, 10.0, 8.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.02276611328125, -0.02196645736694336, -0.02116680145263672, -0.020367145538330078, -0.019567489624023438, -0.018767833709716797, -0.017968177795410156, -0.017168521881103516, -0.016368865966796875, -0.015569210052490234, -0.014769554138183594, -0.013969898223876953, -0.013170242309570312, -0.012370586395263672, -0.011570930480957031, -0.01077127456665039, -0.00997161865234375, -0.00917196273803711, -0.008372306823730469, -0.007572650909423828, -0.0067729949951171875, -0.005973339080810547, -0.005173683166503906, -0.004374027252197266, -0.003574371337890625, -0.0027747154235839844, -0.0019750595092773438, -0.0011754035949707031, -0.0003757476806640625, 0.0004239082336425781, 0.0012235641479492188, 0.0020232200622558594, 0.0028228759765625, 0.0036225318908691406, 0.004422187805175781, 0.005221843719482422, 0.0060214996337890625, 0.006821155548095703, 0.007620811462402344, 0.008420467376708984, 0.009220123291015625, 0.010019779205322266, 0.010819435119628906, 0.011619091033935547, 0.012418746948242188, 0.013218402862548828, 0.014018058776855469, 0.01481771469116211, 0.01561737060546875, 0.01641702651977539, 0.01721668243408203, 0.018016338348388672, 0.018815994262695312, 0.019615650177001953, 0.020415306091308594, 0.021214962005615234, 0.022014617919921875, 0.022814273834228516, 0.023613929748535156, 0.024413585662841797, 0.025213241577148438, 0.026012897491455078, 0.02681255340576172, 0.02761220932006836, 0.028411865234375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 2.0, 16.0, 25.0, 23.0, 34.0, 52.0, 64.0, 103.0, 119.0, 117.0, 127.0, 83.0, 52.0, 60.0, 42.0, 12.0, 21.0, 12.0, 11.0, 8.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.006828643381595612, -0.0066714719869196415, -0.006514300592243671, -0.006357129197567701, -0.006199957802891731, -0.006042786408215761, -0.005885615013539791, -0.005728443618863821, -0.005571272224187851, -0.005414100829511881, -0.005256929434835911, -0.005099758040159941, -0.004942586645483971, -0.0047854152508080006, -0.0046282438561320305, -0.00447107246145606, -0.00431390106678009, -0.00415672967210412, -0.00399955827742815, -0.00384238688275218, -0.00368521548807621, -0.00352804409340024, -0.00337087269872427, -0.0032137013040483, -0.0030565294437110424, -0.0028993580490350723, -0.0027421866543591022, -0.002585015259683132, -0.002427843865007162, -0.002270672470331192, -0.002113501075655222, -0.001956329680979252, -0.0017991585191339254, -0.0016419871244579554, -0.0014848157297819853, -0.0013276443351060152, -0.0011704729404300451, -0.001013301545754075, -0.0008561300346627831, -0.0006989586399868131, -0.000541787245310843, -0.0003846158506348729, -0.00022744442685507238, -7.027300307527184e-05, 8.689839160069823e-05, 0.0002440697862766683, 0.0004012412391602993, 0.0005584126338362694, 0.0007155840285122395, 0.0008727554231882095, 0.0010299268178641796, 0.0011870982125401497, 0.0013442696072161198, 0.0015014410018920898, 0.0016586125129833817, 0.0018157839076593518, 0.00197295518592, 0.00213012658059597, 0.0022872979752719402, 0.0024444693699479103, 0.0026016407646238804, 0.0027588121592998505, 0.0029159835539758205, 0.0030731549486517906, 0.0032303265761584044]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 2.0, 2.0, 3.0, 6.0, 5.0, 7.0, 8.0, 13.0, 18.0, 10.0, 10.0, 14.0, 23.0, 21.0, 31.0, 31.0, 39.0, 34.0, 27.0, 36.0, 31.0, 36.0, 35.0, 45.0, 29.0, 28.0, 45.0, 37.0, 37.0, 29.0, 44.0, 34.0, 20.0, 30.0, 25.0, 27.0, 24.0, 16.0, 13.0, 16.0, 9.0, 9.0, 10.0, 5.0, 7.0, 5.0, 6.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.0022095441818237305, -0.0021430132910609245, -0.0020764824002981186, -0.0020099515095353127, -0.0019434206187725067, -0.0018768897280097008, -0.0018103588372468948, -0.001743827946484089, -0.001677297055721283, -0.001610766164958477, -0.001544235274195671, -0.0014777043834328651, -0.0014111734926700592, -0.0013446426019072533, -0.0012781117111444473, -0.0012115808203816414, -0.0011450499296188354, -0.0010785190388560295, -0.0010119881480932236, -0.0009454572573304176, -0.0008789263665676117, -0.0008123954758048058, -0.0007458645850419998, -0.0006793336942791939, -0.0006128028035163879, -0.000546271912753582, -0.00047974102199077606, -0.0004132101312279701, -0.0003466792404651642, -0.00028014834970235825, -0.0002136174589395523, -0.00014708656817674637, -8.055567741394043e-05, -1.4024786651134491e-05, 5.250610411167145e-05, 0.00011903699487447739, 0.00018556788563728333, 0.00025209877640008926, 0.0003186296671628952, 0.00038516055792570114, 0.0004516914486885071, 0.000518222339451313, 0.000584753230214119, 0.0006512841209769249, 0.0007178150117397308, 0.0007843459025025368, 0.0008508767932653427, 0.0009174076840281487, 0.0009839385747909546, 0.0010504694655537605, 0.0011170003563165665, 0.0011835312470793724, 0.0012500621378421783, 0.0013165930286049843, 0.0013831239193677902, 0.0014496548101305962, 0.001516185700893402, 0.001582716591656208, 0.001649247482419014, 0.00171577837318182, 0.0017823092639446259, 0.0018488401547074318, 0.0019153710454702377, 0.0019819019362330437, 0.0020484328269958496]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 7.0, 4.0, 8.0, 11.0, 12.0, 8.0, 11.0, 14.0, 16.0, 25.0, 40.0, 28.0, 32.0, 42.0, 33.0, 32.0, 41.0, 40.0, 27.0, 43.0, 38.0, 33.0, 55.0, 36.0, 36.0, 47.0, 28.0, 35.0, 36.0, 20.0, 25.0, 23.0, 13.0, 20.0, 12.0, 16.0, 6.0, 8.0, 11.0, 4.0, 4.0, 6.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-96.0, -93.115234375, -90.23046875, -87.345703125, -84.4609375, -81.576171875, -78.69140625, -75.806640625, -72.921875, -70.037109375, -67.15234375, -64.267578125, -61.3828125, -58.498046875, -55.61328125, -52.728515625, -49.84375, -46.958984375, -44.07421875, -41.189453125, -38.3046875, -35.419921875, -32.53515625, -29.650390625, -26.765625, -23.880859375, -20.99609375, -18.111328125, -15.2265625, -12.341796875, -9.45703125, -6.572265625, -3.6875, -0.802734375, 2.08203125, 4.966796875, 7.8515625, 10.736328125, 13.62109375, 16.505859375, 19.390625, 22.275390625, 25.16015625, 28.044921875, 30.9296875, 33.814453125, 36.69921875, 39.583984375, 42.46875, 45.353515625, 48.23828125, 51.123046875, 54.0078125, 56.892578125, 59.77734375, 62.662109375, 65.546875, 68.431640625, 71.31640625, 74.201171875, 77.0859375, 79.970703125, 82.85546875, 85.740234375, 88.625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 3.0, 4.0, 6.0, 8.0, 11.0, 12.0, 13.0, 21.0, 20.0, 35.0, 42.0, 57.0, 65.0, 85.0, 127.0, 168.0, 230.0, 398.0, 647.0, 1310.0, 2845.0, 6721.0, 18497.0, 61082.0, 236245.0, 480986.0, 168851.0, 44986.0, 14346.0, 5551.0, 2267.0, 1150.0, 604.0, 368.0, 180.0, 135.0, 97.0, 84.0, 68.0, 47.0, 43.0, 30.0, 24.0, 21.0, 18.0, 14.0, 11.0, 8.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-14.5546875, -14.11865234375, -13.6826171875, -13.24658203125, -12.810546875, -12.37451171875, -11.9384765625, -11.50244140625, -11.06640625, -10.63037109375, -10.1943359375, -9.75830078125, -9.322265625, -8.88623046875, -8.4501953125, -8.01416015625, -7.578125, -7.14208984375, -6.7060546875, -6.27001953125, -5.833984375, -5.39794921875, -4.9619140625, -4.52587890625, -4.08984375, -3.65380859375, -3.2177734375, -2.78173828125, -2.345703125, -1.90966796875, -1.4736328125, -1.03759765625, -0.6015625, -0.16552734375, 0.2705078125, 0.70654296875, 1.142578125, 1.57861328125, 2.0146484375, 2.45068359375, 2.88671875, 3.32275390625, 3.7587890625, 4.19482421875, 4.630859375, 5.06689453125, 5.5029296875, 5.93896484375, 6.375, 6.81103515625, 7.2470703125, 7.68310546875, 8.119140625, 8.55517578125, 8.9912109375, 9.42724609375, 9.86328125, 10.29931640625, 10.7353515625, 11.17138671875, 11.607421875, 12.04345703125, 12.4794921875, 12.91552734375, 13.3515625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 8.0, 13.0, 13.0, 14.0, 25.0, 27.0, 44.0, 51.0, 47.0, 57.0, 68.0, 67.0, 2074.0, 107.0, 58.0, 62.0, 61.0, 68.0, 37.0, 34.0, 30.0, 18.0, 18.0, 8.0, 14.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-233.625, -227.267578125, -220.91015625, -214.552734375, -208.1953125, -201.837890625, -195.48046875, -189.123046875, -182.765625, -176.408203125, -170.05078125, -163.693359375, -157.3359375, -150.978515625, -144.62109375, -138.263671875, -131.90625, -125.548828125, -119.19140625, -112.833984375, -106.4765625, -100.119140625, -93.76171875, -87.404296875, -81.046875, -74.689453125, -68.33203125, -61.974609375, -55.6171875, -49.259765625, -42.90234375, -36.544921875, -30.1875, -23.830078125, -17.47265625, -11.115234375, -4.7578125, 1.599609375, 7.95703125, 14.314453125, 20.671875, 27.029296875, 33.38671875, 39.744140625, 46.1015625, 52.458984375, 58.81640625, 65.173828125, 71.53125, 77.888671875, 84.24609375, 90.603515625, 96.9609375, 103.318359375, 109.67578125, 116.033203125, 122.390625, 128.748046875, 135.10546875, 141.462890625, 147.8203125, 154.177734375, 160.53515625, 166.892578125, 173.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 9.0, 7.0, 4.0, 18.0, 19.0, 41.0, 43.0, 63.0, 85.0, 131.0, 211.0, 355.0, 554.0, 1019.0, 2384.0, 8939.0, 78084.0, 2868548.0, 165138.0, 14049.0, 2969.0, 1252.0, 643.0, 385.0, 238.0, 144.0, 95.0, 72.0, 43.0, 38.0, 32.0, 21.0, 13.0, 10.0, 8.0, 5.0, 5.0, 8.0, 5.0, 3.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.234375, -25.284912109375, -24.33544921875, -23.385986328125, -22.4365234375, -21.487060546875, -20.53759765625, -19.588134765625, -18.638671875, -17.689208984375, -16.73974609375, -15.790283203125, -14.8408203125, -13.891357421875, -12.94189453125, -11.992431640625, -11.04296875, -10.093505859375, -9.14404296875, -8.194580078125, -7.2451171875, -6.295654296875, -5.34619140625, -4.396728515625, -3.447265625, -2.497802734375, -1.54833984375, -0.598876953125, 0.3505859375, 1.300048828125, 2.24951171875, 3.198974609375, 4.1484375, 5.097900390625, 6.04736328125, 6.996826171875, 7.9462890625, 8.895751953125, 9.84521484375, 10.794677734375, 11.744140625, 12.693603515625, 13.64306640625, 14.592529296875, 15.5419921875, 16.491455078125, 17.44091796875, 18.390380859375, 19.33984375, 20.289306640625, 21.23876953125, 22.188232421875, 23.1376953125, 24.087158203125, 25.03662109375, 25.986083984375, 26.935546875, 27.885009765625, 28.83447265625, 29.783935546875, 30.7333984375, 31.682861328125, 32.63232421875, 33.581787109375, 34.53125]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 9.0, 12.0, 17.0, 44.0, 101.0, 260.0, 282.0, 159.0, 52.0, 21.0, 16.0, 8.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-219.9298553466797, -207.06796264648438, -194.20608520507812, -181.34420776367188, -168.48231506347656, -155.62042236328125, -142.758544921875, -129.89666748046875, -117.03477478027344, -104.17288970947266, -91.31100463867188, -78.4491195678711, -65.58723449707031, -52.72534942626953, -39.86346435546875, -27.00157928466797, -14.139694213867188, -1.2778091430664062, 11.584075927734375, 24.445960998535156, 37.30784606933594, 50.16973114013672, 63.0316162109375, 75.89350128173828, 88.75538635253906, 101.61727142333984, 114.47915649414062, 127.3410415649414, 140.2029266357422, 153.0648193359375, 165.92669677734375, 178.78857421875, 191.65045166015625, 204.5123291015625, 217.3742218017578, 230.23611450195312, 243.09799194335938, 255.95986938476562, 268.82177734375, 281.68365478515625, 294.5455322265625, 307.40740966796875, 320.269287109375, 333.1311950683594, 345.9930725097656, 358.8549499511719, 371.71685791015625, 384.5787353515625, 397.44061279296875, 410.302490234375, 423.16436767578125, 436.0262756347656, 448.8881530761719, 461.7500305175781, 474.6119384765625, 487.47381591796875, 500.335693359375, 513.1975708007812, 526.0594482421875, 538.9213256835938, 551.783203125, 564.6451416015625, 577.5070190429688, 590.368896484375, 603.2307739257812]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 5.0, 8.0, 10.0, 18.0, 19.0, 18.0, 8.0, 34.0, 27.0, 36.0, 45.0, 37.0, 50.0, 48.0, 54.0, 74.0, 51.0, 51.0, 50.0, 41.0, 35.0, 35.0, 27.0, 30.0, 40.0, 23.0, 22.0, 14.0, 10.0, 15.0, 14.0, 10.0, 9.0, 5.0, 7.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-209.44200134277344, -202.90267944335938, -196.3633575439453, -189.82403564453125, -183.28469848632812, -176.74537658691406, -170.2060546875, -163.66673278808594, -157.12741088867188, -150.5880889892578, -144.04876708984375, -137.50942993164062, -130.97010803222656, -124.4307861328125, -117.89146423339844, -111.35214233398438, -104.81281280517578, -98.27349090576172, -91.73416137695312, -85.19483947753906, -78.655517578125, -72.11619567871094, -65.57686614990234, -59.03754425048828, -52.49821853637695, -45.958892822265625, -39.41957092285156, -32.880245208740234, -26.34092140197754, -19.801597595214844, -13.262271881103516, -6.722949981689453, -0.183624267578125, 6.3557000160217285, 12.895024299621582, 19.434349060058594, 25.97367286682129, 32.512996673583984, 39.05232238769531, 45.591644287109375, 52.1309700012207, 58.67029571533203, 65.2096176147461, 71.74894714355469, 78.28826904296875, 84.82759094238281, 91.36691284179688, 97.90623474121094, 104.44556427001953, 110.9848861694336, 117.52421569824219, 124.06353759765625, 130.6028594970703, 137.14218139648438, 143.6815185546875, 150.2208251953125, 156.76016235351562, 163.2994842529297, 169.83880615234375, 176.37814331054688, 182.91746520996094, 189.456787109375, 195.99610900878906, 202.53543090820312, 209.0747528076172]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 9.0, 17.0, 21.0, 27.0, 37.0, 60.0, 81.0, 96.0, 154.0, 156.0, 223.0, 358.0, 920.0, 3063.0, 18819.0, 1019169.0, 3162.0, 864.0, 385.0, 252.0, 173.0, 121.0, 107.0, 74.0, 51.0, 48.0, 32.0, 15.0, 23.0, 11.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.69109344482422, -59.22428512573242, -56.757476806640625, -54.29066848754883, -51.82386016845703, -49.357051849365234, -46.89024353027344, -44.42343521118164, -41.956626892089844, -39.48981857299805, -37.02301025390625, -34.55620193481445, -32.089393615722656, -29.62258529663086, -27.155776977539062, -24.688968658447266, -22.22216033935547, -19.755352020263672, -17.288543701171875, -14.821735382080078, -12.354927062988281, -9.888118743896484, -7.4213104248046875, -4.954502105712891, -2.4876937866210938, -0.020885467529296875, 2.4459228515625, 4.912731170654297, 7.379539489746094, 9.84634780883789, 12.313156127929688, 14.779964447021484, 17.246780395507812, 19.71358871459961, 22.180397033691406, 24.647205352783203, 27.114013671875, 29.580821990966797, 32.047630310058594, 34.51443862915039, 36.98124694824219, 39.448055267333984, 41.91486358642578, 44.38167190551758, 46.848480224609375, 49.31528854370117, 51.78209686279297, 54.248905181884766, 56.71571350097656, 59.18252182006836, 61.649330139160156, 64.11613464355469, 66.58294677734375, 69.04975891113281, 71.51656341552734, 73.98336791992188, 76.45018005371094, 78.9169921875, 81.38379669189453, 83.85060119628906, 86.31741333007812, 88.78422546386719, 91.25102996826172, 93.71783447265625, 96.18464660644531]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 3.0, 12.0, 12.0, 23.0, 44.0, 75.0, 98.0, 264.0, 51461152.0, 1280.0, 87.0, 48.0, 13.0, 12.0, 14.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1333.872802734375, -1262.6396484375, -1191.4066162109375, -1120.1734619140625, -1048.9404296875, -977.707275390625, -906.47412109375, -835.2410278320312, -764.0079345703125, -692.7748413085938, -621.541748046875, -550.30859375, -479.07550048828125, -407.8424072265625, -336.6092834472656, -265.37615966796875, -194.14306640625, -122.90995788574219, -51.676849365234375, 19.556259155273438, 90.78936767578125, 162.0224609375, 233.25558471679688, 304.48870849609375, 375.7218017578125, 446.95489501953125, 518.18798828125, 589.421142578125, 660.6542358398438, 731.8873291015625, 803.1204833984375, 874.3535766601562, 945.5869140625, 1016.8200073242188, 1088.0531005859375, 1159.2862548828125, 1230.519287109375, 1301.75244140625, 1372.985595703125, 1444.21875, 1515.4517822265625, 1586.6849365234375, 1657.91796875, 1729.151123046875, 1800.38427734375, 1871.6173095703125, 1942.8504638671875, 2014.08349609375, 2085.316650390625, 2156.5498046875, 2227.782958984375, 2299.015869140625, 2370.2490234375, 2441.482177734375, 2512.71533203125, 2583.948486328125, 2655.181640625, 2726.414794921875, 2797.64794921875, 2868.880859375, 2940.114013671875, 3011.34716796875, 3082.580322265625, 3153.8134765625, 3225.04638671875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [5.0, 2.0, 9.0, 17.0, 13.0, 28.0, 45.0, 87.0, 130.0, 171.0, 287.0, 404.0, 513.0, 792.0, 1142.0, 1736.0, 2455.0, 3389.0, 4951.0, 7019.0, 10164.0, 13943.0, 19905.0, 28626.0, 42515.0, 61402.0, 90923.0, 136972.0, 212281.0, 339661.0, 753858.0, 3516213.0, 365068.0, 226110.0, 146436.0, 96844.0, 65054.0, 43158.0, 29787.0, 20764.0, 14106.0, 10249.0, 7402.0, 5136.0, 3564.0, 2483.0, 1731.0, 1351.0, 875.0, 566.0, 368.0, 241.0, 176.0, 106.0, 76.0, 54.0, 28.0, 24.0, 21.0, 7.0, 3.0, 2.0, 4.0, 4.0], "bins": [-0.84765625, -0.82037353515625, -0.7930908203125, -0.76580810546875, -0.738525390625, -0.71124267578125, -0.6839599609375, -0.65667724609375, -0.62939453125, -0.60211181640625, -0.5748291015625, -0.54754638671875, -0.520263671875, -0.49298095703125, -0.4656982421875, -0.43841552734375, -0.4111328125, -0.38385009765625, -0.3565673828125, -0.32928466796875, -0.302001953125, -0.27471923828125, -0.2474365234375, -0.22015380859375, -0.19287109375, -0.16558837890625, -0.1383056640625, -0.11102294921875, -0.083740234375, -0.05645751953125, -0.0291748046875, -0.00189208984375, 0.025390625, 0.05267333984375, 0.0799560546875, 0.10723876953125, 0.134521484375, 0.16180419921875, 0.1890869140625, 0.21636962890625, 0.24365234375, 0.27093505859375, 0.2982177734375, 0.32550048828125, 0.352783203125, 0.38006591796875, 0.4073486328125, 0.43463134765625, 0.4619140625, 0.48919677734375, 0.5164794921875, 0.54376220703125, 0.571044921875, 0.59832763671875, 0.6256103515625, 0.65289306640625, 0.68017578125, 0.70745849609375, 0.7347412109375, 0.76202392578125, 0.789306640625, 0.81658935546875, 0.8438720703125, 0.87115478515625, 0.8984375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 6.0, 8.0, 6.0, 8.0, 8.0, 9.0, 16.0, 13.0, 24.0, 21.0, 25.0, 30.0, 29.0, 31.0, 38.0, 26.0, 35.0, 43.0, 44.0, 39.0, 1050.0, 59.0, 38.0, 45.0, 34.0, 34.0, 43.0, 27.0, 30.0, 27.0, 28.0, 26.0, 24.0, 14.0, 15.0, 10.0, 10.0, 10.0, 9.0, 1.0, 9.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-21.296875, -20.601806640625, -19.90673828125, -19.211669921875, -18.5166015625, -17.821533203125, -17.12646484375, -16.431396484375, -15.736328125, -15.041259765625, -14.34619140625, -13.651123046875, -12.9560546875, -12.260986328125, -11.56591796875, -10.870849609375, -10.17578125, -9.480712890625, -8.78564453125, -8.090576171875, -7.3955078125, -6.700439453125, -6.00537109375, -5.310302734375, -4.615234375, -3.920166015625, -3.22509765625, -2.530029296875, -1.8349609375, -1.139892578125, -0.44482421875, 0.250244140625, 0.9453125, 1.640380859375, 2.33544921875, 3.030517578125, 3.7255859375, 4.420654296875, 5.11572265625, 5.810791015625, 6.505859375, 7.200927734375, 7.89599609375, 8.591064453125, 9.2861328125, 9.981201171875, 10.67626953125, 11.371337890625, 12.06640625, 12.761474609375, 13.45654296875, 14.151611328125, 14.8466796875, 15.541748046875, 16.23681640625, 16.931884765625, 17.626953125, 18.322021484375, 19.01708984375, 19.712158203125, 20.4072265625, 21.102294921875, 21.79736328125, 22.492431640625, 23.1875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [7.0, 16.0, 16.0, 20.0, 29.0, 38.0, 68.0, 103.0, 137.0, 211.0, 264.0, 437.0, 676.0, 804.0, 1109.0, 1705.0, 2428.0, 3487.0, 5093.0, 7185.0, 10734.0, 14955.0, 21819.0, 31267.0, 45911.0, 66778.0, 98442.0, 147554.0, 223210.0, 337975.0, 768068.0, 3425171.0, 356987.0, 233995.0, 155807.0, 103673.0, 69706.0, 47731.0, 33269.0, 22777.0, 15642.0, 10829.0, 7406.0, 5422.0, 3779.0, 2746.0, 1847.0, 1249.0, 875.0, 642.0, 382.0, 301.0, 194.0, 145.0, 98.0, 93.0, 45.0, 43.0, 15.0, 9.0, 13.0, 10.0, 6.0, 3.0], "bins": [-0.66552734375, -0.64410400390625, -0.6226806640625, -0.60125732421875, -0.579833984375, -0.55841064453125, -0.5369873046875, -0.51556396484375, -0.494140625, -0.47271728515625, -0.4512939453125, -0.42987060546875, -0.408447265625, -0.38702392578125, -0.3656005859375, -0.34417724609375, -0.32275390625, -0.30133056640625, -0.2799072265625, -0.25848388671875, -0.237060546875, -0.21563720703125, -0.1942138671875, -0.17279052734375, -0.1513671875, -0.12994384765625, -0.1085205078125, -0.08709716796875, -0.065673828125, -0.04425048828125, -0.0228271484375, -0.00140380859375, 0.02001953125, 0.04144287109375, 0.0628662109375, 0.08428955078125, 0.105712890625, 0.12713623046875, 0.1485595703125, 0.16998291015625, 0.19140625, 0.21282958984375, 0.2342529296875, 0.25567626953125, 0.277099609375, 0.29852294921875, 0.3199462890625, 0.34136962890625, 0.36279296875, 0.38421630859375, 0.4056396484375, 0.42706298828125, 0.448486328125, 0.46990966796875, 0.4913330078125, 0.51275634765625, 0.5341796875, 0.55560302734375, 0.5770263671875, 0.59844970703125, 0.619873046875, 0.64129638671875, 0.6627197265625, 0.68414306640625, 0.70556640625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 2.0, 5.0, 7.0, 10.0, 13.0, 9.0, 17.0, 10.0, 20.0, 11.0, 21.0, 23.0, 19.0, 28.0, 26.0, 36.0, 38.0, 38.0, 42.0, 34.0, 25.0, 43.0, 1054.0, 34.0, 32.0, 51.0, 41.0, 29.0, 39.0, 26.0, 31.0, 32.0, 23.0, 24.0, 25.0, 9.0, 17.0, 10.0, 17.0, 12.0, 14.0, 9.0, 5.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-16.671875, -16.157470703125, -15.64306640625, -15.128662109375, -14.6142578125, -14.099853515625, -13.58544921875, -13.071044921875, -12.556640625, -12.042236328125, -11.52783203125, -11.013427734375, -10.4990234375, -9.984619140625, -9.47021484375, -8.955810546875, -8.44140625, -7.927001953125, -7.41259765625, -6.898193359375, -6.3837890625, -5.869384765625, -5.35498046875, -4.840576171875, -4.326171875, -3.811767578125, -3.29736328125, -2.782958984375, -2.2685546875, -1.754150390625, -1.23974609375, -0.725341796875, -0.2109375, 0.303466796875, 0.81787109375, 1.332275390625, 1.8466796875, 2.361083984375, 2.87548828125, 3.389892578125, 3.904296875, 4.418701171875, 4.93310546875, 5.447509765625, 5.9619140625, 6.476318359375, 6.99072265625, 7.505126953125, 8.01953125, 8.533935546875, 9.04833984375, 9.562744140625, 10.0771484375, 10.591552734375, 11.10595703125, 11.620361328125, 12.134765625, 12.649169921875, 13.16357421875, 13.677978515625, 14.1923828125, 14.706787109375, 15.22119140625, 15.735595703125, 16.25]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 5.0, 2.0, 6.0, 2.0, 5.0, 5.0, 17.0, 20.0, 14.0, 23.0, 15.0, 41.0, 47.0, 75.0, 99.0, 97.0, 134.0, 204.0, 203.0, 307.0, 413.0, 631.0, 947.0, 1550.0, 2538.0, 4273.0, 8225.0, 16822.0, 37119.0, 101221.0, 5776834.0, 215639.0, 68114.0, 26859.0, 12834.0, 6280.0, 3679.0, 1961.0, 1203.0, 834.0, 548.0, 371.0, 271.0, 244.0, 171.0, 86.0, 100.0, 54.0, 64.0, 51.0, 33.0, 42.0, 47.0, 21.0, 10.0, 10.0, 6.0, 7.0, 7.0, 3.0, 3.0], "bins": [-2.728515625, -2.6478271484375, -2.567138671875, -2.4864501953125, -2.40576171875, -2.3250732421875, -2.244384765625, -2.1636962890625, -2.0830078125, -2.0023193359375, -1.921630859375, -1.8409423828125, -1.76025390625, -1.6795654296875, -1.598876953125, -1.5181884765625, -1.4375, -1.3568115234375, -1.276123046875, -1.1954345703125, -1.11474609375, -1.0340576171875, -0.953369140625, -0.8726806640625, -0.7919921875, -0.7113037109375, -0.630615234375, -0.5499267578125, -0.46923828125, -0.3885498046875, -0.307861328125, -0.2271728515625, -0.146484375, -0.0657958984375, 0.014892578125, 0.0955810546875, 0.17626953125, 0.2569580078125, 0.337646484375, 0.4183349609375, 0.4990234375, 0.5797119140625, 0.660400390625, 0.7410888671875, 0.82177734375, 0.9024658203125, 0.983154296875, 1.0638427734375, 1.14453125, 1.2252197265625, 1.305908203125, 1.3865966796875, 1.46728515625, 1.5479736328125, 1.628662109375, 1.7093505859375, 1.7900390625, 1.8707275390625, 1.951416015625, 2.0321044921875, 2.11279296875, 2.1934814453125, 2.274169921875, 2.3548583984375, 2.435546875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 6.0, 5.0, 6.0, 6.0, 10.0, 4.0, 16.0, 22.0, 14.0, 15.0, 21.0, 22.0, 17.0, 27.0, 24.0, 31.0, 31.0, 40.0, 38.0, 36.0, 28.0, 33.0, 445.0, 649.0, 27.0, 41.0, 30.0, 35.0, 37.0, 33.0, 33.0, 30.0, 22.0, 21.0, 13.0, 15.0, 19.0, 18.0, 21.0, 19.0, 13.0, 13.0, 6.0, 4.0, 7.0, 7.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-11.8046875, -11.43603515625, -11.0673828125, -10.69873046875, -10.330078125, -9.96142578125, -9.5927734375, -9.22412109375, -8.85546875, -8.48681640625, -8.1181640625, -7.74951171875, -7.380859375, -7.01220703125, -6.6435546875, -6.27490234375, -5.90625, -5.53759765625, -5.1689453125, -4.80029296875, -4.431640625, -4.06298828125, -3.6943359375, -3.32568359375, -2.95703125, -2.58837890625, -2.2197265625, -1.85107421875, -1.482421875, -1.11376953125, -0.7451171875, -0.37646484375, -0.0078125, 0.36083984375, 0.7294921875, 1.09814453125, 1.466796875, 1.83544921875, 2.2041015625, 2.57275390625, 2.94140625, 3.31005859375, 3.6787109375, 4.04736328125, 4.416015625, 4.78466796875, 5.1533203125, 5.52197265625, 5.890625, 6.25927734375, 6.6279296875, 6.99658203125, 7.365234375, 7.73388671875, 8.1025390625, 8.47119140625, 8.83984375, 9.20849609375, 9.5771484375, 9.94580078125, 10.314453125, 10.68310546875, 11.0517578125, 11.42041015625, 11.7890625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 9.0, 7.0, 31.0, 61.0, 147.0, 468.0, 173.0, 63.0, 20.0, 14.0, 7.0, 5.0, 4.0, 1.0], "bins": [-115.35600280761719, -113.27873992919922, -111.20148468017578, -109.12422180175781, -107.04696655273438, -104.9697036743164, -102.89244842529297, -100.815185546875, -98.73793029785156, -96.6606674194336, -94.58341217041016, -92.50614929199219, -90.42889404296875, -88.35163116455078, -86.27437591552734, -84.19711303710938, -82.11985778808594, -80.04259490966797, -77.96533966064453, -75.88807678222656, -73.81082153320312, -71.73355865478516, -69.65630340576172, -67.57904052734375, -65.50177764892578, -63.42451858520508, -61.347259521484375, -59.27000045776367, -57.19274139404297, -55.115482330322266, -53.03822326660156, -50.960960388183594, -48.88370895385742, -46.80644989013672, -44.729190826416016, -42.65193176269531, -40.57467269897461, -38.497413635253906, -36.42015075683594, -34.3428955078125, -32.26563262939453, -30.188373565673828, -28.111114501953125, -26.033855438232422, -23.95659637451172, -21.879337310791016, -19.80207633972168, -17.724817276000977, -15.647560119628906, -13.570301055908203, -11.4930419921875, -9.41578197479248, -7.338522911071777, -5.261263847351074, -3.1840038299560547, -1.1067447662353516, 0.9705142974853516, 3.047773599624634, 5.125032901763916, 7.202292442321777, 9.27955150604248, 11.356810569763184, 13.434070587158203, 15.511329650878906, 17.58858871459961]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 8.0, 10.0, 9.0, 17.0, 8.0, 21.0, 20.0, 24.0, 25.0, 31.0, 23.0, 30.0, 28.0, 48.0, 34.0, 35.0, 39.0, 45.0, 37.0, 46.0, 44.0, 27.0, 41.0, 50.0, 26.0, 34.0, 34.0, 33.0, 24.0, 28.0, 13.0, 16.0, 13.0, 18.0, 11.0, 7.0, 8.0, 8.0, 4.0, 1.0, 5.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.787487030029297, -25.029155731201172, -24.270824432373047, -23.512493133544922, -22.754161834716797, -21.995830535888672, -21.237499237060547, -20.479167938232422, -19.720836639404297, -18.962505340576172, -18.204174041748047, -17.445842742919922, -16.687511444091797, -15.929180145263672, -15.170848846435547, -14.412517547607422, -13.65418529510498, -12.895853996276855, -12.13752269744873, -11.379191398620605, -10.62086009979248, -9.862528800964355, -9.104196548461914, -8.345865249633789, -7.587534427642822, -6.829203128814697, -6.070871829986572, -5.312540054321289, -4.554208755493164, -3.795877695083618, -3.037546157836914, -2.279214859008789, -1.520883560180664, -0.7625522017478943, -0.004220843315124512, 0.75411057472229, 1.512441873550415, 2.27077317237854, 3.029104709625244, 3.787436008453369, 4.545767307281494, 5.304098606109619, 6.062429904937744, 6.820761680603027, 7.579092979431152, 8.337424278259277, 9.095755577087402, 9.854086875915527, 10.612418174743652, 11.370749473571777, 12.129080772399902, 12.887412071228027, 13.645743370056152, 14.404074668884277, 15.162406921386719, 15.920738220214844, 16.67906951904297, 17.437400817871094, 18.19573211669922, 18.954063415527344, 19.71239471435547, 20.470726013183594, 21.22905731201172, 21.987388610839844, 22.74571990966797]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 9.0, 13.0, 15.0, 19.0, 20.0, 23.0, 43.0, 57.0, 70.0, 87.0, 140.0, 240.0, 391.0, 576.0, 964.0, 1828.0, 3782.0, 18009.0, 4025695.0, 129534.0, 7183.0, 2289.0, 1217.0, 665.0, 413.0, 285.0, 178.0, 143.0, 93.0, 62.0, 55.0, 33.0, 30.0, 26.0, 28.0, 16.0, 9.0, 11.0, 7.0, 8.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.289794921875, -0.28006744384765625, -0.2703399658203125, -0.26061248779296875, -0.250885009765625, -0.24115753173828125, -0.2314300537109375, -0.22170257568359375, -0.21197509765625, -0.20224761962890625, -0.1925201416015625, -0.18279266357421875, -0.173065185546875, -0.16333770751953125, -0.1536102294921875, -0.14388275146484375, -0.1341552734375, -0.12442779541015625, -0.1147003173828125, -0.10497283935546875, -0.095245361328125, -0.08551788330078125, -0.0757904052734375, -0.06606292724609375, -0.05633544921875, -0.04660797119140625, -0.0368804931640625, -0.02715301513671875, -0.017425537109375, -0.00769805908203125, 0.0020294189453125, 0.01175689697265625, 0.021484375, 0.03121185302734375, 0.0409393310546875, 0.05066680908203125, 0.060394287109375, 0.07012176513671875, 0.0798492431640625, 0.08957672119140625, 0.09930419921875, 0.10903167724609375, 0.1187591552734375, 0.12848663330078125, 0.138214111328125, 0.14794158935546875, 0.1576690673828125, 0.16739654541015625, 0.1771240234375, 0.18685150146484375, 0.1965789794921875, 0.20630645751953125, 0.216033935546875, 0.22576141357421875, 0.2354888916015625, 0.24521636962890625, 0.25494384765625, 0.26467132568359375, 0.2743988037109375, 0.28412628173828125, 0.293853759765625, 0.30358123779296875, 0.3133087158203125, 0.32303619384765625, 0.332763671875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 8.0, 5.0, 5.0, 6.0, 13.0, 10.0, 10.0, 12.0, 13.0, 22.0, 782.0, 26.0, 15.0, 14.0, 12.0, 9.0, 5.0, 3.0, 5.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09613037109375, -0.09288215637207031, -0.08963394165039062, -0.08638572692871094, -0.08313751220703125, -0.07988929748535156, -0.07664108276367188, -0.07339286804199219, -0.0701446533203125, -0.06689643859863281, -0.06364822387695312, -0.06040000915527344, -0.05715179443359375, -0.05390357971191406, -0.050655364990234375, -0.04740715026855469, -0.044158935546875, -0.04091072082519531, -0.037662506103515625, -0.03441429138183594, -0.03116607666015625, -0.027917861938476562, -0.024669647216796875, -0.021421432495117188, -0.0181732177734375, -0.014925003051757812, -0.011676788330078125, -0.008428573608398438, -0.00518035888671875, -0.0019321441650390625, 0.001316070556640625, 0.0045642852783203125, 0.0078125, 0.011060714721679688, 0.014308929443359375, 0.017557144165039062, 0.02080535888671875, 0.024053573608398438, 0.027301788330078125, 0.030550003051757812, 0.0337982177734375, 0.03704643249511719, 0.040294647216796875, 0.04354286193847656, 0.04679107666015625, 0.05003929138183594, 0.053287506103515625, 0.05653572082519531, 0.059783935546875, 0.06303215026855469, 0.06628036499023438, 0.06952857971191406, 0.07277679443359375, 0.07602500915527344, 0.07927322387695312, 0.08252143859863281, 0.0857696533203125, 0.08901786804199219, 0.09226608276367188, 0.09551429748535156, 0.09876251220703125, 0.10201072692871094, 0.10525894165039062, 0.10850715637207031, 0.11175537109375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 8.0, 4.0, 3.0, 3.0, 16.0, 16.0, 16.0, 38.0, 46.0, 73.0, 120.0, 180.0, 235.0, 373.0, 567.0, 828.0, 1441.0, 2416.0, 4057.0, 7212.0, 14375.0, 33102.0, 132246.0, 3650657.0, 261356.0, 45835.0, 18258.0, 8897.0, 4712.0, 2707.0, 1643.0, 961.0, 636.0, 403.0, 261.0, 185.0, 140.0, 81.0, 59.0, 27.0, 32.0, 27.0, 9.0, 9.0, 12.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.22607421875, -0.219146728515625, -0.21221923828125, -0.205291748046875, -0.1983642578125, -0.191436767578125, -0.18450927734375, -0.177581787109375, -0.170654296875, -0.163726806640625, -0.15679931640625, -0.149871826171875, -0.1429443359375, -0.136016845703125, -0.12908935546875, -0.122161865234375, -0.115234375, -0.108306884765625, -0.10137939453125, -0.094451904296875, -0.0875244140625, -0.080596923828125, -0.07366943359375, -0.066741943359375, -0.059814453125, -0.052886962890625, -0.04595947265625, -0.039031982421875, -0.0321044921875, -0.025177001953125, -0.01824951171875, -0.011322021484375, -0.00439453125, 0.002532958984375, 0.00946044921875, 0.016387939453125, 0.0233154296875, 0.030242919921875, 0.03717041015625, 0.044097900390625, 0.051025390625, 0.057952880859375, 0.06488037109375, 0.071807861328125, 0.0787353515625, 0.085662841796875, 0.09259033203125, 0.099517822265625, 0.1064453125, 0.113372802734375, 0.12030029296875, 0.127227783203125, 0.1341552734375, 0.141082763671875, 0.14801025390625, 0.154937744140625, 0.161865234375, 0.168792724609375, 0.17572021484375, 0.182647705078125, 0.1895751953125, 0.196502685546875, 0.20343017578125, 0.210357666015625, 0.21728515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 8.0, 11.0, 10.0, 10.0, 15.0, 13.0, 22.0, 29.0, 47.0, 73.0, 195.0, 751.0, 1956.0, 514.0, 149.0, 74.0, 35.0, 35.0, 20.0, 21.0, 18.0, 20.0, 8.0, 8.0, 5.0, 2.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1275634765625, -0.12290191650390625, -0.1182403564453125, -0.11357879638671875, -0.108917236328125, -0.10425567626953125, -0.0995941162109375, -0.09493255615234375, -0.09027099609375, -0.08560943603515625, -0.0809478759765625, -0.07628631591796875, -0.071624755859375, -0.06696319580078125, -0.0623016357421875, -0.05764007568359375, -0.052978515625, -0.04831695556640625, -0.0436553955078125, -0.03899383544921875, -0.034332275390625, -0.02967071533203125, -0.0250091552734375, -0.02034759521484375, -0.01568603515625, -0.01102447509765625, -0.0063629150390625, -0.00170135498046875, 0.002960205078125, 0.00762176513671875, 0.0122833251953125, 0.01694488525390625, 0.0216064453125, 0.02626800537109375, 0.0309295654296875, 0.03559112548828125, 0.040252685546875, 0.04491424560546875, 0.0495758056640625, 0.05423736572265625, 0.05889892578125, 0.06356048583984375, 0.0682220458984375, 0.07288360595703125, 0.077545166015625, 0.08220672607421875, 0.0868682861328125, 0.09152984619140625, 0.09619140625, 0.10085296630859375, 0.1055145263671875, 0.11017608642578125, 0.114837646484375, 0.11949920654296875, 0.1241607666015625, 0.12882232666015625, 0.13348388671875, 0.13814544677734375, 0.1428070068359375, 0.14746856689453125, 0.152130126953125, 0.15679168701171875, 0.1614532470703125, 0.16611480712890625, 0.1707763671875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 8.0, 5.0, 19.0, 43.0, 149.0, 480.0, 193.0, 54.0, 26.0, 16.0, 8.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7148686647415161, -0.6844812035560608, -0.6540937423706055, -0.6237062215805054, -0.59331876039505, -0.5629312992095947, -0.5325438380241394, -0.5021563768386841, -0.47176891565322876, -0.44138145446777344, -0.4109939634799957, -0.3806065022945404, -0.3502190411090851, -0.3198315501213074, -0.28944408893585205, -0.25905662775039673, -0.22866913676261902, -0.1982816606760025, -0.16789419949054718, -0.13750672340393066, -0.10711925476789474, -0.07673178613185883, -0.04634431004524231, -0.015956848859786987, 0.014430627226829529, 0.04481809586286545, 0.07520556449890137, 0.10559304058551788, 0.1359805166721344, 0.16636797785758972, 0.19675545394420624, 0.22714291512966156, 0.2575303912162781, 0.2879178524017334, 0.3183053433895111, 0.34869280457496643, 0.37908026576042175, 0.40946775674819946, 0.4398552179336548, 0.4702426791191101, 0.5006301403045654, 0.5310176014900208, 0.5614050626754761, 0.5917925834655762, 0.6221800446510315, 0.6525675058364868, 0.6829549670219421, 0.7133424282073975, 0.7437299489974976, 0.7741174101829529, 0.8045048713684082, 0.8348923921585083, 0.8652798533439636, 0.895667314529419, 0.9260547757148743, 0.9564422369003296, 0.9868296980857849, 1.0172171592712402, 1.0476046800613403, 1.0779920816421509, 1.108379602432251, 1.1387670040130615, 1.1691545248031616, 1.1995420455932617, 1.2299294471740723]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 6.0, 8.0, 19.0, 23.0, 15.0, 32.0, 43.0, 51.0, 43.0, 54.0, 50.0, 54.0, 71.0, 61.0, 66.0, 54.0, 51.0, 53.0, 46.0, 42.0, 28.0, 21.0, 21.0, 15.0, 18.0, 17.0, 5.0, 8.0, 8.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53624027967453, -0.5210390686988831, -0.5058379173278809, -0.4906367063522339, -0.4754355251789093, -0.4602343440055847, -0.44503316283226013, -0.42983198165893555, -0.4146307706832886, -0.399429589509964, -0.3842284083366394, -0.36902719736099243, -0.35382601618766785, -0.33862483501434326, -0.3234236538410187, -0.3082224726676941, -0.2930212616920471, -0.27782008051872253, -0.26261889934539795, -0.24741770327091217, -0.2322165071964264, -0.2170153260231018, -0.20181414484977722, -0.18661294877529144, -0.17141178250312805, -0.15621060132980347, -0.1410094052553177, -0.1258082240819931, -0.11060702800750732, -0.09540584683418274, -0.08020465821027756, -0.06500346958637238, -0.0498022735118866, -0.034601084887981415, -0.019399898126721382, -0.0041987113654613495, 0.011002477258443832, 0.026203662157058716, 0.0414048507809639, 0.05660603940486908, 0.07180722802877426, 0.08700841665267944, 0.10220960527658463, 0.11741079390048981, 0.1326119750738144, 0.14781317114830017, 0.16301435232162476, 0.17821553349494934, 0.19341672956943512, 0.2086179107427597, 0.22381910681724548, 0.23902028799057007, 0.25422146916389465, 0.26942265033721924, 0.2846238613128662, 0.2998250424861908, 0.3150262236595154, 0.33022740483283997, 0.34542858600616455, 0.3606297969818115, 0.3758309781551361, 0.3910321593284607, 0.4062333405017853, 0.42143452167510986, 0.43663573265075684]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 1.0, 8.0, 8.0, 8.0, 13.0, 21.0, 29.0, 33.0, 62.0, 86.0, 96.0, 147.0, 184.0, 280.0, 419.0, 635.0, 979.0, 1560.0, 2650.0, 4553.0, 8565.0, 18704.0, 56461.0, 892865.0, 31630.0, 12860.0, 6220.0, 3574.0, 2017.0, 1229.0, 855.0, 565.0, 368.0, 297.0, 172.0, 122.0, 82.0, 59.0, 59.0, 16.0, 18.0, 16.0, 12.0, 10.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43994140625, -0.42671966552734375, -0.4134979248046875, -0.40027618408203125, -0.387054443359375, -0.37383270263671875, -0.3606109619140625, -0.34738922119140625, -0.33416748046875, -0.32094573974609375, -0.3077239990234375, -0.29450225830078125, -0.281280517578125, -0.26805877685546875, -0.2548370361328125, -0.24161529541015625, -0.2283935546875, -0.21517181396484375, -0.2019500732421875, -0.18872833251953125, -0.175506591796875, -0.16228485107421875, -0.1490631103515625, -0.13584136962890625, -0.12261962890625, -0.10939788818359375, -0.0961761474609375, -0.08295440673828125, -0.069732666015625, -0.05651092529296875, -0.0432891845703125, -0.03006744384765625, -0.016845703125, -0.00362396240234375, 0.0095977783203125, 0.02281951904296875, 0.036041259765625, 0.04926300048828125, 0.0624847412109375, 0.07570648193359375, 0.08892822265625, 0.10214996337890625, 0.1153717041015625, 0.12859344482421875, 0.141815185546875, 0.15503692626953125, 0.1682586669921875, 0.18148040771484375, 0.1947021484375, 0.20792388916015625, 0.2211456298828125, 0.23436737060546875, 0.247589111328125, 0.26081085205078125, 0.2740325927734375, 0.28725433349609375, 0.30047607421875, 0.31369781494140625, 0.3269195556640625, 0.34014129638671875, 0.353363037109375, 0.36658477783203125, 0.3798065185546875, 0.39302825927734375, 0.40625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 6.0, 6.0, 8.0, 6.0, 5.0, 4.0, 17.0, 9.0, 12.0, 14.0, 15.0, 136.0, 670.0, 18.0, 16.0, 14.0, 9.0, 6.0, 5.0, 3.0, 6.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09716796875, -0.09394454956054688, -0.09072113037109375, -0.08749771118164062, -0.0842742919921875, -0.08105087280273438, -0.07782745361328125, -0.07460403442382812, -0.071380615234375, -0.06815719604492188, -0.06493377685546875, -0.061710357666015625, -0.0584869384765625, -0.055263519287109375, -0.05204010009765625, -0.048816680908203125, -0.04559326171875, -0.042369842529296875, -0.03914642333984375, -0.035923004150390625, -0.0326995849609375, -0.029476165771484375, -0.02625274658203125, -0.023029327392578125, -0.019805908203125, -0.016582489013671875, -0.01335906982421875, -0.010135650634765625, -0.0069122314453125, -0.003688812255859375, -0.00046539306640625, 0.002758026123046875, 0.0059814453125, 0.009204864501953125, 0.01242828369140625, 0.015651702880859375, 0.0188751220703125, 0.022098541259765625, 0.02532196044921875, 0.028545379638671875, 0.031768798828125, 0.034992218017578125, 0.03821563720703125, 0.041439056396484375, 0.0446624755859375, 0.047885894775390625, 0.05110931396484375, 0.054332733154296875, 0.05755615234375, 0.060779571533203125, 0.06400299072265625, 0.06722640991210938, 0.0704498291015625, 0.07367324829101562, 0.07689666748046875, 0.08012008666992188, 0.083343505859375, 0.08656692504882812, 0.08979034423828125, 0.09301376342773438, 0.0962371826171875, 0.09946060180664062, 0.10268402099609375, 0.10590744018554688, 0.109130859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 3.0, 3.0, 7.0, 9.0, 0.0, 10.0, 10.0, 12.0, 22.0, 34.0, 38.0, 55.0, 72.0, 100.0, 105.0, 194.0, 230.0, 380.0, 593.0, 1056.0, 1684.0, 2872.0, 4867.0, 8357.0, 15084.0, 27625.0, 52570.0, 109260.0, 274659.0, 307122.0, 117993.0, 56140.0, 29485.0, 15894.0, 9018.0, 5090.0, 3022.0, 1813.0, 1088.0, 622.0, 427.0, 281.0, 147.0, 135.0, 96.0, 72.0, 55.0, 51.0, 21.0, 20.0, 19.0, 4.0, 8.0, 12.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0], "bins": [-0.2015380859375, -0.19504737854003906, -0.18855667114257812, -0.1820659637451172, -0.17557525634765625, -0.1690845489501953, -0.16259384155273438, -0.15610313415527344, -0.1496124267578125, -0.14312171936035156, -0.13663101196289062, -0.1301403045654297, -0.12364959716796875, -0.11715888977050781, -0.11066818237304688, -0.10417747497558594, -0.097686767578125, -0.09119606018066406, -0.08470535278320312, -0.07821464538574219, -0.07172393798828125, -0.06523323059082031, -0.058742523193359375, -0.05225181579589844, -0.0457611083984375, -0.03927040100097656, -0.032779693603515625, -0.026288986206054688, -0.01979827880859375, -0.013307571411132812, -0.006816864013671875, -0.0003261566162109375, 0.00616455078125, 0.012655258178710938, 0.019145965576171875, 0.025636672973632812, 0.03212738037109375, 0.03861808776855469, 0.045108795166015625, 0.05159950256347656, 0.0580902099609375, 0.06458091735839844, 0.07107162475585938, 0.07756233215332031, 0.08405303955078125, 0.09054374694824219, 0.09703445434570312, 0.10352516174316406, 0.110015869140625, 0.11650657653808594, 0.12299728393554688, 0.1294879913330078, 0.13597869873046875, 0.1424694061279297, 0.14896011352539062, 0.15545082092285156, 0.1619415283203125, 0.16843223571777344, 0.17492294311523438, 0.1814136505126953, 0.18790435791015625, 0.1943950653076172, 0.20088577270507812, 0.20737648010253906, 0.2138671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 8.0, 10.0, 9.0, 9.0, 15.0, 18.0, 13.0, 17.0, 17.0, 19.0, 24.0, 35.0, 26.0, 34.0, 39.0, 31.0, 37.0, 30.0, 33.0, 37.0, 36.0, 40.0, 37.0, 38.0, 47.0, 28.0, 34.0, 30.0, 30.0, 35.0, 20.0, 21.0, 21.0, 16.0, 15.0, 12.0, 11.0, 17.0, 15.0, 12.0, 4.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.291748046875, -0.2823486328125, -0.27294921875, -0.2635498046875, -0.254150390625, -0.2447509765625, -0.2353515625, -0.2259521484375, -0.216552734375, -0.2071533203125, -0.19775390625, -0.1883544921875, -0.178955078125, -0.1695556640625, -0.16015625, -0.1507568359375, -0.141357421875, -0.1319580078125, -0.12255859375, -0.1131591796875, -0.103759765625, -0.0943603515625, -0.0849609375, -0.0755615234375, -0.066162109375, -0.0567626953125, -0.04736328125, -0.0379638671875, -0.028564453125, -0.0191650390625, -0.009765625, -0.0003662109375, 0.009033203125, 0.0184326171875, 0.02783203125, 0.0372314453125, 0.046630859375, 0.0560302734375, 0.0654296875, 0.0748291015625, 0.084228515625, 0.0936279296875, 0.10302734375, 0.1124267578125, 0.121826171875, 0.1312255859375, 0.140625, 0.1500244140625, 0.159423828125, 0.1688232421875, 0.17822265625, 0.1876220703125, 0.197021484375, 0.2064208984375, 0.2158203125, 0.2252197265625, 0.234619140625, 0.2440185546875, 0.25341796875, 0.2628173828125, 0.272216796875, 0.2816162109375, 0.291015625, 0.3004150390625, 0.309814453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 3.0, 2.0, 8.0, 7.0, 6.0, 25.0, 30.0, 44.0, 74.0, 136.0, 248.0, 539.0, 1433.0, 5306.0, 56661.0, 949558.0, 28508.0, 3859.0, 1126.0, 464.0, 218.0, 98.0, 81.0, 36.0, 23.0, 15.0, 12.0, 9.0, 4.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0433349609375, -0.04195451736450195, -0.040574073791503906, -0.03919363021850586, -0.03781318664550781, -0.036432743072509766, -0.03505229949951172, -0.03367185592651367, -0.032291412353515625, -0.030910968780517578, -0.02953052520751953, -0.028150081634521484, -0.026769638061523438, -0.02538919448852539, -0.024008750915527344, -0.022628307342529297, -0.02124786376953125, -0.019867420196533203, -0.018486976623535156, -0.01710653305053711, -0.015726089477539062, -0.014345645904541016, -0.012965202331542969, -0.011584758758544922, -0.010204315185546875, -0.008823871612548828, -0.007443428039550781, -0.006062984466552734, -0.0046825408935546875, -0.0033020973205566406, -0.0019216537475585938, -0.0005412101745605469, 0.0008392333984375, 0.002219676971435547, 0.0036001205444335938, 0.004980564117431641, 0.0063610076904296875, 0.007741451263427734, 0.009121894836425781, 0.010502338409423828, 0.011882781982421875, 0.013263225555419922, 0.014643669128417969, 0.016024112701416016, 0.017404556274414062, 0.01878499984741211, 0.020165443420410156, 0.021545886993408203, 0.02292633056640625, 0.024306774139404297, 0.025687217712402344, 0.02706766128540039, 0.028448104858398438, 0.029828548431396484, 0.03120899200439453, 0.03258943557739258, 0.033969879150390625, 0.03535032272338867, 0.03673076629638672, 0.038111209869384766, 0.03949165344238281, 0.04087209701538086, 0.042252540588378906, 0.04363298416137695, 0.045013427734375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 0.0, 5.0, 14.0, 13.0, 20.0, 24.0, 23.0, 64.0, 89.0, 129.0, 182.0, 158.0, 86.0, 48.0, 40.0, 36.0, 11.0, 8.0, 8.0, 7.0, 5.0, 4.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.698204040527344e-05, -5.4838135838508606e-05, -5.2694231271743774e-05, -5.055032670497894e-05, -4.840642213821411e-05, -4.626251757144928e-05, -4.411861300468445e-05, -4.197470843791962e-05, -3.9830803871154785e-05, -3.7686899304389954e-05, -3.554299473762512e-05, -3.339909017086029e-05, -3.125518560409546e-05, -2.9111281037330627e-05, -2.6967376470565796e-05, -2.4823471903800964e-05, -2.2679567337036133e-05, -2.05356627702713e-05, -1.839175820350647e-05, -1.6247853636741638e-05, -1.4103949069976807e-05, -1.1960044503211975e-05, -9.816139936447144e-06, -7.672235369682312e-06, -5.5283308029174805e-06, -3.384426236152649e-06, -1.2405216693878174e-06, 9.033828973770142e-07, 3.0472874641418457e-06, 5.191192030906677e-06, 7.335096597671509e-06, 9.47900116443634e-06, 1.1622905731201172e-05, 1.3766810297966003e-05, 1.5910714864730835e-05, 1.8054619431495667e-05, 2.0198523998260498e-05, 2.234242856502533e-05, 2.448633313179016e-05, 2.6630237698554993e-05, 2.8774142265319824e-05, 3.0918046832084656e-05, 3.306195139884949e-05, 3.520585596561432e-05, 3.734976053237915e-05, 3.949366509914398e-05, 4.1637569665908813e-05, 4.3781474232673645e-05, 4.5925378799438477e-05, 4.806928336620331e-05, 5.021318793296814e-05, 5.235709249973297e-05, 5.45009970664978e-05, 5.6644901633262634e-05, 5.8788806200027466e-05, 6.09327107667923e-05, 6.307661533355713e-05, 6.522051990032196e-05, 6.736442446708679e-05, 6.950832903385162e-05, 7.165223360061646e-05, 7.379613816738129e-05, 7.594004273414612e-05, 7.808394730091095e-05, 8.022785186767578e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 8.0, 8.0, 14.0, 20.0, 22.0, 28.0, 61.0, 86.0, 161.0, 289.0, 494.0, 1095.0, 2334.0, 5576.0, 17101.0, 80855.0, 750950.0, 150917.0, 25351.0, 7454.0, 2945.0, 1285.0, 673.0, 381.0, 181.0, 92.0, 47.0, 38.0, 32.0, 18.0, 12.0, 8.0, 10.0, 2.0, 5.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.022064208984375, -0.02134418487548828, -0.020624160766601562, -0.019904136657714844, -0.019184112548828125, -0.018464088439941406, -0.017744064331054688, -0.01702404022216797, -0.01630401611328125, -0.015583992004394531, -0.014863967895507812, -0.014143943786621094, -0.013423919677734375, -0.012703895568847656, -0.011983871459960938, -0.011263847351074219, -0.0105438232421875, -0.009823799133300781, -0.009103775024414062, -0.008383750915527344, -0.007663726806640625, -0.006943702697753906, -0.0062236785888671875, -0.005503654479980469, -0.00478363037109375, -0.004063606262207031, -0.0033435821533203125, -0.0026235580444335938, -0.001903533935546875, -0.0011835098266601562, -0.0004634857177734375, 0.00025653839111328125, 0.0009765625, 0.0016965866088867188, 0.0024166107177734375, 0.0031366348266601562, 0.003856658935546875, 0.004576683044433594, 0.0052967071533203125, 0.006016731262207031, 0.00673675537109375, 0.007456779479980469, 0.008176803588867188, 0.008896827697753906, 0.009616851806640625, 0.010336875915527344, 0.011056900024414062, 0.011776924133300781, 0.0124969482421875, 0.013216972351074219, 0.013936996459960938, 0.014657020568847656, 0.015377044677734375, 0.016097068786621094, 0.016817092895507812, 0.01753711700439453, 0.01825714111328125, 0.01897716522216797, 0.019697189331054688, 0.020417213439941406, 0.021137237548828125, 0.021857261657714844, 0.022577285766601562, 0.02329730987548828, 0.024017333984375]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 7.0, 8.0, 16.0, 10.0, 18.0, 27.0, 32.0, 52.0, 71.0, 110.0, 128.0, 123.0, 102.0, 78.0, 60.0, 40.0, 30.0, 26.0, 16.0, 6.0, 9.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019256591796875, -0.018428325653076172, -0.017600059509277344, -0.016771793365478516, -0.015943527221679688, -0.01511526107788086, -0.014286994934082031, -0.013458728790283203, -0.012630462646484375, -0.011802196502685547, -0.010973930358886719, -0.01014566421508789, -0.009317398071289062, -0.008489131927490234, -0.007660865783691406, -0.006832599639892578, -0.00600433349609375, -0.005176067352294922, -0.004347801208496094, -0.0035195350646972656, -0.0026912689208984375, -0.0018630027770996094, -0.0010347366333007812, -0.00020647048950195312, 0.000621795654296875, 0.0014500617980957031, 0.0022783279418945312, 0.0031065940856933594, 0.0039348602294921875, 0.004763126373291016, 0.005591392517089844, 0.006419658660888672, 0.0072479248046875, 0.008076190948486328, 0.008904457092285156, 0.009732723236083984, 0.010560989379882812, 0.01138925552368164, 0.012217521667480469, 0.013045787811279297, 0.013874053955078125, 0.014702320098876953, 0.015530586242675781, 0.01635885238647461, 0.017187118530273438, 0.018015384674072266, 0.018843650817871094, 0.019671916961669922, 0.02050018310546875, 0.021328449249267578, 0.022156715393066406, 0.022984981536865234, 0.023813247680664062, 0.02464151382446289, 0.02546977996826172, 0.026298046112060547, 0.027126312255859375, 0.027954578399658203, 0.02878284454345703, 0.02961111068725586, 0.030439376831054688, 0.031267642974853516, 0.032095909118652344, 0.03292417526245117, 0.03375244140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 6.0, 5.0, 8.0, 11.0, 18.0, 24.0, 30.0, 63.0, 90.0, 176.0, 214.0, 123.0, 70.0, 36.0, 36.0, 21.0, 15.0, 15.0, 9.0, 5.0, 2.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.1755661964416504, -3.1022655963897705, -3.0289649963378906, -2.9556643962860107, -2.882363796234131, -2.809062957763672, -2.735762357711792, -2.662461757659912, -2.5891611576080322, -2.5158605575561523, -2.4425599575042725, -2.3692593574523926, -2.2959585189819336, -2.2226579189300537, -2.149357318878174, -2.076056718826294, -2.002756118774414, -1.9294555187225342, -1.8561549186706543, -1.7828541994094849, -1.709553599357605, -1.636252999305725, -1.5629522800445557, -1.4896516799926758, -1.416351079940796, -1.343050479888916, -1.2697498798370361, -1.1964491605758667, -1.1231485605239868, -1.049847960472107, -0.9765473008155823, -0.9032466411590576, -0.8299460411071777, -0.7566454410552979, -0.6833447813987732, -0.6100441217422485, -0.5367435216903687, -0.4634428918361664, -0.3901422619819641, -0.31684160232543945, -0.24354100227355957, -0.1702403724193573, -0.09693974256515503, -0.02363911271095276, 0.04966151714324951, 0.12296214699745178, 0.19626277685165405, 0.2695634365081787, 0.3428640365600586, 0.41616466641426086, 0.48946529626846313, 0.5627659559249878, 0.6360665559768677, 0.7093671560287476, 0.7826678156852722, 0.8559684753417969, 0.9292690753936768, 1.0025696754455566, 1.0758702754974365, 1.149170994758606, 1.2224715948104858, 1.2957721948623657, 1.3690729141235352, 1.442373514175415, 1.515674114227295]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 5.0, 3.0, 5.0, 10.0, 14.0, 23.0, 34.0, 57.0, 88.0, 187.0, 201.0, 150.0, 81.0, 47.0, 27.0, 15.0, 16.0, 12.0, 8.0, 4.0, 3.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.211030960083008, -8.9646577835083, -8.718283653259277, -8.47191047668457, -8.225537300109863, -7.979163646697998, -7.732790470123291, -7.486416816711426, -7.240043640136719, -6.9936699867248535, -6.7472968101501465, -6.500923156738281, -6.254549980163574, -6.008176326751709, -5.761803150177002, -5.515429496765137, -5.26905632019043, -5.0226826667785645, -4.776309490203857, -4.529935836791992, -4.283562660217285, -4.03718900680542, -3.790815830230713, -3.5444421768188477, -3.2980685234069824, -3.0516951084136963, -2.80532169342041, -2.558948278427124, -2.312574863433838, -2.0662012100219727, -1.819827914237976, -1.57345449924469, -1.3270812034606934, -1.0807077884674072, -0.8343343734741211, -0.5879608988761902, -0.34158748388290405, -0.09521400928497314, 0.151159405708313, 0.3975328207015991, 0.6439062356948853, 0.8902796506881714, 1.1366530656814575, 1.3830265998840332, 1.6294000148773193, 1.8757734298706055, 2.1221468448638916, 2.3685202598571777, 2.614893674850464, 2.86126708984375, 3.107640504837036, 3.3540139198303223, 3.6003873348236084, 3.8467607498168945, 4.09313440322876, 4.339507579803467, 4.585881233215332, 4.832254886627197, 5.078628063201904, 5.3250017166137695, 5.571374893188477, 5.817748546600342, 6.064121723175049, 6.310495376586914, 6.556868553161621]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 5.0, 11.0, 9.0, 16.0, 22.0, 23.0, 34.0, 36.0, 62.0, 89.0, 125.0, 140.0, 218.0, 313.0, 451.0, 681.0, 1008.0, 1601.0, 2653.0, 4503.0, 8020.0, 18447.0, 320644.0, 3798389.0, 19306.0, 7264.0, 3820.0, 2232.0, 1388.0, 829.0, 601.0, 389.0, 262.0, 167.0, 142.0, 102.0, 65.0, 61.0, 45.0, 26.0, 20.0, 12.0, 16.0, 9.0, 5.0, 4.0, 6.0, 3.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.8525390625, -0.82672119140625, -0.8009033203125, -0.77508544921875, -0.749267578125, -0.72344970703125, -0.6976318359375, -0.67181396484375, -0.64599609375, -0.62017822265625, -0.5943603515625, -0.56854248046875, -0.542724609375, -0.51690673828125, -0.4910888671875, -0.46527099609375, -0.439453125, -0.41363525390625, -0.3878173828125, -0.36199951171875, -0.336181640625, -0.31036376953125, -0.2845458984375, -0.25872802734375, -0.23291015625, -0.20709228515625, -0.1812744140625, -0.15545654296875, -0.129638671875, -0.10382080078125, -0.0780029296875, -0.05218505859375, -0.0263671875, -0.00054931640625, 0.0252685546875, 0.05108642578125, 0.076904296875, 0.10272216796875, 0.1285400390625, 0.15435791015625, 0.18017578125, 0.20599365234375, 0.2318115234375, 0.25762939453125, 0.283447265625, 0.30926513671875, 0.3350830078125, 0.36090087890625, 0.38671875, 0.41253662109375, 0.4383544921875, 0.46417236328125, 0.489990234375, 0.51580810546875, 0.5416259765625, 0.56744384765625, 0.59326171875, 0.61907958984375, 0.6448974609375, 0.67071533203125, 0.696533203125, 0.72235107421875, 0.7481689453125, 0.77398681640625, 0.7998046875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 5.0, 6.0, 7.0, 8.0, 4.0, 10.0, 9.0, 4.0, 12.0, 17.0, 56.0, 215.0, 409.0, 108.0, 31.0, 17.0, 10.0, 8.0, 8.0, 5.0, 5.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0648193359375, -0.06286191940307617, -0.060904502868652344, -0.058947086334228516, -0.05698966979980469, -0.05503225326538086, -0.05307483673095703, -0.0511174201965332, -0.049160003662109375, -0.04720258712768555, -0.04524517059326172, -0.04328775405883789, -0.04133033752441406, -0.039372920989990234, -0.037415504455566406, -0.03545808792114258, -0.03350067138671875, -0.03154325485229492, -0.029585838317871094, -0.027628421783447266, -0.025671005249023438, -0.02371358871459961, -0.02175617218017578, -0.019798755645751953, -0.017841339111328125, -0.015883922576904297, -0.013926506042480469, -0.01196908950805664, -0.010011672973632812, -0.008054256439208984, -0.006096839904785156, -0.004139423370361328, -0.0021820068359375, -0.00022459030151367188, 0.0017328262329101562, 0.0036902427673339844, 0.0056476593017578125, 0.007605075836181641, 0.009562492370605469, 0.011519908905029297, 0.013477325439453125, 0.015434741973876953, 0.01739215850830078, 0.01934957504272461, 0.021306991577148438, 0.023264408111572266, 0.025221824645996094, 0.027179241180419922, 0.02913665771484375, 0.031094074249267578, 0.033051490783691406, 0.035008907318115234, 0.03696632385253906, 0.03892374038696289, 0.04088115692138672, 0.04283857345581055, 0.044795989990234375, 0.0467534065246582, 0.04871082305908203, 0.05066823959350586, 0.05262565612792969, 0.054583072662353516, 0.056540489196777344, 0.05849790573120117, 0.060455322265625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 11.0, 21.0, 17.0, 25.0, 37.0, 72.0, 114.0, 165.0, 237.0, 418.0, 683.0, 1114.0, 2000.0, 3636.0, 6863.0, 13982.0, 33043.0, 98742.0, 3681769.0, 250098.0, 56956.0, 22182.0, 10084.0, 5074.0, 2861.0, 1616.0, 932.0, 566.0, 330.0, 186.0, 150.0, 97.0, 64.0, 45.0, 25.0, 21.0, 9.0, 8.0, 6.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5625, -0.5458450317382812, -0.5291900634765625, -0.5125350952148438, -0.495880126953125, -0.47922515869140625, -0.4625701904296875, -0.44591522216796875, -0.42926025390625, -0.41260528564453125, -0.3959503173828125, -0.37929534912109375, -0.362640380859375, -0.34598541259765625, -0.3293304443359375, -0.31267547607421875, -0.2960205078125, -0.27936553955078125, -0.2627105712890625, -0.24605560302734375, -0.229400634765625, -0.21274566650390625, -0.1960906982421875, -0.17943572998046875, -0.16278076171875, -0.14612579345703125, -0.1294708251953125, -0.11281585693359375, -0.096160888671875, -0.07950592041015625, -0.0628509521484375, -0.04619598388671875, -0.029541015625, -0.01288604736328125, 0.0037689208984375, 0.02042388916015625, 0.037078857421875, 0.05373382568359375, 0.0703887939453125, 0.08704376220703125, 0.10369873046875, 0.12035369873046875, 0.1370086669921875, 0.15366363525390625, 0.170318603515625, 0.18697357177734375, 0.2036285400390625, 0.22028350830078125, 0.2369384765625, 0.25359344482421875, 0.2702484130859375, 0.28690338134765625, 0.303558349609375, 0.32021331787109375, 0.3368682861328125, 0.35352325439453125, 0.37017822265625, 0.38683319091796875, 0.4034881591796875, 0.42014312744140625, 0.436798095703125, 0.45345306396484375, 0.4701080322265625, 0.48676300048828125, 0.50341796875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 6.0, 8.0, 10.0, 16.0, 6.0, 16.0, 24.0, 34.0, 46.0, 41.0, 68.0, 104.0, 181.0, 2996.0, 180.0, 62.0, 34.0, 52.0, 35.0, 29.0, 23.0, 20.0, 17.0, 7.0, 7.0, 9.0, 6.0, 6.0, 3.0, 8.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1141357421875, -0.1099853515625, -0.1058349609375, -0.1016845703125, -0.0975341796875, -0.0933837890625, -0.0892333984375, -0.0850830078125, -0.0809326171875, -0.0767822265625, -0.0726318359375, -0.0684814453125, -0.0643310546875, -0.0601806640625, -0.0560302734375, -0.0518798828125, -0.0477294921875, -0.0435791015625, -0.0394287109375, -0.0352783203125, -0.0311279296875, -0.0269775390625, -0.0228271484375, -0.0186767578125, -0.0145263671875, -0.0103759765625, -0.0062255859375, -0.0020751953125, 0.0020751953125, 0.0062255859375, 0.0103759765625, 0.0145263671875, 0.0186767578125, 0.0228271484375, 0.0269775390625, 0.0311279296875, 0.0352783203125, 0.0394287109375, 0.0435791015625, 0.0477294921875, 0.0518798828125, 0.0560302734375, 0.0601806640625, 0.0643310546875, 0.0684814453125, 0.0726318359375, 0.0767822265625, 0.0809326171875, 0.0850830078125, 0.0892333984375, 0.0933837890625, 0.0975341796875, 0.1016845703125, 0.1058349609375, 0.1099853515625, 0.1141357421875, 0.1182861328125, 0.1224365234375, 0.1265869140625, 0.1307373046875, 0.1348876953125, 0.1390380859375, 0.1431884765625, 0.1473388671875, 0.1514892578125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 13.0, 24.0, 79.0, 269.0, 404.0, 111.0, 58.0, 30.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9773894548416138, -0.9351291656494141, -0.8928689360618591, -0.8506086468696594, -0.8083484172821045, -0.7660881280899048, -0.7238278388977051, -0.6815675497055054, -0.6393073201179504, -0.5970470309257507, -0.5547868013381958, -0.5125265121459961, -0.4702662527561188, -0.42800599336624146, -0.38574570417404175, -0.34348544478416443, -0.3012251853942871, -0.2589649260044098, -0.21670465171337128, -0.17444437742233276, -0.13218411803245544, -0.08992385864257812, -0.04766356945037842, -0.005403310060501099, 0.03685694932937622, 0.07911721616983414, 0.12137748301029205, 0.16363775730133057, 0.20589801669120789, 0.2481582760810852, 0.2904185652732849, 0.33267882466316223, 0.3749392032623291, 0.4171994626522064, 0.45945972204208374, 0.5017200112342834, 0.5439802408218384, 0.5862405300140381, 0.6285008192062378, 0.6707611083984375, 0.7130213379859924, 0.7552816271781921, 0.7975418567657471, 0.8398021459579468, 0.8820624351501465, 0.9243226647377014, 0.9665829539299011, 1.008843183517456, 1.0511034727096558, 1.0933637619018555, 1.1356240510940552, 1.1778843402862549, 1.220144510269165, 1.2624047994613647, 1.3046650886535645, 1.3469253778457642, 1.3891856670379639, 1.4314459562301636, 1.4737062454223633, 1.5159664154052734, 1.5582267045974731, 1.6004869937896729, 1.6427472829818726, 1.6850075721740723, 1.7272677421569824]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 8.0, 5.0, 7.0, 8.0, 10.0, 15.0, 25.0, 36.0, 42.0, 58.0, 83.0, 74.0, 72.0, 103.0, 81.0, 82.0, 66.0, 71.0, 35.0, 38.0, 30.0, 17.0, 13.0, 9.0, 8.0, 7.0, 1.0, 2.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7235525250434875, -0.6980715990066528, -0.6725906133651733, -0.6471096277236938, -0.6216287016868591, -0.5961477756500244, -0.5706667900085449, -0.5451858043670654, -0.5197048783302307, -0.4942239224910736, -0.4687429666519165, -0.4432620108127594, -0.4177810549736023, -0.3923000991344452, -0.3668191432952881, -0.341338187456131, -0.3158572316169739, -0.2903762757778168, -0.26489531993865967, -0.23941436409950256, -0.21393340826034546, -0.18845245242118835, -0.16297149658203125, -0.13749054074287415, -0.11200958490371704, -0.08652862906455994, -0.06104767322540283, -0.03556671738624573, -0.010085761547088623, 0.015395194292068481, 0.040876150131225586, 0.06635710597038269, 0.0918380618095398, 0.1173190176486969, 0.142799973487854, 0.1682809293270111, 0.1937618851661682, 0.21924284100532532, 0.24472379684448242, 0.2702047526836395, 0.29568570852279663, 0.32116666436195374, 0.34664762020111084, 0.37212857604026794, 0.39760953187942505, 0.42309048771858215, 0.44857144355773926, 0.47405239939689636, 0.49953335523605347, 0.5250142812728882, 0.5504952669143677, 0.5759762525558472, 0.6014571785926819, 0.6269381046295166, 0.6524190902709961, 0.6779000759124756, 0.7033810019493103, 0.728861927986145, 0.7543429136276245, 0.779823899269104, 0.8053048253059387, 0.8307857513427734, 0.8562667369842529, 0.8817477226257324, 0.9072286486625671]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 3.0, 9.0, 16.0, 24.0, 31.0, 51.0, 65.0, 129.0, 173.0, 307.0, 481.0, 821.0, 1413.0, 2576.0, 4832.0, 10082.0, 28144.0, 429311.0, 519259.0, 29320.0, 10296.0, 4967.0, 2593.0, 1514.0, 802.0, 492.0, 290.0, 192.0, 106.0, 94.0, 56.0, 19.0, 16.0, 17.0, 18.0, 8.0, 8.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5693359375, -0.549713134765625, -0.53009033203125, -0.510467529296875, -0.4908447265625, -0.471221923828125, -0.45159912109375, -0.431976318359375, -0.412353515625, -0.392730712890625, -0.37310791015625, -0.353485107421875, -0.3338623046875, -0.314239501953125, -0.29461669921875, -0.274993896484375, -0.25537109375, -0.235748291015625, -0.21612548828125, -0.196502685546875, -0.1768798828125, -0.157257080078125, -0.13763427734375, -0.118011474609375, -0.098388671875, -0.078765869140625, -0.05914306640625, -0.039520263671875, -0.0198974609375, -0.000274658203125, 0.01934814453125, 0.038970947265625, 0.05859375, 0.078216552734375, 0.09783935546875, 0.117462158203125, 0.1370849609375, 0.156707763671875, 0.17633056640625, 0.195953369140625, 0.215576171875, 0.235198974609375, 0.25482177734375, 0.274444580078125, 0.2940673828125, 0.313690185546875, 0.33331298828125, 0.352935791015625, 0.37255859375, 0.392181396484375, 0.41180419921875, 0.431427001953125, 0.4510498046875, 0.470672607421875, 0.49029541015625, 0.509918212890625, 0.529541015625, 0.549163818359375, 0.56878662109375, 0.588409423828125, 0.6080322265625, 0.627655029296875, 0.64727783203125, 0.666900634765625, 0.6865234375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 4.0, 6.0, 10.0, 11.0, 2.0, 11.0, 20.0, 42.0, 105.0, 224.0, 273.0, 139.0, 55.0, 20.0, 12.0, 18.0, 6.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 7.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078369140625, -0.07613849639892578, -0.07390785217285156, -0.07167720794677734, -0.06944656372070312, -0.0672159194946289, -0.06498527526855469, -0.06275463104248047, -0.06052398681640625, -0.05829334259033203, -0.05606269836425781, -0.053832054138183594, -0.051601409912109375, -0.049370765686035156, -0.04714012145996094, -0.04490947723388672, -0.0426788330078125, -0.04044818878173828, -0.03821754455566406, -0.035986900329589844, -0.033756256103515625, -0.031525611877441406, -0.029294967651367188, -0.02706432342529297, -0.02483367919921875, -0.02260303497314453, -0.020372390747070312, -0.018141746520996094, -0.015911102294921875, -0.013680458068847656, -0.011449813842773438, -0.009219169616699219, -0.006988525390625, -0.004757881164550781, -0.0025272369384765625, -0.00029659271240234375, 0.001934051513671875, 0.004164695739746094, 0.0063953399658203125, 0.008625984191894531, 0.01085662841796875, 0.013087272644042969, 0.015317916870117188, 0.017548561096191406, 0.019779205322265625, 0.022009849548339844, 0.024240493774414062, 0.02647113800048828, 0.0287017822265625, 0.03093242645263672, 0.03316307067871094, 0.035393714904785156, 0.037624359130859375, 0.039855003356933594, 0.04208564758300781, 0.04431629180908203, 0.04654693603515625, 0.04877758026123047, 0.05100822448730469, 0.053238868713378906, 0.055469512939453125, 0.057700157165527344, 0.05993080139160156, 0.06216144561767578, 0.06439208984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 5.0, 6.0, 7.0, 11.0, 13.0, 17.0, 15.0, 22.0, 29.0, 62.0, 82.0, 164.0, 329.0, 625.0, 1391.0, 2973.0, 7049.0, 16281.0, 40716.0, 116312.0, 425290.0, 297198.0, 85556.0, 31378.0, 12625.0, 5597.0, 2461.0, 1155.0, 516.0, 275.0, 139.0, 73.0, 59.0, 31.0, 12.0, 20.0, 15.0, 11.0, 5.0, 6.0, 7.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.295166015625, -0.284942626953125, -0.27471923828125, -0.264495849609375, -0.2542724609375, -0.244049072265625, -0.23382568359375, -0.223602294921875, -0.21337890625, -0.203155517578125, -0.19293212890625, -0.182708740234375, -0.1724853515625, -0.162261962890625, -0.15203857421875, -0.141815185546875, -0.131591796875, -0.121368408203125, -0.11114501953125, -0.100921630859375, -0.0906982421875, -0.080474853515625, -0.07025146484375, -0.060028076171875, -0.0498046875, -0.039581298828125, -0.02935791015625, -0.019134521484375, -0.0089111328125, 0.001312255859375, 0.01153564453125, 0.021759033203125, 0.031982421875, 0.042205810546875, 0.05242919921875, 0.062652587890625, 0.0728759765625, 0.083099365234375, 0.09332275390625, 0.103546142578125, 0.11376953125, 0.123992919921875, 0.13421630859375, 0.144439697265625, 0.1546630859375, 0.164886474609375, 0.17510986328125, 0.185333251953125, 0.195556640625, 0.205780029296875, 0.21600341796875, 0.226226806640625, 0.2364501953125, 0.246673583984375, 0.25689697265625, 0.267120361328125, 0.27734375, 0.287567138671875, 0.29779052734375, 0.308013916015625, 0.3182373046875, 0.328460693359375, 0.33868408203125, 0.348907470703125, 0.359130859375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 3.0, 7.0, 13.0, 10.0, 11.0, 16.0, 11.0, 14.0, 19.0, 22.0, 33.0, 28.0, 34.0, 32.0, 34.0, 34.0, 45.0, 47.0, 37.0, 31.0, 41.0, 43.0, 36.0, 52.0, 30.0, 38.0, 38.0, 22.0, 31.0, 26.0, 16.0, 33.0, 21.0, 13.0, 12.0, 18.0, 9.0, 9.0, 7.0, 10.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1658935546875, -0.16012954711914062, -0.15436553955078125, -0.14860153198242188, -0.1428375244140625, -0.13707351684570312, -0.13130950927734375, -0.12554550170898438, -0.119781494140625, -0.11401748657226562, -0.10825347900390625, -0.10248947143554688, -0.0967254638671875, -0.09096145629882812, -0.08519744873046875, -0.07943344116210938, -0.07366943359375, -0.06790542602539062, -0.06214141845703125, -0.056377410888671875, -0.0506134033203125, -0.044849395751953125, -0.03908538818359375, -0.033321380615234375, -0.027557373046875, -0.021793365478515625, -0.01602935791015625, -0.010265350341796875, -0.0045013427734375, 0.001262664794921875, 0.00702667236328125, 0.012790679931640625, 0.0185546875, 0.024318695068359375, 0.03008270263671875, 0.035846710205078125, 0.0416107177734375, 0.047374725341796875, 0.05313873291015625, 0.058902740478515625, 0.064666748046875, 0.07043075561523438, 0.07619476318359375, 0.08195877075195312, 0.0877227783203125, 0.09348678588867188, 0.09925079345703125, 0.10501480102539062, 0.11077880859375, 0.11654281616210938, 0.12230682373046875, 0.12807083129882812, 0.1338348388671875, 0.13959884643554688, 0.14536285400390625, 0.15112686157226562, 0.156890869140625, 0.16265487670898438, 0.16841888427734375, 0.17418289184570312, 0.1799468994140625, 0.18571090698242188, 0.19147491455078125, 0.19723892211914062, 0.2030029296875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 9.0, 10.0, 13.0, 22.0, 31.0, 63.0, 100.0, 142.0, 249.0, 384.0, 786.0, 1770.0, 5149.0, 20592.0, 169203.0, 782445.0, 52325.0, 9827.0, 2925.0, 1152.0, 521.0, 286.0, 206.0, 111.0, 79.0, 44.0, 32.0, 21.0, 11.0, 7.0, 4.0, 8.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.060760498046875, -0.05881643295288086, -0.05687236785888672, -0.05492830276489258, -0.05298423767089844, -0.0510401725769043, -0.049096107482910156, -0.047152042388916016, -0.045207977294921875, -0.043263912200927734, -0.041319847106933594, -0.03937578201293945, -0.03743171691894531, -0.03548765182495117, -0.03354358673095703, -0.03159952163696289, -0.02965545654296875, -0.02771139144897461, -0.02576732635498047, -0.023823261260986328, -0.021879196166992188, -0.019935131072998047, -0.017991065979003906, -0.016047000885009766, -0.014102935791015625, -0.012158870697021484, -0.010214805603027344, -0.008270740509033203, -0.0063266754150390625, -0.004382610321044922, -0.0024385452270507812, -0.0004944801330566406, 0.0014495849609375, 0.0033936500549316406, 0.005337715148925781, 0.007281780242919922, 0.009225845336914062, 0.011169910430908203, 0.013113975524902344, 0.015058040618896484, 0.017002105712890625, 0.018946170806884766, 0.020890235900878906, 0.022834300994873047, 0.024778366088867188, 0.026722431182861328, 0.02866649627685547, 0.03061056137084961, 0.03255462646484375, 0.03449869155883789, 0.03644275665283203, 0.03838682174682617, 0.04033088684082031, 0.04227495193481445, 0.044219017028808594, 0.046163082122802734, 0.048107147216796875, 0.050051212310791016, 0.051995277404785156, 0.0539393424987793, 0.05588340759277344, 0.05782747268676758, 0.05977153778076172, 0.06171560287475586, 0.06365966796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 4.0, 10.0, 14.0, 11.0, 20.0, 20.0, 42.0, 43.0, 63.0, 90.0, 108.0, 129.0, 94.0, 92.0, 84.0, 34.0, 39.0, 28.0, 17.0, 17.0, 8.0, 11.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.2557716369628906e-05, -4.1425228118896484e-05, -4.029273986816406e-05, -3.916025161743164e-05, -3.802776336669922e-05, -3.68952751159668e-05, -3.5762786865234375e-05, -3.463029861450195e-05, -3.349781036376953e-05, -3.236532211303711e-05, -3.123283386230469e-05, -3.0100345611572266e-05, -2.8967857360839844e-05, -2.7835369110107422e-05, -2.6702880859375e-05, -2.5570392608642578e-05, -2.4437904357910156e-05, -2.3305416107177734e-05, -2.2172927856445312e-05, -2.104043960571289e-05, -1.990795135498047e-05, -1.8775463104248047e-05, -1.7642974853515625e-05, -1.6510486602783203e-05, -1.537799835205078e-05, -1.424551010131836e-05, -1.3113021850585938e-05, -1.1980533599853516e-05, -1.0848045349121094e-05, -9.715557098388672e-06, -8.58306884765625e-06, -7.450580596923828e-06, -6.318092346191406e-06, -5.185604095458984e-06, -4.0531158447265625e-06, -2.9206275939941406e-06, -1.7881393432617188e-06, -6.556510925292969e-07, 4.76837158203125e-07, 1.6093254089355469e-06, 2.7418136596679688e-06, 3.874301910400391e-06, 5.0067901611328125e-06, 6.139278411865234e-06, 7.271766662597656e-06, 8.404254913330078e-06, 9.5367431640625e-06, 1.0669231414794922e-05, 1.1801719665527344e-05, 1.2934207916259766e-05, 1.4066696166992188e-05, 1.519918441772461e-05, 1.633167266845703e-05, 1.7464160919189453e-05, 1.8596649169921875e-05, 1.9729137420654297e-05, 2.086162567138672e-05, 2.199411392211914e-05, 2.3126602172851562e-05, 2.4259090423583984e-05, 2.5391578674316406e-05, 2.6524066925048828e-05, 2.765655517578125e-05, 2.8789043426513672e-05, 2.9921531677246094e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 13.0, 20.0, 37.0, 63.0, 104.0, 176.0, 295.0, 606.0, 1196.0, 2506.0, 6017.0, 16876.0, 59031.0, 395299.0, 469227.0, 66581.0, 18658.0, 6570.0, 2666.0, 1166.0, 635.0, 349.0, 183.0, 94.0, 69.0, 37.0, 22.0, 12.0, 13.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03173828125, -0.030644893646240234, -0.02955150604248047, -0.028458118438720703, -0.027364730834960938, -0.026271343231201172, -0.025177955627441406, -0.02408456802368164, -0.022991180419921875, -0.02189779281616211, -0.020804405212402344, -0.019711017608642578, -0.018617630004882812, -0.017524242401123047, -0.01643085479736328, -0.015337467193603516, -0.01424407958984375, -0.013150691986083984, -0.012057304382324219, -0.010963916778564453, -0.009870529174804688, -0.008777141571044922, -0.007683753967285156, -0.006590366363525391, -0.005496978759765625, -0.004403591156005859, -0.0033102035522460938, -0.002216815948486328, -0.0011234283447265625, -3.0040740966796875e-05, 0.0010633468627929688, 0.0021567344665527344, 0.0032501220703125, 0.004343509674072266, 0.005436897277832031, 0.006530284881591797, 0.0076236724853515625, 0.008717060089111328, 0.009810447692871094, 0.01090383529663086, 0.011997222900390625, 0.01309061050415039, 0.014183998107910156, 0.015277385711669922, 0.016370773315429688, 0.017464160919189453, 0.01855754852294922, 0.019650936126708984, 0.02074432373046875, 0.021837711334228516, 0.02293109893798828, 0.024024486541748047, 0.025117874145507812, 0.026211261749267578, 0.027304649353027344, 0.02839803695678711, 0.029491424560546875, 0.03058481216430664, 0.031678199768066406, 0.03277158737182617, 0.03386497497558594, 0.0349583625793457, 0.03605175018310547, 0.037145137786865234, 0.038238525390625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 11.0, 12.0, 16.0, 21.0, 18.0, 19.0, 30.0, 40.0, 51.0, 73.0, 82.0, 99.0, 80.0, 69.0, 59.0, 56.0, 45.0, 43.0, 24.0, 34.0, 25.0, 22.0, 15.0, 11.0, 4.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0186004638671875, -0.017957210540771484, -0.01731395721435547, -0.016670703887939453, -0.016027450561523438, -0.015384197235107422, -0.014740943908691406, -0.01409769058227539, -0.013454437255859375, -0.01281118392944336, -0.012167930603027344, -0.011524677276611328, -0.010881423950195312, -0.010238170623779297, -0.009594917297363281, -0.008951663970947266, -0.00830841064453125, -0.007665157318115234, -0.007021903991699219, -0.006378650665283203, -0.0057353973388671875, -0.005092144012451172, -0.004448890686035156, -0.0038056373596191406, -0.003162384033203125, -0.0025191307067871094, -0.0018758773803710938, -0.0012326240539550781, -0.0005893707275390625, 5.3882598876953125e-05, 0.0006971359252929688, 0.0013403892517089844, 0.001983642578125, 0.0026268959045410156, 0.0032701492309570312, 0.003913402557373047, 0.0045566558837890625, 0.005199909210205078, 0.005843162536621094, 0.006486415863037109, 0.007129669189453125, 0.007772922515869141, 0.008416175842285156, 0.009059429168701172, 0.009702682495117188, 0.010345935821533203, 0.010989189147949219, 0.011632442474365234, 0.01227569580078125, 0.012918949127197266, 0.013562202453613281, 0.014205455780029297, 0.014848709106445312, 0.015491962432861328, 0.016135215759277344, 0.01677846908569336, 0.017421722412109375, 0.01806497573852539, 0.018708229064941406, 0.019351482391357422, 0.019994735717773438, 0.020637989044189453, 0.02128124237060547, 0.021924495697021484, 0.0225677490234375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 12.0, 39.0, 144.0, 590.0, 165.0, 38.0, 11.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.771942138671875, -3.578969717025757, -3.3859972953796387, -3.1930251121520996, -3.0000526905059814, -2.8070802688598633, -2.614107847213745, -2.421135425567627, -2.228163242340088, -2.0351908206939697, -1.8422185182571411, -1.649246096611023, -1.4562737941741943, -1.2633013725280762, -1.070328950881958, -0.8773566484451294, -0.6843841075897217, -0.4914117455482483, -0.2984393537044525, -0.10546696186065674, 0.08750540018081665, 0.28047776222229004, 0.4734501838684082, 0.6664224863052368, 0.859394907951355, 1.0523673295974731, 1.2453396320343018, 1.43831205368042, 1.631284475326538, 1.8242567777633667, 2.0172290802001953, 2.2102015018463135, 2.4031739234924316, 2.59614634513855, 2.789118766784668, 2.982090950012207, 3.175063371658325, 3.3680357933044434, 3.5610082149505615, 3.7539806365966797, 3.9469528198242188, 4.139925003051758, 4.332897663116455, 4.525869846343994, 4.718842506408691, 4.9118146896362305, 5.1047868728637695, 5.297759532928467, 5.490732192993164, 5.683704376220703, 5.8766770362854, 6.0696492195129395, 6.262621879577637, 6.455594062805176, 6.648566246032715, 6.841538906097412, 7.034511089324951, 7.22748327255249, 7.4204559326171875, 7.613428115844727, 7.806400775909424, 7.999372959136963, 8.19234561920166, 8.3853178024292, 8.578289985656738]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 8.0, 12.0, 10.0, 19.0, 25.0, 33.0, 47.0, 64.0, 68.0, 74.0, 78.0, 105.0, 92.0, 89.0, 59.0, 51.0, 41.0, 27.0, 21.0, 14.0, 10.0, 9.0, 5.0, 4.0, 6.0, 4.0, 2.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1868035793304443, -2.1156365871429443, -2.0444695949554443, -1.9733024835586548, -1.9021354913711548, -1.8309684991836548, -1.7598013877868652, -1.6886343955993652, -1.6174674034118652, -1.5463004112243652, -1.4751334190368652, -1.4039663076400757, -1.3327993154525757, -1.2616323232650757, -1.1904652118682861, -1.1192982196807861, -1.0481312274932861, -0.9769642353057861, -0.9057971835136414, -0.8346301317214966, -0.7634631395339966, -0.6922961473464966, -0.6211290955543518, -0.549962043762207, -0.47879505157470703, -0.40762802958488464, -0.33646100759506226, -0.26529398560523987, -0.19412696361541748, -0.12295994162559509, -0.051792919635772705, 0.019374102354049683, 0.09054088592529297, 0.16170790791511536, 0.23287492990493774, 0.30404195189476013, 0.3752089738845825, 0.4463759958744049, 0.5175430178642273, 0.5887100696563721, 0.6598770618438721, 0.7310440540313721, 0.8022111058235168, 0.8733781576156616, 0.9445451498031616, 1.0157121419906616, 1.0868792533874512, 1.1580462455749512, 1.2292132377624512, 1.3003802299499512, 1.3715472221374512, 1.4427143335342407, 1.5138813257217407, 1.5850483179092407, 1.6562154293060303, 1.7273824214935303, 1.7985494136810303, 1.8697164058685303, 1.9408833980560303, 2.0120503902435303, 2.0832176208496094, 2.1543846130371094, 2.2255516052246094, 2.2967185974121094, 2.3678855895996094]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 2.0, 0.0, 7.0, 4.0, 6.0, 2.0, 7.0, 8.0, 6.0, 13.0, 18.0, 17.0, 25.0, 44.0, 54.0, 104.0, 122.0, 223.0, 308.0, 465.0, 711.0, 1134.0, 1996.0, 4022.0, 10605.0, 56391.0, 4075008.0, 28449.0, 7128.0, 3103.0, 1571.0, 924.0, 545.0, 389.0, 281.0, 188.0, 123.0, 88.0, 65.0, 42.0, 29.0, 25.0, 13.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0], "bins": [-1.89453125, -1.84869384765625, -1.8028564453125, -1.75701904296875, -1.711181640625, -1.66534423828125, -1.6195068359375, -1.57366943359375, -1.52783203125, -1.48199462890625, -1.4361572265625, -1.39031982421875, -1.344482421875, -1.29864501953125, -1.2528076171875, -1.20697021484375, -1.1611328125, -1.11529541015625, -1.0694580078125, -1.02362060546875, -0.977783203125, -0.93194580078125, -0.8861083984375, -0.84027099609375, -0.79443359375, -0.74859619140625, -0.7027587890625, -0.65692138671875, -0.611083984375, -0.56524658203125, -0.5194091796875, -0.47357177734375, -0.427734375, -0.38189697265625, -0.3360595703125, -0.29022216796875, -0.244384765625, -0.19854736328125, -0.1527099609375, -0.10687255859375, -0.06103515625, -0.01519775390625, 0.0306396484375, 0.07647705078125, 0.122314453125, 0.16815185546875, 0.2139892578125, 0.25982666015625, 0.3056640625, 0.35150146484375, 0.3973388671875, 0.44317626953125, 0.489013671875, 0.53485107421875, 0.5806884765625, 0.62652587890625, 0.67236328125, 0.71820068359375, 0.7640380859375, 0.80987548828125, 0.855712890625, 0.90155029296875, 0.9473876953125, 0.99322509765625, 1.0390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 8.0, 7.0, 13.0, 17.0, 13.0, 26.0, 51.0, 78.0, 173.0, 202.0, 155.0, 101.0, 47.0, 20.0, 26.0, 11.0, 9.0, 7.0, 5.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.0750732421875, -0.07326364517211914, -0.07145404815673828, -0.06964445114135742, -0.06783485412597656, -0.0660252571105957, -0.06421566009521484, -0.062406063079833984, -0.060596466064453125, -0.058786869049072266, -0.056977272033691406, -0.05516767501831055, -0.05335807800292969, -0.05154848098754883, -0.04973888397216797, -0.04792928695678711, -0.04611968994140625, -0.04431009292602539, -0.04250049591064453, -0.04069089889526367, -0.03888130187988281, -0.03707170486450195, -0.035262107849121094, -0.033452510833740234, -0.031642913818359375, -0.029833316802978516, -0.028023719787597656, -0.026214122772216797, -0.024404525756835938, -0.022594928741455078, -0.02078533172607422, -0.01897573471069336, -0.0171661376953125, -0.01535654067993164, -0.013546943664550781, -0.011737346649169922, -0.009927749633789062, -0.008118152618408203, -0.006308555603027344, -0.004498958587646484, -0.002689361572265625, -0.0008797645568847656, 0.0009298324584960938, 0.002739429473876953, 0.0045490264892578125, 0.006358623504638672, 0.008168220520019531, 0.00997781753540039, 0.01178741455078125, 0.01359701156616211, 0.015406608581542969, 0.017216205596923828, 0.019025802612304688, 0.020835399627685547, 0.022644996643066406, 0.024454593658447266, 0.026264190673828125, 0.028073787689208984, 0.029883384704589844, 0.0316929817199707, 0.03350257873535156, 0.03531217575073242, 0.03712177276611328, 0.03893136978149414, 0.040740966796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 3.0, 3.0, 3.0, 5.0, 9.0, 7.0, 9.0, 10.0, 21.0, 12.0, 16.0, 9.0, 30.0, 30.0, 113.0, 1148.0, 27353.0, 4146984.0, 17449.0, 799.0, 104.0, 32.0, 22.0, 12.0, 18.0, 16.0, 7.0, 12.0, 8.0, 10.0, 6.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.720703125, -2.621551513671875, -2.52239990234375, -2.423248291015625, -2.3240966796875, -2.224945068359375, -2.12579345703125, -2.026641845703125, -1.927490234375, -1.828338623046875, -1.72918701171875, -1.630035400390625, -1.5308837890625, -1.431732177734375, -1.33258056640625, -1.233428955078125, -1.13427734375, -1.035125732421875, -0.93597412109375, -0.836822509765625, -0.7376708984375, -0.638519287109375, -0.53936767578125, -0.440216064453125, -0.341064453125, -0.241912841796875, -0.14276123046875, -0.043609619140625, 0.0555419921875, 0.154693603515625, 0.25384521484375, 0.352996826171875, 0.4521484375, 0.551300048828125, 0.65045166015625, 0.749603271484375, 0.8487548828125, 0.947906494140625, 1.04705810546875, 1.146209716796875, 1.245361328125, 1.344512939453125, 1.44366455078125, 1.542816162109375, 1.6419677734375, 1.741119384765625, 1.84027099609375, 1.939422607421875, 2.03857421875, 2.137725830078125, 2.23687744140625, 2.336029052734375, 2.4351806640625, 2.534332275390625, 2.63348388671875, 2.732635498046875, 2.831787109375, 2.930938720703125, 3.03009033203125, 3.129241943359375, 3.2283935546875, 3.327545166015625, 3.42669677734375, 3.525848388671875, 3.625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 13.0, 6.0, 11.0, 8.0, 21.0, 16.0, 14.0, 26.0, 29.0, 41.0, 54.0, 216.0, 3305.0, 66.0, 38.0, 40.0, 19.0, 19.0, 15.0, 12.0, 18.0, 15.0, 7.0, 8.0, 9.0, 8.0, 4.0, 4.0, 3.0, 1.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.12237548828125, -0.11908149719238281, -0.11578750610351562, -0.11249351501464844, -0.10919952392578125, -0.10590553283691406, -0.10261154174804688, -0.09931755065917969, -0.0960235595703125, -0.09272956848144531, -0.08943557739257812, -0.08614158630371094, -0.08284759521484375, -0.07955360412597656, -0.07625961303710938, -0.07296562194824219, -0.069671630859375, -0.06637763977050781, -0.06308364868164062, -0.05978965759277344, -0.05649566650390625, -0.05320167541503906, -0.049907684326171875, -0.04661369323730469, -0.0433197021484375, -0.04002571105957031, -0.036731719970703125, -0.03343772888183594, -0.03014373779296875, -0.026849746704101562, -0.023555755615234375, -0.020261764526367188, -0.0169677734375, -0.013673782348632812, -0.010379791259765625, -0.0070858001708984375, -0.00379180908203125, -0.0004978179931640625, 0.002796173095703125, 0.0060901641845703125, 0.0093841552734375, 0.012678146362304688, 0.015972137451171875, 0.019266128540039062, 0.02256011962890625, 0.025854110717773438, 0.029148101806640625, 0.03244209289550781, 0.035736083984375, 0.03903007507324219, 0.042324066162109375, 0.04561805725097656, 0.04891204833984375, 0.05220603942871094, 0.055500030517578125, 0.05879402160644531, 0.0620880126953125, 0.06538200378417969, 0.06867599487304688, 0.07196998596191406, 0.07526397705078125, 0.07855796813964844, 0.08185195922851562, 0.08514595031738281, 0.08843994140625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 10.0, 18.0, 44.0, 138.0, 543.0, 181.0, 53.0, 18.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.260511636734009, -2.2157864570617676, -2.1710615158081055, -2.1263363361358643, -2.081611394882202, -2.036886215209961, -1.9921611547470093, -1.9474360942840576, -1.902711033821106, -1.8579859733581543, -1.8132609128952026, -1.768535852432251, -1.7238106727600098, -1.679085612297058, -1.6343605518341064, -1.5896354913711548, -1.5449104309082031, -1.5001853704452515, -1.4554603099822998, -1.4107352495193481, -1.3660101890563965, -1.3212850093841553, -1.2765599489212036, -1.231834888458252, -1.1871098279953003, -1.1423847675323486, -1.097659707069397, -1.0529346466064453, -1.008209466934204, -0.9634844660758972, -0.9187593460083008, -0.8740342855453491, -0.829309344291687, -0.7845842838287354, -0.7398592233657837, -0.6951341032981873, -0.6504090428352356, -0.6056839823722839, -0.5609588623046875, -0.5162338018417358, -0.4715087413787842, -0.4267836809158325, -0.38205859065055847, -0.3373335003852844, -0.29260843992233276, -0.2478833645582199, -0.20315828919410706, -0.158433198928833, -0.11370813846588135, -0.0689830631017685, -0.02425798773765564, 0.020467087626457214, 0.06519216299057007, 0.10991723835468292, 0.15464231371879578, 0.19936740398406982, 0.24409246444702148, 0.28881752490997314, 0.3335426151752472, 0.37826770544052124, 0.4229927659034729, 0.46771782636642456, 0.512442946434021, 0.5571680068969727, 0.6018930673599243]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 5.0, 5.0, 8.0, 8.0, 15.0, 29.0, 24.0, 37.0, 54.0, 59.0, 82.0, 76.0, 87.0, 87.0, 83.0, 78.0, 55.0, 72.0, 39.0, 24.0, 26.0, 12.0, 14.0, 8.0, 6.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7095207571983337, -0.6930294632911682, -0.6765381693840027, -0.6600468158721924, -0.6435555219650269, -0.6270642280578613, -0.6105729341506958, -0.5940816402435303, -0.57759028673172, -0.5610989928245544, -0.5446076989173889, -0.5281163454055786, -0.5116250514984131, -0.49513375759124756, -0.47864246368408203, -0.4621511399745941, -0.4456598460674286, -0.42916855216026306, -0.41267722845077515, -0.3961859345436096, -0.3796946108341217, -0.3632033169269562, -0.34671199321746826, -0.33022069931030273, -0.3137294054031372, -0.2972381114959717, -0.28074678778648376, -0.26425549387931824, -0.24776417016983032, -0.2312728762626648, -0.21478156745433807, -0.19829025864601135, -0.18179893493652344, -0.16530762612819672, -0.14881631731987, -0.13232502341270447, -0.11583370715379715, -0.09934239834547043, -0.0828510969877243, -0.06635978817939758, -0.04986847937107086, -0.03337717056274414, -0.016885865479707718, -0.00039456039667129517, 0.016096748411655426, 0.03258805721998215, 0.04907935857772827, 0.06557066738605499, 0.08206197619438171, 0.09855328500270844, 0.11504459381103516, 0.13153588771820068, 0.1480272114276886, 0.16451850533485413, 0.18100981414318085, 0.19750112295150757, 0.2139924317598343, 0.230483740568161, 0.24697504937648773, 0.26346635818481445, 0.27995765209198, 0.2964489758014679, 0.3129402697086334, 0.32943159341812134, 0.34592288732528687]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 9.0, 9.0, 12.0, 13.0, 17.0, 23.0, 33.0, 67.0, 116.0, 179.0, 320.0, 666.0, 1311.0, 3253.0, 9789.0, 47056.0, 793158.0, 163967.0, 19058.0, 5462.0, 2059.0, 887.0, 481.0, 234.0, 121.0, 78.0, 60.0, 27.0, 19.0, 19.0, 6.0, 11.0, 10.0, 8.0, 7.0, 5.0, 2.0, 0.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78515625, -0.7604217529296875, -0.735687255859375, -0.7109527587890625, -0.68621826171875, -0.6614837646484375, -0.636749267578125, -0.6120147705078125, -0.5872802734375, -0.5625457763671875, -0.537811279296875, -0.5130767822265625, -0.48834228515625, -0.4636077880859375, -0.438873291015625, -0.4141387939453125, -0.389404296875, -0.3646697998046875, -0.339935302734375, -0.3152008056640625, -0.29046630859375, -0.2657318115234375, -0.240997314453125, -0.2162628173828125, -0.1915283203125, -0.1667938232421875, -0.142059326171875, -0.1173248291015625, -0.09259033203125, -0.0678558349609375, -0.043121337890625, -0.0183868408203125, 0.00634765625, 0.0310821533203125, 0.055816650390625, 0.0805511474609375, 0.10528564453125, 0.1300201416015625, 0.154754638671875, 0.1794891357421875, 0.2042236328125, 0.2289581298828125, 0.253692626953125, 0.2784271240234375, 0.30316162109375, 0.3278961181640625, 0.352630615234375, 0.3773651123046875, 0.402099609375, 0.4268341064453125, 0.451568603515625, 0.4763031005859375, 0.50103759765625, 0.5257720947265625, 0.550506591796875, 0.5752410888671875, 0.5999755859375, 0.6247100830078125, 0.649444580078125, 0.6741790771484375, 0.69891357421875, 0.7236480712890625, 0.748382568359375, 0.7731170654296875, 0.7978515625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 18.0, 16.0, 16.0, 47.0, 80.0, 134.0, 183.0, 191.0, 130.0, 67.0, 37.0, 19.0, 13.0, 12.0, 4.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.08050537109375, -0.07866621017456055, -0.0768270492553711, -0.07498788833618164, -0.07314872741699219, -0.07130956649780273, -0.06947040557861328, -0.06763124465942383, -0.06579208374023438, -0.06395292282104492, -0.06211376190185547, -0.060274600982666016, -0.05843544006347656, -0.05659627914428711, -0.054757118225097656, -0.0529179573059082, -0.05107879638671875, -0.0492396354675293, -0.047400474548339844, -0.04556131362915039, -0.04372215270996094, -0.041882991790771484, -0.04004383087158203, -0.03820466995239258, -0.036365509033203125, -0.03452634811401367, -0.03268718719482422, -0.030848026275634766, -0.029008865356445312, -0.02716970443725586, -0.025330543518066406, -0.023491382598876953, -0.0216522216796875, -0.019813060760498047, -0.017973899841308594, -0.01613473892211914, -0.014295578002929688, -0.012456417083740234, -0.010617256164550781, -0.008778095245361328, -0.006938934326171875, -0.005099773406982422, -0.0032606124877929688, -0.0014214515686035156, 0.0004177093505859375, 0.0022568702697753906, 0.004096031188964844, 0.005935192108154297, 0.00777435302734375, 0.009613513946533203, 0.011452674865722656, 0.01329183578491211, 0.015130996704101562, 0.016970157623291016, 0.01880931854248047, 0.020648479461669922, 0.022487640380859375, 0.024326801300048828, 0.02616596221923828, 0.028005123138427734, 0.029844284057617188, 0.03168344497680664, 0.033522605895996094, 0.03536176681518555, 0.037200927734375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 13.0, 5.0, 13.0, 22.0, 34.0, 31.0, 73.0, 91.0, 111.0, 216.0, 264.0, 435.0, 734.0, 1111.0, 1819.0, 3167.0, 5751.0, 10729.0, 20494.0, 40610.0, 91612.0, 249822.0, 368430.0, 137052.0, 57599.0, 27208.0, 13673.0, 7315.0, 4053.0, 2247.0, 1369.0, 853.0, 530.0, 339.0, 226.0, 169.0, 113.0, 61.0, 46.0, 33.0, 23.0, 22.0, 7.0, 5.0, 10.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2344970703125, -0.22698402404785156, -0.21947097778320312, -0.2119579315185547, -0.20444488525390625, -0.1969318389892578, -0.18941879272460938, -0.18190574645996094, -0.1743927001953125, -0.16687965393066406, -0.15936660766601562, -0.1518535614013672, -0.14434051513671875, -0.1368274688720703, -0.12931442260742188, -0.12180137634277344, -0.114288330078125, -0.10677528381347656, -0.09926223754882812, -0.09174919128417969, -0.08423614501953125, -0.07672309875488281, -0.06921005249023438, -0.06169700622558594, -0.0541839599609375, -0.04667091369628906, -0.039157867431640625, -0.03164482116699219, -0.02413177490234375, -0.016618728637695312, -0.009105682373046875, -0.0015926361083984375, 0.00592041015625, 0.013433456420898438, 0.020946502685546875, 0.028459548950195312, 0.03597259521484375, 0.04348564147949219, 0.050998687744140625, 0.05851173400878906, 0.0660247802734375, 0.07353782653808594, 0.08105087280273438, 0.08856391906738281, 0.09607696533203125, 0.10359001159667969, 0.11110305786132812, 0.11861610412597656, 0.126129150390625, 0.13364219665527344, 0.14115524291992188, 0.1486682891845703, 0.15618133544921875, 0.1636943817138672, 0.17120742797851562, 0.17872047424316406, 0.1862335205078125, 0.19374656677246094, 0.20125961303710938, 0.2087726593017578, 0.21628570556640625, 0.2237987518310547, 0.23131179809570312, 0.23882484436035156, 0.246337890625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 6.0, 6.0, 14.0, 15.0, 19.0, 12.0, 21.0, 19.0, 20.0, 31.0, 33.0, 38.0, 35.0, 46.0, 46.0, 54.0, 50.0, 49.0, 47.0, 41.0, 54.0, 42.0, 38.0, 43.0, 42.0, 43.0, 25.0, 26.0, 6.0, 15.0, 14.0, 8.0, 15.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.152099609375, -0.1467304229736328, -0.14136123657226562, -0.13599205017089844, -0.13062286376953125, -0.12525367736816406, -0.11988449096679688, -0.11451530456542969, -0.1091461181640625, -0.10377693176269531, -0.09840774536132812, -0.09303855895996094, -0.08766937255859375, -0.08230018615722656, -0.07693099975585938, -0.07156181335449219, -0.066192626953125, -0.06082344055175781, -0.055454254150390625, -0.05008506774902344, -0.04471588134765625, -0.03934669494628906, -0.033977508544921875, -0.028608322143554688, -0.0232391357421875, -0.017869949340820312, -0.012500762939453125, -0.0071315765380859375, -0.00176239013671875, 0.0036067962646484375, 0.008975982666015625, 0.014345169067382812, 0.01971435546875, 0.025083541870117188, 0.030452728271484375, 0.03582191467285156, 0.04119110107421875, 0.04656028747558594, 0.051929473876953125, 0.05729866027832031, 0.0626678466796875, 0.06803703308105469, 0.07340621948242188, 0.07877540588378906, 0.08414459228515625, 0.08951377868652344, 0.09488296508789062, 0.10025215148925781, 0.105621337890625, 0.11099052429199219, 0.11635971069335938, 0.12172889709472656, 0.12709808349609375, 0.13246726989746094, 0.13783645629882812, 0.1432056427001953, 0.1485748291015625, 0.1539440155029297, 0.15931320190429688, 0.16468238830566406, 0.17005157470703125, 0.17542076110839844, 0.18078994750976562, 0.1861591339111328, 0.1915283203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 7.0, 9.0, 7.0, 16.0, 10.0, 16.0, 28.0, 40.0, 52.0, 64.0, 126.0, 183.0, 305.0, 556.0, 1151.0, 2778.0, 8270.0, 38335.0, 702950.0, 259247.0, 24132.0, 5989.0, 2123.0, 897.0, 521.0, 271.0, 154.0, 97.0, 64.0, 40.0, 36.0, 15.0, 18.0, 7.0, 14.0, 9.0, 4.0, 7.0, 5.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.297607421875, -0.28826904296875, -0.2789306640625, -0.26959228515625, -0.26025390625, -0.25091552734375, -0.2415771484375, -0.23223876953125, -0.222900390625, -0.21356201171875, -0.2042236328125, -0.19488525390625, -0.185546875, -0.17620849609375, -0.1668701171875, -0.15753173828125, -0.148193359375, -0.13885498046875, -0.1295166015625, -0.12017822265625, -0.11083984375, -0.10150146484375, -0.0921630859375, -0.08282470703125, -0.073486328125, -0.06414794921875, -0.0548095703125, -0.04547119140625, -0.0361328125, -0.02679443359375, -0.0174560546875, -0.00811767578125, 0.001220703125, 0.01055908203125, 0.0198974609375, 0.02923583984375, 0.03857421875, 0.04791259765625, 0.0572509765625, 0.06658935546875, 0.075927734375, 0.08526611328125, 0.0946044921875, 0.10394287109375, 0.11328125, 0.12261962890625, 0.1319580078125, 0.14129638671875, 0.150634765625, 0.15997314453125, 0.1693115234375, 0.17864990234375, 0.18798828125, 0.19732666015625, 0.2066650390625, 0.21600341796875, 0.225341796875, 0.23468017578125, 0.2440185546875, 0.25335693359375, 0.2626953125, 0.27203369140625, 0.2813720703125, 0.29071044921875, 0.300048828125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 5.0, 8.0, 7.0, 12.0, 26.0, 34.0, 64.0, 419.0, 257.0, 53.0, 22.0, 12.0, 8.0, 14.0, 5.0, 7.0, 7.0, 6.0, 0.0, 3.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023865699768066406, -0.00023065879940986633, -0.0002226606011390686, -0.00021466240286827087, -0.00020666420459747314, -0.00019866600632667542, -0.00019066780805587769, -0.00018266960978507996, -0.00017467141151428223, -0.0001666732132434845, -0.00015867501497268677, -0.00015067681670188904, -0.0001426786184310913, -0.00013468042016029358, -0.00012668222188949585, -0.00011868402361869812, -0.00011068582534790039, -0.00010268762707710266, -9.468942880630493e-05, -8.66912305355072e-05, -7.869303226470947e-05, -7.069483399391174e-05, -6.269663572311401e-05, -5.4698437452316284e-05, -4.6700239181518555e-05, -3.8702040910720825e-05, -3.0703842639923096e-05, -2.2705644369125366e-05, -1.4707446098327637e-05, -6.709247827529907e-06, 1.2889504432678223e-06, 9.287148714065552e-06, 1.728534698486328e-05, 2.528354525566101e-05, 3.328174352645874e-05, 4.127994179725647e-05, 4.92781400680542e-05, 5.727633833885193e-05, 6.527453660964966e-05, 7.327273488044739e-05, 8.127093315124512e-05, 8.926913142204285e-05, 9.726732969284058e-05, 0.0001052655279636383, 0.00011326372623443604, 0.00012126192450523376, 0.0001292601227760315, 0.00013725832104682922, 0.00014525651931762695, 0.00015325471758842468, 0.0001612529158592224, 0.00016925111413002014, 0.00017724931240081787, 0.0001852475106716156, 0.00019324570894241333, 0.00020124390721321106, 0.0002092421054840088, 0.00021724030375480652, 0.00022523850202560425, 0.00023323670029640198, 0.0002412348985671997, 0.00024923309683799744, 0.00025723129510879517, 0.0002652294933795929, 0.0002732276916503906]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 4.0, 5.0, 16.0, 20.0, 22.0, 34.0, 44.0, 72.0, 73.0, 131.0, 224.0, 343.0, 566.0, 870.0, 1479.0, 2769.0, 5775.0, 14142.0, 44373.0, 305833.0, 580240.0, 59833.0, 17548.0, 6835.0, 3090.0, 1622.0, 903.0, 571.0, 359.0, 216.0, 168.0, 117.0, 82.0, 55.0, 40.0, 20.0, 14.0, 10.0, 7.0, 10.0, 7.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19189453125, -0.18552017211914062, -0.17914581298828125, -0.17277145385742188, -0.1663970947265625, -0.16002273559570312, -0.15364837646484375, -0.14727401733398438, -0.140899658203125, -0.13452529907226562, -0.12815093994140625, -0.12177658081054688, -0.1154022216796875, -0.10902786254882812, -0.10265350341796875, -0.09627914428710938, -0.08990478515625, -0.08353042602539062, -0.07715606689453125, -0.07078170776367188, -0.0644073486328125, -0.058032989501953125, -0.05165863037109375, -0.045284271240234375, -0.038909912109375, -0.032535552978515625, -0.02616119384765625, -0.019786834716796875, -0.0134124755859375, -0.007038116455078125, -0.00066375732421875, 0.005710601806640625, 0.0120849609375, 0.018459320068359375, 0.02483367919921875, 0.031208038330078125, 0.0375823974609375, 0.043956756591796875, 0.05033111572265625, 0.056705474853515625, 0.063079833984375, 0.06945419311523438, 0.07582855224609375, 0.08220291137695312, 0.0885772705078125, 0.09495162963867188, 0.10132598876953125, 0.10770034790039062, 0.11407470703125, 0.12044906616210938, 0.12682342529296875, 0.13319778442382812, 0.1395721435546875, 0.14594650268554688, 0.15232086181640625, 0.15869522094726562, 0.165069580078125, 0.17144393920898438, 0.17781829833984375, 0.18419265747070312, 0.1905670166015625, 0.19694137573242188, 0.20331573486328125, 0.20969009399414062, 0.216064453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 8.0, 12.0, 13.0, 16.0, 32.0, 31.0, 41.0, 80.0, 112.0, 166.0, 149.0, 94.0, 64.0, 47.0, 32.0, 26.0, 16.0, 17.0, 8.0, 7.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1131591796875, -0.10878372192382812, -0.10440826416015625, -0.10003280639648438, -0.0956573486328125, -0.09128189086914062, -0.08690643310546875, -0.08253097534179688, -0.078155517578125, -0.07378005981445312, -0.06940460205078125, -0.06502914428710938, -0.0606536865234375, -0.056278228759765625, -0.05190277099609375, -0.047527313232421875, -0.04315185546875, -0.038776397705078125, -0.03440093994140625, -0.030025482177734375, -0.0256500244140625, -0.021274566650390625, -0.01689910888671875, -0.012523651123046875, -0.008148193359375, -0.003772735595703125, 0.00060272216796875, 0.004978179931640625, 0.0093536376953125, 0.013729095458984375, 0.01810455322265625, 0.022480010986328125, 0.02685546875, 0.031230926513671875, 0.03560638427734375, 0.039981842041015625, 0.0443572998046875, 0.048732757568359375, 0.05310821533203125, 0.057483673095703125, 0.061859130859375, 0.06623458862304688, 0.07061004638671875, 0.07498550415039062, 0.0793609619140625, 0.08373641967773438, 0.08811187744140625, 0.09248733520507812, 0.09686279296875, 0.10123825073242188, 0.10561370849609375, 0.10998916625976562, 0.1143646240234375, 0.11874008178710938, 0.12311553955078125, 0.12749099731445312, 0.131866455078125, 0.13624191284179688, 0.14061737060546875, 0.14499282836914062, 0.1493682861328125, 0.15374374389648438, 0.15811920166015625, 0.16249465942382812, 0.1668701171875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 5.0, 7.0, 20.0, 23.0, 36.0, 72.0, 135.0, 243.0, 195.0, 101.0, 63.0, 42.0, 17.0, 14.0, 9.0, 8.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8489274978637695, -2.771926164627075, -2.69492506980896, -2.6179237365722656, -2.5409226417541504, -2.463921308517456, -2.3869199752807617, -2.3099188804626465, -2.232917547225952, -2.155916213989258, -2.0789151191711426, -2.0019137859344482, -1.9249125719070435, -1.8479113578796387, -1.7709100246429443, -1.6939088106155396, -1.6169075965881348, -1.53990638256073, -1.4629051685333252, -1.3859038352966309, -1.308902621269226, -1.2319014072418213, -1.154900074005127, -1.0778988599777222, -1.0008976459503174, -0.9238964319229126, -0.846895158290863, -0.7698938846588135, -0.6928926706314087, -0.6158914566040039, -0.5388901829719543, -0.4618889093399048, -0.3848876953125, -0.3078864514827728, -0.23088520765304565, -0.15388396382331848, -0.07688271999359131, 0.00011852383613586426, 0.07711976766586304, 0.1541210412979126, 0.23112225532531738, 0.30812349915504456, 0.38512474298477173, 0.4621259868144989, 0.5391272306442261, 0.6161284446716309, 0.6931297183036804, 0.77013099193573, 0.8471322059631348, 0.9241334199905396, 1.0011346340179443, 1.0781359672546387, 1.1551371812820435, 1.2321383953094482, 1.3091397285461426, 1.3861409425735474, 1.4631421566009521, 1.540143370628357, 1.6171445846557617, 1.694145917892456, 1.7711471319198608, 1.8481483459472656, 1.92514967918396, 2.0021510124206543, 2.0791521072387695]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 10.0, 18.0, 21.0, 36.0, 51.0, 50.0, 72.0, 83.0, 84.0, 103.0, 73.0, 91.0, 66.0, 58.0, 54.0, 41.0, 32.0, 14.0, 11.0, 9.0, 4.0, 1.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.4346957206726074, -2.3685531616210938, -2.302410840988159, -2.2362682819366455, -2.170125961303711, -2.1039834022521973, -2.0378408432006836, -1.9716984033584595, -1.9055559635162354, -1.8394135236740112, -1.773271083831787, -1.7071285247802734, -1.6409860849380493, -1.5748436450958252, -1.5087010860443115, -1.4425586462020874, -1.3764162063598633, -1.3102737665176392, -1.244131326675415, -1.1779887676239014, -1.1118463277816772, -1.0457038879394531, -0.9795613884925842, -0.9134188890457153, -0.8472764492034912, -0.7811340093612671, -0.7149915099143982, -0.6488490104675293, -0.5827065706253052, -0.516564130783081, -0.45042163133621216, -0.38427916169166565, -0.31813669204711914, -0.25199422240257263, -0.18585175275802612, -0.11970928311347961, -0.053566813468933105, 0.012575656175613403, 0.07871812582015991, 0.14486059546470642, 0.21100306510925293, 0.27714553475379944, 0.34328800439834595, 0.40943047404289246, 0.47557294368743896, 0.5417153835296631, 0.607857882976532, 0.6740003824234009, 0.740142822265625, 0.8062852621078491, 0.872427761554718, 0.9385702610015869, 1.004712700843811, 1.0708551406860352, 1.1369976997375488, 1.203140139579773, 1.269282579421997, 1.3354250192642212, 1.4015674591064453, 1.467710018157959, 1.533852458000183, 1.5999948978424072, 1.666137456893921, 1.732279896736145, 1.7984223365783691]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 7.0, 9.0, 16.0, 18.0, 37.0, 41.0, 70.0, 121.0, 405.0, 1952.0, 33027.0, 4149003.0, 8113.0, 1032.0, 296.0, 76.0, 31.0, 10.0, 7.0, 6.0, 1.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.56640625, -5.44354248046875, -5.3206787109375, -5.19781494140625, -5.074951171875, -4.95208740234375, -4.8292236328125, -4.70635986328125, -4.58349609375, -4.46063232421875, -4.3377685546875, -4.21490478515625, -4.092041015625, -3.96917724609375, -3.8463134765625, -3.72344970703125, -3.6005859375, -3.47772216796875, -3.3548583984375, -3.23199462890625, -3.109130859375, -2.98626708984375, -2.8634033203125, -2.74053955078125, -2.61767578125, -2.49481201171875, -2.3719482421875, -2.24908447265625, -2.126220703125, -2.00335693359375, -1.8804931640625, -1.75762939453125, -1.634765625, -1.51190185546875, -1.3890380859375, -1.26617431640625, -1.143310546875, -1.02044677734375, -0.8975830078125, -0.77471923828125, -0.65185546875, -0.52899169921875, -0.4061279296875, -0.28326416015625, -0.160400390625, -0.03753662109375, 0.0853271484375, 0.20819091796875, 0.3310546875, 0.45391845703125, 0.5767822265625, 0.69964599609375, 0.822509765625, 0.94537353515625, 1.0682373046875, 1.19110107421875, 1.31396484375, 1.43682861328125, 1.5596923828125, 1.68255615234375, 1.805419921875, 1.92828369140625, 2.0511474609375, 2.17401123046875, 2.296875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 1.0, 9.0, 12.0, 29.0, 23.0, 67.0, 137.0, 184.0, 190.0, 149.0, 91.0, 48.0, 19.0, 16.0, 7.0, 7.0, 4.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.11407470703125, -0.11154890060424805, -0.1090230941772461, -0.10649728775024414, -0.10397148132324219, -0.10144567489624023, -0.09891986846923828, -0.09639406204223633, -0.09386825561523438, -0.09134244918823242, -0.08881664276123047, -0.08629083633422852, -0.08376502990722656, -0.08123922348022461, -0.07871341705322266, -0.0761876106262207, -0.07366180419921875, -0.0711359977722168, -0.06861019134521484, -0.06608438491821289, -0.06355857849121094, -0.061032772064208984, -0.05850696563720703, -0.05598115921020508, -0.053455352783203125, -0.05092954635620117, -0.04840373992919922, -0.045877933502197266, -0.04335212707519531, -0.04082632064819336, -0.038300514221191406, -0.03577470779418945, -0.0332489013671875, -0.030723094940185547, -0.028197288513183594, -0.02567148208618164, -0.023145675659179688, -0.020619869232177734, -0.01809406280517578, -0.015568256378173828, -0.013042449951171875, -0.010516643524169922, -0.007990837097167969, -0.005465030670166016, -0.0029392242431640625, -0.0004134178161621094, 0.0021123886108398438, 0.004638195037841797, 0.00716400146484375, 0.009689807891845703, 0.012215614318847656, 0.01474142074584961, 0.017267227172851562, 0.019793033599853516, 0.02231884002685547, 0.024844646453857422, 0.027370452880859375, 0.029896259307861328, 0.03242206573486328, 0.034947872161865234, 0.03747367858886719, 0.03999948501586914, 0.042525291442871094, 0.04505109786987305, 0.047576904296875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 4.0, 9.0, 11.0, 19.0, 32.0, 26.0, 40.0, 69.0, 116.0, 131.0, 218.0, 367.0, 582.0, 971.0, 1662.0, 2989.0, 5564.0, 11149.0, 24490.0, 66202.0, 782486.0, 3181529.0, 66624.0, 24588.0, 11341.0, 5691.0, 3073.0, 1660.0, 980.0, 594.0, 349.0, 244.0, 153.0, 94.0, 64.0, 46.0, 27.0, 22.0, 19.0, 13.0, 11.0, 9.0, 5.0, 4.0, 2.0, 2.0], "bins": [-0.5849609375, -0.5699653625488281, -0.5549697875976562, -0.5399742126464844, -0.5249786376953125, -0.5099830627441406, -0.49498748779296875, -0.4799919128417969, -0.464996337890625, -0.4500007629394531, -0.43500518798828125, -0.4200096130371094, -0.4050140380859375, -0.3900184631347656, -0.37502288818359375, -0.3600273132324219, -0.34503173828125, -0.3300361633300781, -0.31504058837890625, -0.3000450134277344, -0.2850494384765625, -0.2700538635253906, -0.25505828857421875, -0.24006271362304688, -0.225067138671875, -0.21007156372070312, -0.19507598876953125, -0.18008041381835938, -0.1650848388671875, -0.15008926391601562, -0.13509368896484375, -0.12009811401367188, -0.1051025390625, -0.09010696411132812, -0.07511138916015625, -0.060115814208984375, -0.0451202392578125, -0.030124664306640625, -0.01512908935546875, -0.000133514404296875, 0.014862060546875, 0.029857635498046875, 0.04485321044921875, 0.059848785400390625, 0.0748443603515625, 0.08983993530273438, 0.10483551025390625, 0.11983108520507812, 0.13482666015625, 0.14982223510742188, 0.16481781005859375, 0.17981338500976562, 0.1948089599609375, 0.20980453491210938, 0.22480010986328125, 0.23979568481445312, 0.254791259765625, 0.2697868347167969, 0.28478240966796875, 0.2997779846191406, 0.3147735595703125, 0.3297691345214844, 0.34476470947265625, 0.3597602844238281, 0.374755859375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 6.0, 8.0, 4.0, 6.0, 7.0, 9.0, 10.0, 22.0, 26.0, 24.0, 32.0, 34.0, 49.0, 72.0, 151.0, 3053.0, 226.0, 96.0, 50.0, 38.0, 26.0, 28.0, 15.0, 15.0, 9.0, 11.0, 8.0, 8.0, 7.0, 8.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11639404296875, -0.11313056945800781, -0.10986709594726562, -0.10660362243652344, -0.10334014892578125, -0.10007667541503906, -0.09681320190429688, -0.09354972839355469, -0.0902862548828125, -0.08702278137207031, -0.08375930786132812, -0.08049583435058594, -0.07723236083984375, -0.07396888732910156, -0.07070541381835938, -0.06744194030761719, -0.064178466796875, -0.06091499328613281, -0.057651519775390625, -0.05438804626464844, -0.05112457275390625, -0.04786109924316406, -0.044597625732421875, -0.04133415222167969, -0.0380706787109375, -0.03480720520019531, -0.031543731689453125, -0.028280258178710938, -0.02501678466796875, -0.021753311157226562, -0.018489837646484375, -0.015226364135742188, -0.011962890625, -0.008699417114257812, -0.005435943603515625, -0.0021724700927734375, 0.00109100341796875, 0.0043544769287109375, 0.007617950439453125, 0.010881423950195312, 0.0141448974609375, 0.017408370971679688, 0.020671844482421875, 0.023935317993164062, 0.02719879150390625, 0.030462265014648438, 0.033725738525390625, 0.03698921203613281, 0.040252685546875, 0.04351615905761719, 0.046779632568359375, 0.05004310607910156, 0.05330657958984375, 0.05657005310058594, 0.059833526611328125, 0.06309700012207031, 0.0663604736328125, 0.06962394714355469, 0.07288742065429688, 0.07615089416503906, 0.07941436767578125, 0.08267784118652344, 0.08594131469726562, 0.08920478820800781, 0.09246826171875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 6.0, 5.0, 4.0, 13.0, 15.0, 22.0, 23.0, 41.0, 62.0, 77.0, 113.0, 161.0, 142.0, 89.0, 74.0, 38.0, 45.0, 17.0, 13.0, 10.0, 5.0, 9.0, 3.0, 6.0, 4.0, 6.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.418947696685791, -0.40444493293762207, -0.3899421691894531, -0.3754394054412842, -0.3609366714954376, -0.3464339077472687, -0.33193114399909973, -0.3174283802509308, -0.30292564630508423, -0.2884228825569153, -0.27392011880874634, -0.2594173550605774, -0.24491462111473083, -0.2304118573665619, -0.21590909361839294, -0.201406329870224, -0.18690356612205505, -0.1724008023738861, -0.15789805352687836, -0.1433952897787094, -0.12889254093170166, -0.11438977718353271, -0.09988701343536377, -0.08538425713777542, -0.07088150084018707, -0.056378744542598724, -0.04187598451972008, -0.02737322449684143, -0.012870468199253082, 0.0016322880983352661, 0.01613505184650421, 0.03063780814409256, 0.04514056444168091, 0.05964332073926926, 0.0741460770368576, 0.08864884078502655, 0.1031515970826149, 0.11765435338020325, 0.1321571171283722, 0.14665988087654114, 0.1611626297235489, 0.17566539347171783, 0.19016814231872559, 0.20467090606689453, 0.21917366981506348, 0.23367641866207123, 0.24817918241024017, 0.2626819312572479, 0.27718469500541687, 0.2916874587535858, 0.30619022250175476, 0.3206929564476013, 0.33519572019577026, 0.3496984839439392, 0.36420124769210815, 0.3787040114402771, 0.39320677518844604, 0.407709538936615, 0.42221230268478394, 0.4367150664329529, 0.45121780037879944, 0.4657205641269684, 0.48022332787513733, 0.4947260916233063, 0.5092288255691528]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 8.0, 6.0, 12.0, 20.0, 14.0, 26.0, 20.0, 26.0, 28.0, 38.0, 41.0, 44.0, 52.0, 57.0, 41.0, 46.0, 49.0, 46.0, 44.0, 43.0, 36.0, 30.0, 41.0, 36.0, 35.0, 29.0, 17.0, 23.0, 15.0, 16.0, 19.0, 5.0, 6.0, 9.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.3641483187675476, -0.35382455587387085, -0.3435007929801941, -0.33317703008651733, -0.3228532671928406, -0.3125295042991638, -0.30220574140548706, -0.2918819785118103, -0.28155821561813354, -0.2712344527244568, -0.26091068983078003, -0.25058692693710327, -0.2402631640434265, -0.22993940114974976, -0.219615638256073, -0.20929187536239624, -0.1989680975675583, -0.18864433467388153, -0.17832057178020477, -0.16799680888652802, -0.15767304599285126, -0.1473492830991745, -0.13702550530433655, -0.1267017424106598, -0.11637798696756363, -0.10605422407388687, -0.09573046118021011, -0.08540669083595276, -0.075082927942276, -0.06475916504859924, -0.054435402154922485, -0.04411163926124573, -0.03378787636756897, -0.023464113473892212, -0.013140348717570305, -0.002816583961248398, 0.00750717893242836, 0.017830941826105118, 0.028154708445072174, 0.03847847133874893, 0.04880223423242569, 0.05912599712610245, 0.0694497600197792, 0.07977353036403656, 0.09009729325771332, 0.10042105615139008, 0.11074481904506683, 0.12106858193874359, 0.13139234483242035, 0.1417161077260971, 0.15203987061977386, 0.16236363351345062, 0.17268739640712738, 0.18301115930080414, 0.1933349370956421, 0.20365869998931885, 0.2139824628829956, 0.22430622577667236, 0.23462998867034912, 0.24495375156402588, 0.25527751445770264, 0.2656012773513794, 0.27592504024505615, 0.2862488031387329, 0.29657256603240967]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 4.0, 7.0, 4.0, 11.0, 4.0, 8.0, 12.0, 15.0, 20.0, 27.0, 38.0, 68.0, 90.0, 165.0, 247.0, 522.0, 975.0, 2257.0, 6841.0, 37848.0, 632038.0, 333216.0, 25068.0, 5299.0, 1863.0, 838.0, 373.0, 239.0, 144.0, 85.0, 54.0, 39.0, 28.0, 30.0, 18.0, 11.0, 11.0, 10.0, 5.0, 5.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.69677734375, -0.6749343872070312, -0.6530914306640625, -0.6312484741210938, -0.609405517578125, -0.5875625610351562, -0.5657196044921875, -0.5438766479492188, -0.52203369140625, -0.5001907348632812, -0.4783477783203125, -0.45650482177734375, -0.434661865234375, -0.41281890869140625, -0.3909759521484375, -0.36913299560546875, -0.3472900390625, -0.32544708251953125, -0.3036041259765625, -0.28176116943359375, -0.259918212890625, -0.23807525634765625, -0.2162322998046875, -0.19438934326171875, -0.17254638671875, -0.15070343017578125, -0.1288604736328125, -0.10701751708984375, -0.085174560546875, -0.06333160400390625, -0.0414886474609375, -0.01964569091796875, 0.002197265625, 0.02404022216796875, 0.0458831787109375, 0.06772613525390625, 0.089569091796875, 0.11141204833984375, 0.1332550048828125, 0.15509796142578125, 0.17694091796875, 0.19878387451171875, 0.2206268310546875, 0.24246978759765625, 0.264312744140625, 0.28615570068359375, 0.3079986572265625, 0.32984161376953125, 0.3516845703125, 0.37352752685546875, 0.3953704833984375, 0.41721343994140625, 0.439056396484375, 0.46089935302734375, 0.4827423095703125, 0.5045852661132812, 0.52642822265625, 0.5482711791992188, 0.5701141357421875, 0.5919570922851562, 0.613800048828125, 0.6356430053710938, 0.6574859619140625, 0.6793289184570312, 0.701171875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 8.0, 6.0, 16.0, 38.0, 82.0, 126.0, 187.0, 186.0, 136.0, 107.0, 51.0, 26.0, 13.0, 6.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.10980224609375, -0.10732030868530273, -0.10483837127685547, -0.1023564338684082, -0.09987449645996094, -0.09739255905151367, -0.0949106216430664, -0.09242868423461914, -0.08994674682617188, -0.08746480941772461, -0.08498287200927734, -0.08250093460083008, -0.08001899719238281, -0.07753705978393555, -0.07505512237548828, -0.07257318496704102, -0.07009124755859375, -0.06760931015014648, -0.06512737274169922, -0.06264543533325195, -0.06016349792480469, -0.05768156051635742, -0.055199623107910156, -0.05271768569946289, -0.050235748291015625, -0.04775381088256836, -0.045271873474121094, -0.04278993606567383, -0.04030799865722656, -0.0378260612487793, -0.03534412384033203, -0.032862186431884766, -0.0303802490234375, -0.027898311614990234, -0.02541637420654297, -0.022934436798095703, -0.020452499389648438, -0.017970561981201172, -0.015488624572753906, -0.01300668716430664, -0.010524749755859375, -0.00804281234741211, -0.005560874938964844, -0.003078937530517578, -0.0005970001220703125, 0.0018849372863769531, 0.004366874694824219, 0.006848812103271484, 0.00933074951171875, 0.011812686920166016, 0.014294624328613281, 0.016776561737060547, 0.019258499145507812, 0.021740436553955078, 0.024222373962402344, 0.02670431137084961, 0.029186248779296875, 0.03166818618774414, 0.034150123596191406, 0.03663206100463867, 0.03911399841308594, 0.0415959358215332, 0.04407787322998047, 0.046559810638427734, 0.049041748046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 4.0, 10.0, 6.0, 8.0, 23.0, 28.0, 25.0, 56.0, 100.0, 117.0, 229.0, 368.0, 549.0, 1037.0, 1856.0, 3452.0, 7120.0, 16365.0, 45737.0, 162472.0, 530883.0, 190293.0, 53000.0, 18419.0, 7994.0, 3676.0, 1981.0, 1046.0, 631.0, 368.0, 247.0, 148.0, 106.0, 83.0, 34.0, 25.0, 22.0, 18.0, 6.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.329345703125, -0.32033538818359375, -0.3113250732421875, -0.30231475830078125, -0.293304443359375, -0.28429412841796875, -0.2752838134765625, -0.26627349853515625, -0.25726318359375, -0.24825286865234375, -0.2392425537109375, -0.23023223876953125, -0.221221923828125, -0.21221160888671875, -0.2032012939453125, -0.19419097900390625, -0.1851806640625, -0.17617034912109375, -0.1671600341796875, -0.15814971923828125, -0.149139404296875, -0.14012908935546875, -0.1311187744140625, -0.12210845947265625, -0.11309814453125, -0.10408782958984375, -0.0950775146484375, -0.08606719970703125, -0.077056884765625, -0.06804656982421875, -0.0590362548828125, -0.05002593994140625, -0.041015625, -0.03200531005859375, -0.0229949951171875, -0.01398468017578125, -0.004974365234375, 0.00403594970703125, 0.0130462646484375, 0.02205657958984375, 0.03106689453125, 0.04007720947265625, 0.0490875244140625, 0.05809783935546875, 0.067108154296875, 0.07611846923828125, 0.0851287841796875, 0.09413909912109375, 0.1031494140625, 0.11215972900390625, 0.1211700439453125, 0.13018035888671875, 0.139190673828125, 0.14820098876953125, 0.1572113037109375, 0.16622161865234375, 0.17523193359375, 0.18424224853515625, 0.1932525634765625, 0.20226287841796875, 0.211273193359375, 0.22028350830078125, 0.2292938232421875, 0.23830413818359375, 0.247314453125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 4.0, 10.0, 5.0, 29.0, 24.0, 26.0, 39.0, 59.0, 54.0, 55.0, 59.0, 70.0, 72.0, 60.0, 60.0, 54.0, 59.0, 45.0, 36.0, 45.0, 28.0, 27.0, 13.0, 10.0, 8.0, 8.0, 6.0, 4.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2232666015625, -0.21695518493652344, -0.21064376831054688, -0.2043323516845703, -0.19802093505859375, -0.1917095184326172, -0.18539810180664062, -0.17908668518066406, -0.1727752685546875, -0.16646385192871094, -0.16015243530273438, -0.1538410186767578, -0.14752960205078125, -0.1412181854248047, -0.13490676879882812, -0.12859535217285156, -0.122283935546875, -0.11597251892089844, -0.10966110229492188, -0.10334968566894531, -0.09703826904296875, -0.09072685241699219, -0.08441543579101562, -0.07810401916503906, -0.0717926025390625, -0.06548118591308594, -0.059169769287109375, -0.05285835266113281, -0.04654693603515625, -0.04023551940917969, -0.033924102783203125, -0.027612686157226562, -0.02130126953125, -0.014989852905273438, -0.008678436279296875, -0.0023670196533203125, 0.00394439697265625, 0.010255813598632812, 0.016567230224609375, 0.022878646850585938, 0.0291900634765625, 0.03550148010253906, 0.041812896728515625, 0.04812431335449219, 0.05443572998046875, 0.06074714660644531, 0.06705856323242188, 0.07336997985839844, 0.079681396484375, 0.08599281311035156, 0.09230422973632812, 0.09861564636230469, 0.10492706298828125, 0.11123847961425781, 0.11754989624023438, 0.12386131286621094, 0.1301727294921875, 0.13648414611816406, 0.14279556274414062, 0.1491069793701172, 0.15541839599609375, 0.1617298126220703, 0.16804122924804688, 0.17435264587402344, 0.1806640625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 0.0, 5.0, 4.0, 6.0, 6.0, 5.0, 7.0, 16.0, 16.0, 32.0, 43.0, 77.0, 101.0, 204.0, 345.0, 676.0, 1481.0, 4155.0, 17975.0, 664243.0, 338509.0, 14334.0, 3500.0, 1385.0, 610.0, 319.0, 177.0, 105.0, 74.0, 43.0, 35.0, 19.0, 17.0, 7.0, 9.0, 8.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.446044921875, -0.4316291809082031, -0.41721343994140625, -0.4027976989746094, -0.3883819580078125, -0.3739662170410156, -0.35955047607421875, -0.3451347351074219, -0.330718994140625, -0.3163032531738281, -0.30188751220703125, -0.2874717712402344, -0.2730560302734375, -0.2586402893066406, -0.24422454833984375, -0.22980880737304688, -0.21539306640625, -0.20097732543945312, -0.18656158447265625, -0.17214584350585938, -0.1577301025390625, -0.14331436157226562, -0.12889862060546875, -0.11448287963867188, -0.100067138671875, -0.08565139770507812, -0.07123565673828125, -0.056819915771484375, -0.0424041748046875, -0.027988433837890625, -0.01357269287109375, 0.000843048095703125, 0.0152587890625, 0.029674530029296875, 0.04409027099609375, 0.058506011962890625, 0.0729217529296875, 0.08733749389648438, 0.10175323486328125, 0.11616897583007812, 0.130584716796875, 0.14500045776367188, 0.15941619873046875, 0.17383193969726562, 0.1882476806640625, 0.20266342163085938, 0.21707916259765625, 0.23149490356445312, 0.24591064453125, 0.2603263854980469, 0.27474212646484375, 0.2891578674316406, 0.3035736083984375, 0.3179893493652344, 0.33240509033203125, 0.3468208312988281, 0.361236572265625, 0.3756523132324219, 0.39006805419921875, 0.4044837951660156, 0.4188995361328125, 0.4333152770996094, 0.44773101806640625, 0.4621467590332031, 0.4765625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 2.0, 8.0, 9.0, 25.0, 31.0, 46.0, 90.0, 319.0, 235.0, 77.0, 48.0, 27.0, 26.0, 13.0, 7.0, 5.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000492095947265625, -0.0004761815071105957, -0.0004602670669555664, -0.0004443526268005371, -0.0004284381866455078, -0.0004125237464904785, -0.0003966093063354492, -0.0003806948661804199, -0.0003647804260253906, -0.00034886598587036133, -0.00033295154571533203, -0.00031703710556030273, -0.00030112266540527344, -0.00028520822525024414, -0.00026929378509521484, -0.00025337934494018555, -0.00023746490478515625, -0.00022155046463012695, -0.00020563602447509766, -0.00018972158432006836, -0.00017380714416503906, -0.00015789270401000977, -0.00014197826385498047, -0.00012606382369995117, -0.00011014938354492188, -9.423494338989258e-05, -7.832050323486328e-05, -6.240606307983398e-05, -4.649162292480469e-05, -3.057718276977539e-05, -1.4662742614746094e-05, 1.2516975402832031e-06, 1.71661376953125e-05, 3.30805778503418e-05, 4.8995018005371094e-05, 6.490945816040039e-05, 8.082389831542969e-05, 9.673833847045898e-05, 0.00011265277862548828, 0.00012856721878051758, 0.00014448165893554688, 0.00016039609909057617, 0.00017631053924560547, 0.00019222497940063477, 0.00020813941955566406, 0.00022405385971069336, 0.00023996829986572266, 0.00025588274002075195, 0.00027179718017578125, 0.00028771162033081055, 0.00030362606048583984, 0.00031954050064086914, 0.00033545494079589844, 0.00035136938095092773, 0.00036728382110595703, 0.00038319826126098633, 0.0003991127014160156, 0.0004150271415710449, 0.0004309415817260742, 0.0004468560218811035, 0.0004627704620361328, 0.0004786849021911621, 0.0004945993423461914, 0.0005105137825012207, 0.00052642822265625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 6.0, 4.0, 9.0, 10.0, 7.0, 17.0, 22.0, 28.0, 32.0, 47.0, 80.0, 122.0, 138.0, 238.0, 366.0, 520.0, 766.0, 1303.0, 2205.0, 4044.0, 9127.0, 27924.0, 165683.0, 716853.0, 85714.0, 18574.0, 6713.0, 3215.0, 1678.0, 1036.0, 663.0, 430.0, 315.0, 192.0, 121.0, 107.0, 76.0, 44.0, 33.0, 19.0, 23.0, 10.0, 11.0, 11.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.204345703125, -0.19821739196777344, -0.19208908081054688, -0.1859607696533203, -0.17983245849609375, -0.1737041473388672, -0.16757583618164062, -0.16144752502441406, -0.1553192138671875, -0.14919090270996094, -0.14306259155273438, -0.1369342803955078, -0.13080596923828125, -0.12467765808105469, -0.11854934692382812, -0.11242103576660156, -0.106292724609375, -0.10016441345214844, -0.09403610229492188, -0.08790779113769531, -0.08177947998046875, -0.07565116882324219, -0.06952285766601562, -0.06339454650878906, -0.0572662353515625, -0.05113792419433594, -0.045009613037109375, -0.03888130187988281, -0.03275299072265625, -0.026624679565429688, -0.020496368408203125, -0.014368057250976562, -0.00823974609375, -0.0021114349365234375, 0.004016876220703125, 0.010145187377929688, 0.01627349853515625, 0.022401809692382812, 0.028530120849609375, 0.03465843200683594, 0.0407867431640625, 0.04691505432128906, 0.053043365478515625, 0.05917167663574219, 0.06529998779296875, 0.07142829895019531, 0.07755661010742188, 0.08368492126464844, 0.089813232421875, 0.09594154357910156, 0.10206985473632812, 0.10819816589355469, 0.11432647705078125, 0.12045478820800781, 0.12658309936523438, 0.13271141052246094, 0.1388397216796875, 0.14496803283691406, 0.15109634399414062, 0.1572246551513672, 0.16335296630859375, 0.1694812774658203, 0.17560958862304688, 0.18173789978027344, 0.1878662109375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 1.0, 3.0, 6.0, 6.0, 6.0, 17.0, 24.0, 33.0, 47.0, 88.0, 148.0, 162.0, 142.0, 105.0, 80.0, 41.0, 34.0, 14.0, 12.0, 10.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1790771484375, -0.1740550994873047, -0.16903305053710938, -0.16401100158691406, -0.15898895263671875, -0.15396690368652344, -0.14894485473632812, -0.1439228057861328, -0.1389007568359375, -0.1338787078857422, -0.12885665893554688, -0.12383460998535156, -0.11881256103515625, -0.11379051208496094, -0.10876846313476562, -0.10374641418457031, -0.098724365234375, -0.09370231628417969, -0.08868026733398438, -0.08365821838378906, -0.07863616943359375, -0.07361412048339844, -0.06859207153320312, -0.06357002258300781, -0.0585479736328125, -0.05352592468261719, -0.048503875732421875, -0.04348182678222656, -0.03845977783203125, -0.03343772888183594, -0.028415679931640625, -0.023393630981445312, -0.01837158203125, -0.013349533081054688, -0.008327484130859375, -0.0033054351806640625, 0.00171661376953125, 0.0067386627197265625, 0.011760711669921875, 0.016782760620117188, 0.0218048095703125, 0.026826858520507812, 0.031848907470703125, 0.03687095642089844, 0.04189300537109375, 0.04691505432128906, 0.051937103271484375, 0.05695915222167969, 0.061981201171875, 0.06700325012207031, 0.07202529907226562, 0.07704734802246094, 0.08206939697265625, 0.08709144592285156, 0.09211349487304688, 0.09713554382324219, 0.1021575927734375, 0.10717964172363281, 0.11220169067382812, 0.11722373962402344, 0.12224578857421875, 0.12726783752441406, 0.13228988647460938, 0.1373119354248047, 0.142333984375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 8.0, 48.0, 182.0, 488.0, 204.0, 57.0, 17.0, 8.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.388756036758423, -2.2235968112945557, -2.0584378242492676, -1.8932785987854004, -1.7281194925308228, -1.5629603862762451, -1.397801160812378, -1.2326420545578003, -1.0674829483032227, -0.902323842048645, -0.7371646761894226, -0.5720055103302002, -0.40684640407562256, -0.24168729782104492, -0.07652813196182251, 0.0886310338973999, 0.25379014015197754, 0.41894927620887756, 0.5841084122657776, 0.749267578125, 0.9144266843795776, 1.0795857906341553, 1.2447450160980225, 1.4099041223526, 1.5750632286071777, 1.7402223348617554, 1.905381441116333, 2.0705406665802, 2.2356996536254883, 2.4008588790893555, 2.5660181045532227, 2.73117733001709, 2.896336555480957, 3.061495780944824, 3.2266547679901123, 3.3918139934539795, 3.5569729804992676, 3.7221322059631348, 3.887291431427002, 4.052450656890869, 4.217609405517578, 4.382768630981445, 4.5479278564453125, 4.7130866050720215, 4.878245830535889, 5.043405055999756, 5.208564281463623, 5.37372350692749, 5.538882732391357, 5.704041957855225, 5.869201183319092, 6.034359931945801, 6.199519157409668, 6.364678382873535, 6.529837608337402, 6.6949968338012695, 6.860156059265137, 7.025315284729004, 7.190474510192871, 7.35563325881958, 7.520792484283447, 7.6859517097473145, 7.851110935211182, 8.01626968383789, 8.181428909301758]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 7.0, 8.0, 11.0, 15.0, 15.0, 13.0, 16.0, 27.0, 30.0, 34.0, 40.0, 49.0, 47.0, 54.0, 62.0, 62.0, 51.0, 41.0, 53.0, 59.0, 40.0, 38.0, 43.0, 40.0, 25.0, 14.0, 13.0, 13.0, 18.0, 12.0, 14.0, 8.0, 6.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9719880819320679, -0.9380923509597778, -0.904196560382843, -0.870300829410553, -0.8364050388336182, -0.8025093078613281, -0.7686135768890381, -0.734717845916748, -0.7008220553398132, -0.6669263243675232, -0.6330305337905884, -0.5991348028182983, -0.5652390718460083, -0.5313432812690735, -0.49744755029678345, -0.463551789522171, -0.4296560287475586, -0.39576026797294617, -0.36186450719833374, -0.3279687762260437, -0.2940730154514313, -0.26017725467681885, -0.22628150880336761, -0.19238576292991638, -0.15849000215530396, -0.12459424883127213, -0.0906984955072403, -0.056802742183208466, -0.022906988859176636, 0.010988771915435791, 0.044884517788887024, 0.07878026366233826, 0.11267602443695068, 0.1465717852115631, 0.18046753108501434, 0.21436327695846558, 0.248259037733078, 0.28215479850769043, 0.31605052947998047, 0.3499462902545929, 0.3838420510292053, 0.41773781180381775, 0.4516335725784302, 0.4855293035507202, 0.5194250345230103, 0.5533208250999451, 0.5872165560722351, 0.6211123466491699, 0.65500807762146, 0.68890380859375, 0.7227995991706848, 0.7566953301429749, 0.7905911207199097, 0.8244868516921997, 0.8583825826644897, 0.8922783136367798, 0.9261741042137146, 0.9600698351860046, 0.9939656257629395, 1.0278613567352295, 1.0617570877075195, 1.0956528186798096, 1.1295486688613892, 1.1634443998336792, 1.1973401308059692]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 18.0, 20.0, 30.0, 51.0, 94.0, 149.0, 316.0, 1319.0, 14432.0, 4129983.0, 43969.0, 2711.0, 728.0, 267.0, 91.0, 46.0, 16.0, 10.0, 5.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.9580078125, -1.9109954833984375, -1.863983154296875, -1.8169708251953125, -1.76995849609375, -1.7229461669921875, -1.675933837890625, -1.6289215087890625, -1.5819091796875, -1.5348968505859375, -1.487884521484375, -1.4408721923828125, -1.39385986328125, -1.3468475341796875, -1.299835205078125, -1.2528228759765625, -1.205810546875, -1.1587982177734375, -1.111785888671875, -1.0647735595703125, -1.01776123046875, -0.9707489013671875, -0.923736572265625, -0.8767242431640625, -0.8297119140625, -0.7826995849609375, -0.735687255859375, -0.6886749267578125, -0.64166259765625, -0.5946502685546875, -0.547637939453125, -0.5006256103515625, -0.45361328125, -0.4066009521484375, -0.359588623046875, -0.3125762939453125, -0.26556396484375, -0.2185516357421875, -0.171539306640625, -0.1245269775390625, -0.0775146484375, -0.0305023193359375, 0.016510009765625, 0.0635223388671875, 0.11053466796875, 0.1575469970703125, 0.204559326171875, 0.2515716552734375, 0.298583984375, 0.3455963134765625, 0.392608642578125, 0.4396209716796875, 0.48663330078125, 0.5336456298828125, 0.580657958984375, 0.6276702880859375, 0.6746826171875, 0.7216949462890625, 0.768707275390625, 0.8157196044921875, 0.86273193359375, 0.9097442626953125, 0.956756591796875, 1.0037689208984375, 1.05078125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 10.0, 15.0, 15.0, 37.0, 54.0, 92.0, 135.0, 152.0, 135.0, 133.0, 91.0, 64.0, 38.0, 10.0, 9.0, 6.0, 3.0, 0.0, 2.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.10235595703125, -0.1000823974609375, -0.097808837890625, -0.0955352783203125, -0.09326171875, -0.0909881591796875, -0.088714599609375, -0.0864410400390625, -0.08416748046875, -0.0818939208984375, -0.079620361328125, -0.0773468017578125, -0.0750732421875, -0.0727996826171875, -0.070526123046875, -0.0682525634765625, -0.06597900390625, -0.0637054443359375, -0.061431884765625, -0.0591583251953125, -0.056884765625, -0.0546112060546875, -0.052337646484375, -0.0500640869140625, -0.04779052734375, -0.0455169677734375, -0.043243408203125, -0.0409698486328125, -0.0386962890625, -0.0364227294921875, -0.034149169921875, -0.0318756103515625, -0.02960205078125, -0.0273284912109375, -0.025054931640625, -0.0227813720703125, -0.0205078125, -0.0182342529296875, -0.015960693359375, -0.0136871337890625, -0.01141357421875, -0.0091400146484375, -0.006866455078125, -0.0045928955078125, -0.0023193359375, -4.57763671875e-05, 0.002227783203125, 0.0045013427734375, 0.00677490234375, 0.0090484619140625, 0.011322021484375, 0.0135955810546875, 0.015869140625, 0.0181427001953125, 0.020416259765625, 0.0226898193359375, 0.02496337890625, 0.0272369384765625, 0.029510498046875, 0.0317840576171875, 0.0340576171875, 0.0363311767578125, 0.038604736328125, 0.0408782958984375, 0.04315185546875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 12.0, 16.0, 38.0, 59.0, 131.0, 258.0, 530.0, 1101.0, 2434.0, 5923.0, 18467.0, 96773.0, 3886697.0, 146158.0, 23484.0, 7051.0, 2796.0, 1238.0, 594.0, 276.0, 125.0, 64.0, 31.0, 11.0, 9.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51416015625, -0.5001068115234375, -0.486053466796875, -0.4720001220703125, -0.45794677734375, -0.4438934326171875, -0.429840087890625, -0.4157867431640625, -0.4017333984375, -0.3876800537109375, -0.373626708984375, -0.3595733642578125, -0.34552001953125, -0.3314666748046875, -0.317413330078125, -0.3033599853515625, -0.289306640625, -0.2752532958984375, -0.261199951171875, -0.2471466064453125, -0.23309326171875, -0.2190399169921875, -0.204986572265625, -0.1909332275390625, -0.1768798828125, -0.1628265380859375, -0.148773193359375, -0.1347198486328125, -0.12066650390625, -0.1066131591796875, -0.092559814453125, -0.0785064697265625, -0.064453125, -0.0503997802734375, -0.036346435546875, -0.0222930908203125, -0.00823974609375, 0.0058135986328125, 0.019866943359375, 0.0339202880859375, 0.0479736328125, 0.0620269775390625, 0.076080322265625, 0.0901336669921875, 0.10418701171875, 0.1182403564453125, 0.132293701171875, 0.1463470458984375, 0.160400390625, 0.1744537353515625, 0.188507080078125, 0.2025604248046875, 0.21661376953125, 0.2306671142578125, 0.244720458984375, 0.2587738037109375, 0.2728271484375, 0.2868804931640625, 0.300933837890625, 0.3149871826171875, 0.32904052734375, 0.3430938720703125, 0.357147216796875, 0.3712005615234375, 0.38525390625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 5.0, 3.0, 3.0, 8.0, 5.0, 6.0, 8.0, 10.0, 18.0, 12.0, 30.0, 25.0, 55.0, 68.0, 110.0, 190.0, 2357.0, 666.0, 157.0, 107.0, 58.0, 39.0, 24.0, 17.0, 20.0, 15.0, 7.0, 8.0, 10.0, 3.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0], "bins": [-0.08148193359375, -0.07933378219604492, -0.07718563079833984, -0.07503747940063477, -0.07288932800292969, -0.07074117660522461, -0.06859302520751953, -0.06644487380981445, -0.06429672241210938, -0.0621485710144043, -0.06000041961669922, -0.05785226821899414, -0.05570411682128906, -0.053555965423583984, -0.051407814025878906, -0.04925966262817383, -0.04711151123046875, -0.04496335983276367, -0.042815208435058594, -0.040667057037353516, -0.03851890563964844, -0.03637075424194336, -0.03422260284423828, -0.0320744514465332, -0.029926300048828125, -0.027778148651123047, -0.02562999725341797, -0.02348184585571289, -0.021333694458007812, -0.019185543060302734, -0.017037391662597656, -0.014889240264892578, -0.0127410888671875, -0.010592937469482422, -0.008444786071777344, -0.006296634674072266, -0.0041484832763671875, -0.0020003318786621094, 0.00014781951904296875, 0.002295970916748047, 0.004444122314453125, 0.006592273712158203, 0.008740425109863281, 0.01088857650756836, 0.013036727905273438, 0.015184879302978516, 0.017333030700683594, 0.019481182098388672, 0.02162933349609375, 0.023777484893798828, 0.025925636291503906, 0.028073787689208984, 0.030221939086914062, 0.03237009048461914, 0.03451824188232422, 0.0366663932800293, 0.038814544677734375, 0.04096269607543945, 0.04311084747314453, 0.04525899887084961, 0.04740715026855469, 0.049555301666259766, 0.051703453063964844, 0.05385160446166992, 0.055999755859375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 9.0, 25.0, 96.0, 401.0, 363.0, 87.0, 24.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1147541999816895, -2.0706465244293213, -2.026538848876953, -1.982431173324585, -1.9383234977722168, -1.8942158222198486, -1.8501081466674805, -1.8060004711151123, -1.7618927955627441, -1.717785120010376, -1.6736774444580078, -1.6295697689056396, -1.5854620933532715, -1.5413544178009033, -1.4972467422485352, -1.453139066696167, -1.4090313911437988, -1.3649237155914307, -1.3208160400390625, -1.2767083644866943, -1.2326006889343262, -1.188493013381958, -1.1443853378295898, -1.1002776622772217, -1.056170105934143, -1.012062430381775, -0.9679547548294067, -0.9238470792770386, -0.8797394037246704, -0.8356317281723022, -0.7915240526199341, -0.7474163770675659, -0.7033087611198425, -0.6592010855674744, -0.6150934100151062, -0.570985734462738, -0.5268780589103699, -0.4827703833580017, -0.43866273760795593, -0.39455506205558777, -0.3504473865032196, -0.30633971095085144, -0.2622320353984833, -0.2181243747472763, -0.17401669919490814, -0.12990902364253998, -0.08580136299133301, -0.041693687438964844, 0.0024139881134033203, 0.046521659940481186, 0.09062933176755905, 0.13473699986934662, 0.17884467542171478, 0.22295235097408295, 0.2670600116252899, 0.3111676871776581, 0.35527536273002625, 0.3993830382823944, 0.4434907138347626, 0.48759835958480835, 0.5317060351371765, 0.5758137106895447, 0.6199213862419128, 0.664029061794281, 0.7081367373466492]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 10.0, 11.0, 13.0, 6.0, 9.0, 13.0, 22.0, 26.0, 22.0, 32.0, 36.0, 35.0, 42.0, 30.0, 44.0, 43.0, 54.0, 42.0, 34.0, 50.0, 50.0, 43.0, 39.0, 36.0, 39.0, 26.0, 31.0, 25.0, 18.0, 15.0, 20.0, 21.0, 16.0, 13.0, 11.0, 4.0, 3.0, 4.0, 3.0, 2.0, 6.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.21758371591567993, -0.21080443263053894, -0.20402516424655914, -0.19724588096141815, -0.19046659767627716, -0.18368732929229736, -0.17690804600715637, -0.17012876272201538, -0.1633494794368744, -0.1565701961517334, -0.1497909277677536, -0.1430116444826126, -0.13623236119747162, -0.12945309281349182, -0.12267380952835083, -0.11589452624320984, -0.10911525785923004, -0.10233598202466965, -0.09555669873952866, -0.08877742290496826, -0.08199813961982727, -0.07521886378526688, -0.06843958795070648, -0.06166030839085579, -0.054881028831005096, -0.048101749271154404, -0.04132246971130371, -0.03454319387674332, -0.027763914316892624, -0.02098463475704193, -0.014205358922481537, -0.007426079362630844, -0.0006467998027801514, 0.006132478825747967, 0.012911757454276085, 0.01969103515148163, 0.02647031471133232, 0.033249594271183014, 0.04002887010574341, 0.0468081496655941, 0.053587429225444794, 0.060366708785295486, 0.06714598834514618, 0.07392526417970657, 0.08070454001426697, 0.08748382329940796, 0.09426309913396835, 0.10104237496852875, 0.10782165825366974, 0.11460093408823013, 0.12138021737337112, 0.12815949320793152, 0.1349387764930725, 0.1417180597782135, 0.1484973281621933, 0.1552766114473343, 0.1620558798313141, 0.16883516311645508, 0.17561443150043488, 0.18239371478557587, 0.18917299807071686, 0.19595226645469666, 0.20273154973983765, 0.20951083302497864, 0.21629011631011963]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 9.0, 6.0, 9.0, 14.0, 10.0, 17.0, 25.0, 26.0, 45.0, 77.0, 131.0, 212.0, 449.0, 1050.0, 2779.0, 10221.0, 70101.0, 747976.0, 189411.0, 18939.0, 4192.0, 1381.0, 654.0, 343.0, 172.0, 94.0, 56.0, 43.0, 32.0, 20.0, 13.0, 8.0, 14.0, 7.0, 8.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.611328125, -0.59466552734375, -0.5780029296875, -0.56134033203125, -0.544677734375, -0.52801513671875, -0.5113525390625, -0.49468994140625, -0.47802734375, -0.46136474609375, -0.4447021484375, -0.42803955078125, -0.411376953125, -0.39471435546875, -0.3780517578125, -0.36138916015625, -0.3447265625, -0.32806396484375, -0.3114013671875, -0.29473876953125, -0.278076171875, -0.26141357421875, -0.2447509765625, -0.22808837890625, -0.21142578125, -0.19476318359375, -0.1781005859375, -0.16143798828125, -0.144775390625, -0.12811279296875, -0.1114501953125, -0.09478759765625, -0.078125, -0.06146240234375, -0.0447998046875, -0.02813720703125, -0.011474609375, 0.00518798828125, 0.0218505859375, 0.03851318359375, 0.05517578125, 0.07183837890625, 0.0885009765625, 0.10516357421875, 0.121826171875, 0.13848876953125, 0.1551513671875, 0.17181396484375, 0.1884765625, 0.20513916015625, 0.2218017578125, 0.23846435546875, 0.255126953125, 0.27178955078125, 0.2884521484375, 0.30511474609375, 0.32177734375, 0.33843994140625, 0.3551025390625, 0.37176513671875, 0.388427734375, 0.40509033203125, 0.4217529296875, 0.43841552734375, 0.455078125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 13.0, 14.0, 40.0, 63.0, 92.0, 150.0, 162.0, 137.0, 130.0, 86.0, 49.0, 26.0, 10.0, 11.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.105224609375, -0.10288047790527344, -0.10053634643554688, -0.09819221496582031, -0.09584808349609375, -0.09350395202636719, -0.09115982055664062, -0.08881568908691406, -0.0864715576171875, -0.08412742614746094, -0.08178329467773438, -0.07943916320800781, -0.07709503173828125, -0.07475090026855469, -0.07240676879882812, -0.07006263732910156, -0.067718505859375, -0.06537437438964844, -0.06303024291992188, -0.06068611145019531, -0.05834197998046875, -0.05599784851074219, -0.053653717041015625, -0.05130958557128906, -0.0489654541015625, -0.04662132263183594, -0.044277191162109375, -0.04193305969238281, -0.03958892822265625, -0.03724479675292969, -0.034900665283203125, -0.03255653381347656, -0.03021240234375, -0.027868270874023438, -0.025524139404296875, -0.023180007934570312, -0.02083587646484375, -0.018491744995117188, -0.016147613525390625, -0.013803482055664062, -0.0114593505859375, -0.009115219116210938, -0.006771087646484375, -0.0044269561767578125, -0.00208282470703125, 0.0002613067626953125, 0.002605438232421875, 0.0049495697021484375, 0.007293701171875, 0.009637832641601562, 0.011981964111328125, 0.014326095581054688, 0.01667022705078125, 0.019014358520507812, 0.021358489990234375, 0.023702621459960938, 0.0260467529296875, 0.028390884399414062, 0.030735015869140625, 0.03307914733886719, 0.03542327880859375, 0.03776741027832031, 0.040111541748046875, 0.04245567321777344, 0.0447998046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 4.0, 9.0, 14.0, 23.0, 30.0, 51.0, 64.0, 93.0, 161.0, 214.0, 365.0, 569.0, 923.0, 1483.0, 2617.0, 4521.0, 8247.0, 15817.0, 31743.0, 68441.0, 160074.0, 366375.0, 215657.0, 87861.0, 40280.0, 19673.0, 10097.0, 5346.0, 3021.0, 1843.0, 1067.0, 654.0, 423.0, 237.0, 181.0, 127.0, 73.0, 60.0, 36.0, 27.0, 19.0, 15.0, 8.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1318359375, -0.12723541259765625, -0.1226348876953125, -0.11803436279296875, -0.113433837890625, -0.10883331298828125, -0.1042327880859375, -0.09963226318359375, -0.09503173828125, -0.09043121337890625, -0.0858306884765625, -0.08123016357421875, -0.076629638671875, -0.07202911376953125, -0.0674285888671875, -0.06282806396484375, -0.0582275390625, -0.05362701416015625, -0.0490264892578125, -0.04442596435546875, -0.039825439453125, -0.03522491455078125, -0.0306243896484375, -0.02602386474609375, -0.02142333984375, -0.01682281494140625, -0.0122222900390625, -0.00762176513671875, -0.003021240234375, 0.00157928466796875, 0.0061798095703125, 0.01078033447265625, 0.015380859375, 0.01998138427734375, 0.0245819091796875, 0.02918243408203125, 0.033782958984375, 0.03838348388671875, 0.0429840087890625, 0.04758453369140625, 0.05218505859375, 0.05678558349609375, 0.0613861083984375, 0.06598663330078125, 0.070587158203125, 0.07518768310546875, 0.0797882080078125, 0.08438873291015625, 0.0889892578125, 0.09358978271484375, 0.0981903076171875, 0.10279083251953125, 0.107391357421875, 0.11199188232421875, 0.1165924072265625, 0.12119293212890625, 0.12579345703125, 0.13039398193359375, 0.1349945068359375, 0.13959503173828125, 0.144195556640625, 0.14879608154296875, 0.1533966064453125, 0.15799713134765625, 0.16259765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 12.0, 4.0, 13.0, 17.0, 19.0, 28.0, 28.0, 27.0, 30.0, 35.0, 43.0, 48.0, 52.0, 51.0, 51.0, 67.0, 54.0, 51.0, 39.0, 48.0, 41.0, 35.0, 28.0, 27.0, 27.0, 18.0, 21.0, 15.0, 17.0, 7.0, 8.0, 9.0, 5.0, 3.0, 5.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.135498046875, -0.13073348999023438, -0.12596893310546875, -0.12120437622070312, -0.1164398193359375, -0.11167526245117188, -0.10691070556640625, -0.10214614868164062, -0.097381591796875, -0.09261703491210938, -0.08785247802734375, -0.08308792114257812, -0.0783233642578125, -0.07355880737304688, -0.06879425048828125, -0.06402969360351562, -0.05926513671875, -0.054500579833984375, -0.04973602294921875, -0.044971466064453125, -0.0402069091796875, -0.035442352294921875, -0.03067779541015625, -0.025913238525390625, -0.021148681640625, -0.016384124755859375, -0.01161956787109375, -0.006855010986328125, -0.0020904541015625, 0.002674102783203125, 0.00743865966796875, 0.012203216552734375, 0.0169677734375, 0.021732330322265625, 0.02649688720703125, 0.031261444091796875, 0.0360260009765625, 0.040790557861328125, 0.04555511474609375, 0.050319671630859375, 0.055084228515625, 0.059848785400390625, 0.06461334228515625, 0.06937789916992188, 0.0741424560546875, 0.07890701293945312, 0.08367156982421875, 0.08843612670898438, 0.09320068359375, 0.09796524047851562, 0.10272979736328125, 0.10749435424804688, 0.1122589111328125, 0.11702346801757812, 0.12178802490234375, 0.12655258178710938, 0.131317138671875, 0.13608169555664062, 0.14084625244140625, 0.14561080932617188, 0.1503753662109375, 0.15513992309570312, 0.15990447998046875, 0.16466903686523438, 0.16943359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 7.0, 2.0, 9.0, 10.0, 23.0, 26.0, 37.0, 59.0, 132.0, 260.0, 605.0, 1510.0, 4867.0, 21559.0, 237932.0, 722995.0, 46381.0, 8320.0, 2335.0, 797.0, 356.0, 143.0, 91.0, 40.0, 27.0, 12.0, 12.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1927490234375, -0.18676185607910156, -0.18077468872070312, -0.1747875213623047, -0.16880035400390625, -0.1628131866455078, -0.15682601928710938, -0.15083885192871094, -0.1448516845703125, -0.13886451721191406, -0.13287734985351562, -0.1268901824951172, -0.12090301513671875, -0.11491584777832031, -0.10892868041992188, -0.10294151306152344, -0.096954345703125, -0.09096717834472656, -0.08498001098632812, -0.07899284362792969, -0.07300567626953125, -0.06701850891113281, -0.061031341552734375, -0.05504417419433594, -0.0490570068359375, -0.04306983947753906, -0.037082672119140625, -0.031095504760742188, -0.02510833740234375, -0.019121170043945312, -0.013134002685546875, -0.0071468353271484375, -0.00115966796875, 0.0048274993896484375, 0.010814666748046875, 0.016801834106445312, 0.02278900146484375, 0.028776168823242188, 0.034763336181640625, 0.04075050354003906, 0.0467376708984375, 0.05272483825683594, 0.058712005615234375, 0.06469917297363281, 0.07068634033203125, 0.07667350769042969, 0.08266067504882812, 0.08864784240722656, 0.094635009765625, 0.10062217712402344, 0.10660934448242188, 0.11259651184082031, 0.11858367919921875, 0.12457084655761719, 0.13055801391601562, 0.13654518127441406, 0.1425323486328125, 0.14851951599121094, 0.15450668334960938, 0.1604938507080078, 0.16648101806640625, 0.1724681854248047, 0.17845535278320312, 0.18444252014160156, 0.1904296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 4.0, 9.0, 23.0, 18.0, 40.0, 79.0, 153.0, 363.0, 118.0, 62.0, 29.0, 26.0, 12.0, 16.0, 14.0, 4.0, 3.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004100799560546875, -0.0003966018557548523, -0.0003831237554550171, -0.0003696456551551819, -0.0003561675548553467, -0.0003426894545555115, -0.00032921135425567627, -0.00031573325395584106, -0.00030225515365600586, -0.00028877705335617065, -0.00027529895305633545, -0.00026182085275650024, -0.00024834275245666504, -0.00023486465215682983, -0.00022138655185699463, -0.00020790845155715942, -0.00019443035125732422, -0.00018095225095748901, -0.0001674741506576538, -0.0001539960503578186, -0.0001405179500579834, -0.0001270398497581482, -0.00011356174945831299, -0.00010008364915847778, -8.660554885864258e-05, -7.312744855880737e-05, -5.964934825897217e-05, -4.617124795913696e-05, -3.269314765930176e-05, -1.9215047359466553e-05, -5.736947059631348e-06, 7.741153240203857e-06, 2.1219253540039062e-05, 3.469735383987427e-05, 4.817545413970947e-05, 6.165355443954468e-05, 7.513165473937988e-05, 8.860975503921509e-05, 0.00010208785533905029, 0.0001155659556388855, 0.0001290440559387207, 0.0001425221562385559, 0.0001560002565383911, 0.00016947835683822632, 0.00018295645713806152, 0.00019643455743789673, 0.00020991265773773193, 0.00022339075803756714, 0.00023686885833740234, 0.00025034695863723755, 0.00026382505893707275, 0.00027730315923690796, 0.00029078125953674316, 0.00030425935983657837, 0.0003177374601364136, 0.0003312155604362488, 0.000344693660736084, 0.0003581717610359192, 0.0003716498613357544, 0.0003851279616355896, 0.0003986060619354248, 0.00041208416223526, 0.0004255622625350952, 0.0004390403628349304, 0.0004525184631347656]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 12.0, 21.0, 25.0, 29.0, 55.0, 76.0, 129.0, 240.0, 358.0, 605.0, 1075.0, 2000.0, 3979.0, 8997.0, 24788.0, 99937.0, 646539.0, 198611.0, 37717.0, 12452.0, 5184.0, 2491.0, 1351.0, 750.0, 425.0, 271.0, 165.0, 92.0, 71.0, 32.0, 23.0, 15.0, 14.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1168212890625, -0.11324596405029297, -0.10967063903808594, -0.1060953140258789, -0.10251998901367188, -0.09894466400146484, -0.09536933898925781, -0.09179401397705078, -0.08821868896484375, -0.08464336395263672, -0.08106803894042969, -0.07749271392822266, -0.07391738891601562, -0.0703420639038086, -0.06676673889160156, -0.06319141387939453, -0.0596160888671875, -0.05604076385498047, -0.05246543884277344, -0.048890113830566406, -0.045314788818359375, -0.041739463806152344, -0.03816413879394531, -0.03458881378173828, -0.03101348876953125, -0.02743816375732422, -0.023862838745117188, -0.020287513732910156, -0.016712188720703125, -0.013136863708496094, -0.009561538696289062, -0.005986213684082031, -0.002410888671875, 0.0011644363403320312, 0.0047397613525390625, 0.008315086364746094, 0.011890411376953125, 0.015465736389160156, 0.019041061401367188, 0.02261638641357422, 0.02619171142578125, 0.02976703643798828, 0.03334236145019531, 0.036917686462402344, 0.040493011474609375, 0.044068336486816406, 0.04764366149902344, 0.05121898651123047, 0.0547943115234375, 0.05836963653564453, 0.06194496154785156, 0.0655202865600586, 0.06909561157226562, 0.07267093658447266, 0.07624626159667969, 0.07982158660888672, 0.08339691162109375, 0.08697223663330078, 0.09054756164550781, 0.09412288665771484, 0.09769821166992188, 0.1012735366821289, 0.10484886169433594, 0.10842418670654297, 0.11199951171875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 4.0, 9.0, 13.0, 15.0, 28.0, 30.0, 39.0, 54.0, 79.0, 120.0, 134.0, 99.0, 99.0, 66.0, 48.0, 27.0, 32.0, 18.0, 9.0, 19.0, 10.0, 5.0, 6.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09600830078125, -0.09288501739501953, -0.08976173400878906, -0.0866384506225586, -0.08351516723632812, -0.08039188385009766, -0.07726860046386719, -0.07414531707763672, -0.07102203369140625, -0.06789875030517578, -0.06477546691894531, -0.061652183532714844, -0.058528900146484375, -0.055405616760253906, -0.05228233337402344, -0.04915904998779297, -0.0460357666015625, -0.04291248321533203, -0.03978919982910156, -0.036665916442871094, -0.033542633056640625, -0.030419349670410156, -0.027296066284179688, -0.02417278289794922, -0.02104949951171875, -0.01792621612548828, -0.014802932739257812, -0.011679649353027344, -0.008556365966796875, -0.005433082580566406, -0.0023097991943359375, 0.0008134841918945312, 0.003936767578125, 0.007060050964355469, 0.010183334350585938, 0.013306617736816406, 0.016429901123046875, 0.019553184509277344, 0.022676467895507812, 0.02579975128173828, 0.02892303466796875, 0.03204631805419922, 0.03516960144042969, 0.038292884826660156, 0.041416168212890625, 0.044539451599121094, 0.04766273498535156, 0.05078601837158203, 0.0539093017578125, 0.05703258514404297, 0.06015586853027344, 0.0632791519165039, 0.06640243530273438, 0.06952571868896484, 0.07264900207519531, 0.07577228546142578, 0.07889556884765625, 0.08201885223388672, 0.08514213562011719, 0.08826541900634766, 0.09138870239257812, 0.0945119857788086, 0.09763526916503906, 0.10075855255126953, 0.1038818359375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 6.0, 8.0, 8.0, 28.0, 46.0, 80.0, 166.0, 228.0, 196.0, 93.0, 59.0, 37.0, 20.0, 13.0, 2.0, 5.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.867201566696167, -1.8060872554779053, -1.744972825050354, -1.6838585138320923, -1.622744083404541, -1.5616297721862793, -1.500515341758728, -1.4394010305404663, -1.378286600112915, -1.3171722888946533, -1.256057858467102, -1.1949435472488403, -1.133829116821289, -1.0727148056030273, -1.011600375175476, -0.9504860639572144, -0.8893716931343079, -0.8282573223114014, -0.7671429514884949, -0.7060285806655884, -0.6449142098426819, -0.5837998390197754, -0.5226855278015137, -0.4615711271762848, -0.4004567563533783, -0.3393423855304718, -0.2782280147075653, -0.21711365878582, -0.1559992879629135, -0.09488493204116821, -0.03377056121826172, 0.027343809604644775, 0.08845818042755127, 0.14957255125045776, 0.21068692207336426, 0.27180129289627075, 0.33291566371917725, 0.39403000473976135, 0.45514437556266785, 0.516258716583252, 0.5773731470108032, 0.6384875178337097, 0.6996018886566162, 0.7607162594795227, 0.8218306303024292, 0.8829449415206909, 0.9440593719482422, 1.005173683166504, 1.0662879943847656, 1.1274023056030273, 1.1885167360305786, 1.2496310472488403, 1.3107454776763916, 1.3718597888946533, 1.4329742193222046, 1.4940885305404663, 1.5552029609680176, 1.6163172721862793, 1.6774317026138306, 1.7385460138320923, 1.7996604442596436, 1.8607747554779053, 1.9218891859054565, 1.9830034971237183, 2.0441179275512695]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 2.0, 11.0, 11.0, 7.0, 13.0, 22.0, 23.0, 22.0, 42.0, 43.0, 48.0, 52.0, 38.0, 41.0, 48.0, 62.0, 54.0, 48.0, 60.0, 38.0, 27.0, 50.0, 35.0, 38.0, 34.0, 26.0, 22.0, 24.0, 11.0, 9.0, 9.0, 6.0, 5.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1428098678588867, -1.1130892038345337, -1.0833685398101807, -1.0536479949951172, -1.0239273309707642, -0.9942066669464111, -0.9644860625267029, -0.9347654581069946, -0.9050447940826416, -0.8753241300582886, -0.8456035256385803, -0.8158829212188721, -0.786162257194519, -0.756441593170166, -0.7267209887504578, -0.6970003843307495, -0.6672797203063965, -0.6375590562820435, -0.6078384518623352, -0.578117847442627, -0.5483971834182739, -0.5186765193939209, -0.48895591497421265, -0.459235280752182, -0.42951464653015137, -0.3997940123081207, -0.3700733780860901, -0.34035274386405945, -0.3106321096420288, -0.28091147541999817, -0.25119084119796753, -0.2214702069759369, -0.19174951314926147, -0.16202887892723083, -0.1323082447052002, -0.10258761048316956, -0.07286697626113892, -0.043146342039108276, -0.013425707817077637, 0.016294926404953003, 0.04601556062698364, 0.07573619484901428, 0.10545682907104492, 0.13517746329307556, 0.1648980975151062, 0.19461873173713684, 0.22433936595916748, 0.2540600001811981, 0.28378063440322876, 0.3135012686252594, 0.34322190284729004, 0.3729425370693207, 0.4026631712913513, 0.43238380551338196, 0.4621044397354126, 0.49182507395744324, 0.5215457081794739, 0.5512663125991821, 0.5809869766235352, 0.6107076406478882, 0.6404282450675964, 0.6701488494873047, 0.6998695135116577, 0.7295901775360107, 0.759310781955719]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 7.0, 8.0, 6.0, 6.0, 17.0, 24.0, 33.0, 39.0, 46.0, 89.0, 151.0, 305.0, 620.0, 1472.0, 4713.0, 24617.0, 3988276.0, 156167.0, 12227.0, 3001.0, 1150.0, 526.0, 302.0, 145.0, 105.0, 92.0, 37.0, 33.0, 23.0, 12.0, 7.0, 0.0, 9.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5196685791015625, -0.505157470703125, -0.4906463623046875, -0.47613525390625, -0.4616241455078125, -0.447113037109375, -0.4326019287109375, -0.4180908203125, -0.4035797119140625, -0.389068603515625, -0.3745574951171875, -0.36004638671875, -0.3455352783203125, -0.331024169921875, -0.3165130615234375, -0.302001953125, -0.2874908447265625, -0.272979736328125, -0.2584686279296875, -0.24395751953125, -0.2294464111328125, -0.214935302734375, -0.2004241943359375, -0.1859130859375, -0.1714019775390625, -0.156890869140625, -0.1423797607421875, -0.12786865234375, -0.1133575439453125, -0.098846435546875, -0.0843353271484375, -0.06982421875, -0.0553131103515625, -0.040802001953125, -0.0262908935546875, -0.01177978515625, 0.0027313232421875, 0.017242431640625, 0.0317535400390625, 0.0462646484375, 0.0607757568359375, 0.075286865234375, 0.0897979736328125, 0.10430908203125, 0.1188201904296875, 0.133331298828125, 0.1478424072265625, 0.162353515625, 0.1768646240234375, 0.191375732421875, 0.2058868408203125, 0.22039794921875, 0.2349090576171875, 0.249420166015625, 0.2639312744140625, 0.2784423828125, 0.2929534912109375, 0.307464599609375, 0.3219757080078125, 0.33648681640625, 0.3509979248046875, 0.365509033203125, 0.3800201416015625, 0.39453125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 9.0, 10.0, 7.0, 33.0, 39.0, 70.0, 104.0, 137.0, 140.0, 131.0, 119.0, 89.0, 46.0, 27.0, 17.0, 12.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.099853515625, -0.09761953353881836, -0.09538555145263672, -0.09315156936645508, -0.09091758728027344, -0.0886836051940918, -0.08644962310791016, -0.08421564102172852, -0.08198165893554688, -0.07974767684936523, -0.0775136947631836, -0.07527971267700195, -0.07304573059082031, -0.07081174850463867, -0.06857776641845703, -0.06634378433227539, -0.06410980224609375, -0.06187582015991211, -0.05964183807373047, -0.05740785598754883, -0.05517387390136719, -0.05293989181518555, -0.050705909729003906, -0.048471927642822266, -0.046237945556640625, -0.044003963470458984, -0.041769981384277344, -0.0395359992980957, -0.03730201721191406, -0.03506803512573242, -0.03283405303955078, -0.03060007095336914, -0.0283660888671875, -0.02613210678100586, -0.02389812469482422, -0.021664142608642578, -0.019430160522460938, -0.017196178436279297, -0.014962196350097656, -0.012728214263916016, -0.010494232177734375, -0.008260250091552734, -0.006026268005371094, -0.003792285919189453, -0.0015583038330078125, 0.0006756782531738281, 0.0029096603393554688, 0.005143642425537109, 0.00737762451171875, 0.00961160659790039, 0.011845588684082031, 0.014079570770263672, 0.016313552856445312, 0.018547534942626953, 0.020781517028808594, 0.023015499114990234, 0.025249481201171875, 0.027483463287353516, 0.029717445373535156, 0.0319514274597168, 0.03418540954589844, 0.03641939163208008, 0.03865337371826172, 0.04088735580444336, 0.043121337890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 6.0, 7.0, 4.0, 9.0, 16.0, 27.0, 36.0, 45.0, 56.0, 71.0, 120.0, 124.0, 218.0, 330.0, 531.0, 850.0, 1412.0, 2674.0, 5121.0, 11071.0, 28910.0, 123749.0, 3769360.0, 186690.0, 36439.0, 13205.0, 5966.0, 3040.0, 1680.0, 977.0, 594.0, 282.0, 210.0, 143.0, 90.0, 72.0, 40.0, 29.0, 23.0, 10.0, 18.0, 11.0, 7.0, 9.0, 0.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1700439453125, -0.16409683227539062, -0.15814971923828125, -0.15220260620117188, -0.1462554931640625, -0.14030838012695312, -0.13436126708984375, -0.12841415405273438, -0.122467041015625, -0.11651992797851562, -0.11057281494140625, -0.10462570190429688, -0.0986785888671875, -0.09273147583007812, -0.08678436279296875, -0.08083724975585938, -0.07489013671875, -0.06894302368164062, -0.06299591064453125, -0.057048797607421875, -0.0511016845703125, -0.045154571533203125, -0.03920745849609375, -0.033260345458984375, -0.027313232421875, -0.021366119384765625, -0.01541900634765625, -0.009471893310546875, -0.0035247802734375, 0.002422332763671875, 0.00836944580078125, 0.014316558837890625, 0.020263671875, 0.026210784912109375, 0.03215789794921875, 0.038105010986328125, 0.0440521240234375, 0.049999237060546875, 0.05594635009765625, 0.061893463134765625, 0.067840576171875, 0.07378768920898438, 0.07973480224609375, 0.08568191528320312, 0.0916290283203125, 0.09757614135742188, 0.10352325439453125, 0.10947036743164062, 0.11541748046875, 0.12136459350585938, 0.12731170654296875, 0.13325881958007812, 0.1392059326171875, 0.14515304565429688, 0.15110015869140625, 0.15704727172851562, 0.162994384765625, 0.16894149780273438, 0.17488861083984375, 0.18083572387695312, 0.1867828369140625, 0.19272994995117188, 0.19867706298828125, 0.20462417602539062, 0.2105712890625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 10.0, 9.0, 10.0, 19.0, 21.0, 32.0, 58.0, 105.0, 207.0, 2773.0, 449.0, 135.0, 87.0, 37.0, 24.0, 33.0, 9.0, 8.0, 10.0, 5.0, 4.0, 5.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06964111328125, -0.06751346588134766, -0.06538581848144531, -0.06325817108154297, -0.061130523681640625, -0.05900287628173828, -0.05687522888183594, -0.054747581481933594, -0.05261993408203125, -0.050492286682128906, -0.04836463928222656, -0.04623699188232422, -0.044109344482421875, -0.04198169708251953, -0.03985404968261719, -0.037726402282714844, -0.0355987548828125, -0.033471107482910156, -0.03134346008300781, -0.02921581268310547, -0.027088165283203125, -0.02496051788330078, -0.022832870483398438, -0.020705223083496094, -0.01857757568359375, -0.016449928283691406, -0.014322280883789062, -0.012194633483886719, -0.010066986083984375, -0.007939338684082031, -0.0058116912841796875, -0.0036840438842773438, -0.001556396484375, 0.0005712509155273438, 0.0026988983154296875, 0.004826545715332031, 0.006954193115234375, 0.009081840515136719, 0.011209487915039062, 0.013337135314941406, 0.01546478271484375, 0.017592430114746094, 0.019720077514648438, 0.02184772491455078, 0.023975372314453125, 0.02610301971435547, 0.028230667114257812, 0.030358314514160156, 0.0324859619140625, 0.034613609313964844, 0.03674125671386719, 0.03886890411376953, 0.040996551513671875, 0.04312419891357422, 0.04525184631347656, 0.047379493713378906, 0.04950714111328125, 0.051634788513183594, 0.05376243591308594, 0.05589008331298828, 0.058017730712890625, 0.06014537811279297, 0.06227302551269531, 0.06440067291259766, 0.0665283203125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 21.0, 75.0, 426.0, 394.0, 77.0, 10.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.846519947052002, -1.8109623193740845, -1.775404691696167, -1.73984694480896, -1.7042893171310425, -1.668731689453125, -1.6331740617752075, -1.59761643409729, -1.562058687210083, -1.5265010595321655, -1.490943431854248, -1.455385684967041, -1.4198280572891235, -1.384270429611206, -1.3487128019332886, -1.313155174255371, -1.2775975465774536, -1.2420399188995361, -1.2064822912216187, -1.1709245443344116, -1.1353669166564941, -1.0998092889785767, -1.0642516613006592, -1.0286940336227417, -0.9931363463401794, -0.957578718662262, -0.9220210313796997, -0.8864634037017822, -0.8509057760238647, -0.8153480887413025, -0.779790461063385, -0.7442327737808228, -0.7086750268936157, -0.6731173992156982, -0.637559711933136, -0.6020020842552185, -0.5664443969726562, -0.5308867692947388, -0.4953291416168213, -0.4597714841365814, -0.42421382665634155, -0.3886561691761017, -0.3530985116958618, -0.31754088401794434, -0.28198322653770447, -0.2464255690574646, -0.21086792647838593, -0.17531028389930725, -0.13975262641906738, -0.10419497638940811, -0.06863732635974884, -0.03307967633008957, 0.002477973699569702, 0.03803563117980957, 0.07359327375888824, 0.10915091633796692, 0.1447085738182068, 0.18026623129844666, 0.21582387387752533, 0.251381516456604, 0.28693917393684387, 0.32249683141708374, 0.3580544590950012, 0.3936121165752411, 0.42916977405548096]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 7.0, 5.0, 7.0, 20.0, 16.0, 54.0, 44.0, 44.0, 66.0, 86.0, 71.0, 83.0, 74.0, 77.0, 56.0, 51.0, 50.0, 60.0, 37.0, 33.0, 19.0, 14.0, 11.0, 13.0, 5.0, 6.0, 2.0, 2.0], "bins": [-0.41808414459228516, -0.4095260202884674, -0.40096792578697205, -0.3924098014831543, -0.38385167717933655, -0.3752935528755188, -0.36673545837402344, -0.3581773340702057, -0.34961920976638794, -0.3410610854625702, -0.33250299096107483, -0.3239448666572571, -0.31538674235343933, -0.3068286180496216, -0.2982705235481262, -0.28971239924430847, -0.2811542749404907, -0.272596150636673, -0.2640380561351776, -0.25547993183135986, -0.24692180752754211, -0.23836369812488556, -0.229805588722229, -0.22124746441841125, -0.2126893699169159, -0.20413126051425934, -0.1955731362104416, -0.18701502680778503, -0.17845690250396729, -0.16989879310131073, -0.16134068369865417, -0.15278255939483643, -0.14422443509101868, -0.13566632568836212, -0.12710820138454437, -0.11855009198188782, -0.10999196767807007, -0.10143385827541351, -0.09287574142217636, -0.08431762456893921, -0.07575950771570206, -0.0672013908624649, -0.05864327400922775, -0.0500851608812809, -0.04152704402804375, -0.032968927174806595, -0.02441081404685974, -0.01585269719362259, -0.007294580340385437, 0.0012635355815291405, 0.009821651503443718, 0.01837976649403572, 0.026937883347272873, 0.035496000200510025, 0.04405411332845688, 0.05261223018169403, 0.06117034703493118, 0.06972846388816833, 0.07828658074140549, 0.08684469759464264, 0.0954028069972992, 0.10396093130111694, 0.1125190407037735, 0.12107715755701065, 0.1296352744102478]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 6.0, 2.0, 4.0, 6.0, 13.0, 6.0, 16.0, 10.0, 29.0, 15.0, 33.0, 49.0, 85.0, 118.0, 166.0, 300.0, 478.0, 807.0, 1334.0, 2697.0, 7036.0, 25274.0, 132770.0, 631351.0, 195764.0, 34172.0, 8812.0, 3403.0, 1584.0, 831.0, 493.0, 302.0, 174.0, 122.0, 71.0, 55.0, 36.0, 23.0, 28.0, 15.0, 17.0, 11.0, 6.0, 15.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-0.328125, -0.318359375, -0.30859375, -0.298828125, -0.2890625, -0.279296875, -0.26953125, -0.259765625, -0.25, -0.240234375, -0.23046875, -0.220703125, -0.2109375, -0.201171875, -0.19140625, -0.181640625, -0.171875, -0.162109375, -0.15234375, -0.142578125, -0.1328125, -0.123046875, -0.11328125, -0.103515625, -0.09375, -0.083984375, -0.07421875, -0.064453125, -0.0546875, -0.044921875, -0.03515625, -0.025390625, -0.015625, -0.005859375, 0.00390625, 0.013671875, 0.0234375, 0.033203125, 0.04296875, 0.052734375, 0.0625, 0.072265625, 0.08203125, 0.091796875, 0.1015625, 0.111328125, 0.12109375, 0.130859375, 0.140625, 0.150390625, 0.16015625, 0.169921875, 0.1796875, 0.189453125, 0.19921875, 0.208984375, 0.21875, 0.228515625, 0.23828125, 0.248046875, 0.2578125, 0.267578125, 0.27734375, 0.287109375, 0.296875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 6.0, 8.0, 20.0, 52.0, 70.0, 96.0, 115.0, 136.0, 142.0, 120.0, 97.0, 52.0, 31.0, 21.0, 8.0, 10.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.09930419921875, -0.0970926284790039, -0.09488105773925781, -0.09266948699951172, -0.09045791625976562, -0.08824634552001953, -0.08603477478027344, -0.08382320404052734, -0.08161163330078125, -0.07940006256103516, -0.07718849182128906, -0.07497692108154297, -0.07276535034179688, -0.07055377960205078, -0.06834220886230469, -0.0661306381225586, -0.0639190673828125, -0.061707496643066406, -0.05949592590332031, -0.05728435516357422, -0.055072784423828125, -0.05286121368408203, -0.05064964294433594, -0.048438072204589844, -0.04622650146484375, -0.044014930725097656, -0.04180335998535156, -0.03959178924560547, -0.037380218505859375, -0.03516864776611328, -0.03295707702636719, -0.030745506286621094, -0.028533935546875, -0.026322364807128906, -0.024110794067382812, -0.02189922332763672, -0.019687652587890625, -0.01747608184814453, -0.015264511108398438, -0.013052940368652344, -0.01084136962890625, -0.008629798889160156, -0.0064182281494140625, -0.004206657409667969, -0.001995086669921875, 0.00021648406982421875, 0.0024280548095703125, 0.004639625549316406, 0.0068511962890625, 0.009062767028808594, 0.011274337768554688, 0.013485908508300781, 0.015697479248046875, 0.01790904998779297, 0.020120620727539062, 0.022332191467285156, 0.02454376220703125, 0.026755332946777344, 0.028966903686523438, 0.03117847442626953, 0.033390045166015625, 0.03560161590576172, 0.03781318664550781, 0.040024757385253906, 0.042236328125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 9.0, 10.0, 17.0, 50.0, 47.0, 82.0, 133.0, 219.0, 337.0, 636.0, 1135.0, 2235.0, 4570.0, 10121.0, 24979.0, 68452.0, 223924.0, 460899.0, 162641.0, 51985.0, 19801.0, 8189.0, 3835.0, 1864.0, 1000.0, 571.0, 297.0, 181.0, 117.0, 68.0, 38.0, 45.0, 23.0, 9.0, 10.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1566162109375, -0.15109634399414062, -0.14557647705078125, -0.14005661010742188, -0.1345367431640625, -0.12901687622070312, -0.12349700927734375, -0.11797714233398438, -0.112457275390625, -0.10693740844726562, -0.10141754150390625, -0.09589767456054688, -0.0903778076171875, -0.08485794067382812, -0.07933807373046875, -0.07381820678710938, -0.06829833984375, -0.06277847290039062, -0.05725860595703125, -0.051738739013671875, -0.0462188720703125, -0.040699005126953125, -0.03517913818359375, -0.029659271240234375, -0.024139404296875, -0.018619537353515625, -0.01309967041015625, -0.007579803466796875, -0.0020599365234375, 0.003459930419921875, 0.00897979736328125, 0.014499664306640625, 0.02001953125, 0.025539398193359375, 0.03105926513671875, 0.036579132080078125, 0.0420989990234375, 0.047618865966796875, 0.05313873291015625, 0.058658599853515625, 0.064178466796875, 0.06969833374023438, 0.07521820068359375, 0.08073806762695312, 0.0862579345703125, 0.09177780151367188, 0.09729766845703125, 0.10281753540039062, 0.10833740234375, 0.11385726928710938, 0.11937713623046875, 0.12489700317382812, 0.1304168701171875, 0.13593673706054688, 0.14145660400390625, 0.14697647094726562, 0.152496337890625, 0.15801620483398438, 0.16353607177734375, 0.16905593872070312, 0.1745758056640625, 0.18009567260742188, 0.18561553955078125, 0.19113540649414062, 0.1966552734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 0.0, 2.0, 3.0, 1.0, 10.0, 4.0, 6.0, 18.0, 12.0, 19.0, 20.0, 27.0, 33.0, 28.0, 33.0, 44.0, 35.0, 50.0, 33.0, 53.0, 57.0, 52.0, 47.0, 44.0, 53.0, 50.0, 41.0, 41.0, 30.0, 28.0, 25.0, 19.0, 12.0, 8.0, 21.0, 10.0, 12.0, 7.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1322021484375, -0.1275196075439453, -0.12283706665039062, -0.11815452575683594, -0.11347198486328125, -0.10878944396972656, -0.10410690307617188, -0.09942436218261719, -0.0947418212890625, -0.09005928039550781, -0.08537673950195312, -0.08069419860839844, -0.07601165771484375, -0.07132911682128906, -0.06664657592773438, -0.06196403503417969, -0.057281494140625, -0.05259895324707031, -0.047916412353515625, -0.04323387145996094, -0.03855133056640625, -0.03386878967285156, -0.029186248779296875, -0.024503707885742188, -0.0198211669921875, -0.015138626098632812, -0.010456085205078125, -0.0057735443115234375, -0.00109100341796875, 0.0035915374755859375, 0.008274078369140625, 0.012956619262695312, 0.01763916015625, 0.022321701049804688, 0.027004241943359375, 0.03168678283691406, 0.03636932373046875, 0.04105186462402344, 0.045734405517578125, 0.05041694641113281, 0.0550994873046875, 0.05978202819824219, 0.06446456909179688, 0.06914710998535156, 0.07382965087890625, 0.07851219177246094, 0.08319473266601562, 0.08787727355957031, 0.092559814453125, 0.09724235534667969, 0.10192489624023438, 0.10660743713378906, 0.11128997802734375, 0.11597251892089844, 0.12065505981445312, 0.1253376007080078, 0.1300201416015625, 0.1347026824951172, 0.13938522338867188, 0.14406776428222656, 0.14875030517578125, 0.15343284606933594, 0.15811538696289062, 0.1627979278564453, 0.16748046875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 4.0, 1.0, 10.0, 14.0, 19.0, 26.0, 67.0, 174.0, 928.0, 21230.0, 1009261.0, 15674.0, 868.0, 144.0, 52.0, 22.0, 16.0, 16.0, 2.0, 10.0, 10.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6640625, -0.6480484008789062, -0.6320343017578125, -0.6160202026367188, -0.600006103515625, -0.5839920043945312, -0.5679779052734375, -0.5519638061523438, -0.53594970703125, -0.5199356079101562, -0.5039215087890625, -0.48790740966796875, -0.471893310546875, -0.45587921142578125, -0.4398651123046875, -0.42385101318359375, -0.4078369140625, -0.39182281494140625, -0.3758087158203125, -0.35979461669921875, -0.343780517578125, -0.32776641845703125, -0.3117523193359375, -0.29573822021484375, -0.27972412109375, -0.26371002197265625, -0.2476959228515625, -0.23168182373046875, -0.215667724609375, -0.19965362548828125, -0.1836395263671875, -0.16762542724609375, -0.151611328125, -0.13559722900390625, -0.1195831298828125, -0.10356903076171875, -0.087554931640625, -0.07154083251953125, -0.0555267333984375, -0.03951263427734375, -0.02349853515625, -0.00748443603515625, 0.0085296630859375, 0.02454376220703125, 0.040557861328125, 0.05657196044921875, 0.0725860595703125, 0.08860015869140625, 0.1046142578125, 0.12062835693359375, 0.1366424560546875, 0.15265655517578125, 0.168670654296875, 0.18468475341796875, 0.2006988525390625, 0.21671295166015625, 0.23272705078125, 0.24874114990234375, 0.2647552490234375, 0.28076934814453125, 0.296783447265625, 0.31279754638671875, 0.3288116455078125, 0.34482574462890625, 0.36083984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 8.0, 13.0, 12.0, 14.0, 23.0, 34.0, 58.0, 115.0, 268.0, 194.0, 92.0, 50.0, 35.0, 22.0, 11.0, 14.0, 5.0, 3.0, 2.0, 8.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018310546875, -0.00017539411783218384, -0.00016768276691436768, -0.00015997141599655151, -0.00015226006507873535, -0.0001445487141609192, -0.00013683736324310303, -0.00012912601232528687, -0.0001214146614074707, -0.00011370331048965454, -0.00010599195957183838, -9.828060865402222e-05, -9.056925773620605e-05, -8.285790681838989e-05, -7.514655590057373e-05, -6.743520498275757e-05, -5.9723854064941406e-05, -5.2012503147125244e-05, -4.430115222930908e-05, -3.658980131149292e-05, -2.8878450393676758e-05, -2.1167099475860596e-05, -1.3455748558044434e-05, -5.7443976402282715e-06, 1.9669532775878906e-06, 9.678304195404053e-06, 1.7389655113220215e-05, 2.5101006031036377e-05, 3.281235694885254e-05, 4.05237078666687e-05, 4.823505878448486e-05, 5.5946409702301025e-05, 6.365776062011719e-05, 7.136911153793335e-05, 7.908046245574951e-05, 8.679181337356567e-05, 9.450316429138184e-05, 0.000102214515209198, 0.00010992586612701416, 0.00011763721704483032, 0.00012534856796264648, 0.00013305991888046265, 0.0001407712697982788, 0.00014848262071609497, 0.00015619397163391113, 0.0001639053225517273, 0.00017161667346954346, 0.00017932802438735962, 0.00018703937530517578, 0.00019475072622299194, 0.0002024620771408081, 0.00021017342805862427, 0.00021788477897644043, 0.0002255961298942566, 0.00023330748081207275, 0.00024101883172988892, 0.0002487301826477051, 0.00025644153356552124, 0.0002641528844833374, 0.00027186423540115356, 0.0002795755863189697, 0.0002872869372367859, 0.00029499828815460205, 0.0003027096390724182, 0.0003104209899902344]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 9.0, 15.0, 20.0, 30.0, 64.0, 89.0, 160.0, 343.0, 795.0, 2300.0, 8692.0, 53736.0, 746540.0, 208949.0, 20096.0, 4320.0, 1327.0, 512.0, 222.0, 125.0, 78.0, 40.0, 33.0, 19.0, 9.0, 11.0, 5.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18310546875, -0.17751502990722656, -0.17192459106445312, -0.1663341522216797, -0.16074371337890625, -0.1551532745361328, -0.14956283569335938, -0.14397239685058594, -0.1383819580078125, -0.13279151916503906, -0.12720108032226562, -0.12161064147949219, -0.11602020263671875, -0.11042976379394531, -0.10483932495117188, -0.09924888610839844, -0.093658447265625, -0.08806800842285156, -0.08247756958007812, -0.07688713073730469, -0.07129669189453125, -0.06570625305175781, -0.060115814208984375, -0.05452537536621094, -0.0489349365234375, -0.04334449768066406, -0.037754058837890625, -0.03216361999511719, -0.02657318115234375, -0.020982742309570312, -0.015392303466796875, -0.009801864624023438, -0.00421142578125, 0.0013790130615234375, 0.006969451904296875, 0.012559890747070312, 0.01815032958984375, 0.023740768432617188, 0.029331207275390625, 0.03492164611816406, 0.0405120849609375, 0.04610252380371094, 0.051692962646484375, 0.05728340148925781, 0.06287384033203125, 0.06846427917480469, 0.07405471801757812, 0.07964515686035156, 0.085235595703125, 0.09082603454589844, 0.09641647338867188, 0.10200691223144531, 0.10759735107421875, 0.11318778991699219, 0.11877822875976562, 0.12436866760253906, 0.1299591064453125, 0.13554954528808594, 0.14113998413085938, 0.1467304229736328, 0.15232086181640625, 0.1579113006591797, 0.16350173950195312, 0.16909217834472656, 0.1746826171875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 6.0, 13.0, 9.0, 17.0, 29.0, 47.0, 60.0, 78.0, 127.0, 124.0, 138.0, 96.0, 72.0, 55.0, 41.0, 19.0, 22.0, 15.0, 9.0, 5.0, 9.0, 3.0, 1.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09002685546875, -0.08607959747314453, -0.08213233947753906, -0.0781850814819336, -0.07423782348632812, -0.07029056549072266, -0.06634330749511719, -0.06239604949951172, -0.05844879150390625, -0.05450153350830078, -0.05055427551269531, -0.046607017517089844, -0.042659759521484375, -0.038712501525878906, -0.03476524353027344, -0.03081798553466797, -0.0268707275390625, -0.02292346954345703, -0.018976211547851562, -0.015028953552246094, -0.011081695556640625, -0.007134437561035156, -0.0031871795654296875, 0.0007600784301757812, 0.00470733642578125, 0.008654594421386719, 0.012601852416992188, 0.016549110412597656, 0.020496368408203125, 0.024443626403808594, 0.028390884399414062, 0.03233814239501953, 0.036285400390625, 0.04023265838623047, 0.04417991638183594, 0.048127174377441406, 0.052074432373046875, 0.056021690368652344, 0.05996894836425781, 0.06391620635986328, 0.06786346435546875, 0.07181072235107422, 0.07575798034667969, 0.07970523834228516, 0.08365249633789062, 0.0875997543334961, 0.09154701232910156, 0.09549427032470703, 0.0994415283203125, 0.10338878631591797, 0.10733604431152344, 0.1112833023071289, 0.11523056030273438, 0.11917781829833984, 0.12312507629394531, 0.12707233428955078, 0.13101959228515625, 0.13496685028076172, 0.1389141082763672, 0.14286136627197266, 0.14680862426757812, 0.1507558822631836, 0.15470314025878906, 0.15865039825439453, 0.16259765625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 13.0, 11.0, 9.0, 26.0, 36.0, 39.0, 95.0, 148.0, 162.0, 160.0, 110.0, 68.0, 51.0, 21.0, 24.0, 12.0, 11.0, 2.0, 4.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9016638994216919, -0.8558385968208313, -0.8100132942199707, -0.7641879916191101, -0.7183626890182495, -0.6725373864173889, -0.6267120838165283, -0.5808867812156677, -0.5350614786148071, -0.48923617601394653, -0.44341087341308594, -0.39758557081222534, -0.35176026821136475, -0.30593496561050415, -0.26010966300964355, -0.21428436040878296, -0.16845905780792236, -0.12263375520706177, -0.07680845260620117, -0.030983150005340576, 0.01484215259552002, 0.060667455196380615, 0.10649275779724121, 0.1523180603981018, 0.1981433629989624, 0.243968665599823, 0.2897939682006836, 0.3356192708015442, 0.3814445734024048, 0.4272698760032654, 0.473095178604126, 0.5189204812049866, 0.5647459030151367, 0.6105712056159973, 0.6563965082168579, 0.7022218108177185, 0.7480471134185791, 0.7938724160194397, 0.8396977186203003, 0.8855230212211609, 0.9313483238220215, 0.9771736264228821, 1.0229989290237427, 1.068824291229248, 1.1146495342254639, 1.1604747772216797, 1.206300139427185, 1.2521255016326904, 1.2979507446289062, 1.343775987625122, 1.3896013498306274, 1.4354267120361328, 1.4812519550323486, 1.5270771980285645, 1.5729025602340698, 1.6187279224395752, 1.664553165435791, 1.7103784084320068, 1.7562037706375122, 1.8020291328430176, 1.8478543758392334, 1.8936796188354492, 1.9395049810409546, 1.98533034324646, 2.031155586242676]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 10.0, 9.0, 8.0, 13.0, 12.0, 17.0, 30.0, 16.0, 16.0, 40.0, 29.0, 29.0, 42.0, 48.0, 53.0, 58.0, 56.0, 52.0, 50.0, 43.0, 50.0, 35.0, 28.0, 31.0, 38.0, 32.0, 25.0, 18.0, 23.0, 12.0, 11.0, 11.0, 12.0, 8.0, 11.0, 3.0, 1.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7087627053260803, -0.6819206476211548, -0.6550785899162292, -0.6282365322113037, -0.6013944149017334, -0.5745524168014526, -0.5477102994918823, -0.5208682417869568, -0.49402618408203125, -0.4671841263771057, -0.4403420686721802, -0.41349998116493225, -0.3866579234600067, -0.3598158657550812, -0.33297377824783325, -0.3061317205429077, -0.2792896628379822, -0.25244760513305664, -0.2256055325269699, -0.19876345992088318, -0.17192140221595764, -0.1450793445110321, -0.11823727190494537, -0.09139519929885864, -0.0645531415939331, -0.03771107643842697, -0.010869011282920837, 0.015973053872585297, 0.04281511902809143, 0.06965717673301697, 0.0964992493391037, 0.12334132194519043, 0.15018343925476074, 0.17702549695968628, 0.203867569565773, 0.23070964217185974, 0.2575516998767853, 0.2843937575817108, 0.31123584508895874, 0.3380779027938843, 0.3649199604988098, 0.39176201820373535, 0.4186040759086609, 0.4454461634159088, 0.47228822112083435, 0.4991302788257599, 0.5259723663330078, 0.5528144240379333, 0.5796564817428589, 0.6064985394477844, 0.63334059715271, 0.6601826548576355, 0.687024712562561, 0.7138668298721313, 0.7407088875770569, 0.7675509452819824, 0.794393002986908, 0.8212350606918335, 0.848077118396759, 0.8749191761016846, 0.9017612934112549, 0.9286032915115356, 0.955445408821106, 0.9822874665260315, 1.009129524230957]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 2.0, 8.0, 3.0, 3.0, 9.0, 9.0, 7.0, 19.0, 23.0, 17.0, 15.0, 38.0, 50.0, 74.0, 132.0, 204.0, 377.0, 741.0, 1756.0, 5145.0, 21613.0, 3054061.0, 1080081.0, 20991.0, 5041.0, 1921.0, 842.0, 408.0, 216.0, 142.0, 116.0, 59.0, 42.0, 47.0, 23.0, 15.0, 11.0, 2.0, 4.0, 7.0, 2.0, 4.0, 2.0], "bins": [-0.55908203125, -0.5460777282714844, -0.5330734252929688, -0.5200691223144531, -0.5070648193359375, -0.4940605163574219, -0.48105621337890625, -0.4680519104003906, -0.455047607421875, -0.4420433044433594, -0.42903900146484375, -0.4160346984863281, -0.4030303955078125, -0.3900260925292969, -0.37702178955078125, -0.3640174865722656, -0.35101318359375, -0.3380088806152344, -0.32500457763671875, -0.3120002746582031, -0.2989959716796875, -0.2859916687011719, -0.27298736572265625, -0.2599830627441406, -0.246978759765625, -0.23397445678710938, -0.22097015380859375, -0.20796585083007812, -0.1949615478515625, -0.18195724487304688, -0.16895294189453125, -0.15594863891601562, -0.1429443359375, -0.12994003295898438, -0.11693572998046875, -0.10393142700195312, -0.0909271240234375, -0.07792282104492188, -0.06491851806640625, -0.051914215087890625, -0.038909912109375, -0.025905609130859375, -0.01290130615234375, 0.000102996826171875, 0.0131072998046875, 0.026111602783203125, 0.03911590576171875, 0.052120208740234375, 0.06512451171875, 0.07812881469726562, 0.09113311767578125, 0.10413742065429688, 0.1171417236328125, 0.13014602661132812, 0.14315032958984375, 0.15615463256835938, 0.169158935546875, 0.18216323852539062, 0.19516754150390625, 0.20817184448242188, 0.2211761474609375, 0.23418045043945312, 0.24718475341796875, 0.2601890563964844, 0.273193359375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 11.0, 13.0, 19.0, 54.0, 86.0, 98.0, 126.0, 132.0, 137.0, 131.0, 75.0, 52.0, 25.0, 10.0, 10.0, 7.0, 0.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0972900390625, -0.09500646591186523, -0.09272289276123047, -0.0904393196105957, -0.08815574645996094, -0.08587217330932617, -0.0835886001586914, -0.08130502700805664, -0.07902145385742188, -0.07673788070678711, -0.07445430755615234, -0.07217073440551758, -0.06988716125488281, -0.06760358810424805, -0.06532001495361328, -0.06303644180297852, -0.06075286865234375, -0.058469295501708984, -0.05618572235107422, -0.05390214920043945, -0.05161857604980469, -0.04933500289916992, -0.047051429748535156, -0.04476785659790039, -0.042484283447265625, -0.04020071029663086, -0.037917137145996094, -0.03563356399536133, -0.03334999084472656, -0.031066417694091797, -0.02878284454345703, -0.026499271392822266, -0.0242156982421875, -0.021932125091552734, -0.01964855194091797, -0.017364978790283203, -0.015081405639648438, -0.012797832489013672, -0.010514259338378906, -0.00823068618774414, -0.005947113037109375, -0.0036635398864746094, -0.0013799667358398438, 0.0009036064147949219, 0.0031871795654296875, 0.005470752716064453, 0.007754325866699219, 0.010037899017333984, 0.01232147216796875, 0.014605045318603516, 0.01688861846923828, 0.019172191619873047, 0.021455764770507812, 0.023739337921142578, 0.026022911071777344, 0.02830648422241211, 0.030590057373046875, 0.03287363052368164, 0.035157203674316406, 0.03744077682495117, 0.03972434997558594, 0.0420079231262207, 0.04429149627685547, 0.046575069427490234, 0.048858642578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 6.0, 10.0, 12.0, 22.0, 37.0, 56.0, 98.0, 247.0, 499.0, 1066.0, 2751.0, 9117.0, 44722.0, 3656837.0, 439289.0, 29114.0, 6365.0, 2153.0, 887.0, 456.0, 212.0, 121.0, 70.0, 39.0, 31.0, 25.0, 11.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.419921875, -0.4091224670410156, -0.39832305908203125, -0.3875236511230469, -0.3767242431640625, -0.3659248352050781, -0.35512542724609375, -0.3443260192871094, -0.333526611328125, -0.3227272033691406, -0.31192779541015625, -0.3011283874511719, -0.2903289794921875, -0.2795295715332031, -0.26873016357421875, -0.2579307556152344, -0.24713134765625, -0.23633193969726562, -0.22553253173828125, -0.21473312377929688, -0.2039337158203125, -0.19313430786132812, -0.18233489990234375, -0.17153549194335938, -0.160736083984375, -0.14993667602539062, -0.13913726806640625, -0.12833786010742188, -0.1175384521484375, -0.10673904418945312, -0.09593963623046875, -0.08514022827148438, -0.0743408203125, -0.06354141235351562, -0.05274200439453125, -0.041942596435546875, -0.0311431884765625, -0.020343780517578125, -0.00954437255859375, 0.001255035400390625, 0.012054443359375, 0.022853851318359375, 0.03365325927734375, 0.044452667236328125, 0.0552520751953125, 0.06605148315429688, 0.07685089111328125, 0.08765029907226562, 0.09844970703125, 0.10924911499023438, 0.12004852294921875, 0.13084793090820312, 0.1416473388671875, 0.15244674682617188, 0.16324615478515625, 0.17404556274414062, 0.184844970703125, 0.19564437866210938, 0.20644378662109375, 0.21724319458007812, 0.2280426025390625, 0.23884201049804688, 0.24964141845703125, 0.2604408264160156, 0.271240234375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 6.0, 9.0, 12.0, 12.0, 23.0, 31.0, 28.0, 62.0, 127.0, 247.0, 2643.0, 467.0, 147.0, 81.0, 64.0, 35.0, 26.0, 14.0, 8.0, 9.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08331298828125, -0.07993602752685547, -0.07655906677246094, -0.0731821060180664, -0.06980514526367188, -0.06642818450927734, -0.06305122375488281, -0.05967426300048828, -0.05629730224609375, -0.05292034149169922, -0.04954338073730469, -0.046166419982910156, -0.042789459228515625, -0.039412498474121094, -0.03603553771972656, -0.03265857696533203, -0.0292816162109375, -0.02590465545654297, -0.022527694702148438, -0.019150733947753906, -0.015773773193359375, -0.012396812438964844, -0.009019851684570312, -0.005642890930175781, -0.00226593017578125, 0.0011110305786132812, 0.0044879913330078125, 0.007864952087402344, 0.011241912841796875, 0.014618873596191406, 0.017995834350585938, 0.02137279510498047, 0.024749755859375, 0.02812671661376953, 0.03150367736816406, 0.034880638122558594, 0.038257598876953125, 0.041634559631347656, 0.04501152038574219, 0.04838848114013672, 0.05176544189453125, 0.05514240264892578, 0.05851936340332031, 0.061896324157714844, 0.06527328491210938, 0.0686502456665039, 0.07202720642089844, 0.07540416717529297, 0.0787811279296875, 0.08215808868408203, 0.08553504943847656, 0.0889120101928711, 0.09228897094726562, 0.09566593170166016, 0.09904289245605469, 0.10241985321044922, 0.10579681396484375, 0.10917377471923828, 0.11255073547363281, 0.11592769622802734, 0.11930465698242188, 0.1226816177368164, 0.12605857849121094, 0.12943553924560547, 0.1328125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 8.0, 57.0, 394.0, 465.0, 65.0, 16.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3852362632751465, -2.3208463191986084, -2.2564563751220703, -2.192066192626953, -2.127676248550415, -2.063286304473877, -1.9988962411880493, -1.9345061779022217, -1.8701162338256836, -1.8057262897491455, -1.7413362264633179, -1.6769461631774902, -1.6125562191009521, -1.548166275024414, -1.4837762117385864, -1.4193861484527588, -1.3549962043762207, -1.2906062602996826, -1.226216197013855, -1.1618261337280273, -1.0974361896514893, -1.0330462455749512, -0.9686561822891235, -0.9042661786079407, -0.8398761749267578, -0.775486171245575, -0.7110961675643921, -0.6467061638832092, -0.5823161602020264, -0.5179261565208435, -0.45353615283966064, -0.3891461491584778, -0.3247559070587158, -0.26036590337753296, -0.1959758996963501, -0.13158589601516724, -0.06719589233398438, -0.0028058886528015137, 0.06158411502838135, 0.1259741187095642, 0.19036412239074707, 0.25475412607192993, 0.3191441297531128, 0.38353413343429565, 0.4479241371154785, 0.5123141407966614, 0.5767041444778442, 0.6410941481590271, 0.70548415184021, 0.7698741555213928, 0.8342641592025757, 0.8986541628837585, 0.9630441665649414, 1.0274341106414795, 1.0918241739273071, 1.1562142372131348, 1.2206041812896729, 1.284994125366211, 1.3493841886520386, 1.4137742519378662, 1.4781641960144043, 1.5425541400909424, 1.60694420337677, 1.6713342666625977, 1.7357242107391357]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 3.0, 8.0, 13.0, 10.0, 28.0, 23.0, 24.0, 24.0, 29.0, 47.0, 46.0, 61.0, 57.0, 61.0, 71.0, 65.0, 44.0, 55.0, 56.0, 54.0, 50.0, 44.0, 35.0, 25.0, 19.0, 16.0, 11.0, 5.0, 5.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3651965260505676, -0.3546462953090668, -0.34409603476524353, -0.3335458040237427, -0.32299554347991943, -0.3124453127384186, -0.3018950819969177, -0.2913448214530945, -0.28079459071159363, -0.2702443599700928, -0.25969409942626953, -0.24914386868476868, -0.23859362304210663, -0.22804337739944458, -0.21749314665794373, -0.20694290101528168, -0.19639265537261963, -0.18584240972995758, -0.17529216408729553, -0.16474193334579468, -0.15419168770313263, -0.14364144206047058, -0.13309121131896973, -0.12254096567630768, -0.11199072003364563, -0.10144047439098358, -0.09089023619890213, -0.08033999800682068, -0.06978975236415863, -0.05923951044678688, -0.04868926852941513, -0.03813903033733368, -0.02758878469467163, -0.01703854277729988, -0.006488300859928131, 0.004061941057443619, 0.014612182974815369, 0.02516242489218712, 0.03571266680955887, 0.04626290500164032, 0.05681315064430237, 0.06736339628696442, 0.07791363447904587, 0.08846387267112732, 0.09901411831378937, 0.10956436395645142, 0.12011460214853287, 0.13066484034061432, 0.14121508598327637, 0.15176533162593842, 0.16231557726860046, 0.17286580801010132, 0.18341605365276337, 0.19396629929542542, 0.20451653003692627, 0.21506677567958832, 0.22561702132225037, 0.23616726696491241, 0.24671751260757446, 0.2572677433490753, 0.26781797409057617, 0.2783682346343994, 0.28891846537590027, 0.2994686961174011, 0.31001895666122437]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 6.0, 7.0, 16.0, 23.0, 23.0, 43.0, 51.0, 56.0, 84.0, 104.0, 183.0, 219.0, 371.0, 531.0, 867.0, 1550.0, 3022.0, 7585.0, 28433.0, 161700.0, 642550.0, 158799.0, 27653.0, 7615.0, 2943.0, 1519.0, 820.0, 543.0, 383.0, 226.0, 179.0, 135.0, 88.0, 60.0, 46.0, 40.0, 26.0, 12.0, 10.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.31494140625, -0.30606842041015625, -0.2971954345703125, -0.28832244873046875, -0.279449462890625, -0.27057647705078125, -0.2617034912109375, -0.25283050537109375, -0.24395751953125, -0.23508453369140625, -0.2262115478515625, -0.21733856201171875, -0.208465576171875, -0.19959259033203125, -0.1907196044921875, -0.18184661865234375, -0.1729736328125, -0.16410064697265625, -0.1552276611328125, -0.14635467529296875, -0.137481689453125, -0.12860870361328125, -0.1197357177734375, -0.11086273193359375, -0.10198974609375, -0.09311676025390625, -0.0842437744140625, -0.07537078857421875, -0.066497802734375, -0.05762481689453125, -0.0487518310546875, -0.03987884521484375, -0.031005859375, -0.02213287353515625, -0.0132598876953125, -0.00438690185546875, 0.004486083984375, 0.01335906982421875, 0.0222320556640625, 0.03110504150390625, 0.03997802734375, 0.04885101318359375, 0.0577239990234375, 0.06659698486328125, 0.075469970703125, 0.08434295654296875, 0.0932159423828125, 0.10208892822265625, 0.1109619140625, 0.11983489990234375, 0.1287078857421875, 0.13758087158203125, 0.146453857421875, 0.15532684326171875, 0.1641998291015625, 0.17307281494140625, 0.18194580078125, 0.19081878662109375, 0.1996917724609375, 0.20856475830078125, 0.217437744140625, 0.22631072998046875, 0.2351837158203125, 0.24405670166015625, 0.2529296875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 14.0, 16.0, 51.0, 75.0, 103.0, 128.0, 125.0, 145.0, 136.0, 91.0, 42.0, 27.0, 14.0, 9.0, 3.0, 3.0, 2.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09063720703125, -0.08830022811889648, -0.08596324920654297, -0.08362627029418945, -0.08128929138183594, -0.07895231246948242, -0.0766153335571289, -0.07427835464477539, -0.07194137573242188, -0.06960439682006836, -0.06726741790771484, -0.06493043899536133, -0.06259346008300781, -0.0602564811706543, -0.05791950225830078, -0.055582523345947266, -0.05324554443359375, -0.050908565521240234, -0.04857158660888672, -0.0462346076965332, -0.04389762878417969, -0.04156064987182617, -0.039223670959472656, -0.03688669204711914, -0.034549713134765625, -0.03221273422241211, -0.029875755310058594, -0.027538776397705078, -0.025201797485351562, -0.022864818572998047, -0.02052783966064453, -0.018190860748291016, -0.0158538818359375, -0.013516902923583984, -0.011179924011230469, -0.008842945098876953, -0.0065059661865234375, -0.004168987274169922, -0.0018320083618164062, 0.0005049705505371094, 0.002841949462890625, 0.005178928375244141, 0.007515907287597656, 0.009852886199951172, 0.012189865112304688, 0.014526844024658203, 0.01686382293701172, 0.019200801849365234, 0.02153778076171875, 0.023874759674072266, 0.02621173858642578, 0.028548717498779297, 0.030885696411132812, 0.03322267532348633, 0.035559654235839844, 0.03789663314819336, 0.040233612060546875, 0.04257059097290039, 0.044907569885253906, 0.04724454879760742, 0.04958152770996094, 0.05191850662231445, 0.05425548553466797, 0.056592464447021484, 0.058929443359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 4.0, 4.0, 7.0, 11.0, 12.0, 22.0, 27.0, 56.0, 80.0, 114.0, 207.0, 315.0, 471.0, 817.0, 1391.0, 2362.0, 3832.0, 6920.0, 12609.0, 22556.0, 42987.0, 85359.0, 176835.0, 294668.0, 196539.0, 95582.0, 47371.0, 25184.0, 13828.0, 7634.0, 4271.0, 2511.0, 1482.0, 954.0, 546.0, 325.0, 225.0, 135.0, 80.0, 75.0, 45.0, 31.0, 25.0, 15.0, 12.0, 6.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.094970703125, -0.0920553207397461, -0.08913993835449219, -0.08622455596923828, -0.08330917358398438, -0.08039379119873047, -0.07747840881347656, -0.07456302642822266, -0.07164764404296875, -0.06873226165771484, -0.06581687927246094, -0.06290149688720703, -0.059986114501953125, -0.05707073211669922, -0.05415534973144531, -0.051239967346191406, -0.0483245849609375, -0.045409202575683594, -0.04249382019042969, -0.03957843780517578, -0.036663055419921875, -0.03374767303466797, -0.030832290649414062, -0.027916908264160156, -0.02500152587890625, -0.022086143493652344, -0.019170761108398438, -0.01625537872314453, -0.013339996337890625, -0.010424613952636719, -0.0075092315673828125, -0.004593849182128906, -0.001678466796875, 0.0012369155883789062, 0.0041522979736328125, 0.007067680358886719, 0.009983062744140625, 0.012898445129394531, 0.015813827514648438, 0.018729209899902344, 0.02164459228515625, 0.024559974670410156, 0.027475357055664062, 0.03039073944091797, 0.033306121826171875, 0.03622150421142578, 0.03913688659667969, 0.042052268981933594, 0.0449676513671875, 0.047883033752441406, 0.05079841613769531, 0.05371379852294922, 0.056629180908203125, 0.05954456329345703, 0.06245994567871094, 0.06537532806396484, 0.06829071044921875, 0.07120609283447266, 0.07412147521972656, 0.07703685760498047, 0.07995223999023438, 0.08286762237548828, 0.08578300476074219, 0.0886983871459961, 0.09161376953125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 7.0, 7.0, 15.0, 6.0, 19.0, 10.0, 26.0, 22.0, 15.0, 20.0, 22.0, 36.0, 42.0, 34.0, 36.0, 41.0, 48.0, 37.0, 43.0, 46.0, 38.0, 46.0, 55.0, 38.0, 43.0, 38.0, 33.0, 24.0, 30.0, 18.0, 19.0, 23.0, 18.0, 10.0, 6.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 7.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1021728515625, -0.09841537475585938, -0.09465789794921875, -0.09090042114257812, -0.0871429443359375, -0.08338546752929688, -0.07962799072265625, -0.07587051391601562, -0.072113037109375, -0.06835556030273438, -0.06459808349609375, -0.060840606689453125, -0.0570831298828125, -0.053325653076171875, -0.04956817626953125, -0.045810699462890625, -0.04205322265625, -0.038295745849609375, -0.03453826904296875, -0.030780792236328125, -0.0270233154296875, -0.023265838623046875, -0.01950836181640625, -0.015750885009765625, -0.011993408203125, -0.008235931396484375, -0.00447845458984375, -0.000720977783203125, 0.0030364990234375, 0.006793975830078125, 0.01055145263671875, 0.014308929443359375, 0.01806640625, 0.021823883056640625, 0.02558135986328125, 0.029338836669921875, 0.0330963134765625, 0.036853790283203125, 0.04061126708984375, 0.044368743896484375, 0.048126220703125, 0.051883697509765625, 0.05564117431640625, 0.059398651123046875, 0.0631561279296875, 0.06691360473632812, 0.07067108154296875, 0.07442855834960938, 0.07818603515625, 0.08194351196289062, 0.08570098876953125, 0.08945846557617188, 0.0932159423828125, 0.09697341918945312, 0.10073089599609375, 0.10448837280273438, 0.108245849609375, 0.11200332641601562, 0.11576080322265625, 0.11951828002929688, 0.1232757568359375, 0.12703323364257812, 0.13079071044921875, 0.13454818725585938, 0.1383056640625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 3.0, 11.0, 16.0, 9.0, 19.0, 40.0, 62.0, 87.0, 158.0, 301.0, 570.0, 1181.0, 2992.0, 8815.0, 33301.0, 204506.0, 670549.0, 96334.0, 19595.0, 5895.0, 2172.0, 893.0, 475.0, 236.0, 119.0, 72.0, 47.0, 40.0, 15.0, 13.0, 9.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.075927734375, -0.07267189025878906, -0.06941604614257812, -0.06616020202636719, -0.06290435791015625, -0.05964851379394531, -0.056392669677734375, -0.05313682556152344, -0.0498809814453125, -0.04662513732910156, -0.043369293212890625, -0.04011344909667969, -0.03685760498046875, -0.03360176086425781, -0.030345916748046875, -0.027090072631835938, -0.023834228515625, -0.020578384399414062, -0.017322540283203125, -0.014066696166992188, -0.01081085205078125, -0.0075550079345703125, -0.004299163818359375, -0.0010433197021484375, 0.0022125244140625, 0.0054683685302734375, 0.008724212646484375, 0.011980056762695312, 0.01523590087890625, 0.018491744995117188, 0.021747589111328125, 0.025003433227539062, 0.02825927734375, 0.03151512145996094, 0.034770965576171875, 0.03802680969238281, 0.04128265380859375, 0.04453849792480469, 0.047794342041015625, 0.05105018615722656, 0.0543060302734375, 0.05756187438964844, 0.060817718505859375, 0.06407356262207031, 0.06732940673828125, 0.07058525085449219, 0.07384109497070312, 0.07709693908691406, 0.080352783203125, 0.08360862731933594, 0.08686447143554688, 0.09012031555175781, 0.09337615966796875, 0.09663200378417969, 0.09988784790039062, 0.10314369201660156, 0.1063995361328125, 0.10965538024902344, 0.11291122436523438, 0.11616706848144531, 0.11942291259765625, 0.12267875671386719, 0.12593460083007812, 0.12919044494628906, 0.1324462890625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 8.0, 14.0, 19.0, 60.0, 80.0, 181.0, 276.0, 183.0, 74.0, 45.0, 19.0, 8.0, 8.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00013637542724609375, -0.00013203173875808716, -0.00012768805027008057, -0.00012334436178207397, -0.00011900067329406738, -0.00011465698480606079, -0.0001103132963180542, -0.00010596960783004761, -0.00010162591934204102, -9.728223085403442e-05, -9.293854236602783e-05, -8.859485387802124e-05, -8.425116539001465e-05, -7.990747690200806e-05, -7.556378841400146e-05, -7.122009992599487e-05, -6.687641143798828e-05, -6.253272294998169e-05, -5.81890344619751e-05, -5.3845345973968506e-05, -4.9501657485961914e-05, -4.515796899795532e-05, -4.081428050994873e-05, -3.647059202194214e-05, -3.212690353393555e-05, -2.7783215045928955e-05, -2.3439526557922363e-05, -1.909583806991577e-05, -1.475214958190918e-05, -1.0408461093902588e-05, -6.064772605895996e-06, -1.7210841178894043e-06, 2.6226043701171875e-06, 6.966292858123779e-06, 1.1309981346130371e-05, 1.5653669834136963e-05, 1.9997358322143555e-05, 2.4341046810150146e-05, 2.8684735298156738e-05, 3.302842378616333e-05, 3.737211227416992e-05, 4.1715800762176514e-05, 4.6059489250183105e-05, 5.04031777381897e-05, 5.474686622619629e-05, 5.909055471420288e-05, 6.343424320220947e-05, 6.777793169021606e-05, 7.212162017822266e-05, 7.646530866622925e-05, 8.080899715423584e-05, 8.515268564224243e-05, 8.949637413024902e-05, 9.384006261825562e-05, 9.818375110626221e-05, 0.0001025274395942688, 0.00010687112808227539, 0.00011121481657028198, 0.00011555850505828857, 0.00011990219354629517, 0.00012424588203430176, 0.00012858957052230835, 0.00013293325901031494, 0.00013727694749832153, 0.00014162063598632812]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 5.0, 10.0, 14.0, 19.0, 28.0, 43.0, 57.0, 88.0, 160.0, 246.0, 427.0, 696.0, 1112.0, 2080.0, 4020.0, 7668.0, 15953.0, 36602.0, 97546.0, 327136.0, 368748.0, 109698.0, 40599.0, 17611.0, 8323.0, 4258.0, 2244.0, 1256.0, 727.0, 433.0, 246.0, 157.0, 107.0, 66.0, 52.0, 33.0, 28.0, 14.0, 8.0, 10.0, 12.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.050689697265625, -0.04900312423706055, -0.047316551208496094, -0.04562997817993164, -0.04394340515136719, -0.042256832122802734, -0.04057025909423828, -0.03888368606567383, -0.037197113037109375, -0.03551054000854492, -0.03382396697998047, -0.032137393951416016, -0.030450820922851562, -0.02876424789428711, -0.027077674865722656, -0.025391101837158203, -0.02370452880859375, -0.022017955780029297, -0.020331382751464844, -0.01864480972290039, -0.016958236694335938, -0.015271663665771484, -0.013585090637207031, -0.011898517608642578, -0.010211944580078125, -0.008525371551513672, -0.006838798522949219, -0.005152225494384766, -0.0034656524658203125, -0.0017790794372558594, -9.250640869140625e-05, 0.0015940666198730469, 0.0032806396484375, 0.004967212677001953, 0.006653785705566406, 0.00834035873413086, 0.010026931762695312, 0.011713504791259766, 0.013400077819824219, 0.015086650848388672, 0.016773223876953125, 0.018459796905517578, 0.02014636993408203, 0.021832942962646484, 0.023519515991210938, 0.02520608901977539, 0.026892662048339844, 0.028579235076904297, 0.03026580810546875, 0.0319523811340332, 0.033638954162597656, 0.03532552719116211, 0.03701210021972656, 0.038698673248291016, 0.04038524627685547, 0.04207181930541992, 0.043758392333984375, 0.04544496536254883, 0.04713153839111328, 0.048818111419677734, 0.05050468444824219, 0.05219125747680664, 0.053877830505371094, 0.05556440353393555, 0.0572509765625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 4.0, 8.0, 11.0, 13.0, 12.0, 8.0, 15.0, 18.0, 21.0, 32.0, 46.0, 54.0, 63.0, 87.0, 74.0, 82.0, 86.0, 70.0, 50.0, 55.0, 40.0, 39.0, 24.0, 23.0, 14.0, 10.0, 13.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07244873046875, -0.07020854949951172, -0.06796836853027344, -0.06572818756103516, -0.06348800659179688, -0.061247825622558594, -0.05900764465332031, -0.05676746368408203, -0.05452728271484375, -0.05228710174560547, -0.05004692077636719, -0.047806739807128906, -0.045566558837890625, -0.043326377868652344, -0.04108619689941406, -0.03884601593017578, -0.0366058349609375, -0.03436565399169922, -0.03212547302246094, -0.029885292053222656, -0.027645111083984375, -0.025404930114746094, -0.023164749145507812, -0.02092456817626953, -0.01868438720703125, -0.01644420623779297, -0.014204025268554688, -0.011963844299316406, -0.009723663330078125, -0.007483482360839844, -0.0052433013916015625, -0.0030031204223632812, -0.000762939453125, 0.0014772415161132812, 0.0037174224853515625, 0.005957603454589844, 0.008197784423828125, 0.010437965393066406, 0.012678146362304688, 0.014918327331542969, 0.01715850830078125, 0.01939868927001953, 0.021638870239257812, 0.023879051208496094, 0.026119232177734375, 0.028359413146972656, 0.030599594116210938, 0.03283977508544922, 0.0350799560546875, 0.03732013702392578, 0.03956031799316406, 0.041800498962402344, 0.044040679931640625, 0.046280860900878906, 0.04852104187011719, 0.05076122283935547, 0.05300140380859375, 0.05524158477783203, 0.05748176574707031, 0.059721946716308594, 0.061962127685546875, 0.06420230865478516, 0.06644248962402344, 0.06868267059326172, 0.0709228515625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 3.0, 15.0, 43.0, 93.0, 277.0, 352.0, 134.0, 48.0, 28.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4928957223892212, -1.4060356616973877, -1.3191754817962646, -1.2323154211044312, -1.145455241203308, -1.0585951805114746, -0.9717350602149963, -0.8848749399185181, -0.7980148196220398, -0.7111546993255615, -0.6242945790290833, -0.537434458732605, -0.4505743682384491, -0.3637142479419708, -0.27685415744781494, -0.18999403715133667, -0.1031339168548584, -0.016273804008960724, 0.07058630883693695, 0.15744641423225403, 0.2443065345287323, 0.33116665482521057, 0.41802674531936646, 0.5048868656158447, 0.591746985912323, 0.6786071062088013, 0.7654672265052795, 0.8523273468017578, 0.9391874074935913, 1.0260475873947144, 1.1129076480865479, 1.199767827987671, 1.286628007888794, 1.3734880685806274, 1.4603482484817505, 1.547208309173584, 1.634068489074707, 1.7209285497665405, 1.807788610458374, 1.894648790359497, 1.9815089702606201, 2.068369150161743, 2.155229091644287, 2.24208927154541, 2.328949451446533, 2.4158096313476562, 2.5026695728302, 2.5895297527313232, 2.676389694213867, 2.7632498741149902, 2.850109815597534, 2.9369699954986572, 3.0238301753997803, 3.1106903553009033, 3.1975502967834473, 3.2844104766845703, 3.3712706565856934, 3.4581308364868164, 3.5449907779693604, 3.6318509578704834, 3.7187111377716064, 3.8055713176727295, 3.8924312591552734, 3.9792914390563965, 4.0661516189575195]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 13.0, 8.0, 7.0, 9.0, 11.0, 17.0, 19.0, 12.0, 23.0, 25.0, 35.0, 42.0, 38.0, 41.0, 47.0, 50.0, 56.0, 48.0, 47.0, 48.0, 46.0, 57.0, 46.0, 45.0, 29.0, 31.0, 24.0, 28.0, 15.0, 19.0, 15.0, 15.0, 10.0, 9.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8184596300125122, -0.794048011302948, -0.7696363925933838, -0.7452247142791748, -0.7208130955696106, -0.6964014768600464, -0.6719898581504822, -0.647578239440918, -0.6231666207313538, -0.5987550020217896, -0.5743433833122253, -0.5499317646026611, -0.5255200862884521, -0.5011084675788879, -0.47669684886932373, -0.4522852301597595, -0.4278735816478729, -0.4034619629383087, -0.3790503144264221, -0.3546386957168579, -0.3302270770072937, -0.3058154582977295, -0.2814038097858429, -0.2569921910762787, -0.23258055746555328, -0.20816892385482788, -0.18375730514526367, -0.15934567153453827, -0.13493403792381287, -0.11052241921424866, -0.08611078560352325, -0.061699166893959045, -0.03728753328323364, -0.012875905260443687, 0.011535722762346268, 0.03594735264778137, 0.06035897880792618, 0.08477060496807098, 0.10918223857879639, 0.1335938572883606, 0.158005490899086, 0.1824171245098114, 0.2068287432193756, 0.231240376830101, 0.2556520104408264, 0.2800636291503906, 0.30447524785995483, 0.32888686656951904, 0.35329851508140564, 0.37771013379096985, 0.40212178230285645, 0.42653340101242065, 0.45094501972198486, 0.4753566384315491, 0.49976828694343567, 0.5241799354553223, 0.5485915541648865, 0.5730031728744507, 0.5974147915840149, 0.6218264102935791, 0.6462380886077881, 0.6706497073173523, 0.6950613260269165, 0.7194729447364807, 0.7438845634460449]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 10.0, 8.0, 12.0, 20.0, 23.0, 26.0, 28.0, 69.0, 92.0, 201.0, 402.0, 1001.0, 3476.0, 20633.0, 4096880.0, 62257.0, 6098.0, 1664.0, 625.0, 306.0, 138.0, 94.0, 63.0, 39.0, 27.0, 21.0, 25.0, 12.0, 5.0, 7.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.404541015625, -0.3932037353515625, -0.381866455078125, -0.3705291748046875, -0.35919189453125, -0.3478546142578125, -0.336517333984375, -0.3251800537109375, -0.3138427734375, -0.3025054931640625, -0.291168212890625, -0.2798309326171875, -0.26849365234375, -0.2571563720703125, -0.245819091796875, -0.2344818115234375, -0.22314453125, -0.2118072509765625, -0.200469970703125, -0.1891326904296875, -0.17779541015625, -0.1664581298828125, -0.155120849609375, -0.1437835693359375, -0.1324462890625, -0.1211090087890625, -0.109771728515625, -0.0984344482421875, -0.08709716796875, -0.0757598876953125, -0.064422607421875, -0.0530853271484375, -0.041748046875, -0.0304107666015625, -0.019073486328125, -0.0077362060546875, 0.00360107421875, 0.0149383544921875, 0.026275634765625, 0.0376129150390625, 0.0489501953125, 0.0602874755859375, 0.071624755859375, 0.0829620361328125, 0.09429931640625, 0.1056365966796875, 0.116973876953125, 0.1283111572265625, 0.1396484375, 0.1509857177734375, 0.162322998046875, 0.1736602783203125, 0.18499755859375, 0.1963348388671875, 0.207672119140625, 0.2190093994140625, 0.2303466796875, 0.2416839599609375, 0.253021240234375, 0.2643585205078125, 0.27569580078125, 0.2870330810546875, 0.298370361328125, 0.3097076416015625, 0.321044921875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 11.0, 12.0, 27.0, 49.0, 79.0, 101.0, 135.0, 141.0, 138.0, 116.0, 75.0, 47.0, 25.0, 17.0, 8.0, 3.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0914306640625, -0.08906269073486328, -0.08669471740722656, -0.08432674407958984, -0.08195877075195312, -0.0795907974243164, -0.07722282409667969, -0.07485485076904297, -0.07248687744140625, -0.07011890411376953, -0.06775093078613281, -0.0653829574584961, -0.06301498413085938, -0.060647010803222656, -0.05827903747558594, -0.05591106414794922, -0.0535430908203125, -0.05117511749267578, -0.04880714416503906, -0.046439170837402344, -0.044071197509765625, -0.041703224182128906, -0.03933525085449219, -0.03696727752685547, -0.03459930419921875, -0.03223133087158203, -0.029863357543945312, -0.027495384216308594, -0.025127410888671875, -0.022759437561035156, -0.020391464233398438, -0.01802349090576172, -0.015655517578125, -0.013287544250488281, -0.010919570922851562, -0.008551597595214844, -0.006183624267578125, -0.0038156509399414062, -0.0014476776123046875, 0.0009202957153320312, 0.00328826904296875, 0.005656242370605469, 0.008024215698242188, 0.010392189025878906, 0.012760162353515625, 0.015128135681152344, 0.017496109008789062, 0.01986408233642578, 0.0222320556640625, 0.02460002899169922, 0.026968002319335938, 0.029335975646972656, 0.031703948974609375, 0.034071922302246094, 0.03643989562988281, 0.03880786895751953, 0.04117584228515625, 0.04354381561279297, 0.04591178894042969, 0.048279762268066406, 0.050647735595703125, 0.053015708923339844, 0.05538368225097656, 0.05775165557861328, 0.06011962890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 9.0, 26.0, 30.0, 40.0, 84.0, 121.0, 212.0, 314.0, 593.0, 1135.0, 2692.0, 7286.0, 26544.0, 366148.0, 3733942.0, 39565.0, 9314.0, 3276.0, 1334.0, 679.0, 369.0, 199.0, 144.0, 88.0, 48.0, 27.0, 14.0, 15.0, 9.0, 9.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.197265625, -0.19025039672851562, -0.18323516845703125, -0.17621994018554688, -0.1692047119140625, -0.16218948364257812, -0.15517425537109375, -0.14815902709960938, -0.141143798828125, -0.13412857055664062, -0.12711334228515625, -0.12009811401367188, -0.1130828857421875, -0.10606765747070312, -0.09905242919921875, -0.09203720092773438, -0.08502197265625, -0.07800674438476562, -0.07099151611328125, -0.06397628784179688, -0.0569610595703125, -0.049945831298828125, -0.04293060302734375, -0.035915374755859375, -0.028900146484375, -0.021884918212890625, -0.01486968994140625, -0.007854461669921875, -0.0008392333984375, 0.006175994873046875, 0.01319122314453125, 0.020206451416015625, 0.0272216796875, 0.034236907958984375, 0.04125213623046875, 0.048267364501953125, 0.0552825927734375, 0.062297821044921875, 0.06931304931640625, 0.07632827758789062, 0.083343505859375, 0.09035873413085938, 0.09737396240234375, 0.10438919067382812, 0.1114044189453125, 0.11841964721679688, 0.12543487548828125, 0.13245010375976562, 0.13946533203125, 0.14648056030273438, 0.15349578857421875, 0.16051101684570312, 0.1675262451171875, 0.17454147338867188, 0.18155670166015625, 0.18857192993164062, 0.195587158203125, 0.20260238647460938, 0.20961761474609375, 0.21663284301757812, 0.2236480712890625, 0.23066329956054688, 0.23767852783203125, 0.24469375610351562, 0.251708984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 3.0, 4.0, 7.0, 7.0, 7.0, 11.0, 12.0, 13.0, 31.0, 50.0, 92.0, 188.0, 2847.0, 498.0, 129.0, 64.0, 37.0, 14.0, 16.0, 15.0, 8.0, 4.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0843505859375, -0.08205747604370117, -0.07976436614990234, -0.07747125625610352, -0.07517814636230469, -0.07288503646850586, -0.07059192657470703, -0.0682988166809082, -0.06600570678710938, -0.06371259689331055, -0.06141948699951172, -0.05912637710571289, -0.05683326721191406, -0.054540157318115234, -0.052247047424316406, -0.04995393753051758, -0.04766082763671875, -0.04536771774291992, -0.043074607849121094, -0.040781497955322266, -0.03848838806152344, -0.03619527816772461, -0.03390216827392578, -0.03160905838012695, -0.029315948486328125, -0.027022838592529297, -0.02472972869873047, -0.02243661880493164, -0.020143508911132812, -0.017850399017333984, -0.015557289123535156, -0.013264179229736328, -0.0109710693359375, -0.008677959442138672, -0.006384849548339844, -0.004091739654541016, -0.0017986297607421875, 0.0004944801330566406, 0.0027875900268554688, 0.005080699920654297, 0.007373809814453125, 0.009666919708251953, 0.011960029602050781, 0.01425313949584961, 0.016546249389648438, 0.018839359283447266, 0.021132469177246094, 0.023425579071044922, 0.02571868896484375, 0.028011798858642578, 0.030304908752441406, 0.032598018646240234, 0.03489112854003906, 0.03718423843383789, 0.03947734832763672, 0.04177045822143555, 0.044063568115234375, 0.0463566780090332, 0.04864978790283203, 0.05094289779663086, 0.05323600769042969, 0.055529117584228516, 0.057822227478027344, 0.06011533737182617, 0.062408447265625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 10.0, 43.0, 134.0, 371.0, 312.0, 92.0, 21.0, 15.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8899651765823364, -0.8644610047340393, -0.8389568328857422, -0.8134527206420898, -0.7879485487937927, -0.7624443769454956, -0.7369402050971985, -0.7114360332489014, -0.685931921005249, -0.6604277491569519, -0.6349235773086548, -0.6094194650650024, -0.5839152932167053, -0.5584111213684082, -0.5329069495201111, -0.507402777671814, -0.48189860582351685, -0.4563944339752197, -0.430890291929245, -0.4053861200809479, -0.37988197803497314, -0.354377806186676, -0.3288736343383789, -0.3033694624900818, -0.27786532044410706, -0.25236114859580994, -0.2268570065498352, -0.20135283470153809, -0.17584867775440216, -0.15034452080726624, -0.12484034895896912, -0.09933619201183319, -0.07383203506469727, -0.04832787439227104, -0.022823713719844818, 0.002680450677871704, 0.02818460762500763, 0.053688764572143555, 0.07919293642044067, 0.1046970933675766, 0.13020125031471252, 0.15570540726184845, 0.18120956420898438, 0.2067137360572815, 0.23221789300441742, 0.25772204995155334, 0.28322622179985046, 0.3087303638458252, 0.3342345356941223, 0.35973870754241943, 0.38524284958839417, 0.4107470214366913, 0.436251163482666, 0.46175533533096313, 0.48725950717926025, 0.5127636790275574, 0.5382678508758545, 0.5637720227241516, 0.5892761945724487, 0.6147803068161011, 0.6402844786643982, 0.6657886505126953, 0.6912928223609924, 0.7167969942092896, 0.7423011064529419]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 11.0, 11.0, 6.0, 10.0, 24.0, 19.0, 24.0, 20.0, 20.0, 36.0, 28.0, 20.0, 43.0, 37.0, 38.0, 38.0, 52.0, 47.0, 49.0, 22.0, 38.0, 39.0, 39.0, 41.0, 49.0, 32.0, 24.0, 23.0, 27.0, 13.0, 19.0, 16.0, 14.0, 12.0, 12.0, 6.0, 9.0, 5.0, 3.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.15403872728347778, -0.14933548867702484, -0.1446322500705719, -0.13992901146411896, -0.13522577285766602, -0.13052251935005188, -0.12581928074359894, -0.121116042137146, -0.11641280353069305, -0.11170956492424011, -0.10700632631778717, -0.10230308026075363, -0.09759984165430069, -0.09289660304784775, -0.08819335699081421, -0.08349011838436127, -0.07878687977790833, -0.07408364117145538, -0.06938040256500244, -0.0646771565079689, -0.05997391790151596, -0.05527067929506302, -0.05056743696331978, -0.04586419463157654, -0.041160956025123596, -0.036457717418670654, -0.031754475086927414, -0.027051234617829323, -0.02234799414873123, -0.01764475367963314, -0.01294151321053505, -0.008238270878791809, -0.003535032272338867, 0.001168208196759224, 0.005871448665857315, 0.010574689134955406, 0.015277929604053497, 0.01998117007315159, 0.02468441054224968, 0.02938765287399292, 0.03409089148044586, 0.038794130086898804, 0.043497372418642044, 0.048200614750385284, 0.052903853356838226, 0.05760709196329117, 0.06231033429503441, 0.06701357662677765, 0.07171681523323059, 0.07642005383968353, 0.08112329244613647, 0.08582653850317001, 0.09052977710962296, 0.0952330157160759, 0.09993626177310944, 0.10463950037956238, 0.10934273898601532, 0.11404597759246826, 0.1187492161989212, 0.12345246225595474, 0.12815570831298828, 0.13285894691944122, 0.13756218552589417, 0.1422654241323471, 0.14696866273880005]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 7.0, 8.0, 14.0, 7.0, 22.0, 22.0, 38.0, 34.0, 64.0, 86.0, 99.0, 154.0, 168.0, 271.0, 384.0, 572.0, 862.0, 1462.0, 2846.0, 7188.0, 24378.0, 116452.0, 588543.0, 241384.0, 43258.0, 11338.0, 3969.0, 1755.0, 1029.0, 582.0, 429.0, 267.0, 215.0, 162.0, 110.0, 77.0, 65.0, 59.0, 35.0, 41.0, 20.0, 17.0, 22.0, 11.0, 10.0, 10.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2291259765625, -0.22189712524414062, -0.21466827392578125, -0.20743942260742188, -0.2002105712890625, -0.19298171997070312, -0.18575286865234375, -0.17852401733398438, -0.171295166015625, -0.16406631469726562, -0.15683746337890625, -0.14960861206054688, -0.1423797607421875, -0.13515090942382812, -0.12792205810546875, -0.12069320678710938, -0.11346435546875, -0.10623550415039062, -0.09900665283203125, -0.09177780151367188, -0.0845489501953125, -0.07732009887695312, -0.07009124755859375, -0.06286239624023438, -0.055633544921875, -0.048404693603515625, -0.04117584228515625, -0.033946990966796875, -0.0267181396484375, -0.019489288330078125, -0.01226043701171875, -0.005031585693359375, 0.002197265625, 0.009426116943359375, 0.01665496826171875, 0.023883819580078125, 0.0311126708984375, 0.038341522216796875, 0.04557037353515625, 0.052799224853515625, 0.060028076171875, 0.06725692749023438, 0.07448577880859375, 0.08171463012695312, 0.0889434814453125, 0.09617233276367188, 0.10340118408203125, 0.11063003540039062, 0.11785888671875, 0.12508773803710938, 0.13231658935546875, 0.13954544067382812, 0.1467742919921875, 0.15400314331054688, 0.16123199462890625, 0.16846084594726562, 0.175689697265625, 0.18291854858398438, 0.19014739990234375, 0.19737625122070312, 0.2046051025390625, 0.21183395385742188, 0.21906280517578125, 0.22629165649414062, 0.2335205078125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 13.0, 19.0, 38.0, 63.0, 91.0, 116.0, 137.0, 134.0, 138.0, 95.0, 62.0, 35.0, 18.0, 19.0, 4.0, 4.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08843994140625, -0.08612203598022461, -0.08380413055419922, -0.08148622512817383, -0.07916831970214844, -0.07685041427612305, -0.07453250885009766, -0.07221460342407227, -0.06989669799804688, -0.06757879257202148, -0.0652608871459961, -0.0629429817199707, -0.06062507629394531, -0.05830717086791992, -0.05598926544189453, -0.05367136001586914, -0.05135345458984375, -0.04903554916381836, -0.04671764373779297, -0.04439973831176758, -0.04208183288574219, -0.0397639274597168, -0.037446022033691406, -0.035128116607666016, -0.032810211181640625, -0.030492305755615234, -0.028174400329589844, -0.025856494903564453, -0.023538589477539062, -0.021220684051513672, -0.01890277862548828, -0.01658487319946289, -0.0142669677734375, -0.01194906234741211, -0.009631156921386719, -0.007313251495361328, -0.0049953460693359375, -0.002677440643310547, -0.00035953521728515625, 0.0019583702087402344, 0.004276275634765625, 0.006594181060791016, 0.008912086486816406, 0.011229991912841797, 0.013547897338867188, 0.015865802764892578, 0.01818370819091797, 0.02050161361694336, 0.02281951904296875, 0.02513742446899414, 0.02745532989501953, 0.029773235321044922, 0.03209114074707031, 0.0344090461730957, 0.036726951599121094, 0.039044857025146484, 0.041362762451171875, 0.043680667877197266, 0.045998573303222656, 0.04831647872924805, 0.05063438415527344, 0.05295228958129883, 0.05527019500732422, 0.05758810043334961, 0.059906005859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 10.0, 7.0, 15.0, 27.0, 37.0, 63.0, 112.0, 221.0, 384.0, 727.0, 1525.0, 3189.0, 7215.0, 17643.0, 47374.0, 140784.0, 417914.0, 274596.0, 84965.0, 30264.0, 11866.0, 5040.0, 2231.0, 1060.0, 570.0, 306.0, 157.0, 99.0, 44.0, 39.0, 16.0, 15.0, 7.0, 10.0, 3.0, 5.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11492919921875, -0.1110696792602539, -0.10721015930175781, -0.10335063934326172, -0.09949111938476562, -0.09563159942626953, -0.09177207946777344, -0.08791255950927734, -0.08405303955078125, -0.08019351959228516, -0.07633399963378906, -0.07247447967529297, -0.06861495971679688, -0.06475543975830078, -0.06089591979980469, -0.057036399841308594, -0.0531768798828125, -0.049317359924316406, -0.04545783996582031, -0.04159832000732422, -0.037738800048828125, -0.03387928009033203, -0.030019760131835938, -0.026160240173339844, -0.02230072021484375, -0.018441200256347656, -0.014581680297851562, -0.010722160339355469, -0.006862640380859375, -0.0030031204223632812, 0.0008563995361328125, 0.004715919494628906, 0.008575439453125, 0.012434959411621094, 0.016294479370117188, 0.02015399932861328, 0.024013519287109375, 0.02787303924560547, 0.03173255920410156, 0.035592079162597656, 0.03945159912109375, 0.043311119079589844, 0.04717063903808594, 0.05103015899658203, 0.054889678955078125, 0.05874919891357422, 0.06260871887207031, 0.0664682388305664, 0.0703277587890625, 0.0741872787475586, 0.07804679870605469, 0.08190631866455078, 0.08576583862304688, 0.08962535858154297, 0.09348487854003906, 0.09734439849853516, 0.10120391845703125, 0.10506343841552734, 0.10892295837402344, 0.11278247833251953, 0.11664199829101562, 0.12050151824951172, 0.12436103820800781, 0.1282205581665039, 0.132080078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 9.0, 1.0, 4.0, 16.0, 15.0, 12.0, 16.0, 12.0, 15.0, 25.0, 23.0, 28.0, 41.0, 38.0, 36.0, 51.0, 52.0, 30.0, 32.0, 40.0, 53.0, 53.0, 32.0, 51.0, 25.0, 35.0, 25.0, 48.0, 29.0, 23.0, 25.0, 23.0, 14.0, 18.0, 7.0, 7.0, 10.0, 5.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1156005859375, -0.11217594146728516, -0.10875129699707031, -0.10532665252685547, -0.10190200805664062, -0.09847736358642578, -0.09505271911621094, -0.0916280746459961, -0.08820343017578125, -0.0847787857055664, -0.08135414123535156, -0.07792949676513672, -0.07450485229492188, -0.07108020782470703, -0.06765556335449219, -0.06423091888427734, -0.0608062744140625, -0.057381629943847656, -0.05395698547363281, -0.05053234100341797, -0.047107696533203125, -0.04368305206298828, -0.04025840759277344, -0.036833763122558594, -0.03340911865234375, -0.029984474182128906, -0.026559829711914062, -0.02313518524169922, -0.019710540771484375, -0.01628589630126953, -0.012861251831054688, -0.009436607360839844, -0.006011962890625, -0.0025873184204101562, 0.0008373260498046875, 0.004261970520019531, 0.007686614990234375, 0.011111259460449219, 0.014535903930664062, 0.017960548400878906, 0.02138519287109375, 0.024809837341308594, 0.028234481811523438, 0.03165912628173828, 0.035083770751953125, 0.03850841522216797, 0.04193305969238281, 0.045357704162597656, 0.0487823486328125, 0.052206993103027344, 0.05563163757324219, 0.05905628204345703, 0.062480926513671875, 0.06590557098388672, 0.06933021545410156, 0.0727548599243164, 0.07617950439453125, 0.0796041488647461, 0.08302879333496094, 0.08645343780517578, 0.08987808227539062, 0.09330272674560547, 0.09672737121582031, 0.10015201568603516, 0.10357666015625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 5.0, 6.0, 16.0, 17.0, 23.0, 38.0, 65.0, 115.0, 194.0, 350.0, 841.0, 2121.0, 6168.0, 22295.0, 107091.0, 609580.0, 241506.0, 41977.0, 10547.0, 3248.0, 1181.0, 529.0, 294.0, 119.0, 87.0, 57.0, 28.0, 16.0, 21.0, 8.0, 5.0, 5.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.090576171875, -0.0884556770324707, -0.0863351821899414, -0.08421468734741211, -0.08209419250488281, -0.07997369766235352, -0.07785320281982422, -0.07573270797729492, -0.07361221313476562, -0.07149171829223633, -0.06937122344970703, -0.06725072860717773, -0.06513023376464844, -0.06300973892211914, -0.060889244079589844, -0.05876874923706055, -0.05664825439453125, -0.05452775955200195, -0.052407264709472656, -0.05028676986694336, -0.04816627502441406, -0.046045780181884766, -0.04392528533935547, -0.04180479049682617, -0.039684295654296875, -0.03756380081176758, -0.03544330596923828, -0.033322811126708984, -0.031202316284179688, -0.02908182144165039, -0.026961326599121094, -0.024840831756591797, -0.0227203369140625, -0.020599842071533203, -0.018479347229003906, -0.01635885238647461, -0.014238357543945312, -0.012117862701416016, -0.009997367858886719, -0.007876873016357422, -0.005756378173828125, -0.003635883331298828, -0.0015153884887695312, 0.0006051063537597656, 0.0027256011962890625, 0.004846096038818359, 0.006966590881347656, 0.009087085723876953, 0.01120758056640625, 0.013328075408935547, 0.015448570251464844, 0.01756906509399414, 0.019689559936523438, 0.021810054779052734, 0.02393054962158203, 0.026051044464111328, 0.028171539306640625, 0.030292034149169922, 0.03241252899169922, 0.034533023834228516, 0.03665351867675781, 0.03877401351928711, 0.040894508361816406, 0.0430150032043457, 0.045135498046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 5.0, 7.0, 7.0, 16.0, 10.0, 50.0, 74.0, 163.0, 270.0, 200.0, 90.0, 45.0, 20.0, 11.0, 4.0, 10.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18235969543457e-05, -6.849970668554306e-05, -6.517581641674042e-05, -6.185192614793777e-05, -5.852803587913513e-05, -5.520414561033249e-05, -5.1880255341529846e-05, -4.85563650727272e-05, -4.523247480392456e-05, -4.190858453512192e-05, -3.8584694266319275e-05, -3.526080399751663e-05, -3.193691372871399e-05, -2.8613023459911346e-05, -2.5289133191108704e-05, -2.196524292230606e-05, -1.8641352653503418e-05, -1.5317462384700775e-05, -1.1993572115898132e-05, -8.66968184709549e-06, -5.345791578292847e-06, -2.021901309490204e-06, 1.301988959312439e-06, 4.625879228115082e-06, 7.949769496917725e-06, 1.1273659765720367e-05, 1.459755003452301e-05, 1.7921440303325653e-05, 2.1245330572128296e-05, 2.456922084093094e-05, 2.789311110973358e-05, 3.1217001378536224e-05, 3.454089164733887e-05, 3.786478191614151e-05, 4.118867218494415e-05, 4.4512562453746796e-05, 4.783645272254944e-05, 5.116034299135208e-05, 5.4484233260154724e-05, 5.780812352895737e-05, 6.113201379776001e-05, 6.445590406656265e-05, 6.77797943353653e-05, 7.110368460416794e-05, 7.442757487297058e-05, 7.775146514177322e-05, 8.107535541057587e-05, 8.439924567937851e-05, 8.772313594818115e-05, 9.10470262169838e-05, 9.437091648578644e-05, 9.769480675458908e-05, 0.00010101869702339172, 0.00010434258729219437, 0.00010766647756099701, 0.00011099036782979965, 0.0001143142580986023, 0.00011763814836740494, 0.00012096203863620758, 0.00012428592890501022, 0.00012760981917381287, 0.0001309337094426155, 0.00013425759971141815, 0.0001375814899802208, 0.00014090538024902344]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 3.0, 8.0, 19.0, 32.0, 41.0, 80.0, 158.0, 322.0, 739.0, 1767.0, 4762.0, 16510.0, 88362.0, 622328.0, 263127.0, 36712.0, 8731.0, 2757.0, 1105.0, 485.0, 219.0, 134.0, 73.0, 31.0, 17.0, 14.0, 9.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083251953125, -0.08110380172729492, -0.07895565032958984, -0.07680749893188477, -0.07465934753417969, -0.07251119613647461, -0.07036304473876953, -0.06821489334106445, -0.06606674194335938, -0.0639185905456543, -0.06177043914794922, -0.05962228775024414, -0.05747413635253906, -0.055325984954833984, -0.053177833557128906, -0.05102968215942383, -0.04888153076171875, -0.04673337936401367, -0.044585227966308594, -0.042437076568603516, -0.04028892517089844, -0.03814077377319336, -0.03599262237548828, -0.0338444709777832, -0.031696319580078125, -0.029548168182373047, -0.02740001678466797, -0.02525186538696289, -0.023103713989257812, -0.020955562591552734, -0.018807411193847656, -0.016659259796142578, -0.0145111083984375, -0.012362957000732422, -0.010214805603027344, -0.008066654205322266, -0.0059185028076171875, -0.0037703514099121094, -0.0016222000122070312, 0.0005259513854980469, 0.002674102783203125, 0.004822254180908203, 0.006970405578613281, 0.00911855697631836, 0.011266708374023438, 0.013414859771728516, 0.015563011169433594, 0.017711162567138672, 0.01985931396484375, 0.022007465362548828, 0.024155616760253906, 0.026303768157958984, 0.028451919555664062, 0.03060007095336914, 0.03274822235107422, 0.0348963737487793, 0.037044525146484375, 0.03919267654418945, 0.04134082794189453, 0.04348897933959961, 0.04563713073730469, 0.047785282135009766, 0.049933433532714844, 0.05208158493041992, 0.054229736328125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 3.0, 5.0, 7.0, 4.0, 10.0, 5.0, 17.0, 25.0, 39.0, 33.0, 53.0, 71.0, 96.0, 83.0, 79.0, 90.0, 68.0, 63.0, 65.0, 34.0, 43.0, 31.0, 22.0, 12.0, 9.0, 6.0, 8.0, 5.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0491943359375, -0.04763984680175781, -0.046085357666015625, -0.04453086853027344, -0.04297637939453125, -0.04142189025878906, -0.039867401123046875, -0.03831291198730469, -0.0367584228515625, -0.03520393371582031, -0.033649444580078125, -0.03209495544433594, -0.03054046630859375, -0.028985977172851562, -0.027431488037109375, -0.025876998901367188, -0.024322509765625, -0.022768020629882812, -0.021213531494140625, -0.019659042358398438, -0.01810455322265625, -0.016550064086914062, -0.014995574951171875, -0.013441085815429688, -0.0118865966796875, -0.010332107543945312, -0.008777618408203125, -0.0072231292724609375, -0.00566864013671875, -0.0041141510009765625, -0.002559661865234375, -0.0010051727294921875, 0.00054931640625, 0.0021038055419921875, 0.003658294677734375, 0.0052127838134765625, 0.00676727294921875, 0.008321762084960938, 0.009876251220703125, 0.011430740356445312, 0.0129852294921875, 0.014539718627929688, 0.016094207763671875, 0.017648696899414062, 0.01920318603515625, 0.020757675170898438, 0.022312164306640625, 0.023866653442382812, 0.025421142578125, 0.026975631713867188, 0.028530120849609375, 0.030084609985351562, 0.03163909912109375, 0.03319358825683594, 0.034748077392578125, 0.03630256652832031, 0.0378570556640625, 0.03941154479980469, 0.040966033935546875, 0.04252052307128906, 0.04407501220703125, 0.04562950134277344, 0.047183990478515625, 0.04873847961425781, 0.05029296875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 9.0, 30.0, 87.0, 244.0, 390.0, 152.0, 63.0, 23.0, 8.0, 4.0, 0.0, 0.0, 3.0], "bins": [-4.071187973022461, -3.997525691986084, -3.923863410949707, -3.850201368331909, -3.7765390872955322, -3.7028768062591553, -3.6292145252227783, -3.5555522441864014, -3.4818902015686035, -3.4082279205322266, -3.3345656394958496, -3.2609035968780518, -3.187241315841675, -3.113579034805298, -3.039916753768921, -2.966254472732544, -2.892592191696167, -2.81892991065979, -2.745267629623413, -2.6716055870056152, -2.5979433059692383, -2.5242810249328613, -2.4506187438964844, -2.3769564628601074, -2.3032941818237305, -2.2296319007873535, -2.1559696197509766, -2.0823075771331787, -2.0086452960968018, -1.9349830150604248, -1.8613207340240479, -1.787658452987671, -1.713996171951294, -1.640333890914917, -1.5666717290878296, -1.4930094480514526, -1.4193472862243652, -1.3456850051879883, -1.2720227241516113, -1.1983604431152344, -1.1246984004974365, -1.0510361194610596, -0.9773739576339722, -0.9037116765975952, -0.830049455165863, -0.7563872337341309, -0.6827249526977539, -0.6090627312660217, -0.5354004502296448, -0.4617382287979126, -0.38807597756385803, -0.31441372632980347, -0.2407515048980713, -0.1670892834663391, -0.09342703223228455, -0.01976478099822998, 0.0538974404335022, 0.12755967676639557, 0.20122191309928894, 0.2748841643333435, 0.3485463857650757, 0.42220860719680786, 0.4958708584308624, 0.569533109664917, 0.6431953310966492]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 6.0, 4.0, 8.0, 12.0, 14.0, 10.0, 17.0, 18.0, 18.0, 28.0, 21.0, 26.0, 32.0, 30.0, 26.0, 32.0, 33.0, 43.0, 46.0, 59.0, 45.0, 37.0, 51.0, 37.0, 34.0, 51.0, 43.0, 33.0, 29.0, 18.0, 22.0, 18.0, 16.0, 18.0, 12.0, 9.0, 9.0, 8.0, 8.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.5050162076950073, -0.487313836812973, -0.46961143612861633, -0.45190906524658203, -0.43420666456222534, -0.41650429368019104, -0.39880192279815674, -0.38109952211380005, -0.36339715123176575, -0.34569478034973145, -0.32799237966537476, -0.31029000878334045, -0.29258763790130615, -0.27488523721694946, -0.25718286633491516, -0.23948048055171967, -0.22177809476852417, -0.20407570898532867, -0.18637332320213318, -0.16867095232009888, -0.15096856653690338, -0.13326618075370789, -0.11556380242109299, -0.09786142408847809, -0.08015903830528259, -0.062456656247377396, -0.0447542741894722, -0.027051892131567, -0.009349510073661804, 0.008352875709533691, 0.02605525404214859, 0.04375763237476349, 0.06146007776260376, 0.07916246354579926, 0.09686484187841415, 0.11456722021102905, 0.13226960599422455, 0.14997199177742004, 0.16767436265945435, 0.18537674844264984, 0.20307913422584534, 0.22078152000904083, 0.23848390579223633, 0.25618627667427063, 0.27388864755630493, 0.2915910482406616, 0.3092934191226959, 0.3269957900047302, 0.3446981906890869, 0.3624005615711212, 0.3801029622554779, 0.3978053331375122, 0.4155077338218689, 0.4332101047039032, 0.4509124755859375, 0.4686148762702942, 0.4863172471523285, 0.5040196180343628, 0.5217220187187195, 0.5394244194030762, 0.5571267604827881, 0.5748291611671448, 0.5925315618515015, 0.6102339029312134, 0.6279363036155701]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 2.0, 6.0, 7.0, 5.0, 7.0, 15.0, 13.0, 21.0, 32.0, 34.0, 86.0, 153.0, 276.0, 605.0, 1746.0, 7285.0, 447195.0, 3725286.0, 8180.0, 1897.0, 670.0, 318.0, 164.0, 85.0, 63.0, 32.0, 31.0, 19.0, 14.0, 11.0, 6.0, 5.0, 5.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.47900390625, -0.4670372009277344, -0.45507049560546875, -0.4431037902832031, -0.4311370849609375, -0.4191703796386719, -0.40720367431640625, -0.3952369689941406, -0.383270263671875, -0.3713035583496094, -0.35933685302734375, -0.3473701477050781, -0.3354034423828125, -0.3234367370605469, -0.31147003173828125, -0.2995033264160156, -0.28753662109375, -0.2755699157714844, -0.26360321044921875, -0.2516365051269531, -0.2396697998046875, -0.22770309448242188, -0.21573638916015625, -0.20376968383789062, -0.191802978515625, -0.17983627319335938, -0.16786956787109375, -0.15590286254882812, -0.1439361572265625, -0.13196945190429688, -0.12000274658203125, -0.10803604125976562, -0.0960693359375, -0.08410263061523438, -0.07213592529296875, -0.060169219970703125, -0.0482025146484375, -0.036235809326171875, -0.02426910400390625, -0.012302398681640625, -0.000335693359375, 0.011631011962890625, 0.02359771728515625, 0.035564422607421875, 0.0475311279296875, 0.059497833251953125, 0.07146453857421875, 0.08343124389648438, 0.09539794921875, 0.10736465454101562, 0.11933135986328125, 0.13129806518554688, 0.1432647705078125, 0.15523147583007812, 0.16719818115234375, 0.17916488647460938, 0.191131591796875, 0.20309829711914062, 0.21506500244140625, 0.22703170776367188, 0.2389984130859375, 0.2509651184082031, 0.26293182373046875, 0.2748985290527344, 0.286865234375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 10.0, 16.0, 33.0, 62.0, 92.0, 112.0, 128.0, 135.0, 152.0, 97.0, 70.0, 40.0, 17.0, 11.0, 10.0, 1.0, 4.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09674072265625, -0.09427833557128906, -0.09181594848632812, -0.08935356140136719, -0.08689117431640625, -0.08442878723144531, -0.08196640014648438, -0.07950401306152344, -0.0770416259765625, -0.07457923889160156, -0.07211685180664062, -0.06965446472167969, -0.06719207763671875, -0.06472969055175781, -0.062267303466796875, -0.05980491638183594, -0.057342529296875, -0.05488014221191406, -0.052417755126953125, -0.04995536804199219, -0.04749298095703125, -0.04503059387207031, -0.042568206787109375, -0.04010581970214844, -0.0376434326171875, -0.03518104553222656, -0.032718658447265625, -0.030256271362304688, -0.02779388427734375, -0.025331497192382812, -0.022869110107421875, -0.020406723022460938, -0.0179443359375, -0.015481948852539062, -0.013019561767578125, -0.010557174682617188, -0.00809478759765625, -0.0056324005126953125, -0.003170013427734375, -0.0007076263427734375, 0.0017547607421875, 0.0042171478271484375, 0.006679534912109375, 0.009141921997070312, 0.01160430908203125, 0.014066696166992188, 0.016529083251953125, 0.018991470336914062, 0.021453857421875, 0.023916244506835938, 0.026378631591796875, 0.028841018676757812, 0.03130340576171875, 0.03376579284667969, 0.036228179931640625, 0.03869056701660156, 0.0411529541015625, 0.04361534118652344, 0.046077728271484375, 0.04854011535644531, 0.05100250244140625, 0.05346488952636719, 0.055927276611328125, 0.05838966369628906, 0.06085205078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 9.0, 6.0, 12.0, 10.0, 24.0, 43.0, 51.0, 86.0, 181.0, 339.0, 564.0, 1320.0, 2867.0, 7462.0, 24597.0, 173783.0, 3896289.0, 63140.0, 14534.0, 4827.0, 2004.0, 932.0, 517.0, 276.0, 164.0, 88.0, 62.0, 24.0, 23.0, 20.0, 10.0, 7.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177734375, -0.1723957061767578, -0.16705703735351562, -0.16171836853027344, -0.15637969970703125, -0.15104103088378906, -0.14570236206054688, -0.1403636932373047, -0.1350250244140625, -0.1296863555908203, -0.12434768676757812, -0.11900901794433594, -0.11367034912109375, -0.10833168029785156, -0.10299301147460938, -0.09765434265136719, -0.092315673828125, -0.08697700500488281, -0.08163833618164062, -0.07629966735839844, -0.07096099853515625, -0.06562232971191406, -0.060283660888671875, -0.05494499206542969, -0.0496063232421875, -0.04426765441894531, -0.038928985595703125, -0.03359031677246094, -0.02825164794921875, -0.022912979125976562, -0.017574310302734375, -0.012235641479492188, -0.00689697265625, -0.0015583038330078125, 0.003780364990234375, 0.009119033813476562, 0.01445770263671875, 0.019796371459960938, 0.025135040283203125, 0.030473709106445312, 0.0358123779296875, 0.04115104675292969, 0.046489715576171875, 0.05182838439941406, 0.05716705322265625, 0.06250572204589844, 0.06784439086914062, 0.07318305969238281, 0.078521728515625, 0.08386039733886719, 0.08919906616210938, 0.09453773498535156, 0.09987640380859375, 0.10521507263183594, 0.11055374145507812, 0.11589241027832031, 0.1212310791015625, 0.1265697479248047, 0.13190841674804688, 0.13724708557128906, 0.14258575439453125, 0.14792442321777344, 0.15326309204101562, 0.1586017608642578, 0.1639404296875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 12.0, 11.0, 7.0, 20.0, 20.0, 47.0, 81.0, 198.0, 2871.0, 516.0, 106.0, 59.0, 32.0, 28.0, 12.0, 18.0, 8.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0606689453125, -0.05821514129638672, -0.05576133728027344, -0.053307533264160156, -0.050853729248046875, -0.048399925231933594, -0.04594612121582031, -0.04349231719970703, -0.04103851318359375, -0.03858470916748047, -0.03613090515136719, -0.033677101135253906, -0.031223297119140625, -0.028769493103027344, -0.026315689086914062, -0.02386188507080078, -0.0214080810546875, -0.01895427703857422, -0.016500473022460938, -0.014046669006347656, -0.011592864990234375, -0.009139060974121094, -0.0066852569580078125, -0.004231452941894531, -0.00177764892578125, 0.0006761550903320312, 0.0031299591064453125, 0.005583763122558594, 0.008037567138671875, 0.010491371154785156, 0.012945175170898438, 0.015398979187011719, 0.017852783203125, 0.02030658721923828, 0.022760391235351562, 0.025214195251464844, 0.027667999267578125, 0.030121803283691406, 0.03257560729980469, 0.03502941131591797, 0.03748321533203125, 0.03993701934814453, 0.04239082336425781, 0.044844627380371094, 0.047298431396484375, 0.049752235412597656, 0.05220603942871094, 0.05465984344482422, 0.0571136474609375, 0.05956745147705078, 0.06202125549316406, 0.06447505950927734, 0.06692886352539062, 0.0693826675415039, 0.07183647155761719, 0.07429027557373047, 0.07674407958984375, 0.07919788360595703, 0.08165168762207031, 0.0841054916381836, 0.08655929565429688, 0.08901309967041016, 0.09146690368652344, 0.09392070770263672, 0.09637451171875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 46.0, 298.0, 506.0, 112.0, 28.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38780465722084045, -0.353226900100708, -0.31864914298057556, -0.2840713858604431, -0.24949364364147186, -0.21491588652133942, -0.18033814430236816, -0.14576038718223572, -0.11118263006210327, -0.07660487294197083, -0.042027123272418976, -0.0074493736028671265, 0.02712838351726532, 0.061706140637397766, 0.09628388285636902, 0.13086163997650146, 0.1654393970966339, 0.20001715421676636, 0.2345949113368988, 0.26917266845703125, 0.3037503957748413, 0.33832818269729614, 0.3729059100151062, 0.40748366713523865, 0.4420614242553711, 0.47663918137550354, 0.511216938495636, 0.545794665813446, 0.5803724527359009, 0.6149501800537109, 0.649527907371521, 0.6841056942939758, 0.7186833620071411, 0.7532610893249512, 0.787838876247406, 0.8224166035652161, 0.8569943904876709, 0.891572117805481, 0.926149845123291, 0.9607276320457458, 0.9953054189682007, 1.0298831462860107, 1.0644608736038208, 1.0990387201309204, 1.1336164474487305, 1.1681941747665405, 1.2027719020843506, 1.2373497486114502, 1.2719273567199707, 1.3065050840377808, 1.3410828113555908, 1.3756606578826904, 1.4102383852005005, 1.4448161125183105, 1.4793938398361206, 1.5139715671539307, 1.5485494136810303, 1.5831271409988403, 1.6177048683166504, 1.65228271484375, 1.68686044216156, 1.7214381694793701, 1.7560158967971802, 1.7905936241149902, 1.8251714706420898]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 11.0, 7.0, 10.0, 12.0, 22.0, 28.0, 24.0, 41.0, 55.0, 61.0, 67.0, 75.0, 64.0, 67.0, 59.0, 89.0, 62.0, 55.0, 54.0, 28.0, 29.0, 21.0, 18.0, 13.0, 12.0, 6.0, 6.0, 4.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2892959713935852, -0.28160953521728516, -0.2739230990409851, -0.26623666286468506, -0.258550226688385, -0.25086379051208496, -0.2431773692369461, -0.23549093306064606, -0.2278045117855072, -0.22011807560920715, -0.2124316394329071, -0.20474520325660706, -0.1970587819814682, -0.18937234580516815, -0.1816859096288681, -0.17399947345256805, -0.166313037276268, -0.15862660109996796, -0.1509401649236679, -0.14325374364852905, -0.135567307472229, -0.12788087129592896, -0.1201944351196289, -0.11250799894332886, -0.1048215702176094, -0.09713513404130936, -0.0894487053155899, -0.08176226913928986, -0.07407583296298981, -0.06638940423727036, -0.058702968060970306, -0.051016535609960556, -0.043330103158950806, -0.035643670707941055, -0.027957236394286156, -0.020270802080631256, -0.012584369629621506, -0.004897937178611755, 0.0027884989976882935, 0.010474931448698044, 0.018161363899707794, 0.025847796350717545, 0.033534228801727295, 0.041220664978027344, 0.048907097429037094, 0.056593529880046844, 0.0642799660563469, 0.07196639478206635, 0.0796528309583664, 0.08733926713466644, 0.0950256958603859, 0.10271213203668594, 0.1103985607624054, 0.11808499693870544, 0.1257714331150055, 0.13345786929130554, 0.1411443054676056, 0.14883074164390564, 0.1565171778202057, 0.16420361399650574, 0.1718900352716446, 0.17957647144794464, 0.1872629076242447, 0.19494934380054474, 0.2026357650756836]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 5.0, 10.0, 8.0, 19.0, 28.0, 27.0, 39.0, 67.0, 86.0, 154.0, 172.0, 236.0, 452.0, 716.0, 1313.0, 2817.0, 8714.0, 47696.0, 555483.0, 382442.0, 35313.0, 7322.0, 2519.0, 1118.0, 620.0, 340.0, 241.0, 165.0, 117.0, 84.0, 63.0, 36.0, 35.0, 15.0, 20.0, 21.0, 8.0, 9.0, 9.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.328125, -0.3187294006347656, -0.30933380126953125, -0.2999382019042969, -0.2905426025390625, -0.2811470031738281, -0.27175140380859375, -0.2623558044433594, -0.252960205078125, -0.24356460571289062, -0.23416900634765625, -0.22477340698242188, -0.2153778076171875, -0.20598220825195312, -0.19658660888671875, -0.18719100952148438, -0.17779541015625, -0.16839981079101562, -0.15900421142578125, -0.14960861206054688, -0.1402130126953125, -0.13081741333007812, -0.12142181396484375, -0.11202621459960938, -0.102630615234375, -0.09323501586914062, -0.08383941650390625, -0.07444381713867188, -0.0650482177734375, -0.055652618408203125, -0.04625701904296875, -0.036861419677734375, -0.0274658203125, -0.018070220947265625, -0.00867462158203125, 0.000720977783203125, 0.0101165771484375, 0.019512176513671875, 0.02890777587890625, 0.038303375244140625, 0.047698974609375, 0.057094573974609375, 0.06649017333984375, 0.07588577270507812, 0.0852813720703125, 0.09467697143554688, 0.10407257080078125, 0.11346817016601562, 0.12286376953125, 0.13225936889648438, 0.14165496826171875, 0.15105056762695312, 0.1604461669921875, 0.16984176635742188, 0.17923736572265625, 0.18863296508789062, 0.198028564453125, 0.20742416381835938, 0.21681976318359375, 0.22621536254882812, 0.2356109619140625, 0.24500656127929688, 0.25440216064453125, 0.2637977600097656, 0.273193359375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 3.0, 18.0, 30.0, 56.0, 80.0, 114.0, 141.0, 127.0, 151.0, 111.0, 72.0, 45.0, 16.0, 11.0, 8.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09869384765625, -0.09618997573852539, -0.09368610382080078, -0.09118223190307617, -0.08867835998535156, -0.08617448806762695, -0.08367061614990234, -0.08116674423217773, -0.07866287231445312, -0.07615900039672852, -0.0736551284790039, -0.0711512565612793, -0.06864738464355469, -0.06614351272583008, -0.06363964080810547, -0.06113576889038086, -0.05863189697265625, -0.05612802505493164, -0.05362415313720703, -0.05112028121948242, -0.04861640930175781, -0.0461125373840332, -0.043608665466308594, -0.041104793548583984, -0.038600921630859375, -0.036097049713134766, -0.033593177795410156, -0.031089305877685547, -0.028585433959960938, -0.026081562042236328, -0.02357769012451172, -0.02107381820678711, -0.0185699462890625, -0.01606607437133789, -0.013562202453613281, -0.011058330535888672, -0.008554458618164062, -0.006050586700439453, -0.0035467147827148438, -0.0010428428649902344, 0.001461029052734375, 0.003964900970458984, 0.006468772888183594, 0.008972644805908203, 0.011476516723632812, 0.013980388641357422, 0.01648426055908203, 0.01898813247680664, 0.02149200439453125, 0.02399587631225586, 0.02649974822998047, 0.029003620147705078, 0.03150749206542969, 0.0340113639831543, 0.036515235900878906, 0.039019107818603516, 0.041522979736328125, 0.044026851654052734, 0.046530723571777344, 0.04903459548950195, 0.05153846740722656, 0.05404233932495117, 0.05654621124267578, 0.05905008316040039, 0.061553955078125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 9.0, 4.0, 15.0, 19.0, 29.0, 26.0, 44.0, 78.0, 111.0, 213.0, 412.0, 912.0, 2108.0, 5408.0, 16306.0, 55086.0, 213357.0, 516726.0, 171053.0, 45009.0, 13559.0, 4624.0, 1811.0, 743.0, 329.0, 220.0, 128.0, 72.0, 46.0, 28.0, 15.0, 9.0, 10.0, 8.0, 12.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.156982421875, -0.1524219512939453, -0.14786148071289062, -0.14330101013183594, -0.13874053955078125, -0.13418006896972656, -0.12961959838867188, -0.1250591278076172, -0.1204986572265625, -0.11593818664550781, -0.11137771606445312, -0.10681724548339844, -0.10225677490234375, -0.09769630432128906, -0.09313583374023438, -0.08857536315917969, -0.084014892578125, -0.07945442199707031, -0.07489395141601562, -0.07033348083496094, -0.06577301025390625, -0.06121253967285156, -0.056652069091796875, -0.05209159851074219, -0.0475311279296875, -0.04297065734863281, -0.038410186767578125, -0.03384971618652344, -0.02928924560546875, -0.024728775024414062, -0.020168304443359375, -0.015607833862304688, -0.01104736328125, -0.0064868927001953125, -0.001926422119140625, 0.0026340484619140625, 0.00719451904296875, 0.011754989624023438, 0.016315460205078125, 0.020875930786132812, 0.0254364013671875, 0.029996871948242188, 0.034557342529296875, 0.03911781311035156, 0.04367828369140625, 0.04823875427246094, 0.052799224853515625, 0.05735969543457031, 0.061920166015625, 0.06648063659667969, 0.07104110717773438, 0.07560157775878906, 0.08016204833984375, 0.08472251892089844, 0.08928298950195312, 0.09384346008300781, 0.0984039306640625, 0.10296440124511719, 0.10752487182617188, 0.11208534240722656, 0.11664581298828125, 0.12120628356933594, 0.12576675415039062, 0.1303272247314453, 0.1348876953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 12.0, 8.0, 10.0, 9.0, 19.0, 15.0, 18.0, 18.0, 26.0, 26.0, 31.0, 26.0, 38.0, 36.0, 42.0, 37.0, 34.0, 60.0, 39.0, 51.0, 39.0, 48.0, 41.0, 50.0, 38.0, 21.0, 28.0, 36.0, 20.0, 19.0, 18.0, 17.0, 15.0, 9.0, 14.0, 10.0, 4.0, 9.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11663818359375, -0.11319637298583984, -0.10975456237792969, -0.10631275177001953, -0.10287094116210938, -0.09942913055419922, -0.09598731994628906, -0.0925455093383789, -0.08910369873046875, -0.0856618881225586, -0.08222007751464844, -0.07877826690673828, -0.07533645629882812, -0.07189464569091797, -0.06845283508300781, -0.06501102447509766, -0.0615692138671875, -0.058127403259277344, -0.05468559265136719, -0.05124378204345703, -0.047801971435546875, -0.04436016082763672, -0.04091835021972656, -0.037476539611816406, -0.03403472900390625, -0.030592918395996094, -0.027151107788085938, -0.02370929718017578, -0.020267486572265625, -0.01682567596435547, -0.013383865356445312, -0.009942054748535156, -0.006500244140625, -0.0030584335327148438, 0.0003833770751953125, 0.0038251876831054688, 0.007266998291015625, 0.010708808898925781, 0.014150619506835938, 0.017592430114746094, 0.02103424072265625, 0.024476051330566406, 0.027917861938476562, 0.03135967254638672, 0.034801483154296875, 0.03824329376220703, 0.04168510437011719, 0.045126914978027344, 0.0485687255859375, 0.052010536193847656, 0.05545234680175781, 0.05889415740966797, 0.062335968017578125, 0.06577777862548828, 0.06921958923339844, 0.0726613998413086, 0.07610321044921875, 0.0795450210571289, 0.08298683166503906, 0.08642864227294922, 0.08987045288085938, 0.09331226348876953, 0.09675407409667969, 0.10019588470458984, 0.1036376953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 7.0, 7.0, 6.0, 15.0, 19.0, 31.0, 55.0, 61.0, 88.0, 160.0, 223.0, 350.0, 597.0, 980.0, 1845.0, 4096.0, 10553.0, 39355.0, 254097.0, 627708.0, 78359.0, 18206.0, 6014.0, 2543.0, 1236.0, 716.0, 435.0, 279.0, 156.0, 121.0, 87.0, 49.0, 40.0, 23.0, 17.0, 9.0, 7.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.064208984375, -0.06221580505371094, -0.060222625732421875, -0.05822944641113281, -0.05623626708984375, -0.05424308776855469, -0.052249908447265625, -0.05025672912597656, -0.0482635498046875, -0.04627037048339844, -0.044277191162109375, -0.04228401184082031, -0.04029083251953125, -0.03829765319824219, -0.036304473876953125, -0.03431129455566406, -0.032318115234375, -0.030324935913085938, -0.028331756591796875, -0.026338577270507812, -0.02434539794921875, -0.022352218627929688, -0.020359039306640625, -0.018365859985351562, -0.0163726806640625, -0.014379501342773438, -0.012386322021484375, -0.010393142700195312, -0.00839996337890625, -0.0064067840576171875, -0.004413604736328125, -0.0024204254150390625, -0.00042724609375, 0.0015659332275390625, 0.003559112548828125, 0.0055522918701171875, 0.00754547119140625, 0.009538650512695312, 0.011531829833984375, 0.013525009155273438, 0.0155181884765625, 0.017511367797851562, 0.019504547119140625, 0.021497726440429688, 0.02349090576171875, 0.025484085083007812, 0.027477264404296875, 0.029470443725585938, 0.031463623046875, 0.03345680236816406, 0.035449981689453125, 0.03744316101074219, 0.03943634033203125, 0.04142951965332031, 0.043422698974609375, 0.04541587829589844, 0.0474090576171875, 0.04940223693847656, 0.051395416259765625, 0.05338859558105469, 0.05538177490234375, 0.05737495422363281, 0.059368133544921875, 0.06136131286621094, 0.0633544921875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 4.0, 5.0, 6.0, 13.0, 20.0, 19.0, 35.0, 77.0, 178.0, 309.0, 162.0, 65.0, 29.0, 23.0, 13.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013256072998046875, -0.00012754276394844055, -0.00012252479791641235, -0.00011750683188438416, -0.00011248886585235596, -0.00010747089982032776, -0.00010245293378829956, -9.743496775627136e-05, -9.241700172424316e-05, -8.739903569221497e-05, -8.238106966018677e-05, -7.736310362815857e-05, -7.234513759613037e-05, -6.732717156410217e-05, -6.230920553207397e-05, -5.7291239500045776e-05, -5.227327346801758e-05, -4.725530743598938e-05, -4.223734140396118e-05, -3.7219375371932983e-05, -3.2201409339904785e-05, -2.7183443307876587e-05, -2.216547727584839e-05, -1.714751124382019e-05, -1.2129545211791992e-05, -7.111579179763794e-06, -2.0936131477355957e-06, 2.9243528842926025e-06, 7.9423189163208e-06, 1.2960284948348999e-05, 1.7978250980377197e-05, 2.2996217012405396e-05, 2.8014183044433594e-05, 3.303214907646179e-05, 3.805011510848999e-05, 4.306808114051819e-05, 4.808604717254639e-05, 5.3104013204574585e-05, 5.812197923660278e-05, 6.313994526863098e-05, 6.815791130065918e-05, 7.317587733268738e-05, 7.819384336471558e-05, 8.321180939674377e-05, 8.822977542877197e-05, 9.324774146080017e-05, 9.826570749282837e-05, 0.00010328367352485657, 0.00010830163955688477, 0.00011331960558891296, 0.00011833757162094116, 0.00012335553765296936, 0.00012837350368499756, 0.00013339146971702576, 0.00013840943574905396, 0.00014342740178108215, 0.00014844536781311035, 0.00015346333384513855, 0.00015848129987716675, 0.00016349926590919495, 0.00016851723194122314, 0.00017353519797325134, 0.00017855316400527954, 0.00018357113003730774, 0.00018858909606933594]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 8.0, 5.0, 8.0, 8.0, 13.0, 30.0, 31.0, 73.0, 112.0, 225.0, 416.0, 878.0, 2056.0, 5094.0, 16216.0, 86052.0, 727478.0, 172581.0, 25482.0, 6995.0, 2599.0, 1092.0, 505.0, 238.0, 156.0, 69.0, 43.0, 31.0, 17.0, 17.0, 10.0, 4.0, 7.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0887451171875, -0.08625602722167969, -0.08376693725585938, -0.08127784729003906, -0.07878875732421875, -0.07629966735839844, -0.07381057739257812, -0.07132148742675781, -0.0688323974609375, -0.06634330749511719, -0.06385421752929688, -0.06136512756347656, -0.05887603759765625, -0.05638694763183594, -0.053897857666015625, -0.05140876770019531, -0.048919677734375, -0.04643058776855469, -0.043941497802734375, -0.04145240783691406, -0.03896331787109375, -0.03647422790527344, -0.033985137939453125, -0.03149604797363281, -0.0290069580078125, -0.026517868041992188, -0.024028778076171875, -0.021539688110351562, -0.01905059814453125, -0.016561508178710938, -0.014072418212890625, -0.011583328247070312, -0.00909423828125, -0.0066051483154296875, -0.004116058349609375, -0.0016269683837890625, 0.00086212158203125, 0.0033512115478515625, 0.005840301513671875, 0.008329391479492188, 0.0108184814453125, 0.013307571411132812, 0.015796661376953125, 0.018285751342773438, 0.02077484130859375, 0.023263931274414062, 0.025753021240234375, 0.028242111206054688, 0.030731201171875, 0.03322029113769531, 0.035709381103515625, 0.03819847106933594, 0.04068756103515625, 0.04317665100097656, 0.045665740966796875, 0.04815483093261719, 0.0506439208984375, 0.05313301086425781, 0.055622100830078125, 0.05811119079589844, 0.06060028076171875, 0.06308937072753906, 0.06557846069335938, 0.06806755065917969, 0.070556640625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 11.0, 11.0, 6.0, 19.0, 29.0, 42.0, 41.0, 57.0, 59.0, 83.0, 110.0, 97.0, 85.0, 75.0, 54.0, 44.0, 27.0, 36.0, 24.0, 16.0, 17.0, 3.0, 7.0, 5.0, 10.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.060638427734375, -0.05891895294189453, -0.05719947814941406, -0.055480003356933594, -0.053760528564453125, -0.052041053771972656, -0.05032157897949219, -0.04860210418701172, -0.04688262939453125, -0.04516315460205078, -0.04344367980957031, -0.041724205017089844, -0.040004730224609375, -0.038285255432128906, -0.03656578063964844, -0.03484630584716797, -0.0331268310546875, -0.03140735626220703, -0.029687881469726562, -0.027968406677246094, -0.026248931884765625, -0.024529457092285156, -0.022809982299804688, -0.02109050750732422, -0.01937103271484375, -0.01765155792236328, -0.015932083129882812, -0.014212608337402344, -0.012493133544921875, -0.010773658752441406, -0.009054183959960938, -0.007334709167480469, -0.005615234375, -0.0038957595825195312, -0.0021762847900390625, -0.00045680999755859375, 0.001262664794921875, 0.0029821395874023438, 0.0047016143798828125, 0.006421089172363281, 0.00814056396484375, 0.009860038757324219, 0.011579513549804688, 0.013298988342285156, 0.015018463134765625, 0.016737937927246094, 0.018457412719726562, 0.02017688751220703, 0.0218963623046875, 0.02361583709716797, 0.025335311889648438, 0.027054786682128906, 0.028774261474609375, 0.030493736267089844, 0.03221321105957031, 0.03393268585205078, 0.03565216064453125, 0.03737163543701172, 0.03909111022949219, 0.040810585021972656, 0.042530059814453125, 0.044249534606933594, 0.04596900939941406, 0.04768848419189453, 0.049407958984375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 11.0, 35.0, 46.0, 120.0, 241.0, 280.0, 143.0, 63.0, 27.0, 15.0, 5.0, 9.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9402272701263428, -1.8894137144088745, -1.8386001586914062, -1.787786602973938, -1.7369730472564697, -1.6861594915390015, -1.6353459358215332, -1.584532380104065, -1.5337188243865967, -1.4829052686691284, -1.4320917129516602, -1.381278157234192, -1.3304646015167236, -1.2796510457992554, -1.228837490081787, -1.1780239343643188, -1.1272103786468506, -1.0763968229293823, -1.025583267211914, -0.9747697114944458, -0.9239561557769775, -0.8731426000595093, -0.822329044342041, -0.7715154886245728, -0.720702052116394, -0.6698884963989258, -0.6190749406814575, -0.5682613849639893, -0.517447829246521, -0.4666343033313751, -0.41582074761390686, -0.3650071918964386, -0.31419360637664795, -0.2633800506591797, -0.21256649494171143, -0.16175295412540436, -0.1109393984079361, -0.06012585759162903, -0.009312301874160767, 0.041501253843307495, 0.09231480956077576, 0.14312836527824402, 0.19394192099571228, 0.24475546181201935, 0.2955690026283264, 0.3463825583457947, 0.39719611406326294, 0.4480096697807312, 0.49882322549819946, 0.5496367812156677, 0.600450336933136, 0.6512638926506042, 0.7020774483680725, 0.752890944480896, 0.8037045001983643, 0.8545180559158325, 0.9053316116333008, 0.956145167350769, 1.0069587230682373, 1.0577722787857056, 1.1085858345031738, 1.159399390220642, 1.2102129459381104, 1.2610265016555786, 1.3118400573730469]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 12.0, 11.0, 11.0, 18.0, 14.0, 17.0, 23.0, 27.0, 17.0, 31.0, 35.0, 35.0, 35.0, 36.0, 51.0, 48.0, 47.0, 44.0, 59.0, 46.0, 42.0, 39.0, 36.0, 37.0, 33.0, 34.0, 26.0, 21.0, 18.0, 17.0, 14.0, 13.0, 11.0, 10.0, 6.0, 5.0, 2.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5247740149497986, -0.5074394941329956, -0.49010494351387024, -0.4727703928947449, -0.4554358720779419, -0.4381013512611389, -0.42076680064201355, -0.4034322500228882, -0.3860977292060852, -0.3687632083892822, -0.35142865777015686, -0.3340941071510315, -0.3167595863342285, -0.29942506551742554, -0.28209051489830017, -0.2647559642791748, -0.24742144346237183, -0.23008690774440765, -0.21275237202644348, -0.1954178363084793, -0.17808330059051514, -0.16074876487255096, -0.1434142291545868, -0.12607969343662262, -0.10874515771865845, -0.09141062200069427, -0.0740760862827301, -0.05674155056476593, -0.03940701484680176, -0.022072479128837585, -0.004737943410873413, 0.01259659230709076, 0.029931187629699707, 0.04726572334766388, 0.06460025906562805, 0.08193479478359222, 0.0992693305015564, 0.11660386621952057, 0.13393840193748474, 0.1512729376554489, 0.16860747337341309, 0.18594200909137726, 0.20327654480934143, 0.2206110805273056, 0.23794561624526978, 0.25528013706207275, 0.2726146876811981, 0.2899492383003235, 0.30728375911712646, 0.32461827993392944, 0.3419528305530548, 0.3592873811721802, 0.37662190198898315, 0.39395642280578613, 0.4112909734249115, 0.42862552404403687, 0.44596004486083984, 0.4632945656776428, 0.4806291162967682, 0.49796366691589355, 0.5152981877326965, 0.5326327085494995, 0.5499672889709473, 0.5673018097877502, 0.5846363306045532]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 7.0, 3.0, 8.0, 13.0, 18.0, 22.0, 24.0, 33.0, 62.0, 89.0, 153.0, 333.0, 872.0, 2919.0, 20325.0, 4136401.0, 27494.0, 3503.0, 1010.0, 444.0, 188.0, 110.0, 81.0, 40.0, 32.0, 24.0, 17.0, 9.0, 11.0, 4.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.302734375, -0.29488182067871094, -0.2870292663574219, -0.2791767120361328, -0.27132415771484375, -0.2634716033935547, -0.2556190490722656, -0.24776649475097656, -0.2399139404296875, -0.23206138610839844, -0.22420883178710938, -0.2163562774658203, -0.20850372314453125, -0.2006511688232422, -0.19279861450195312, -0.18494606018066406, -0.177093505859375, -0.16924095153808594, -0.16138839721679688, -0.1535358428955078, -0.14568328857421875, -0.1378307342529297, -0.12997817993164062, -0.12212562561035156, -0.1142730712890625, -0.10642051696777344, -0.09856796264648438, -0.09071540832519531, -0.08286285400390625, -0.07501029968261719, -0.06715774536132812, -0.05930519104003906, -0.05145263671875, -0.04360008239746094, -0.035747528076171875, -0.027894973754882812, -0.02004241943359375, -0.012189865112304688, -0.004337310791015625, 0.0035152435302734375, 0.0113677978515625, 0.019220352172851562, 0.027072906494140625, 0.03492546081542969, 0.04277801513671875, 0.05063056945800781, 0.058483123779296875, 0.06633567810058594, 0.074188232421875, 0.08204078674316406, 0.08989334106445312, 0.09774589538574219, 0.10559844970703125, 0.11345100402832031, 0.12130355834960938, 0.12915611267089844, 0.1370086669921875, 0.14486122131347656, 0.15271377563476562, 0.1605663299560547, 0.16841888427734375, 0.1762714385986328, 0.18412399291992188, 0.19197654724121094, 0.1998291015625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 9.0, 4.0, 18.0, 36.0, 67.0, 99.0, 126.0, 136.0, 155.0, 126.0, 93.0, 66.0, 25.0, 22.0, 4.0, 5.0, 3.0, 1.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10357666015625, -0.10098886489868164, -0.09840106964111328, -0.09581327438354492, -0.09322547912597656, -0.0906376838684082, -0.08804988861083984, -0.08546209335327148, -0.08287429809570312, -0.08028650283813477, -0.0776987075805664, -0.07511091232299805, -0.07252311706542969, -0.06993532180786133, -0.06734752655029297, -0.06475973129272461, -0.06217193603515625, -0.05958414077758789, -0.05699634552001953, -0.05440855026245117, -0.05182075500488281, -0.04923295974731445, -0.046645164489746094, -0.044057369232177734, -0.041469573974609375, -0.038881778717041016, -0.036293983459472656, -0.0337061882019043, -0.031118392944335938, -0.028530597686767578, -0.02594280242919922, -0.02335500717163086, -0.0207672119140625, -0.01817941665649414, -0.015591621398925781, -0.013003826141357422, -0.010416030883789062, -0.007828235626220703, -0.005240440368652344, -0.0026526451110839844, -6.4849853515625e-05, 0.0025229454040527344, 0.005110740661621094, 0.007698535919189453, 0.010286331176757812, 0.012874126434326172, 0.015461921691894531, 0.01804971694946289, 0.02063751220703125, 0.02322530746459961, 0.02581310272216797, 0.028400897979736328, 0.030988693237304688, 0.03357648849487305, 0.036164283752441406, 0.038752079010009766, 0.041339874267578125, 0.043927669525146484, 0.046515464782714844, 0.0491032600402832, 0.05169105529785156, 0.05427885055541992, 0.05686664581298828, 0.05945444107055664, 0.062042236328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 3.0, 5.0, 5.0, 21.0, 31.0, 40.0, 41.0, 76.0, 146.0, 278.0, 576.0, 1477.0, 6539.0, 119024.0, 4049027.0, 13129.0, 2233.0, 794.0, 353.0, 184.0, 103.0, 57.0, 31.0, 32.0, 27.0, 22.0, 8.0, 8.0, 10.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.40625, -0.3963813781738281, -0.38651275634765625, -0.3766441345214844, -0.3667755126953125, -0.3569068908691406, -0.34703826904296875, -0.3371696472167969, -0.327301025390625, -0.3174324035644531, -0.30756378173828125, -0.2976951599121094, -0.2878265380859375, -0.2779579162597656, -0.26808929443359375, -0.2582206726074219, -0.24835205078125, -0.23848342895507812, -0.22861480712890625, -0.21874618530273438, -0.2088775634765625, -0.19900894165039062, -0.18914031982421875, -0.17927169799804688, -0.169403076171875, -0.15953445434570312, -0.14966583251953125, -0.13979721069335938, -0.1299285888671875, -0.12005996704101562, -0.11019134521484375, -0.10032272338867188, -0.0904541015625, -0.08058547973632812, -0.07071685791015625, -0.060848236083984375, -0.0509796142578125, -0.041110992431640625, -0.03124237060546875, -0.021373748779296875, -0.011505126953125, -0.001636505126953125, 0.00823211669921875, 0.018100738525390625, 0.0279693603515625, 0.037837982177734375, 0.04770660400390625, 0.057575225830078125, 0.06744384765625, 0.07731246948242188, 0.08718109130859375, 0.09704971313476562, 0.1069183349609375, 0.11678695678710938, 0.12665557861328125, 0.13652420043945312, 0.146392822265625, 0.15626144409179688, 0.16613006591796875, 0.17599868774414062, 0.1858673095703125, 0.19573593139648438, 0.20560455322265625, 0.21547317504882812, 0.225341796875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 4.0, 11.0, 20.0, 46.0, 118.0, 3573.0, 220.0, 46.0, 15.0, 7.0, 12.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06951904296875, -0.06578731536865234, -0.06205558776855469, -0.05832386016845703, -0.054592132568359375, -0.05086040496826172, -0.04712867736816406, -0.043396949768066406, -0.03966522216796875, -0.035933494567871094, -0.03220176696777344, -0.02847003936767578, -0.024738311767578125, -0.02100658416748047, -0.017274856567382812, -0.013543128967285156, -0.0098114013671875, -0.006079673767089844, -0.0023479461669921875, 0.0013837814331054688, 0.005115509033203125, 0.008847236633300781, 0.012578964233398438, 0.016310691833496094, 0.02004241943359375, 0.023774147033691406, 0.027505874633789062, 0.03123760223388672, 0.034969329833984375, 0.03870105743408203, 0.04243278503417969, 0.046164512634277344, 0.049896240234375, 0.053627967834472656, 0.05735969543457031, 0.06109142303466797, 0.06482315063476562, 0.06855487823486328, 0.07228660583496094, 0.0760183334350586, 0.07975006103515625, 0.0834817886352539, 0.08721351623535156, 0.09094524383544922, 0.09467697143554688, 0.09840869903564453, 0.10214042663574219, 0.10587215423583984, 0.1096038818359375, 0.11333560943603516, 0.11706733703613281, 0.12079906463623047, 0.12453079223632812, 0.12826251983642578, 0.13199424743652344, 0.1357259750366211, 0.13945770263671875, 0.1431894302368164, 0.14692115783691406, 0.15065288543701172, 0.15438461303710938, 0.15811634063720703, 0.1618480682373047, 0.16557979583740234, 0.1693115234375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 9.0, 11.0, 86.0, 279.0, 421.0, 140.0, 31.0, 14.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3846874237060547, -0.3673533499240875, -0.35001927614212036, -0.3326852023601532, -0.31535112857818604, -0.29801705479621887, -0.2806829810142517, -0.26334890723228455, -0.24601483345031738, -0.22868075966835022, -0.21134668588638306, -0.1940126121044159, -0.17667853832244873, -0.15934446454048157, -0.1420103907585144, -0.12467631697654724, -0.10734224319458008, -0.09000816941261292, -0.07267409563064575, -0.05534002184867859, -0.038005948066711426, -0.020671874284744263, -0.0033378005027770996, 0.013996273279190063, 0.03133034706115723, 0.04866442084312439, 0.06599849462509155, 0.08333256840705872, 0.10066664218902588, 0.11800071597099304, 0.1353347897529602, 0.15266886353492737, 0.1700029969215393, 0.18733707070350647, 0.20467114448547363, 0.2220052182674408, 0.23933929204940796, 0.2566733658313751, 0.2740074396133423, 0.29134151339530945, 0.3086755871772766, 0.3260096609592438, 0.34334373474121094, 0.3606778085231781, 0.37801188230514526, 0.3953459560871124, 0.4126800298690796, 0.43001410365104675, 0.4473481774330139, 0.4646822512149811, 0.48201632499694824, 0.4993503987789154, 0.5166844725608826, 0.5340185165405273, 0.5513526201248169, 0.5686867237091064, 0.5860207676887512, 0.603354811668396, 0.6206889152526855, 0.6380230188369751, 0.6553570628166199, 0.6726911067962646, 0.6900252103805542, 0.7073593139648438, 0.7246933579444885]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 14.0, 25.0, 35.0, 80.0, 98.0, 158.0, 156.0, 117.0, 123.0, 66.0, 57.0, 40.0, 15.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3285573124885559, -0.31906038522720337, -0.3095634877681732, -0.3000665605068207, -0.2905696630477905, -0.281072735786438, -0.27157580852508545, -0.2620789110660553, -0.25258198380470276, -0.2430850714445114, -0.23358815908432007, -0.22409123182296753, -0.21459431946277618, -0.20509740710258484, -0.1956004947423935, -0.18610358238220215, -0.1766066700220108, -0.16710975766181946, -0.1576128453016281, -0.14811593294143677, -0.13861900568008423, -0.12912209331989288, -0.11962518095970154, -0.1101282611489296, -0.10063134878873825, -0.0911344364285469, -0.08163751661777496, -0.07214060425758362, -0.06264369189739227, -0.05314677208662033, -0.043649859726428986, -0.03415293991565704, -0.024656027555465698, -0.01515911240130663, -0.00566219724714756, 0.0038347169756889343, 0.013331633061170578, 0.02282854914665222, 0.03232546150684357, 0.04182238131761551, 0.051319293677806854, 0.0608162097632885, 0.07031312584877014, 0.07981003820896149, 0.08930695056915283, 0.09880387037992477, 0.10830078274011612, 0.11779770255088806, 0.1272946149110794, 0.13679152727127075, 0.1462884396314621, 0.15578535199165344, 0.16528227925300598, 0.17477919161319733, 0.18427610397338867, 0.1937730312347412, 0.20326992869377136, 0.2127668410539627, 0.22226375341415405, 0.2317606806755066, 0.24125759303569794, 0.2507545053958893, 0.26025140285491943, 0.269748330116272, 0.2792452573776245]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 12.0, 13.0, 8.0, 12.0, 15.0, 22.0, 39.0, 35.0, 56.0, 75.0, 76.0, 100.0, 135.0, 188.0, 251.0, 424.0, 538.0, 845.0, 1574.0, 3148.0, 8878.0, 38014.0, 261664.0, 609553.0, 94857.0, 17367.0, 5025.0, 1982.0, 1171.0, 710.0, 495.0, 324.0, 223.0, 178.0, 124.0, 87.0, 73.0, 68.0, 35.0, 37.0, 26.0, 19.0, 16.0, 20.0, 10.0, 9.0, 4.0, 3.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.193359375, -0.18717193603515625, -0.1809844970703125, -0.17479705810546875, -0.168609619140625, -0.16242218017578125, -0.1562347412109375, -0.15004730224609375, -0.14385986328125, -0.13767242431640625, -0.1314849853515625, -0.12529754638671875, -0.119110107421875, -0.11292266845703125, -0.1067352294921875, -0.10054779052734375, -0.0943603515625, -0.08817291259765625, -0.0819854736328125, -0.07579803466796875, -0.069610595703125, -0.06342315673828125, -0.0572357177734375, -0.05104827880859375, -0.04486083984375, -0.03867340087890625, -0.0324859619140625, -0.02629852294921875, -0.020111083984375, -0.01392364501953125, -0.0077362060546875, -0.00154876708984375, 0.004638671875, 0.01082611083984375, 0.0170135498046875, 0.02320098876953125, 0.029388427734375, 0.03557586669921875, 0.0417633056640625, 0.04795074462890625, 0.05413818359375, 0.06032562255859375, 0.0665130615234375, 0.07270050048828125, 0.078887939453125, 0.08507537841796875, 0.0912628173828125, 0.09745025634765625, 0.1036376953125, 0.10982513427734375, 0.1160125732421875, 0.12220001220703125, 0.128387451171875, 0.13457489013671875, 0.1407623291015625, 0.14694976806640625, 0.15313720703125, 0.15932464599609375, 0.1655120849609375, 0.17169952392578125, 0.177886962890625, 0.18407440185546875, 0.1902618408203125, 0.19644927978515625, 0.20263671875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 6.0, 25.0, 42.0, 86.0, 114.0, 146.0, 160.0, 145.0, 119.0, 75.0, 34.0, 24.0, 4.0, 5.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1129150390625, -0.11012649536132812, -0.10733795166015625, -0.10454940795898438, -0.1017608642578125, -0.09897232055664062, -0.09618377685546875, -0.09339523315429688, -0.090606689453125, -0.08781814575195312, -0.08502960205078125, -0.08224105834960938, -0.0794525146484375, -0.07666397094726562, -0.07387542724609375, -0.07108688354492188, -0.06829833984375, -0.06550979614257812, -0.06272125244140625, -0.059932708740234375, -0.0571441650390625, -0.054355621337890625, -0.05156707763671875, -0.048778533935546875, -0.045989990234375, -0.043201446533203125, -0.04041290283203125, -0.037624359130859375, -0.0348358154296875, -0.032047271728515625, -0.02925872802734375, -0.026470184326171875, -0.023681640625, -0.020893096923828125, -0.01810455322265625, -0.015316009521484375, -0.0125274658203125, -0.009738922119140625, -0.00695037841796875, -0.004161834716796875, -0.001373291015625, 0.001415252685546875, 0.00420379638671875, 0.006992340087890625, 0.0097808837890625, 0.012569427490234375, 0.01535797119140625, 0.018146514892578125, 0.02093505859375, 0.023723602294921875, 0.02651214599609375, 0.029300689697265625, 0.0320892333984375, 0.034877777099609375, 0.03766632080078125, 0.040454864501953125, 0.043243408203125, 0.046031951904296875, 0.04882049560546875, 0.051609039306640625, 0.0543975830078125, 0.057186126708984375, 0.05997467041015625, 0.06276321411132812, 0.0655517578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 4.0, 5.0, 9.0, 15.0, 22.0, 16.0, 21.0, 25.0, 53.0, 94.0, 195.0, 376.0, 766.0, 1598.0, 3544.0, 8470.0, 20617.0, 53286.0, 151649.0, 413138.0, 255118.0, 85171.0, 31490.0, 12877.0, 5438.0, 2443.0, 1012.0, 451.0, 254.0, 125.0, 59.0, 47.0, 36.0, 21.0, 13.0, 17.0, 12.0, 8.0, 13.0, 6.0, 6.0, 5.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 4.0, 4.0], "bins": [-0.10107421875, -0.09807777404785156, -0.09508132934570312, -0.09208488464355469, -0.08908843994140625, -0.08609199523925781, -0.08309555053710938, -0.08009910583496094, -0.0771026611328125, -0.07410621643066406, -0.07110977172851562, -0.06811332702636719, -0.06511688232421875, -0.06212043762207031, -0.059123992919921875, -0.05612754821777344, -0.053131103515625, -0.05013465881347656, -0.047138214111328125, -0.04414176940917969, -0.04114532470703125, -0.03814888000488281, -0.035152435302734375, -0.03215599060058594, -0.0291595458984375, -0.026163101196289062, -0.023166656494140625, -0.020170211791992188, -0.01717376708984375, -0.014177322387695312, -0.011180877685546875, -0.008184432983398438, -0.00518798828125, -0.0021915435791015625, 0.000804901123046875, 0.0038013458251953125, 0.00679779052734375, 0.009794235229492188, 0.012790679931640625, 0.015787124633789062, 0.0187835693359375, 0.021780014038085938, 0.024776458740234375, 0.027772903442382812, 0.03076934814453125, 0.03376579284667969, 0.036762237548828125, 0.03975868225097656, 0.042755126953125, 0.04575157165527344, 0.048748016357421875, 0.05174446105957031, 0.05474090576171875, 0.05773735046386719, 0.060733795166015625, 0.06373023986816406, 0.0667266845703125, 0.06972312927246094, 0.07271957397460938, 0.07571601867675781, 0.07871246337890625, 0.08170890808105469, 0.08470535278320312, 0.08770179748535156, 0.0906982421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 1.0, 6.0, 9.0, 12.0, 15.0, 14.0, 9.0, 13.0, 14.0, 16.0, 13.0, 25.0, 19.0, 21.0, 33.0, 37.0, 31.0, 44.0, 38.0, 41.0, 41.0, 40.0, 31.0, 40.0, 46.0, 34.0, 38.0, 32.0, 30.0, 35.0, 31.0, 21.0, 17.0, 29.0, 13.0, 15.0, 13.0, 11.0, 12.0, 10.0, 14.0, 6.0, 8.0, 8.0, 3.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0809326171875, -0.07821178436279297, -0.07549095153808594, -0.0727701187133789, -0.07004928588867188, -0.06732845306396484, -0.06460762023925781, -0.06188678741455078, -0.05916595458984375, -0.05644512176513672, -0.05372428894042969, -0.051003456115722656, -0.048282623291015625, -0.045561790466308594, -0.04284095764160156, -0.04012012481689453, -0.0373992919921875, -0.03467845916748047, -0.03195762634277344, -0.029236793518066406, -0.026515960693359375, -0.023795127868652344, -0.021074295043945312, -0.01835346221923828, -0.01563262939453125, -0.012911796569824219, -0.010190963745117188, -0.007470130920410156, -0.004749298095703125, -0.0020284652709960938, 0.0006923675537109375, 0.0034132003784179688, 0.006134033203125, 0.008854866027832031, 0.011575698852539062, 0.014296531677246094, 0.017017364501953125, 0.019738197326660156, 0.022459030151367188, 0.02517986297607422, 0.02790069580078125, 0.03062152862548828, 0.03334236145019531, 0.036063194274902344, 0.038784027099609375, 0.041504859924316406, 0.04422569274902344, 0.04694652557373047, 0.0496673583984375, 0.05238819122314453, 0.05510902404785156, 0.057829856872558594, 0.060550689697265625, 0.06327152252197266, 0.06599235534667969, 0.06871318817138672, 0.07143402099609375, 0.07415485382080078, 0.07687568664550781, 0.07959651947021484, 0.08231735229492188, 0.0850381851196289, 0.08775901794433594, 0.09047985076904297, 0.09320068359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 8.0, 6.0, 4.0, 5.0, 15.0, 25.0, 27.0, 55.0, 75.0, 126.0, 245.0, 377.0, 674.0, 1324.0, 2687.0, 6293.0, 16660.0, 63133.0, 517232.0, 364722.0, 50212.0, 14174.0, 5442.0, 2315.0, 1216.0, 608.0, 361.0, 205.0, 103.0, 81.0, 61.0, 20.0, 22.0, 16.0, 10.0, 9.0, 5.0, 3.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0430908203125, -0.04160118103027344, -0.040111541748046875, -0.03862190246582031, -0.03713226318359375, -0.03564262390136719, -0.034152984619140625, -0.03266334533691406, -0.0311737060546875, -0.029684066772460938, -0.028194427490234375, -0.026704788208007812, -0.02521514892578125, -0.023725509643554688, -0.022235870361328125, -0.020746231079101562, -0.019256591796875, -0.017766952514648438, -0.016277313232421875, -0.014787673950195312, -0.01329803466796875, -0.011808395385742188, -0.010318756103515625, -0.008829116821289062, -0.0073394775390625, -0.0058498382568359375, -0.004360198974609375, -0.0028705596923828125, -0.00138092041015625, 0.0001087188720703125, 0.001598358154296875, 0.0030879974365234375, 0.00457763671875, 0.0060672760009765625, 0.007556915283203125, 0.009046554565429688, 0.01053619384765625, 0.012025833129882812, 0.013515472412109375, 0.015005111694335938, 0.0164947509765625, 0.017984390258789062, 0.019474029541015625, 0.020963668823242188, 0.02245330810546875, 0.023942947387695312, 0.025432586669921875, 0.026922225952148438, 0.028411865234375, 0.029901504516601562, 0.031391143798828125, 0.03288078308105469, 0.03437042236328125, 0.03586006164550781, 0.037349700927734375, 0.03883934020996094, 0.0403289794921875, 0.04181861877441406, 0.043308258056640625, 0.04479789733886719, 0.04628753662109375, 0.04777717590332031, 0.049266815185546875, 0.05075645446777344, 0.05224609375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 4.0, 18.0, 18.0, 28.0, 47.0, 83.0, 145.0, 221.0, 185.0, 93.0, 59.0, 28.0, 11.0, 13.0, 10.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022161006927490234, -0.0002161506563425064, -0.00021069124341011047, -0.00020523183047771454, -0.0001997724175453186, -0.00019431300461292267, -0.00018885359168052673, -0.0001833941787481308, -0.00017793476581573486, -0.00017247535288333893, -0.000167015939950943, -0.00016155652701854706, -0.00015609711408615112, -0.0001506377011537552, -0.00014517828822135925, -0.00013971887528896332, -0.00013425946235656738, -0.00012880004942417145, -0.0001233406364917755, -0.00011788122355937958, -0.00011242181062698364, -0.00010696239769458771, -0.00010150298476219177, -9.604357182979584e-05, -9.05841588973999e-05, -8.512474596500397e-05, -7.966533303260803e-05, -7.42059201002121e-05, -6.874650716781616e-05, -6.328709423542023e-05, -5.782768130302429e-05, -5.236826837062836e-05, -4.690885543823242e-05, -4.144944250583649e-05, -3.599002957344055e-05, -3.053061664104462e-05, -2.507120370864868e-05, -1.9611790776252747e-05, -1.4152377843856812e-05, -8.692964911460876e-06, -3.2335519790649414e-06, 2.2258609533309937e-06, 7.685273885726929e-06, 1.3144686818122864e-05, 1.86040997505188e-05, 2.4063512682914734e-05, 2.952292561531067e-05, 3.4982338547706604e-05, 4.044175148010254e-05, 4.5901164412498474e-05, 5.136057734489441e-05, 5.6819990277290344e-05, 6.227940320968628e-05, 6.773881614208221e-05, 7.319822907447815e-05, 7.865764200687408e-05, 8.411705493927002e-05, 8.957646787166595e-05, 9.503588080406189e-05, 0.00010049529373645782, 0.00010595470666885376, 0.0001114141196012497, 0.00011687353253364563, 0.00012233294546604156, 0.0001277923583984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 10.0, 20.0, 32.0, 53.0, 106.0, 142.0, 307.0, 603.0, 1200.0, 3631.0, 13876.0, 107925.0, 810255.0, 92268.0, 12384.0, 3303.0, 1229.0, 575.0, 273.0, 152.0, 83.0, 51.0, 27.0, 16.0, 9.0, 4.0, 5.0, 5.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.078369140625, -0.07595539093017578, -0.07354164123535156, -0.07112789154052734, -0.06871414184570312, -0.0663003921508789, -0.06388664245605469, -0.06147289276123047, -0.05905914306640625, -0.05664539337158203, -0.05423164367675781, -0.051817893981933594, -0.049404144287109375, -0.046990394592285156, -0.04457664489746094, -0.04216289520263672, -0.0397491455078125, -0.03733539581298828, -0.03492164611816406, -0.032507896423339844, -0.030094146728515625, -0.027680397033691406, -0.025266647338867188, -0.02285289764404297, -0.02043914794921875, -0.01802539825439453, -0.015611648559570312, -0.013197898864746094, -0.010784149169921875, -0.008370399475097656, -0.0059566497802734375, -0.0035429000854492188, -0.001129150390625, 0.0012845993041992188, 0.0036983489990234375, 0.006112098693847656, 0.008525848388671875, 0.010939598083496094, 0.013353347778320312, 0.01576709747314453, 0.01818084716796875, 0.02059459686279297, 0.023008346557617188, 0.025422096252441406, 0.027835845947265625, 0.030249595642089844, 0.03266334533691406, 0.03507709503173828, 0.0374908447265625, 0.03990459442138672, 0.04231834411621094, 0.044732093811035156, 0.047145843505859375, 0.049559593200683594, 0.05197334289550781, 0.05438709259033203, 0.05680084228515625, 0.05921459197998047, 0.06162834167480469, 0.0640420913696289, 0.06645584106445312, 0.06886959075927734, 0.07128334045410156, 0.07369709014892578, 0.07611083984375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 7.0, 9.0, 12.0, 11.0, 12.0, 23.0, 51.0, 64.0, 99.0, 132.0, 172.0, 143.0, 77.0, 65.0, 39.0, 33.0, 18.0, 14.0, 11.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0677490234375, -0.06572341918945312, -0.06369781494140625, -0.061672210693359375, -0.0596466064453125, -0.057621002197265625, -0.05559539794921875, -0.053569793701171875, -0.051544189453125, -0.049518585205078125, -0.04749298095703125, -0.045467376708984375, -0.0434417724609375, -0.041416168212890625, -0.03939056396484375, -0.037364959716796875, -0.03533935546875, -0.033313751220703125, -0.03128814697265625, -0.029262542724609375, -0.0272369384765625, -0.025211334228515625, -0.02318572998046875, -0.021160125732421875, -0.019134521484375, -0.017108917236328125, -0.01508331298828125, -0.013057708740234375, -0.0110321044921875, -0.009006500244140625, -0.00698089599609375, -0.004955291748046875, -0.0029296875, -0.000904083251953125, 0.00112152099609375, 0.003147125244140625, 0.0051727294921875, 0.007198333740234375, 0.00922393798828125, 0.011249542236328125, 0.013275146484375, 0.015300750732421875, 0.01732635498046875, 0.019351959228515625, 0.0213775634765625, 0.023403167724609375, 0.02542877197265625, 0.027454376220703125, 0.02947998046875, 0.031505584716796875, 0.03353118896484375, 0.035556793212890625, 0.0375823974609375, 0.039608001708984375, 0.04163360595703125, 0.043659210205078125, 0.045684814453125, 0.047710418701171875, 0.04973602294921875, 0.051761627197265625, 0.0537872314453125, 0.055812835693359375, 0.05783843994140625, 0.059864044189453125, 0.0618896484375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 11.0, 22.0, 38.0, 91.0, 204.0, 293.0, 165.0, 108.0, 33.0, 18.0, 12.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0629701614379883, -1.0213743448257446, -0.979778528213501, -0.9381826519966125, -0.8965868353843689, -0.8549910187721252, -0.8133951425552368, -0.7717993259429932, -0.7302035093307495, -0.6886076927185059, -0.6470118761062622, -0.6054159998893738, -0.5638201832771301, -0.5222243666648865, -0.48062852025032043, -0.4390326738357544, -0.39743685722351074, -0.3558410406112671, -0.31424519419670105, -0.272649347782135, -0.23105353116989136, -0.1894576996564865, -0.14786186814308167, -0.10626602172851562, -0.06467020511627197, -0.023074373602867126, 0.01852145791053772, 0.060117289423942566, 0.10171312093734741, 0.14330895245075226, 0.1849047839641571, 0.22650063037872314, 0.2680964469909668, 0.30969226360321045, 0.3512881100177765, 0.39288395643234253, 0.4344797730445862, 0.47607558965682983, 0.5176714658737183, 0.5592672824859619, 0.6008630990982056, 0.6424589157104492, 0.6840547323226929, 0.7256506085395813, 0.767246425151825, 0.8088422417640686, 0.850438117980957, 0.8920339345932007, 0.9336297512054443, 0.975225567817688, 1.0168213844299316, 1.0584172010421753, 1.100013017654419, 1.1416089534759521, 1.1832047700881958, 1.2248005867004395, 1.266396403312683, 1.3079922199249268, 1.3495880365371704, 1.391183853149414, 1.4327797889709473, 1.474375605583191, 1.5159714221954346, 1.5575672388076782, 1.5991630554199219]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 0.0, 3.0, 12.0, 8.0, 11.0, 9.0, 10.0, 7.0, 10.0, 12.0, 20.0, 20.0, 19.0, 25.0, 33.0, 29.0, 34.0, 30.0, 36.0, 44.0, 36.0, 50.0, 34.0, 33.0, 40.0, 31.0, 33.0, 29.0, 35.0, 24.0, 28.0, 33.0, 35.0, 20.0, 18.0, 25.0, 14.0, 18.0, 10.0, 8.0, 10.0, 11.0, 9.0, 11.0, 8.0, 8.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0], "bins": [-0.3973597288131714, -0.38521525263786316, -0.37307077646255493, -0.3609262704849243, -0.3487817943096161, -0.33663731813430786, -0.32449284195899963, -0.3123483657836914, -0.3002038598060608, -0.28805938363075256, -0.27591490745544434, -0.2637704014778137, -0.2516259253025055, -0.23948144912719727, -0.22733697295188904, -0.2151924967765808, -0.20304802060127258, -0.19090354442596436, -0.17875905334949493, -0.1666145771741867, -0.15447008609771729, -0.14232560992240906, -0.13018113374710083, -0.118036650121212, -0.10589216649532318, -0.09374768286943436, -0.08160319924354553, -0.0694587230682373, -0.05731423944234848, -0.045169755816459656, -0.03302527964115143, -0.020880796015262604, -0.00873631238937378, 0.003408169373869896, 0.015552651137113571, 0.027697131037712097, 0.03984161466360092, 0.051986098289489746, 0.06413057446479797, 0.0762750580906868, 0.08841954171657562, 0.10056402534246445, 0.11270850896835327, 0.1248529851436615, 0.13699746131896973, 0.14914195239543915, 0.16128642857074738, 0.1734309196472168, 0.18557539582252502, 0.19771987199783325, 0.20986436307430267, 0.2220088392496109, 0.23415333032608032, 0.24629780650138855, 0.2584422826766968, 0.270586758852005, 0.28273123502731323, 0.29487571120262146, 0.3070201873779297, 0.3191646933555603, 0.33130916953086853, 0.34345364570617676, 0.355598121881485, 0.3677425980567932, 0.37988710403442383]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 7.0, 5.0, 6.0, 10.0, 10.0, 8.0, 18.0, 14.0, 22.0, 30.0, 32.0, 52.0, 106.0, 157.0, 396.0, 1431.0, 7548.0, 4122418.0, 56029.0, 4085.0, 1044.0, 403.0, 168.0, 121.0, 55.0, 44.0, 23.0, 13.0, 9.0, 6.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.609375, -0.5936851501464844, -0.5779953002929688, -0.5623054504394531, -0.5466156005859375, -0.5309257507324219, -0.5152359008789062, -0.4995460510253906, -0.483856201171875, -0.4681663513183594, -0.45247650146484375, -0.4367866516113281, -0.4210968017578125, -0.4054069519042969, -0.38971710205078125, -0.3740272521972656, -0.35833740234375, -0.3426475524902344, -0.32695770263671875, -0.3112678527832031, -0.2955780029296875, -0.2798881530761719, -0.26419830322265625, -0.24850845336914062, -0.232818603515625, -0.21712875366210938, -0.20143890380859375, -0.18574905395507812, -0.1700592041015625, -0.15436935424804688, -0.13867950439453125, -0.12298965454101562, -0.1072998046875, -0.09160995483398438, -0.07592010498046875, -0.060230255126953125, -0.0445404052734375, -0.028850555419921875, -0.01316070556640625, 0.002529144287109375, 0.018218994140625, 0.033908843994140625, 0.04959869384765625, 0.06528854370117188, 0.0809783935546875, 0.09666824340820312, 0.11235809326171875, 0.12804794311523438, 0.14373779296875, 0.15942764282226562, 0.17511749267578125, 0.19080734252929688, 0.2064971923828125, 0.22218704223632812, 0.23787689208984375, 0.2535667419433594, 0.269256591796875, 0.2849464416503906, 0.30063629150390625, 0.3163261413574219, 0.3320159912109375, 0.3477058410644531, 0.36339569091796875, 0.3790855407714844, 0.394775390625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 10.0, 22.0, 37.0, 63.0, 117.0, 131.0, 178.0, 140.0, 117.0, 101.0, 40.0, 21.0, 9.0, 4.0, 0.0, 3.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11468505859375, -0.11186885833740234, -0.10905265808105469, -0.10623645782470703, -0.10342025756835938, -0.10060405731201172, -0.09778785705566406, -0.0949716567993164, -0.09215545654296875, -0.0893392562866211, -0.08652305603027344, -0.08370685577392578, -0.08089065551757812, -0.07807445526123047, -0.07525825500488281, -0.07244205474853516, -0.0696258544921875, -0.06680965423583984, -0.06399345397949219, -0.06117725372314453, -0.058361053466796875, -0.05554485321044922, -0.05272865295410156, -0.049912452697753906, -0.04709625244140625, -0.044280052185058594, -0.04146385192871094, -0.03864765167236328, -0.035831451416015625, -0.03301525115966797, -0.030199050903320312, -0.027382850646972656, -0.024566650390625, -0.021750450134277344, -0.018934249877929688, -0.01611804962158203, -0.013301849365234375, -0.010485649108886719, -0.0076694488525390625, -0.004853248596191406, -0.00203704833984375, 0.0007791519165039062, 0.0035953521728515625, 0.006411552429199219, 0.009227752685546875, 0.012043952941894531, 0.014860153198242188, 0.017676353454589844, 0.0204925537109375, 0.023308753967285156, 0.026124954223632812, 0.02894115447998047, 0.031757354736328125, 0.03457355499267578, 0.03738975524902344, 0.040205955505371094, 0.04302215576171875, 0.045838356018066406, 0.04865455627441406, 0.05147075653076172, 0.054286956787109375, 0.05710315704345703, 0.05991935729980469, 0.06273555755615234, 0.0655517578125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 13.0, 16.0, 13.0, 15.0, 40.0, 68.0, 103.0, 149.0, 272.0, 499.0, 940.0, 2103.0, 5734.0, 23111.0, 4008737.0, 132143.0, 12976.0, 3962.0, 1612.0, 772.0, 410.0, 208.0, 127.0, 97.0, 51.0, 30.0, 24.0, 22.0, 16.0, 8.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.287353515625, -0.27955055236816406, -0.2717475891113281, -0.2639446258544922, -0.25614166259765625, -0.2483386993408203, -0.24053573608398438, -0.23273277282714844, -0.2249298095703125, -0.21712684631347656, -0.20932388305664062, -0.2015209197998047, -0.19371795654296875, -0.1859149932861328, -0.17811203002929688, -0.17030906677246094, -0.162506103515625, -0.15470314025878906, -0.14690017700195312, -0.1390972137451172, -0.13129425048828125, -0.12349128723144531, -0.11568832397460938, -0.10788536071777344, -0.1000823974609375, -0.09227943420410156, -0.08447647094726562, -0.07667350769042969, -0.06887054443359375, -0.06106758117675781, -0.053264617919921875, -0.04546165466308594, -0.03765869140625, -0.029855728149414062, -0.022052764892578125, -0.014249801635742188, -0.00644683837890625, 0.0013561248779296875, 0.009159088134765625, 0.016962051391601562, 0.0247650146484375, 0.03256797790527344, 0.040370941162109375, 0.04817390441894531, 0.05597686767578125, 0.06377983093261719, 0.07158279418945312, 0.07938575744628906, 0.087188720703125, 0.09499168395996094, 0.10279464721679688, 0.11059761047363281, 0.11840057373046875, 0.1262035369873047, 0.13400650024414062, 0.14180946350097656, 0.1496124267578125, 0.15741539001464844, 0.16521835327148438, 0.1730213165283203, 0.18082427978515625, 0.1886272430419922, 0.19643020629882812, 0.20423316955566406, 0.2120361328125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 2.0, 5.0, 10.0, 11.0, 20.0, 40.0, 138.0, 3649.0, 111.0, 40.0, 21.0, 11.0, 3.0, 4.0, 1.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09356689453125, -0.08988666534423828, -0.08620643615722656, -0.08252620697021484, -0.07884597778320312, -0.0751657485961914, -0.07148551940917969, -0.06780529022216797, -0.06412506103515625, -0.06044483184814453, -0.05676460266113281, -0.053084373474121094, -0.049404144287109375, -0.045723915100097656, -0.04204368591308594, -0.03836345672607422, -0.0346832275390625, -0.03100299835205078, -0.027322769165039062, -0.023642539978027344, -0.019962310791015625, -0.016282081604003906, -0.012601852416992188, -0.008921623229980469, -0.00524139404296875, -0.0015611648559570312, 0.0021190643310546875, 0.005799293518066406, 0.009479522705078125, 0.013159751892089844, 0.016839981079101562, 0.02052021026611328, 0.024200439453125, 0.02788066864013672, 0.03156089782714844, 0.035241127014160156, 0.038921356201171875, 0.042601585388183594, 0.04628181457519531, 0.04996204376220703, 0.05364227294921875, 0.05732250213623047, 0.06100273132324219, 0.0646829605102539, 0.06836318969726562, 0.07204341888427734, 0.07572364807128906, 0.07940387725830078, 0.0830841064453125, 0.08676433563232422, 0.09044456481933594, 0.09412479400634766, 0.09780502319335938, 0.1014852523803711, 0.10516548156738281, 0.10884571075439453, 0.11252593994140625, 0.11620616912841797, 0.11988639831542969, 0.1235666275024414, 0.12724685668945312, 0.13092708587646484, 0.13460731506347656, 0.13828754425048828, 0.1419677734375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 24.0, 144.0, 556.0, 205.0, 53.0, 11.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7478407621383667, -0.7255522012710571, -0.7032635807991028, -0.6809750199317932, -0.6586863994598389, -0.6363978385925293, -0.6141092777252197, -0.5918206572532654, -0.569532036781311, -0.5472434759140015, -0.5249548554420471, -0.5026662945747375, -0.4803776741027832, -0.45808911323547363, -0.4358005225658417, -0.4135119318962097, -0.39122337102890015, -0.3689347803592682, -0.34664618968963623, -0.32435762882232666, -0.3020690083503723, -0.27978044748306274, -0.2574918568134308, -0.23520326614379883, -0.21291467547416687, -0.1906260848045349, -0.16833749413490295, -0.1460489183664322, -0.12376032769680023, -0.10147173702716827, -0.07918316125869751, -0.05689457058906555, -0.034605979919433594, -0.012317392975091934, 0.009971193969249725, 0.032259777188301086, 0.054548367857933044, 0.076836958527565, 0.09912553429603577, 0.12141412496566772, 0.14370271563529968, 0.16599130630493164, 0.1882798969745636, 0.21056847274303436, 0.23285706341266632, 0.2551456689834595, 0.27743422985076904, 0.299722820520401, 0.32201141119003296, 0.3443000018596649, 0.3665885925292969, 0.38887715339660645, 0.4111657738685608, 0.43345433473587036, 0.4557429254055023, 0.4780315160751343, 0.5003200769424438, 0.5226086378097534, 0.5448972582817078, 0.5671858191490173, 0.5894744396209717, 0.6117630004882812, 0.6340515613555908, 0.6563401818275452, 0.6786288022994995]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 12.0, 19.0, 49.0, 75.0, 124.0, 137.0, 116.0, 143.0, 120.0, 90.0, 59.0, 23.0, 18.0, 12.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.486997127532959, -0.4758654236793518, -0.46473371982574463, -0.45360201597213745, -0.4424703121185303, -0.4313386082649231, -0.4202069044113159, -0.40907520055770874, -0.39794349670410156, -0.3868117928504944, -0.3756800889968872, -0.36454838514328003, -0.35341668128967285, -0.3422849774360657, -0.3311532735824585, -0.3200215697288513, -0.30888983607292175, -0.2977581322193146, -0.2866264283657074, -0.2754947245121002, -0.26436302065849304, -0.25323131680488586, -0.2420995980501175, -0.23096789419651031, -0.21983619034290314, -0.20870448648929596, -0.19757278263568878, -0.1864410638809204, -0.17530936002731323, -0.16417765617370605, -0.15304595232009888, -0.1419142484664917, -0.13078254461288452, -0.11965084075927734, -0.10851913690567017, -0.09738742560148239, -0.08625572174787521, -0.07512401789426804, -0.06399230659008026, -0.052860602736473083, -0.041728898882865906, -0.03059719316661358, -0.019465487450361252, -0.008333779871463776, 0.002797923982143402, 0.01392962783575058, 0.025061339139938354, 0.03619304299354553, 0.04732474684715271, 0.05845645070075989, 0.06958815455436707, 0.08071986585855484, 0.09185156971216202, 0.1029832735657692, 0.11411498486995697, 0.12524668872356415, 0.13637839257717133, 0.1475100964307785, 0.15864180028438568, 0.16977351903915405, 0.18090522289276123, 0.1920369267463684, 0.20316863059997559, 0.21430033445358276, 0.22543203830718994]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 8.0, 5.0, 16.0, 21.0, 20.0, 27.0, 45.0, 36.0, 56.0, 95.0, 114.0, 154.0, 196.0, 291.0, 404.0, 630.0, 1052.0, 1769.0, 4042.0, 14277.0, 86033.0, 640936.0, 252983.0, 31933.0, 7043.0, 2537.0, 1314.0, 754.0, 498.0, 332.0, 246.0, 171.0, 119.0, 88.0, 68.0, 48.0, 40.0, 49.0, 25.0, 14.0, 12.0, 14.0, 9.0, 8.0, 9.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.21728515625, -0.20998001098632812, -0.20267486572265625, -0.19536972045898438, -0.1880645751953125, -0.18075942993164062, -0.17345428466796875, -0.16614913940429688, -0.158843994140625, -0.15153884887695312, -0.14423370361328125, -0.13692855834960938, -0.1296234130859375, -0.12231826782226562, -0.11501312255859375, -0.10770797729492188, -0.10040283203125, -0.09309768676757812, -0.08579254150390625, -0.07848739624023438, -0.0711822509765625, -0.06387710571289062, -0.05657196044921875, -0.049266815185546875, -0.041961669921875, -0.034656524658203125, -0.02735137939453125, -0.020046234130859375, -0.0127410888671875, -0.005435943603515625, 0.00186920166015625, 0.009174346923828125, 0.0164794921875, 0.023784637451171875, 0.03108978271484375, 0.038394927978515625, 0.0457000732421875, 0.053005218505859375, 0.06031036376953125, 0.06761550903320312, 0.074920654296875, 0.08222579956054688, 0.08953094482421875, 0.09683609008789062, 0.1041412353515625, 0.11144638061523438, 0.11875152587890625, 0.12605667114257812, 0.13336181640625, 0.14066696166992188, 0.14797210693359375, 0.15527725219726562, 0.1625823974609375, 0.16988754272460938, 0.17719268798828125, 0.18449783325195312, 0.191802978515625, 0.19910812377929688, 0.20641326904296875, 0.21371841430664062, 0.2210235595703125, 0.22832870483398438, 0.23563385009765625, 0.24293899536132812, 0.250244140625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 17.0, 43.0, 62.0, 119.0, 144.0, 183.0, 141.0, 129.0, 88.0, 35.0, 15.0, 6.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12371826171875, -0.12074565887451172, -0.11777305603027344, -0.11480045318603516, -0.11182785034179688, -0.1088552474975586, -0.10588264465332031, -0.10291004180908203, -0.09993743896484375, -0.09696483612060547, -0.09399223327636719, -0.0910196304321289, -0.08804702758789062, -0.08507442474365234, -0.08210182189941406, -0.07912921905517578, -0.0761566162109375, -0.07318401336669922, -0.07021141052246094, -0.06723880767822266, -0.06426620483398438, -0.061293601989746094, -0.05832099914550781, -0.05534839630126953, -0.05237579345703125, -0.04940319061279297, -0.04643058776855469, -0.043457984924316406, -0.040485382080078125, -0.037512779235839844, -0.03454017639160156, -0.03156757354736328, -0.028594970703125, -0.02562236785888672, -0.022649765014648438, -0.019677162170410156, -0.016704559326171875, -0.013731956481933594, -0.010759353637695312, -0.007786750793457031, -0.00481414794921875, -0.0018415451049804688, 0.0011310577392578125, 0.004103660583496094, 0.007076263427734375, 0.010048866271972656, 0.013021469116210938, 0.01599407196044922, 0.0189666748046875, 0.02193927764892578, 0.024911880493164062, 0.027884483337402344, 0.030857086181640625, 0.033829689025878906, 0.03680229187011719, 0.03977489471435547, 0.04274749755859375, 0.04572010040283203, 0.04869270324707031, 0.051665306091308594, 0.054637908935546875, 0.057610511779785156, 0.06058311462402344, 0.06355571746826172, 0.0665283203125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 5.0, 2.0, 7.0, 16.0, 27.0, 24.0, 40.0, 54.0, 82.0, 152.0, 279.0, 528.0, 1011.0, 2137.0, 4788.0, 11331.0, 28437.0, 75570.0, 213206.0, 425467.0, 178766.0, 63867.0, 24509.0, 9964.0, 4191.0, 1981.0, 966.0, 493.0, 254.0, 143.0, 86.0, 50.0, 33.0, 21.0, 22.0, 9.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.09405517578125, -0.09115409851074219, -0.08825302124023438, -0.08535194396972656, -0.08245086669921875, -0.07954978942871094, -0.07664871215820312, -0.07374763488769531, -0.0708465576171875, -0.06794548034667969, -0.06504440307617188, -0.06214332580566406, -0.05924224853515625, -0.05634117126464844, -0.053440093994140625, -0.05053901672363281, -0.047637939453125, -0.04473686218261719, -0.041835784912109375, -0.03893470764160156, -0.03603363037109375, -0.03313255310058594, -0.030231475830078125, -0.027330398559570312, -0.0244293212890625, -0.021528244018554688, -0.018627166748046875, -0.015726089477539062, -0.01282501220703125, -0.009923934936523438, -0.007022857666015625, -0.0041217803955078125, -0.001220703125, 0.0016803741455078125, 0.004581451416015625, 0.0074825286865234375, 0.01038360595703125, 0.013284683227539062, 0.016185760498046875, 0.019086837768554688, 0.0219879150390625, 0.024888992309570312, 0.027790069580078125, 0.030691146850585938, 0.03359222412109375, 0.03649330139160156, 0.039394378662109375, 0.04229545593261719, 0.045196533203125, 0.04809761047363281, 0.050998687744140625, 0.05389976501464844, 0.05680084228515625, 0.05970191955566406, 0.06260299682617188, 0.06550407409667969, 0.0684051513671875, 0.07130622863769531, 0.07420730590820312, 0.07710838317871094, 0.08000946044921875, 0.08291053771972656, 0.08581161499023438, 0.08871269226074219, 0.09161376953125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 1.0, 3.0, 8.0, 7.0, 11.0, 3.0, 18.0, 17.0, 14.0, 20.0, 21.0, 25.0, 38.0, 32.0, 35.0, 28.0, 28.0, 42.0, 29.0, 47.0, 49.0, 45.0, 43.0, 45.0, 36.0, 44.0, 41.0, 32.0, 35.0, 23.0, 28.0, 21.0, 24.0, 21.0, 17.0, 7.0, 13.0, 4.0, 12.0, 8.0, 6.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.100830078125, -0.09771060943603516, -0.09459114074707031, -0.09147167205810547, -0.08835220336914062, -0.08523273468017578, -0.08211326599121094, -0.0789937973022461, -0.07587432861328125, -0.0727548599243164, -0.06963539123535156, -0.06651592254638672, -0.06339645385742188, -0.06027698516845703, -0.05715751647949219, -0.054038047790527344, -0.0509185791015625, -0.047799110412597656, -0.04467964172363281, -0.04156017303466797, -0.038440704345703125, -0.03532123565673828, -0.03220176696777344, -0.029082298278808594, -0.02596282958984375, -0.022843360900878906, -0.019723892211914062, -0.01660442352294922, -0.013484954833984375, -0.010365486145019531, -0.0072460174560546875, -0.004126548767089844, -0.001007080078125, 0.0021123886108398438, 0.0052318572998046875, 0.008351325988769531, 0.011470794677734375, 0.014590263366699219, 0.017709732055664062, 0.020829200744628906, 0.02394866943359375, 0.027068138122558594, 0.030187606811523438, 0.03330707550048828, 0.036426544189453125, 0.03954601287841797, 0.04266548156738281, 0.045784950256347656, 0.0489044189453125, 0.052023887634277344, 0.05514335632324219, 0.05826282501220703, 0.061382293701171875, 0.06450176239013672, 0.06762123107910156, 0.0707406997680664, 0.07386016845703125, 0.0769796371459961, 0.08009910583496094, 0.08321857452392578, 0.08633804321289062, 0.08945751190185547, 0.09257698059082031, 0.09569644927978516, 0.09881591796875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 9.0, 15.0, 12.0, 16.0, 23.0, 57.0, 81.0, 134.0, 209.0, 395.0, 707.0, 1326.0, 2657.0, 6555.0, 18694.0, 68429.0, 423821.0, 426496.0, 68145.0, 18385.0, 6593.0, 2839.0, 1361.0, 709.0, 388.0, 192.0, 112.0, 63.0, 54.0, 24.0, 12.0, 12.0, 10.0, 12.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.04449462890625, -0.04332375526428223, -0.04215288162231445, -0.04098200798034668, -0.039811134338378906, -0.03864026069641113, -0.03746938705444336, -0.036298513412475586, -0.03512763977050781, -0.03395676612854004, -0.032785892486572266, -0.03161501884460449, -0.03044414520263672, -0.029273271560668945, -0.028102397918701172, -0.0269315242767334, -0.025760650634765625, -0.02458977699279785, -0.023418903350830078, -0.022248029708862305, -0.02107715606689453, -0.019906282424926758, -0.018735408782958984, -0.01756453514099121, -0.016393661499023438, -0.015222787857055664, -0.01405191421508789, -0.012881040573120117, -0.011710166931152344, -0.01053929328918457, -0.009368419647216797, -0.008197546005249023, -0.00702667236328125, -0.0058557987213134766, -0.004684925079345703, -0.0035140514373779297, -0.0023431777954101562, -0.0011723041534423828, -1.430511474609375e-06, 0.001169443130493164, 0.0023403167724609375, 0.003511190414428711, 0.004682064056396484, 0.005852937698364258, 0.007023811340332031, 0.008194684982299805, 0.009365558624267578, 0.010536432266235352, 0.011707305908203125, 0.012878179550170898, 0.014049053192138672, 0.015219926834106445, 0.01639080047607422, 0.017561674118041992, 0.018732547760009766, 0.01990342140197754, 0.021074295043945312, 0.022245168685913086, 0.02341604232788086, 0.024586915969848633, 0.025757789611816406, 0.02692866325378418, 0.028099536895751953, 0.029270410537719727, 0.0304412841796875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 6.0, 6.0, 5.0, 9.0, 14.0, 16.0, 27.0, 32.0, 60.0, 110.0, 244.0, 243.0, 84.0, 57.0, 29.0, 18.0, 13.0, 7.0, 7.0, 10.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017154216766357422, -0.0001659989356994629, -0.00016045570373535156, -0.00015491247177124023, -0.0001493692398071289, -0.00014382600784301758, -0.00013828277587890625, -0.00013273954391479492, -0.0001271963119506836, -0.00012165307998657227, -0.00011610984802246094, -0.00011056661605834961, -0.00010502338409423828, -9.948015213012695e-05, -9.393692016601562e-05, -8.83936882019043e-05, -8.285045623779297e-05, -7.730722427368164e-05, -7.176399230957031e-05, -6.622076034545898e-05, -6.0677528381347656e-05, -5.513429641723633e-05, -4.9591064453125e-05, -4.404783248901367e-05, -3.8504600524902344e-05, -3.2961368560791016e-05, -2.7418136596679688e-05, -2.187490463256836e-05, -1.633167266845703e-05, -1.0788440704345703e-05, -5.245208740234375e-06, 2.980232238769531e-07, 5.841255187988281e-06, 1.138448715209961e-05, 1.6927719116210938e-05, 2.2470951080322266e-05, 2.8014183044433594e-05, 3.355741500854492e-05, 3.910064697265625e-05, 4.464387893676758e-05, 5.0187110900878906e-05, 5.5730342864990234e-05, 6.127357482910156e-05, 6.681680679321289e-05, 7.236003875732422e-05, 7.790327072143555e-05, 8.344650268554688e-05, 8.89897346496582e-05, 9.453296661376953e-05, 0.00010007619857788086, 0.00010561943054199219, 0.00011116266250610352, 0.00011670589447021484, 0.00012224912643432617, 0.0001277923583984375, 0.00013333559036254883, 0.00013887882232666016, 0.00014442205429077148, 0.0001499652862548828, 0.00015550851821899414, 0.00016105175018310547, 0.0001665949821472168, 0.00017213821411132812, 0.00017768144607543945, 0.00018322467803955078]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 10.0, 14.0, 17.0, 18.0, 40.0, 90.0, 174.0, 293.0, 838.0, 2962.0, 13167.0, 90736.0, 731920.0, 180705.0, 21291.0, 4270.0, 1189.0, 431.0, 182.0, 88.0, 45.0, 39.0, 19.0, 9.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059295654296875, -0.0576319694519043, -0.055968284606933594, -0.05430459976196289, -0.05264091491699219, -0.050977230072021484, -0.04931354522705078, -0.04764986038208008, -0.045986175537109375, -0.04432249069213867, -0.04265880584716797, -0.040995121002197266, -0.03933143615722656, -0.03766775131225586, -0.036004066467285156, -0.03434038162231445, -0.03267669677734375, -0.031013011932373047, -0.029349327087402344, -0.02768564224243164, -0.026021957397460938, -0.024358272552490234, -0.02269458770751953, -0.021030902862548828, -0.019367218017578125, -0.017703533172607422, -0.01603984832763672, -0.014376163482666016, -0.012712478637695312, -0.01104879379272461, -0.009385108947753906, -0.007721424102783203, -0.0060577392578125, -0.004394054412841797, -0.0027303695678710938, -0.0010666847229003906, 0.0005970001220703125, 0.0022606849670410156, 0.003924369812011719, 0.005588054656982422, 0.007251739501953125, 0.008915424346923828, 0.010579109191894531, 0.012242794036865234, 0.013906478881835938, 0.01557016372680664, 0.017233848571777344, 0.018897533416748047, 0.02056121826171875, 0.022224903106689453, 0.023888587951660156, 0.02555227279663086, 0.027215957641601562, 0.028879642486572266, 0.03054332733154297, 0.03220701217651367, 0.033870697021484375, 0.03553438186645508, 0.03719806671142578, 0.038861751556396484, 0.04052543640136719, 0.04218912124633789, 0.043852806091308594, 0.0455164909362793, 0.04718017578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 4.0, 4.0, 9.0, 15.0, 25.0, 30.0, 35.0, 55.0, 76.0, 104.0, 125.0, 110.0, 118.0, 100.0, 70.0, 45.0, 26.0, 17.0, 13.0, 7.0, 7.0, 8.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0640869140625, -0.06270146369934082, -0.06131601333618164, -0.05993056297302246, -0.05854511260986328, -0.0571596622467041, -0.05577421188354492, -0.05438876152038574, -0.05300331115722656, -0.05161786079406738, -0.0502324104309082, -0.04884696006774902, -0.047461509704589844, -0.046076059341430664, -0.044690608978271484, -0.043305158615112305, -0.041919708251953125, -0.040534257888793945, -0.039148807525634766, -0.037763357162475586, -0.036377906799316406, -0.03499245643615723, -0.03360700607299805, -0.03222155570983887, -0.030836105346679688, -0.029450654983520508, -0.028065204620361328, -0.02667975425720215, -0.02529430389404297, -0.02390885353088379, -0.02252340316772461, -0.02113795280456543, -0.01975250244140625, -0.01836705207824707, -0.01698160171508789, -0.015596151351928711, -0.014210700988769531, -0.012825250625610352, -0.011439800262451172, -0.010054349899291992, -0.008668899536132812, -0.007283449172973633, -0.005897998809814453, -0.0045125484466552734, -0.0031270980834960938, -0.001741647720336914, -0.0003561973571777344, 0.0010292530059814453, 0.002414703369140625, 0.0038001537322998047, 0.005185604095458984, 0.006571054458618164, 0.007956504821777344, 0.009341955184936523, 0.010727405548095703, 0.012112855911254883, 0.013498306274414062, 0.014883756637573242, 0.016269207000732422, 0.0176546573638916, 0.01904010772705078, 0.02042555809020996, 0.02181100845336914, 0.02319645881652832, 0.0245819091796875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 12.0, 14.0, 15.0, 27.0, 44.0, 49.0, 94.0, 138.0, 133.0, 162.0, 107.0, 78.0, 41.0, 31.0, 14.0, 21.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0081660747528076, -0.9827969074249268, -0.9574277997016907, -0.9320586323738098, -0.9066895246505737, -0.8813203573226929, -0.855951189994812, -0.8305820822715759, -0.8052129745483398, -0.779843807220459, -0.7544746994972229, -0.729105532169342, -0.703736424446106, -0.6783672571182251, -0.6529980897903442, -0.6276289820671082, -0.6022598147392273, -0.5768906474113464, -0.5515215396881104, -0.5261523723602295, -0.5007832646369934, -0.47541409730911255, -0.4500449597835541, -0.4246758222579956, -0.39930668473243713, -0.37393754720687866, -0.3485684096813202, -0.3231992721557617, -0.29783010482788086, -0.2724609971046448, -0.24709182977676392, -0.22172269225120544, -0.19635355472564697, -0.1709844172000885, -0.14561527967453003, -0.12024612724781036, -0.09487698972225189, -0.06950785219669342, -0.044138699769973755, -0.018769562244415283, 0.0065995752811431885, 0.03196871653199196, 0.05733785778284073, 0.0827070027589798, 0.10807614028453827, 0.13344527781009674, 0.1588144302368164, 0.18418356776237488, 0.20955270528793335, 0.23492184281349182, 0.2602909803390503, 0.28566014766693115, 0.31102925539016724, 0.3363984227180481, 0.36176756024360657, 0.38713669776916504, 0.4125058352947235, 0.437874972820282, 0.46324411034584045, 0.4886132478713989, 0.5139824151992798, 0.5393515229225159, 0.5647206902503967, 0.5900897979736328, 0.6154589653015137]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 8.0, 4.0, 8.0, 6.0, 13.0, 18.0, 21.0, 21.0, 29.0, 26.0, 25.0, 34.0, 35.0, 43.0, 49.0, 34.0, 53.0, 51.0, 54.0, 54.0, 37.0, 43.0, 52.0, 40.0, 33.0, 32.0, 28.0, 21.0, 26.0, 17.0, 13.0, 18.0, 11.0, 10.0, 8.0, 10.0, 7.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5147621631622314, -0.4973222017288208, -0.47988224029541016, -0.4624422788619995, -0.44500231742858887, -0.4275623559951782, -0.41012242436408997, -0.3926824629306793, -0.3752425014972687, -0.35780254006385803, -0.3403625786304474, -0.32292261719703674, -0.3054826855659485, -0.28804272413253784, -0.2706027626991272, -0.25316280126571655, -0.2357228398323059, -0.21828287839889526, -0.20084291696548462, -0.18340297043323517, -0.16596300899982452, -0.14852304756641388, -0.13108310103416443, -0.11364313960075378, -0.09620317816734314, -0.0787632167339325, -0.06132326275110245, -0.0438833050429821, -0.026443347334861755, -0.00900338590145111, 0.008436568081378937, 0.025876522064208984, 0.04331648349761963, 0.060756441205739975, 0.07819639891386032, 0.09563635289669037, 0.11307631433010101, 0.13051627576351166, 0.1479562222957611, 0.16539618372917175, 0.1828361451625824, 0.20027610659599304, 0.2177160680294037, 0.23515601456165314, 0.2525959610939026, 0.27003592252731323, 0.2874758839607239, 0.3049158453941345, 0.32235580682754517, 0.3397957682609558, 0.35723572969436646, 0.3746756911277771, 0.39211565256118774, 0.4095556139945984, 0.42699554562568665, 0.4444355070590973, 0.46187546849250793, 0.4793154299259186, 0.4967553913593292, 0.5141953229904175, 0.5316352844238281, 0.5490752458572388, 0.5665152072906494, 0.5839551687240601, 0.6013951301574707]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 4.0, 5.0, 5.0, 11.0, 6.0, 11.0, 10.0, 10.0, 15.0, 16.0, 23.0, 26.0, 28.0, 58.0, 67.0, 125.0, 220.0, 512.0, 1495.0, 5942.0, 107310.0, 4065869.0, 8825.0, 2127.0, 743.0, 334.0, 161.0, 103.0, 78.0, 42.0, 31.0, 24.0, 7.0, 11.0, 6.0, 8.0, 5.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.6025390625, -0.5885581970214844, -0.5745773315429688, -0.5605964660644531, -0.5466156005859375, -0.5326347351074219, -0.5186538696289062, -0.5046730041503906, -0.490692138671875, -0.4767112731933594, -0.46273040771484375, -0.4487495422363281, -0.4347686767578125, -0.4207878112792969, -0.40680694580078125, -0.3928260803222656, -0.37884521484375, -0.3648643493652344, -0.35088348388671875, -0.3369026184082031, -0.3229217529296875, -0.3089408874511719, -0.29496002197265625, -0.2809791564941406, -0.266998291015625, -0.2530174255371094, -0.23903656005859375, -0.22505569458007812, -0.2110748291015625, -0.19709396362304688, -0.18311309814453125, -0.16913223266601562, -0.1551513671875, -0.14117050170898438, -0.12718963623046875, -0.11320877075195312, -0.0992279052734375, -0.08524703979492188, -0.07126617431640625, -0.057285308837890625, -0.043304443359375, -0.029323577880859375, -0.01534271240234375, -0.001361846923828125, 0.0126190185546875, 0.026599884033203125, 0.04058074951171875, 0.054561614990234375, 0.06854248046875, 0.08252334594726562, 0.09650421142578125, 0.11048507690429688, 0.1244659423828125, 0.13844680786132812, 0.15242767333984375, 0.16640853881835938, 0.180389404296875, 0.19437026977539062, 0.20835113525390625, 0.22233200073242188, 0.2363128662109375, 0.2502937316894531, 0.26427459716796875, 0.2782554626464844, 0.292236328125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 19.0, 40.0, 61.0, 102.0, 150.0, 191.0, 161.0, 118.0, 81.0, 46.0, 10.0, 4.0, 5.0, 1.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1253662109375, -0.1223592758178711, -0.11935234069824219, -0.11634540557861328, -0.11333847045898438, -0.11033153533935547, -0.10732460021972656, -0.10431766510009766, -0.10131072998046875, -0.09830379486083984, -0.09529685974121094, -0.09228992462158203, -0.08928298950195312, -0.08627605438232422, -0.08326911926269531, -0.0802621841430664, -0.0772552490234375, -0.0742483139038086, -0.07124137878417969, -0.06823444366455078, -0.06522750854492188, -0.06222057342529297, -0.05921363830566406, -0.056206703186035156, -0.05319976806640625, -0.050192832946777344, -0.04718589782714844, -0.04417896270751953, -0.041172027587890625, -0.03816509246826172, -0.03515815734863281, -0.032151222229003906, -0.029144287109375, -0.026137351989746094, -0.023130416870117188, -0.02012348175048828, -0.017116546630859375, -0.014109611511230469, -0.011102676391601562, -0.008095741271972656, -0.00508880615234375, -0.0020818710327148438, 0.0009250640869140625, 0.003931999206542969, 0.006938934326171875, 0.009945869445800781, 0.012952804565429688, 0.015959739685058594, 0.0189666748046875, 0.021973609924316406, 0.024980545043945312, 0.02798748016357422, 0.030994415283203125, 0.03400135040283203, 0.03700828552246094, 0.040015220642089844, 0.04302215576171875, 0.046029090881347656, 0.04903602600097656, 0.05204296112060547, 0.055049896240234375, 0.05805683135986328, 0.06106376647949219, 0.0640707015991211, 0.06707763671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 13.0, 18.0, 18.0, 34.0, 37.0, 74.0, 97.0, 187.0, 342.0, 768.0, 2055.0, 6661.0, 40218.0, 4088710.0, 44314.0, 7056.0, 1994.0, 786.0, 363.0, 200.0, 116.0, 72.0, 51.0, 29.0, 20.0, 11.0, 15.0, 5.0, 3.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2471923828125, -0.2378711700439453, -0.22854995727539062, -0.21922874450683594, -0.20990753173828125, -0.20058631896972656, -0.19126510620117188, -0.1819438934326172, -0.1726226806640625, -0.1633014678955078, -0.15398025512695312, -0.14465904235839844, -0.13533782958984375, -0.12601661682128906, -0.11669540405273438, -0.10737419128417969, -0.098052978515625, -0.08873176574707031, -0.07941055297851562, -0.07008934020996094, -0.06076812744140625, -0.05144691467285156, -0.042125701904296875, -0.03280448913574219, -0.0234832763671875, -0.014162063598632812, -0.004840850830078125, 0.0044803619384765625, 0.01380157470703125, 0.023122787475585938, 0.032444000244140625, 0.04176521301269531, 0.05108642578125, 0.06040763854980469, 0.06972885131835938, 0.07905006408691406, 0.08837127685546875, 0.09769248962402344, 0.10701370239257812, 0.11633491516113281, 0.1256561279296875, 0.1349773406982422, 0.14429855346679688, 0.15361976623535156, 0.16294097900390625, 0.17226219177246094, 0.18158340454101562, 0.1909046173095703, 0.200225830078125, 0.2095470428466797, 0.21886825561523438, 0.22818946838378906, 0.23751068115234375, 0.24683189392089844, 0.2561531066894531, 0.2654743194580078, 0.2747955322265625, 0.2841167449951172, 0.2934379577636719, 0.30275917053222656, 0.31208038330078125, 0.32140159606933594, 0.3307228088378906, 0.3400440216064453, 0.349365234375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 5.0, 4.0, 8.0, 8.0, 9.0, 17.0, 28.0, 72.0, 3430.0, 363.0, 60.0, 32.0, 17.0, 9.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11749267578125, -0.11327266693115234, -0.10905265808105469, -0.10483264923095703, -0.10061264038085938, -0.09639263153076172, -0.09217262268066406, -0.0879526138305664, -0.08373260498046875, -0.0795125961303711, -0.07529258728027344, -0.07107257843017578, -0.06685256958007812, -0.06263256072998047, -0.05841255187988281, -0.054192543029785156, -0.0499725341796875, -0.045752525329589844, -0.04153251647949219, -0.03731250762939453, -0.033092498779296875, -0.02887248992919922, -0.024652481079101562, -0.020432472229003906, -0.01621246337890625, -0.011992454528808594, -0.0077724456787109375, -0.0035524368286132812, 0.000667572021484375, 0.004887580871582031, 0.009107589721679688, 0.013327598571777344, 0.017547607421875, 0.021767616271972656, 0.025987625122070312, 0.03020763397216797, 0.034427642822265625, 0.03864765167236328, 0.04286766052246094, 0.047087669372558594, 0.05130767822265625, 0.055527687072753906, 0.05974769592285156, 0.06396770477294922, 0.06818771362304688, 0.07240772247314453, 0.07662773132324219, 0.08084774017333984, 0.0850677490234375, 0.08928775787353516, 0.09350776672363281, 0.09772777557373047, 0.10194778442382812, 0.10616779327392578, 0.11038780212402344, 0.1146078109741211, 0.11882781982421875, 0.1230478286743164, 0.12726783752441406, 0.13148784637451172, 0.13570785522460938, 0.13992786407470703, 0.1441478729248047, 0.14836788177490234, 0.152587890625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 10.0, 19.0, 55.0, 217.0, 447.0, 169.0, 47.0, 18.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9195607900619507, -0.8955643177032471, -0.8715678453445435, -0.8475714325904846, -0.823574960231781, -0.7995784878730774, -0.7755820751190186, -0.7515856027603149, -0.7275891304016113, -0.7035926580429077, -0.6795961856842041, -0.6555997729301453, -0.6316033005714417, -0.607606828212738, -0.5836104154586792, -0.5596139430999756, -0.535617470741272, -0.5116209983825684, -0.48762455582618713, -0.4636281132698059, -0.4396316409111023, -0.4156351685523987, -0.39163872599601746, -0.36764228343963623, -0.3436458110809326, -0.319649338722229, -0.2956528961658478, -0.27165645360946655, -0.24765998125076294, -0.22366352379322052, -0.1996670663356781, -0.17567060887813568, -0.15167415142059326, -0.12767769396305084, -0.10368123650550842, -0.079684779047966, -0.055688321590423584, -0.031691864132881165, -0.007695406675338745, 0.016301050782203674, 0.040297508239746094, 0.06429396569728851, 0.08829042315483093, 0.11228688061237335, 0.13628333806991577, 0.1602797955274582, 0.1842762529850006, 0.20827271044254303, 0.23226916790008545, 0.25626564025878906, 0.2802620828151703, 0.3042585253715515, 0.3282549977302551, 0.35225147008895874, 0.37624791264533997, 0.4002443552017212, 0.4242408275604248, 0.4482372999191284, 0.47223374247550964, 0.49623018503189087, 0.5202266573905945, 0.5442231297492981, 0.5682195425033569, 0.5922160148620605, 0.6162124872207642]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 4.0, 11.0, 17.0, 23.0, 49.0, 58.0, 78.0, 97.0, 101.0, 127.0, 77.0, 102.0, 69.0, 53.0, 42.0, 34.0, 24.0, 11.0, 7.0, 5.0, 6.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.36791157722473145, -0.3569802939891815, -0.3460490107536316, -0.33511772751808167, -0.32418644428253174, -0.3132551610469818, -0.3023238778114319, -0.29139259457588196, -0.28046131134033203, -0.2695300281047821, -0.2585987448692322, -0.24766746163368225, -0.23673617839813232, -0.2258048951625824, -0.21487361192703247, -0.20394232869148254, -0.19301104545593262, -0.1820797622203827, -0.17114847898483276, -0.16021719574928284, -0.1492859125137329, -0.13835462927818298, -0.12742334604263306, -0.11649206280708313, -0.1055607795715332, -0.09462949633598328, -0.08369821310043335, -0.07276692986488342, -0.061835646629333496, -0.05090436339378357, -0.03997308015823364, -0.029041796922683716, -0.01811051368713379, -0.007179230451583862, 0.0037520527839660645, 0.014683336019515991, 0.025614619255065918, 0.036545902490615845, 0.04747718572616577, 0.0584084689617157, 0.06933975219726562, 0.08027103543281555, 0.09120231866836548, 0.1021336019039154, 0.11306488513946533, 0.12399616837501526, 0.13492745161056519, 0.1458587348461151, 0.15679001808166504, 0.16772130131721497, 0.1786525845527649, 0.18958386778831482, 0.20051515102386475, 0.21144643425941467, 0.2223777174949646, 0.23330900073051453, 0.24424028396606445, 0.2551715672016144, 0.2661028504371643, 0.27703413367271423, 0.28796541690826416, 0.2988967001438141, 0.309827983379364, 0.32075926661491394, 0.33169054985046387]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 7.0, 13.0, 14.0, 7.0, 17.0, 23.0, 37.0, 68.0, 71.0, 110.0, 156.0, 224.0, 372.0, 701.0, 1149.0, 2705.0, 8919.0, 80115.0, 805894.0, 129604.0, 12067.0, 2980.0, 1332.0, 691.0, 427.0, 256.0, 202.0, 119.0, 73.0, 46.0, 43.0, 27.0, 35.0, 17.0, 11.0, 6.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.361328125, -0.3502388000488281, -0.33914947509765625, -0.3280601501464844, -0.3169708251953125, -0.3058815002441406, -0.29479217529296875, -0.2837028503417969, -0.272613525390625, -0.2615242004394531, -0.25043487548828125, -0.23934555053710938, -0.2282562255859375, -0.21716690063476562, -0.20607757568359375, -0.19498825073242188, -0.18389892578125, -0.17280960083007812, -0.16172027587890625, -0.15063095092773438, -0.1395416259765625, -0.12845230102539062, -0.11736297607421875, -0.10627365112304688, -0.095184326171875, -0.08409500122070312, -0.07300567626953125, -0.061916351318359375, -0.0508270263671875, -0.039737701416015625, -0.02864837646484375, -0.017559051513671875, -0.0064697265625, 0.004619598388671875, 0.01570892333984375, 0.026798248291015625, 0.0378875732421875, 0.048976898193359375, 0.06006622314453125, 0.07115554809570312, 0.082244873046875, 0.09333419799804688, 0.10442352294921875, 0.11551284790039062, 0.1266021728515625, 0.13769149780273438, 0.14878082275390625, 0.15987014770507812, 0.17095947265625, 0.18204879760742188, 0.19313812255859375, 0.20422744750976562, 0.2153167724609375, 0.22640609741210938, 0.23749542236328125, 0.24858474731445312, 0.259674072265625, 0.2707633972167969, 0.28185272216796875, 0.2929420471191406, 0.3040313720703125, 0.3151206970214844, 0.32621002197265625, 0.3372993469238281, 0.348388671875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 22.0, 39.0, 72.0, 109.0, 161.0, 201.0, 159.0, 103.0, 77.0, 25.0, 8.0, 8.0, 2.0, 1.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1278076171875, -0.1247243881225586, -0.12164115905761719, -0.11855792999267578, -0.11547470092773438, -0.11239147186279297, -0.10930824279785156, -0.10622501373291016, -0.10314178466796875, -0.10005855560302734, -0.09697532653808594, -0.09389209747314453, -0.09080886840820312, -0.08772563934326172, -0.08464241027832031, -0.0815591812133789, -0.0784759521484375, -0.0753927230834961, -0.07230949401855469, -0.06922626495361328, -0.06614303588867188, -0.06305980682373047, -0.05997657775878906, -0.056893348693847656, -0.05381011962890625, -0.050726890563964844, -0.04764366149902344, -0.04456043243408203, -0.041477203369140625, -0.03839397430419922, -0.03531074523925781, -0.032227516174316406, -0.029144287109375, -0.026061058044433594, -0.022977828979492188, -0.01989459991455078, -0.016811370849609375, -0.013728141784667969, -0.010644912719726562, -0.007561683654785156, -0.00447845458984375, -0.0013952255249023438, 0.0016880035400390625, 0.004771232604980469, 0.007854461669921875, 0.010937690734863281, 0.014020919799804688, 0.017104148864746094, 0.0201873779296875, 0.023270606994628906, 0.026353836059570312, 0.02943706512451172, 0.032520294189453125, 0.03560352325439453, 0.03868675231933594, 0.041769981384277344, 0.04485321044921875, 0.047936439514160156, 0.05101966857910156, 0.05410289764404297, 0.057186126708984375, 0.06026935577392578, 0.06335258483886719, 0.0664358139038086, 0.06951904296875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 6.0, 6.0, 16.0, 22.0, 38.0, 61.0, 99.0, 165.0, 314.0, 603.0, 1612.0, 5041.0, 18565.0, 89839.0, 516311.0, 339996.0, 57057.0, 12707.0, 3686.0, 1287.0, 532.0, 258.0, 131.0, 71.0, 44.0, 29.0, 16.0, 22.0, 11.0, 5.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2044677734375, -0.1990680694580078, -0.19366836547851562, -0.18826866149902344, -0.18286895751953125, -0.17746925354003906, -0.17206954956054688, -0.1666698455810547, -0.1612701416015625, -0.1558704376220703, -0.15047073364257812, -0.14507102966308594, -0.13967132568359375, -0.13427162170410156, -0.12887191772460938, -0.12347221374511719, -0.118072509765625, -0.11267280578613281, -0.10727310180664062, -0.10187339782714844, -0.09647369384765625, -0.09107398986816406, -0.08567428588867188, -0.08027458190917969, -0.0748748779296875, -0.06947517395019531, -0.06407546997070312, -0.05867576599121094, -0.05327606201171875, -0.04787635803222656, -0.042476654052734375, -0.03707695007324219, -0.03167724609375, -0.026277542114257812, -0.020877838134765625, -0.015478134155273438, -0.01007843017578125, -0.0046787261962890625, 0.000720977783203125, 0.0061206817626953125, 0.0115203857421875, 0.016920089721679688, 0.022319793701171875, 0.027719497680664062, 0.03311920166015625, 0.03851890563964844, 0.043918609619140625, 0.04931831359863281, 0.054718017578125, 0.06011772155761719, 0.06551742553710938, 0.07091712951660156, 0.07631683349609375, 0.08171653747558594, 0.08711624145507812, 0.09251594543457031, 0.0979156494140625, 0.10331535339355469, 0.10871505737304688, 0.11411476135253906, 0.11951446533203125, 0.12491416931152344, 0.13031387329101562, 0.1357135772705078, 0.14111328125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 10.0, 11.0, 28.0, 36.0, 44.0, 71.0, 75.0, 60.0, 86.0, 107.0, 88.0, 76.0, 86.0, 59.0, 38.0, 38.0, 29.0, 15.0, 16.0, 5.0, 6.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2484130859375, -0.24182701110839844, -0.23524093627929688, -0.2286548614501953, -0.22206878662109375, -0.2154827117919922, -0.20889663696289062, -0.20231056213378906, -0.1957244873046875, -0.18913841247558594, -0.18255233764648438, -0.1759662628173828, -0.16938018798828125, -0.1627941131591797, -0.15620803833007812, -0.14962196350097656, -0.143035888671875, -0.13644981384277344, -0.12986373901367188, -0.12327766418457031, -0.11669158935546875, -0.11010551452636719, -0.10351943969726562, -0.09693336486816406, -0.0903472900390625, -0.08376121520996094, -0.07717514038085938, -0.07058906555175781, -0.06400299072265625, -0.05741691589355469, -0.050830841064453125, -0.04424476623535156, -0.03765869140625, -0.031072616577148438, -0.024486541748046875, -0.017900466918945312, -0.01131439208984375, -0.0047283172607421875, 0.001857757568359375, 0.008443832397460938, 0.0150299072265625, 0.021615982055664062, 0.028202056884765625, 0.03478813171386719, 0.04137420654296875, 0.04796028137207031, 0.054546356201171875, 0.06113243103027344, 0.067718505859375, 0.07430458068847656, 0.08089065551757812, 0.08747673034667969, 0.09406280517578125, 0.10064888000488281, 0.10723495483398438, 0.11382102966308594, 0.1204071044921875, 0.12699317932128906, 0.13357925415039062, 0.1401653289794922, 0.14675140380859375, 0.1533374786376953, 0.15992355346679688, 0.16650962829589844, 0.173095703125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 6.0, 4.0, 4.0, 4.0, 7.0, 16.0, 21.0, 25.0, 32.0, 50.0, 87.0, 130.0, 155.0, 258.0, 413.0, 761.0, 1357.0, 2981.0, 7535.0, 26086.0, 145564.0, 711600.0, 116479.0, 22285.0, 6838.0, 2746.0, 1276.0, 693.0, 388.0, 236.0, 152.0, 114.0, 63.0, 57.0, 32.0, 34.0, 18.0, 13.0, 11.0, 3.0, 7.0, 3.0, 3.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06256103515625, -0.06057167053222656, -0.058582305908203125, -0.05659294128417969, -0.05460357666015625, -0.05261421203613281, -0.050624847412109375, -0.04863548278808594, -0.0466461181640625, -0.04465675354003906, -0.042667388916015625, -0.04067802429199219, -0.03868865966796875, -0.03669929504394531, -0.034709930419921875, -0.03272056579589844, -0.030731201171875, -0.028741836547851562, -0.026752471923828125, -0.024763107299804688, -0.02277374267578125, -0.020784378051757812, -0.018795013427734375, -0.016805648803710938, -0.0148162841796875, -0.012826919555664062, -0.010837554931640625, -0.008848190307617188, -0.00685882568359375, -0.0048694610595703125, -0.002880096435546875, -0.0008907318115234375, 0.0010986328125, 0.0030879974365234375, 0.005077362060546875, 0.0070667266845703125, 0.00905609130859375, 0.011045455932617188, 0.013034820556640625, 0.015024185180664062, 0.0170135498046875, 0.019002914428710938, 0.020992279052734375, 0.022981643676757812, 0.02497100830078125, 0.026960372924804688, 0.028949737548828125, 0.030939102172851562, 0.032928466796875, 0.03491783142089844, 0.036907196044921875, 0.03889656066894531, 0.04088592529296875, 0.04287528991699219, 0.044864654541015625, 0.04685401916503906, 0.0488433837890625, 0.05083274841308594, 0.052822113037109375, 0.05481147766113281, 0.05680084228515625, 0.05879020690917969, 0.060779571533203125, 0.06276893615722656, 0.06475830078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 2.0, 7.0, 6.0, 7.0, 10.0, 19.0, 18.0, 27.0, 37.0, 57.0, 90.0, 187.0, 187.0, 120.0, 67.0, 35.0, 30.0, 25.0, 13.0, 9.0, 9.0, 7.0, 6.0, 6.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019168853759765625, -0.00018637627363204956, -0.00018106400966644287, -0.00017575174570083618, -0.0001704394817352295, -0.0001651272177696228, -0.0001598149538040161, -0.00015450268983840942, -0.00014919042587280273, -0.00014387816190719604, -0.00013856589794158936, -0.00013325363397598267, -0.00012794137001037598, -0.0001226291060447693, -0.0001173168420791626, -0.00011200457811355591, -0.00010669231414794922, -0.00010138005018234253, -9.606778621673584e-05, -9.075552225112915e-05, -8.544325828552246e-05, -8.013099431991577e-05, -7.481873035430908e-05, -6.950646638870239e-05, -6.41942024230957e-05, -5.8881938457489014e-05, -5.3569674491882324e-05, -4.8257410526275635e-05, -4.2945146560668945e-05, -3.7632882595062256e-05, -3.2320618629455566e-05, -2.7008354663848877e-05, -2.1696090698242188e-05, -1.6383826732635498e-05, -1.1071562767028809e-05, -5.759298801422119e-06, -4.470348358154297e-07, 4.86522912979126e-06, 1.017749309539795e-05, 1.548975706100464e-05, 2.0802021026611328e-05, 2.6114284992218018e-05, 3.142654895782471e-05, 3.6738812923431396e-05, 4.2051076889038086e-05, 4.7363340854644775e-05, 5.2675604820251465e-05, 5.7987868785858154e-05, 6.330013275146484e-05, 6.861239671707153e-05, 7.392466068267822e-05, 7.923692464828491e-05, 8.45491886138916e-05, 8.986145257949829e-05, 9.517371654510498e-05, 0.00010048598051071167, 0.00010579824447631836, 0.00011111050844192505, 0.00011642277240753174, 0.00012173503637313843, 0.00012704730033874512, 0.0001323595643043518, 0.0001376718282699585, 0.00014298409223556519, 0.00014829635620117188]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 7.0, 12.0, 18.0, 20.0, 35.0, 49.0, 111.0, 227.0, 410.0, 817.0, 1613.0, 3230.0, 7797.0, 24794.0, 110279.0, 610607.0, 226518.0, 41314.0, 11950.0, 4503.0, 2068.0, 1001.0, 550.0, 262.0, 150.0, 82.0, 47.0, 31.0, 13.0, 9.0, 3.0, 8.0, 9.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0501708984375, -0.048587799072265625, -0.04700469970703125, -0.045421600341796875, -0.0438385009765625, -0.042255401611328125, -0.04067230224609375, -0.039089202880859375, -0.037506103515625, -0.035923004150390625, -0.03433990478515625, -0.032756805419921875, -0.0311737060546875, -0.029590606689453125, -0.02800750732421875, -0.026424407958984375, -0.02484130859375, -0.023258209228515625, -0.02167510986328125, -0.020092010498046875, -0.0185089111328125, -0.016925811767578125, -0.01534271240234375, -0.013759613037109375, -0.012176513671875, -0.010593414306640625, -0.00901031494140625, -0.007427215576171875, -0.0058441162109375, -0.004261016845703125, -0.00267791748046875, -0.001094818115234375, 0.00048828125, 0.002071380615234375, 0.00365447998046875, 0.005237579345703125, 0.0068206787109375, 0.008403778076171875, 0.00998687744140625, 0.011569976806640625, 0.013153076171875, 0.014736175537109375, 0.01631927490234375, 0.017902374267578125, 0.0194854736328125, 0.021068572998046875, 0.02265167236328125, 0.024234771728515625, 0.02581787109375, 0.027400970458984375, 0.02898406982421875, 0.030567169189453125, 0.0321502685546875, 0.033733367919921875, 0.03531646728515625, 0.036899566650390625, 0.038482666015625, 0.040065765380859375, 0.04164886474609375, 0.043231964111328125, 0.0448150634765625, 0.046398162841796875, 0.04798126220703125, 0.049564361572265625, 0.0511474609375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 4.0, 9.0, 24.0, 25.0, 40.0, 40.0, 56.0, 93.0, 87.0, 118.0, 118.0, 103.0, 74.0, 63.0, 38.0, 33.0, 23.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.04937744140625, -0.047616004943847656, -0.04585456848144531, -0.04409313201904297, -0.042331695556640625, -0.04057025909423828, -0.03880882263183594, -0.037047386169433594, -0.03528594970703125, -0.033524513244628906, -0.03176307678222656, -0.03000164031982422, -0.028240203857421875, -0.02647876739501953, -0.024717330932617188, -0.022955894470214844, -0.0211944580078125, -0.019433021545410156, -0.017671585083007812, -0.01591014862060547, -0.014148712158203125, -0.012387275695800781, -0.010625839233398438, -0.008864402770996094, -0.00710296630859375, -0.005341529846191406, -0.0035800933837890625, -0.0018186569213867188, -5.7220458984375e-05, 0.0017042160034179688, 0.0034656524658203125, 0.005227088928222656, 0.006988525390625, 0.008749961853027344, 0.010511398315429688, 0.012272834777832031, 0.014034271240234375, 0.01579570770263672, 0.017557144165039062, 0.019318580627441406, 0.02108001708984375, 0.022841453552246094, 0.024602890014648438, 0.02636432647705078, 0.028125762939453125, 0.02988719940185547, 0.03164863586425781, 0.033410072326660156, 0.0351715087890625, 0.036932945251464844, 0.03869438171386719, 0.04045581817626953, 0.042217254638671875, 0.04397869110107422, 0.04574012756347656, 0.047501564025878906, 0.04926300048828125, 0.051024436950683594, 0.05278587341308594, 0.05454730987548828, 0.056308746337890625, 0.05807018280029297, 0.05983161926269531, 0.061593055725097656, 0.0633544921875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 20.0, 85.0, 458.0, 376.0, 57.0, 11.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.944631814956665, -2.8104360103607178, -2.6762404441833496, -2.5420446395874023, -2.407849073410034, -2.273653268814087, -2.1394577026367188, -2.0052618980407715, -1.8710662126541138, -1.736870527267456, -1.6026748418807983, -1.4684791564941406, -1.3342833518981934, -1.2000877857208252, -1.065891981124878, -0.9316962957382202, -0.7975006103515625, -0.6633049249649048, -0.5291092395782471, -0.3949134945869446, -0.26071780920028687, -0.12652212381362915, 0.00767362117767334, 0.14186930656433105, 0.27606499195098877, 0.4102606773376465, 0.5444563627243042, 0.6786521077156067, 0.8128477931022644, 0.9470434784889221, 1.0812392234802246, 1.2154349088668823, 1.3496308326721191, 1.4838265180587769, 1.6180222034454346, 1.7522180080413818, 1.88641357421875, 2.0206093788146973, 2.1548051834106445, 2.2890007495880127, 2.423196315765381, 2.557392120361328, 2.6915876865386963, 2.8257834911346436, 2.9599790573120117, 3.094174861907959, 3.2283706665039062, 3.3625662326812744, 3.4967620372772217, 3.630957841873169, 3.765153408050537, 3.8993492126464844, 4.033545017242432, 4.167740345001221, 4.301936149597168, 4.436131954193115, 4.5703277587890625, 4.70452356338501, 4.838719367980957, 4.972914695739746, 5.107110500335693, 5.241306304931641, 5.375502109527588, 5.509697914123535, 5.643893241882324]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 0.0, 1.0, 8.0, 5.0, 14.0, 14.0, 24.0, 18.0, 25.0, 26.0, 47.0, 54.0, 43.0, 68.0, 56.0, 63.0, 65.0, 63.0, 60.0, 49.0, 51.0, 30.0, 38.0, 41.0, 35.0, 31.0, 26.0, 12.0, 16.0, 13.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9334578514099121, -0.9087934494018555, -0.8841290473937988, -0.8594646453857422, -0.8348002433776855, -0.8101358413696289, -0.7854714393615723, -0.7608070373535156, -0.736142635345459, -0.7114782333374023, -0.6868138313293457, -0.6621494293212891, -0.6374850273132324, -0.6128206253051758, -0.5881562232971191, -0.5634918212890625, -0.5388274192810059, -0.5141630172729492, -0.4894986152648926, -0.46483421325683594, -0.4401698112487793, -0.41550540924072266, -0.390841007232666, -0.3661766052246094, -0.3415122628211975, -0.31684786081314087, -0.29218345880508423, -0.2675190567970276, -0.24285465478897095, -0.2181902527809143, -0.19352586567401886, -0.16886146366596222, -0.14419704675674438, -0.11953264474868774, -0.0948682427406311, -0.07020384818315506, -0.04553944617509842, -0.02087504416704178, 0.003789350390434265, 0.028453752398490906, 0.053118154406547546, 0.07778255641460419, 0.10244695842266083, 0.12711134552955627, 0.15177574753761292, 0.17644014954566956, 0.2011045515537262, 0.22576895356178284, 0.2504333555698395, 0.2750977575778961, 0.29976215958595276, 0.3244265615940094, 0.34909096360206604, 0.3737553656101227, 0.39841973781585693, 0.4230841398239136, 0.4477485418319702, 0.47241294384002686, 0.4970773458480835, 0.5217417478561401, 0.5464061498641968, 0.5710705518722534, 0.5957349538803101, 0.6203993558883667, 0.6450637578964233]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 10.0, 25.0, 37.0, 91.0, 240.0, 1241.0, 4187118.0, 4824.0, 430.0, 136.0, 54.0, 32.0, 13.0, 4.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31298828125, -0.3044624328613281, -0.29593658447265625, -0.2874107360839844, -0.2788848876953125, -0.2703590393066406, -0.26183319091796875, -0.2533073425292969, -0.244781494140625, -0.23625564575195312, -0.22772979736328125, -0.21920394897460938, -0.2106781005859375, -0.20215225219726562, -0.19362640380859375, -0.18510055541992188, -0.17657470703125, -0.16804885864257812, -0.15952301025390625, -0.15099716186523438, -0.1424713134765625, -0.13394546508789062, -0.12541961669921875, -0.11689376831054688, -0.108367919921875, -0.09984207153320312, -0.09131622314453125, -0.08279037475585938, -0.0742645263671875, -0.06573867797851562, -0.05721282958984375, -0.048686981201171875, -0.0401611328125, -0.031635284423828125, -0.02310943603515625, -0.014583587646484375, -0.0060577392578125, 0.002468109130859375, 0.01099395751953125, 0.019519805908203125, 0.028045654296875, 0.036571502685546875, 0.04509735107421875, 0.053623199462890625, 0.0621490478515625, 0.07067489624023438, 0.07920074462890625, 0.08772659301757812, 0.09625244140625, 0.10477828979492188, 0.11330413818359375, 0.12182998657226562, 0.1303558349609375, 0.13888168334960938, 0.14740753173828125, 0.15593338012695312, 0.164459228515625, 0.17298507690429688, 0.18151092529296875, 0.19003677368164062, 0.1985626220703125, 0.20708847045898438, 0.21561431884765625, 0.22414016723632812, 0.232666015625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 9.0, 26.0, 52.0, 96.0, 139.0, 181.0, 189.0, 148.0, 80.0, 40.0, 20.0, 4.0, 7.0, 1.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.13330078125, -0.13012409210205078, -0.12694740295410156, -0.12377071380615234, -0.12059402465820312, -0.1174173355102539, -0.11424064636230469, -0.11106395721435547, -0.10788726806640625, -0.10471057891845703, -0.10153388977050781, -0.0983572006225586, -0.09518051147460938, -0.09200382232666016, -0.08882713317871094, -0.08565044403076172, -0.0824737548828125, -0.07929706573486328, -0.07612037658691406, -0.07294368743896484, -0.06976699829101562, -0.0665903091430664, -0.06341361999511719, -0.06023693084716797, -0.05706024169921875, -0.05388355255126953, -0.05070686340332031, -0.047530174255371094, -0.044353485107421875, -0.041176795959472656, -0.03800010681152344, -0.03482341766357422, -0.031646728515625, -0.02847003936767578, -0.025293350219726562, -0.022116661071777344, -0.018939971923828125, -0.015763282775878906, -0.012586593627929688, -0.009409904479980469, -0.00623321533203125, -0.0030565261840820312, 0.0001201629638671875, 0.0032968521118164062, 0.006473541259765625, 0.009650230407714844, 0.012826919555664062, 0.01600360870361328, 0.0191802978515625, 0.02235698699951172, 0.025533676147460938, 0.028710365295410156, 0.031887054443359375, 0.035063743591308594, 0.03824043273925781, 0.04141712188720703, 0.04459381103515625, 0.04777050018310547, 0.05094718933105469, 0.054123878479003906, 0.057300567626953125, 0.060477256774902344, 0.06365394592285156, 0.06683063507080078, 0.07000732421875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 7.0, 10.0, 24.0, 41.0, 56.0, 75.0, 138.0, 146.0, 252.0, 398.0, 619.0, 1035.0, 2011.0, 5499.0, 4108306.0, 66890.0, 4358.0, 1806.0, 976.0, 564.0, 350.0, 224.0, 167.0, 106.0, 68.0, 58.0, 37.0, 20.0, 12.0, 10.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0875244140625, -0.08478260040283203, -0.08204078674316406, -0.0792989730834961, -0.07655715942382812, -0.07381534576416016, -0.07107353210449219, -0.06833171844482422, -0.06558990478515625, -0.06284809112548828, -0.06010627746582031, -0.057364463806152344, -0.054622650146484375, -0.051880836486816406, -0.04913902282714844, -0.04639720916748047, -0.0436553955078125, -0.04091358184814453, -0.03817176818847656, -0.035429954528808594, -0.032688140869140625, -0.029946327209472656, -0.027204513549804688, -0.02446269989013672, -0.02172088623046875, -0.01897907257080078, -0.016237258911132812, -0.013495445251464844, -0.010753631591796875, -0.008011817932128906, -0.0052700042724609375, -0.0025281906127929688, 0.000213623046875, 0.0029554367065429688, 0.0056972503662109375, 0.008439064025878906, 0.011180877685546875, 0.013922691345214844, 0.016664505004882812, 0.01940631866455078, 0.02214813232421875, 0.02488994598388672, 0.027631759643554688, 0.030373573303222656, 0.033115386962890625, 0.035857200622558594, 0.03859901428222656, 0.04134082794189453, 0.0440826416015625, 0.04682445526123047, 0.04956626892089844, 0.052308082580566406, 0.055049896240234375, 0.057791709899902344, 0.06053352355957031, 0.06327533721923828, 0.06601715087890625, 0.06875896453857422, 0.07150077819824219, 0.07424259185791016, 0.07698440551757812, 0.0797262191772461, 0.08246803283691406, 0.08520984649658203, 0.08795166015625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 9.0, 3.0, 24.0, 3916.0, 75.0, 26.0, 8.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0124969482421875, -0.012076258659362793, -0.011655569076538086, -0.011234879493713379, -0.010814189910888672, -0.010393500328063965, -0.009972810745239258, -0.00955212116241455, -0.009131431579589844, -0.008710741996765137, -0.00829005241394043, -0.007869362831115723, -0.007448673248291016, -0.007027983665466309, -0.0066072940826416016, -0.0061866044998168945, -0.0057659149169921875, -0.0053452253341674805, -0.0049245357513427734, -0.004503846168518066, -0.004083156585693359, -0.0036624670028686523, -0.0032417774200439453, -0.0028210878372192383, -0.0024003982543945312, -0.0019797086715698242, -0.0015590190887451172, -0.0011383295059204102, -0.0007176399230957031, -0.0002969503402709961, 0.00012373924255371094, 0.000544428825378418, 0.000965118408203125, 0.001385807991027832, 0.001806497573852539, 0.002227187156677246, 0.002647876739501953, 0.00306856632232666, 0.003489255905151367, 0.003909945487976074, 0.004330635070800781, 0.004751324653625488, 0.005172014236450195, 0.005592703819274902, 0.006013393402099609, 0.006434082984924316, 0.0068547725677490234, 0.0072754621505737305, 0.0076961517333984375, 0.008116841316223145, 0.008537530899047852, 0.008958220481872559, 0.009378910064697266, 0.009799599647521973, 0.01022028923034668, 0.010640978813171387, 0.011061668395996094, 0.0114823579788208, 0.011903047561645508, 0.012323737144470215, 0.012744426727294922, 0.013165116310119629, 0.013585805892944336, 0.014006495475769043, 0.01442718505859375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 26.0, 58.0, 257.0, 443.0, 166.0, 40.0, 16.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02175716683268547, -0.018298236653208733, -0.014839304611086845, -0.011380374431610107, -0.007921443320810795, -0.004462512210011482, -0.0010035820305347443, 0.002455350011587143, 0.005914280191063881, 0.009373211301863194, 0.012832142412662506, 0.016291072592139244, 0.019750002771615982, 0.02320893481373787, 0.026667864993214607, 0.030126797035336494, 0.03358572721481323, 0.03704465925693512, 0.04050358757376671, 0.043962519615888596, 0.04742145165801048, 0.05088037997484207, 0.05433931201696396, 0.057798244059085846, 0.06125717610120773, 0.06471610814332962, 0.06817504018545151, 0.0716339647769928, 0.07509289681911469, 0.07855182886123657, 0.08201076090335846, 0.08546969294548035, 0.08892861753702164, 0.09238754957914352, 0.09584648162126541, 0.0993054062128067, 0.10276433825492859, 0.10622327029705048, 0.10968220233917236, 0.11314113438129425, 0.11660006642341614, 0.12005899846553802, 0.12351793050765991, 0.1269768625497818, 0.1304357945919037, 0.13389472663402557, 0.13735365867614746, 0.14081257581710815, 0.14427150785923004, 0.14773043990135193, 0.15118937194347382, 0.1546483039855957, 0.1581072360277176, 0.16156616806983948, 0.16502508521080017, 0.16848403215408325, 0.17194296419620514, 0.17540189623832703, 0.1788608282804489, 0.1823197603225708, 0.1857786923646927, 0.18923762440681458, 0.19269654154777527, 0.19615548849105835, 0.19961440563201904]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 9.0, 9.0, 12.0, 13.0, 22.0, 27.0, 29.0, 34.0, 38.0, 48.0, 43.0, 51.0, 51.0, 49.0, 64.0, 63.0, 49.0, 52.0, 54.0, 50.0, 38.0, 40.0, 38.0, 22.0, 27.0, 15.0, 17.0, 9.0, 7.0, 11.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02491670846939087, -0.02418903261423111, -0.0234613586217165, -0.02273368462920189, -0.02200600877404213, -0.02127833291888237, -0.02055065892636776, -0.01982298493385315, -0.01909530907869339, -0.01836763322353363, -0.01763995923101902, -0.01691228523850441, -0.01618460938334465, -0.015456934459507465, -0.01472925953567028, -0.014001584611833096, -0.01327390968799591, -0.012546234764158726, -0.01181855984032154, -0.011090884916484356, -0.010363209992647171, -0.009635535068809986, -0.008907860144972801, -0.008180185221135616, -0.007452510297298431, -0.0067248353734612465, -0.005997160449624062, -0.005269485525786877, -0.004541810601949692, -0.003814135678112507, -0.003086460754275322, -0.002358785830438137, -0.0016311109066009521, -0.0009034359827637672, -0.00017576105892658234, 0.0005519138649106026, 0.0012795887887477875, 0.0020072637125849724, 0.0027349386364221573, 0.003462613560259342, 0.004190288484096527, 0.004917963407933712, 0.005645638331770897, 0.006373313255608082, 0.007100988179445267, 0.007828663103282452, 0.008556338027119637, 0.009284012950956821, 0.010011687874794006, 0.010739362798631191, 0.011467037722468376, 0.012194712646305561, 0.012922387570142746, 0.013650062493979931, 0.014377737417817116, 0.0151054123416543, 0.015833087265491486, 0.016560763120651245, 0.017288437113165855, 0.018016111105680466, 0.018743786960840225, 0.019471462815999985, 0.020199136808514595, 0.020926810801029205, 0.021654486656188965]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 3.0, 10.0, 7.0, 13.0, 17.0, 28.0, 32.0, 50.0, 65.0, 113.0, 148.0, 206.0, 302.0, 588.0, 997.0, 1857.0, 4633.0, 22341.0, 304704.0, 654459.0, 45824.0, 6796.0, 2400.0, 1140.0, 627.0, 353.0, 259.0, 173.0, 102.0, 84.0, 61.0, 41.0, 28.0, 27.0, 25.0, 10.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.331787109375, -0.32234954833984375, -0.3129119873046875, -0.30347442626953125, -0.294036865234375, -0.28459930419921875, -0.2751617431640625, -0.26572418212890625, -0.25628662109375, -0.24684906005859375, -0.2374114990234375, -0.22797393798828125, -0.218536376953125, -0.20909881591796875, -0.1996612548828125, -0.19022369384765625, -0.1807861328125, -0.17134857177734375, -0.1619110107421875, -0.15247344970703125, -0.143035888671875, -0.13359832763671875, -0.1241607666015625, -0.11472320556640625, -0.10528564453125, -0.09584808349609375, -0.0864105224609375, -0.07697296142578125, -0.067535400390625, -0.05809783935546875, -0.0486602783203125, -0.03922271728515625, -0.02978515625, -0.02034759521484375, -0.0109100341796875, -0.00147247314453125, 0.007965087890625, 0.01740264892578125, 0.0268402099609375, 0.03627777099609375, 0.04571533203125, 0.05515289306640625, 0.0645904541015625, 0.07402801513671875, 0.083465576171875, 0.09290313720703125, 0.1023406982421875, 0.11177825927734375, 0.1212158203125, 0.13065338134765625, 0.1400909423828125, 0.14952850341796875, 0.158966064453125, 0.16840362548828125, 0.1778411865234375, 0.18727874755859375, 0.19671630859375, 0.20615386962890625, 0.2155914306640625, 0.22502899169921875, 0.234466552734375, 0.24390411376953125, 0.2533416748046875, 0.26277923583984375, 0.272216796875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 9.0, 26.0, 56.0, 94.0, 140.0, 180.0, 192.0, 147.0, 80.0, 37.0, 19.0, 5.0, 6.0, 1.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.1300039291381836, -0.1268291473388672, -0.12365436553955078, -0.12047958374023438, -0.11730480194091797, -0.11413002014160156, -0.11095523834228516, -0.10778045654296875, -0.10460567474365234, -0.10143089294433594, -0.09825611114501953, -0.09508132934570312, -0.09190654754638672, -0.08873176574707031, -0.0855569839477539, -0.0823822021484375, -0.0792074203491211, -0.07603263854980469, -0.07285785675048828, -0.06968307495117188, -0.06650829315185547, -0.06333351135253906, -0.060158729553222656, -0.05698394775390625, -0.053809165954589844, -0.05063438415527344, -0.04745960235595703, -0.044284820556640625, -0.04111003875732422, -0.03793525695800781, -0.034760475158691406, -0.031585693359375, -0.028410911560058594, -0.025236129760742188, -0.02206134796142578, -0.018886566162109375, -0.01571178436279297, -0.012537002563476562, -0.009362220764160156, -0.00618743896484375, -0.0030126571655273438, 0.0001621246337890625, 0.0033369064331054688, 0.006511688232421875, 0.009686470031738281, 0.012861251831054688, 0.016036033630371094, 0.0192108154296875, 0.022385597229003906, 0.025560379028320312, 0.02873516082763672, 0.031909942626953125, 0.03508472442626953, 0.03825950622558594, 0.041434288024902344, 0.04460906982421875, 0.047783851623535156, 0.05095863342285156, 0.05413341522216797, 0.057308197021484375, 0.06048297882080078, 0.06365776062011719, 0.0668325424194336, 0.07000732421875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 7.0, 13.0, 7.0, 14.0, 19.0, 26.0, 34.0, 93.0, 120.0, 187.0, 341.0, 593.0, 1137.0, 2315.0, 4844.0, 11264.0, 27497.0, 73601.0, 218574.0, 436271.0, 172102.0, 59274.0, 22530.0, 9294.0, 4116.0, 1981.0, 1001.0, 553.0, 274.0, 161.0, 89.0, 59.0, 49.0, 32.0, 22.0, 15.0, 14.0, 4.0, 6.0, 3.0, 5.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07763671875, -0.0752401351928711, -0.07284355163574219, -0.07044696807861328, -0.06805038452148438, -0.06565380096435547, -0.06325721740722656, -0.060860633850097656, -0.05846405029296875, -0.056067466735839844, -0.05367088317871094, -0.05127429962158203, -0.048877716064453125, -0.04648113250732422, -0.04408454895019531, -0.041687965393066406, -0.0392913818359375, -0.036894798278808594, -0.03449821472167969, -0.03210163116455078, -0.029705047607421875, -0.02730846405029297, -0.024911880493164062, -0.022515296936035156, -0.02011871337890625, -0.017722129821777344, -0.015325546264648438, -0.012928962707519531, -0.010532379150390625, -0.008135795593261719, -0.0057392120361328125, -0.0033426284790039062, -0.000946044921875, 0.0014505386352539062, 0.0038471221923828125, 0.006243705749511719, 0.008640289306640625, 0.011036872863769531, 0.013433456420898438, 0.015830039978027344, 0.01822662353515625, 0.020623207092285156, 0.023019790649414062, 0.02541637420654297, 0.027812957763671875, 0.03020954132080078, 0.03260612487792969, 0.035002708435058594, 0.0373992919921875, 0.039795875549316406, 0.04219245910644531, 0.04458904266357422, 0.046985626220703125, 0.04938220977783203, 0.05177879333496094, 0.054175376892089844, 0.05657196044921875, 0.058968544006347656, 0.06136512756347656, 0.06376171112060547, 0.06615829467773438, 0.06855487823486328, 0.07095146179199219, 0.0733480453491211, 0.07574462890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 6.0, 12.0, 14.0, 17.0, 15.0, 22.0, 23.0, 30.0, 35.0, 41.0, 44.0, 60.0, 56.0, 40.0, 58.0, 66.0, 71.0, 45.0, 40.0, 54.0, 47.0, 33.0, 25.0, 21.0, 28.0, 20.0, 19.0, 18.0, 10.0, 13.0, 11.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09649658203125, -0.09310054779052734, -0.08970451354980469, -0.08630847930908203, -0.08291244506835938, -0.07951641082763672, -0.07612037658691406, -0.0727243423461914, -0.06932830810546875, -0.0659322738647461, -0.06253623962402344, -0.05914020538330078, -0.055744171142578125, -0.05234813690185547, -0.04895210266113281, -0.045556068420410156, -0.0421600341796875, -0.038763999938964844, -0.03536796569824219, -0.03197193145751953, -0.028575897216796875, -0.02517986297607422, -0.021783828735351562, -0.018387794494628906, -0.01499176025390625, -0.011595726013183594, -0.008199691772460938, -0.004803657531738281, -0.001407623291015625, 0.0019884109497070312, 0.0053844451904296875, 0.008780479431152344, 0.012176513671875, 0.015572547912597656, 0.018968582153320312, 0.02236461639404297, 0.025760650634765625, 0.02915668487548828, 0.03255271911621094, 0.035948753356933594, 0.03934478759765625, 0.042740821838378906, 0.04613685607910156, 0.04953289031982422, 0.052928924560546875, 0.05632495880126953, 0.05972099304199219, 0.06311702728271484, 0.0665130615234375, 0.06990909576416016, 0.07330513000488281, 0.07670116424560547, 0.08009719848632812, 0.08349323272705078, 0.08688926696777344, 0.0902853012084961, 0.09368133544921875, 0.0970773696899414, 0.10047340393066406, 0.10386943817138672, 0.10726547241210938, 0.11066150665283203, 0.11405754089355469, 0.11745357513427734, 0.120849609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 13.0, 12.0, 20.0, 29.0, 26.0, 44.0, 82.0, 133.0, 219.0, 331.0, 572.0, 1064.0, 2048.0, 4177.0, 10098.0, 27914.0, 107877.0, 633574.0, 194202.0, 41376.0, 13647.0, 5463.0, 2593.0, 1233.0, 694.0, 408.0, 253.0, 144.0, 101.0, 58.0, 31.0, 35.0, 20.0, 19.0, 8.0, 5.0, 8.0, 9.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033935546875, -0.03282880783081055, -0.031722068786621094, -0.03061532974243164, -0.029508590698242188, -0.028401851654052734, -0.02729511260986328, -0.026188373565673828, -0.025081634521484375, -0.023974895477294922, -0.02286815643310547, -0.021761417388916016, -0.020654678344726562, -0.01954793930053711, -0.018441200256347656, -0.017334461212158203, -0.01622772216796875, -0.015120983123779297, -0.014014244079589844, -0.01290750503540039, -0.011800765991210938, -0.010694026947021484, -0.009587287902832031, -0.008480548858642578, -0.007373809814453125, -0.006267070770263672, -0.005160331726074219, -0.004053592681884766, -0.0029468536376953125, -0.0018401145935058594, -0.0007333755493164062, 0.0003733634948730469, 0.0014801025390625, 0.002586841583251953, 0.0036935806274414062, 0.004800319671630859, 0.0059070587158203125, 0.007013797760009766, 0.008120536804199219, 0.009227275848388672, 0.010334014892578125, 0.011440753936767578, 0.012547492980957031, 0.013654232025146484, 0.014760971069335938, 0.01586771011352539, 0.016974449157714844, 0.018081188201904297, 0.01918792724609375, 0.020294666290283203, 0.021401405334472656, 0.02250814437866211, 0.023614883422851562, 0.024721622467041016, 0.02582836151123047, 0.026935100555419922, 0.028041839599609375, 0.029148578643798828, 0.03025531768798828, 0.031362056732177734, 0.03246879577636719, 0.03357553482055664, 0.034682273864746094, 0.03578901290893555, 0.036895751953125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 7.0, 13.0, 7.0, 11.0, 18.0, 23.0, 19.0, 23.0, 27.0, 33.0, 48.0, 57.0, 71.0, 107.0, 95.0, 78.0, 65.0, 55.0, 37.0, 35.0, 27.0, 25.0, 21.0, 18.0, 12.0, 10.0, 10.0, 8.0, 2.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.900331497192383e-05, -9.592156857252121e-05, -9.283982217311859e-05, -8.975807577371597e-05, -8.667632937431335e-05, -8.359458297491074e-05, -8.051283657550812e-05, -7.74310901761055e-05, -7.434934377670288e-05, -7.126759737730026e-05, -6.818585097789764e-05, -6.510410457849503e-05, -6.202235817909241e-05, -5.894061177968979e-05, -5.585886538028717e-05, -5.277711898088455e-05, -4.9695372581481934e-05, -4.6613626182079315e-05, -4.35318797826767e-05, -4.045013338327408e-05, -3.736838698387146e-05, -3.428664058446884e-05, -3.120489418506622e-05, -2.8123147785663605e-05, -2.5041401386260986e-05, -2.1959654986858368e-05, -1.887790858745575e-05, -1.579616218805313e-05, -1.2714415788650513e-05, -9.632669389247894e-06, -6.550922989845276e-06, -3.4691765904426575e-06, -3.8743019104003906e-07, 2.6943162083625793e-06, 5.776062607765198e-06, 8.857809007167816e-06, 1.1939555406570435e-05, 1.5021301805973053e-05, 1.810304820537567e-05, 2.118479460477829e-05, 2.4266541004180908e-05, 2.7348287403583527e-05, 3.0430033802986145e-05, 3.3511780202388763e-05, 3.659352660179138e-05, 3.9675273001194e-05, 4.275701940059662e-05, 4.583876579999924e-05, 4.8920512199401855e-05, 5.2002258598804474e-05, 5.508400499820709e-05, 5.816575139760971e-05, 6.124749779701233e-05, 6.432924419641495e-05, 6.741099059581757e-05, 7.049273699522018e-05, 7.35744833946228e-05, 7.665622979402542e-05, 7.973797619342804e-05, 8.281972259283066e-05, 8.590146899223328e-05, 8.89832153916359e-05, 9.206496179103851e-05, 9.514670819044113e-05, 9.822845458984375e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 0.0, 9.0, 10.0, 9.0, 15.0, 22.0, 24.0, 27.0, 55.0, 116.0, 150.0, 268.0, 472.0, 894.0, 1882.0, 4940.0, 15821.0, 76246.0, 677390.0, 224045.0, 31972.0, 8398.0, 2942.0, 1304.0, 638.0, 344.0, 186.0, 135.0, 76.0, 50.0, 29.0, 33.0, 10.0, 13.0, 9.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.04339599609375, -0.041886329650878906, -0.04037666320800781, -0.03886699676513672, -0.037357330322265625, -0.03584766387939453, -0.03433799743652344, -0.032828330993652344, -0.03131866455078125, -0.029808998107910156, -0.028299331665039062, -0.02678966522216797, -0.025279998779296875, -0.02377033233642578, -0.022260665893554688, -0.020750999450683594, -0.0192413330078125, -0.017731666564941406, -0.016222000122070312, -0.014712333679199219, -0.013202667236328125, -0.011693000793457031, -0.010183334350585938, -0.008673667907714844, -0.00716400146484375, -0.005654335021972656, -0.0041446685791015625, -0.0026350021362304688, -0.001125335693359375, 0.00038433074951171875, 0.0018939971923828125, 0.0034036636352539062, 0.004913330078125, 0.006422996520996094, 0.007932662963867188, 0.009442329406738281, 0.010951995849609375, 0.012461662292480469, 0.013971328735351562, 0.015480995178222656, 0.01699066162109375, 0.018500328063964844, 0.020009994506835938, 0.02151966094970703, 0.023029327392578125, 0.02453899383544922, 0.026048660278320312, 0.027558326721191406, 0.0290679931640625, 0.030577659606933594, 0.03208732604980469, 0.03359699249267578, 0.035106658935546875, 0.03661632537841797, 0.03812599182128906, 0.039635658264160156, 0.04114532470703125, 0.042654991149902344, 0.04416465759277344, 0.04567432403564453, 0.047183990478515625, 0.04869365692138672, 0.05020332336425781, 0.051712989807128906, 0.05322265625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 16.0, 14.0, 24.0, 22.0, 49.0, 61.0, 116.0, 145.0, 165.0, 113.0, 97.0, 57.0, 34.0, 26.0, 20.0, 20.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0657958984375, -0.0636281967163086, -0.06146049499511719, -0.05929279327392578, -0.057125091552734375, -0.05495738983154297, -0.05278968811035156, -0.050621986389160156, -0.04845428466796875, -0.046286582946777344, -0.04411888122558594, -0.04195117950439453, -0.039783477783203125, -0.03761577606201172, -0.03544807434082031, -0.033280372619628906, -0.0311126708984375, -0.028944969177246094, -0.026777267456054688, -0.02460956573486328, -0.022441864013671875, -0.02027416229248047, -0.018106460571289062, -0.015938758850097656, -0.01377105712890625, -0.011603355407714844, -0.009435653686523438, -0.007267951965332031, -0.005100250244140625, -0.0029325485229492188, -0.0007648468017578125, 0.0014028549194335938, 0.003570556640625, 0.005738258361816406, 0.007905960083007812, 0.010073661804199219, 0.012241363525390625, 0.014409065246582031, 0.016576766967773438, 0.018744468688964844, 0.02091217041015625, 0.023079872131347656, 0.025247573852539062, 0.02741527557373047, 0.029582977294921875, 0.03175067901611328, 0.03391838073730469, 0.036086082458496094, 0.0382537841796875, 0.040421485900878906, 0.04258918762207031, 0.04475688934326172, 0.046924591064453125, 0.04909229278564453, 0.05125999450683594, 0.053427696228027344, 0.05559539794921875, 0.057763099670410156, 0.05993080139160156, 0.06209850311279297, 0.06426620483398438, 0.06643390655517578, 0.06860160827636719, 0.0707693099975586, 0.07293701171875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 22.0, 88.0, 256.0, 395.0, 180.0, 48.0, 19.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.401869535446167, -2.335577964782715, -2.2692861557006836, -2.2029945850372314, -2.1367027759552, -2.070411205291748, -2.004119396209717, -1.9378278255462646, -1.871536135673523, -1.8052444458007812, -1.7389527559280396, -1.6726610660552979, -1.6063694953918457, -1.5400776863098145, -1.4737861156463623, -1.4074944257736206, -1.341202735900879, -1.2749110460281372, -1.2086193561553955, -1.1423276662826538, -1.076035976409912, -1.00974440574646, -0.9434527158737183, -0.8771610260009766, -0.8108693361282349, -0.7445776462554932, -0.6782859563827515, -0.6119943261146545, -0.5457026362419128, -0.47941094636917114, -0.41311928629875183, -0.3468276262283325, -0.2805356979370117, -0.2142440229654312, -0.1479523479938507, -0.0816606730222702, -0.015368998050689697, 0.050922691822052, 0.11721435189247131, 0.18350601196289062, 0.24979770183563232, 0.316089391708374, 0.38238105177879333, 0.44867271184921265, 0.5149644017219543, 0.581256091594696, 0.647547721862793, 0.7138394117355347, 0.7801311016082764, 0.8464227914810181, 0.9127144813537598, 0.9790061116218567, 1.0452978610992432, 1.1115894317626953, 1.177881121635437, 1.2441728115081787, 1.3104645013809204, 1.376756191253662, 1.4430478811264038, 1.5093395709991455, 1.5756311416625977, 1.641922950744629, 1.708214521408081, 1.7745062112808228, 1.8407979011535645]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 10.0, 4.0, 2.0, 9.0, 14.0, 13.0, 12.0, 8.0, 19.0, 17.0, 24.0, 23.0, 32.0, 30.0, 28.0, 46.0, 39.0, 40.0, 49.0, 49.0, 49.0, 41.0, 45.0, 35.0, 31.0, 42.0, 37.0, 36.0, 30.0, 21.0, 17.0, 22.0, 17.0, 27.0, 12.0, 12.0, 8.0, 13.0, 7.0, 5.0, 1.0, 5.0, 3.0, 6.0, 2.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.4238309860229492, -0.41121748089790344, -0.39860397577285767, -0.3859904408454895, -0.3733769357204437, -0.36076343059539795, -0.3481499254703522, -0.3355364203453064, -0.32292288541793823, -0.31030938029289246, -0.2976958751678467, -0.2850823402404785, -0.27246883511543274, -0.25985532999038696, -0.2472418248653412, -0.2346283197402954, -0.22201481461524963, -0.20940130949020386, -0.1967877894639969, -0.1841742843389511, -0.17156076431274414, -0.15894725918769836, -0.1463337540626526, -0.1337202489376068, -0.12110672891139984, -0.10849321633577347, -0.0958797037601471, -0.08326619863510132, -0.07065268605947495, -0.05803917348384857, -0.045425668358802795, -0.03281215578317642, -0.02019864320755005, -0.007585132494568825, 0.005028378218412399, 0.017641887068748474, 0.030255399644374847, 0.04286891222000122, 0.055482417345047, 0.06809592992067337, 0.08070944249629974, 0.09332295507192612, 0.10593646764755249, 0.11854997277259827, 0.13116347789764404, 0.143776997923851, 0.1563905030488968, 0.16900402307510376, 0.18161752820014954, 0.1942310333251953, 0.20684455335140228, 0.21945805847644806, 0.23207157850265503, 0.2446850836277008, 0.2572985887527466, 0.26991209387779236, 0.28252559900283813, 0.2951391041278839, 0.3077526092529297, 0.32036614418029785, 0.33297964930534363, 0.3455931544303894, 0.3582066595554352, 0.37082016468048096, 0.3834336996078491]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 6.0, 4.0, 10.0, 11.0, 10.0, 23.0, 39.0, 99.0, 329.0, 1275.0, 15065.0, 4174600.0, 2034.0, 428.0, 159.0, 68.0, 39.0, 20.0, 22.0, 10.0, 6.0, 7.0, 7.0, 0.0, 1.0, 2.0, 2.0, 3.0], "bins": [-0.33203125, -0.32498645782470703, -0.31794166564941406, -0.3108968734741211, -0.3038520812988281, -0.29680728912353516, -0.2897624969482422, -0.2827177047729492, -0.27567291259765625, -0.2686281204223633, -0.2615833282470703, -0.25453853607177734, -0.24749374389648438, -0.2404489517211914, -0.23340415954589844, -0.22635936737060547, -0.2193145751953125, -0.21226978302001953, -0.20522499084472656, -0.1981801986694336, -0.19113540649414062, -0.18409061431884766, -0.1770458221435547, -0.17000102996826172, -0.16295623779296875, -0.15591144561767578, -0.1488666534423828, -0.14182186126708984, -0.13477706909179688, -0.1277322769165039, -0.12068748474121094, -0.11364269256591797, -0.106597900390625, -0.09955310821533203, -0.09250831604003906, -0.0854635238647461, -0.07841873168945312, -0.07137393951416016, -0.06432914733886719, -0.05728435516357422, -0.05023956298828125, -0.04319477081298828, -0.03614997863769531, -0.029105186462402344, -0.022060394287109375, -0.015015602111816406, -0.007970809936523438, -0.0009260177612304688, 0.0061187744140625, 0.013163566589355469, 0.020208358764648438, 0.027253150939941406, 0.034297943115234375, 0.041342735290527344, 0.04838752746582031, 0.05543231964111328, 0.06247711181640625, 0.06952190399169922, 0.07656669616699219, 0.08361148834228516, 0.09065628051757812, 0.0977010726928711, 0.10474586486816406, 0.11179065704345703, 0.11883544921875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 27.0, 57.0, 82.0, 139.0, 190.0, 194.0, 147.0, 81.0, 39.0, 17.0, 4.0, 7.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1331787109375, -0.1300048828125, -0.1268310546875, -0.1236572265625, -0.1204833984375, -0.1173095703125, -0.1141357421875, -0.1109619140625, -0.1077880859375, -0.1046142578125, -0.1014404296875, -0.0982666015625, -0.0950927734375, -0.0919189453125, -0.0887451171875, -0.0855712890625, -0.0823974609375, -0.0792236328125, -0.0760498046875, -0.0728759765625, -0.0697021484375, -0.0665283203125, -0.0633544921875, -0.0601806640625, -0.0570068359375, -0.0538330078125, -0.0506591796875, -0.0474853515625, -0.0443115234375, -0.0411376953125, -0.0379638671875, -0.0347900390625, -0.0316162109375, -0.0284423828125, -0.0252685546875, -0.0220947265625, -0.0189208984375, -0.0157470703125, -0.0125732421875, -0.0093994140625, -0.0062255859375, -0.0030517578125, 0.0001220703125, 0.0032958984375, 0.0064697265625, 0.0096435546875, 0.0128173828125, 0.0159912109375, 0.0191650390625, 0.0223388671875, 0.0255126953125, 0.0286865234375, 0.0318603515625, 0.0350341796875, 0.0382080078125, 0.0413818359375, 0.0445556640625, 0.0477294921875, 0.0509033203125, 0.0540771484375, 0.0572509765625, 0.0604248046875, 0.0635986328125, 0.0667724609375, 0.0699462890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 3.0, 6.0, 19.0, 30.0, 35.0, 53.0, 91.0, 161.0, 289.0, 550.0, 1239.0, 3549.0, 23424.0, 4152883.0, 8103.0, 2055.0, 861.0, 423.0, 208.0, 118.0, 67.0, 37.0, 31.0, 15.0, 9.0, 8.0, 6.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0689697265625, -0.06612873077392578, -0.06328773498535156, -0.060446739196777344, -0.057605743408203125, -0.054764747619628906, -0.05192375183105469, -0.04908275604248047, -0.04624176025390625, -0.04340076446533203, -0.04055976867675781, -0.037718772888183594, -0.034877777099609375, -0.032036781311035156, -0.029195785522460938, -0.02635478973388672, -0.0235137939453125, -0.02067279815673828, -0.017831802368164062, -0.014990806579589844, -0.012149810791015625, -0.009308815002441406, -0.0064678192138671875, -0.0036268234252929688, -0.00078582763671875, 0.0020551681518554688, 0.0048961639404296875, 0.007737159729003906, 0.010578155517578125, 0.013419151306152344, 0.016260147094726562, 0.01910114288330078, 0.021942138671875, 0.02478313446044922, 0.027624130249023438, 0.030465126037597656, 0.033306121826171875, 0.036147117614746094, 0.03898811340332031, 0.04182910919189453, 0.04467010498046875, 0.04751110076904297, 0.05035209655761719, 0.053193092346191406, 0.056034088134765625, 0.058875083923339844, 0.06171607971191406, 0.06455707550048828, 0.0673980712890625, 0.07023906707763672, 0.07308006286621094, 0.07592105865478516, 0.07876205444335938, 0.0816030502319336, 0.08444404602050781, 0.08728504180908203, 0.09012603759765625, 0.09296703338623047, 0.09580802917480469, 0.0986490249633789, 0.10149002075195312, 0.10433101654052734, 0.10717201232910156, 0.11001300811767578, 0.11285400390625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 7.0, 26.0, 3884.0, 94.0, 23.0, 8.0, 6.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01016998291015625, -0.009775638580322266, -0.009381294250488281, -0.008986949920654297, -0.008592605590820312, -0.008198261260986328, -0.007803916931152344, -0.007409572601318359, -0.007015228271484375, -0.006620883941650391, -0.006226539611816406, -0.005832195281982422, -0.0054378509521484375, -0.005043506622314453, -0.004649162292480469, -0.004254817962646484, -0.0038604736328125, -0.0034661293029785156, -0.0030717849731445312, -0.002677440643310547, -0.0022830963134765625, -0.0018887519836425781, -0.0014944076538085938, -0.0011000633239746094, -0.000705718994140625, -0.0003113746643066406, 8.296966552734375e-05, 0.0004773139953613281, 0.0008716583251953125, 0.0012660026550292969, 0.0016603469848632812, 0.0020546913146972656, 0.00244903564453125, 0.0028433799743652344, 0.0032377243041992188, 0.003632068634033203, 0.0040264129638671875, 0.004420757293701172, 0.004815101623535156, 0.005209445953369141, 0.005603790283203125, 0.005998134613037109, 0.006392478942871094, 0.006786823272705078, 0.0071811676025390625, 0.007575511932373047, 0.007969856262207031, 0.008364200592041016, 0.008758544921875, 0.009152889251708984, 0.009547233581542969, 0.009941577911376953, 0.010335922241210938, 0.010730266571044922, 0.011124610900878906, 0.01151895523071289, 0.011913299560546875, 0.01230764389038086, 0.012701988220214844, 0.013096332550048828, 0.013490676879882812, 0.013885021209716797, 0.014279365539550781, 0.014673709869384766, 0.01506805419921875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 10.0, 14.0, 63.0, 194.0, 339.0, 228.0, 100.0, 41.0, 15.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03993437439203262, -0.03752191364765167, -0.03510945290327072, -0.03269699215888977, -0.03028452955186367, -0.02787206880748272, -0.02545960620045662, -0.02304714545607567, -0.020634684711694717, -0.018222223967313766, -0.015809763222932816, -0.013397300615906715, -0.010984839871525764, -0.008572379127144814, -0.006159917451441288, -0.0037474557757377625, -0.0013349950313568115, 0.0010774661786854267, 0.003489927388727665, 0.005902388598769903, 0.008314849808812141, 0.010727310553193092, 0.013139772228896618, 0.015552233904600143, 0.017964694648981094, 0.020377155393362045, 0.022789616137742996, 0.025202078744769096, 0.027614539489150047, 0.030027000233530998, 0.0324394628405571, 0.03485192358493805, 0.0372643768787384, 0.039676837623119354, 0.042089298367500305, 0.044501759111881256, 0.04691421985626221, 0.04932668060064316, 0.05173914507031441, 0.05415160581469536, 0.05656406655907631, 0.05897652730345726, 0.06138898804783821, 0.06380145251750946, 0.06621391326189041, 0.06862637400627136, 0.07103883475065231, 0.07345129549503326, 0.07586375623941422, 0.07827621698379517, 0.08068867772817612, 0.08310113847255707, 0.08551359921693802, 0.08792605996131897, 0.09033852070569992, 0.09275098145008087, 0.09516344964504242, 0.09757591038942337, 0.09998837113380432, 0.10240083187818527, 0.10481329262256622, 0.10722575336694717, 0.10963821411132812, 0.11205068230628967, 0.11446313560009003]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 11.0, 10.0, 2.0, 10.0, 13.0, 15.0, 14.0, 30.0, 29.0, 22.0, 32.0, 32.0, 33.0, 40.0, 45.0, 47.0, 46.0, 50.0, 52.0, 42.0, 37.0, 51.0, 53.0, 46.0, 30.0, 37.0, 24.0, 29.0, 30.0, 17.0, 11.0, 6.0, 13.0, 12.0, 8.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016213417053222656, -0.015672829002141953, -0.015132240951061249, -0.014591652899980545, -0.014051064848899841, -0.013510476797819138, -0.012969888746738434, -0.01242930069565773, -0.011888712644577026, -0.011348124593496323, -0.010807536542415619, -0.010266948491334915, -0.009726360440254211, -0.009185772389173508, -0.008645184338092804, -0.0081045962870121, -0.0075640082359313965, -0.007023420184850693, -0.006482832133769989, -0.005942244082689285, -0.0054016560316085815, -0.004861067980527878, -0.004320479929447174, -0.0037798918783664703, -0.0032393038272857666, -0.002698715776205063, -0.002158127725124359, -0.0016175396740436554, -0.0010769516229629517, -0.0005363635718822479, 4.2244791984558105e-06, 0.0005448125302791595, 0.0010854005813598633, 0.001625988632440567, 0.0021665766835212708, 0.0027071647346019745, 0.0032477527856826782, 0.003788340836763382, 0.004328928887844086, 0.004869516938924789, 0.005410104990005493, 0.005950693041086197, 0.006491281092166901, 0.007031869143247604, 0.007572457194328308, 0.008113045245409012, 0.008653633296489716, 0.00919422134757042, 0.009734809398651123, 0.010275397449731827, 0.01081598550081253, 0.011356573551893234, 0.011897161602973938, 0.012437749654054642, 0.012978337705135345, 0.01351892575621605, 0.014059513807296753, 0.014600101858377457, 0.01514068990945816, 0.015681277960538864, 0.016221866011619568, 0.01676245406270027, 0.017303042113780975, 0.01784363016486168, 0.018384218215942383]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 5.0, 8.0, 8.0, 17.0, 22.0, 35.0, 34.0, 47.0, 77.0, 89.0, 151.0, 208.0, 356.0, 464.0, 819.0, 1384.0, 2993.0, 9317.0, 65309.0, 690845.0, 243884.0, 22798.0, 4915.0, 1841.0, 1016.0, 612.0, 369.0, 297.0, 170.0, 106.0, 94.0, 62.0, 42.0, 44.0, 21.0, 23.0, 13.0, 13.0, 12.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2578125, -0.2499408721923828, -0.24206924438476562, -0.23419761657714844, -0.22632598876953125, -0.21845436096191406, -0.21058273315429688, -0.2027111053466797, -0.1948394775390625, -0.1869678497314453, -0.17909622192382812, -0.17122459411621094, -0.16335296630859375, -0.15548133850097656, -0.14760971069335938, -0.1397380828857422, -0.131866455078125, -0.12399482727050781, -0.11612319946289062, -0.10825157165527344, -0.10037994384765625, -0.09250831604003906, -0.08463668823242188, -0.07676506042480469, -0.0688934326171875, -0.06102180480957031, -0.053150177001953125, -0.04527854919433594, -0.03740692138671875, -0.029535293579101562, -0.021663665771484375, -0.013792037963867188, -0.00592041015625, 0.0019512176513671875, 0.009822845458984375, 0.017694473266601562, 0.02556610107421875, 0.03343772888183594, 0.041309356689453125, 0.04918098449707031, 0.0570526123046875, 0.06492424011230469, 0.07279586791992188, 0.08066749572753906, 0.08853912353515625, 0.09641075134277344, 0.10428237915039062, 0.11215400695800781, 0.120025634765625, 0.1278972625732422, 0.13576889038085938, 0.14364051818847656, 0.15151214599609375, 0.15938377380371094, 0.16725540161132812, 0.1751270294189453, 0.1829986572265625, 0.1908702850341797, 0.19874191284179688, 0.20661354064941406, 0.21448516845703125, 0.22235679626464844, 0.23022842407226562, 0.2381000518798828, 0.2459716796875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 27.0, 53.0, 81.0, 147.0, 187.0, 193.0, 146.0, 82.0, 41.0, 18.0, 3.0, 7.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.13330078125, -0.1301250457763672, -0.12694931030273438, -0.12377357482910156, -0.12059783935546875, -0.11742210388183594, -0.11424636840820312, -0.11107063293457031, -0.1078948974609375, -0.10471916198730469, -0.10154342651367188, -0.09836769104003906, -0.09519195556640625, -0.09201622009277344, -0.08884048461914062, -0.08566474914550781, -0.082489013671875, -0.07931327819824219, -0.07613754272460938, -0.07296180725097656, -0.06978607177734375, -0.06661033630371094, -0.06343460083007812, -0.06025886535644531, -0.0570831298828125, -0.05390739440917969, -0.050731658935546875, -0.04755592346191406, -0.04438018798828125, -0.04120445251464844, -0.038028717041015625, -0.03485298156738281, -0.03167724609375, -0.028501510620117188, -0.025325775146484375, -0.022150039672851562, -0.01897430419921875, -0.015798568725585938, -0.012622833251953125, -0.009447097778320312, -0.0062713623046875, -0.0030956268310546875, 8.0108642578125e-05, 0.0032558441162109375, 0.00643157958984375, 0.009607315063476562, 0.012783050537109375, 0.015958786010742188, 0.019134521484375, 0.022310256958007812, 0.025485992431640625, 0.028661727905273438, 0.03183746337890625, 0.03501319885253906, 0.038188934326171875, 0.04136466979980469, 0.0445404052734375, 0.04771614074707031, 0.050891876220703125, 0.05406761169433594, 0.05724334716796875, 0.06041908264160156, 0.06359481811523438, 0.06677055358886719, 0.0699462890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 4.0, 8.0, 11.0, 11.0, 20.0, 24.0, 35.0, 76.0, 97.0, 163.0, 235.0, 545.0, 1001.0, 1994.0, 4376.0, 10111.0, 25770.0, 76556.0, 263829.0, 451640.0, 139634.0, 43916.0, 15865.0, 6614.0, 2870.0, 1407.0, 754.0, 386.0, 236.0, 118.0, 81.0, 45.0, 36.0, 25.0, 17.0, 9.0, 6.0, 7.0, 10.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0762939453125, -0.0738525390625, -0.0714111328125, -0.0689697265625, -0.0665283203125, -0.0640869140625, -0.0616455078125, -0.0592041015625, -0.0567626953125, -0.0543212890625, -0.0518798828125, -0.0494384765625, -0.0469970703125, -0.0445556640625, -0.0421142578125, -0.0396728515625, -0.0372314453125, -0.0347900390625, -0.0323486328125, -0.0299072265625, -0.0274658203125, -0.0250244140625, -0.0225830078125, -0.0201416015625, -0.0177001953125, -0.0152587890625, -0.0128173828125, -0.0103759765625, -0.0079345703125, -0.0054931640625, -0.0030517578125, -0.0006103515625, 0.0018310546875, 0.0042724609375, 0.0067138671875, 0.0091552734375, 0.0115966796875, 0.0140380859375, 0.0164794921875, 0.0189208984375, 0.0213623046875, 0.0238037109375, 0.0262451171875, 0.0286865234375, 0.0311279296875, 0.0335693359375, 0.0360107421875, 0.0384521484375, 0.0408935546875, 0.0433349609375, 0.0457763671875, 0.0482177734375, 0.0506591796875, 0.0531005859375, 0.0555419921875, 0.0579833984375, 0.0604248046875, 0.0628662109375, 0.0653076171875, 0.0677490234375, 0.0701904296875, 0.0726318359375, 0.0750732421875, 0.0775146484375, 0.0799560546875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 6.0, 7.0, 12.0, 13.0, 17.0, 4.0, 23.0, 25.0, 30.0, 39.0, 33.0, 37.0, 53.0, 50.0, 63.0, 52.0, 55.0, 57.0, 51.0, 37.0, 42.0, 49.0, 40.0, 29.0, 37.0, 27.0, 21.0, 26.0, 17.0, 10.0, 12.0, 13.0, 8.0, 1.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.081298828125, -0.07800865173339844, -0.07471847534179688, -0.07142829895019531, -0.06813812255859375, -0.06484794616699219, -0.061557769775390625, -0.05826759338378906, -0.0549774169921875, -0.05168724060058594, -0.048397064208984375, -0.04510688781738281, -0.04181671142578125, -0.03852653503417969, -0.035236358642578125, -0.03194618225097656, -0.028656005859375, -0.025365829467773438, -0.022075653076171875, -0.018785476684570312, -0.01549530029296875, -0.012205123901367188, -0.008914947509765625, -0.0056247711181640625, -0.0023345947265625, 0.0009555816650390625, 0.004245758056640625, 0.0075359344482421875, 0.01082611083984375, 0.014116287231445312, 0.017406463623046875, 0.020696640014648438, 0.02398681640625, 0.027276992797851562, 0.030567169189453125, 0.03385734558105469, 0.03714752197265625, 0.04043769836425781, 0.043727874755859375, 0.04701805114746094, 0.0503082275390625, 0.05359840393066406, 0.056888580322265625, 0.06017875671386719, 0.06346893310546875, 0.06675910949707031, 0.07004928588867188, 0.07333946228027344, 0.076629638671875, 0.07991981506347656, 0.08320999145507812, 0.08650016784667969, 0.08979034423828125, 0.09308052062988281, 0.09637069702148438, 0.09966087341308594, 0.1029510498046875, 0.10624122619628906, 0.10953140258789062, 0.11282157897949219, 0.11611175537109375, 0.11940193176269531, 0.12269210815429688, 0.12598228454589844, 0.1292724609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 0.0, 4.0, 4.0, 5.0, 12.0, 9.0, 15.0, 26.0, 33.0, 43.0, 50.0, 88.0, 96.0, 134.0, 198.0, 323.0, 559.0, 863.0, 1532.0, 2779.0, 6047.0, 15034.0, 50087.0, 371145.0, 509828.0, 58853.0, 16903.0, 6547.0, 3156.0, 1576.0, 905.0, 558.0, 343.0, 247.0, 150.0, 107.0, 93.0, 51.0, 40.0, 32.0, 25.0, 18.0, 7.0, 7.0, 7.0, 4.0, 3.0, 0.0, 6.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.041595458984375, -0.04025602340698242, -0.038916587829589844, -0.037577152252197266, -0.03623771667480469, -0.03489828109741211, -0.03355884552001953, -0.03221940994262695, -0.030879974365234375, -0.029540538787841797, -0.02820110321044922, -0.02686166763305664, -0.025522232055664062, -0.024182796478271484, -0.022843360900878906, -0.021503925323486328, -0.02016448974609375, -0.018825054168701172, -0.017485618591308594, -0.016146183013916016, -0.014806747436523438, -0.01346731185913086, -0.012127876281738281, -0.010788440704345703, -0.009449005126953125, -0.008109569549560547, -0.006770133972167969, -0.005430698394775391, -0.0040912628173828125, -0.0027518272399902344, -0.0014123916625976562, -7.295608520507812e-05, 0.0012664794921875, 0.002605915069580078, 0.003945350646972656, 0.005284786224365234, 0.0066242218017578125, 0.00796365737915039, 0.009303092956542969, 0.010642528533935547, 0.011981964111328125, 0.013321399688720703, 0.014660835266113281, 0.01600027084350586, 0.017339706420898438, 0.018679141998291016, 0.020018577575683594, 0.021358013153076172, 0.02269744873046875, 0.024036884307861328, 0.025376319885253906, 0.026715755462646484, 0.028055191040039062, 0.02939462661743164, 0.03073406219482422, 0.0320734977722168, 0.033412933349609375, 0.03475236892700195, 0.03609180450439453, 0.03743124008178711, 0.03877067565917969, 0.040110111236572266, 0.041449546813964844, 0.04278898239135742, 0.04412841796875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 6.0, 7.0, 9.0, 19.0, 16.0, 27.0, 32.0, 39.0, 51.0, 74.0, 123.0, 146.0, 131.0, 76.0, 60.0, 30.0, 30.0, 15.0, 15.0, 15.0, 10.0, 14.0, 9.0, 7.0, 5.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0001277923583984375, -0.00012397393584251404, -0.00012015551328659058, -0.00011633709073066711, -0.00011251866817474365, -0.00010870024561882019, -0.00010488182306289673, -0.00010106340050697327, -9.72449779510498e-05, -9.342655539512634e-05, -8.960813283920288e-05, -8.578971028327942e-05, -8.197128772735596e-05, -7.81528651714325e-05, -7.433444261550903e-05, -7.051602005958557e-05, -6.669759750366211e-05, -6.287917494773865e-05, -5.9060752391815186e-05, -5.5242329835891724e-05, -5.142390727996826e-05, -4.76054847240448e-05, -4.378706216812134e-05, -3.9968639612197876e-05, -3.6150217056274414e-05, -3.233179450035095e-05, -2.851337194442749e-05, -2.469494938850403e-05, -2.0876526832580566e-05, -1.7058104276657104e-05, -1.3239681720733643e-05, -9.42125916481018e-06, -5.602836608886719e-06, -1.7844140529632568e-06, 2.034008502960205e-06, 5.852431058883667e-06, 9.670853614807129e-06, 1.348927617073059e-05, 1.7307698726654053e-05, 2.1126121282577515e-05, 2.4944543838500977e-05, 2.876296639442444e-05, 3.25813889503479e-05, 3.639981150627136e-05, 4.0218234062194824e-05, 4.4036656618118286e-05, 4.785507917404175e-05, 5.167350172996521e-05, 5.549192428588867e-05, 5.9310346841812134e-05, 6.31287693977356e-05, 6.694719195365906e-05, 7.076561450958252e-05, 7.458403706550598e-05, 7.840245962142944e-05, 8.22208821773529e-05, 8.603930473327637e-05, 8.985772728919983e-05, 9.367614984512329e-05, 9.749457240104675e-05, 0.00010131299495697021, 0.00010513141751289368, 0.00010894984006881714, 0.0001127682626247406, 0.00011658668518066406]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 7.0, 10.0, 14.0, 26.0, 35.0, 59.0, 102.0, 202.0, 377.0, 848.0, 2798.0, 14173.0, 205901.0, 788242.0, 28824.0, 4568.0, 1271.0, 524.0, 243.0, 130.0, 73.0, 43.0, 29.0, 10.0, 18.0, 6.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.113525390625, -0.11038684844970703, -0.10724830627441406, -0.1041097640991211, -0.10097122192382812, -0.09783267974853516, -0.09469413757324219, -0.09155559539794922, -0.08841705322265625, -0.08527851104736328, -0.08213996887207031, -0.07900142669677734, -0.07586288452148438, -0.0727243423461914, -0.06958580017089844, -0.06644725799560547, -0.0633087158203125, -0.06017017364501953, -0.05703163146972656, -0.053893089294433594, -0.050754547119140625, -0.047616004943847656, -0.04447746276855469, -0.04133892059326172, -0.03820037841796875, -0.03506183624267578, -0.03192329406738281, -0.028784751892089844, -0.025646209716796875, -0.022507667541503906, -0.019369125366210938, -0.01623058319091797, -0.013092041015625, -0.009953498840332031, -0.0068149566650390625, -0.0036764144897460938, -0.000537872314453125, 0.0026006698608398438, 0.0057392120361328125, 0.008877754211425781, 0.01201629638671875, 0.015154838562011719, 0.018293380737304688, 0.021431922912597656, 0.024570465087890625, 0.027709007263183594, 0.030847549438476562, 0.03398609161376953, 0.0371246337890625, 0.04026317596435547, 0.04340171813964844, 0.046540260314941406, 0.049678802490234375, 0.052817344665527344, 0.05595588684082031, 0.05909442901611328, 0.06223297119140625, 0.06537151336669922, 0.06851005554199219, 0.07164859771728516, 0.07478713989257812, 0.0779256820678711, 0.08106422424316406, 0.08420276641845703, 0.08734130859375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 7.0, 4.0, 14.0, 23.0, 25.0, 32.0, 42.0, 73.0, 111.0, 155.0, 151.0, 113.0, 86.0, 39.0, 36.0, 20.0, 26.0, 12.0, 10.0, 7.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05389404296875, -0.051903724670410156, -0.04991340637207031, -0.04792308807373047, -0.045932769775390625, -0.04394245147705078, -0.04195213317871094, -0.039961814880371094, -0.03797149658203125, -0.035981178283691406, -0.03399085998535156, -0.03200054168701172, -0.030010223388671875, -0.02801990509033203, -0.026029586791992188, -0.024039268493652344, -0.0220489501953125, -0.020058631896972656, -0.018068313598632812, -0.01607799530029297, -0.014087677001953125, -0.012097358703613281, -0.010107040405273438, -0.008116722106933594, -0.00612640380859375, -0.004136085510253906, -0.0021457672119140625, -0.00015544891357421875, 0.001834869384765625, 0.0038251876831054688, 0.0058155059814453125, 0.007805824279785156, 0.009796142578125, 0.011786460876464844, 0.013776779174804688, 0.01576709747314453, 0.017757415771484375, 0.01974773406982422, 0.021738052368164062, 0.023728370666503906, 0.02571868896484375, 0.027709007263183594, 0.029699325561523438, 0.03168964385986328, 0.033679962158203125, 0.03567028045654297, 0.03766059875488281, 0.039650917053222656, 0.0416412353515625, 0.043631553649902344, 0.04562187194824219, 0.04761219024658203, 0.049602508544921875, 0.05159282684326172, 0.05358314514160156, 0.055573463439941406, 0.05756378173828125, 0.059554100036621094, 0.06154441833496094, 0.06353473663330078, 0.06552505493164062, 0.06751537322998047, 0.06950569152832031, 0.07149600982666016, 0.073486328125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 13.0, 38.0, 93.0, 223.0, 303.0, 223.0, 59.0, 36.0, 13.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.7570199966430664, -2.704591989517212, -2.6521639823913574, -2.599735975265503, -2.5473079681396484, -2.494879722595215, -2.4424517154693604, -2.390023708343506, -2.3375957012176514, -2.285167694091797, -2.2327396869659424, -2.180311679840088, -2.1278834342956543, -2.0754554271698, -2.0230274200439453, -1.9705994129180908, -1.9181714057922363, -1.8657433986663818, -1.8133153915405273, -1.7608872652053833, -1.7084592580795288, -1.6560312509536743, -1.6036031246185303, -1.5511751174926758, -1.4987471103668213, -1.4463191032409668, -1.3938910961151123, -1.3414629697799683, -1.2890349626541138, -1.2366069555282593, -1.1841788291931152, -1.1317508220672607, -1.0793226957321167, -1.0268946886062622, -0.9744666218757629, -0.9220385551452637, -0.8696105480194092, -0.8171825408935547, -0.7647544741630554, -0.7123264074325562, -0.6598984003067017, -0.6074703931808472, -0.5550423264503479, -0.5026142597198486, -0.45018625259399414, -0.39775821566581726, -0.3453301787376404, -0.2929021418094635, -0.24047410488128662, -0.18804606795310974, -0.13561803102493286, -0.08318999409675598, -0.0307619571685791, 0.02166607975959778, 0.07409411668777466, 0.12652215361595154, 0.17895019054412842, 0.2313782274723053, 0.2838062644004822, 0.33623430132865906, 0.38866233825683594, 0.4410903751850128, 0.4935184121131897, 0.545946478843689, 0.5983744859695435]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 5.0, 0.0, 5.0, 7.0, 13.0, 4.0, 7.0, 4.0, 15.0, 16.0, 16.0, 16.0, 29.0, 25.0, 23.0, 32.0, 33.0, 46.0, 32.0, 51.0, 41.0, 50.0, 54.0, 53.0, 44.0, 49.0, 40.0, 33.0, 29.0, 23.0, 32.0, 22.0, 27.0, 20.0, 20.0, 18.0, 20.0, 14.0, 9.0, 9.0, 6.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.40834635496139526, -0.3949120342731476, -0.3814776837825775, -0.36804336309432983, -0.35460904240608215, -0.3411746919155121, -0.3277403712272644, -0.31430602073669434, -0.30087170004844666, -0.287437379360199, -0.2740030288696289, -0.2605687081813812, -0.24713437259197235, -0.23370003700256348, -0.2202657163143158, -0.20683138072490692, -0.19339706003665924, -0.17996272444725037, -0.16652840375900269, -0.1530940681695938, -0.13965973258018494, -0.12622541189193726, -0.11279107630252838, -0.0993567407131195, -0.08592241257429123, -0.07248808443546295, -0.05905374884605408, -0.0456194207072258, -0.032185088843107224, -0.018750756978988647, -0.00531642884016037, 0.008117906749248505, 0.021552234888076782, 0.03498656675219536, 0.048420898616313934, 0.06185522675514221, 0.07528956234455109, 0.08872389048337936, 0.10215821862220764, 0.11559255421161652, 0.1290268898010254, 0.14246122539043427, 0.15589554607868195, 0.16932988166809082, 0.1827642172574997, 0.19619855284690857, 0.20963287353515625, 0.22306720912456512, 0.2365015298128128, 0.24993586540222168, 0.26337018609046936, 0.27680450677871704, 0.2902388572692871, 0.3036731779575348, 0.31710749864578247, 0.33054184913635254, 0.3439761698246002, 0.3574104905128479, 0.37084484100341797, 0.38427916169166565, 0.39771348237991333, 0.4111478328704834, 0.4245821535587311, 0.43801647424697876, 0.45145082473754883]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 21.0, 13.0, 33.0, 57.0, 100.0, 253.0, 736.0, 14507.0, 4177191.0, 839.0, 260.0, 110.0, 62.0, 23.0, 20.0, 10.0, 12.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.415771484375, -0.4031867980957031, -0.39060211181640625, -0.3780174255371094, -0.3654327392578125, -0.3528480529785156, -0.34026336669921875, -0.3276786804199219, -0.315093994140625, -0.3025093078613281, -0.28992462158203125, -0.2773399353027344, -0.2647552490234375, -0.2521705627441406, -0.23958587646484375, -0.22700119018554688, -0.21441650390625, -0.20183181762695312, -0.18924713134765625, -0.17666244506835938, -0.1640777587890625, -0.15149307250976562, -0.13890838623046875, -0.12632369995117188, -0.113739013671875, -0.10115432739257812, -0.08856964111328125, -0.07598495483398438, -0.0634002685546875, -0.050815582275390625, -0.03823089599609375, -0.025646209716796875, -0.0130615234375, -0.000476837158203125, 0.01210784912109375, 0.024692535400390625, 0.0372772216796875, 0.049861907958984375, 0.06244659423828125, 0.07503128051757812, 0.087615966796875, 0.10020065307617188, 0.11278533935546875, 0.12537002563476562, 0.1379547119140625, 0.15053939819335938, 0.16312408447265625, 0.17570877075195312, 0.18829345703125, 0.20087814331054688, 0.21346282958984375, 0.22604751586914062, 0.2386322021484375, 0.2512168884277344, 0.26380157470703125, 0.2763862609863281, 0.288970947265625, 0.3015556335449219, 0.31414031982421875, 0.3267250061035156, 0.3393096923828125, 0.3518943786621094, 0.36447906494140625, 0.3770637512207031, 0.3896484375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 7.0, 22.0, 50.0, 86.0, 144.0, 190.0, 199.0, 138.0, 89.0, 35.0, 21.0, 7.0, 5.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.133544921875, -0.13036537170410156, -0.12718582153320312, -0.12400627136230469, -0.12082672119140625, -0.11764717102050781, -0.11446762084960938, -0.11128807067871094, -0.1081085205078125, -0.10492897033691406, -0.10174942016601562, -0.09856986999511719, -0.09539031982421875, -0.09221076965332031, -0.08903121948242188, -0.08585166931152344, -0.082672119140625, -0.07949256896972656, -0.07631301879882812, -0.07313346862792969, -0.06995391845703125, -0.06677436828613281, -0.06359481811523438, -0.06041526794433594, -0.0572357177734375, -0.05405616760253906, -0.050876617431640625, -0.04769706726074219, -0.04451751708984375, -0.04133796691894531, -0.038158416748046875, -0.03497886657714844, -0.03179931640625, -0.028619766235351562, -0.025440216064453125, -0.022260665893554688, -0.01908111572265625, -0.015901565551757812, -0.012722015380859375, -0.009542465209960938, -0.0063629150390625, -0.0031833648681640625, -3.814697265625e-06, 0.0031757354736328125, 0.00635528564453125, 0.009534835815429688, 0.012714385986328125, 0.015893936157226562, 0.019073486328125, 0.022253036499023438, 0.025432586669921875, 0.028612136840820312, 0.03179168701171875, 0.03497123718261719, 0.038150787353515625, 0.04133033752441406, 0.0445098876953125, 0.04768943786621094, 0.050868988037109375, 0.05404853820800781, 0.05722808837890625, 0.06040763854980469, 0.06358718872070312, 0.06676673889160156, 0.0699462890625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 12.0, 4.0, 9.0, 6.0, 13.0, 14.0, 21.0, 29.0, 40.0, 59.0, 82.0, 151.0, 221.0, 358.0, 642.0, 1162.0, 2314.0, 7023.0, 4170655.0, 6431.0, 2145.0, 1187.0, 633.0, 396.0, 236.0, 140.0, 90.0, 62.0, 37.0, 21.0, 15.0, 14.0, 13.0, 9.0, 4.0, 14.0, 5.0, 5.0, 5.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10406494140625, -0.100860595703125, -0.09765625, -0.094451904296875, -0.09124755859375, -0.088043212890625, -0.0848388671875, -0.081634521484375, -0.07843017578125, -0.075225830078125, -0.072021484375, -0.068817138671875, -0.06561279296875, -0.062408447265625, -0.0592041015625, -0.055999755859375, -0.05279541015625, -0.049591064453125, -0.04638671875, -0.043182373046875, -0.03997802734375, -0.036773681640625, -0.0335693359375, -0.030364990234375, -0.02716064453125, -0.023956298828125, -0.020751953125, -0.017547607421875, -0.01434326171875, -0.011138916015625, -0.0079345703125, -0.004730224609375, -0.00152587890625, 0.001678466796875, 0.0048828125, 0.008087158203125, 0.01129150390625, 0.014495849609375, 0.0177001953125, 0.020904541015625, 0.02410888671875, 0.027313232421875, 0.030517578125, 0.033721923828125, 0.03692626953125, 0.040130615234375, 0.0433349609375, 0.046539306640625, 0.04974365234375, 0.052947998046875, 0.05615234375, 0.059356689453125, 0.06256103515625, 0.065765380859375, 0.0689697265625, 0.072174072265625, 0.07537841796875, 0.078582763671875, 0.081787109375, 0.084991455078125, 0.08819580078125, 0.091400146484375, 0.0946044921875, 0.097808837890625, 0.10101318359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 29.0, 4014.0, 20.0, 5.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011627197265625, -0.010914802551269531, -0.010202407836914062, -0.009490013122558594, -0.008777618408203125, -0.008065223693847656, -0.0073528289794921875, -0.006640434265136719, -0.00592803955078125, -0.005215644836425781, -0.0045032501220703125, -0.0037908554077148438, -0.003078460693359375, -0.0023660659790039062, -0.0016536712646484375, -0.0009412765502929688, -0.0002288818359375, 0.00048351287841796875, 0.0011959075927734375, 0.0019083023071289062, 0.002620697021484375, 0.0033330917358398438, 0.0040454864501953125, 0.004757881164550781, 0.00547027587890625, 0.006182670593261719, 0.0068950653076171875, 0.007607460021972656, 0.008319854736328125, 0.009032249450683594, 0.009744644165039062, 0.010457038879394531, 0.01116943359375, 0.011881828308105469, 0.012594223022460938, 0.013306617736816406, 0.014019012451171875, 0.014731407165527344, 0.015443801879882812, 0.01615619659423828, 0.01686859130859375, 0.01758098602294922, 0.018293380737304688, 0.019005775451660156, 0.019718170166015625, 0.020430564880371094, 0.021142959594726562, 0.02185535430908203, 0.0225677490234375, 0.02328014373779297, 0.023992538452148438, 0.024704933166503906, 0.025417327880859375, 0.026129722595214844, 0.026842117309570312, 0.02755451202392578, 0.02826690673828125, 0.02897930145263672, 0.029691696166992188, 0.030404090881347656, 0.031116485595703125, 0.031828880310058594, 0.03254127502441406, 0.03325366973876953, 0.033966064453125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 11.0, 66.0, 471.0, 356.0, 85.0, 19.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25576069951057434, -0.24949349462985992, -0.2432262897491455, -0.2369590699672699, -0.23069186508655548, -0.22442466020584106, -0.21815745532512665, -0.21189025044441223, -0.20562304556369781, -0.1993558406829834, -0.19308863580226898, -0.18682143092155457, -0.18055421113967896, -0.17428700625896454, -0.16801980137825012, -0.1617525964975357, -0.1554853916168213, -0.14921818673610687, -0.14295098185539246, -0.13668376207351685, -0.13041655719280243, -0.12414935231208801, -0.1178821474313736, -0.11161494255065918, -0.10534772276878357, -0.09908051788806915, -0.09281330555677414, -0.08654610067605972, -0.0802788957953453, -0.07401168346405029, -0.06774447858333588, -0.06147727370262146, -0.05521006882190704, -0.04894286021590233, -0.04267565533518791, -0.0364084467291832, -0.03014123998582363, -0.023874033242464066, -0.01760682463645935, -0.011339619755744934, -0.005072411149740219, 0.001194796059280634, 0.007462003268301487, 0.013729210942983627, 0.019996417686343193, 0.02626362442970276, 0.032530833035707474, 0.03879803791642189, 0.045065246522426605, 0.05133245512843132, 0.05759966000914574, 0.06386686861515045, 0.07013407349586487, 0.07640127837657928, 0.0826684907078743, 0.08893569558858871, 0.09520290791988373, 0.10147011280059814, 0.10773732513189316, 0.11400453001260757, 0.12027173489332199, 0.126538947224617, 0.13280615210533142, 0.13907335698604584, 0.14534056186676025]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 10.0, 9.0, 15.0, 25.0, 33.0, 31.0, 45.0, 50.0, 52.0, 57.0, 86.0, 84.0, 72.0, 63.0, 55.0, 47.0, 52.0, 46.0, 34.0, 36.0, 31.0, 16.0, 21.0, 7.0, 6.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04196751117706299, -0.04075542464852333, -0.03954333811998367, -0.03833124786615372, -0.03711916133761406, -0.0359070748090744, -0.034694984555244446, -0.03348289802670479, -0.03227081149816513, -0.031058724969625473, -0.029846636578440666, -0.02863454818725586, -0.027422461658716202, -0.026210375130176544, -0.024998286738991737, -0.02378619834780693, -0.022574111819267273, -0.021362025290727615, -0.02014993689954281, -0.018937848508358, -0.017725761979818344, -0.016513675451278687, -0.01530158706009388, -0.014089499600231647, -0.012877412140369415, -0.011665324680507183, -0.01045323722064495, -0.009241149760782719, -0.008029062300920486, -0.006816974841058254, -0.005604887381196022, -0.00439279992133379, -0.0031807124614715576, -0.0019686250016093254, -0.0007565375417470932, 0.000455549918115139, 0.0016676373779773712, 0.0028797248378396034, 0.004091812297701836, 0.005303899757564068, 0.0065159872174263, 0.007728074677288532, 0.008940162137150764, 0.010152249597012997, 0.011364337056875229, 0.012576424516737461, 0.013788511976599693, 0.015000599436461926, 0.016212686896324158, 0.017424773424863815, 0.018636861816048622, 0.01984895020723343, 0.021061036735773087, 0.022273123264312744, 0.02348521165549755, 0.024697300046682358, 0.025909386575222015, 0.027121473103761673, 0.02833356149494648, 0.029545649886131287, 0.030757736414670944, 0.0319698229432106, 0.03318191319704056, 0.034393999725580215, 0.03560608625411987]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 13.0, 16.0, 22.0, 30.0, 53.0, 83.0, 117.0, 237.0, 392.0, 697.0, 1555.0, 3955.0, 23843.0, 662143.0, 335209.0, 14391.0, 3071.0, 1218.0, 625.0, 307.0, 177.0, 142.0, 74.0, 43.0, 42.0, 22.0, 19.0, 14.0, 8.0, 4.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.422607421875, -0.4104957580566406, -0.39838409423828125, -0.3862724304199219, -0.3741607666015625, -0.3620491027832031, -0.34993743896484375, -0.3378257751464844, -0.325714111328125, -0.3136024475097656, -0.30149078369140625, -0.2893791198730469, -0.2772674560546875, -0.2651557922363281, -0.25304412841796875, -0.24093246459960938, -0.22882080078125, -0.21670913696289062, -0.20459747314453125, -0.19248580932617188, -0.1803741455078125, -0.16826248168945312, -0.15615081787109375, -0.14403915405273438, -0.131927490234375, -0.11981582641601562, -0.10770416259765625, -0.09559249877929688, -0.0834808349609375, -0.07136917114257812, -0.05925750732421875, -0.047145843505859375, -0.0350341796875, -0.022922515869140625, -0.01081085205078125, 0.001300811767578125, 0.0134124755859375, 0.025524139404296875, 0.03763580322265625, 0.049747467041015625, 0.061859130859375, 0.07397079467773438, 0.08608245849609375, 0.09819412231445312, 0.1103057861328125, 0.12241744995117188, 0.13452911376953125, 0.14664077758789062, 0.15875244140625, 0.17086410522460938, 0.18297576904296875, 0.19508743286132812, 0.2071990966796875, 0.21931076049804688, 0.23142242431640625, 0.24353408813476562, 0.255645751953125, 0.2677574157714844, 0.27986907958984375, 0.2919807434082031, 0.3040924072265625, 0.3162040710449219, 0.32831573486328125, 0.3404273986816406, 0.3525390625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 23.0, 43.0, 96.0, 143.0, 189.0, 194.0, 141.0, 90.0, 35.0, 20.0, 6.0, 6.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.133544921875, -0.13036727905273438, -0.12718963623046875, -0.12401199340820312, -0.1208343505859375, -0.11765670776367188, -0.11447906494140625, -0.11130142211914062, -0.108123779296875, -0.10494613647460938, -0.10176849365234375, -0.09859085083007812, -0.0954132080078125, -0.09223556518554688, -0.08905792236328125, -0.08588027954101562, -0.08270263671875, -0.07952499389648438, -0.07634735107421875, -0.07316970825195312, -0.0699920654296875, -0.06681442260742188, -0.06363677978515625, -0.060459136962890625, -0.057281494140625, -0.054103851318359375, -0.05092620849609375, -0.047748565673828125, -0.0445709228515625, -0.041393280029296875, -0.03821563720703125, -0.035037994384765625, -0.0318603515625, -0.028682708740234375, -0.02550506591796875, -0.022327423095703125, -0.0191497802734375, -0.015972137451171875, -0.01279449462890625, -0.009616851806640625, -0.006439208984375, -0.003261566162109375, -8.392333984375e-05, 0.003093719482421875, 0.0062713623046875, 0.009449005126953125, 0.01262664794921875, 0.015804290771484375, 0.01898193359375, 0.022159576416015625, 0.02533721923828125, 0.028514862060546875, 0.0316925048828125, 0.034870147705078125, 0.03804779052734375, 0.041225433349609375, 0.044403076171875, 0.047580718994140625, 0.05075836181640625, 0.053936004638671875, 0.0571136474609375, 0.060291290283203125, 0.06346893310546875, 0.06664657592773438, 0.06982421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 7.0, 8.0, 7.0, 9.0, 24.0, 21.0, 25.0, 35.0, 49.0, 94.0, 154.0, 264.0, 462.0, 887.0, 2296.0, 6741.0, 25691.0, 144726.0, 686026.0, 144016.0, 25791.0, 6775.0, 2331.0, 943.0, 459.0, 262.0, 144.0, 108.0, 66.0, 41.0, 23.0, 24.0, 18.0, 10.0, 8.0, 3.0, 5.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1419677734375, -0.13746070861816406, -0.13295364379882812, -0.1284465789794922, -0.12393951416015625, -0.11943244934082031, -0.11492538452148438, -0.11041831970214844, -0.1059112548828125, -0.10140419006347656, -0.09689712524414062, -0.09239006042480469, -0.08788299560546875, -0.08337593078613281, -0.07886886596679688, -0.07436180114746094, -0.069854736328125, -0.06534767150878906, -0.060840606689453125, -0.05633354187011719, -0.05182647705078125, -0.04731941223144531, -0.042812347412109375, -0.03830528259277344, -0.0337982177734375, -0.029291152954101562, -0.024784088134765625, -0.020277023315429688, -0.01576995849609375, -0.011262893676757812, -0.006755828857421875, -0.0022487640380859375, 0.00225830078125, 0.0067653656005859375, 0.011272430419921875, 0.015779495239257812, 0.02028656005859375, 0.024793624877929688, 0.029300689697265625, 0.03380775451660156, 0.0383148193359375, 0.04282188415527344, 0.047328948974609375, 0.05183601379394531, 0.05634307861328125, 0.06085014343261719, 0.06535720825195312, 0.06986427307128906, 0.074371337890625, 0.07887840270996094, 0.08338546752929688, 0.08789253234863281, 0.09239959716796875, 0.09690666198730469, 0.10141372680664062, 0.10592079162597656, 0.1104278564453125, 0.11493492126464844, 0.11944198608398438, 0.12394905090332031, 0.12845611572265625, 0.1329631805419922, 0.13747024536132812, 0.14197731018066406, 0.146484375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 6.0, 6.0, 5.0, 10.0, 13.0, 14.0, 22.0, 19.0, 22.0, 32.0, 32.0, 32.0, 49.0, 48.0, 39.0, 47.0, 39.0, 50.0, 54.0, 66.0, 52.0, 40.0, 39.0, 37.0, 27.0, 29.0, 29.0, 26.0, 24.0, 26.0, 16.0, 11.0, 17.0, 6.0, 6.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08770751953125, -0.08431529998779297, -0.08092308044433594, -0.0775308609008789, -0.07413864135742188, -0.07074642181396484, -0.06735420227050781, -0.06396198272705078, -0.06056976318359375, -0.05717754364013672, -0.05378532409667969, -0.050393104553222656, -0.047000885009765625, -0.043608665466308594, -0.04021644592285156, -0.03682422637939453, -0.0334320068359375, -0.03003978729248047, -0.026647567749023438, -0.023255348205566406, -0.019863128662109375, -0.016470909118652344, -0.013078689575195312, -0.009686470031738281, -0.00629425048828125, -0.0029020309448242188, 0.0004901885986328125, 0.0038824081420898438, 0.007274627685546875, 0.010666847229003906, 0.014059066772460938, 0.01745128631591797, 0.020843505859375, 0.02423572540283203, 0.027627944946289062, 0.031020164489746094, 0.034412384033203125, 0.037804603576660156, 0.04119682312011719, 0.04458904266357422, 0.04798126220703125, 0.05137348175048828, 0.05476570129394531, 0.058157920837402344, 0.061550140380859375, 0.0649423599243164, 0.06833457946777344, 0.07172679901123047, 0.0751190185546875, 0.07851123809814453, 0.08190345764160156, 0.0852956771850586, 0.08868789672851562, 0.09208011627197266, 0.09547233581542969, 0.09886455535888672, 0.10225677490234375, 0.10564899444580078, 0.10904121398925781, 0.11243343353271484, 0.11582565307617188, 0.1192178726196289, 0.12261009216308594, 0.12600231170654297, 0.12939453125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 8.0, 5.0, 5.0, 9.0, 8.0, 17.0, 16.0, 35.0, 36.0, 49.0, 85.0, 116.0, 171.0, 282.0, 626.0, 1515.0, 4673.0, 31205.0, 967066.0, 34806.0, 4769.0, 1551.0, 667.0, 296.0, 162.0, 127.0, 77.0, 48.0, 28.0, 21.0, 16.0, 10.0, 8.0, 8.0, 8.0, 6.0, 4.0, 0.0, 4.0, 4.0, 1.0, 6.0, 0.0, 1.0, 1.0], "bins": [-0.2061767578125, -0.2006816864013672, -0.19518661499023438, -0.18969154357910156, -0.18419647216796875, -0.17870140075683594, -0.17320632934570312, -0.1677112579345703, -0.1622161865234375, -0.1567211151123047, -0.15122604370117188, -0.14573097229003906, -0.14023590087890625, -0.13474082946777344, -0.12924575805664062, -0.12375068664550781, -0.118255615234375, -0.11276054382324219, -0.10726547241210938, -0.10177040100097656, -0.09627532958984375, -0.09078025817871094, -0.08528518676757812, -0.07979011535644531, -0.0742950439453125, -0.06879997253417969, -0.06330490112304688, -0.05780982971191406, -0.05231475830078125, -0.04681968688964844, -0.041324615478515625, -0.03582954406738281, -0.03033447265625, -0.024839401245117188, -0.019344329833984375, -0.013849258422851562, -0.00835418701171875, -0.0028591156005859375, 0.002635955810546875, 0.008131027221679688, 0.0136260986328125, 0.019121170043945312, 0.024616241455078125, 0.030111312866210938, 0.03560638427734375, 0.04110145568847656, 0.046596527099609375, 0.05209159851074219, 0.057586669921875, 0.06308174133300781, 0.06857681274414062, 0.07407188415527344, 0.07956695556640625, 0.08506202697753906, 0.09055709838867188, 0.09605216979980469, 0.1015472412109375, 0.10704231262207031, 0.11253738403320312, 0.11803245544433594, 0.12352752685546875, 0.12902259826660156, 0.13451766967773438, 0.1400127410888672, 0.1455078125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 8.0, 11.0, 13.0, 14.0, 26.0, 31.0, 51.0, 66.0, 117.0, 165.0, 175.0, 97.0, 66.0, 49.0, 30.0, 19.0, 15.0, 9.0, 6.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0002484321594238281, -0.00024206936359405518, -0.00023570656776428223, -0.00022934377193450928, -0.00022298097610473633, -0.00021661818027496338, -0.00021025538444519043, -0.00020389258861541748, -0.00019752979278564453, -0.00019116699695587158, -0.00018480420112609863, -0.00017844140529632568, -0.00017207860946655273, -0.00016571581363677979, -0.00015935301780700684, -0.0001529902219772339, -0.00014662742614746094, -0.000140264630317688, -0.00013390183448791504, -0.0001275390386581421, -0.00012117624282836914, -0.00011481344699859619, -0.00010845065116882324, -0.00010208785533905029, -9.572505950927734e-05, -8.93622636795044e-05, -8.299946784973145e-05, -7.66366720199585e-05, -7.027387619018555e-05, -6.39110803604126e-05, -5.754828453063965e-05, -5.11854887008667e-05, -4.482269287109375e-05, -3.84598970413208e-05, -3.209710121154785e-05, -2.5734305381774902e-05, -1.9371509552001953e-05, -1.3008713722229004e-05, -6.645917892456055e-06, -2.8312206268310547e-07, 6.079673767089844e-06, 1.2442469596862793e-05, 1.8805265426635742e-05, 2.516806125640869e-05, 3.153085708618164e-05, 3.789365291595459e-05, 4.425644874572754e-05, 5.061924457550049e-05, 5.698204040527344e-05, 6.334483623504639e-05, 6.970763206481934e-05, 7.607042789459229e-05, 8.243322372436523e-05, 8.879601955413818e-05, 9.515881538391113e-05, 0.00010152161121368408, 0.00010788440704345703, 0.00011424720287322998, 0.00012060999870300293, 0.00012697279453277588, 0.00013333559036254883, 0.00013969838619232178, 0.00014606118202209473, 0.00015242397785186768, 0.00015878677368164062]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 7.0, 11.0, 19.0, 29.0, 36.0, 60.0, 104.0, 169.0, 406.0, 1003.0, 3470.0, 37093.0, 990103.0, 12488.0, 2148.0, 698.0, 323.0, 174.0, 74.0, 44.0, 30.0, 16.0, 11.0, 9.0, 1.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306884765625, -0.2979469299316406, -0.28900909423828125, -0.2800712585449219, -0.2711334228515625, -0.2621955871582031, -0.25325775146484375, -0.24431991577148438, -0.235382080078125, -0.22644424438476562, -0.21750640869140625, -0.20856857299804688, -0.1996307373046875, -0.19069290161132812, -0.18175506591796875, -0.17281723022460938, -0.16387939453125, -0.15494155883789062, -0.14600372314453125, -0.13706588745117188, -0.1281280517578125, -0.11919021606445312, -0.11025238037109375, -0.10131454467773438, -0.092376708984375, -0.08343887329101562, -0.07450103759765625, -0.06556320190429688, -0.0566253662109375, -0.047687530517578125, -0.03874969482421875, -0.029811859130859375, -0.0208740234375, -0.011936187744140625, -0.00299835205078125, 0.005939483642578125, 0.0148773193359375, 0.023815155029296875, 0.03275299072265625, 0.041690826416015625, 0.050628662109375, 0.059566497802734375, 0.06850433349609375, 0.07744216918945312, 0.0863800048828125, 0.09531784057617188, 0.10425567626953125, 0.11319351196289062, 0.12213134765625, 0.13106918334960938, 0.14000701904296875, 0.14894485473632812, 0.1578826904296875, 0.16682052612304688, 0.17575836181640625, 0.18469619750976562, 0.193634033203125, 0.20257186889648438, 0.21150970458984375, 0.22044754028320312, 0.2293853759765625, 0.23832321166992188, 0.24726104736328125, 0.2561988830566406, 0.26513671875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 9.0, 19.0, 17.0, 43.0, 81.0, 141.0, 268.0, 171.0, 103.0, 45.0, 39.0, 19.0, 16.0, 8.0, 10.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11175537109375, -0.10811710357666016, -0.10447883605957031, -0.10084056854248047, -0.09720230102539062, -0.09356403350830078, -0.08992576599121094, -0.0862874984741211, -0.08264923095703125, -0.0790109634399414, -0.07537269592285156, -0.07173442840576172, -0.06809616088867188, -0.06445789337158203, -0.06081962585449219, -0.057181358337402344, -0.0535430908203125, -0.049904823303222656, -0.04626655578613281, -0.04262828826904297, -0.038990020751953125, -0.03535175323486328, -0.03171348571777344, -0.028075218200683594, -0.02443695068359375, -0.020798683166503906, -0.017160415649414062, -0.013522148132324219, -0.009883880615234375, -0.006245613098144531, -0.0026073455810546875, 0.0010309219360351562, 0.004669189453125, 0.008307456970214844, 0.011945724487304688, 0.015583992004394531, 0.019222259521484375, 0.02286052703857422, 0.026498794555664062, 0.030137062072753906, 0.03377532958984375, 0.037413597106933594, 0.04105186462402344, 0.04469013214111328, 0.048328399658203125, 0.05196666717529297, 0.05560493469238281, 0.059243202209472656, 0.0628814697265625, 0.06651973724365234, 0.07015800476074219, 0.07379627227783203, 0.07743453979492188, 0.08107280731201172, 0.08471107482910156, 0.0883493423461914, 0.09198760986328125, 0.0956258773803711, 0.09926414489746094, 0.10290241241455078, 0.10654067993164062, 0.11017894744873047, 0.11381721496582031, 0.11745548248291016, 0.12109375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 0.0, 8.0, 9.0, 7.0, 22.0, 35.0, 51.0, 67.0, 111.0, 169.0, 181.0, 133.0, 73.0, 48.0, 33.0, 19.0, 18.0, 4.0, 5.0, 1.0, 5.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4616219997406006, -1.4269235134124756, -1.392224907875061, -1.357526421546936, -1.322827935218811, -1.2881293296813965, -1.2534308433532715, -1.2187323570251465, -1.184033751487732, -1.149335265159607, -1.1146366596221924, -1.0799381732940674, -1.0452396869659424, -1.0105410814285278, -0.9758425951004028, -0.9411440491676331, -0.9064455628395081, -0.8717470169067383, -0.8370485305786133, -0.8023499846458435, -0.7676514387130737, -0.7329529523849487, -0.698254406452179, -0.6635558605194092, -0.6288573741912842, -0.5941588282585144, -0.5594603419303894, -0.5247617959976196, -0.49006325006484985, -0.45536473393440247, -0.4206662178039551, -0.3859676718711853, -0.3512691259384155, -0.31657060980796814, -0.28187206387519836, -0.24717354774475098, -0.2124750167131424, -0.1777764856815338, -0.14307796955108643, -0.10837943851947784, -0.07368090748786926, -0.03898238018155098, -0.0042838528752326965, 0.030414670705795288, 0.06511320173740387, 0.09981173276901245, 0.13451024889945984, 0.16920877993106842, 0.203907310962677, 0.23860584199428558, 0.27330437302589417, 0.30800288915634155, 0.34270143508911133, 0.3773999512195587, 0.4120984673500061, 0.4467970132827759, 0.48149552941322327, 0.5161940455436707, 0.5508925914764404, 0.5855910778045654, 0.6202896237373352, 0.654988169670105, 0.68968665599823, 0.7243852019309998, 0.7590837478637695]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 5.0, 1.0, 6.0, 7.0, 6.0, 10.0, 14.0, 10.0, 18.0, 25.0, 18.0, 25.0, 28.0, 31.0, 31.0, 46.0, 45.0, 41.0, 44.0, 39.0, 40.0, 42.0, 47.0, 48.0, 33.0, 38.0, 45.0, 26.0, 21.0, 31.0, 31.0, 27.0, 12.0, 18.0, 25.0, 16.0, 13.0, 14.0, 8.0, 6.0, 4.0, 1.0, 6.0, 0.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.4322248101234436, -0.4184243977069855, -0.40462398529052734, -0.3908235728740692, -0.3770231604576111, -0.36322277784347534, -0.3494223654270172, -0.3356219530105591, -0.32182154059410095, -0.3080211281776428, -0.2942207157611847, -0.28042030334472656, -0.2666199207305908, -0.2528194785118103, -0.23901909589767456, -0.22521868348121643, -0.2114182710647583, -0.19761785864830017, -0.18381744623184204, -0.1700170487165451, -0.15621663630008698, -0.14241622388362885, -0.1286158263683319, -0.11481541395187378, -0.10101500153541565, -0.08721458911895752, -0.07341418415307999, -0.059613775461912155, -0.045813366770744324, -0.032012954354286194, -0.01821254938840866, -0.004412144422531128, 0.009388267993927002, 0.023188676685094833, 0.036989085376262665, 0.050789494067430496, 0.06458990275859833, 0.07839031517505646, 0.09219072014093399, 0.10599112510681152, 0.11979153752326965, 0.13359194993972778, 0.1473923623561859, 0.16119275987148285, 0.17499317228794098, 0.1887935847043991, 0.20259398221969604, 0.21639439463615417, 0.2301948070526123, 0.24399521946907043, 0.25779563188552856, 0.2715960443019867, 0.2853964567184448, 0.29919683933258057, 0.3129972517490387, 0.3267976641654968, 0.34059807658195496, 0.3543984889984131, 0.3681989014148712, 0.38199931383132935, 0.3957996964454651, 0.4096001386642456, 0.42340052127838135, 0.4372009336948395, 0.4510013461112976]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 6.0, 14.0, 27.0, 74.0, 145.0, 490.0, 2040.0, 4186934.0, 3598.0, 580.0, 205.0, 68.0, 28.0, 18.0, 15.0, 7.0, 4.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62109375, -0.6001052856445312, -0.5791168212890625, -0.5581283569335938, -0.537139892578125, -0.5161514282226562, -0.4951629638671875, -0.47417449951171875, -0.45318603515625, -0.43219757080078125, -0.4112091064453125, -0.39022064208984375, -0.369232177734375, -0.34824371337890625, -0.3272552490234375, -0.30626678466796875, -0.2852783203125, -0.26428985595703125, -0.2433013916015625, -0.22231292724609375, -0.201324462890625, -0.18033599853515625, -0.1593475341796875, -0.13835906982421875, -0.11737060546875, -0.09638214111328125, -0.0753936767578125, -0.05440521240234375, -0.033416748046875, -0.01242828369140625, 0.0085601806640625, 0.02954864501953125, 0.050537109375, 0.07152557373046875, 0.0925140380859375, 0.11350250244140625, 0.134490966796875, 0.15547943115234375, 0.1764678955078125, 0.19745635986328125, 0.21844482421875, 0.23943328857421875, 0.2604217529296875, 0.28141021728515625, 0.302398681640625, 0.32338714599609375, 0.3443756103515625, 0.36536407470703125, 0.3863525390625, 0.40734100341796875, 0.4283294677734375, 0.44931793212890625, 0.470306396484375, 0.49129486083984375, 0.5122833251953125, 0.5332717895507812, 0.55426025390625, 0.5752487182617188, 0.5962371826171875, 0.6172256469726562, 0.638214111328125, 0.6592025756835938, 0.6801910400390625, 0.7011795043945312, 0.72216796875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 18.0, 46.0, 89.0, 148.0, 186.0, 178.0, 169.0, 80.0, 39.0, 21.0, 2.0, 9.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1336669921875, -0.13048839569091797, -0.12730979919433594, -0.1241312026977539, -0.12095260620117188, -0.11777400970458984, -0.11459541320800781, -0.11141681671142578, -0.10823822021484375, -0.10505962371826172, -0.10188102722167969, -0.09870243072509766, -0.09552383422851562, -0.0923452377319336, -0.08916664123535156, -0.08598804473876953, -0.0828094482421875, -0.07963085174560547, -0.07645225524902344, -0.0732736587524414, -0.07009506225585938, -0.06691646575927734, -0.06373786926269531, -0.06055927276611328, -0.05738067626953125, -0.05420207977294922, -0.05102348327636719, -0.047844886779785156, -0.044666290283203125, -0.041487693786621094, -0.03830909729003906, -0.03513050079345703, -0.031951904296875, -0.02877330780029297, -0.025594711303710938, -0.022416114807128906, -0.019237518310546875, -0.016058921813964844, -0.012880325317382812, -0.009701728820800781, -0.00652313232421875, -0.0033445358276367188, -0.0001659393310546875, 0.0030126571655273438, 0.006191253662109375, 0.009369850158691406, 0.012548446655273438, 0.01572704315185547, 0.0189056396484375, 0.02208423614501953, 0.025262832641601562, 0.028441429138183594, 0.031620025634765625, 0.034798622131347656, 0.03797721862792969, 0.04115581512451172, 0.04433441162109375, 0.04751300811767578, 0.05069160461425781, 0.053870201110839844, 0.057048797607421875, 0.060227394104003906, 0.06340599060058594, 0.06658458709716797, 0.06976318359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 7.0, 5.0, 16.0, 15.0, 25.0, 43.0, 81.0, 121.0, 258.0, 428.0, 877.0, 1734.0, 3965.0, 13742.0, 4104755.0, 56238.0, 6853.0, 2578.0, 1176.0, 585.0, 315.0, 192.0, 110.0, 55.0, 41.0, 30.0, 15.0, 6.0, 2.0, 5.0, 5.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09503173828125, -0.09147930145263672, -0.08792686462402344, -0.08437442779541016, -0.08082199096679688, -0.0772695541381836, -0.07371711730957031, -0.07016468048095703, -0.06661224365234375, -0.06305980682373047, -0.05950736999511719, -0.055954933166503906, -0.052402496337890625, -0.048850059509277344, -0.04529762268066406, -0.04174518585205078, -0.0381927490234375, -0.03464031219482422, -0.031087875366210938, -0.027535438537597656, -0.023983001708984375, -0.020430564880371094, -0.016878128051757812, -0.013325691223144531, -0.00977325439453125, -0.006220817565917969, -0.0026683807373046875, 0.0008840560913085938, 0.004436492919921875, 0.007988929748535156, 0.011541366577148438, 0.015093803405761719, 0.018646240234375, 0.02219867706298828, 0.025751113891601562, 0.029303550720214844, 0.032855987548828125, 0.036408424377441406, 0.03996086120605469, 0.04351329803466797, 0.04706573486328125, 0.05061817169189453, 0.05417060852050781, 0.057723045349121094, 0.061275482177734375, 0.06482791900634766, 0.06838035583496094, 0.07193279266357422, 0.0754852294921875, 0.07903766632080078, 0.08259010314941406, 0.08614253997802734, 0.08969497680664062, 0.0932474136352539, 0.09679985046386719, 0.10035228729248047, 0.10390472412109375, 0.10745716094970703, 0.11100959777832031, 0.1145620346069336, 0.11811447143554688, 0.12166690826416016, 0.12521934509277344, 0.12877178192138672, 0.13232421875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0, 5.0, 14.0, 11.0, 60.0, 744.0, 3084.0, 91.0, 19.0, 12.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0229949951171875, -0.021999597549438477, -0.021004199981689453, -0.02000880241394043, -0.019013404846191406, -0.018018007278442383, -0.01702260971069336, -0.016027212142944336, -0.015031814575195312, -0.014036417007446289, -0.013041019439697266, -0.012045621871948242, -0.011050224304199219, -0.010054826736450195, -0.009059429168701172, -0.008064031600952148, -0.007068634033203125, -0.0060732364654541016, -0.005077838897705078, -0.004082441329956055, -0.0030870437622070312, -0.002091646194458008, -0.0010962486267089844, -0.00010085105895996094, 0.0008945465087890625, 0.001889944076538086, 0.0028853416442871094, 0.003880739212036133, 0.004876136779785156, 0.00587153434753418, 0.006866931915283203, 0.007862329483032227, 0.00885772705078125, 0.009853124618530273, 0.010848522186279297, 0.01184391975402832, 0.012839317321777344, 0.013834714889526367, 0.01483011245727539, 0.015825510025024414, 0.016820907592773438, 0.01781630516052246, 0.018811702728271484, 0.019807100296020508, 0.02080249786376953, 0.021797895431518555, 0.022793292999267578, 0.0237886905670166, 0.024784088134765625, 0.02577948570251465, 0.026774883270263672, 0.027770280838012695, 0.02876567840576172, 0.029761075973510742, 0.030756473541259766, 0.03175187110900879, 0.03274726867675781, 0.033742666244506836, 0.03473806381225586, 0.03573346138000488, 0.036728858947753906, 0.03772425651550293, 0.03871965408325195, 0.03971505165100098, 0.04071044921875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 9.0, 4.0, 6.0, 7.0, 14.0, 12.0, 31.0, 32.0, 51.0, 73.0, 103.0, 108.0, 110.0, 117.0, 76.0, 66.0, 52.0, 34.0, 20.0, 18.0, 20.0, 13.0, 5.0, 3.0, 7.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07730314880609512, -0.07460027933120728, -0.07189741730690002, -0.06919455528259277, -0.06649168580770493, -0.06378881633281708, -0.06108595430850983, -0.05838308855891228, -0.05568022280931473, -0.05297735705971718, -0.05027449131011963, -0.04757162556052208, -0.04486875981092453, -0.04216589406132698, -0.03946302831172943, -0.03676016256213188, -0.03405729681253433, -0.03135443106293678, -0.028651565313339233, -0.025948699563741684, -0.023245833814144135, -0.020542968064546585, -0.017840102314949036, -0.015137236565351486, -0.012434370815753937, -0.009731505066156387, -0.007028639316558838, -0.0043257735669612885, -0.001622907817363739, 0.0010799579322338104, 0.00378282368183136, 0.006485689431428909, 0.009188562631607056, 0.011891428381204605, 0.014594294130802155, 0.017297159880399704, 0.020000025629997253, 0.022702891379594803, 0.025405757129192352, 0.0281086228787899, 0.03081148862838745, 0.033514354377985, 0.03621722012758255, 0.0389200858771801, 0.04162295162677765, 0.0443258173763752, 0.04702868312597275, 0.0497315488755703, 0.05243441462516785, 0.055137280374765396, 0.057840146124362946, 0.060543011873960495, 0.06324587762355804, 0.0659487396478653, 0.06865160912275314, 0.07135447859764099, 0.07405734062194824, 0.0767602026462555, 0.07946307212114334, 0.08216594159603119, 0.08486880362033844, 0.08757166564464569, 0.09027453511953354, 0.09297740459442139, 0.09568026661872864]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 3.0, 13.0, 8.0, 14.0, 20.0, 16.0, 28.0, 35.0, 39.0, 47.0, 48.0, 49.0, 50.0, 52.0, 57.0, 51.0, 46.0, 55.0, 37.0, 54.0, 43.0, 53.0, 31.0, 27.0, 22.0, 26.0, 19.0, 13.0, 10.0, 10.0, 7.0, 5.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.07715767621994019, -0.07499028742313385, -0.07282289862632751, -0.07065550982952118, -0.06848812103271484, -0.06632072478532791, -0.06415333598852158, -0.06198594719171524, -0.059818558394908905, -0.05765116959810257, -0.055483780801296234, -0.0533163882791996, -0.051148999482393265, -0.04898161068558693, -0.046814218163490295, -0.04464682936668396, -0.042479440569877625, -0.04031205177307129, -0.038144662976264954, -0.03597727045416832, -0.033809881657361984, -0.03164249286055565, -0.029475102201104164, -0.02730771154165268, -0.025140322744846344, -0.02297293394804001, -0.020805543288588524, -0.01863815262913704, -0.016470763832330704, -0.014303374104201794, -0.012135984376072884, -0.009968594647943974, -0.0078012049198150635, -0.005633815191686153, -0.0034664254635572433, -0.0012990357354283333, 0.0008683539927005768, 0.003035743720829487, 0.005203133448958397, 0.007370523177087307, 0.009537912905216217, 0.011705302633345127, 0.013872692361474037, 0.016040083020925522, 0.018207471817731857, 0.020374860614538193, 0.022542251273989677, 0.024709641933441162, 0.026877030730247498, 0.029044419527053833, 0.031211810186505318, 0.0333792008459568, 0.03554658964276314, 0.03771397843956947, 0.03988137096166611, 0.04204875975847244, 0.04421614855527878, 0.046383537352085114, 0.04855092614889145, 0.05071831867098808, 0.05288570746779442, 0.055053096264600754, 0.05722048878669739, 0.05938787758350372, 0.06155526638031006]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 11.0, 17.0, 13.0, 13.0, 30.0, 65.0, 96.0, 169.0, 280.0, 507.0, 1214.0, 3322.0, 31156.0, 942410.0, 61707.0, 4731.0, 1491.0, 616.0, 280.0, 146.0, 103.0, 64.0, 31.0, 23.0, 23.0, 8.0, 8.0, 7.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8076171875, -0.784271240234375, -0.76092529296875, -0.737579345703125, -0.7142333984375, -0.690887451171875, -0.66754150390625, -0.644195556640625, -0.620849609375, -0.597503662109375, -0.57415771484375, -0.550811767578125, -0.5274658203125, -0.504119873046875, -0.48077392578125, -0.457427978515625, -0.43408203125, -0.410736083984375, -0.38739013671875, -0.364044189453125, -0.3406982421875, -0.317352294921875, -0.29400634765625, -0.270660400390625, -0.247314453125, -0.223968505859375, -0.20062255859375, -0.177276611328125, -0.1539306640625, -0.130584716796875, -0.10723876953125, -0.083892822265625, -0.060546875, -0.037200927734375, -0.01385498046875, 0.009490966796875, 0.0328369140625, 0.056182861328125, 0.07952880859375, 0.102874755859375, 0.126220703125, 0.149566650390625, 0.17291259765625, 0.196258544921875, 0.2196044921875, 0.242950439453125, 0.26629638671875, 0.289642333984375, 0.31298828125, 0.336334228515625, 0.35968017578125, 0.383026123046875, 0.4063720703125, 0.429718017578125, 0.45306396484375, 0.476409912109375, 0.499755859375, 0.523101806640625, 0.54644775390625, 0.569793701171875, 0.5931396484375, 0.616485595703125, 0.63983154296875, 0.663177490234375, 0.6865234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 19.0, 50.0, 90.0, 145.0, 183.0, 183.0, 162.0, 83.0, 40.0, 21.0, 2.0, 9.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.133544921875, -0.1303691864013672, -0.12719345092773438, -0.12401771545410156, -0.12084197998046875, -0.11766624450683594, -0.11449050903320312, -0.11131477355957031, -0.1081390380859375, -0.10496330261230469, -0.10178756713867188, -0.09861183166503906, -0.09543609619140625, -0.09226036071777344, -0.08908462524414062, -0.08590888977050781, -0.082733154296875, -0.07955741882324219, -0.07638168334960938, -0.07320594787597656, -0.07003021240234375, -0.06685447692871094, -0.06367874145507812, -0.06050300598144531, -0.0573272705078125, -0.05415153503417969, -0.050975799560546875, -0.04780006408691406, -0.04462432861328125, -0.04144859313964844, -0.038272857666015625, -0.03509712219238281, -0.03192138671875, -0.028745651245117188, -0.025569915771484375, -0.022394180297851562, -0.01921844482421875, -0.016042709350585938, -0.012866973876953125, -0.009691238403320312, -0.0065155029296875, -0.0033397674560546875, -0.000164031982421875, 0.0030117034912109375, 0.00618743896484375, 0.009363174438476562, 0.012538909912109375, 0.015714645385742188, 0.018890380859375, 0.022066116333007812, 0.025241851806640625, 0.028417587280273438, 0.03159332275390625, 0.03476905822753906, 0.037944793701171875, 0.04112052917480469, 0.0442962646484375, 0.04747200012207031, 0.050647735595703125, 0.05382347106933594, 0.05699920654296875, 0.06017494201660156, 0.06335067749023438, 0.06652641296386719, 0.0697021484375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 4.0, 4.0, 10.0, 13.0, 14.0, 20.0, 27.0, 39.0, 48.0, 76.0, 122.0, 199.0, 331.0, 577.0, 1162.0, 2788.0, 7821.0, 30713.0, 194986.0, 681893.0, 99199.0, 18891.0, 5393.0, 2043.0, 915.0, 496.0, 264.0, 145.0, 111.0, 74.0, 58.0, 34.0, 29.0, 11.0, 13.0, 6.0, 8.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1658935546875, -0.1609172821044922, -0.15594100952148438, -0.15096473693847656, -0.14598846435546875, -0.14101219177246094, -0.13603591918945312, -0.1310596466064453, -0.1260833740234375, -0.12110710144042969, -0.11613082885742188, -0.11115455627441406, -0.10617828369140625, -0.10120201110839844, -0.09622573852539062, -0.09124946594238281, -0.086273193359375, -0.08129692077636719, -0.07632064819335938, -0.07134437561035156, -0.06636810302734375, -0.06139183044433594, -0.056415557861328125, -0.05143928527832031, -0.0464630126953125, -0.04148674011230469, -0.036510467529296875, -0.03153419494628906, -0.02655792236328125, -0.021581649780273438, -0.016605377197265625, -0.011629104614257812, -0.00665283203125, -0.0016765594482421875, 0.003299713134765625, 0.008275985717773438, 0.01325225830078125, 0.018228530883789062, 0.023204803466796875, 0.028181076049804688, 0.0331573486328125, 0.03813362121582031, 0.043109893798828125, 0.04808616638183594, 0.05306243896484375, 0.05803871154785156, 0.06301498413085938, 0.06799125671386719, 0.072967529296875, 0.07794380187988281, 0.08292007446289062, 0.08789634704589844, 0.09287261962890625, 0.09784889221191406, 0.10282516479492188, 0.10780143737792969, 0.1127777099609375, 0.11775398254394531, 0.12273025512695312, 0.12770652770996094, 0.13268280029296875, 0.13765907287597656, 0.14263534545898438, 0.1476116180419922, 0.152587890625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 9.0, 5.0, 11.0, 11.0, 18.0, 11.0, 20.0, 23.0, 27.0, 22.0, 26.0, 26.0, 34.0, 29.0, 35.0, 34.0, 44.0, 56.0, 42.0, 47.0, 44.0, 42.0, 37.0, 49.0, 40.0, 26.0, 36.0, 23.0, 24.0, 34.0, 20.0, 16.0, 15.0, 15.0, 9.0, 10.0, 7.0, 5.0, 4.0, 1.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09796142578125, -0.09490585327148438, -0.09185028076171875, -0.08879470825195312, -0.0857391357421875, -0.08268356323242188, -0.07962799072265625, -0.07657241821289062, -0.073516845703125, -0.07046127319335938, -0.06740570068359375, -0.06435012817382812, -0.0612945556640625, -0.058238983154296875, -0.05518341064453125, -0.052127838134765625, -0.049072265625, -0.046016693115234375, -0.04296112060546875, -0.039905548095703125, -0.0368499755859375, -0.033794403076171875, -0.03073883056640625, -0.027683258056640625, -0.024627685546875, -0.021572113037109375, -0.01851654052734375, -0.015460968017578125, -0.0124053955078125, -0.009349822998046875, -0.00629425048828125, -0.003238677978515625, -0.00018310546875, 0.002872467041015625, 0.00592803955078125, 0.008983612060546875, 0.0120391845703125, 0.015094757080078125, 0.01815032958984375, 0.021205902099609375, 0.024261474609375, 0.027317047119140625, 0.03037261962890625, 0.033428192138671875, 0.0364837646484375, 0.039539337158203125, 0.04259490966796875, 0.045650482177734375, 0.0487060546875, 0.051761627197265625, 0.05481719970703125, 0.057872772216796875, 0.0609283447265625, 0.06398391723632812, 0.06703948974609375, 0.07009506225585938, 0.073150634765625, 0.07620620727539062, 0.07926177978515625, 0.08231735229492188, 0.0853729248046875, 0.08842849731445312, 0.09148406982421875, 0.09453964233398438, 0.09759521484375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 9.0, 7.0, 12.0, 16.0, 12.0, 33.0, 37.0, 56.0, 64.0, 108.0, 143.0, 296.0, 491.0, 830.0, 1856.0, 5601.0, 26001.0, 818482.0, 174020.0, 13618.0, 3712.0, 1452.0, 640.0, 349.0, 229.0, 157.0, 87.0, 69.0, 41.0, 31.0, 30.0, 19.0, 12.0, 11.0, 9.0, 2.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.116943359375, -0.11314964294433594, -0.10935592651367188, -0.10556221008300781, -0.10176849365234375, -0.09797477722167969, -0.09418106079101562, -0.09038734436035156, -0.0865936279296875, -0.08279991149902344, -0.07900619506835938, -0.07521247863769531, -0.07141876220703125, -0.06762504577636719, -0.06383132934570312, -0.06003761291503906, -0.056243896484375, -0.05245018005371094, -0.048656463623046875, -0.04486274719238281, -0.04106903076171875, -0.03727531433105469, -0.033481597900390625, -0.029687881469726562, -0.0258941650390625, -0.022100448608398438, -0.018306732177734375, -0.014513015747070312, -0.01071929931640625, -0.0069255828857421875, -0.003131866455078125, 0.0006618499755859375, 0.00445556640625, 0.008249282836914062, 0.012042999267578125, 0.015836715698242188, 0.01963043212890625, 0.023424148559570312, 0.027217864990234375, 0.031011581420898438, 0.0348052978515625, 0.03859901428222656, 0.042392730712890625, 0.04618644714355469, 0.04998016357421875, 0.05377388000488281, 0.057567596435546875, 0.06136131286621094, 0.065155029296875, 0.06894874572753906, 0.07274246215820312, 0.07653617858886719, 0.08032989501953125, 0.08412361145019531, 0.08791732788085938, 0.09171104431152344, 0.0955047607421875, 0.09929847717285156, 0.10309219360351562, 0.10688591003417969, 0.11067962646484375, 0.11447334289550781, 0.11826705932617188, 0.12206077575683594, 0.1258544921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 8.0, 5.0, 4.0, 24.0, 18.0, 27.0, 37.0, 73.0, 109.0, 184.0, 186.0, 121.0, 70.0, 41.0, 23.0, 18.0, 18.0, 5.0, 6.0, 9.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.0003476142883300781, -0.0003398917615413666, -0.00033216923475265503, -0.0003244467079639435, -0.00031672418117523193, -0.0003090016543865204, -0.00030127912759780884, -0.0002935566008090973, -0.00028583407402038574, -0.0002781115472316742, -0.00027038902044296265, -0.0002626664936542511, -0.00025494396686553955, -0.000247221440076828, -0.00023949891328811646, -0.0002317763864994049, -0.00022405385971069336, -0.0002163313329219818, -0.00020860880613327026, -0.00020088627934455872, -0.00019316375255584717, -0.00018544122576713562, -0.00017771869897842407, -0.00016999617218971252, -0.00016227364540100098, -0.00015455111861228943, -0.00014682859182357788, -0.00013910606503486633, -0.00013138353824615479, -0.00012366101145744324, -0.00011593848466873169, -0.00010821595788002014, -0.0001004934310913086, -9.277090430259705e-05, -8.50483775138855e-05, -7.732585072517395e-05, -6.96033239364624e-05, -6.188079714775085e-05, -5.415827035903931e-05, -4.643574357032776e-05, -3.871321678161621e-05, -3.099068999290466e-05, -2.3268163204193115e-05, -1.5545636415481567e-05, -7.82310962677002e-06, -1.0058283805847168e-07, 7.621943950653076e-06, 1.5344470739364624e-05, 2.3066997528076172e-05, 3.078952431678772e-05, 3.851205110549927e-05, 4.6234577894210815e-05, 5.395710468292236e-05, 6.167963147163391e-05, 6.940215826034546e-05, 7.712468504905701e-05, 8.484721183776855e-05, 9.25697386264801e-05, 0.00010029226541519165, 0.0001080147922039032, 0.00011573731899261475, 0.0001234598457813263, 0.00013118237257003784, 0.0001389048993587494, 0.00014662742614746094]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 7.0, 5.0, 3.0, 12.0, 9.0, 12.0, 18.0, 19.0, 37.0, 52.0, 110.0, 189.0, 338.0, 630.0, 1380.0, 3669.0, 14403.0, 148320.0, 835054.0, 33927.0, 6423.0, 2131.0, 879.0, 404.0, 182.0, 120.0, 75.0, 64.0, 33.0, 21.0, 10.0, 5.0, 10.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1451416015625, -0.1409015655517578, -0.13666152954101562, -0.13242149353027344, -0.12818145751953125, -0.12394142150878906, -0.11970138549804688, -0.11546134948730469, -0.1112213134765625, -0.10698127746582031, -0.10274124145507812, -0.09850120544433594, -0.09426116943359375, -0.09002113342285156, -0.08578109741210938, -0.08154106140136719, -0.077301025390625, -0.07306098937988281, -0.06882095336914062, -0.06458091735839844, -0.06034088134765625, -0.05610084533691406, -0.051860809326171875, -0.04762077331542969, -0.0433807373046875, -0.03914070129394531, -0.034900665283203125, -0.030660629272460938, -0.02642059326171875, -0.022180557250976562, -0.017940521240234375, -0.013700485229492188, -0.00946044921875, -0.0052204132080078125, -0.000980377197265625, 0.0032596588134765625, 0.00749969482421875, 0.011739730834960938, 0.015979766845703125, 0.020219802856445312, 0.0244598388671875, 0.028699874877929688, 0.032939910888671875, 0.03717994689941406, 0.04141998291015625, 0.04566001892089844, 0.049900054931640625, 0.05414009094238281, 0.058380126953125, 0.06262016296386719, 0.06686019897460938, 0.07110023498535156, 0.07534027099609375, 0.07958030700683594, 0.08382034301757812, 0.08806037902832031, 0.0923004150390625, 0.09654045104980469, 0.10078048706054688, 0.10502052307128906, 0.10926055908203125, 0.11350059509277344, 0.11774063110351562, 0.12198066711425781, 0.126220703125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 5.0, 3.0, 7.0, 8.0, 8.0, 11.0, 17.0, 23.0, 31.0, 44.0, 63.0, 106.0, 148.0, 159.0, 124.0, 82.0, 46.0, 35.0, 12.0, 17.0, 6.0, 8.0, 14.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.083984375, -0.0815286636352539, -0.07907295227050781, -0.07661724090576172, -0.07416152954101562, -0.07170581817626953, -0.06925010681152344, -0.06679439544677734, -0.06433868408203125, -0.061882972717285156, -0.05942726135253906, -0.05697154998779297, -0.054515838623046875, -0.05206012725830078, -0.04960441589355469, -0.047148704528808594, -0.0446929931640625, -0.042237281799316406, -0.03978157043457031, -0.03732585906982422, -0.034870147705078125, -0.03241443634033203, -0.029958724975585938, -0.027503013610839844, -0.02504730224609375, -0.022591590881347656, -0.020135879516601562, -0.01768016815185547, -0.015224456787109375, -0.012768745422363281, -0.010313034057617188, -0.007857322692871094, -0.005401611328125, -0.0029458999633789062, -0.0004901885986328125, 0.0019655227661132812, 0.004421234130859375, 0.006876945495605469, 0.009332656860351562, 0.011788368225097656, 0.01424407958984375, 0.016699790954589844, 0.019155502319335938, 0.02161121368408203, 0.024066925048828125, 0.02652263641357422, 0.028978347778320312, 0.031434059143066406, 0.0338897705078125, 0.036345481872558594, 0.03880119323730469, 0.04125690460205078, 0.043712615966796875, 0.04616832733154297, 0.04862403869628906, 0.051079750061035156, 0.05353546142578125, 0.055991172790527344, 0.05844688415527344, 0.06090259552001953, 0.06335830688476562, 0.06581401824951172, 0.06826972961425781, 0.0707254409790039, 0.07318115234375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 4.0, 10.0, 11.0, 19.0, 16.0, 23.0, 24.0, 39.0, 61.0, 62.0, 102.0, 109.0, 118.0, 90.0, 80.0, 55.0, 41.0, 32.0, 30.0, 18.0, 12.0, 9.0, 7.0, 6.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4781157970428467, -0.45712828636169434, -0.436140775680542, -0.41515326499938965, -0.3941657245159149, -0.3731782138347626, -0.35219070315361023, -0.3312031626701355, -0.31021565198898315, -0.2892281413078308, -0.26824063062667847, -0.24725310504436493, -0.2262655794620514, -0.20527806878089905, -0.1842905580997467, -0.16330303251743317, -0.14231553673744202, -0.12132801860570908, -0.10034050047397614, -0.07935298979282379, -0.05836547166109085, -0.03737795352935791, -0.016390442848205566, 0.004597082734107971, 0.025584593415260315, 0.046572111546993256, 0.0675596296787262, 0.08854714035987854, 0.10953465849161148, 0.13052217662334442, 0.15150968730449677, 0.1724972128868103, 0.19348472356796265, 0.214472234249115, 0.23545975983142853, 0.2564472556114197, 0.2774347960948944, 0.29842230677604675, 0.3194098174571991, 0.34039735794067383, 0.36138486862182617, 0.3823723793029785, 0.40335988998413086, 0.4243474006652832, 0.44533494114875793, 0.4663224518299103, 0.4873099625110626, 0.5082975029945374, 0.5292849540710449, 0.5502724647521973, 0.5712599754333496, 0.592247486114502, 0.6132349967956543, 0.6342225074768066, 0.655210018157959, 0.6761975884437561, 0.6971850991249084, 0.7181726098060608, 0.7391601204872131, 0.7601476311683655, 0.7811351418495178, 0.8021227121353149, 0.8231102228164673, 0.8440977334976196, 0.865085244178772]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 3.0, 6.0, 4.0, 10.0, 10.0, 4.0, 19.0, 12.0, 24.0, 16.0, 20.0, 28.0, 31.0, 27.0, 39.0, 38.0, 43.0, 40.0, 40.0, 54.0, 38.0, 49.0, 40.0, 47.0, 46.0, 44.0, 29.0, 39.0, 31.0, 29.0, 22.0, 23.0, 18.0, 19.0, 15.0, 16.0, 7.0, 6.0, 6.0, 7.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4817732572555542, -0.46676936745643616, -0.4517654478549957, -0.4367615580558777, -0.42175763845443726, -0.4067537486553192, -0.3917498290538788, -0.37674593925476074, -0.3617420196533203, -0.34673812985420227, -0.33173421025276184, -0.3167303204536438, -0.30172640085220337, -0.2867225110530853, -0.2717185914516449, -0.25671470165252686, -0.24171079695224762, -0.22670689225196838, -0.21170298755168915, -0.1966990828514099, -0.18169517815113068, -0.16669127345085144, -0.1516873836517334, -0.13668346405029297, -0.12167956680059433, -0.1066756621003151, -0.09167175740003586, -0.07666786015033722, -0.061663951724767685, -0.04666005074977875, -0.03165614604949951, -0.016652241349220276, -0.00164833664894104, 0.013355567120015621, 0.028359470888972282, 0.04336337372660637, 0.058367278426885605, 0.07337117940187454, 0.08837508410215378, 0.10337898880243301, 0.11838289350271225, 0.1333867907524109, 0.14839069545269012, 0.16339460015296936, 0.1783985048532486, 0.19340240955352783, 0.20840631425380707, 0.2234102189540863, 0.23841412365436554, 0.2534180283546448, 0.2684219181537628, 0.28342583775520325, 0.2984297275543213, 0.3134336471557617, 0.32843753695487976, 0.3434414565563202, 0.35844534635543823, 0.3734492361545563, 0.3884531557559967, 0.40345704555511475, 0.4184609651565552, 0.4334648549556732, 0.44846877455711365, 0.4634726643562317, 0.4784765839576721]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 16.0, 12.0, 15.0, 20.0, 26.0, 27.0, 62.0, 84.0, 134.0, 189.0, 329.0, 564.0, 1188.0, 3175.0, 14327.0, 219819.0, 3882796.0, 57631.0, 8319.0, 2611.0, 1269.0, 599.0, 382.0, 247.0, 135.0, 97.0, 59.0, 49.0, 30.0, 14.0, 13.0, 9.0, 4.0, 7.0, 3.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51953125, -0.5059700012207031, -0.49240875244140625, -0.4788475036621094, -0.4652862548828125, -0.4517250061035156, -0.43816375732421875, -0.4246025085449219, -0.411041259765625, -0.3974800109863281, -0.38391876220703125, -0.3703575134277344, -0.3567962646484375, -0.3432350158691406, -0.32967376708984375, -0.3161125183105469, -0.30255126953125, -0.2889900207519531, -0.27542877197265625, -0.2618675231933594, -0.2483062744140625, -0.23474502563476562, -0.22118377685546875, -0.20762252807617188, -0.194061279296875, -0.18050003051757812, -0.16693878173828125, -0.15337753295898438, -0.1398162841796875, -0.12625503540039062, -0.11269378662109375, -0.09913253784179688, -0.0855712890625, -0.07201004028320312, -0.05844879150390625, -0.044887542724609375, -0.0313262939453125, -0.017765045166015625, -0.00420379638671875, 0.009357452392578125, 0.022918701171875, 0.036479949951171875, 0.05004119873046875, 0.06360244750976562, 0.0771636962890625, 0.09072494506835938, 0.10428619384765625, 0.11784744262695312, 0.13140869140625, 0.14496994018554688, 0.15853118896484375, 0.17209243774414062, 0.1856536865234375, 0.19921493530273438, 0.21277618408203125, 0.22633743286132812, 0.239898681640625, 0.2534599304199219, 0.26702117919921875, 0.2805824279785156, 0.2941436767578125, 0.3077049255371094, 0.32126617431640625, 0.3348274230957031, 0.348388671875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 22.0, 41.0, 93.0, 157.0, 181.0, 194.0, 154.0, 83.0, 35.0, 17.0, 6.0, 6.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13330078125, -0.1301288604736328, -0.12695693969726562, -0.12378501892089844, -0.12061309814453125, -0.11744117736816406, -0.11426925659179688, -0.11109733581542969, -0.1079254150390625, -0.10475349426269531, -0.10158157348632812, -0.09840965270996094, -0.09523773193359375, -0.09206581115722656, -0.08889389038085938, -0.08572196960449219, -0.082550048828125, -0.07937812805175781, -0.07620620727539062, -0.07303428649902344, -0.06986236572265625, -0.06669044494628906, -0.06351852416992188, -0.06034660339355469, -0.0571746826171875, -0.05400276184082031, -0.050830841064453125, -0.04765892028808594, -0.04448699951171875, -0.04131507873535156, -0.038143157958984375, -0.03497123718261719, -0.03179931640625, -0.028627395629882812, -0.025455474853515625, -0.022283554077148438, -0.01911163330078125, -0.015939712524414062, -0.012767791748046875, -0.009595870971679688, -0.0064239501953125, -0.0032520294189453125, -8.0108642578125e-05, 0.0030918121337890625, 0.00626373291015625, 0.009435653686523438, 0.012607574462890625, 0.015779495239257812, 0.018951416015625, 0.022123336791992188, 0.025295257568359375, 0.028467178344726562, 0.03163909912109375, 0.03481101989746094, 0.037982940673828125, 0.04115486145019531, 0.0443267822265625, 0.04749870300292969, 0.050670623779296875, 0.05384254455566406, 0.05701446533203125, 0.06018638610839844, 0.06335830688476562, 0.06653022766113281, 0.0697021484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 7.0, 8.0, 11.0, 18.0, 31.0, 64.0, 80.0, 117.0, 184.0, 345.0, 643.0, 1250.0, 2720.0, 7784.0, 32501.0, 266374.0, 3644687.0, 199140.0, 26328.0, 6794.0, 2608.0, 1157.0, 581.0, 314.0, 203.0, 115.0, 76.0, 42.0, 34.0, 17.0, 9.0, 4.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1663818359375, -0.1612548828125, -0.1561279296875, -0.1510009765625, -0.1458740234375, -0.1407470703125, -0.1356201171875, -0.1304931640625, -0.1253662109375, -0.1202392578125, -0.1151123046875, -0.1099853515625, -0.1048583984375, -0.0997314453125, -0.0946044921875, -0.0894775390625, -0.0843505859375, -0.0792236328125, -0.0740966796875, -0.0689697265625, -0.0638427734375, -0.0587158203125, -0.0535888671875, -0.0484619140625, -0.0433349609375, -0.0382080078125, -0.0330810546875, -0.0279541015625, -0.0228271484375, -0.0177001953125, -0.0125732421875, -0.0074462890625, -0.0023193359375, 0.0028076171875, 0.0079345703125, 0.0130615234375, 0.0181884765625, 0.0233154296875, 0.0284423828125, 0.0335693359375, 0.0386962890625, 0.0438232421875, 0.0489501953125, 0.0540771484375, 0.0592041015625, 0.0643310546875, 0.0694580078125, 0.0745849609375, 0.0797119140625, 0.0848388671875, 0.0899658203125, 0.0950927734375, 0.1002197265625, 0.1053466796875, 0.1104736328125, 0.1156005859375, 0.1207275390625, 0.1258544921875, 0.1309814453125, 0.1361083984375, 0.1412353515625, 0.1463623046875, 0.1514892578125, 0.1566162109375, 0.1617431640625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 6.0, 8.0, 15.0, 29.0, 39.0, 77.0, 104.0, 167.0, 315.0, 634.0, 1489.0, 635.0, 266.0, 119.0, 74.0, 33.0, 23.0, 9.0, 5.0, 8.0, 4.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1712646484375, -0.16629791259765625, -0.1613311767578125, -0.15636444091796875, -0.151397705078125, -0.14643096923828125, -0.1414642333984375, -0.13649749755859375, -0.13153076171875, -0.12656402587890625, -0.1215972900390625, -0.11663055419921875, -0.111663818359375, -0.10669708251953125, -0.1017303466796875, -0.09676361083984375, -0.091796875, -0.08683013916015625, -0.0818634033203125, -0.07689666748046875, -0.071929931640625, -0.06696319580078125, -0.0619964599609375, -0.05702972412109375, -0.05206298828125, -0.04709625244140625, -0.0421295166015625, -0.03716278076171875, -0.032196044921875, -0.02722930908203125, -0.0222625732421875, -0.01729583740234375, -0.0123291015625, -0.00736236572265625, -0.0023956298828125, 0.00257110595703125, 0.007537841796875, 0.01250457763671875, 0.0174713134765625, 0.02243804931640625, 0.02740478515625, 0.03237152099609375, 0.0373382568359375, 0.04230499267578125, 0.047271728515625, 0.05223846435546875, 0.0572052001953125, 0.06217193603515625, 0.067138671875, 0.07210540771484375, 0.0770721435546875, 0.08203887939453125, 0.087005615234375, 0.09197235107421875, 0.0969390869140625, 0.10190582275390625, 0.10687255859375, 0.11183929443359375, 0.1168060302734375, 0.12177276611328125, 0.126739501953125, 0.13170623779296875, 0.1366729736328125, 0.14163970947265625, 0.1466064453125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 9.0, 9.0, 8.0, 11.0, 16.0, 20.0, 32.0, 32.0, 37.0, 47.0, 52.0, 70.0, 89.0, 99.0, 111.0, 87.0, 89.0, 60.0, 40.0, 30.0, 11.0, 6.0, 6.0, 8.0, 3.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2237436771392822, -1.1884782314300537, -1.1532129049301147, -1.1179474592208862, -1.0826821327209473, -1.0474166870117188, -1.0121513605117798, -0.9768859148025513, -0.9416205883026123, -0.9063552021980286, -0.8710898160934448, -0.8358244299888611, -0.8005590438842773, -0.7652936577796936, -0.7300282716751099, -0.6947628259658813, -0.6594974398612976, -0.6242320537567139, -0.5889666676521301, -0.5537012815475464, -0.5184358954429626, -0.4831705093383789, -0.4479050934314728, -0.41263970732688904, -0.3773743212223053, -0.34210893511772156, -0.3068435490131378, -0.2715781331062317, -0.23631276190280914, -0.2010473757982254, -0.16578197479248047, -0.13051658868789673, -0.09525120258331299, -0.05998581275343895, -0.02472042292356491, 0.010544970631599426, 0.045810356736183167, 0.0810757428407669, 0.11634114384651184, 0.15160652995109558, 0.18687191605567932, 0.22213730216026306, 0.2574026882648468, 0.29266810417175293, 0.32793349027633667, 0.3631988763809204, 0.39846426248550415, 0.4337296485900879, 0.46899503469467163, 0.5042604207992554, 0.5395258069038391, 0.5747911930084229, 0.6100565791130066, 0.6453219652175903, 0.6805874109268188, 0.7158527374267578, 0.7511181831359863, 0.7863835692405701, 0.8216489553451538, 0.8569143414497375, 0.8921797275543213, 0.927445113658905, 0.9627104997634888, 0.9979759454727173, 1.0332412719726562]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 5.0, 10.0, 10.0, 9.0, 14.0, 17.0, 34.0, 31.0, 33.0, 46.0, 31.0, 30.0, 45.0, 44.0, 35.0, 37.0, 36.0, 35.0, 39.0, 34.0, 46.0, 49.0, 31.0, 45.0, 37.0, 34.0, 37.0, 33.0, 19.0, 28.0, 18.0, 14.0, 5.0, 10.0, 2.0, 4.0, 4.0, 4.0, 0.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7265638113021851, -0.6995563507080078, -0.6725489497184753, -0.6455414891242981, -0.6185340881347656, -0.5915266275405884, -0.5645192265510559, -0.5375117659568787, -0.5105043649673462, -0.48349693417549133, -0.4564895033836365, -0.4294820725917816, -0.40247464179992676, -0.3754671812057495, -0.34845978021621704, -0.3214523196220398, -0.29444488883018494, -0.2674374580383301, -0.24043002724647522, -0.21342259645462036, -0.1864151656627655, -0.15940771996974945, -0.1324002891778946, -0.10539285838603973, -0.07838542759418488, -0.05137799680233002, -0.02437056228518486, 0.0026368722319602966, 0.029644303023815155, 0.05665174126625061, 0.08365917205810547, 0.11066660284996033, 0.13767403364181519, 0.16468146443367004, 0.1916888952255249, 0.21869632601737976, 0.24570375680923462, 0.27271121740341187, 0.29971861839294434, 0.3267260789871216, 0.35373347997665405, 0.3807409107685089, 0.40774834156036377, 0.43475577235221863, 0.4617632031440735, 0.48877066373825073, 0.5157780647277832, 0.5427855253219604, 0.5697929859161377, 0.5968004465103149, 0.6238078474998474, 0.6508153080940247, 0.6778227090835571, 0.7048301696777344, 0.7318375706672668, 0.7588450312614441, 0.7858524322509766, 0.8128598928451538, 0.8398672938346863, 0.8668747544288635, 0.893882155418396, 0.9208896160125732, 0.9478970170021057, 0.974904477596283, 1.0019118785858154]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 3.0, 6.0, 7.0, 9.0, 10.0, 13.0, 20.0, 36.0, 47.0, 62.0, 104.0, 200.0, 417.0, 976.0, 3170.0, 19156.0, 887227.0, 126954.0, 7028.0, 1708.0, 629.0, 281.0, 146.0, 106.0, 69.0, 48.0, 38.0, 24.0, 15.0, 10.0, 8.0, 8.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0439453125, -1.013916015625, -0.98388671875, -0.953857421875, -0.923828125, -0.893798828125, -0.86376953125, -0.833740234375, -0.8037109375, -0.773681640625, -0.74365234375, -0.713623046875, -0.68359375, -0.653564453125, -0.62353515625, -0.593505859375, -0.5634765625, -0.533447265625, -0.50341796875, -0.473388671875, -0.443359375, -0.413330078125, -0.38330078125, -0.353271484375, -0.3232421875, -0.293212890625, -0.26318359375, -0.233154296875, -0.203125, -0.173095703125, -0.14306640625, -0.113037109375, -0.0830078125, -0.052978515625, -0.02294921875, 0.007080078125, 0.037109375, 0.067138671875, 0.09716796875, 0.127197265625, 0.1572265625, 0.187255859375, 0.21728515625, 0.247314453125, 0.27734375, 0.307373046875, 0.33740234375, 0.367431640625, 0.3974609375, 0.427490234375, 0.45751953125, 0.487548828125, 0.517578125, 0.547607421875, 0.57763671875, 0.607666015625, 0.6376953125, 0.667724609375, 0.69775390625, 0.727783203125, 0.7578125, 0.787841796875, 0.81787109375, 0.847900390625, 0.8779296875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 21.0, 38.0, 79.0, 110.0, 164.0, 147.0, 167.0, 107.0, 72.0, 50.0, 16.0, 8.0, 5.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1336669921875, -0.13045215606689453, -0.12723731994628906, -0.1240224838256836, -0.12080764770507812, -0.11759281158447266, -0.11437797546386719, -0.11116313934326172, -0.10794830322265625, -0.10473346710205078, -0.10151863098144531, -0.09830379486083984, -0.09508895874023438, -0.0918741226196289, -0.08865928649902344, -0.08544445037841797, -0.0822296142578125, -0.07901477813720703, -0.07579994201660156, -0.0725851058959961, -0.06937026977539062, -0.06615543365478516, -0.06294059753417969, -0.05972576141357422, -0.05651092529296875, -0.05329608917236328, -0.05008125305175781, -0.046866416931152344, -0.043651580810546875, -0.040436744689941406, -0.03722190856933594, -0.03400707244873047, -0.030792236328125, -0.02757740020751953, -0.024362564086914062, -0.021147727966308594, -0.017932891845703125, -0.014718055725097656, -0.011503219604492188, -0.008288383483886719, -0.00507354736328125, -0.0018587112426757812, 0.0013561248779296875, 0.004570960998535156, 0.007785797119140625, 0.011000633239746094, 0.014215469360351562, 0.01743030548095703, 0.0206451416015625, 0.02385997772216797, 0.027074813842773438, 0.030289649963378906, 0.033504486083984375, 0.036719322204589844, 0.03993415832519531, 0.04314899444580078, 0.04636383056640625, 0.04957866668701172, 0.05279350280761719, 0.056008338928222656, 0.059223175048828125, 0.062438011169433594, 0.06565284729003906, 0.06886768341064453, 0.07208251953125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 6.0, 5.0, 13.0, 14.0, 15.0, 31.0, 48.0, 63.0, 107.0, 213.0, 352.0, 668.0, 1573.0, 4757.0, 23615.0, 413698.0, 568603.0, 26717.0, 5028.0, 1561.0, 696.0, 323.0, 163.0, 98.0, 57.0, 37.0, 24.0, 24.0, 9.0, 11.0, 7.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.39306640625, -0.3815155029296875, -0.369964599609375, -0.3584136962890625, -0.34686279296875, -0.3353118896484375, -0.323760986328125, -0.3122100830078125, -0.3006591796875, -0.2891082763671875, -0.277557373046875, -0.2660064697265625, -0.25445556640625, -0.2429046630859375, -0.231353759765625, -0.2198028564453125, -0.208251953125, -0.1967010498046875, -0.185150146484375, -0.1735992431640625, -0.16204833984375, -0.1504974365234375, -0.138946533203125, -0.1273956298828125, -0.1158447265625, -0.1042938232421875, -0.092742919921875, -0.0811920166015625, -0.06964111328125, -0.0580902099609375, -0.046539306640625, -0.0349884033203125, -0.0234375, -0.0118865966796875, -0.000335693359375, 0.0112152099609375, 0.02276611328125, 0.0343170166015625, 0.045867919921875, 0.0574188232421875, 0.0689697265625, 0.0805206298828125, 0.092071533203125, 0.1036224365234375, 0.11517333984375, 0.1267242431640625, 0.138275146484375, 0.1498260498046875, 0.161376953125, 0.1729278564453125, 0.184478759765625, 0.1960296630859375, 0.20758056640625, 0.2191314697265625, 0.230682373046875, 0.2422332763671875, 0.2537841796875, 0.2653350830078125, 0.276885986328125, 0.2884368896484375, 0.29998779296875, 0.3115386962890625, 0.323089599609375, 0.3346405029296875, 0.34619140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 7.0, 2.0, 6.0, 7.0, 12.0, 18.0, 12.0, 14.0, 20.0, 34.0, 33.0, 32.0, 45.0, 53.0, 69.0, 65.0, 73.0, 64.0, 65.0, 53.0, 58.0, 47.0, 48.0, 37.0, 28.0, 27.0, 19.0, 17.0, 14.0, 7.0, 6.0, 3.0, 8.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.155029296875, -0.14899444580078125, -0.1429595947265625, -0.13692474365234375, -0.130889892578125, -0.12485504150390625, -0.1188201904296875, -0.11278533935546875, -0.10675048828125, -0.10071563720703125, -0.0946807861328125, -0.08864593505859375, -0.082611083984375, -0.07657623291015625, -0.0705413818359375, -0.06450653076171875, -0.0584716796875, -0.05243682861328125, -0.0464019775390625, -0.04036712646484375, -0.034332275390625, -0.02829742431640625, -0.0222625732421875, -0.01622772216796875, -0.01019287109375, -0.00415802001953125, 0.0018768310546875, 0.00791168212890625, 0.013946533203125, 0.01998138427734375, 0.0260162353515625, 0.03205108642578125, 0.0380859375, 0.04412078857421875, 0.0501556396484375, 0.05619049072265625, 0.062225341796875, 0.06826019287109375, 0.0742950439453125, 0.08032989501953125, 0.08636474609375, 0.09239959716796875, 0.0984344482421875, 0.10446929931640625, 0.110504150390625, 0.11653900146484375, 0.1225738525390625, 0.12860870361328125, 0.1346435546875, 0.14067840576171875, 0.1467132568359375, 0.15274810791015625, 0.158782958984375, 0.16481781005859375, 0.1708526611328125, 0.17688751220703125, 0.18292236328125, 0.18895721435546875, 0.1949920654296875, 0.20102691650390625, 0.207061767578125, 0.21309661865234375, 0.2191314697265625, 0.22516632080078125, 0.231201171875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 6.0, 12.0, 24.0, 28.0, 59.0, 112.0, 201.0, 465.0, 1169.0, 5629.0, 381108.0, 651829.0, 5745.0, 1180.0, 461.0, 241.0, 99.0, 63.0, 33.0, 20.0, 16.0, 9.0, 6.0, 1.0, 2.0, 1.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.88525390625, -0.8641815185546875, -0.843109130859375, -0.8220367431640625, -0.80096435546875, -0.7798919677734375, -0.758819580078125, -0.7377471923828125, -0.7166748046875, -0.6956024169921875, -0.674530029296875, -0.6534576416015625, -0.63238525390625, -0.6113128662109375, -0.590240478515625, -0.5691680908203125, -0.548095703125, -0.5270233154296875, -0.505950927734375, -0.4848785400390625, -0.46380615234375, -0.4427337646484375, -0.421661376953125, -0.4005889892578125, -0.3795166015625, -0.3584442138671875, -0.337371826171875, -0.3162994384765625, -0.29522705078125, -0.2741546630859375, -0.253082275390625, -0.2320098876953125, -0.2109375, -0.1898651123046875, -0.168792724609375, -0.1477203369140625, -0.12664794921875, -0.1055755615234375, -0.084503173828125, -0.0634307861328125, -0.0423583984375, -0.0212860107421875, -0.000213623046875, 0.0208587646484375, 0.04193115234375, 0.0630035400390625, 0.084075927734375, 0.1051483154296875, 0.126220703125, 0.1472930908203125, 0.168365478515625, 0.1894378662109375, 0.21051025390625, 0.2315826416015625, 0.252655029296875, 0.2737274169921875, 0.2947998046875, 0.3158721923828125, 0.336944580078125, 0.3580169677734375, 0.37908935546875, 0.4001617431640625, 0.421234130859375, 0.4423065185546875, 0.46337890625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 11.0, 8.0, 8.0, 13.0, 19.0, 22.0, 15.0, 32.0, 27.0, 29.0, 47.0, 56.0, 80.0, 79.0, 102.0, 88.0, 74.0, 54.0, 43.0, 45.0, 26.0, 26.0, 16.0, 17.0, 9.0, 11.0, 4.0, 10.0, 4.0, 8.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010591745376586914, -0.0001021726056933403, -9.842775762081146e-05, -9.468290954828262e-05, -9.093806147575378e-05, -8.719321340322495e-05, -8.34483653306961e-05, -7.970351725816727e-05, -7.595866918563843e-05, -7.221382111310959e-05, -6.846897304058075e-05, -6.472412496805191e-05, -6.097927689552307e-05, -5.723442882299423e-05, -5.348958075046539e-05, -4.9744732677936554e-05, -4.5999884605407715e-05, -4.2255036532878876e-05, -3.851018846035004e-05, -3.47653403878212e-05, -3.102049231529236e-05, -2.727564424276352e-05, -2.353079617023468e-05, -1.978594809770584e-05, -1.6041100025177002e-05, -1.2296251952648163e-05, -8.551403880119324e-06, -4.806555807590485e-06, -1.0617077350616455e-06, 2.6831403374671936e-06, 6.427988409996033e-06, 1.0172836482524872e-05, 1.3917684555053711e-05, 1.766253262758255e-05, 2.140738070011139e-05, 2.5152228772640228e-05, 2.8897076845169067e-05, 3.2641924917697906e-05, 3.6386772990226746e-05, 4.0131621062755585e-05, 4.3876469135284424e-05, 4.762131720781326e-05, 5.13661652803421e-05, 5.511101335287094e-05, 5.885586142539978e-05, 6.260070949792862e-05, 6.634555757045746e-05, 7.00904056429863e-05, 7.383525371551514e-05, 7.758010178804398e-05, 8.132494986057281e-05, 8.506979793310165e-05, 8.881464600563049e-05, 9.255949407815933e-05, 9.630434215068817e-05, 0.00010004919022321701, 0.00010379403829574585, 0.00010753888636827469, 0.00011128373444080353, 0.00011502858251333237, 0.0001187734305858612, 0.00012251827865839005, 0.00012626312673091888, 0.00013000797480344772, 0.00013375282287597656]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 8.0, 8.0, 7.0, 17.0, 18.0, 18.0, 33.0, 34.0, 49.0, 93.0, 94.0, 186.0, 279.0, 433.0, 682.0, 1266.0, 2560.0, 5943.0, 17407.0, 111175.0, 822329.0, 63047.0, 13028.0, 4751.0, 2167.0, 1118.0, 613.0, 380.0, 240.0, 155.0, 95.0, 99.0, 52.0, 44.0, 36.0, 19.0, 14.0, 12.0, 7.0, 9.0, 6.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.2138671875, -0.2074604034423828, -0.20105361938476562, -0.19464683532714844, -0.18824005126953125, -0.18183326721191406, -0.17542648315429688, -0.1690196990966797, -0.1626129150390625, -0.1562061309814453, -0.14979934692382812, -0.14339256286621094, -0.13698577880859375, -0.13057899475097656, -0.12417221069335938, -0.11776542663574219, -0.111358642578125, -0.10495185852050781, -0.09854507446289062, -0.09213829040527344, -0.08573150634765625, -0.07932472229003906, -0.07291793823242188, -0.06651115417480469, -0.0601043701171875, -0.05369758605957031, -0.047290802001953125, -0.04088401794433594, -0.03447723388671875, -0.028070449829101562, -0.021663665771484375, -0.015256881713867188, -0.00885009765625, -0.0024433135986328125, 0.003963470458984375, 0.010370254516601562, 0.01677703857421875, 0.023183822631835938, 0.029590606689453125, 0.03599739074707031, 0.0424041748046875, 0.04881095886230469, 0.055217742919921875, 0.06162452697753906, 0.06803131103515625, 0.07443809509277344, 0.08084487915039062, 0.08725166320800781, 0.093658447265625, 0.10006523132324219, 0.10647201538085938, 0.11287879943847656, 0.11928558349609375, 0.12569236755371094, 0.13209915161132812, 0.1385059356689453, 0.1449127197265625, 0.1513195037841797, 0.15772628784179688, 0.16413307189941406, 0.17053985595703125, 0.17694664001464844, 0.18335342407226562, 0.1897602081298828, 0.1961669921875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 1.0, 4.0, 8.0, 15.0, 14.0, 31.0, 58.0, 99.0, 137.0, 243.0, 160.0, 97.0, 45.0, 30.0, 14.0, 9.0, 5.0, 5.0, 8.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2398681640625, -0.23308753967285156, -0.22630691528320312, -0.2195262908935547, -0.21274566650390625, -0.2059650421142578, -0.19918441772460938, -0.19240379333496094, -0.1856231689453125, -0.17884254455566406, -0.17206192016601562, -0.1652812957763672, -0.15850067138671875, -0.1517200469970703, -0.14493942260742188, -0.13815879821777344, -0.131378173828125, -0.12459754943847656, -0.11781692504882812, -0.11103630065917969, -0.10425567626953125, -0.09747505187988281, -0.09069442749023438, -0.08391380310058594, -0.0771331787109375, -0.07035255432128906, -0.06357192993164062, -0.05679130554199219, -0.05001068115234375, -0.04323005676269531, -0.036449432373046875, -0.029668807983398438, -0.02288818359375, -0.016107559204101562, -0.009326934814453125, -0.0025463104248046875, 0.00423431396484375, 0.011014938354492188, 0.017795562744140625, 0.024576187133789062, 0.0313568115234375, 0.03813743591308594, 0.044918060302734375, 0.05169868469238281, 0.05847930908203125, 0.06525993347167969, 0.07204055786132812, 0.07882118225097656, 0.085601806640625, 0.09238243103027344, 0.09916305541992188, 0.10594367980957031, 0.11272430419921875, 0.11950492858886719, 0.12628555297851562, 0.13306617736816406, 0.1398468017578125, 0.14662742614746094, 0.15340805053710938, 0.1601886749267578, 0.16696929931640625, 0.1737499237060547, 0.18053054809570312, 0.18731117248535156, 0.194091796875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 9.0, 14.0, 28.0, 51.0, 114.0, 296.0, 278.0, 134.0, 49.0, 22.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.948605060577393, -5.8271331787109375, -5.705661296844482, -5.584188938140869, -5.462717056274414, -5.341245174407959, -5.219773292541504, -5.098301410675049, -4.976829528808594, -4.855357646942139, -4.733885765075684, -4.61241340637207, -4.490941524505615, -4.36946964263916, -4.247997760772705, -4.12652587890625, -4.005053520202637, -3.8835816383361816, -3.7621095180511475, -3.6406376361846924, -3.519165515899658, -3.397693634033203, -3.276221752166748, -3.154749870300293, -3.033277750015259, -2.9118058681488037, -2.7903337478637695, -2.6688618659973145, -2.5473899841308594, -2.425917863845825, -2.30444598197937, -2.182973861694336, -2.061501979827881, -1.9400299787521362, -1.8185579776763916, -1.6970860958099365, -1.575614094734192, -1.4541420936584473, -1.3326702117919922, -1.2111982107162476, -1.0897260904312134, -0.9682540893554688, -0.8467821478843689, -0.725310206413269, -0.6038382053375244, -0.4823662042617798, -0.36089426279067993, -0.23942232131958008, -0.11795032024383545, 0.003521651029586792, 0.12499362230300903, 0.24646559357643127, 0.3679375648498535, 0.48940956592559814, 0.610881507396698, 0.7323534488677979, 0.8538254499435425, 0.9752974510192871, 1.0967693328857422, 1.2182413339614868, 1.3397133350372314, 1.461185336112976, 1.5826573371887207, 1.7041292190551758, 1.8256012201309204]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 8.0, 15.0, 14.0, 20.0, 26.0, 26.0, 27.0, 31.0, 50.0, 49.0, 51.0, 51.0, 75.0, 75.0, 63.0, 78.0, 65.0, 51.0, 42.0, 47.0, 23.0, 24.0, 21.0, 20.0, 17.0, 12.0, 7.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0], "bins": [-1.3496026992797852, -1.3180228471755981, -1.2864429950714111, -1.2548632621765137, -1.2232834100723267, -1.1917035579681396, -1.1601238250732422, -1.1285439729690552, -1.0969641208648682, -1.0653842687606812, -1.0338044166564941, -1.0022246837615967, -0.9706448316574097, -0.9390649795532227, -0.9074851870536804, -0.8759053945541382, -0.8443255424499512, -0.8127456903457642, -0.7811658978462219, -0.7495861053466797, -0.7180062532424927, -0.6864264011383057, -0.6548466086387634, -0.6232668161392212, -0.5916869640350342, -0.5601071119308472, -0.5285273194313049, -0.4969474971294403, -0.4653676748275757, -0.43378785252571106, -0.40220803022384644, -0.3706282079219818, -0.3390483856201172, -0.30746856331825256, -0.27588874101638794, -0.24430891871452332, -0.2127290964126587, -0.18114927411079407, -0.14956945180892944, -0.11798962950706482, -0.0864098072052002, -0.05482998490333557, -0.023250162601470947, 0.008329659700393677, 0.0399094820022583, 0.07148930430412292, 0.10306912660598755, 0.13464894890785217, 0.1662287712097168, 0.19780859351158142, 0.22938841581344604, 0.26096823811531067, 0.2925480604171753, 0.3241278827190399, 0.35570770502090454, 0.38728752732276917, 0.4188673496246338, 0.4504471719264984, 0.48202699422836304, 0.5136067867279053, 0.5451866388320923, 0.5767664909362793, 0.6083462834358215, 0.6399260759353638, 0.6715059280395508]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 5.0, 4.0, 7.0, 9.0, 8.0, 10.0, 10.0, 20.0, 16.0, 21.0, 21.0, 29.0, 38.0, 58.0, 66.0, 90.0, 117.0, 152.0, 200.0, 250.0, 410.0, 610.0, 1068.0, 2025.0, 5305.0, 22277.0, 351671.0, 3716857.0, 73207.0, 11984.0, 4044.0, 1720.0, 812.0, 421.0, 264.0, 156.0, 96.0, 68.0, 58.0, 28.0, 20.0, 12.0, 11.0, 6.0, 5.0, 4.0, 7.0, 3.0, 4.0, 4.0, 1.0, 1.0], "bins": [-0.325927734375, -0.3176250457763672, -0.3093223571777344, -0.30101966857910156, -0.29271697998046875, -0.28441429138183594, -0.2761116027832031, -0.2678089141845703, -0.2595062255859375, -0.2512035369873047, -0.24290084838867188, -0.23459815979003906, -0.22629547119140625, -0.21799278259277344, -0.20969009399414062, -0.2013874053955078, -0.193084716796875, -0.1847820281982422, -0.17647933959960938, -0.16817665100097656, -0.15987396240234375, -0.15157127380371094, -0.14326858520507812, -0.1349658966064453, -0.1266632080078125, -0.11836051940917969, -0.11005783081054688, -0.10175514221191406, -0.09345245361328125, -0.08514976501464844, -0.07684707641601562, -0.06854438781738281, -0.06024169921875, -0.05193901062011719, -0.043636322021484375, -0.03533363342285156, -0.02703094482421875, -0.018728256225585938, -0.010425567626953125, -0.0021228790283203125, 0.0061798095703125, 0.014482498168945312, 0.022785186767578125, 0.031087875366210938, 0.03939056396484375, 0.04769325256347656, 0.055995941162109375, 0.06429862976074219, 0.072601318359375, 0.08090400695800781, 0.08920669555664062, 0.09750938415527344, 0.10581207275390625, 0.11411476135253906, 0.12241744995117188, 0.1307201385498047, 0.1390228271484375, 0.1473255157470703, 0.15562820434570312, 0.16393089294433594, 0.17223358154296875, 0.18053627014160156, 0.18883895874023438, 0.1971416473388672, 0.2054443359375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 21.0, 43.0, 94.0, 114.0, 173.0, 148.0, 149.0, 103.0, 69.0, 33.0, 24.0, 2.0, 8.0, 1.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1317138671875, -0.12853050231933594, -0.12534713745117188, -0.12216377258300781, -0.11898040771484375, -0.11579704284667969, -0.11261367797851562, -0.10943031311035156, -0.1062469482421875, -0.10306358337402344, -0.09988021850585938, -0.09669685363769531, -0.09351348876953125, -0.09033012390136719, -0.08714675903320312, -0.08396339416503906, -0.080780029296875, -0.07759666442871094, -0.07441329956054688, -0.07122993469238281, -0.06804656982421875, -0.06486320495605469, -0.061679840087890625, -0.05849647521972656, -0.0553131103515625, -0.05212974548339844, -0.048946380615234375, -0.04576301574707031, -0.04257965087890625, -0.03939628601074219, -0.036212921142578125, -0.03302955627441406, -0.02984619140625, -0.026662826538085938, -0.023479461669921875, -0.020296096801757812, -0.01711273193359375, -0.013929367065429688, -0.010746002197265625, -0.0075626373291015625, -0.0043792724609375, -0.0011959075927734375, 0.001987457275390625, 0.0051708221435546875, 0.00835418701171875, 0.011537551879882812, 0.014720916748046875, 0.017904281616210938, 0.021087646484375, 0.024271011352539062, 0.027454376220703125, 0.030637741088867188, 0.03382110595703125, 0.03700447082519531, 0.040187835693359375, 0.04337120056152344, 0.0465545654296875, 0.04973793029785156, 0.052921295166015625, 0.05610466003417969, 0.05928802490234375, 0.06247138977050781, 0.06565475463867188, 0.06883811950683594, 0.072021484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 4.0, 9.0, 17.0, 34.0, 34.0, 55.0, 93.0, 168.0, 227.0, 279.0, 473.0, 654.0, 891.0, 1418.0, 2043.0, 3591.0, 6830.0, 15964.0, 52036.0, 327579.0, 3365309.0, 327194.0, 55344.0, 17421.0, 7585.0, 3750.0, 2099.0, 1139.0, 720.0, 446.0, 248.0, 203.0, 133.0, 94.0, 54.0, 48.0, 44.0, 26.0, 12.0, 2.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1378173828125, -0.1329803466796875, -0.128143310546875, -0.1233062744140625, -0.11846923828125, -0.1136322021484375, -0.108795166015625, -0.1039581298828125, -0.09912109375, -0.0942840576171875, -0.089447021484375, -0.0846099853515625, -0.07977294921875, -0.0749359130859375, -0.070098876953125, -0.0652618408203125, -0.0604248046875, -0.0555877685546875, -0.050750732421875, -0.0459136962890625, -0.04107666015625, -0.0362396240234375, -0.031402587890625, -0.0265655517578125, -0.021728515625, -0.0168914794921875, -0.012054443359375, -0.0072174072265625, -0.00238037109375, 0.0024566650390625, 0.007293701171875, 0.0121307373046875, 0.0169677734375, 0.0218048095703125, 0.026641845703125, 0.0314788818359375, 0.03631591796875, 0.0411529541015625, 0.045989990234375, 0.0508270263671875, 0.0556640625, 0.0605010986328125, 0.065338134765625, 0.0701751708984375, 0.07501220703125, 0.0798492431640625, 0.084686279296875, 0.0895233154296875, 0.0943603515625, 0.0991973876953125, 0.104034423828125, 0.1088714599609375, 0.11370849609375, 0.1185455322265625, 0.123382568359375, 0.1282196044921875, 0.133056640625, 0.1378936767578125, 0.142730712890625, 0.1475677490234375, 0.15240478515625, 0.1572418212890625, 0.162078857421875, 0.1669158935546875, 0.1717529296875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 6.0, 18.0, 24.0, 42.0, 69.0, 93.0, 199.0, 370.0, 960.0, 1036.0, 482.0, 240.0, 152.0, 110.0, 65.0, 48.0, 26.0, 21.0, 22.0, 14.0, 11.0, 8.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.188232421875, -0.18329429626464844, -0.17835617065429688, -0.1734180450439453, -0.16847991943359375, -0.1635417938232422, -0.15860366821289062, -0.15366554260253906, -0.1487274169921875, -0.14378929138183594, -0.13885116577148438, -0.1339130401611328, -0.12897491455078125, -0.12403678894042969, -0.11909866333007812, -0.11416053771972656, -0.109222412109375, -0.10428428649902344, -0.09934616088867188, -0.09440803527832031, -0.08946990966796875, -0.08453178405761719, -0.07959365844726562, -0.07465553283691406, -0.0697174072265625, -0.06477928161621094, -0.059841156005859375, -0.05490303039550781, -0.04996490478515625, -0.04502677917480469, -0.040088653564453125, -0.03515052795410156, -0.03021240234375, -0.025274276733398438, -0.020336151123046875, -0.015398025512695312, -0.01045989990234375, -0.0055217742919921875, -0.000583648681640625, 0.0043544769287109375, 0.0092926025390625, 0.014230728149414062, 0.019168853759765625, 0.024106979370117188, 0.02904510498046875, 0.03398323059082031, 0.038921356201171875, 0.04385948181152344, 0.048797607421875, 0.05373573303222656, 0.058673858642578125, 0.06361198425292969, 0.06855010986328125, 0.07348823547363281, 0.07842636108398438, 0.08336448669433594, 0.0883026123046875, 0.09324073791503906, 0.09817886352539062, 0.10311698913574219, 0.10805511474609375, 0.11299324035644531, 0.11793136596679688, 0.12286949157714844, 0.1278076171875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 1.0, 1.0, 7.0, 13.0, 16.0, 17.0, 42.0, 45.0, 71.0, 94.0, 105.0, 145.0, 102.0, 90.0, 53.0, 52.0, 38.0, 27.0, 18.0, 15.0, 8.0, 15.0, 3.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.387558937072754, -1.3371734619140625, -1.2867878675460815, -1.2364022731781006, -1.1860167980194092, -1.1356313228607178, -1.0852457284927368, -1.0348601341247559, -0.9844746589660645, -0.9340891242027283, -0.8837035894393921, -0.8333180546760559, -0.7829325199127197, -0.7325469851493835, -0.6821614503860474, -0.6317759156227112, -0.581390380859375, -0.5310048460960388, -0.48061931133270264, -0.43023377656936646, -0.3798482418060303, -0.3294627070426941, -0.2790771722793579, -0.22869163751602173, -0.17830610275268555, -0.12792056798934937, -0.07753503322601318, -0.027149498462677002, 0.02323603630065918, 0.07362157106399536, 0.12400710582733154, 0.17439264059066772, 0.2247781753540039, 0.2751637101173401, 0.32554924488067627, 0.37593477964401245, 0.42632031440734863, 0.4767058491706848, 0.527091383934021, 0.5774769186973572, 0.6278624534606934, 0.6782479882240295, 0.7286335229873657, 0.7790190577507019, 0.8294045925140381, 0.8797901272773743, 0.9301756620407104, 0.9805611968040466, 1.0309467315673828, 1.0813322067260742, 1.1317178010940552, 1.1821033954620361, 1.2324888706207275, 1.282874345779419, 1.3332599401474, 1.3836455345153809, 1.4340310096740723, 1.4844164848327637, 1.5348020792007446, 1.5851876735687256, 1.635573148727417, 1.6859586238861084, 1.7363442182540894, 1.7867298126220703, 1.8371152877807617]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 4.0, 12.0, 10.0, 16.0, 12.0, 24.0, 27.0, 26.0, 41.0, 29.0, 35.0, 43.0, 56.0, 45.0, 45.0, 59.0, 58.0, 50.0, 38.0, 47.0, 45.0, 42.0, 30.0, 35.0, 30.0, 26.0, 26.0, 19.0, 22.0, 12.0, 9.0, 6.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.313619613647461, -1.2759904861450195, -1.2383614778518677, -1.2007323503494263, -1.1631033420562744, -1.125474214553833, -1.0878452062606812, -1.0502160787582397, -1.012587070465088, -0.9749580025672913, -0.9373289346694946, -0.899699866771698, -0.8620707988739014, -0.8244417309761047, -0.7868126630783081, -0.7491835355758667, -0.7115544676780701, -0.6739253997802734, -0.6362963318824768, -0.5986672639846802, -0.5610381960868835, -0.5234091281890869, -0.4857800304889679, -0.44815096259117126, -0.41052189469337463, -0.372892826795578, -0.33526375889778137, -0.29763466119766235, -0.2600055932998657, -0.22237654030323029, -0.18474745750427246, -0.14711838960647583, -0.1094893217086792, -0.07186025381088257, -0.03423117846250534, 0.003397896885871887, 0.04102696478366852, 0.07865603268146515, 0.11628511548042297, 0.1539141833782196, 0.19154325127601624, 0.22917231917381287, 0.2668013870716095, 0.3044304847717285, 0.34205955266952515, 0.3796886205673218, 0.4173176884651184, 0.45494675636291504, 0.49257582426071167, 0.5302048921585083, 0.5678339600563049, 0.6054630279541016, 0.6430920958518982, 0.6807211637496948, 0.7183502912521362, 0.7559792995452881, 0.7936084270477295, 0.8312374949455261, 0.8688665628433228, 0.9064956307411194, 0.944124698638916, 0.9817537665367126, 1.0193828344345093, 1.0570119619369507, 1.0946409702301025]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 5.0, 4.0, 11.0, 16.0, 15.0, 26.0, 41.0, 65.0, 99.0, 165.0, 257.0, 424.0, 725.0, 1505.0, 3687.0, 13095.0, 87141.0, 757419.0, 156067.0, 19239.0, 4697.0, 1756.0, 873.0, 432.0, 270.0, 180.0, 115.0, 86.0, 50.0, 25.0, 23.0, 15.0, 4.0, 11.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.406982421875, -0.3945045471191406, -0.38202667236328125, -0.3695487976074219, -0.3570709228515625, -0.3445930480957031, -0.33211517333984375, -0.3196372985839844, -0.307159423828125, -0.2946815490722656, -0.28220367431640625, -0.2697257995605469, -0.2572479248046875, -0.24477005004882812, -0.23229217529296875, -0.21981430053710938, -0.20733642578125, -0.19485855102539062, -0.18238067626953125, -0.16990280151367188, -0.1574249267578125, -0.14494705200195312, -0.13246917724609375, -0.11999130249023438, -0.107513427734375, -0.09503555297851562, -0.08255767822265625, -0.07007980346679688, -0.0576019287109375, -0.045124053955078125, -0.03264617919921875, -0.020168304443359375, -0.0076904296875, 0.004787445068359375, 0.01726531982421875, 0.029743194580078125, 0.0422210693359375, 0.054698944091796875, 0.06717681884765625, 0.07965469360351562, 0.092132568359375, 0.10461044311523438, 0.11708831787109375, 0.12956619262695312, 0.1420440673828125, 0.15452194213867188, 0.16699981689453125, 0.17947769165039062, 0.19195556640625, 0.20443344116210938, 0.21691131591796875, 0.22938919067382812, 0.2418670654296875, 0.2543449401855469, 0.26682281494140625, 0.2793006896972656, 0.291778564453125, 0.3042564392089844, 0.31673431396484375, 0.3292121887207031, 0.3416900634765625, 0.3541679382324219, 0.36664581298828125, 0.3791236877441406, 0.3916015625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 7.0, 9.0, 26.0, 37.0, 56.0, 83.0, 96.0, 124.0, 129.0, 117.0, 90.0, 86.0, 44.0, 32.0, 21.0, 14.0, 10.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.133056640625, -0.1296863555908203, -0.12631607055664062, -0.12294578552246094, -0.11957550048828125, -0.11620521545410156, -0.11283493041992188, -0.10946464538574219, -0.1060943603515625, -0.10272407531738281, -0.09935379028320312, -0.09598350524902344, -0.09261322021484375, -0.08924293518066406, -0.08587265014648438, -0.08250236511230469, -0.079132080078125, -0.07576179504394531, -0.07239151000976562, -0.06902122497558594, -0.06565093994140625, -0.06228065490722656, -0.058910369873046875, -0.05554008483886719, -0.0521697998046875, -0.04879951477050781, -0.045429229736328125, -0.04205894470214844, -0.03868865966796875, -0.03531837463378906, -0.031948089599609375, -0.028577804565429688, -0.02520751953125, -0.021837234497070312, -0.018466949462890625, -0.015096664428710938, -0.01172637939453125, -0.008356094360351562, -0.004985809326171875, -0.0016155242919921875, 0.0017547607421875, 0.0051250457763671875, 0.008495330810546875, 0.011865615844726562, 0.01523590087890625, 0.018606185913085938, 0.021976470947265625, 0.025346755981445312, 0.028717041015625, 0.03208732604980469, 0.035457611083984375, 0.03882789611816406, 0.04219818115234375, 0.04556846618652344, 0.048938751220703125, 0.05230903625488281, 0.0556793212890625, 0.05904960632324219, 0.062419891357421875, 0.06579017639160156, 0.06916046142578125, 0.07253074645996094, 0.07590103149414062, 0.07927131652832031, 0.0826416015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 10.0, 14.0, 42.0, 51.0, 79.0, 148.0, 267.0, 568.0, 1148.0, 2404.0, 5335.0, 12643.0, 32509.0, 101590.0, 487021.0, 288346.0, 73260.0, 24880.0, 9900.0, 4430.0, 1967.0, 904.0, 442.0, 254.0, 143.0, 75.0, 36.0, 28.0, 21.0, 8.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2203369140625, -0.21383094787597656, -0.20732498168945312, -0.2008190155029297, -0.19431304931640625, -0.1878070831298828, -0.18130111694335938, -0.17479515075683594, -0.1682891845703125, -0.16178321838378906, -0.15527725219726562, -0.1487712860107422, -0.14226531982421875, -0.1357593536376953, -0.12925338745117188, -0.12274742126464844, -0.116241455078125, -0.10973548889160156, -0.10322952270507812, -0.09672355651855469, -0.09021759033203125, -0.08371162414550781, -0.07720565795898438, -0.07069969177246094, -0.0641937255859375, -0.05768775939941406, -0.051181793212890625, -0.04467582702636719, -0.03816986083984375, -0.03166389465332031, -0.025157928466796875, -0.018651962280273438, -0.01214599609375, -0.0056400299072265625, 0.000865936279296875, 0.0073719024658203125, 0.01387786865234375, 0.020383834838867188, 0.026889801025390625, 0.03339576721191406, 0.0399017333984375, 0.04640769958496094, 0.052913665771484375, 0.05941963195800781, 0.06592559814453125, 0.07243156433105469, 0.07893753051757812, 0.08544349670410156, 0.091949462890625, 0.09845542907714844, 0.10496139526367188, 0.11146736145019531, 0.11797332763671875, 0.12447929382324219, 0.13098526000976562, 0.13749122619628906, 0.1439971923828125, 0.15050315856933594, 0.15700912475585938, 0.1635150909423828, 0.17002105712890625, 0.1765270233154297, 0.18303298950195312, 0.18953895568847656, 0.196044921875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 7.0, 9.0, 11.0, 12.0, 11.0, 20.0, 25.0, 19.0, 16.0, 38.0, 35.0, 45.0, 39.0, 43.0, 47.0, 51.0, 55.0, 47.0, 63.0, 52.0, 34.0, 48.0, 43.0, 39.0, 39.0, 14.0, 24.0, 25.0, 11.0, 14.0, 17.0, 7.0, 5.0, 9.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.209228515625, -0.20272445678710938, -0.19622039794921875, -0.18971633911132812, -0.1832122802734375, -0.17670822143554688, -0.17020416259765625, -0.16370010375976562, -0.157196044921875, -0.15069198608398438, -0.14418792724609375, -0.13768386840820312, -0.1311798095703125, -0.12467575073242188, -0.11817169189453125, -0.11166763305664062, -0.10516357421875, -0.09865951538085938, -0.09215545654296875, -0.08565139770507812, -0.0791473388671875, -0.07264328002929688, -0.06613922119140625, -0.059635162353515625, -0.053131103515625, -0.046627044677734375, -0.04012298583984375, -0.033618927001953125, -0.0271148681640625, -0.020610809326171875, -0.01410675048828125, -0.007602691650390625, -0.0010986328125, 0.005405426025390625, 0.01190948486328125, 0.018413543701171875, 0.0249176025390625, 0.031421661376953125, 0.03792572021484375, 0.044429779052734375, 0.050933837890625, 0.057437896728515625, 0.06394195556640625, 0.07044601440429688, 0.0769500732421875, 0.08345413208007812, 0.08995819091796875, 0.09646224975585938, 0.10296630859375, 0.10947036743164062, 0.11597442626953125, 0.12247848510742188, 0.1289825439453125, 0.13548660278320312, 0.14199066162109375, 0.14849472045898438, 0.154998779296875, 0.16150283813476562, 0.16800689697265625, 0.17451095581054688, 0.1810150146484375, 0.18751907348632812, 0.19402313232421875, 0.20052719116210938, 0.20703125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 11.0, 18.0, 34.0, 45.0, 65.0, 138.0, 269.0, 678.0, 1874.0, 6868.0, 39760.0, 760367.0, 211723.0, 20315.0, 4153.0, 1255.0, 486.0, 216.0, 109.0, 66.0, 28.0, 18.0, 17.0, 14.0, 4.0, 5.0, 1.0, 6.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1529541015625, -0.14868450164794922, -0.14441490173339844, -0.14014530181884766, -0.13587570190429688, -0.1316061019897461, -0.1273365020751953, -0.12306690216064453, -0.11879730224609375, -0.11452770233154297, -0.11025810241699219, -0.1059885025024414, -0.10171890258789062, -0.09744930267333984, -0.09317970275878906, -0.08891010284423828, -0.0846405029296875, -0.08037090301513672, -0.07610130310058594, -0.07183170318603516, -0.06756210327148438, -0.0632925033569336, -0.05902290344238281, -0.05475330352783203, -0.05048370361328125, -0.04621410369873047, -0.04194450378417969, -0.037674903869628906, -0.033405303955078125, -0.029135704040527344, -0.024866104125976562, -0.02059650421142578, -0.016326904296875, -0.012057304382324219, -0.0077877044677734375, -0.0035181045532226562, 0.000751495361328125, 0.005021095275878906, 0.009290695190429688, 0.013560295104980469, 0.01782989501953125, 0.02209949493408203, 0.026369094848632812, 0.030638694763183594, 0.034908294677734375, 0.039177894592285156, 0.04344749450683594, 0.04771709442138672, 0.0519866943359375, 0.05625629425048828, 0.06052589416503906, 0.06479549407958984, 0.06906509399414062, 0.0733346939086914, 0.07760429382324219, 0.08187389373779297, 0.08614349365234375, 0.09041309356689453, 0.09468269348144531, 0.0989522933959961, 0.10322189331054688, 0.10749149322509766, 0.11176109313964844, 0.11603069305419922, 0.12030029296875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 5.0, 4.0, 4.0, 13.0, 13.0, 12.0, 16.0, 21.0, 41.0, 81.0, 114.0, 150.0, 149.0, 138.0, 81.0, 42.0, 30.0, 18.0, 14.0, 7.0, 8.0, 6.0, 6.0, 8.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00014400482177734375, -0.00014023110270500183, -0.0001364573836326599, -0.000132683664560318, -0.00012890994548797607, -0.00012513622641563416, -0.00012136250734329224, -0.00011758878827095032, -0.0001138150691986084, -0.00011004135012626648, -0.00010626763105392456, -0.00010249391198158264, -9.872019290924072e-05, -9.49464738368988e-05, -9.117275476455688e-05, -8.739903569221497e-05, -8.362531661987305e-05, -7.985159754753113e-05, -7.607787847518921e-05, -7.230415940284729e-05, -6.853044033050537e-05, -6.475672125816345e-05, -6.098300218582153e-05, -5.7209283113479614e-05, -5.3435564041137695e-05, -4.9661844968795776e-05, -4.588812589645386e-05, -4.211440682411194e-05, -3.834068775177002e-05, -3.45669686794281e-05, -3.079324960708618e-05, -2.7019530534744263e-05, -2.3245811462402344e-05, -1.9472092390060425e-05, -1.5698373317718506e-05, -1.1924654245376587e-05, -8.150935173034668e-06, -4.377216100692749e-06, -6.034970283508301e-07, 3.170222043991089e-06, 6.943941116333008e-06, 1.0717660188674927e-05, 1.4491379261016846e-05, 1.8265098333358765e-05, 2.2038817405700684e-05, 2.5812536478042603e-05, 2.958625555038452e-05, 3.335997462272644e-05, 3.713369369506836e-05, 4.090741276741028e-05, 4.46811318397522e-05, 4.8454850912094116e-05, 5.2228569984436035e-05, 5.6002289056777954e-05, 5.977600812911987e-05, 6.354972720146179e-05, 6.732344627380371e-05, 7.109716534614563e-05, 7.487088441848755e-05, 7.864460349082947e-05, 8.241832256317139e-05, 8.61920416355133e-05, 8.996576070785522e-05, 9.373947978019714e-05, 9.751319885253906e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 10.0, 9.0, 7.0, 24.0, 22.0, 47.0, 48.0, 62.0, 166.0, 242.0, 409.0, 756.0, 1501.0, 2854.0, 6087.0, 13811.0, 36006.0, 132010.0, 620415.0, 163123.0, 41851.0, 15546.0, 6877.0, 3146.0, 1592.0, 847.0, 427.0, 237.0, 163.0, 84.0, 64.0, 36.0, 24.0, 20.0, 9.0, 8.0, 3.0, 4.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061492919921875, -0.059481143951416016, -0.05746936798095703, -0.05545759201049805, -0.05344581604003906, -0.05143404006958008, -0.049422264099121094, -0.04741048812866211, -0.045398712158203125, -0.04338693618774414, -0.041375160217285156, -0.03936338424682617, -0.03735160827636719, -0.0353398323059082, -0.03332805633544922, -0.031316280364990234, -0.02930450439453125, -0.027292728424072266, -0.02528095245361328, -0.023269176483154297, -0.021257400512695312, -0.019245624542236328, -0.017233848571777344, -0.01522207260131836, -0.013210296630859375, -0.01119852066040039, -0.009186744689941406, -0.007174968719482422, -0.0051631927490234375, -0.003151416778564453, -0.0011396408081054688, 0.0008721351623535156, 0.0028839111328125, 0.004895687103271484, 0.006907463073730469, 0.008919239044189453, 0.010931015014648438, 0.012942790985107422, 0.014954566955566406, 0.01696634292602539, 0.018978118896484375, 0.02098989486694336, 0.023001670837402344, 0.025013446807861328, 0.027025222778320312, 0.029036998748779297, 0.03104877471923828, 0.033060550689697266, 0.03507232666015625, 0.037084102630615234, 0.03909587860107422, 0.0411076545715332, 0.04311943054199219, 0.04513120651245117, 0.047142982482910156, 0.04915475845336914, 0.051166534423828125, 0.05317831039428711, 0.055190086364746094, 0.05720186233520508, 0.05921363830566406, 0.06122541427612305, 0.06323719024658203, 0.06524896621704102, 0.0672607421875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 11.0, 8.0, 4.0, 16.0, 12.0, 20.0, 28.0, 28.0, 29.0, 38.0, 60.0, 53.0, 91.0, 131.0, 100.0, 82.0, 53.0, 47.0, 41.0, 28.0, 16.0, 21.0, 17.0, 14.0, 10.0, 10.0, 10.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0699462890625, -0.06767082214355469, -0.06539535522460938, -0.06311988830566406, -0.06084442138671875, -0.05856895446777344, -0.056293487548828125, -0.05401802062988281, -0.0517425537109375, -0.04946708679199219, -0.047191619873046875, -0.04491615295410156, -0.04264068603515625, -0.04036521911621094, -0.038089752197265625, -0.03581428527832031, -0.033538818359375, -0.03126335144042969, -0.028987884521484375, -0.026712417602539062, -0.02443695068359375, -0.022161483764648438, -0.019886016845703125, -0.017610549926757812, -0.0153350830078125, -0.013059616088867188, -0.010784149169921875, -0.008508682250976562, -0.00623321533203125, -0.0039577484130859375, -0.001682281494140625, 0.0005931854248046875, 0.00286865234375, 0.0051441192626953125, 0.007419586181640625, 0.009695053100585938, 0.01197052001953125, 0.014245986938476562, 0.016521453857421875, 0.018796920776367188, 0.0210723876953125, 0.023347854614257812, 0.025623321533203125, 0.027898788452148438, 0.03017425537109375, 0.03244972229003906, 0.034725189208984375, 0.03700065612792969, 0.039276123046875, 0.04155158996582031, 0.043827056884765625, 0.04610252380371094, 0.04837799072265625, 0.05065345764160156, 0.052928924560546875, 0.05520439147949219, 0.0574798583984375, 0.05975532531738281, 0.062030792236328125, 0.06430625915527344, 0.06658172607421875, 0.06885719299316406, 0.07113265991210938, 0.07340812683105469, 0.07568359375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 8.0, 5.0, 5.0, 8.0, 9.0, 21.0, 25.0, 36.0, 29.0, 84.0, 92.0, 141.0, 144.0, 120.0, 77.0, 61.0, 38.0, 23.0, 16.0, 18.0, 14.0, 10.0, 5.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3173056840896606, -1.2774688005447388, -1.2376320362091064, -1.1977951526641846, -1.1579582691192627, -1.1181213855743408, -1.078284502029419, -1.0384477376937866, -0.9986108541488647, -0.9587739706039429, -0.9189371466636658, -0.8791003227233887, -0.8392634391784668, -0.7994265556335449, -0.7595897316932678, -0.7197529077529907, -0.6799160242080688, -0.640079140663147, -0.6002423167228699, -0.5604054927825928, -0.5205686092376709, -0.4807317554950714, -0.4408949017524719, -0.40105804800987244, -0.36122119426727295, -0.32138434052467346, -0.281547486782074, -0.2417106330394745, -0.201873779296875, -0.1620369255542755, -0.12220007181167603, -0.08236321806907654, -0.0425264835357666, -0.0026896297931671143, 0.03714722394943237, 0.07698407769203186, 0.11682093143463135, 0.15665778517723083, 0.19649463891983032, 0.2363314926624298, 0.2761683464050293, 0.3160052001476288, 0.35584205389022827, 0.39567890763282776, 0.43551576137542725, 0.47535261511802673, 0.5151894688606262, 0.5550262928009033, 0.5948631763458252, 0.6347000598907471, 0.6745368838310242, 0.7143737077713013, 0.7542105913162231, 0.794047474861145, 0.8338842988014221, 0.8737211227416992, 0.9135580062866211, 0.953394889831543, 0.9932317137718201, 1.0330685377120972, 1.072905421257019, 1.112742304801941, 1.1525790691375732, 1.1924159526824951, 1.232252836227417]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 6.0, 4.0, 10.0, 10.0, 23.0, 30.0, 27.0, 34.0, 45.0, 53.0, 59.0, 61.0, 87.0, 87.0, 73.0, 66.0, 60.0, 57.0, 28.0, 41.0, 29.0, 25.0, 16.0, 21.0, 9.0, 13.0, 6.0, 3.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3824677467346191, -1.344494104385376, -1.3065203428268433, -1.2685467004776, -1.230573058128357, -1.1925992965698242, -1.154625654220581, -1.116652011871338, -1.0786783695220947, -1.0407047271728516, -1.0027309656143188, -0.9647573232650757, -0.9267836809158325, -0.8888099789619446, -0.8508362770080566, -0.8128626346588135, -0.7748888731002808, -0.7369151711463928, -0.6989415287971497, -0.6609678268432617, -0.6229941844940186, -0.5850204825401306, -0.5470467805862427, -0.5090731382369995, -0.4710994362831116, -0.433125764131546, -0.39515209197998047, -0.35717839002609253, -0.319204717874527, -0.2812310457229614, -0.24325735867023468, -0.20528367161750793, -0.16730999946594238, -0.12933632731437683, -0.09136264026165009, -0.05338896065950394, -0.015415281057357788, 0.022558391094207764, 0.06053207814693451, 0.09850576519966125, 0.1364794373512268, 0.17445310950279236, 0.2124267965555191, 0.25040048360824585, 0.2883741557598114, 0.32634782791137695, 0.3643215298652649, 0.40229520201683044, 0.440268874168396, 0.47824254631996155, 0.5162162184715271, 0.554189920425415, 0.5921635627746582, 0.6301372647285461, 0.6681109666824341, 0.7060846090316772, 0.7440583109855652, 0.7820320129394531, 0.8200056552886963, 0.8579793572425842, 0.8959530591964722, 0.9339267015457153, 0.9719004034996033, 1.0098741054534912, 1.0478477478027344]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 8.0, 14.0, 15.0, 34.0, 55.0, 90.0, 176.0, 319.0, 593.0, 1979.0, 14845.0, 3811739.0, 352794.0, 8956.0, 1674.0, 566.0, 207.0, 101.0, 44.0, 23.0, 16.0, 11.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.76953125, -0.7515830993652344, -0.7336349487304688, -0.7156867980957031, -0.6977386474609375, -0.6797904968261719, -0.6618423461914062, -0.6438941955566406, -0.625946044921875, -0.6079978942871094, -0.5900497436523438, -0.5721015930175781, -0.5541534423828125, -0.5362052917480469, -0.5182571411132812, -0.5003089904785156, -0.48236083984375, -0.4644126892089844, -0.44646453857421875, -0.4285163879394531, -0.4105682373046875, -0.3926200866699219, -0.37467193603515625, -0.3567237854003906, -0.338775634765625, -0.3208274841308594, -0.30287933349609375, -0.2849311828613281, -0.2669830322265625, -0.24903488159179688, -0.23108673095703125, -0.21313858032226562, -0.1951904296875, -0.17724227905273438, -0.15929412841796875, -0.14134597778320312, -0.1233978271484375, -0.10544967651367188, -0.08750152587890625, -0.06955337524414062, -0.051605224609375, -0.033657073974609375, -0.01570892333984375, 0.002239227294921875, 0.0201873779296875, 0.038135528564453125, 0.05608367919921875, 0.07403182983398438, 0.09197998046875, 0.10992813110351562, 0.12787628173828125, 0.14582443237304688, 0.1637725830078125, 0.18172073364257812, 0.19966888427734375, 0.21761703491210938, 0.235565185546875, 0.2535133361816406, 0.27146148681640625, 0.2894096374511719, 0.3073577880859375, 0.3253059387207031, 0.34325408935546875, 0.3612022399902344, 0.379150390625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 10.0, 16.0, 40.0, 68.0, 86.0, 102.0, 109.0, 121.0, 125.0, 96.0, 87.0, 53.0, 27.0, 18.0, 13.0, 12.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1318359375, -0.12858009338378906, -0.12532424926757812, -0.12206840515136719, -0.11881256103515625, -0.11555671691894531, -0.11230087280273438, -0.10904502868652344, -0.1057891845703125, -0.10253334045410156, -0.09927749633789062, -0.09602165222167969, -0.09276580810546875, -0.08950996398925781, -0.08625411987304688, -0.08299827575683594, -0.079742431640625, -0.07648658752441406, -0.07323074340820312, -0.06997489929199219, -0.06671905517578125, -0.06346321105957031, -0.060207366943359375, -0.05695152282714844, -0.0536956787109375, -0.05043983459472656, -0.047183990478515625, -0.04392814636230469, -0.04067230224609375, -0.03741645812988281, -0.034160614013671875, -0.030904769897460938, -0.02764892578125, -0.024393081665039062, -0.021137237548828125, -0.017881393432617188, -0.01462554931640625, -0.011369705200195312, -0.008113861083984375, -0.0048580169677734375, -0.0016021728515625, 0.0016536712646484375, 0.004909515380859375, 0.008165359497070312, 0.01142120361328125, 0.014677047729492188, 0.017932891845703125, 0.021188735961914062, 0.024444580078125, 0.027700424194335938, 0.030956268310546875, 0.03421211242675781, 0.03746795654296875, 0.04072380065917969, 0.043979644775390625, 0.04723548889160156, 0.0504913330078125, 0.05374717712402344, 0.057003021240234375, 0.06025886535644531, 0.06351470947265625, 0.06677055358886719, 0.07002639770507812, 0.07328224182128906, 0.0765380859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 5.0, 6.0, 8.0, 18.0, 23.0, 34.0, 35.0, 53.0, 74.0, 137.0, 266.0, 469.0, 913.0, 1989.0, 4609.0, 11698.0, 34390.0, 150886.0, 3150758.0, 727770.0, 76762.0, 20262.0, 7078.0, 2882.0, 1326.0, 690.0, 416.0, 233.0, 157.0, 115.0, 63.0, 54.0, 38.0, 19.0, 8.0, 14.0, 13.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.206298828125, -0.1998138427734375, -0.193328857421875, -0.1868438720703125, -0.18035888671875, -0.1738739013671875, -0.167388916015625, -0.1609039306640625, -0.1544189453125, -0.1479339599609375, -0.141448974609375, -0.1349639892578125, -0.12847900390625, -0.1219940185546875, -0.115509033203125, -0.1090240478515625, -0.1025390625, -0.0960540771484375, -0.089569091796875, -0.0830841064453125, -0.07659912109375, -0.0701141357421875, -0.063629150390625, -0.0571441650390625, -0.0506591796875, -0.0441741943359375, -0.037689208984375, -0.0312042236328125, -0.02471923828125, -0.0182342529296875, -0.011749267578125, -0.0052642822265625, 0.001220703125, 0.0077056884765625, 0.014190673828125, 0.0206756591796875, 0.02716064453125, 0.0336456298828125, 0.040130615234375, 0.0466156005859375, 0.0531005859375, 0.0595855712890625, 0.066070556640625, 0.0725555419921875, 0.07904052734375, 0.0855255126953125, 0.092010498046875, 0.0984954833984375, 0.10498046875, 0.1114654541015625, 0.117950439453125, 0.1244354248046875, 0.13092041015625, 0.1374053955078125, 0.143890380859375, 0.1503753662109375, 0.1568603515625, 0.1633453369140625, 0.169830322265625, 0.1763153076171875, 0.18280029296875, 0.1892852783203125, 0.195770263671875, 0.2022552490234375, 0.208740234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 13.0, 10.0, 15.0, 21.0, 21.0, 31.0, 50.0, 57.0, 95.0, 175.0, 253.0, 577.0, 1304.0, 751.0, 275.0, 144.0, 74.0, 55.0, 43.0, 29.0, 20.0, 16.0, 7.0, 10.0, 4.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2166748046875, -0.20980262756347656, -0.20293045043945312, -0.1960582733154297, -0.18918609619140625, -0.1823139190673828, -0.17544174194335938, -0.16856956481933594, -0.1616973876953125, -0.15482521057128906, -0.14795303344726562, -0.1410808563232422, -0.13420867919921875, -0.1273365020751953, -0.12046432495117188, -0.11359214782714844, -0.106719970703125, -0.09984779357910156, -0.09297561645507812, -0.08610343933105469, -0.07923126220703125, -0.07235908508300781, -0.06548690795898438, -0.05861473083496094, -0.0517425537109375, -0.04487037658691406, -0.037998199462890625, -0.031126022338867188, -0.02425384521484375, -0.017381668090820312, -0.010509490966796875, -0.0036373138427734375, 0.00323486328125, 0.010107040405273438, 0.016979217529296875, 0.023851394653320312, 0.03072357177734375, 0.03759574890136719, 0.044467926025390625, 0.05134010314941406, 0.0582122802734375, 0.06508445739746094, 0.07195663452148438, 0.07882881164550781, 0.08570098876953125, 0.09257316589355469, 0.09944534301757812, 0.10631752014160156, 0.113189697265625, 0.12006187438964844, 0.12693405151367188, 0.1338062286376953, 0.14067840576171875, 0.1475505828857422, 0.15442276000976562, 0.16129493713378906, 0.1681671142578125, 0.17503929138183594, 0.18191146850585938, 0.1887836456298828, 0.19565582275390625, 0.2025279998779297, 0.20940017700195312, 0.21627235412597656, 0.22314453125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 7.0, 6.0, 14.0, 17.0, 19.0, 41.0, 72.0, 97.0, 131.0, 174.0, 142.0, 108.0, 57.0, 40.0, 19.0, 15.0, 13.0, 9.0, 4.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9809967279434204, -1.9184601306915283, -1.8559236526489258, -1.7933870553970337, -1.7308504581451416, -1.668313980102539, -1.605777382850647, -1.5432407855987549, -1.4807043075561523, -1.4181677103042603, -1.3556312322616577, -1.2930946350097656, -1.230558156967163, -1.168021559715271, -1.105484962463379, -1.0429484844207764, -0.9804118871688843, -0.917875349521637, -0.8553388118743896, -0.7928022146224976, -0.7302656769752502, -0.6677291393280029, -0.6051925420761108, -0.5426560044288635, -0.4801194667816162, -0.4175829291343689, -0.3550463616847992, -0.2925097942352295, -0.22997325658798218, -0.16743671894073486, -0.10490015149116516, -0.04236358404159546, 0.020173072814941406, 0.08270962536334991, 0.14524617791175842, 0.20778273046016693, 0.27031928300857544, 0.33285582065582275, 0.39539238810539246, 0.45792895555496216, 0.5204654932022095, 0.5830020308494568, 0.6455385684967041, 0.7080751657485962, 0.7706117033958435, 0.8331482410430908, 0.8956848382949829, 0.9582213759422302, 1.0207579135894775, 1.0832945108413696, 1.1458309888839722, 1.2083675861358643, 1.2709040641784668, 1.3334406614303589, 1.395977258682251, 1.4585137367248535, 1.5210503339767456, 1.5835869312286377, 1.6461234092712402, 1.7086600065231323, 1.7711966037750244, 1.833733081817627, 1.896269679069519, 1.9588062763214111, 2.0213427543640137]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 6.0, 1.0, 6.0, 3.0, 9.0, 6.0, 10.0, 11.0, 9.0, 19.0, 14.0, 17.0, 20.0, 31.0, 31.0, 32.0, 57.0, 44.0, 40.0, 49.0, 48.0, 53.0, 41.0, 39.0, 40.0, 41.0, 41.0, 36.0, 41.0, 42.0, 22.0, 18.0, 27.0, 22.0, 17.0, 13.0, 13.0, 6.0, 9.0, 4.0, 7.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7867507338523865, -0.7595539093017578, -0.7323570847511292, -0.7051602602005005, -0.6779634952545166, -0.6507666707038879, -0.6235698461532593, -0.5963730216026306, -0.569176197052002, -0.5419793725013733, -0.5147825479507446, -0.48758575320243835, -0.4603889584541321, -0.4331921339035034, -0.40599530935287476, -0.3787984848022461, -0.3516017198562622, -0.32440489530563354, -0.29720810055732727, -0.2700112760066986, -0.24281446635723114, -0.21561765670776367, -0.188420832157135, -0.16122402250766754, -0.13402721285820007, -0.1068304032087326, -0.07963358610868454, -0.052436769008636475, -0.025239959359169006, 0.001956850290298462, 0.029153674840927124, 0.05635048449039459, 0.08354723453521729, 0.11074404418468475, 0.13794085383415222, 0.16513767838478088, 0.19233448803424835, 0.21953129768371582, 0.24672812223434448, 0.27392494678497314, 0.3011217415332794, 0.3283185660839081, 0.35551536083221436, 0.382712185382843, 0.4099090099334717, 0.43710580468177795, 0.4643026292324066, 0.4914994239807129, 0.5186962485313416, 0.5458930730819702, 0.5730898976325989, 0.6002867221832275, 0.6274834871292114, 0.6546803116798401, 0.6818771362304688, 0.7090739607810974, 0.7362707853317261, 0.7634676098823547, 0.7906644344329834, 0.8178611993789673, 0.845058023929596, 0.8722548484802246, 0.8994516730308533, 0.9266484975814819, 0.9538452625274658]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 5.0, 2.0, 0.0, 4.0, 5.0, 11.0, 3.0, 17.0, 13.0, 17.0, 28.0, 40.0, 46.0, 67.0, 110.0, 193.0, 292.0, 510.0, 1010.0, 2443.0, 7067.0, 31027.0, 248966.0, 663268.0, 73462.0, 12996.0, 3682.0, 1435.0, 728.0, 404.0, 245.0, 141.0, 87.0, 68.0, 43.0, 40.0, 28.0, 18.0, 12.0, 6.0, 10.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43701171875, -0.42494964599609375, -0.4128875732421875, -0.40082550048828125, -0.388763427734375, -0.37670135498046875, -0.3646392822265625, -0.35257720947265625, -0.34051513671875, -0.32845306396484375, -0.3163909912109375, -0.30432891845703125, -0.292266845703125, -0.28020477294921875, -0.2681427001953125, -0.25608062744140625, -0.2440185546875, -0.23195648193359375, -0.2198944091796875, -0.20783233642578125, -0.195770263671875, -0.18370819091796875, -0.1716461181640625, -0.15958404541015625, -0.14752197265625, -0.13545989990234375, -0.1233978271484375, -0.11133575439453125, -0.099273681640625, -0.08721160888671875, -0.0751495361328125, -0.06308746337890625, -0.051025390625, -0.03896331787109375, -0.0269012451171875, -0.01483917236328125, -0.002777099609375, 0.00928497314453125, 0.0213470458984375, 0.03340911865234375, 0.04547119140625, 0.05753326416015625, 0.0695953369140625, 0.08165740966796875, 0.093719482421875, 0.10578155517578125, 0.1178436279296875, 0.12990570068359375, 0.1419677734375, 0.15402984619140625, 0.1660919189453125, 0.17815399169921875, 0.190216064453125, 0.20227813720703125, 0.2143402099609375, 0.22640228271484375, 0.23846435546875, 0.25052642822265625, 0.2625885009765625, 0.27465057373046875, 0.286712646484375, 0.29877471923828125, 0.3108367919921875, 0.32289886474609375, 0.3349609375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 16.0, 16.0, 37.0, 51.0, 83.0, 87.0, 106.0, 105.0, 120.0, 99.0, 91.0, 72.0, 42.0, 23.0, 13.0, 10.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.1290283203125, -0.125946044921875, -0.12286376953125, -0.119781494140625, -0.11669921875, -0.113616943359375, -0.11053466796875, -0.107452392578125, -0.1043701171875, -0.101287841796875, -0.09820556640625, -0.095123291015625, -0.092041015625, -0.088958740234375, -0.08587646484375, -0.082794189453125, -0.0797119140625, -0.076629638671875, -0.07354736328125, -0.070465087890625, -0.0673828125, -0.064300537109375, -0.06121826171875, -0.058135986328125, -0.0550537109375, -0.051971435546875, -0.04888916015625, -0.045806884765625, -0.042724609375, -0.039642333984375, -0.03656005859375, -0.033477783203125, -0.0303955078125, -0.027313232421875, -0.02423095703125, -0.021148681640625, -0.01806640625, -0.014984130859375, -0.01190185546875, -0.008819580078125, -0.0057373046875, -0.002655029296875, 0.00042724609375, 0.003509521484375, 0.006591796875, 0.009674072265625, 0.01275634765625, 0.015838623046875, 0.0189208984375, 0.022003173828125, 0.02508544921875, 0.028167724609375, 0.03125, 0.034332275390625, 0.03741455078125, 0.040496826171875, 0.0435791015625, 0.046661376953125, 0.04974365234375, 0.052825927734375, 0.055908203125, 0.058990478515625, 0.06207275390625, 0.065155029296875, 0.0682373046875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 4.0, 8.0, 3.0, 13.0, 13.0, 22.0, 46.0, 64.0, 112.0, 202.0, 479.0, 960.0, 2496.0, 6833.0, 23653.0, 107866.0, 674713.0, 180666.0, 35066.0, 9633.0, 3274.0, 1258.0, 582.0, 248.0, 142.0, 84.0, 45.0, 15.0, 20.0, 10.0, 7.0, 6.0, 8.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.324462890625, -0.314208984375, -0.303955078125, -0.293701171875, -0.283447265625, -0.273193359375, -0.262939453125, -0.252685546875, -0.242431640625, -0.232177734375, -0.221923828125, -0.211669921875, -0.201416015625, -0.191162109375, -0.180908203125, -0.170654296875, -0.160400390625, -0.150146484375, -0.139892578125, -0.129638671875, -0.119384765625, -0.109130859375, -0.098876953125, -0.088623046875, -0.078369140625, -0.068115234375, -0.057861328125, -0.047607421875, -0.037353515625, -0.027099609375, -0.016845703125, -0.006591796875, 0.003662109375, 0.013916015625, 0.024169921875, 0.034423828125, 0.044677734375, 0.054931640625, 0.065185546875, 0.075439453125, 0.085693359375, 0.095947265625, 0.106201171875, 0.116455078125, 0.126708984375, 0.136962890625, 0.147216796875, 0.157470703125, 0.167724609375, 0.177978515625, 0.188232421875, 0.198486328125, 0.208740234375, 0.218994140625, 0.229248046875, 0.239501953125, 0.249755859375, 0.260009765625, 0.270263671875, 0.280517578125, 0.290771484375, 0.301025390625, 0.311279296875, 0.321533203125, 0.331787109375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 6.0, 6.0, 4.0, 7.0, 14.0, 7.0, 21.0, 29.0, 23.0, 37.0, 45.0, 56.0, 53.0, 58.0, 56.0, 60.0, 61.0, 74.0, 61.0, 61.0, 45.0, 48.0, 31.0, 29.0, 24.0, 20.0, 8.0, 20.0, 9.0, 11.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.293212890625, -0.2844123840332031, -0.27561187744140625, -0.2668113708496094, -0.2580108642578125, -0.24921035766601562, -0.24040985107421875, -0.23160934448242188, -0.222808837890625, -0.21400833129882812, -0.20520782470703125, -0.19640731811523438, -0.1876068115234375, -0.17880630493164062, -0.17000579833984375, -0.16120529174804688, -0.15240478515625, -0.14360427856445312, -0.13480377197265625, -0.12600326538085938, -0.1172027587890625, -0.10840225219726562, -0.09960174560546875, -0.09080123901367188, -0.082000732421875, -0.07320022583007812, -0.06439971923828125, -0.055599212646484375, -0.0467987060546875, -0.037998199462890625, -0.02919769287109375, -0.020397186279296875, -0.0115966796875, -0.002796173095703125, 0.00600433349609375, 0.014804840087890625, 0.0236053466796875, 0.032405853271484375, 0.04120635986328125, 0.050006866455078125, 0.058807373046875, 0.06760787963867188, 0.07640838623046875, 0.08520889282226562, 0.0940093994140625, 0.10280990600585938, 0.11161041259765625, 0.12041091918945312, 0.12921142578125, 0.13801193237304688, 0.14681243896484375, 0.15561294555664062, 0.1644134521484375, 0.17321395874023438, 0.18201446533203125, 0.19081497192382812, 0.199615478515625, 0.20841598510742188, 0.21721649169921875, 0.22601699829101562, 0.2348175048828125, 0.24361801147460938, 0.25241851806640625, 0.2612190246582031, 0.27001953125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 8.0, 11.0, 11.0, 24.0, 32.0, 33.0, 33.0, 49.0, 85.0, 133.0, 161.0, 231.0, 375.0, 556.0, 990.0, 1519.0, 2648.0, 5176.0, 9937.0, 21840.0, 56781.0, 213959.0, 574457.0, 96693.0, 32930.0, 14058.0, 6832.0, 3585.0, 2022.0, 1225.0, 717.0, 482.0, 323.0, 172.0, 133.0, 93.0, 62.0, 46.0, 35.0, 28.0, 19.0, 14.0, 7.0, 10.0, 9.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0408935546875, -0.039540767669677734, -0.03818798065185547, -0.0368351936340332, -0.03548240661621094, -0.03412961959838867, -0.032776832580566406, -0.03142404556274414, -0.030071258544921875, -0.02871847152709961, -0.027365684509277344, -0.026012897491455078, -0.024660110473632812, -0.023307323455810547, -0.02195453643798828, -0.020601749420166016, -0.01924896240234375, -0.017896175384521484, -0.01654338836669922, -0.015190601348876953, -0.013837814331054688, -0.012485027313232422, -0.011132240295410156, -0.00977945327758789, -0.008426666259765625, -0.007073879241943359, -0.005721092224121094, -0.004368305206298828, -0.0030155181884765625, -0.0016627311706542969, -0.00030994415283203125, 0.0010428428649902344, 0.0023956298828125, 0.0037484169006347656, 0.005101203918457031, 0.006453990936279297, 0.0078067779541015625, 0.009159564971923828, 0.010512351989746094, 0.01186513900756836, 0.013217926025390625, 0.01457071304321289, 0.015923500061035156, 0.017276287078857422, 0.018629074096679688, 0.019981861114501953, 0.02133464813232422, 0.022687435150146484, 0.02404022216796875, 0.025393009185791016, 0.02674579620361328, 0.028098583221435547, 0.029451370239257812, 0.030804157257080078, 0.032156944274902344, 0.03350973129272461, 0.034862518310546875, 0.03621530532836914, 0.037568092346191406, 0.03892087936401367, 0.04027366638183594, 0.0416264533996582, 0.04297924041748047, 0.044332027435302734, 0.045684814453125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 6.0, 2.0, 9.0, 9.0, 11.0, 13.0, 23.0, 58.0, 99.0, 224.0, 253.0, 129.0, 71.0, 33.0, 19.0, 5.0, 6.0, 8.0, 7.0, 6.0, 2.0, 3.0, 0.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002808570861816406, -0.00027181580662727356, -0.0002627745270729065, -0.00025373324751853943, -0.00024469196796417236, -0.0002356506884098053, -0.00022660940885543823, -0.00021756812930107117, -0.0002085268497467041, -0.00019948557019233704, -0.00019044429063796997, -0.0001814030110836029, -0.00017236173152923584, -0.00016332045197486877, -0.0001542791724205017, -0.00014523789286613464, -0.00013619661331176758, -0.0001271553337574005, -0.00011811405420303345, -0.00010907277464866638, -0.00010003149509429932, -9.099021553993225e-05, -8.194893598556519e-05, -7.290765643119812e-05, -6.386637687683105e-05, -5.482509732246399e-05, -4.5783817768096924e-05, -3.674253821372986e-05, -2.7701258659362793e-05, -1.8659979104995728e-05, -9.618699550628662e-06, -5.774199962615967e-07, 8.463859558105469e-06, 1.7505139112472534e-05, 2.65464186668396e-05, 3.5587698221206665e-05, 4.462897777557373e-05, 5.3670257329940796e-05, 6.271153688430786e-05, 7.175281643867493e-05, 8.079409599304199e-05, 8.983537554740906e-05, 9.887665510177612e-05, 0.00010791793465614319, 0.00011695921421051025, 0.00012600049376487732, 0.00013504177331924438, 0.00014408305287361145, 0.00015312433242797852, 0.00016216561198234558, 0.00017120689153671265, 0.0001802481710910797, 0.00018928945064544678, 0.00019833073019981384, 0.0002073720097541809, 0.00021641328930854797, 0.00022545456886291504, 0.0002344958484172821, 0.00024353712797164917, 0.00025257840752601624, 0.0002616196870803833, 0.00027066096663475037, 0.00027970224618911743, 0.0002887435257434845, 0.00029778480529785156]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 9.0, 5.0, 11.0, 5.0, 13.0, 17.0, 29.0, 30.0, 51.0, 123.0, 204.0, 307.0, 618.0, 1369.0, 3223.0, 8270.0, 26583.0, 121455.0, 716625.0, 127348.0, 27591.0, 8574.0, 3265.0, 1388.0, 631.0, 336.0, 175.0, 115.0, 56.0, 43.0, 21.0, 11.0, 18.0, 4.0, 8.0, 9.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.061920166015625, -0.06001567840576172, -0.05811119079589844, -0.056206703186035156, -0.054302215576171875, -0.052397727966308594, -0.05049324035644531, -0.04858875274658203, -0.04668426513671875, -0.04477977752685547, -0.04287528991699219, -0.040970802307128906, -0.039066314697265625, -0.037161827087402344, -0.03525733947753906, -0.03335285186767578, -0.0314483642578125, -0.02954387664794922, -0.027639389038085938, -0.025734901428222656, -0.023830413818359375, -0.021925926208496094, -0.020021438598632812, -0.01811695098876953, -0.01621246337890625, -0.014307975769042969, -0.012403488159179688, -0.010499000549316406, -0.008594512939453125, -0.006690025329589844, -0.0047855377197265625, -0.0028810501098632812, -0.0009765625, 0.0009279251098632812, 0.0028324127197265625, 0.004736900329589844, 0.006641387939453125, 0.008545875549316406, 0.010450363159179688, 0.012354850769042969, 0.01425933837890625, 0.01616382598876953, 0.018068313598632812, 0.019972801208496094, 0.021877288818359375, 0.023781776428222656, 0.025686264038085938, 0.02759075164794922, 0.0294952392578125, 0.03139972686767578, 0.03330421447753906, 0.035208702087402344, 0.037113189697265625, 0.039017677307128906, 0.04092216491699219, 0.04282665252685547, 0.04473114013671875, 0.04663562774658203, 0.04854011535644531, 0.050444602966308594, 0.052349090576171875, 0.054253578186035156, 0.05615806579589844, 0.05806255340576172, 0.059967041015625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 4.0, 1.0, 8.0, 13.0, 14.0, 18.0, 19.0, 22.0, 32.0, 35.0, 51.0, 43.0, 60.0, 81.0, 77.0, 82.0, 75.0, 68.0, 43.0, 56.0, 36.0, 27.0, 25.0, 14.0, 23.0, 10.0, 7.0, 9.0, 8.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03790283203125, -0.036640167236328125, -0.03537750244140625, -0.034114837646484375, -0.0328521728515625, -0.031589508056640625, -0.03032684326171875, -0.029064178466796875, -0.027801513671875, -0.026538848876953125, -0.02527618408203125, -0.024013519287109375, -0.0227508544921875, -0.021488189697265625, -0.02022552490234375, -0.018962860107421875, -0.0177001953125, -0.016437530517578125, -0.01517486572265625, -0.013912200927734375, -0.0126495361328125, -0.011386871337890625, -0.01012420654296875, -0.008861541748046875, -0.007598876953125, -0.006336212158203125, -0.00507354736328125, -0.003810882568359375, -0.0025482177734375, -0.001285552978515625, -2.288818359375e-05, 0.001239776611328125, 0.00250244140625, 0.003765106201171875, 0.00502777099609375, 0.006290435791015625, 0.0075531005859375, 0.008815765380859375, 0.01007843017578125, 0.011341094970703125, 0.012603759765625, 0.013866424560546875, 0.01512908935546875, 0.016391754150390625, 0.0176544189453125, 0.018917083740234375, 0.02017974853515625, 0.021442413330078125, 0.022705078125, 0.023967742919921875, 0.02523040771484375, 0.026493072509765625, 0.0277557373046875, 0.029018402099609375, 0.03028106689453125, 0.031543731689453125, 0.032806396484375, 0.034069061279296875, 0.03533172607421875, 0.036594390869140625, 0.0378570556640625, 0.039119720458984375, 0.04038238525390625, 0.041645050048828125, 0.04290771484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 5.0, 2.0, 0.0, 5.0, 4.0, 6.0, 13.0, 10.0, 7.0, 9.0, 13.0, 23.0, 16.0, 44.0, 32.0, 48.0, 67.0, 87.0, 112.0, 112.0, 87.0, 45.0, 47.0, 46.0, 35.0, 22.0, 22.0, 14.0, 11.0, 8.0, 6.0, 8.0, 5.0, 5.0, 7.0, 2.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8069772720336914, -0.7781876921653748, -0.7493980526924133, -0.7206084728240967, -0.6918188333511353, -0.6630292534828186, -0.634239673614502, -0.6054500341415405, -0.5766603946685791, -0.5478708148002625, -0.519081175327301, -0.4902915954589844, -0.46150195598602295, -0.4327123761177063, -0.40392276644706726, -0.3751331567764282, -0.3463435769081116, -0.31755396723747253, -0.2887643575668335, -0.25997477769851685, -0.2311851531267166, -0.20239554345607758, -0.17360594868659973, -0.1448163390159607, -0.11602672934532166, -0.08723711967468262, -0.058447517454624176, -0.029657915234565735, -0.0008683055639266968, 0.02792130410671234, 0.056710898876190186, 0.08550050854682922, 0.11429011821746826, 0.1430797278881073, 0.17186933755874634, 0.20065893232822418, 0.22944854199886322, 0.25823813676834106, 0.2870277464389801, 0.31581735610961914, 0.3446069657802582, 0.3733965754508972, 0.40218618512153625, 0.4309757947921753, 0.45976537466049194, 0.48855501413345337, 0.51734459400177, 0.5461342334747314, 0.5749238133430481, 0.6037133932113647, 0.6325030326843262, 0.6612926125526428, 0.6900822520256042, 0.7188718318939209, 0.7476614713668823, 0.776451051235199, 0.8052406311035156, 0.8340302109718323, 0.8628198504447937, 0.8916094303131104, 0.9203990697860718, 0.9491886496543884, 0.9779782295227051, 1.0067678689956665, 1.035557508468628]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 3.0, 3.0, 7.0, 6.0, 6.0, 12.0, 17.0, 19.0, 18.0, 14.0, 13.0, 13.0, 32.0, 28.0, 31.0, 22.0, 35.0, 36.0, 28.0, 36.0, 69.0, 63.0, 62.0, 51.0, 40.0, 39.0, 38.0, 41.0, 27.0, 20.0, 22.0, 15.0, 20.0, 16.0, 16.0, 13.0, 4.0, 10.0, 13.0, 9.0, 12.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.7811167240142822, -0.7565103769302368, -0.7319040894508362, -0.7072977423667908, -0.6826914548873901, -0.6580851078033447, -0.6334787607192993, -0.6088724732398987, -0.584266185760498, -0.5596598386764526, -0.535053551197052, -0.5104472041130066, -0.48584091663360596, -0.46123456954956055, -0.4366282522678375, -0.4120219349861145, -0.3874155879020691, -0.36280927062034607, -0.33820295333862305, -0.31359660625457764, -0.288990318775177, -0.2643839716911316, -0.23977765440940857, -0.21517133712768555, -0.19056501984596252, -0.1659587025642395, -0.14135238528251648, -0.11674605309963226, -0.09213973581790924, -0.06753341853618622, -0.042927086353302, -0.01832076907157898, 0.006285488605499268, 0.03089180961251259, 0.05549813061952591, 0.08010445535182953, 0.10471077263355255, 0.12931708991527557, 0.1539234220981598, 0.1785297393798828, 0.20313605666160583, 0.22774237394332886, 0.2523486912250519, 0.2769550085067749, 0.3015613555908203, 0.32616764307022095, 0.35077399015426636, 0.3753803074359894, 0.3999866247177124, 0.4245929419994354, 0.44919925928115845, 0.47380560636520386, 0.4984118938446045, 0.5230182409286499, 0.5476245880126953, 0.572230875492096, 0.5968371629714966, 0.621443510055542, 0.6460497975349426, 0.670656144618988, 0.6952624320983887, 0.7198687791824341, 0.7444751262664795, 0.7690814137458801, 0.7936877608299255]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 10.0, 11.0, 20.0, 31.0, 56.0, 71.0, 162.0, 294.0, 592.0, 1156.0, 3776.0, 43432.0, 4017908.0, 117679.0, 6780.0, 1481.0, 494.0, 158.0, 81.0, 33.0, 21.0, 13.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.87109375, -0.8511238098144531, -0.8311538696289062, -0.8111839294433594, -0.7912139892578125, -0.7712440490722656, -0.7512741088867188, -0.7313041687011719, -0.711334228515625, -0.6913642883300781, -0.6713943481445312, -0.6514244079589844, -0.6314544677734375, -0.6114845275878906, -0.5915145874023438, -0.5715446472167969, -0.55157470703125, -0.5316047668457031, -0.5116348266601562, -0.4916648864746094, -0.4716949462890625, -0.4517250061035156, -0.43175506591796875, -0.4117851257324219, -0.391815185546875, -0.3718452453613281, -0.35187530517578125, -0.3319053649902344, -0.3119354248046875, -0.2919654846191406, -0.27199554443359375, -0.2520256042480469, -0.2320556640625, -0.21208572387695312, -0.19211578369140625, -0.17214584350585938, -0.1521759033203125, -0.13220596313476562, -0.11223602294921875, -0.09226608276367188, -0.072296142578125, -0.052326202392578125, -0.03235626220703125, -0.012386322021484375, 0.0075836181640625, 0.027553558349609375, 0.04752349853515625, 0.06749343872070312, 0.08746337890625, 0.10743331909179688, 0.12740325927734375, 0.14737319946289062, 0.1673431396484375, 0.18731307983398438, 0.20728302001953125, 0.22725296020507812, 0.247222900390625, 0.2671928405761719, 0.28716278076171875, 0.3071327209472656, 0.3271026611328125, 0.3470726013183594, 0.36704254150390625, 0.3870124816894531, 0.406982421875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 5.0, 9.0, 16.0, 45.0, 47.0, 67.0, 89.0, 106.0, 104.0, 114.0, 113.0, 93.0, 55.0, 56.0, 32.0, 20.0, 13.0, 12.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.13134765625, -0.12822818756103516, -0.1251087188720703, -0.12198925018310547, -0.11886978149414062, -0.11575031280517578, -0.11263084411621094, -0.1095113754272461, -0.10639190673828125, -0.1032724380493164, -0.10015296936035156, -0.09703350067138672, -0.09391403198242188, -0.09079456329345703, -0.08767509460449219, -0.08455562591552734, -0.0814361572265625, -0.07831668853759766, -0.07519721984863281, -0.07207775115966797, -0.06895828247070312, -0.06583881378173828, -0.06271934509277344, -0.059599876403808594, -0.05648040771484375, -0.053360939025878906, -0.05024147033691406, -0.04712200164794922, -0.044002532958984375, -0.04088306427001953, -0.03776359558105469, -0.034644126892089844, -0.031524658203125, -0.028405189514160156, -0.025285720825195312, -0.02216625213623047, -0.019046783447265625, -0.01592731475830078, -0.012807846069335938, -0.009688377380371094, -0.00656890869140625, -0.0034494400024414062, -0.0003299713134765625, 0.0027894973754882812, 0.005908966064453125, 0.009028434753417969, 0.012147903442382812, 0.015267372131347656, 0.0183868408203125, 0.021506309509277344, 0.024625778198242188, 0.02774524688720703, 0.030864715576171875, 0.03398418426513672, 0.03710365295410156, 0.040223121643066406, 0.04334259033203125, 0.046462059020996094, 0.04958152770996094, 0.05270099639892578, 0.055820465087890625, 0.05893993377685547, 0.06205940246582031, 0.06517887115478516, 0.06829833984375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 4.0, 9.0, 15.0, 26.0, 35.0, 59.0, 83.0, 165.0, 290.0, 777.0, 2821.0, 16762.0, 206277.0, 3763735.0, 182853.0, 15976.0, 2706.0, 718.0, 382.0, 186.0, 121.0, 70.0, 70.0, 42.0, 50.0, 22.0, 15.0, 8.0, 2.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.48388671875, -0.4713096618652344, -0.45873260498046875, -0.4461555480957031, -0.4335784912109375, -0.4210014343261719, -0.40842437744140625, -0.3958473205566406, -0.383270263671875, -0.3706932067871094, -0.35811614990234375, -0.3455390930175781, -0.3329620361328125, -0.3203849792480469, -0.30780792236328125, -0.2952308654785156, -0.28265380859375, -0.2700767517089844, -0.25749969482421875, -0.24492263793945312, -0.2323455810546875, -0.21976852416992188, -0.20719146728515625, -0.19461441040039062, -0.182037353515625, -0.16946029663085938, -0.15688323974609375, -0.14430618286132812, -0.1317291259765625, -0.11915206909179688, -0.10657501220703125, -0.09399795532226562, -0.0814208984375, -0.06884384155273438, -0.05626678466796875, -0.043689727783203125, -0.0311126708984375, -0.018535614013671875, -0.00595855712890625, 0.006618499755859375, 0.019195556640625, 0.031772613525390625, 0.04434967041015625, 0.056926727294921875, 0.0695037841796875, 0.08208084106445312, 0.09465789794921875, 0.10723495483398438, 0.11981201171875, 0.13238906860351562, 0.14496612548828125, 0.15754318237304688, 0.1701202392578125, 0.18269729614257812, 0.19527435302734375, 0.20785140991210938, 0.220428466796875, 0.23300552368164062, 0.24558258056640625, 0.2581596374511719, 0.2707366943359375, 0.2833137512207031, 0.29589080810546875, 0.3084678649902344, 0.321044921875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 8.0, 7.0, 9.0, 10.0, 26.0, 28.0, 46.0, 51.0, 85.0, 128.0, 204.0, 327.0, 703.0, 1023.0, 501.0, 292.0, 189.0, 140.0, 96.0, 59.0, 46.0, 21.0, 26.0, 22.0, 10.0, 6.0, 5.0, 6.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.140380859375, -0.13311767578125, -0.1258544921875, -0.11859130859375, -0.111328125, -0.10406494140625, -0.0968017578125, -0.08953857421875, -0.082275390625, -0.07501220703125, -0.0677490234375, -0.06048583984375, -0.05322265625, -0.04595947265625, -0.0386962890625, -0.03143310546875, -0.024169921875, -0.01690673828125, -0.0096435546875, -0.00238037109375, 0.0048828125, 0.01214599609375, 0.0194091796875, 0.02667236328125, 0.033935546875, 0.04119873046875, 0.0484619140625, 0.05572509765625, 0.06298828125, 0.07025146484375, 0.0775146484375, 0.08477783203125, 0.092041015625, 0.09930419921875, 0.1065673828125, 0.11383056640625, 0.12109375, 0.12835693359375, 0.1356201171875, 0.14288330078125, 0.150146484375, 0.15740966796875, 0.1646728515625, 0.17193603515625, 0.17919921875, 0.18646240234375, 0.1937255859375, 0.20098876953125, 0.208251953125, 0.21551513671875, 0.2227783203125, 0.23004150390625, 0.2373046875, 0.24456787109375, 0.2518310546875, 0.25909423828125, 0.266357421875, 0.27362060546875, 0.2808837890625, 0.28814697265625, 0.29541015625, 0.30267333984375, 0.3099365234375, 0.31719970703125, 0.324462890625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 7.0, 10.0, 18.0, 22.0, 45.0, 46.0, 71.0, 87.0, 115.0, 95.0, 108.0, 85.0, 61.0, 47.0, 43.0, 26.0, 21.0, 16.0, 17.0, 13.0, 10.0, 10.0, 6.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7761776447296143, -1.7270032167434692, -1.6778287887573242, -1.6286543607711792, -1.5794799327850342, -1.5303055047988892, -1.4811310768127441, -1.4319565296173096, -1.382782220840454, -1.333607792854309, -1.284433364868164, -1.235258936882019, -1.186084508895874, -1.136910080909729, -1.087735652923584, -1.0385611057281494, -0.9893866777420044, -0.9402122497558594, -0.8910378217697144, -0.8418633937835693, -0.7926889657974243, -0.7435145378112793, -0.6943400502204895, -0.6451656222343445, -0.5959911942481995, -0.5468167662620544, -0.4976423382759094, -0.448467880487442, -0.399293452501297, -0.350119024515152, -0.30094456672668457, -0.25177013874053955, -0.20259582996368408, -0.15342140197753906, -0.10424695909023285, -0.055072516202926636, -0.005898088216781616, 0.0432763397693634, 0.09245079755783081, 0.14162522554397583, 0.19079965353012085, 0.23997408151626587, 0.2891485095024109, 0.3383229672908783, 0.3874973952770233, 0.43667182326316833, 0.48584628105163574, 0.5350207090377808, 0.5841951370239258, 0.6333695650100708, 0.6825439929962158, 0.7317184209823608, 0.7808928489685059, 0.8300672769546509, 0.8792417645454407, 0.9284161925315857, 0.9775906205177307, 1.0267651081085205, 1.0759395360946655, 1.1251139640808105, 1.1742883920669556, 1.2234628200531006, 1.2726372480392456, 1.3218116760253906, 1.3709861040115356]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 14.0, 3.0, 13.0, 11.0, 15.0, 13.0, 16.0, 22.0, 17.0, 29.0, 36.0, 38.0, 37.0, 27.0, 35.0, 40.0, 40.0, 44.0, 46.0, 43.0, 36.0, 34.0, 40.0, 29.0, 31.0, 32.0, 28.0, 29.0, 22.0, 35.0, 16.0, 18.0, 16.0, 13.0, 7.0, 11.0, 8.0, 11.0, 5.0, 8.0, 5.0, 4.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0], "bins": [-0.8957594633102417, -0.868302583694458, -0.8408456444740295, -0.8133887052536011, -0.7859318256378174, -0.7584749460220337, -0.7310180068016052, -0.7035610675811768, -0.6761041879653931, -0.6486473083496094, -0.6211903691291809, -0.5937334299087524, -0.5662765502929688, -0.5388196706771851, -0.5113627314567566, -0.4839058220386505, -0.45644891262054443, -0.42899200320243835, -0.4015350937843323, -0.3740781843662262, -0.3466212749481201, -0.31916436553001404, -0.29170745611190796, -0.2642505466938019, -0.2367936372756958, -0.20933672785758972, -0.18187981843948364, -0.15442290902137756, -0.12696599960327148, -0.0995090901851654, -0.07205218076705933, -0.04459527134895325, -0.017138361930847168, 0.010318547487258911, 0.03777545690536499, 0.06523236632347107, 0.09268927574157715, 0.12014618515968323, 0.1476030945777893, 0.17506000399589539, 0.20251691341400146, 0.22997382283210754, 0.2574307322502136, 0.2848876416683197, 0.3123445510864258, 0.33980146050453186, 0.36725836992263794, 0.394715279340744, 0.4221721887588501, 0.4496290981769562, 0.47708600759506226, 0.5045429468154907, 0.5319998264312744, 0.5594567060470581, 0.5869136452674866, 0.614370584487915, 0.6418274641036987, 0.6692843437194824, 0.6967412829399109, 0.7241982221603394, 0.751655101776123, 0.7791119813919067, 0.8065689206123352, 0.8340258598327637, 0.8614827394485474]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 8.0, 6.0, 13.0, 12.0, 14.0, 11.0, 28.0, 31.0, 46.0, 51.0, 95.0, 104.0, 188.0, 344.0, 632.0, 1300.0, 2996.0, 8244.0, 28976.0, 133211.0, 649523.0, 172133.0, 34390.0, 9691.0, 3287.0, 1421.0, 689.0, 353.0, 253.0, 146.0, 115.0, 68.0, 37.0, 36.0, 26.0, 19.0, 13.0, 11.0, 5.0, 9.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3203125, -0.3098335266113281, -0.29935455322265625, -0.2888755798339844, -0.2783966064453125, -0.2679176330566406, -0.25743865966796875, -0.24695968627929688, -0.236480712890625, -0.22600173950195312, -0.21552276611328125, -0.20504379272460938, -0.1945648193359375, -0.18408584594726562, -0.17360687255859375, -0.16312789916992188, -0.15264892578125, -0.14216995239257812, -0.13169097900390625, -0.12121200561523438, -0.1107330322265625, -0.10025405883789062, -0.08977508544921875, -0.07929611206054688, -0.068817138671875, -0.058338165283203125, -0.04785919189453125, -0.037380218505859375, -0.0269012451171875, -0.016422271728515625, -0.00594329833984375, 0.004535675048828125, 0.0150146484375, 0.025493621826171875, 0.03597259521484375, 0.046451568603515625, 0.0569305419921875, 0.06740951538085938, 0.07788848876953125, 0.08836746215820312, 0.098846435546875, 0.10932540893554688, 0.11980438232421875, 0.13028335571289062, 0.1407623291015625, 0.15124130249023438, 0.16172027587890625, 0.17219924926757812, 0.18267822265625, 0.19315719604492188, 0.20363616943359375, 0.21411514282226562, 0.2245941162109375, 0.23507308959960938, 0.24555206298828125, 0.2560310363769531, 0.266510009765625, 0.2769889831542969, 0.28746795654296875, 0.2979469299316406, 0.3084259033203125, 0.3189048767089844, 0.32938385009765625, 0.3398628234863281, 0.350341796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 10.0, 16.0, 13.0, 26.0, 39.0, 56.0, 80.0, 85.0, 86.0, 89.0, 98.0, 87.0, 79.0, 72.0, 46.0, 48.0, 25.0, 19.0, 11.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.1336669921875, -0.13055801391601562, -0.12744903564453125, -0.12434005737304688, -0.1212310791015625, -0.11812210083007812, -0.11501312255859375, -0.11190414428710938, -0.108795166015625, -0.10568618774414062, -0.10257720947265625, -0.09946823120117188, -0.0963592529296875, -0.09325027465820312, -0.09014129638671875, -0.08703231811523438, -0.08392333984375, -0.08081436157226562, -0.07770538330078125, -0.07459640502929688, -0.0714874267578125, -0.06837844848632812, -0.06526947021484375, -0.062160491943359375, -0.059051513671875, -0.055942535400390625, -0.05283355712890625, -0.049724578857421875, -0.0466156005859375, -0.043506622314453125, -0.04039764404296875, -0.037288665771484375, -0.0341796875, -0.031070709228515625, -0.02796173095703125, -0.024852752685546875, -0.0217437744140625, -0.018634796142578125, -0.01552581787109375, -0.012416839599609375, -0.009307861328125, -0.006198883056640625, -0.00308990478515625, 1.9073486328125e-05, 0.0031280517578125, 0.006237030029296875, 0.00934600830078125, 0.012454986572265625, 0.01556396484375, 0.018672943115234375, 0.02178192138671875, 0.024890899658203125, 0.0279998779296875, 0.031108856201171875, 0.03421783447265625, 0.037326812744140625, 0.040435791015625, 0.043544769287109375, 0.04665374755859375, 0.049762725830078125, 0.0528717041015625, 0.055980682373046875, 0.05908966064453125, 0.062198638916015625, 0.0653076171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 5.0, 7.0, 6.0, 11.0, 8.0, 15.0, 22.0, 33.0, 52.0, 96.0, 146.0, 255.0, 550.0, 1055.0, 2386.0, 5832.0, 16030.0, 49560.0, 210255.0, 617609.0, 99529.0, 28097.0, 9850.0, 3808.0, 1677.0, 766.0, 389.0, 194.0, 96.0, 72.0, 44.0, 29.0, 16.0, 15.0, 8.0, 11.0, 5.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2802734375, -0.2699928283691406, -0.25971221923828125, -0.24943161010742188, -0.2391510009765625, -0.22887039184570312, -0.21858978271484375, -0.20830917358398438, -0.198028564453125, -0.18774795532226562, -0.17746734619140625, -0.16718673706054688, -0.1569061279296875, -0.14662551879882812, -0.13634490966796875, -0.12606430053710938, -0.11578369140625, -0.10550308227539062, -0.09522247314453125, -0.08494186401367188, -0.0746612548828125, -0.06438064575195312, -0.05410003662109375, -0.043819427490234375, -0.033538818359375, -0.023258209228515625, -0.01297760009765625, -0.002696990966796875, 0.0075836181640625, 0.017864227294921875, 0.02814483642578125, 0.038425445556640625, 0.0487060546875, 0.058986663818359375, 0.06926727294921875, 0.07954788208007812, 0.0898284912109375, 0.10010910034179688, 0.11038970947265625, 0.12067031860351562, 0.130950927734375, 0.14123153686523438, 0.15151214599609375, 0.16179275512695312, 0.1720733642578125, 0.18235397338867188, 0.19263458251953125, 0.20291519165039062, 0.21319580078125, 0.22347640991210938, 0.23375701904296875, 0.24403762817382812, 0.2543182373046875, 0.2645988464355469, 0.27487945556640625, 0.2851600646972656, 0.295440673828125, 0.3057212829589844, 0.31600189208984375, 0.3262825012207031, 0.3365631103515625, 0.3468437194824219, 0.35712432861328125, 0.3674049377441406, 0.377685546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 5.0, 4.0, 10.0, 8.0, 9.0, 12.0, 14.0, 17.0, 17.0, 34.0, 35.0, 52.0, 33.0, 49.0, 56.0, 56.0, 46.0, 55.0, 58.0, 50.0, 49.0, 49.0, 39.0, 33.0, 41.0, 31.0, 28.0, 16.0, 14.0, 16.0, 14.0, 13.0, 10.0, 5.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.289306640625, -0.28113555908203125, -0.2729644775390625, -0.26479339599609375, -0.256622314453125, -0.24845123291015625, -0.2402801513671875, -0.23210906982421875, -0.22393798828125, -0.21576690673828125, -0.2075958251953125, -0.19942474365234375, -0.191253662109375, -0.18308258056640625, -0.1749114990234375, -0.16674041748046875, -0.1585693359375, -0.15039825439453125, -0.1422271728515625, -0.13405609130859375, -0.125885009765625, -0.11771392822265625, -0.1095428466796875, -0.10137176513671875, -0.09320068359375, -0.08502960205078125, -0.0768585205078125, -0.06868743896484375, -0.060516357421875, -0.05234527587890625, -0.0441741943359375, -0.03600311279296875, -0.02783203125, -0.01966094970703125, -0.0114898681640625, -0.00331878662109375, 0.004852294921875, 0.01302337646484375, 0.0211944580078125, 0.02936553955078125, 0.03753662109375, 0.04570770263671875, 0.0538787841796875, 0.06204986572265625, 0.070220947265625, 0.07839202880859375, 0.0865631103515625, 0.09473419189453125, 0.1029052734375, 0.11107635498046875, 0.1192474365234375, 0.12741851806640625, 0.135589599609375, 0.14376068115234375, 0.1519317626953125, 0.16010284423828125, 0.16827392578125, 0.17644500732421875, 0.1846160888671875, 0.19278717041015625, 0.200958251953125, 0.20912933349609375, 0.2173004150390625, 0.22547149658203125, 0.233642578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 7.0, 7.0, 13.0, 17.0, 17.0, 41.0, 69.0, 93.0, 143.0, 189.0, 347.0, 570.0, 1009.0, 2054.0, 4214.0, 9650.0, 25125.0, 87157.0, 679379.0, 173863.0, 38990.0, 13883.0, 5777.0, 2646.0, 1387.0, 746.0, 435.0, 248.0, 147.0, 85.0, 68.0, 50.0, 27.0, 18.0, 26.0, 8.0, 10.0, 7.0, 10.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.072021484375, -0.07000398635864258, -0.06798648834228516, -0.06596899032592773, -0.06395149230957031, -0.06193399429321289, -0.05991649627685547, -0.05789899826049805, -0.055881500244140625, -0.0538640022277832, -0.05184650421142578, -0.04982900619506836, -0.04781150817871094, -0.045794010162353516, -0.043776512145996094, -0.04175901412963867, -0.03974151611328125, -0.03772401809692383, -0.035706520080566406, -0.033689022064208984, -0.03167152404785156, -0.02965402603149414, -0.02763652801513672, -0.025619029998779297, -0.023601531982421875, -0.021584033966064453, -0.01956653594970703, -0.01754903793334961, -0.015531539916992188, -0.013514041900634766, -0.011496543884277344, -0.009479045867919922, -0.0074615478515625, -0.005444049835205078, -0.0034265518188476562, -0.0014090538024902344, 0.0006084442138671875, 0.0026259422302246094, 0.004643440246582031, 0.006660938262939453, 0.008678436279296875, 0.010695934295654297, 0.012713432312011719, 0.01473093032836914, 0.016748428344726562, 0.018765926361083984, 0.020783424377441406, 0.022800922393798828, 0.02481842041015625, 0.026835918426513672, 0.028853416442871094, 0.030870914459228516, 0.03288841247558594, 0.03490591049194336, 0.03692340850830078, 0.0389409065246582, 0.040958404541015625, 0.04297590255737305, 0.04499340057373047, 0.04701089859008789, 0.04902839660644531, 0.051045894622802734, 0.053063392639160156, 0.05508089065551758, 0.057098388671875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 6.0, 2.0, 6.0, 5.0, 12.0, 12.0, 20.0, 17.0, 19.0, 19.0, 37.0, 52.0, 82.0, 163.0, 204.0, 93.0, 55.0, 40.0, 27.0, 29.0, 15.0, 29.0, 8.0, 15.0, 6.0, 6.0, 9.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00019073486328125, -0.00018532201647758484, -0.00017990916967391968, -0.00017449632287025452, -0.00016908347606658936, -0.0001636706292629242, -0.00015825778245925903, -0.00015284493565559387, -0.0001474320888519287, -0.00014201924204826355, -0.0001366063952445984, -0.00013119354844093323, -0.00012578070163726807, -0.0001203678548336029, -0.00011495500802993774, -0.00010954216122627258, -0.00010412931442260742, -9.871646761894226e-05, -9.33036208152771e-05, -8.789077401161194e-05, -8.247792720794678e-05, -7.706508040428162e-05, -7.165223360061646e-05, -6.62393867969513e-05, -6.082653999328613e-05, -5.541369318962097e-05, -5.000084638595581e-05, -4.458799958229065e-05, -3.917515277862549e-05, -3.376230597496033e-05, -2.8349459171295166e-05, -2.2936612367630005e-05, -1.7523765563964844e-05, -1.2110918760299683e-05, -6.6980719566345215e-06, -1.2852251529693604e-06, 4.127621650695801e-06, 9.540468454360962e-06, 1.4953315258026123e-05, 2.0366162061691284e-05, 2.5779008865356445e-05, 3.1191855669021606e-05, 3.660470247268677e-05, 4.201754927635193e-05, 4.743039608001709e-05, 5.284324288368225e-05, 5.825608968734741e-05, 6.366893649101257e-05, 6.908178329467773e-05, 7.44946300983429e-05, 7.990747690200806e-05, 8.532032370567322e-05, 9.073317050933838e-05, 9.614601731300354e-05, 0.0001015588641166687, 0.00010697171092033386, 0.00011238455772399902, 0.00011779740452766418, 0.00012321025133132935, 0.0001286230981349945, 0.00013403594493865967, 0.00013944879174232483, 0.00014486163854599, 0.00015027448534965515, 0.0001556873321533203]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 2.0, 6.0, 6.0, 7.0, 18.0, 14.0, 39.0, 52.0, 104.0, 221.0, 441.0, 1131.0, 2886.0, 9045.0, 39179.0, 327133.0, 603826.0, 48077.0, 10813.0, 3276.0, 1232.0, 526.0, 244.0, 114.0, 58.0, 39.0, 11.0, 14.0, 11.0, 5.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05743408203125, -0.055230140686035156, -0.05302619934082031, -0.05082225799560547, -0.048618316650390625, -0.04641437530517578, -0.04421043395996094, -0.042006492614746094, -0.03980255126953125, -0.037598609924316406, -0.03539466857910156, -0.03319072723388672, -0.030986785888671875, -0.02878284454345703, -0.026578903198242188, -0.024374961853027344, -0.0221710205078125, -0.019967079162597656, -0.017763137817382812, -0.015559196472167969, -0.013355255126953125, -0.011151313781738281, -0.008947372436523438, -0.006743431091308594, -0.00453948974609375, -0.0023355484008789062, -0.0001316070556640625, 0.0020723342895507812, 0.004276275634765625, 0.006480216979980469, 0.008684158325195312, 0.010888099670410156, 0.013092041015625, 0.015295982360839844, 0.017499923706054688, 0.01970386505126953, 0.021907806396484375, 0.02411174774169922, 0.026315689086914062, 0.028519630432128906, 0.03072357177734375, 0.032927513122558594, 0.03513145446777344, 0.03733539581298828, 0.039539337158203125, 0.04174327850341797, 0.04394721984863281, 0.046151161193847656, 0.0483551025390625, 0.050559043884277344, 0.05276298522949219, 0.05496692657470703, 0.057170867919921875, 0.05937480926513672, 0.06157875061035156, 0.0637826919555664, 0.06598663330078125, 0.0681905746459961, 0.07039451599121094, 0.07259845733642578, 0.07480239868164062, 0.07700634002685547, 0.07921028137207031, 0.08141422271728516, 0.0836181640625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 9.0, 6.0, 7.0, 12.0, 19.0, 21.0, 20.0, 33.0, 34.0, 56.0, 63.0, 65.0, 84.0, 108.0, 100.0, 77.0, 59.0, 48.0, 45.0, 33.0, 22.0, 21.0, 11.0, 11.0, 11.0, 3.0, 3.0, 3.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05462646484375, -0.05313301086425781, -0.051639556884765625, -0.05014610290527344, -0.04865264892578125, -0.04715919494628906, -0.045665740966796875, -0.04417228698730469, -0.0426788330078125, -0.04118537902832031, -0.039691925048828125, -0.03819847106933594, -0.03670501708984375, -0.03521156311035156, -0.033718109130859375, -0.03222465515136719, -0.030731201171875, -0.029237747192382812, -0.027744293212890625, -0.026250839233398438, -0.02475738525390625, -0.023263931274414062, -0.021770477294921875, -0.020277023315429688, -0.0187835693359375, -0.017290115356445312, -0.015796661376953125, -0.014303207397460938, -0.01280975341796875, -0.011316299438476562, -0.009822845458984375, -0.008329391479492188, -0.0068359375, -0.0053424835205078125, -0.003849029541015625, -0.0023555755615234375, -0.00086212158203125, 0.0006313323974609375, 0.002124786376953125, 0.0036182403564453125, 0.0051116943359375, 0.0066051483154296875, 0.008098602294921875, 0.009592056274414062, 0.01108551025390625, 0.012578964233398438, 0.014072418212890625, 0.015565872192382812, 0.017059326171875, 0.018552780151367188, 0.020046234130859375, 0.021539688110351562, 0.02303314208984375, 0.024526596069335938, 0.026020050048828125, 0.027513504028320312, 0.0290069580078125, 0.030500411987304688, 0.031993865966796875, 0.03348731994628906, 0.03498077392578125, 0.03647422790527344, 0.037967681884765625, 0.03946113586425781, 0.04095458984375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 7.0, 8.0, 12.0, 10.0, 20.0, 15.0, 24.0, 40.0, 43.0, 56.0, 78.0, 121.0, 198.0, 108.0, 66.0, 45.0, 30.0, 30.0, 12.0, 13.0, 9.0, 8.0, 7.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.693743348121643, -1.6537140607833862, -1.6136847734451294, -1.5736554861068726, -1.5336263179779053, -1.4935970306396484, -1.4535677433013916, -1.4135384559631348, -1.373509168624878, -1.333479881286621, -1.2934505939483643, -1.2534213066101074, -1.2133920192718506, -1.1733628511428833, -1.1333335638046265, -1.0933042764663696, -1.0532749891281128, -1.013245701789856, -0.9732164144515991, -0.9331871867179871, -0.8931578993797302, -0.8531286120414734, -0.8130993843078613, -0.7730700969696045, -0.7330408096313477, -0.6930115222930908, -0.652982234954834, -0.6129530072212219, -0.5729237198829651, -0.5328944325447083, -0.4928651750087738, -0.45283591747283936, -0.41280651092529297, -0.37277722358703613, -0.3327479660511017, -0.29271870851516724, -0.2526894211769104, -0.21266014873981476, -0.17263087630271912, -0.13260161876678467, -0.09257233142852783, -0.05254305899143219, -0.012513786554336548, 0.027515485882759094, 0.06754475831985474, 0.10757403075695038, 0.14760330319404602, 0.18763256072998047, 0.2276618480682373, 0.26769113540649414, 0.3077203929424286, 0.34774965047836304, 0.3877789378166199, 0.4278082251548767, 0.46783748269081116, 0.5078667402267456, 0.5478960275650024, 0.5879253149032593, 0.6279546022415161, 0.6679838299751282, 0.708013117313385, 0.7480424046516418, 0.7880716323852539, 0.8281009197235107, 0.8681302070617676]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 12.0, 7.0, 8.0, 13.0, 8.0, 10.0, 19.0, 17.0, 18.0, 35.0, 29.0, 29.0, 22.0, 40.0, 45.0, 45.0, 75.0, 66.0, 70.0, 52.0, 55.0, 40.0, 30.0, 38.0, 17.0, 44.0, 18.0, 24.0, 17.0, 18.0, 16.0, 7.0, 9.0, 11.0, 8.0, 10.0, 2.0, 2.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.864099383354187, -0.8332605361938477, -0.8024216890335083, -0.771582841873169, -0.7407439947128296, -0.7099051475524902, -0.6790663003921509, -0.6482274532318115, -0.6173886060714722, -0.5865497589111328, -0.5557109117507935, -0.5248720645904541, -0.49403321743011475, -0.4631943702697754, -0.43235552310943604, -0.4015166759490967, -0.37067779898643494, -0.3398389518260956, -0.3090001046657562, -0.27816125750541687, -0.24732241034507751, -0.21648354828357697, -0.1856447011232376, -0.15480585396289825, -0.1239670068025589, -0.09312815964221954, -0.06228930875658989, -0.031450457870960236, -0.0006116107106208801, 0.030227243900299072, 0.06106609106063843, 0.09190493822097778, 0.12274378538131714, 0.1535826325416565, 0.18442147970199585, 0.2152603268623352, 0.24609917402267456, 0.2769380211830139, 0.30777686834335327, 0.3386157155036926, 0.369454562664032, 0.40029340982437134, 0.4311322569847107, 0.46197110414505005, 0.4928099513053894, 0.5236487984657288, 0.5544876456260681, 0.5853264927864075, 0.6161653995513916, 0.647004246711731, 0.6778430938720703, 0.7086819410324097, 0.739520788192749, 0.7703596353530884, 0.8011984825134277, 0.8320373296737671, 0.8628761768341064, 0.8937150239944458, 0.9245538711547852, 0.9553927183151245, 0.9862315654754639, 1.0170704126358032, 1.0479092597961426, 1.078748106956482, 1.1095869541168213]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 8.0, 11.0, 16.0, 16.0, 24.0, 38.0, 48.0, 81.0, 130.0, 197.0, 381.0, 742.0, 1788.0, 5765.0, 29724.0, 1792447.0, 2321402.0, 31364.0, 6276.0, 2018.0, 857.0, 412.0, 195.0, 130.0, 75.0, 40.0, 28.0, 21.0, 12.0, 6.0, 5.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.5234375, -0.5112686157226562, -0.4990997314453125, -0.48693084716796875, -0.474761962890625, -0.46259307861328125, -0.4504241943359375, -0.43825531005859375, -0.42608642578125, -0.41391754150390625, -0.4017486572265625, -0.38957977294921875, -0.377410888671875, -0.36524200439453125, -0.3530731201171875, -0.34090423583984375, -0.3287353515625, -0.31656646728515625, -0.3043975830078125, -0.29222869873046875, -0.280059814453125, -0.26789093017578125, -0.2557220458984375, -0.24355316162109375, -0.23138427734375, -0.21921539306640625, -0.2070465087890625, -0.19487762451171875, -0.182708740234375, -0.17053985595703125, -0.1583709716796875, -0.14620208740234375, -0.134033203125, -0.12186431884765625, -0.1096954345703125, -0.09752655029296875, -0.085357666015625, -0.07318878173828125, -0.0610198974609375, -0.04885101318359375, -0.03668212890625, -0.02451324462890625, -0.0123443603515625, -0.00017547607421875, 0.011993408203125, 0.02416229248046875, 0.0363311767578125, 0.04850006103515625, 0.0606689453125, 0.07283782958984375, 0.0850067138671875, 0.09717559814453125, 0.109344482421875, 0.12151336669921875, 0.1336822509765625, 0.14585113525390625, 0.15802001953125, 0.17018890380859375, 0.1823577880859375, 0.19452667236328125, 0.206695556640625, 0.21886444091796875, 0.2310333251953125, 0.24320220947265625, 0.25537109375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 10.0, 13.0, 20.0, 36.0, 33.0, 67.0, 75.0, 88.0, 101.0, 101.0, 93.0, 99.0, 82.0, 64.0, 30.0, 39.0, 14.0, 14.0, 12.0, 2.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1317138671875, -0.1286182403564453, -0.12552261352539062, -0.12242698669433594, -0.11933135986328125, -0.11623573303222656, -0.11314010620117188, -0.11004447937011719, -0.1069488525390625, -0.10385322570800781, -0.10075759887695312, -0.09766197204589844, -0.09456634521484375, -0.09147071838378906, -0.08837509155273438, -0.08527946472167969, -0.082183837890625, -0.07908821105957031, -0.07599258422851562, -0.07289695739746094, -0.06980133056640625, -0.06670570373535156, -0.06361007690429688, -0.06051445007324219, -0.0574188232421875, -0.05432319641113281, -0.051227569580078125, -0.04813194274902344, -0.04503631591796875, -0.04194068908691406, -0.038845062255859375, -0.03574943542480469, -0.03265380859375, -0.029558181762695312, -0.026462554931640625, -0.023366928100585938, -0.02027130126953125, -0.017175674438476562, -0.014080047607421875, -0.010984420776367188, -0.0078887939453125, -0.0047931671142578125, -0.001697540283203125, 0.0013980865478515625, 0.00449371337890625, 0.0075893402099609375, 0.010684967041015625, 0.013780593872070312, 0.016876220703125, 0.019971847534179688, 0.023067474365234375, 0.026163101196289062, 0.02925872802734375, 0.03235435485839844, 0.035449981689453125, 0.03854560852050781, 0.0416412353515625, 0.04473686218261719, 0.047832489013671875, 0.05092811584472656, 0.05402374267578125, 0.05711936950683594, 0.060214996337890625, 0.06331062316894531, 0.06640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 8.0, 12.0, 13.0, 27.0, 48.0, 49.0, 74.0, 87.0, 164.0, 223.0, 400.0, 783.0, 1738.0, 5098.0, 22108.0, 216899.0, 3839629.0, 87458.0, 12489.0, 3437.0, 1388.0, 730.0, 435.0, 302.0, 183.0, 149.0, 96.0, 74.0, 45.0, 31.0, 28.0, 22.0, 17.0, 13.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.310546875, -0.29779052734375, -0.2850341796875, -0.27227783203125, -0.259521484375, -0.24676513671875, -0.2340087890625, -0.22125244140625, -0.20849609375, -0.19573974609375, -0.1829833984375, -0.17022705078125, -0.157470703125, -0.14471435546875, -0.1319580078125, -0.11920166015625, -0.1064453125, -0.09368896484375, -0.0809326171875, -0.06817626953125, -0.055419921875, -0.04266357421875, -0.0299072265625, -0.01715087890625, -0.00439453125, 0.00836181640625, 0.0211181640625, 0.03387451171875, 0.046630859375, 0.05938720703125, 0.0721435546875, 0.08489990234375, 0.09765625, 0.11041259765625, 0.1231689453125, 0.13592529296875, 0.148681640625, 0.16143798828125, 0.1741943359375, 0.18695068359375, 0.19970703125, 0.21246337890625, 0.2252197265625, 0.23797607421875, 0.250732421875, 0.26348876953125, 0.2762451171875, 0.28900146484375, 0.3017578125, 0.31451416015625, 0.3272705078125, 0.34002685546875, 0.352783203125, 0.36553955078125, 0.3782958984375, 0.39105224609375, 0.40380859375, 0.41656494140625, 0.4293212890625, 0.44207763671875, 0.454833984375, 0.46759033203125, 0.4803466796875, 0.49310302734375, 0.505859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 9.0, 8.0, 9.0, 16.0, 20.0, 29.0, 37.0, 55.0, 107.0, 162.0, 437.0, 1875.0, 834.0, 194.0, 99.0, 63.0, 35.0, 26.0, 20.0, 10.0, 12.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.177978515625, -0.16790390014648438, -0.15782928466796875, -0.14775466918945312, -0.1376800537109375, -0.12760543823242188, -0.11753082275390625, -0.10745620727539062, -0.097381591796875, -0.08730697631835938, -0.07723236083984375, -0.06715774536132812, -0.0570831298828125, -0.047008514404296875, -0.03693389892578125, -0.026859283447265625, -0.01678466796875, -0.006710052490234375, 0.00336456298828125, 0.013439178466796875, 0.0235137939453125, 0.033588409423828125, 0.04366302490234375, 0.053737640380859375, 0.063812255859375, 0.07388687133789062, 0.08396148681640625, 0.09403610229492188, 0.1041107177734375, 0.11418533325195312, 0.12425994873046875, 0.13433456420898438, 0.1444091796875, 0.15448379516601562, 0.16455841064453125, 0.17463302612304688, 0.1847076416015625, 0.19478225708007812, 0.20485687255859375, 0.21493148803710938, 0.225006103515625, 0.23508071899414062, 0.24515533447265625, 0.2552299499511719, 0.2653045654296875, 0.2753791809082031, 0.28545379638671875, 0.2955284118652344, 0.30560302734375, 0.3156776428222656, 0.32575225830078125, 0.3358268737792969, 0.3459014892578125, 0.3559761047363281, 0.36605072021484375, 0.3761253356933594, 0.386199951171875, 0.3962745666503906, 0.40634918212890625, 0.4164237976074219, 0.4264984130859375, 0.4365730285644531, 0.44664764404296875, 0.4567222595214844, 0.466796875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 10.0, 10.0, 33.0, 41.0, 92.0, 157.0, 266.0, 190.0, 103.0, 43.0, 25.0, 18.0, 9.0, 6.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.710350513458252, -4.585576057434082, -4.460801601409912, -4.336026668548584, -4.211252212524414, -4.086477756500244, -3.961703300476074, -3.8369288444519043, -3.7121541500091553, -3.5873796939849854, -3.4626049995422363, -3.3378305435180664, -3.2130560874938965, -3.0882813930511475, -2.9635069370269775, -2.8387322425842285, -2.7139577865600586, -2.5891833305358887, -2.4644086360931396, -2.3396341800689697, -2.2148594856262207, -2.090085029602051, -1.9653105735778809, -1.8405359983444214, -1.715761423110962, -1.5909868478775024, -1.466212272644043, -1.341437816619873, -1.2166632413864136, -1.091888666152954, -0.9671141505241394, -0.8423396348953247, -0.7175650596618652, -0.5927904844284058, -0.46801596879959106, -0.343241423368454, -0.2184668779373169, -0.09369230270385742, 0.031082212924957275, 0.15585672855377197, 0.28063130378723145, 0.40540584921836853, 0.5301803946495056, 0.6549549102783203, 0.7797294855117798, 0.9045040607452393, 1.0292785167694092, 1.1540530920028687, 1.2788276672363281, 1.4036022424697876, 1.528376817703247, 1.653151273727417, 1.7779258489608765, 1.902700424194336, 2.027474880218506, 2.152249336242676, 2.277024030685425, 2.4017984867095947, 2.5265731811523438, 2.6513476371765137, 2.7761220932006836, 2.9008967876434326, 3.0256712436676025, 3.1504459381103516, 3.2752203941345215]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 3.0, 6.0, 2.0, 12.0, 18.0, 19.0, 27.0, 35.0, 51.0, 45.0, 47.0, 49.0, 65.0, 68.0, 60.0, 72.0, 62.0, 70.0, 53.0, 45.0, 35.0, 37.0, 30.0, 17.0, 16.0, 17.0, 12.0, 14.0, 7.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.3712878227233887, -2.3168811798095703, -2.262474298477173, -2.2080676555633545, -2.153660774230957, -2.0992541313171387, -2.044847249984741, -1.9904404878616333, -1.9360337257385254, -1.8816269636154175, -1.8272202014923096, -1.7728134393692017, -1.7184066772460938, -1.6639999151229858, -1.609593152999878, -1.55518639087677, -1.500779628753662, -1.4463728666305542, -1.3919661045074463, -1.3375593423843384, -1.2831525802612305, -1.2287458181381226, -1.1743390560150146, -1.1199322938919067, -1.0655256509780884, -1.0111188888549805, -0.9567121267318726, -0.9023053646087646, -0.8478986024856567, -0.7934918403625488, -0.7390850782394409, -0.684678316116333, -0.6302715539932251, -0.5758647918701172, -0.5214580297470093, -0.46705126762390137, -0.41264450550079346, -0.35823777318000793, -0.3038310110569, -0.24942424893379211, -0.1950174868106842, -0.1406107246875763, -0.08620397001504898, -0.03179721534252167, 0.022609546780586243, 0.07701629400253296, 0.13142305612564087, 0.18582981824874878, 0.2402365803718567, 0.2946433424949646, 0.3490501046180725, 0.4034568667411804, 0.45786362886428833, 0.5122703313827515, 0.5666770935058594, 0.6210838556289673, 0.6754906177520752, 0.7298973798751831, 0.784304141998291, 0.8387109041213989, 0.8931176662445068, 0.9475244283676147, 1.0019311904907227, 1.0563379526138306, 1.1107447147369385]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 9.0, 8.0, 13.0, 25.0, 23.0, 35.0, 60.0, 92.0, 125.0, 213.0, 408.0, 769.0, 1847.0, 5049.0, 16718.0, 74391.0, 617426.0, 272411.0, 42004.0, 10564.0, 3472.0, 1396.0, 644.0, 363.0, 166.0, 107.0, 68.0, 57.0, 27.0, 16.0, 13.0, 5.0, 6.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.76953125, -0.7460861206054688, -0.7226409912109375, -0.6991958618164062, -0.675750732421875, -0.6523056030273438, -0.6288604736328125, -0.6054153442382812, -0.58197021484375, -0.5585250854492188, -0.5350799560546875, -0.5116348266601562, -0.488189697265625, -0.46474456787109375, -0.4412994384765625, -0.41785430908203125, -0.3944091796875, -0.37096405029296875, -0.3475189208984375, -0.32407379150390625, -0.300628662109375, -0.27718353271484375, -0.2537384033203125, -0.23029327392578125, -0.20684814453125, -0.18340301513671875, -0.1599578857421875, -0.13651275634765625, -0.113067626953125, -0.08962249755859375, -0.0661773681640625, -0.04273223876953125, -0.019287109375, 0.00415802001953125, 0.0276031494140625, 0.05104827880859375, 0.074493408203125, 0.09793853759765625, 0.1213836669921875, 0.14482879638671875, 0.16827392578125, 0.19171905517578125, 0.2151641845703125, 0.23860931396484375, 0.262054443359375, 0.28549957275390625, 0.3089447021484375, 0.33238983154296875, 0.3558349609375, 0.37928009033203125, 0.4027252197265625, 0.42617034912109375, 0.449615478515625, 0.47306060791015625, 0.4965057373046875, 0.5199508666992188, 0.54339599609375, 0.5668411254882812, 0.5902862548828125, 0.6137313842773438, 0.637176513671875, 0.6606216430664062, 0.6840667724609375, 0.7075119018554688, 0.73095703125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 8.0, 7.0, 11.0, 18.0, 21.0, 29.0, 35.0, 57.0, 49.0, 69.0, 65.0, 80.0, 95.0, 72.0, 60.0, 70.0, 64.0, 48.0, 40.0, 35.0, 21.0, 15.0, 8.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1334228515625, -0.13029098510742188, -0.12715911865234375, -0.12402725219726562, -0.1208953857421875, -0.11776351928710938, -0.11463165283203125, -0.11149978637695312, -0.108367919921875, -0.10523605346679688, -0.10210418701171875, -0.09897232055664062, -0.0958404541015625, -0.09270858764648438, -0.08957672119140625, -0.08644485473632812, -0.08331298828125, -0.08018112182617188, -0.07704925537109375, -0.07391738891601562, -0.0707855224609375, -0.06765365600585938, -0.06452178955078125, -0.061389923095703125, -0.058258056640625, -0.055126190185546875, -0.05199432373046875, -0.048862457275390625, -0.0457305908203125, -0.042598724365234375, -0.03946685791015625, -0.036334991455078125, -0.033203125, -0.030071258544921875, -0.02693939208984375, -0.023807525634765625, -0.0206756591796875, -0.017543792724609375, -0.01441192626953125, -0.011280059814453125, -0.008148193359375, -0.005016326904296875, -0.00188446044921875, 0.001247406005859375, 0.0043792724609375, 0.007511138916015625, 0.01064300537109375, 0.013774871826171875, 0.01690673828125, 0.020038604736328125, 0.02317047119140625, 0.026302337646484375, 0.0294342041015625, 0.032566070556640625, 0.03569793701171875, 0.038829803466796875, 0.041961669921875, 0.045093536376953125, 0.04822540283203125, 0.051357269287109375, 0.0544891357421875, 0.057621002197265625, 0.06075286865234375, 0.06388473510742188, 0.0670166015625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 1.0, 7.0, 7.0, 11.0, 20.0, 36.0, 63.0, 112.0, 234.0, 465.0, 1136.0, 3294.0, 10379.0, 42559.0, 589037.0, 347984.0, 38674.0, 9509.0, 2953.0, 1124.0, 478.0, 214.0, 114.0, 56.0, 34.0, 20.0, 16.0, 8.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.8642578125, -0.8431625366210938, -0.8220672607421875, -0.8009719848632812, -0.779876708984375, -0.7587814331054688, -0.7376861572265625, -0.7165908813476562, -0.69549560546875, -0.6744003295898438, -0.6533050537109375, -0.6322097778320312, -0.611114501953125, -0.5900192260742188, -0.5689239501953125, -0.5478286743164062, -0.5267333984375, -0.5056381225585938, -0.4845428466796875, -0.46344757080078125, -0.442352294921875, -0.42125701904296875, -0.4001617431640625, -0.37906646728515625, -0.35797119140625, -0.33687591552734375, -0.3157806396484375, -0.29468536376953125, -0.273590087890625, -0.25249481201171875, -0.2313995361328125, -0.21030426025390625, -0.189208984375, -0.16811370849609375, -0.1470184326171875, -0.12592315673828125, -0.104827880859375, -0.08373260498046875, -0.0626373291015625, -0.04154205322265625, -0.02044677734375, 0.00064849853515625, 0.0217437744140625, 0.04283905029296875, 0.063934326171875, 0.08502960205078125, 0.1061248779296875, 0.12722015380859375, 0.1483154296875, 0.16941070556640625, 0.1905059814453125, 0.21160125732421875, 0.232696533203125, 0.25379180908203125, 0.2748870849609375, 0.29598236083984375, 0.31707763671875, 0.33817291259765625, 0.3592681884765625, 0.38036346435546875, 0.401458740234375, 0.42255401611328125, 0.4436492919921875, 0.46474456787109375, 0.48583984375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 13.0, 10.0, 14.0, 14.0, 16.0, 34.0, 36.0, 50.0, 59.0, 67.0, 85.0, 97.0, 85.0, 81.0, 71.0, 57.0, 63.0, 31.0, 38.0, 26.0, 20.0, 12.0, 6.0, 5.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.56103515625, -0.5469741821289062, -0.5329132080078125, -0.5188522338867188, -0.504791259765625, -0.49073028564453125, -0.4766693115234375, -0.46260833740234375, -0.44854736328125, -0.43448638916015625, -0.4204254150390625, -0.40636444091796875, -0.392303466796875, -0.37824249267578125, -0.3641815185546875, -0.35012054443359375, -0.3360595703125, -0.32199859619140625, -0.3079376220703125, -0.29387664794921875, -0.279815673828125, -0.26575469970703125, -0.2516937255859375, -0.23763275146484375, -0.22357177734375, -0.20951080322265625, -0.1954498291015625, -0.18138885498046875, -0.167327880859375, -0.15326690673828125, -0.1392059326171875, -0.12514495849609375, -0.111083984375, -0.09702301025390625, -0.0829620361328125, -0.06890106201171875, -0.054840087890625, -0.04077911376953125, -0.0267181396484375, -0.01265716552734375, 0.00140380859375, 0.01546478271484375, 0.0295257568359375, 0.04358673095703125, 0.057647705078125, 0.07170867919921875, 0.0857696533203125, 0.09983062744140625, 0.1138916015625, 0.12795257568359375, 0.1420135498046875, 0.15607452392578125, 0.170135498046875, 0.18419647216796875, 0.1982574462890625, 0.21231842041015625, 0.22637939453125, 0.24044036865234375, 0.2545013427734375, 0.26856231689453125, 0.282623291015625, 0.29668426513671875, 0.3107452392578125, 0.32480621337890625, 0.3388671875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 6.0, 9.0, 13.0, 27.0, 21.0, 32.0, 51.0, 70.0, 117.0, 147.0, 283.0, 438.0, 795.0, 1621.0, 4031.0, 17222.0, 274971.0, 716161.0, 23524.0, 4944.0, 1826.0, 905.0, 485.0, 295.0, 186.0, 111.0, 76.0, 56.0, 33.0, 25.0, 14.0, 16.0, 8.0, 7.0, 7.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.171142578125, -0.1661205291748047, -0.16109848022460938, -0.15607643127441406, -0.15105438232421875, -0.14603233337402344, -0.14101028442382812, -0.1359882354736328, -0.1309661865234375, -0.1259441375732422, -0.12092208862304688, -0.11590003967285156, -0.11087799072265625, -0.10585594177246094, -0.10083389282226562, -0.09581184387207031, -0.090789794921875, -0.08576774597167969, -0.08074569702148438, -0.07572364807128906, -0.07070159912109375, -0.06567955017089844, -0.060657501220703125, -0.05563545227050781, -0.0506134033203125, -0.04559135437011719, -0.040569305419921875, -0.03554725646972656, -0.03052520751953125, -0.025503158569335938, -0.020481109619140625, -0.015459060668945312, -0.01043701171875, -0.0054149627685546875, -0.000392913818359375, 0.0046291351318359375, 0.00965118408203125, 0.014673233032226562, 0.019695281982421875, 0.024717330932617188, 0.0297393798828125, 0.03476142883300781, 0.039783477783203125, 0.04480552673339844, 0.04982757568359375, 0.05484962463378906, 0.059871673583984375, 0.06489372253417969, 0.069915771484375, 0.07493782043457031, 0.07995986938476562, 0.08498191833496094, 0.09000396728515625, 0.09502601623535156, 0.10004806518554688, 0.10507011413574219, 0.1100921630859375, 0.11511421203613281, 0.12013626098632812, 0.12515830993652344, 0.13018035888671875, 0.13520240783691406, 0.14022445678710938, 0.1452465057373047, 0.1502685546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 0.0, 3.0, 5.0, 2.0, 4.0, 6.0, 8.0, 16.0, 10.0, 15.0, 18.0, 18.0, 26.0, 37.0, 60.0, 76.0, 115.0, 168.0, 121.0, 74.0, 53.0, 26.0, 19.0, 20.0, 15.0, 11.0, 9.0, 15.0, 8.0, 5.0, 5.0, 3.0, 6.0, 1.0, 2.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0003180503845214844, -0.00030934810638427734, -0.0003006458282470703, -0.0002919435501098633, -0.00028324127197265625, -0.0002745389938354492, -0.0002658367156982422, -0.00025713443756103516, -0.0002484321594238281, -0.0002397298812866211, -0.00023102760314941406, -0.00022232532501220703, -0.000213623046875, -0.00020492076873779297, -0.00019621849060058594, -0.0001875162124633789, -0.00017881393432617188, -0.00017011165618896484, -0.0001614093780517578, -0.00015270709991455078, -0.00014400482177734375, -0.00013530254364013672, -0.0001266002655029297, -0.00011789798736572266, -0.00010919570922851562, -0.0001004934310913086, -9.179115295410156e-05, -8.308887481689453e-05, -7.43865966796875e-05, -6.568431854248047e-05, -5.698204040527344e-05, -4.8279762268066406e-05, -3.9577484130859375e-05, -3.0875205993652344e-05, -2.2172927856445312e-05, -1.3470649719238281e-05, -4.76837158203125e-06, 3.933906555175781e-06, 1.2636184692382812e-05, 2.1338462829589844e-05, 3.0040740966796875e-05, 3.8743019104003906e-05, 4.744529724121094e-05, 5.614757537841797e-05, 6.4849853515625e-05, 7.355213165283203e-05, 8.225440979003906e-05, 9.09566879272461e-05, 9.965896606445312e-05, 0.00010836124420166016, 0.00011706352233886719, 0.00012576580047607422, 0.00013446807861328125, 0.00014317035675048828, 0.0001518726348876953, 0.00016057491302490234, 0.00016927719116210938, 0.0001779794692993164, 0.00018668174743652344, 0.00019538402557373047, 0.0002040863037109375, 0.00021278858184814453, 0.00022149085998535156, 0.0002301931381225586, 0.00023889541625976562]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 9.0, 6.0, 6.0, 6.0, 12.0, 13.0, 24.0, 32.0, 69.0, 85.0, 119.0, 211.0, 334.0, 632.0, 1188.0, 2323.0, 4939.0, 11748.0, 35874.0, 178759.0, 699847.0, 76750.0, 20680.0, 7688.0, 3323.0, 1709.0, 918.0, 493.0, 292.0, 164.0, 106.0, 67.0, 31.0, 39.0, 23.0, 10.0, 10.0, 10.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06988525390625, -0.06757640838623047, -0.06526756286621094, -0.0629587173461914, -0.060649871826171875, -0.058341026306152344, -0.05603218078613281, -0.05372333526611328, -0.05141448974609375, -0.04910564422607422, -0.04679679870605469, -0.044487953186035156, -0.042179107666015625, -0.039870262145996094, -0.03756141662597656, -0.03525257110595703, -0.0329437255859375, -0.03063488006591797, -0.028326034545898438, -0.026017189025878906, -0.023708343505859375, -0.021399497985839844, -0.019090652465820312, -0.01678180694580078, -0.01447296142578125, -0.012164115905761719, -0.009855270385742188, -0.007546424865722656, -0.005237579345703125, -0.0029287338256835938, -0.0006198883056640625, 0.0016889572143554688, 0.003997802734375, 0.006306648254394531, 0.008615493774414062, 0.010924339294433594, 0.013233184814453125, 0.015542030334472656, 0.017850875854492188, 0.02015972137451172, 0.02246856689453125, 0.02477741241455078, 0.027086257934570312, 0.029395103454589844, 0.031703948974609375, 0.034012794494628906, 0.03632164001464844, 0.03863048553466797, 0.0409393310546875, 0.04324817657470703, 0.04555702209472656, 0.047865867614746094, 0.050174713134765625, 0.052483558654785156, 0.05479240417480469, 0.05710124969482422, 0.05941009521484375, 0.06171894073486328, 0.06402778625488281, 0.06633663177490234, 0.06864547729492188, 0.0709543228149414, 0.07326316833496094, 0.07557201385498047, 0.077880859375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 2.0, 5.0, 11.0, 8.0, 8.0, 14.0, 13.0, 30.0, 39.0, 49.0, 57.0, 78.0, 92.0, 97.0, 112.0, 83.0, 67.0, 57.0, 44.0, 33.0, 17.0, 23.0, 13.0, 5.0, 10.0, 4.0, 6.0, 0.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0567626953125, -0.054986000061035156, -0.05320930480957031, -0.05143260955810547, -0.049655914306640625, -0.04787921905517578, -0.04610252380371094, -0.044325828552246094, -0.04254913330078125, -0.040772438049316406, -0.03899574279785156, -0.03721904754638672, -0.035442352294921875, -0.03366565704345703, -0.03188896179199219, -0.030112266540527344, -0.0283355712890625, -0.026558876037597656, -0.024782180786132812, -0.02300548553466797, -0.021228790283203125, -0.01945209503173828, -0.017675399780273438, -0.015898704528808594, -0.01412200927734375, -0.012345314025878906, -0.010568618774414062, -0.008791923522949219, -0.007015228271484375, -0.005238533020019531, -0.0034618377685546875, -0.0016851425170898438, 9.1552734375e-05, 0.0018682479858398438, 0.0036449432373046875, 0.005421638488769531, 0.007198333740234375, 0.008975028991699219, 0.010751724243164062, 0.012528419494628906, 0.01430511474609375, 0.016081809997558594, 0.017858505249023438, 0.01963520050048828, 0.021411895751953125, 0.02318859100341797, 0.024965286254882812, 0.026741981506347656, 0.0285186767578125, 0.030295372009277344, 0.03207206726074219, 0.03384876251220703, 0.035625457763671875, 0.03740215301513672, 0.03917884826660156, 0.040955543518066406, 0.04273223876953125, 0.044508934020996094, 0.04628562927246094, 0.04806232452392578, 0.049839019775390625, 0.05161571502685547, 0.05339241027832031, 0.055169105529785156, 0.05694580078125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 10.0, 21.0, 16.0, 49.0, 91.0, 191.0, 259.0, 123.0, 68.0, 38.0, 35.0, 20.0, 14.0, 19.0, 10.0, 9.0, 8.0, 7.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.241309404373169, -1.1639025211334229, -1.0864956378936768, -1.0090887546539307, -0.9316819310188293, -0.8542750477790833, -0.7768682241439819, -0.6994613409042358, -0.6220544576644897, -0.5446475744247437, -0.46724072098731995, -0.38983386754989624, -0.31242698431015015, -0.23502010107040405, -0.15761324763298035, -0.08020639419555664, -0.002799510955810547, 0.07460735738277435, 0.15201422572135925, 0.22942109405994415, 0.30682796239852905, 0.38423484563827515, 0.46164169907569885, 0.5390485525131226, 0.6164554357528687, 0.6938623189926147, 0.7712692022323608, 0.8486760258674622, 0.9260829091072083, 1.0034897327423096, 1.0808966159820557, 1.1583034992218018, 1.2357103824615479, 1.313117265701294, 1.39052414894104, 1.4679310321807861, 1.5453379154205322, 1.6227447986602783, 1.7001515626907349, 1.777558445930481, 1.854965329170227, 1.9323722124099731, 2.0097789764404297, 2.087185859680176, 2.164592742919922, 2.241999626159668, 2.319406509399414, 2.39681339263916, 2.4742202758789062, 2.5516271591186523, 2.6290340423583984, 2.7064409255981445, 2.7838478088378906, 2.8612546920776367, 2.938661575317383, 3.016068458557129, 3.093475341796875, 3.170882225036621, 3.248289108276367, 3.3256959915161133, 3.4031028747558594, 3.4805097579956055, 3.5579166412353516, 3.6353235244750977, 3.7127301692962646]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 7.0, 8.0, 15.0, 10.0, 19.0, 19.0, 25.0, 28.0, 41.0, 39.0, 46.0, 31.0, 59.0, 83.0, 91.0, 99.0, 81.0, 40.0, 42.0, 29.0, 28.0, 35.0, 19.0, 27.0, 16.0, 12.0, 9.0, 19.0, 9.0, 5.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9773365259170532, -0.9343498349189758, -0.8913631439208984, -0.8483763933181763, -0.8053897023200989, -0.7624030113220215, -0.7194162607192993, -0.6764295697212219, -0.6334428787231445, -0.5904561877250671, -0.5474694967269897, -0.5044827461242676, -0.4614960551261902, -0.4185093641281128, -0.375522643327713, -0.33253592252731323, -0.28954923152923584, -0.24656252562999725, -0.20357581973075867, -0.16058911383152008, -0.1176024079322815, -0.07461570203304291, -0.03162899613380432, 0.011357724666595459, 0.05434441566467285, 0.09733112156391144, 0.14031782746315002, 0.1833045333623886, 0.2262912392616272, 0.2692779302597046, 0.31226465106010437, 0.35525137186050415, 0.39823806285858154, 0.44122475385665894, 0.4842114746570587, 0.5271981954574585, 0.5701848864555359, 0.6131715774536133, 0.6561583280563354, 0.6991450190544128, 0.7421317100524902, 0.7851184010505676, 0.828105092048645, 0.8710918426513672, 0.9140785336494446, 0.957065224647522, 1.0000519752502441, 1.0430386066436768, 1.086025357246399, 1.129012107849121, 1.1719987392425537, 1.2149854898452759, 1.257972240447998, 1.3009588718414307, 1.3439456224441528, 1.386932373046875, 1.4299190044403076, 1.4729057550430298, 1.5158923864364624, 1.5588791370391846, 1.6018657684326172, 1.6448525190353394, 1.6878392696380615, 1.7308259010314941, 1.7738126516342163]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 4.0, 0.0, 5.0, 8.0, 11.0, 14.0, 20.0, 27.0, 42.0, 58.0, 93.0, 152.0, 221.0, 442.0, 742.0, 1492.0, 3362.0, 13668.0, 275029.0, 3837368.0, 49025.0, 7592.0, 2566.0, 1068.0, 554.0, 253.0, 179.0, 100.0, 48.0, 46.0, 27.0, 21.0, 16.0, 4.0, 5.0, 3.0, 10.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0205078125, -0.99072265625, -0.9609375, -0.93115234375, -0.9013671875, -0.87158203125, -0.841796875, -0.81201171875, -0.7822265625, -0.75244140625, -0.72265625, -0.69287109375, -0.6630859375, -0.63330078125, -0.603515625, -0.57373046875, -0.5439453125, -0.51416015625, -0.484375, -0.45458984375, -0.4248046875, -0.39501953125, -0.365234375, -0.33544921875, -0.3056640625, -0.27587890625, -0.24609375, -0.21630859375, -0.1865234375, -0.15673828125, -0.126953125, -0.09716796875, -0.0673828125, -0.03759765625, -0.0078125, 0.02197265625, 0.0517578125, 0.08154296875, 0.111328125, 0.14111328125, 0.1708984375, 0.20068359375, 0.23046875, 0.26025390625, 0.2900390625, 0.31982421875, 0.349609375, 0.37939453125, 0.4091796875, 0.43896484375, 0.46875, 0.49853515625, 0.5283203125, 0.55810546875, 0.587890625, 0.61767578125, 0.6474609375, 0.67724609375, 0.70703125, 0.73681640625, 0.7666015625, 0.79638671875, 0.826171875, 0.85595703125, 0.8857421875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 9.0, 15.0, 19.0, 23.0, 28.0, 55.0, 50.0, 62.0, 81.0, 88.0, 92.0, 76.0, 85.0, 71.0, 59.0, 56.0, 38.0, 25.0, 17.0, 21.0, 8.0, 6.0, 8.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.131103515625, -0.127960205078125, -0.12481689453125, -0.121673583984375, -0.1185302734375, -0.115386962890625, -0.11224365234375, -0.109100341796875, -0.10595703125, -0.102813720703125, -0.09967041015625, -0.096527099609375, -0.0933837890625, -0.090240478515625, -0.08709716796875, -0.083953857421875, -0.080810546875, -0.077667236328125, -0.07452392578125, -0.071380615234375, -0.0682373046875, -0.065093994140625, -0.06195068359375, -0.058807373046875, -0.0556640625, -0.052520751953125, -0.04937744140625, -0.046234130859375, -0.0430908203125, -0.039947509765625, -0.03680419921875, -0.033660888671875, -0.030517578125, -0.027374267578125, -0.02423095703125, -0.021087646484375, -0.0179443359375, -0.014801025390625, -0.01165771484375, -0.008514404296875, -0.00537109375, -0.002227783203125, 0.00091552734375, 0.004058837890625, 0.0072021484375, 0.010345458984375, 0.01348876953125, 0.016632080078125, 0.019775390625, 0.022918701171875, 0.02606201171875, 0.029205322265625, 0.0323486328125, 0.035491943359375, 0.03863525390625, 0.041778564453125, 0.044921875, 0.048065185546875, 0.05120849609375, 0.054351806640625, 0.0574951171875, 0.060638427734375, 0.06378173828125, 0.066925048828125, 0.070068359375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 8.0, 17.0, 16.0, 27.0, 35.0, 43.0, 80.0, 130.0, 230.0, 358.0, 714.0, 1711.0, 6271.0, 54629.0, 3638589.0, 466628.0, 18929.0, 3378.0, 1224.0, 540.0, 297.0, 159.0, 98.0, 64.0, 36.0, 27.0, 12.0, 5.0, 9.0, 4.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.818359375, -0.7972640991210938, -0.7761688232421875, -0.7550735473632812, -0.733978271484375, -0.7128829956054688, -0.6917877197265625, -0.6706924438476562, -0.64959716796875, -0.6285018920898438, -0.6074066162109375, -0.5863113403320312, -0.565216064453125, -0.5441207885742188, -0.5230255126953125, -0.5019302368164062, -0.4808349609375, -0.45973968505859375, -0.4386444091796875, -0.41754913330078125, -0.396453857421875, -0.37535858154296875, -0.3542633056640625, -0.33316802978515625, -0.31207275390625, -0.29097747802734375, -0.2698822021484375, -0.24878692626953125, -0.227691650390625, -0.20659637451171875, -0.1855010986328125, -0.16440582275390625, -0.143310546875, -0.12221527099609375, -0.1011199951171875, -0.08002471923828125, -0.058929443359375, -0.03783416748046875, -0.0167388916015625, 0.00435638427734375, 0.02545166015625, 0.04654693603515625, 0.0676422119140625, 0.08873748779296875, 0.109832763671875, 0.13092803955078125, 0.1520233154296875, 0.17311859130859375, 0.1942138671875, 0.21530914306640625, 0.2364044189453125, 0.25749969482421875, 0.278594970703125, 0.29969024658203125, 0.3207855224609375, 0.34188079833984375, 0.36297607421875, 0.38407135009765625, 0.4051666259765625, 0.42626190185546875, 0.447357177734375, 0.46845245361328125, 0.4895477294921875, 0.5106430053710938, 0.53173828125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 11.0, 10.0, 32.0, 35.0, 93.0, 168.0, 370.0, 1024.0, 1412.0, 469.0, 230.0, 109.0, 52.0, 28.0, 11.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.80810546875, -0.788909912109375, -0.76971435546875, -0.750518798828125, -0.7313232421875, -0.712127685546875, -0.69293212890625, -0.673736572265625, -0.654541015625, -0.635345458984375, -0.61614990234375, -0.596954345703125, -0.5777587890625, -0.558563232421875, -0.53936767578125, -0.520172119140625, -0.5009765625, -0.481781005859375, -0.46258544921875, -0.443389892578125, -0.4241943359375, -0.404998779296875, -0.38580322265625, -0.366607666015625, -0.347412109375, -0.328216552734375, -0.30902099609375, -0.289825439453125, -0.2706298828125, -0.251434326171875, -0.23223876953125, -0.213043212890625, -0.19384765625, -0.174652099609375, -0.15545654296875, -0.136260986328125, -0.1170654296875, -0.097869873046875, -0.07867431640625, -0.059478759765625, -0.040283203125, -0.021087646484375, -0.00189208984375, 0.017303466796875, 0.0364990234375, 0.055694580078125, 0.07489013671875, 0.094085693359375, 0.11328125, 0.132476806640625, 0.15167236328125, 0.170867919921875, 0.1900634765625, 0.209259033203125, 0.22845458984375, 0.247650146484375, 0.266845703125, 0.286041259765625, 0.30523681640625, 0.324432373046875, 0.3436279296875, 0.362823486328125, 0.38201904296875, 0.401214599609375, 0.42041015625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 0.0, 5.0, 3.0, 6.0, 5.0, 4.0, 7.0, 7.0, 14.0, 6.0, 11.0, 25.0, 30.0, 30.0, 53.0, 65.0, 94.0, 116.0, 119.0, 106.0, 76.0, 53.0, 44.0, 31.0, 26.0, 19.0, 13.0, 13.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.063363075256348, -3.969193458557129, -3.875023603439331, -3.7808539867401123, -3.6866843700408936, -3.5925145149230957, -3.498344898223877, -3.404175281524658, -3.3100056648254395, -3.2158360481262207, -3.121666193008423, -3.027496576309204, -2.9333269596099854, -2.8391571044921875, -2.7449874877929688, -2.65081787109375, -2.556648015975952, -2.4624783992767334, -2.3683085441589355, -2.274138927459717, -2.179969310760498, -2.0857996940612793, -1.9916298389434814, -1.8974602222442627, -1.8032904863357544, -1.709120750427246, -1.6149511337280273, -1.520781397819519, -1.4266116619110107, -1.332442045211792, -1.2382723093032837, -1.1441025733947754, -1.0499327182769775, -0.955763041973114, -0.8615933656692505, -0.7674236297607422, -0.6732539534568787, -0.5790842771530151, -0.48491454124450684, -0.3907448649406433, -0.2965751886367798, -0.20240549743175507, -0.10823580622673035, -0.014066100120544434, 0.08010357618331909, 0.17427325248718262, 0.2684429883956909, 0.36261266469955444, 0.45678234100341797, 0.5509520173072815, 0.645121693611145, 0.7392914295196533, 0.8334611058235168, 0.9276307821273804, 1.0218005180358887, 1.1159701347351074, 1.2101398706436157, 1.304309606552124, 1.3984792232513428, 1.492648959159851, 1.5868186950683594, 1.6809883117675781, 1.7751580476760864, 1.8693277835845947, 1.9634974002838135]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 1.0, 4.0, 10.0, 18.0, 9.0, 8.0, 11.0, 14.0, 22.0, 17.0, 14.0, 34.0, 24.0, 31.0, 47.0, 42.0, 43.0, 51.0, 43.0, 39.0, 48.0, 36.0, 54.0, 39.0, 40.0, 19.0, 32.0, 22.0, 31.0, 29.0, 17.0, 23.0, 20.0, 12.0, 16.0, 8.0, 14.0, 11.0, 10.0, 5.0, 7.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.9230966567993164, -1.8669215440750122, -1.810746431350708, -1.7545711994171143, -1.69839608669281, -1.6422209739685059, -1.5860458612442017, -1.5298707485198975, -1.4736956357955933, -1.417520523071289, -1.3613454103469849, -1.3051702976226807, -1.248995065689087, -1.1928199529647827, -1.1366448402404785, -1.0804697275161743, -1.0242946147918701, -0.9681195020675659, -0.9119443297386169, -0.8557692170143127, -0.7995941042900085, -0.7434189319610596, -0.6872438192367554, -0.6310687065124512, -0.5748934745788574, -0.5187183618545532, -0.46254321932792664, -0.40636807680130005, -0.35019296407699585, -0.29401782155036926, -0.23784267902374268, -0.18166756629943848, -0.12549245357513428, -0.06931732594966888, -0.013142190873622894, 0.043032944202423096, 0.09920807182788849, 0.15538319945335388, 0.21155834197998047, 0.26773345470428467, 0.32390859723091125, 0.38008373975753784, 0.43625885248184204, 0.49243399500846863, 0.5486091375350952, 0.6047842502593994, 0.6609593629837036, 0.7171344757080078, 0.7733096480369568, 0.829484760761261, 0.88565993309021, 0.9418350458145142, 0.9980101585388184, 1.0541852712631226, 1.1103603839874268, 1.1665356159210205, 1.2227107286453247, 1.278885841369629, 1.335060954093933, 1.3912360668182373, 1.447411298751831, 1.5035864114761353, 1.5597615242004395, 1.6159366369247437, 1.6721117496490479]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 6.0, 6.0, 11.0, 12.0, 35.0, 43.0, 75.0, 90.0, 160.0, 279.0, 430.0, 736.0, 1385.0, 2604.0, 5290.0, 11768.0, 30116.0, 100071.0, 579093.0, 227486.0, 54158.0, 18918.0, 7754.0, 3646.0, 1877.0, 963.0, 585.0, 335.0, 223.0, 149.0, 82.0, 57.0, 29.0, 30.0, 16.0, 14.0, 10.0, 2.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.642578125, -0.6229629516601562, -0.6033477783203125, -0.5837326049804688, -0.564117431640625, -0.5445022583007812, -0.5248870849609375, -0.5052719116210938, -0.48565673828125, -0.46604156494140625, -0.4464263916015625, -0.42681121826171875, -0.407196044921875, -0.38758087158203125, -0.3679656982421875, -0.34835052490234375, -0.3287353515625, -0.30912017822265625, -0.2895050048828125, -0.26988983154296875, -0.250274658203125, -0.23065948486328125, -0.2110443115234375, -0.19142913818359375, -0.17181396484375, -0.15219879150390625, -0.1325836181640625, -0.11296844482421875, -0.093353271484375, -0.07373809814453125, -0.0541229248046875, -0.03450775146484375, -0.014892578125, 0.00472259521484375, 0.0243377685546875, 0.04395294189453125, 0.063568115234375, 0.08318328857421875, 0.1027984619140625, 0.12241363525390625, 0.14202880859375, 0.16164398193359375, 0.1812591552734375, 0.20087432861328125, 0.220489501953125, 0.24010467529296875, 0.2597198486328125, 0.27933502197265625, 0.2989501953125, 0.31856536865234375, 0.3381805419921875, 0.35779571533203125, 0.377410888671875, 0.39702606201171875, 0.4166412353515625, 0.43625640869140625, 0.45587158203125, 0.47548675537109375, 0.4951019287109375, 0.5147171020507812, 0.534332275390625, 0.5539474487304688, 0.5735626220703125, 0.5931777954101562, 0.61279296875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 7.0, 6.0, 7.0, 11.0, 17.0, 14.0, 27.0, 17.0, 35.0, 49.0, 41.0, 44.0, 41.0, 56.0, 74.0, 54.0, 76.0, 59.0, 51.0, 56.0, 44.0, 26.0, 43.0, 28.0, 26.0, 22.0, 13.0, 10.0, 11.0, 4.0, 5.0, 11.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.14208984375, -0.13840484619140625, -0.1347198486328125, -0.13103485107421875, -0.127349853515625, -0.12366485595703125, -0.1199798583984375, -0.11629486083984375, -0.11260986328125, -0.10892486572265625, -0.1052398681640625, -0.10155487060546875, -0.097869873046875, -0.09418487548828125, -0.0904998779296875, -0.08681488037109375, -0.0831298828125, -0.07944488525390625, -0.0757598876953125, -0.07207489013671875, -0.068389892578125, -0.06470489501953125, -0.0610198974609375, -0.05733489990234375, -0.05364990234375, -0.04996490478515625, -0.0462799072265625, -0.04259490966796875, -0.038909912109375, -0.03522491455078125, -0.0315399169921875, -0.02785491943359375, -0.024169921875, -0.02048492431640625, -0.0167999267578125, -0.01311492919921875, -0.009429931640625, -0.00574493408203125, -0.0020599365234375, 0.00162506103515625, 0.00531005859375, 0.00899505615234375, 0.0126800537109375, 0.01636505126953125, 0.020050048828125, 0.02373504638671875, 0.0274200439453125, 0.03110504150390625, 0.0347900390625, 0.03847503662109375, 0.0421600341796875, 0.04584503173828125, 0.049530029296875, 0.05321502685546875, 0.0569000244140625, 0.06058502197265625, 0.06427001953125, 0.06795501708984375, 0.0716400146484375, 0.07532501220703125, 0.079010009765625, 0.08269500732421875, 0.0863800048828125, 0.09006500244140625, 0.09375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 7.0, 4.0, 5.0, 7.0, 12.0, 16.0, 30.0, 31.0, 53.0, 71.0, 98.0, 141.0, 189.0, 330.0, 562.0, 885.0, 1517.0, 2934.0, 5850.0, 13647.0, 37684.0, 175770.0, 695631.0, 73242.0, 21823.0, 8709.0, 4150.0, 2073.0, 1164.0, 726.0, 407.0, 241.0, 160.0, 112.0, 96.0, 52.0, 42.0, 25.0, 17.0, 9.0, 11.0, 4.0, 6.0, 8.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.576171875, -0.5564727783203125, -0.536773681640625, -0.5170745849609375, -0.49737548828125, -0.4776763916015625, -0.457977294921875, -0.4382781982421875, -0.4185791015625, -0.3988800048828125, -0.379180908203125, -0.3594818115234375, -0.33978271484375, -0.3200836181640625, -0.300384521484375, -0.2806854248046875, -0.260986328125, -0.2412872314453125, -0.221588134765625, -0.2018890380859375, -0.18218994140625, -0.1624908447265625, -0.142791748046875, -0.1230926513671875, -0.1033935546875, -0.0836944580078125, -0.063995361328125, -0.0442962646484375, -0.02459716796875, -0.0048980712890625, 0.014801025390625, 0.0345001220703125, 0.05419921875, 0.0738983154296875, 0.093597412109375, 0.1132965087890625, 0.13299560546875, 0.1526947021484375, 0.172393798828125, 0.1920928955078125, 0.2117919921875, 0.2314910888671875, 0.251190185546875, 0.2708892822265625, 0.29058837890625, 0.3102874755859375, 0.329986572265625, 0.3496856689453125, 0.369384765625, 0.3890838623046875, 0.408782958984375, 0.4284820556640625, 0.44818115234375, 0.4678802490234375, 0.487579345703125, 0.5072784423828125, 0.5269775390625, 0.5466766357421875, 0.566375732421875, 0.5860748291015625, 0.60577392578125, 0.6254730224609375, 0.645172119140625, 0.6648712158203125, 0.6845703125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 5.0, 4.0, 9.0, 9.0, 8.0, 17.0, 16.0, 19.0, 28.0, 42.0, 43.0, 60.0, 69.0, 76.0, 72.0, 74.0, 72.0, 89.0, 53.0, 43.0, 35.0, 36.0, 24.0, 20.0, 15.0, 16.0, 12.0, 6.0, 6.0, 9.0, 5.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.67138671875, -0.650665283203125, -0.62994384765625, -0.609222412109375, -0.5885009765625, -0.567779541015625, -0.54705810546875, -0.526336669921875, -0.505615234375, -0.484893798828125, -0.46417236328125, -0.443450927734375, -0.4227294921875, -0.402008056640625, -0.38128662109375, -0.360565185546875, -0.33984375, -0.319122314453125, -0.29840087890625, -0.277679443359375, -0.2569580078125, -0.236236572265625, -0.21551513671875, -0.194793701171875, -0.174072265625, -0.153350830078125, -0.13262939453125, -0.111907958984375, -0.0911865234375, -0.070465087890625, -0.04974365234375, -0.029022216796875, -0.00830078125, 0.012420654296875, 0.03314208984375, 0.053863525390625, 0.0745849609375, 0.095306396484375, 0.11602783203125, 0.136749267578125, 0.157470703125, 0.178192138671875, 0.19891357421875, 0.219635009765625, 0.2403564453125, 0.261077880859375, 0.28179931640625, 0.302520751953125, 0.3232421875, 0.343963623046875, 0.36468505859375, 0.385406494140625, 0.4061279296875, 0.426849365234375, 0.44757080078125, 0.468292236328125, 0.489013671875, 0.509735107421875, 0.53045654296875, 0.551177978515625, 0.5718994140625, 0.592620849609375, 0.61334228515625, 0.634063720703125, 0.65478515625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 6.0, 6.0, 4.0, 8.0, 13.0, 12.0, 8.0, 43.0, 58.0, 103.0, 153.0, 300.0, 522.0, 1004.0, 2033.0, 4758.0, 12792.0, 47160.0, 729224.0, 203781.0, 30159.0, 9295.0, 3658.0, 1636.0, 820.0, 421.0, 213.0, 143.0, 73.0, 52.0, 32.0, 24.0, 17.0, 20.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12347412109375, -0.11947154998779297, -0.11546897888183594, -0.1114664077758789, -0.10746383666992188, -0.10346126556396484, -0.09945869445800781, -0.09545612335205078, -0.09145355224609375, -0.08745098114013672, -0.08344841003417969, -0.07944583892822266, -0.07544326782226562, -0.0714406967163086, -0.06743812561035156, -0.06343555450439453, -0.0594329833984375, -0.05543041229248047, -0.05142784118652344, -0.047425270080566406, -0.043422698974609375, -0.039420127868652344, -0.03541755676269531, -0.03141498565673828, -0.02741241455078125, -0.02340984344482422, -0.019407272338867188, -0.015404701232910156, -0.011402130126953125, -0.007399559020996094, -0.0033969879150390625, 0.0006055831909179688, 0.004608154296875, 0.008610725402832031, 0.012613296508789062, 0.016615867614746094, 0.020618438720703125, 0.024621009826660156, 0.028623580932617188, 0.03262615203857422, 0.03662872314453125, 0.04063129425048828, 0.04463386535644531, 0.048636436462402344, 0.052639007568359375, 0.056641578674316406, 0.06064414978027344, 0.06464672088623047, 0.0686492919921875, 0.07265186309814453, 0.07665443420410156, 0.0806570053100586, 0.08465957641601562, 0.08866214752197266, 0.09266471862792969, 0.09666728973388672, 0.10066986083984375, 0.10467243194580078, 0.10867500305175781, 0.11267757415771484, 0.11668014526367188, 0.1206827163696289, 0.12468528747558594, 0.12868785858154297, 0.1326904296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 11.0, 26.0, 37.0, 90.0, 147.0, 263.0, 195.0, 97.0, 43.0, 24.0, 11.0, 10.0, 6.0, 9.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027561187744140625, -0.0002676434814929962, -0.0002596750855445862, -0.00025170668959617615, -0.0002437382936477661, -0.00023576989769935608, -0.00022780150175094604, -0.000219833105802536, -0.00021186470985412598, -0.00020389631390571594, -0.0001959279179573059, -0.00018795952200889587, -0.00017999112606048584, -0.0001720227301120758, -0.00016405433416366577, -0.00015608593821525574, -0.0001481175422668457, -0.00014014914631843567, -0.00013218075037002563, -0.0001242123544216156, -0.00011624395847320557, -0.00010827556252479553, -0.0001003071665763855, -9.233877062797546e-05, -8.437037467956543e-05, -7.64019787311554e-05, -6.843358278274536e-05, -6.046518683433533e-05, -5.249679088592529e-05, -4.452839493751526e-05, -3.6559998989105225e-05, -2.859160304069519e-05, -2.0623207092285156e-05, -1.2654811143875122e-05, -4.686415195465088e-06, 3.2819807529449463e-06, 1.125037670135498e-05, 1.9218772649765015e-05, 2.718716859817505e-05, 3.515556454658508e-05, 4.312396049499512e-05, 5.109235644340515e-05, 5.9060752391815186e-05, 6.702914834022522e-05, 7.499754428863525e-05, 8.296594023704529e-05, 9.093433618545532e-05, 9.890273213386536e-05, 0.00010687112808227539, 0.00011483952403068542, 0.00012280791997909546, 0.0001307763159275055, 0.00013874471187591553, 0.00014671310782432556, 0.0001546815037727356, 0.00016264989972114563, 0.00017061829566955566, 0.0001785866916179657, 0.00018655508756637573, 0.00019452348351478577, 0.0002024918794631958, 0.00021046027541160583, 0.00021842867136001587, 0.0002263970673084259, 0.00023436546325683594]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 1.0, 6.0, 8.0, 8.0, 12.0, 27.0, 27.0, 43.0, 46.0, 91.0, 120.0, 164.0, 289.0, 394.0, 611.0, 1055.0, 1778.0, 3114.0, 6206.0, 13655.0, 34000.0, 126776.0, 721771.0, 87525.0, 27257.0, 11210.0, 5308.0, 2816.0, 1611.0, 952.0, 537.0, 357.0, 243.0, 162.0, 118.0, 68.0, 44.0, 38.0, 30.0, 16.0, 17.0, 13.0, 7.0, 4.0, 10.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.07684326171875, -0.07447052001953125, -0.0720977783203125, -0.06972503662109375, -0.067352294921875, -0.06497955322265625, -0.0626068115234375, -0.06023406982421875, -0.057861328125, -0.05548858642578125, -0.0531158447265625, -0.05074310302734375, -0.048370361328125, -0.04599761962890625, -0.0436248779296875, -0.04125213623046875, -0.03887939453125, -0.03650665283203125, -0.0341339111328125, -0.03176116943359375, -0.029388427734375, -0.02701568603515625, -0.0246429443359375, -0.02227020263671875, -0.0198974609375, -0.01752471923828125, -0.0151519775390625, -0.01277923583984375, -0.010406494140625, -0.00803375244140625, -0.0056610107421875, -0.00328826904296875, -0.00091552734375, 0.00145721435546875, 0.0038299560546875, 0.00620269775390625, 0.008575439453125, 0.01094818115234375, 0.0133209228515625, 0.01569366455078125, 0.01806640625, 0.02043914794921875, 0.0228118896484375, 0.02518463134765625, 0.027557373046875, 0.02993011474609375, 0.0323028564453125, 0.03467559814453125, 0.03704833984375, 0.03942108154296875, 0.0417938232421875, 0.04416656494140625, 0.046539306640625, 0.04891204833984375, 0.0512847900390625, 0.05365753173828125, 0.0560302734375, 0.05840301513671875, 0.0607757568359375, 0.06314849853515625, 0.065521240234375, 0.06789398193359375, 0.0702667236328125, 0.07263946533203125, 0.07501220703125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 0.0, 3.0, 2.0, 3.0, 11.0, 9.0, 9.0, 16.0, 12.0, 18.0, 37.0, 29.0, 49.0, 40.0, 64.0, 99.0, 125.0, 110.0, 73.0, 62.0, 48.0, 35.0, 23.0, 21.0, 21.0, 25.0, 13.0, 5.0, 9.0, 8.0, 3.0, 7.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.081298828125, -0.07847118377685547, -0.07564353942871094, -0.0728158950805664, -0.06998825073242188, -0.06716060638427734, -0.06433296203613281, -0.06150531768798828, -0.05867767333984375, -0.05585002899169922, -0.05302238464355469, -0.050194740295410156, -0.047367095947265625, -0.044539451599121094, -0.04171180725097656, -0.03888416290283203, -0.0360565185546875, -0.03322887420654297, -0.030401229858398438, -0.027573585510253906, -0.024745941162109375, -0.021918296813964844, -0.019090652465820312, -0.01626300811767578, -0.01343536376953125, -0.010607719421386719, -0.0077800750732421875, -0.004952430725097656, -0.002124786376953125, 0.0007028579711914062, 0.0035305023193359375, 0.006358146667480469, 0.009185791015625, 0.012013435363769531, 0.014841079711914062, 0.017668724060058594, 0.020496368408203125, 0.023324012756347656, 0.026151657104492188, 0.02897930145263672, 0.03180694580078125, 0.03463459014892578, 0.03746223449707031, 0.040289878845214844, 0.043117523193359375, 0.045945167541503906, 0.04877281188964844, 0.05160045623779297, 0.0544281005859375, 0.05725574493408203, 0.06008338928222656, 0.0629110336303711, 0.06573867797851562, 0.06856632232666016, 0.07139396667480469, 0.07422161102294922, 0.07704925537109375, 0.07987689971923828, 0.08270454406738281, 0.08553218841552734, 0.08835983276367188, 0.0911874771118164, 0.09401512145996094, 0.09684276580810547, 0.09967041015625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 11.0, 9.0, 11.0, 10.0, 23.0, 35.0, 53.0, 72.0, 152.0, 411.0, 118.0, 39.0, 26.0, 9.0, 9.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.351711750030518, -6.17690372467041, -6.002095699310303, -5.827287673950195, -5.65247917175293, -5.477671146392822, -5.302863121032715, -5.128055095672607, -4.9532470703125, -4.778439044952393, -4.603631019592285, -4.4288225173950195, -4.254014492034912, -4.079206466674805, -3.9043984413146973, -3.72959041595459, -3.554781913757324, -3.379973888397217, -3.2051656246185303, -3.030357599258423, -2.8555493354797363, -2.680741310119629, -2.5059332847595215, -2.331125259399414, -2.1563169956207275, -1.9815088510513306, -1.8067007064819336, -1.6318926811218262, -1.4570845365524292, -1.2822763919830322, -1.1074683666229248, -0.9326602220535278, -0.7578525543212891, -0.5830444097518921, -0.4082363247871399, -0.2334282398223877, -0.05862009525299072, 0.11618804931640625, 0.29099607467651367, 0.46580421924591064, 0.6406123638153076, 0.8154205083847046, 0.9902285933494568, 1.165036678314209, 1.339844822883606, 1.514652967453003, 1.6894609928131104, 1.8642691373825073, 2.0390772819519043, 2.2138853073120117, 2.3886935710906982, 2.5635015964508057, 2.738309860229492, 2.9131178855895996, 3.087925910949707, 3.2627339363098145, 3.437542200088501, 3.6123502254486084, 3.787158489227295, 3.9619665145874023, 4.13677453994751, 4.311582565307617, 4.486391067504883, 4.66119909286499, 4.836007118225098]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 6.0, 7.0, 7.0, 7.0, 9.0, 14.0, 12.0, 24.0, 21.0, 19.0, 25.0, 36.0, 34.0, 29.0, 42.0, 59.0, 128.0, 122.0, 63.0, 51.0, 39.0, 33.0, 27.0, 37.0, 19.0, 23.0, 14.0, 19.0, 11.0, 16.0, 10.0, 10.0, 3.0, 1.0, 6.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.698139190673828, -2.616666555404663, -2.535193920135498, -2.453721046447754, -2.372248411178589, -2.290775775909424, -2.2093029022216797, -2.1278302669525146, -2.0463576316833496, -1.9648849964141846, -1.88341224193573, -1.8019394874572754, -1.7204668521881104, -1.6389942169189453, -1.5575214624404907, -1.4760487079620361, -1.394576072692871, -1.313103437423706, -1.2316306829452515, -1.1501579284667969, -1.0686852931976318, -0.987212598323822, -0.9057399034500122, -0.8242672085762024, -0.7427945137023926, -0.6613218188285828, -0.579849123954773, -0.49837642908096313, -0.4169037342071533, -0.3354310393333435, -0.2539583444595337, -0.17248564958572388, -0.09101319313049316, -0.00954049825668335, 0.07193219661712646, 0.15340489149093628, 0.2348775863647461, 0.3163502812385559, 0.3978229761123657, 0.47929567098617554, 0.5607683658599854, 0.6422410607337952, 0.723713755607605, 0.8051864504814148, 0.8866591453552246, 0.9681318402290344, 1.0496045351028442, 1.1310772895812988, 1.2125499248504639, 1.294022560119629, 1.3754953145980835, 1.456968069076538, 1.5384407043457031, 1.6199133396148682, 1.7013860940933228, 1.7828588485717773, 1.8643314838409424, 1.9458041191101074, 2.0272769927978516, 2.1087496280670166, 2.1902222633361816, 2.2716948986053467, 2.3531675338745117, 2.434640407562256, 2.516113042831421]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 11.0, 2.0, 6.0, 10.0, 10.0, 10.0, 17.0, 19.0, 16.0, 41.0, 56.0, 85.0, 107.0, 158.0, 230.0, 304.0, 494.0, 1527.0, 13528.0, 4046217.0, 125999.0, 3416.0, 768.0, 312.0, 241.0, 169.0, 127.0, 95.0, 74.0, 69.0, 28.0, 33.0, 19.0, 20.0, 22.0, 14.0, 6.0, 2.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.82080078125, -0.799041748046875, -0.77728271484375, -0.755523681640625, -0.7337646484375, -0.712005615234375, -0.69024658203125, -0.668487548828125, -0.646728515625, -0.624969482421875, -0.60321044921875, -0.581451416015625, -0.5596923828125, -0.537933349609375, -0.51617431640625, -0.494415283203125, -0.47265625, -0.450897216796875, -0.42913818359375, -0.407379150390625, -0.3856201171875, -0.363861083984375, -0.34210205078125, -0.320343017578125, -0.298583984375, -0.276824951171875, -0.25506591796875, -0.233306884765625, -0.2115478515625, -0.189788818359375, -0.16802978515625, -0.146270751953125, -0.12451171875, -0.102752685546875, -0.08099365234375, -0.059234619140625, -0.0374755859375, -0.015716552734375, 0.00604248046875, 0.027801513671875, 0.049560546875, 0.071319580078125, 0.09307861328125, 0.114837646484375, 0.1365966796875, 0.158355712890625, 0.18011474609375, 0.201873779296875, 0.2236328125, 0.245391845703125, 0.26715087890625, 0.288909912109375, 0.3106689453125, 0.332427978515625, 0.35418701171875, 0.375946044921875, 0.397705078125, 0.419464111328125, 0.44122314453125, 0.462982177734375, 0.4847412109375, 0.506500244140625, 0.52825927734375, 0.550018310546875, 0.57177734375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 13.0, 20.0, 21.0, 26.0, 40.0, 47.0, 55.0, 58.0, 67.0, 62.0, 75.0, 75.0, 81.0, 62.0, 64.0, 55.0, 29.0, 31.0, 27.0, 24.0, 13.0, 9.0, 10.0, 7.0, 9.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1522216796875, -0.14770126342773438, -0.14318084716796875, -0.13866043090820312, -0.1341400146484375, -0.12961959838867188, -0.12509918212890625, -0.12057876586914062, -0.116058349609375, -0.11153793334960938, -0.10701751708984375, -0.10249710083007812, -0.0979766845703125, -0.09345626831054688, -0.08893585205078125, -0.08441543579101562, -0.07989501953125, -0.07537460327148438, -0.07085418701171875, -0.06633377075195312, -0.0618133544921875, -0.057292938232421875, -0.05277252197265625, -0.048252105712890625, -0.043731689453125, -0.039211273193359375, -0.03469085693359375, -0.030170440673828125, -0.0256500244140625, -0.021129608154296875, -0.01660919189453125, -0.012088775634765625, -0.007568359375, -0.003047943115234375, 0.00147247314453125, 0.005992889404296875, 0.0105133056640625, 0.015033721923828125, 0.01955413818359375, 0.024074554443359375, 0.028594970703125, 0.033115386962890625, 0.03763580322265625, 0.042156219482421875, 0.0466766357421875, 0.051197052001953125, 0.05571746826171875, 0.060237884521484375, 0.06475830078125, 0.06927871704101562, 0.07379913330078125, 0.07831954956054688, 0.0828399658203125, 0.08736038208007812, 0.09188079833984375, 0.09640121459960938, 0.100921630859375, 0.10544204711914062, 0.10996246337890625, 0.11448287963867188, 0.1190032958984375, 0.12352371215820312, 0.12804412841796875, 0.13256454467773438, 0.1370849609375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 15.0, 34.0, 58.0, 111.0, 200.0, 368.0, 874.0, 2081.0, 9172.0, 386766.0, 3771239.0, 17831.0, 3188.0, 1158.0, 566.0, 279.0, 146.0, 75.0, 50.0, 19.0, 12.0, 9.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5791015625, -0.55694580078125, -0.5347900390625, -0.51263427734375, -0.490478515625, -0.46832275390625, -0.4461669921875, -0.42401123046875, -0.40185546875, -0.37969970703125, -0.3575439453125, -0.33538818359375, -0.313232421875, -0.29107666015625, -0.2689208984375, -0.24676513671875, -0.224609375, -0.20245361328125, -0.1802978515625, -0.15814208984375, -0.135986328125, -0.11383056640625, -0.0916748046875, -0.06951904296875, -0.04736328125, -0.02520751953125, -0.0030517578125, 0.01910400390625, 0.041259765625, 0.06341552734375, 0.0855712890625, 0.10772705078125, 0.1298828125, 0.15203857421875, 0.1741943359375, 0.19635009765625, 0.218505859375, 0.24066162109375, 0.2628173828125, 0.28497314453125, 0.30712890625, 0.32928466796875, 0.3514404296875, 0.37359619140625, 0.395751953125, 0.41790771484375, 0.4400634765625, 0.46221923828125, 0.484375, 0.50653076171875, 0.5286865234375, 0.55084228515625, 0.572998046875, 0.59515380859375, 0.6173095703125, 0.63946533203125, 0.66162109375, 0.68377685546875, 0.7059326171875, 0.72808837890625, 0.750244140625, 0.77239990234375, 0.7945556640625, 0.81671142578125, 0.8388671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 5.0, 5.0, 12.0, 16.0, 20.0, 22.0, 62.0, 108.0, 224.0, 697.0, 1515.0, 837.0, 260.0, 111.0, 61.0, 36.0, 20.0, 16.0, 6.0, 5.0, 9.0, 7.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.240234375, -0.2265777587890625, -0.212921142578125, -0.1992645263671875, -0.18560791015625, -0.1719512939453125, -0.158294677734375, -0.1446380615234375, -0.1309814453125, -0.1173248291015625, -0.103668212890625, -0.0900115966796875, -0.07635498046875, -0.0626983642578125, -0.049041748046875, -0.0353851318359375, -0.021728515625, -0.0080718994140625, 0.005584716796875, 0.0192413330078125, 0.03289794921875, 0.0465545654296875, 0.060211181640625, 0.0738677978515625, 0.0875244140625, 0.1011810302734375, 0.114837646484375, 0.1284942626953125, 0.14215087890625, 0.1558074951171875, 0.169464111328125, 0.1831207275390625, 0.19677734375, 0.2104339599609375, 0.224090576171875, 0.2377471923828125, 0.25140380859375, 0.2650604248046875, 0.278717041015625, 0.2923736572265625, 0.3060302734375, 0.3196868896484375, 0.333343505859375, 0.3470001220703125, 0.36065673828125, 0.3743133544921875, 0.387969970703125, 0.4016265869140625, 0.415283203125, 0.4289398193359375, 0.442596435546875, 0.4562530517578125, 0.46990966796875, 0.4835662841796875, 0.497222900390625, 0.5108795166015625, 0.5245361328125, 0.5381927490234375, 0.551849365234375, 0.5655059814453125, 0.57916259765625, 0.5928192138671875, 0.606475830078125, 0.6201324462890625, 0.6337890625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 11.0, 39.0, 87.0, 242.0, 312.0, 154.0, 66.0, 44.0, 14.0, 10.0, 10.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.582521915435791, -7.418257236480713, -7.253992557525635, -7.089727401733398, -6.92546272277832, -6.761198043823242, -6.596933364868164, -6.432668685913086, -6.268404006958008, -6.10413932800293, -5.939874649047852, -5.775609493255615, -5.611344814300537, -5.447080135345459, -5.282815456390381, -5.118550777435303, -4.954285621643066, -4.790020942687988, -4.62575626373291, -4.461491107940674, -4.297226428985596, -4.132961750030518, -3.9686970710754395, -3.8044323921203613, -3.640167474746704, -3.475902795791626, -3.3116378784179688, -3.1473731994628906, -2.9831085205078125, -2.8188436031341553, -2.654578924179077, -2.49031400680542, -2.3260498046875, -2.161785125732422, -1.9975202083587646, -1.8332555294036865, -1.6689907312393188, -1.5047259330749512, -1.340461254119873, -1.1761964559555054, -1.0119316577911377, -0.84766685962677, -0.6834021210670471, -0.5191373825073242, -0.35487258434295654, -0.19060778617858887, -0.026343047618865967, 0.13792169094085693, 0.3021864891052246, 0.4664512574672699, 0.6307160258293152, 0.7949807643890381, 0.9592455625534058, 1.1235103607177734, 1.2877750396728516, 1.4520398378372192, 1.616304636001587, 1.7805694341659546, 1.9448342323303223, 2.1090989112854004, 2.2733635902404785, 2.4376285076141357, 2.601893186569214, 2.766158103942871, 2.930422782897949]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 15.0, 9.0, 23.0, 26.0, 37.0, 44.0, 42.0, 48.0, 59.0, 67.0, 72.0, 100.0, 92.0, 83.0, 57.0, 56.0, 34.0, 41.0, 29.0, 22.0, 16.0, 6.0, 4.0, 2.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5968148708343506, -3.4969451427459717, -3.3970754146575928, -3.297205924987793, -3.197336196899414, -3.097466468811035, -2.9975967407226562, -2.8977270126342773, -2.7978575229644775, -2.6979877948760986, -2.5981180667877197, -2.49824857711792, -2.398378849029541, -2.298509120941162, -2.198639392852783, -2.0987696647644043, -1.998900055885315, -1.899030327796936, -1.7991607189178467, -1.6992909908294678, -1.5994213819503784, -1.4995516538619995, -1.3996820449829102, -1.2998123168945312, -1.1999425888061523, -1.1000728607177734, -1.000203251838684, -0.9003335237503052, -0.8004639148712158, -0.7005941867828369, -0.6007245182991028, -0.5008548498153687, -0.4009852409362793, -0.30111557245254517, -0.20124588906764984, -0.10137620568275452, -0.0015065371990203857, 0.09836313128471375, 0.19823282957077026, 0.2981024980545044, 0.3979721665382385, 0.49784183502197266, 0.5977115035057068, 0.6975811719894409, 0.7974509000778198, 0.8973205089569092, 0.9971902370452881, 1.097059965133667, 1.1969295740127563, 1.2967993021011353, 1.3966689109802246, 1.4965386390686035, 1.5964082479476929, 1.6962779760360718, 1.7961475849151611, 1.89601731300354, 1.995887041091919, 2.095756769180298, 2.1956264972686768, 2.2954959869384766, 2.3953657150268555, 2.4952354431152344, 2.5951051712036133, 2.694974899291992, 2.794844388961792]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 12.0, 10.0, 14.0, 27.0, 42.0, 52.0, 86.0, 146.0, 234.0, 351.0, 586.0, 1118.0, 2124.0, 4725.0, 11698.0, 35869.0, 168085.0, 635895.0, 136740.0, 31446.0, 10491.0, 4311.0, 1982.0, 1004.0, 599.0, 342.0, 190.0, 111.0, 93.0, 50.0, 40.0, 20.0, 15.0, 9.0, 7.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42578125, -0.4108123779296875, -0.395843505859375, -0.3808746337890625, -0.36590576171875, -0.3509368896484375, -0.335968017578125, -0.3209991455078125, -0.3060302734375, -0.2910614013671875, -0.276092529296875, -0.2611236572265625, -0.24615478515625, -0.2311859130859375, -0.216217041015625, -0.2012481689453125, -0.186279296875, -0.1713104248046875, -0.156341552734375, -0.1413726806640625, -0.12640380859375, -0.1114349365234375, -0.096466064453125, -0.0814971923828125, -0.0665283203125, -0.0515594482421875, -0.036590576171875, -0.0216217041015625, -0.00665283203125, 0.0083160400390625, 0.023284912109375, 0.0382537841796875, 0.05322265625, 0.0681915283203125, 0.083160400390625, 0.0981292724609375, 0.11309814453125, 0.1280670166015625, 0.143035888671875, 0.1580047607421875, 0.1729736328125, 0.1879425048828125, 0.202911376953125, 0.2178802490234375, 0.23284912109375, 0.2478179931640625, 0.262786865234375, 0.2777557373046875, 0.292724609375, 0.3076934814453125, 0.322662353515625, 0.3376312255859375, 0.35260009765625, 0.3675689697265625, 0.382537841796875, 0.3975067138671875, 0.4124755859375, 0.4274444580078125, 0.442413330078125, 0.4573822021484375, 0.47235107421875, 0.4873199462890625, 0.502288818359375, 0.5172576904296875, 0.5322265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 4.0, 7.0, 15.0, 17.0, 17.0, 30.0, 28.0, 28.0, 26.0, 48.0, 44.0, 37.0, 44.0, 53.0, 57.0, 62.0, 49.0, 53.0, 58.0, 47.0, 40.0, 41.0, 26.0, 32.0, 27.0, 17.0, 14.0, 15.0, 12.0, 7.0, 7.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1590576171875, -0.1545085906982422, -0.14995956420898438, -0.14541053771972656, -0.14086151123046875, -0.13631248474121094, -0.13176345825195312, -0.1272144317626953, -0.1226654052734375, -0.11811637878417969, -0.11356735229492188, -0.10901832580566406, -0.10446929931640625, -0.09992027282714844, -0.09537124633789062, -0.09082221984863281, -0.086273193359375, -0.08172416687011719, -0.07717514038085938, -0.07262611389160156, -0.06807708740234375, -0.06352806091308594, -0.058979034423828125, -0.05443000793457031, -0.0498809814453125, -0.04533195495605469, -0.040782928466796875, -0.03623390197753906, -0.03168487548828125, -0.027135848999023438, -0.022586822509765625, -0.018037796020507812, -0.01348876953125, -0.008939743041992188, -0.004390716552734375, 0.0001583099365234375, 0.00470733642578125, 0.009256362915039062, 0.013805389404296875, 0.018354415893554688, 0.0229034423828125, 0.027452468872070312, 0.032001495361328125, 0.03655052185058594, 0.04109954833984375, 0.04564857482910156, 0.050197601318359375, 0.05474662780761719, 0.059295654296875, 0.06384468078613281, 0.06839370727539062, 0.07294273376464844, 0.07749176025390625, 0.08204078674316406, 0.08658981323242188, 0.09113883972167969, 0.0956878662109375, 0.10023689270019531, 0.10478591918945312, 0.10933494567871094, 0.11388397216796875, 0.11843299865722656, 0.12298202514648438, 0.1275310516357422, 0.132080078125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 5.0, 5.0, 7.0, 11.0, 14.0, 23.0, 29.0, 33.0, 44.0, 53.0, 87.0, 115.0, 175.0, 261.0, 361.0, 696.0, 1512.0, 4018.0, 13392.0, 66204.0, 756699.0, 168406.0, 25297.0, 6475.0, 2235.0, 943.0, 505.0, 261.0, 174.0, 133.0, 101.0, 81.0, 57.0, 41.0, 29.0, 19.0, 17.0, 9.0, 7.0, 7.0, 11.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49365234375, -0.4785652160644531, -0.46347808837890625, -0.4483909606933594, -0.4333038330078125, -0.4182167053222656, -0.40312957763671875, -0.3880424499511719, -0.372955322265625, -0.3578681945800781, -0.34278106689453125, -0.3276939392089844, -0.3126068115234375, -0.2975196838378906, -0.28243255615234375, -0.2673454284667969, -0.25225830078125, -0.23717117309570312, -0.22208404541015625, -0.20699691772460938, -0.1919097900390625, -0.17682266235351562, -0.16173553466796875, -0.14664840698242188, -0.131561279296875, -0.11647415161132812, -0.10138702392578125, -0.08629989624023438, -0.0712127685546875, -0.056125640869140625, -0.04103851318359375, -0.025951385498046875, -0.0108642578125, 0.004222869873046875, 0.01930999755859375, 0.034397125244140625, 0.0494842529296875, 0.06457138061523438, 0.07965850830078125, 0.09474563598632812, 0.109832763671875, 0.12491989135742188, 0.14000701904296875, 0.15509414672851562, 0.1701812744140625, 0.18526840209960938, 0.20035552978515625, 0.21544265747070312, 0.23052978515625, 0.24561691284179688, 0.26070404052734375, 0.2757911682128906, 0.2908782958984375, 0.3059654235839844, 0.32105255126953125, 0.3361396789550781, 0.351226806640625, 0.3663139343261719, 0.38140106201171875, 0.3964881896972656, 0.4115753173828125, 0.4266624450683594, 0.44174957275390625, 0.4568367004394531, 0.471923828125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 11.0, 12.0, 11.0, 19.0, 21.0, 16.0, 26.0, 28.0, 44.0, 48.0, 49.0, 63.0, 66.0, 60.0, 70.0, 52.0, 66.0, 51.0, 42.0, 49.0, 35.0, 24.0, 26.0, 19.0, 19.0, 11.0, 11.0, 11.0, 8.0, 7.0, 4.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6416015625, -0.6211090087890625, -0.600616455078125, -0.5801239013671875, -0.55963134765625, -0.5391387939453125, -0.518646240234375, -0.4981536865234375, -0.4776611328125, -0.4571685791015625, -0.436676025390625, -0.4161834716796875, -0.39569091796875, -0.3751983642578125, -0.354705810546875, -0.3342132568359375, -0.313720703125, -0.2932281494140625, -0.272735595703125, -0.2522430419921875, -0.23175048828125, -0.2112579345703125, -0.190765380859375, -0.1702728271484375, -0.1497802734375, -0.1292877197265625, -0.108795166015625, -0.0883026123046875, -0.06781005859375, -0.0473175048828125, -0.026824951171875, -0.0063323974609375, 0.01416015625, 0.0346527099609375, 0.055145263671875, 0.0756378173828125, 0.09613037109375, 0.1166229248046875, 0.137115478515625, 0.1576080322265625, 0.1781005859375, 0.1985931396484375, 0.219085693359375, 0.2395782470703125, 0.26007080078125, 0.2805633544921875, 0.301055908203125, 0.3215484619140625, 0.342041015625, 0.3625335693359375, 0.383026123046875, 0.4035186767578125, 0.42401123046875, 0.4445037841796875, 0.464996337890625, 0.4854888916015625, 0.5059814453125, 0.5264739990234375, 0.546966552734375, 0.5674591064453125, 0.58795166015625, 0.6084442138671875, 0.628936767578125, 0.6494293212890625, 0.669921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 14.0, 24.0, 31.0, 82.0, 187.0, 351.0, 1042.0, 4498.0, 92872.0, 936436.0, 10376.0, 1677.0, 528.0, 199.0, 99.0, 59.0, 21.0, 11.0, 13.0, 6.0, 6.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.330810546875, -0.3202056884765625, -0.309600830078125, -0.2989959716796875, -0.28839111328125, -0.2777862548828125, -0.267181396484375, -0.2565765380859375, -0.2459716796875, -0.2353668212890625, -0.224761962890625, -0.2141571044921875, -0.20355224609375, -0.1929473876953125, -0.182342529296875, -0.1717376708984375, -0.1611328125, -0.1505279541015625, -0.139923095703125, -0.1293182373046875, -0.11871337890625, -0.1081085205078125, -0.097503662109375, -0.0868988037109375, -0.0762939453125, -0.0656890869140625, -0.055084228515625, -0.0444793701171875, -0.03387451171875, -0.0232696533203125, -0.012664794921875, -0.0020599365234375, 0.008544921875, 0.0191497802734375, 0.029754638671875, 0.0403594970703125, 0.05096435546875, 0.0615692138671875, 0.072174072265625, 0.0827789306640625, 0.0933837890625, 0.1039886474609375, 0.114593505859375, 0.1251983642578125, 0.13580322265625, 0.1464080810546875, 0.157012939453125, 0.1676177978515625, 0.17822265625, 0.1888275146484375, 0.199432373046875, 0.2100372314453125, 0.22064208984375, 0.2312469482421875, 0.241851806640625, 0.2524566650390625, 0.2630615234375, 0.2736663818359375, 0.284271240234375, 0.2948760986328125, 0.30548095703125, 0.3160858154296875, 0.326690673828125, 0.3372955322265625, 0.347900390625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 6.0, 11.0, 13.0, 14.0, 23.0, 30.0, 53.0, 57.0, 94.0, 157.0, 195.0, 107.0, 77.0, 46.0, 28.0, 24.0, 13.0, 15.0, 5.0, 5.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002334117889404297, -0.00022617727518081665, -0.0002189427614212036, -0.00021170824766159058, -0.00020447373390197754, -0.0001972392201423645, -0.00019000470638275146, -0.00018277019262313843, -0.0001755356788635254, -0.00016830116510391235, -0.00016106665134429932, -0.00015383213758468628, -0.00014659762382507324, -0.0001393631100654602, -0.00013212859630584717, -0.00012489408254623413, -0.0001176595687866211, -0.00011042505502700806, -0.00010319054126739502, -9.595602750778198e-05, -8.872151374816895e-05, -8.148699998855591e-05, -7.425248622894287e-05, -6.701797246932983e-05, -5.97834587097168e-05, -5.254894495010376e-05, -4.531443119049072e-05, -3.8079917430877686e-05, -3.084540367126465e-05, -2.361088991165161e-05, -1.6376376152038574e-05, -9.141862392425537e-06, -1.9073486328125e-06, 5.327165126800537e-06, 1.2561678886413574e-05, 1.979619264602661e-05, 2.703070640563965e-05, 3.4265220165252686e-05, 4.149973392486572e-05, 4.873424768447876e-05, 5.59687614440918e-05, 6.320327520370483e-05, 7.043778896331787e-05, 7.767230272293091e-05, 8.490681648254395e-05, 9.214133024215698e-05, 9.937584400177002e-05, 0.00010661035776138306, 0.0001138448715209961, 0.00012107938528060913, 0.00012831389904022217, 0.0001355484127998352, 0.00014278292655944824, 0.00015001744031906128, 0.00015725195407867432, 0.00016448646783828735, 0.0001717209815979004, 0.00017895549535751343, 0.00018619000911712646, 0.0001934245228767395, 0.00020065903663635254, 0.00020789355039596558, 0.0002151280641555786, 0.00022236257791519165, 0.0002295970916748047]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 5.0, 11.0, 14.0, 13.0, 28.0, 47.0, 95.0, 162.0, 397.0, 1348.0, 10519.0, 1016454.0, 16977.0, 1579.0, 448.0, 213.0, 97.0, 48.0, 33.0, 13.0, 18.0, 10.0, 3.0, 6.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5771484375, -0.5604515075683594, -0.5437545776367188, -0.5270576477050781, -0.5103607177734375, -0.4936637878417969, -0.47696685791015625, -0.4602699279785156, -0.443572998046875, -0.4268760681152344, -0.41017913818359375, -0.3934822082519531, -0.3767852783203125, -0.3600883483886719, -0.34339141845703125, -0.3266944885253906, -0.30999755859375, -0.2933006286621094, -0.27660369873046875, -0.2599067687988281, -0.2432098388671875, -0.22651290893554688, -0.20981597900390625, -0.19311904907226562, -0.176422119140625, -0.15972518920898438, -0.14302825927734375, -0.12633132934570312, -0.1096343994140625, -0.09293746948242188, -0.07624053955078125, -0.059543609619140625, -0.0428466796875, -0.026149749755859375, -0.00945281982421875, 0.007244110107421875, 0.0239410400390625, 0.040637969970703125, 0.05733489990234375, 0.07403182983398438, 0.090728759765625, 0.10742568969726562, 0.12412261962890625, 0.14081954956054688, 0.1575164794921875, 0.17421340942382812, 0.19091033935546875, 0.20760726928710938, 0.22430419921875, 0.24100112915039062, 0.25769805908203125, 0.2743949890136719, 0.2910919189453125, 0.3077888488769531, 0.32448577880859375, 0.3411827087402344, 0.357879638671875, 0.3745765686035156, 0.39127349853515625, 0.4079704284667969, 0.4246673583984375, 0.4413642883300781, 0.45806121826171875, 0.4747581481933594, 0.491455078125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 8.0, 8.0, 35.0, 61.0, 168.0, 387.0, 205.0, 66.0, 24.0, 21.0, 4.0, 7.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64208984375, -0.6250076293945312, -0.6079254150390625, -0.5908432006835938, -0.573760986328125, -0.5566787719726562, -0.5395965576171875, -0.5225143432617188, -0.50543212890625, -0.48834991455078125, -0.4712677001953125, -0.45418548583984375, -0.437103271484375, -0.42002105712890625, -0.4029388427734375, -0.38585662841796875, -0.3687744140625, -0.35169219970703125, -0.3346099853515625, -0.31752777099609375, -0.300445556640625, -0.28336334228515625, -0.2662811279296875, -0.24919891357421875, -0.23211669921875, -0.21503448486328125, -0.1979522705078125, -0.18087005615234375, -0.163787841796875, -0.14670562744140625, -0.1296234130859375, -0.11254119873046875, -0.095458984375, -0.07837677001953125, -0.0612945556640625, -0.04421234130859375, -0.027130126953125, -0.01004791259765625, 0.0070343017578125, 0.02411651611328125, 0.04119873046875, 0.05828094482421875, 0.0753631591796875, 0.09244537353515625, 0.109527587890625, 0.12660980224609375, 0.1436920166015625, 0.16077423095703125, 0.1778564453125, 0.19493865966796875, 0.2120208740234375, 0.22910308837890625, 0.246185302734375, 0.26326751708984375, 0.2803497314453125, 0.29743194580078125, 0.31451416015625, 0.33159637451171875, 0.3486785888671875, 0.36576080322265625, 0.382843017578125, 0.39992523193359375, 0.4170074462890625, 0.43408966064453125, 0.451171875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 10.0, 371.0, 567.0, 44.0, 13.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-31.435022354125977, -30.853286743164062, -30.27155113220215, -29.689815521240234, -29.108081817626953, -28.52634620666504, -27.944610595703125, -27.36287498474121, -26.781139373779297, -26.199403762817383, -25.61766815185547, -25.035932540893555, -24.45419692993164, -23.87246322631836, -23.290727615356445, -22.70899200439453, -22.127256393432617, -21.545520782470703, -20.96378517150879, -20.382049560546875, -19.800315856933594, -19.21858024597168, -18.636844635009766, -18.05510902404785, -17.473373413085938, -16.891637802124023, -16.30990219116211, -15.728167533874512, -15.146431922912598, -14.564696311950684, -13.982961654663086, -13.401226043701172, -12.819488525390625, -12.237752914428711, -11.656017303466797, -11.0742826461792, -10.492547035217285, -9.910811424255371, -9.329076766967773, -8.74734115600586, -8.165605545043945, -7.583869934082031, -7.002134799957275, -6.4203996658325195, -5.8386640548706055, -5.256928443908691, -4.6751933097839355, -4.09345817565918, -3.5117225646972656, -2.9299871921539307, -2.3482518196105957, -1.7665164470672607, -1.1847810745239258, -0.6030457019805908, -0.02131032943725586, 0.5604248046875, 1.142160415649414, 1.723895788192749, 2.305631160736084, 2.887366533279419, 3.469101905822754, 4.050837516784668, 4.632572650909424, 5.21430778503418, 5.796043395996094]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 11.0, 11.0, 22.0, 29.0, 36.0, 36.0, 53.0, 34.0, 107.0, 132.0, 115.0, 123.0, 61.0, 60.0, 45.0, 30.0, 25.0, 18.0, 15.0, 10.0, 13.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7437186241149902, -3.5891010761260986, -3.434483528137207, -3.2798657417297363, -3.1252481937408447, -2.970630645751953, -2.8160128593444824, -2.661395311355591, -2.506777763366699, -2.3521602153778076, -2.197542667388916, -2.0429248809814453, -1.8883073329925537, -1.733689785003662, -1.579072117805481, -1.4244544506072998, -1.2698369026184082, -1.1152193546295166, -0.9606016874313354, -0.8059840798377991, -0.6513664722442627, -0.4967488646507263, -0.34213125705718994, -0.1875135898590088, -0.03289604187011719, 0.12172156572341919, 0.27633917331695557, 0.43095678091049194, 0.5855743885040283, 0.7401919960975647, 0.8948096036911011, 1.0494272708892822, 1.204045295715332, 1.3586628437042236, 1.5132805109024048, 1.667898178100586, 1.8225157260894775, 1.9771332740783691, 2.13175106048584, 2.2863686084747314, 2.440986156463623, 2.5956037044525146, 2.7502212524414062, 2.904839038848877, 3.0594565868377686, 3.21407413482666, 3.368691921234131, 3.5233094692230225, 3.677927017211914, 3.8325445652008057, 3.9871621131896973, 4.141779899597168, 4.2963972091674805, 4.451014995574951, 4.605632781982422, 4.760250091552734, 4.914867877960205, 5.069485664367676, 5.224102973937988, 5.378720760345459, 5.53333854675293, 5.687955856323242, 5.842573642730713, 5.997191429138184, 6.151808738708496]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 8.0, 11.0, 13.0, 18.0, 14.0, 31.0, 49.0, 80.0, 83.0, 120.0, 183.0, 265.0, 444.0, 748.0, 1257.0, 2416.0, 5437.0, 15370.0, 52692.0, 270411.0, 1497725.0, 1857064.0, 384364.0, 72675.0, 19646.0, 6722.0, 2814.0, 1387.0, 773.0, 494.0, 286.0, 203.0, 122.0, 98.0, 69.0, 58.0, 34.0, 30.0, 21.0, 12.0, 8.0, 4.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.1654052734375, -0.16008567810058594, -0.15476608276367188, -0.1494464874267578, -0.14412689208984375, -0.1388072967529297, -0.13348770141601562, -0.12816810607910156, -0.1228485107421875, -0.11752891540527344, -0.11220932006835938, -0.10688972473144531, -0.10157012939453125, -0.09625053405761719, -0.09093093872070312, -0.08561134338378906, -0.080291748046875, -0.07497215270996094, -0.06965255737304688, -0.06433296203613281, -0.05901336669921875, -0.05369377136230469, -0.048374176025390625, -0.04305458068847656, -0.0377349853515625, -0.03241539001464844, -0.027095794677734375, -0.021776199340820312, -0.01645660400390625, -0.011137008666992188, -0.005817413330078125, -0.0004978179931640625, 0.00482177734375, 0.010141372680664062, 0.015460968017578125, 0.020780563354492188, 0.02610015869140625, 0.03141975402832031, 0.036739349365234375, 0.04205894470214844, 0.0473785400390625, 0.05269813537597656, 0.058017730712890625, 0.06333732604980469, 0.06865692138671875, 0.07397651672363281, 0.07929611206054688, 0.08461570739746094, 0.089935302734375, 0.09525489807128906, 0.10057449340820312, 0.10589408874511719, 0.11121368408203125, 0.11653327941894531, 0.12185287475585938, 0.12717247009277344, 0.1324920654296875, 0.13781166076660156, 0.14313125610351562, 0.1484508514404297, 0.15377044677734375, 0.1590900421142578, 0.16440963745117188, 0.16972923278808594, 0.175048828125]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 11.0, 7.0, 10.0, 7.0, 17.0, 15.0, 19.0, 25.0, 27.0, 29.0, 49.0, 39.0, 55.0, 59.0, 53.0, 73.0, 71.0, 42.0, 63.0, 65.0, 47.0, 42.0, 42.0, 26.0, 20.0, 16.0, 18.0, 12.0, 14.0, 8.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.18310546875, -0.17754554748535156, -0.17198562622070312, -0.1664257049560547, -0.16086578369140625, -0.1553058624267578, -0.14974594116210938, -0.14418601989746094, -0.1386260986328125, -0.13306617736816406, -0.12750625610351562, -0.12194633483886719, -0.11638641357421875, -0.11082649230957031, -0.10526657104492188, -0.09970664978027344, -0.094146728515625, -0.08858680725097656, -0.08302688598632812, -0.07746696472167969, -0.07190704345703125, -0.06634712219238281, -0.060787200927734375, -0.05522727966308594, -0.0496673583984375, -0.04410743713378906, -0.038547515869140625, -0.03298759460449219, -0.02742767333984375, -0.021867752075195312, -0.016307830810546875, -0.010747909545898438, -0.00518798828125, 0.0003719329833984375, 0.005931854248046875, 0.011491775512695312, 0.01705169677734375, 0.022611618041992188, 0.028171539306640625, 0.03373146057128906, 0.0392913818359375, 0.04485130310058594, 0.050411224365234375, 0.05597114562988281, 0.06153106689453125, 0.06709098815917969, 0.07265090942382812, 0.07821083068847656, 0.083770751953125, 0.08933067321777344, 0.09489059448242188, 0.10045051574707031, 0.10601043701171875, 0.11157035827636719, 0.11713027954101562, 0.12269020080566406, 0.1282501220703125, 0.13381004333496094, 0.13936996459960938, 0.1449298858642578, 0.15048980712890625, 0.1560497283935547, 0.16160964965820312, 0.16716957092285156, 0.1727294921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 16.0, 28.0, 62.0, 106.0, 356.0, 1295.0, 49371.0, 4138407.0, 3557.0, 709.0, 205.0, 80.0, 41.0, 23.0, 7.0, 8.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9697265625, -1.913787841796875, -1.85784912109375, -1.801910400390625, -1.7459716796875, -1.690032958984375, -1.63409423828125, -1.578155517578125, -1.522216796875, -1.466278076171875, -1.41033935546875, -1.354400634765625, -1.2984619140625, -1.242523193359375, -1.18658447265625, -1.130645751953125, -1.07470703125, -1.018768310546875, -0.96282958984375, -0.906890869140625, -0.8509521484375, -0.795013427734375, -0.73907470703125, -0.683135986328125, -0.627197265625, -0.571258544921875, -0.51531982421875, -0.459381103515625, -0.4034423828125, -0.347503662109375, -0.29156494140625, -0.235626220703125, -0.1796875, -0.123748779296875, -0.06781005859375, -0.011871337890625, 0.0440673828125, 0.100006103515625, 0.15594482421875, 0.211883544921875, 0.267822265625, 0.323760986328125, 0.37969970703125, 0.435638427734375, 0.4915771484375, 0.547515869140625, 0.60345458984375, 0.659393310546875, 0.71533203125, 0.771270751953125, 0.82720947265625, 0.883148193359375, 0.9390869140625, 0.995025634765625, 1.05096435546875, 1.106903076171875, 1.162841796875, 1.218780517578125, 1.27471923828125, 1.330657958984375, 1.3865966796875, 1.442535400390625, 1.49847412109375, 1.554412841796875, 1.6103515625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 10.0, 25.0, 35.0, 104.0, 297.0, 942.0, 1667.0, 641.0, 195.0, 82.0, 33.0, 15.0, 13.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.499267578125, -0.4667930603027344, -0.43431854248046875, -0.4018440246582031, -0.3693695068359375, -0.3368949890136719, -0.30442047119140625, -0.2719459533691406, -0.239471435546875, -0.20699691772460938, -0.17452239990234375, -0.14204788208007812, -0.1095733642578125, -0.07709884643554688, -0.04462432861328125, -0.012149810791015625, 0.02032470703125, 0.052799224853515625, 0.08527374267578125, 0.11774826049804688, 0.1502227783203125, 0.18269729614257812, 0.21517181396484375, 0.24764633178710938, 0.280120849609375, 0.3125953674316406, 0.34506988525390625, 0.3775444030761719, 0.4100189208984375, 0.4424934387207031, 0.47496795654296875, 0.5074424743652344, 0.5399169921875, 0.5723915100097656, 0.6048660278320312, 0.6373405456542969, 0.6698150634765625, 0.7022895812988281, 0.7347640991210938, 0.7672386169433594, 0.799713134765625, 0.8321876525878906, 0.8646621704101562, 0.8971366882324219, 0.9296112060546875, 0.9620857238769531, 0.9945602416992188, 1.0270347595214844, 1.05950927734375, 1.0919837951660156, 1.1244583129882812, 1.1569328308105469, 1.1894073486328125, 1.2218818664550781, 1.2543563842773438, 1.2868309020996094, 1.319305419921875, 1.3517799377441406, 1.3842544555664062, 1.4167289733886719, 1.4492034912109375, 1.4816780090332031, 1.5141525268554688, 1.5466270446777344, 1.5791015625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 11.0, 22.0, 38.0, 89.0, 168.0, 305.0, 192.0, 88.0, 35.0, 12.0, 10.0, 8.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5666961669921875, -3.3871774673461914, -3.2076590061187744, -3.0281405448913574, -2.8486218452453613, -2.6691031455993652, -2.4895846843719482, -2.3100662231445312, -2.130547523498535, -1.9510289430618286, -1.771510362625122, -1.5919917821884155, -1.412473201751709, -1.2329546213150024, -1.053436040878296, -0.8739174604415894, -0.6943988800048828, -0.5148802995681763, -0.3353617191314697, -0.15584313869476318, 0.02367544174194336, 0.2031940221786499, 0.38271260261535645, 0.562231183052063, 0.7417497634887695, 0.9212683439254761, 1.1007869243621826, 1.2803055047988892, 1.4598240852355957, 1.6393426656723022, 1.8188612461090088, 1.9983798265457153, 2.1778979301452637, 2.3574166297912598, 2.5369350910186768, 2.7164535522460938, 2.89597225189209, 3.075490951538086, 3.255009412765503, 3.43452787399292, 3.614046573638916, 3.793565273284912, 3.973083734512329, 4.152602195739746, 4.332120895385742, 4.511639595031738, 4.691158294677734, 4.870676517486572, 5.050195217132568, 5.2297139167785645, 5.409232139587402, 5.588750839233398, 5.7682695388793945, 5.947788238525391, 6.127306938171387, 6.306825160980225, 6.486343860626221, 6.665862560272217, 6.845380783081055, 7.024899482727051, 7.204418182373047, 7.383936882019043, 7.563455581665039, 7.742973804473877, 7.922492504119873]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 8.0, 5.0, 8.0, 12.0, 16.0, 16.0, 27.0, 39.0, 44.0, 51.0, 61.0, 63.0, 92.0, 83.0, 84.0, 83.0, 66.0, 53.0, 49.0, 32.0, 30.0, 18.0, 11.0, 10.0, 4.0, 6.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.638813018798828, -4.514854907989502, -4.390896797180176, -4.26693868637085, -4.142980575561523, -4.0190229415893555, -3.89506459236145, -3.771106481552124, -3.647148609161377, -3.523190498352051, -3.3992323875427246, -3.2752742767333984, -3.1513164043426514, -3.027358293533325, -2.903400182723999, -2.779442071914673, -2.6554839611053467, -2.5315258502960205, -2.4075677394866943, -2.2836098670959473, -2.159651756286621, -2.035693645477295, -1.9117355346679688, -1.7877774238586426, -1.663819432258606, -1.5398613214492798, -1.4159033298492432, -1.291945219039917, -1.1679871082305908, -1.0440291166305542, -0.920071005821228, -0.7961129546165466, -0.6721546649932861, -0.5481966137886047, -0.42423853278160095, -0.30028045177459717, -0.17632240056991577, -0.052364349365234375, 0.0715937614440918, 0.1955518126487732, 0.3195098638534546, 0.443467915058136, 0.5674259662628174, 0.6913840770721436, 0.815342128276825, 0.9393001794815063, 1.0632582902908325, 1.1872162818908691, 1.3111743927001953, 1.4351325035095215, 1.559090495109558, 1.6830486059188843, 1.807006597518921, 1.930964708328247, 2.0549228191375732, 2.1788809299468994, 2.3028388023376465, 2.4267969131469727, 2.550755023956299, 2.674713134765625, 2.798671007156372, 2.9226291179656982, 3.0465872287750244, 3.1705453395843506, 3.2945034503936768]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 4.0, 21.0, 25.0, 37.0, 78.0, 115.0, 197.0, 381.0, 949.0, 2404.0, 9362.0, 62802.0, 845566.0, 108214.0, 13041.0, 3164.0, 1161.0, 477.0, 218.0, 132.0, 74.0, 42.0, 20.0, 18.0, 12.0, 7.0, 6.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.66796875, -0.650665283203125, -0.63336181640625, -0.616058349609375, -0.5987548828125, -0.581451416015625, -0.56414794921875, -0.546844482421875, -0.529541015625, -0.512237548828125, -0.49493408203125, -0.477630615234375, -0.4603271484375, -0.443023681640625, -0.42572021484375, -0.408416748046875, -0.39111328125, -0.373809814453125, -0.35650634765625, -0.339202880859375, -0.3218994140625, -0.304595947265625, -0.28729248046875, -0.269989013671875, -0.252685546875, -0.235382080078125, -0.21807861328125, -0.200775146484375, -0.1834716796875, -0.166168212890625, -0.14886474609375, -0.131561279296875, -0.1142578125, -0.096954345703125, -0.07965087890625, -0.062347412109375, -0.0450439453125, -0.027740478515625, -0.01043701171875, 0.006866455078125, 0.024169921875, 0.041473388671875, 0.05877685546875, 0.076080322265625, 0.0933837890625, 0.110687255859375, 0.12799072265625, 0.145294189453125, 0.16259765625, 0.179901123046875, 0.19720458984375, 0.214508056640625, 0.2318115234375, 0.249114990234375, 0.26641845703125, 0.283721923828125, 0.301025390625, 0.318328857421875, 0.33563232421875, 0.352935791015625, 0.3702392578125, 0.387542724609375, 0.40484619140625, 0.422149658203125, 0.439453125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 6.0, 3.0, 7.0, 7.0, 13.0, 15.0, 32.0, 34.0, 59.0, 58.0, 66.0, 93.0, 106.0, 108.0, 90.0, 85.0, 63.0, 52.0, 31.0, 27.0, 19.0, 9.0, 4.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.433837890625, -0.42322349548339844, -0.4126091003417969, -0.4019947052001953, -0.39138031005859375, -0.3807659149169922, -0.3701515197753906, -0.35953712463378906, -0.3489227294921875, -0.33830833435058594, -0.3276939392089844, -0.3170795440673828, -0.30646514892578125, -0.2958507537841797, -0.2852363586425781, -0.27462196350097656, -0.264007568359375, -0.25339317321777344, -0.24277877807617188, -0.2321643829345703, -0.22154998779296875, -0.2109355926513672, -0.20032119750976562, -0.18970680236816406, -0.1790924072265625, -0.16847801208496094, -0.15786361694335938, -0.1472492218017578, -0.13663482666015625, -0.1260204315185547, -0.11540603637695312, -0.10479164123535156, -0.09417724609375, -0.08356285095214844, -0.07294845581054688, -0.06233406066894531, -0.05171966552734375, -0.04110527038574219, -0.030490875244140625, -0.019876480102539062, -0.0092620849609375, 0.0013523101806640625, 0.011966705322265625, 0.022581100463867188, 0.03319549560546875, 0.04380989074707031, 0.054424285888671875, 0.06503868103027344, 0.075653076171875, 0.08626747131347656, 0.09688186645507812, 0.10749626159667969, 0.11811065673828125, 0.1287250518798828, 0.13933944702148438, 0.14995384216308594, 0.1605682373046875, 0.17118263244628906, 0.18179702758789062, 0.1924114227294922, 0.20302581787109375, 0.2136402130126953, 0.22425460815429688, 0.23486900329589844, 0.2454833984375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 3.0, 5.0, 8.0, 8.0, 7.0, 12.0, 12.0, 28.0, 34.0, 43.0, 58.0, 81.0, 103.0, 190.0, 319.0, 655.0, 1417.0, 4844.0, 28854.0, 883789.0, 112834.0, 10614.0, 2517.0, 901.0, 440.0, 254.0, 159.0, 112.0, 79.0, 48.0, 32.0, 27.0, 20.0, 12.0, 14.0, 8.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52978515625, -0.5140876770019531, -0.49839019775390625, -0.4826927185058594, -0.4669952392578125, -0.4512977600097656, -0.43560028076171875, -0.4199028015136719, -0.404205322265625, -0.3885078430175781, -0.37281036376953125, -0.3571128845214844, -0.3414154052734375, -0.3257179260253906, -0.31002044677734375, -0.2943229675292969, -0.27862548828125, -0.2629280090332031, -0.24723052978515625, -0.23153305053710938, -0.2158355712890625, -0.20013809204101562, -0.18444061279296875, -0.16874313354492188, -0.153045654296875, -0.13734817504882812, -0.12165069580078125, -0.10595321655273438, -0.0902557373046875, -0.07455825805664062, -0.05886077880859375, -0.043163299560546875, -0.0274658203125, -0.011768341064453125, 0.00392913818359375, 0.019626617431640625, 0.0353240966796875, 0.051021575927734375, 0.06671905517578125, 0.08241653442382812, 0.098114013671875, 0.11381149291992188, 0.12950897216796875, 0.14520645141601562, 0.1609039306640625, 0.17660140991210938, 0.19229888916015625, 0.20799636840820312, 0.22369384765625, 0.23939132690429688, 0.25508880615234375, 0.2707862854003906, 0.2864837646484375, 0.3021812438964844, 0.31787872314453125, 0.3335762023925781, 0.349273681640625, 0.3649711608886719, 0.38066864013671875, 0.3963661193847656, 0.4120635986328125, 0.4277610778808594, 0.44345855712890625, 0.4591560363769531, 0.474853515625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 10.0, 6.0, 12.0, 12.0, 18.0, 15.0, 26.0, 37.0, 39.0, 37.0, 62.0, 78.0, 82.0, 89.0, 81.0, 84.0, 53.0, 50.0, 40.0, 31.0, 36.0, 23.0, 24.0, 6.0, 11.0, 8.0, 5.0, 4.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.15234375, -1.1188507080078125, -1.085357666015625, -1.0518646240234375, -1.01837158203125, -0.9848785400390625, -0.951385498046875, -0.9178924560546875, -0.8843994140625, -0.8509063720703125, -0.817413330078125, -0.7839202880859375, -0.75042724609375, -0.7169342041015625, -0.683441162109375, -0.6499481201171875, -0.616455078125, -0.5829620361328125, -0.549468994140625, -0.5159759521484375, -0.48248291015625, -0.4489898681640625, -0.415496826171875, -0.3820037841796875, -0.3485107421875, -0.3150177001953125, -0.281524658203125, -0.2480316162109375, -0.21453857421875, -0.1810455322265625, -0.147552490234375, -0.1140594482421875, -0.08056640625, -0.0470733642578125, -0.013580322265625, 0.0199127197265625, 0.05340576171875, 0.0868988037109375, 0.120391845703125, 0.1538848876953125, 0.1873779296875, 0.2208709716796875, 0.254364013671875, 0.2878570556640625, 0.32135009765625, 0.3548431396484375, 0.388336181640625, 0.4218292236328125, 0.455322265625, 0.4888153076171875, 0.522308349609375, 0.5558013916015625, 0.58929443359375, 0.6227874755859375, 0.656280517578125, 0.6897735595703125, 0.7232666015625, 0.7567596435546875, 0.790252685546875, 0.8237457275390625, 0.85723876953125, 0.8907318115234375, 0.924224853515625, 0.9577178955078125, 0.9912109375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 9.0, 11.0, 2.0, 13.0, 16.0, 25.0, 21.0, 33.0, 41.0, 58.0, 101.0, 188.0, 291.0, 512.0, 1081.0, 2507.0, 7305.0, 63856.0, 945748.0, 18811.0, 4304.0, 1734.0, 807.0, 384.0, 239.0, 142.0, 85.0, 66.0, 45.0, 20.0, 26.0, 14.0, 12.0, 4.0, 6.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.1151123046875, -0.11154651641845703, -0.10798072814941406, -0.1044149398803711, -0.10084915161132812, -0.09728336334228516, -0.09371757507324219, -0.09015178680419922, -0.08658599853515625, -0.08302021026611328, -0.07945442199707031, -0.07588863372802734, -0.07232284545898438, -0.0687570571899414, -0.06519126892089844, -0.06162548065185547, -0.0580596923828125, -0.05449390411376953, -0.05092811584472656, -0.047362327575683594, -0.043796539306640625, -0.040230751037597656, -0.03666496276855469, -0.03309917449951172, -0.02953338623046875, -0.02596759796142578, -0.022401809692382812, -0.018836021423339844, -0.015270233154296875, -0.011704444885253906, -0.008138656616210938, -0.004572868347167969, -0.001007080078125, 0.0025587081909179688, 0.0061244964599609375, 0.009690284729003906, 0.013256072998046875, 0.016821861267089844, 0.020387649536132812, 0.02395343780517578, 0.02751922607421875, 0.03108501434326172, 0.03465080261230469, 0.038216590881347656, 0.041782379150390625, 0.045348167419433594, 0.04891395568847656, 0.05247974395751953, 0.0560455322265625, 0.05961132049560547, 0.06317710876464844, 0.0667428970336914, 0.07030868530273438, 0.07387447357177734, 0.07744026184082031, 0.08100605010986328, 0.08457183837890625, 0.08813762664794922, 0.09170341491699219, 0.09526920318603516, 0.09883499145507812, 0.1024007797241211, 0.10596656799316406, 0.10953235626220703, 0.11309814453125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 8.0, 9.0, 14.0, 20.0, 20.0, 17.0, 21.0, 27.0, 54.0, 57.0, 95.0, 150.0, 128.0, 85.0, 68.0, 52.0, 26.0, 21.0, 21.0, 21.0, 14.0, 14.0, 13.0, 6.0, 7.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0001518726348876953, -0.00014724396169185638, -0.00014261528849601746, -0.00013798661530017853, -0.0001333579421043396, -0.00012872926890850067, -0.00012410059571266174, -0.00011947192251682281, -0.00011484324932098389, -0.00011021457612514496, -0.00010558590292930603, -0.0001009572297334671, -9.632855653762817e-05, -9.169988334178925e-05, -8.707121014595032e-05, -8.244253695011139e-05, -7.781386375427246e-05, -7.318519055843353e-05, -6.85565173625946e-05, -6.392784416675568e-05, -5.929917097091675e-05, -5.467049777507782e-05, -5.004182457923889e-05, -4.541315138339996e-05, -4.0784478187561035e-05, -3.615580499172211e-05, -3.152713179588318e-05, -2.689845860004425e-05, -2.2269785404205322e-05, -1.7641112208366394e-05, -1.3012439012527466e-05, -8.383765816688538e-06, -3.7550926208496094e-06, 8.735805749893188e-07, 5.502253770828247e-06, 1.0130926966667175e-05, 1.4759600162506104e-05, 1.9388273358345032e-05, 2.401694655418396e-05, 2.8645619750022888e-05, 3.3274292945861816e-05, 3.7902966141700745e-05, 4.253163933753967e-05, 4.71603125333786e-05, 5.178898572921753e-05, 5.641765892505646e-05, 6.104633212089539e-05, 6.567500531673431e-05, 7.030367851257324e-05, 7.493235170841217e-05, 7.95610249042511e-05, 8.418969810009003e-05, 8.881837129592896e-05, 9.344704449176788e-05, 9.807571768760681e-05, 0.00010270439088344574, 0.00010733306407928467, 0.0001119617372751236, 0.00011659041047096252, 0.00012121908366680145, 0.00012584775686264038, 0.0001304764300584793, 0.00013510510325431824, 0.00013973377645015717, 0.0001443624496459961]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 2.0, 9.0, 13.0, 17.0, 34.0, 35.0, 68.0, 73.0, 121.0, 257.0, 490.0, 1134.0, 3102.0, 13991.0, 822543.0, 191357.0, 10624.0, 2632.0, 990.0, 438.0, 243.0, 148.0, 77.0, 42.0, 36.0, 21.0, 23.0, 10.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05908203125, -0.05688762664794922, -0.05469322204589844, -0.052498817443847656, -0.050304412841796875, -0.048110008239746094, -0.04591560363769531, -0.04372119903564453, -0.04152679443359375, -0.03933238983154297, -0.03713798522949219, -0.034943580627441406, -0.032749176025390625, -0.030554771423339844, -0.028360366821289062, -0.02616596221923828, -0.0239715576171875, -0.02177715301513672, -0.019582748413085938, -0.017388343811035156, -0.015193939208984375, -0.012999534606933594, -0.010805130004882812, -0.008610725402832031, -0.00641632080078125, -0.004221916198730469, -0.0020275115966796875, 0.00016689300537109375, 0.002361297607421875, 0.004555702209472656, 0.0067501068115234375, 0.008944511413574219, 0.011138916015625, 0.013333320617675781, 0.015527725219726562, 0.017722129821777344, 0.019916534423828125, 0.022110939025878906, 0.024305343627929688, 0.02649974822998047, 0.02869415283203125, 0.03088855743408203, 0.03308296203613281, 0.035277366638183594, 0.037471771240234375, 0.039666175842285156, 0.04186058044433594, 0.04405498504638672, 0.0462493896484375, 0.04844379425048828, 0.05063819885253906, 0.052832603454589844, 0.055027008056640625, 0.057221412658691406, 0.05941581726074219, 0.06161022186279297, 0.06380462646484375, 0.06599903106689453, 0.06819343566894531, 0.0703878402709961, 0.07258224487304688, 0.07477664947509766, 0.07697105407714844, 0.07916545867919922, 0.08135986328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 2.0, 7.0, 12.0, 8.0, 13.0, 12.0, 22.0, 57.0, 78.0, 172.0, 260.0, 141.0, 87.0, 52.0, 14.0, 18.0, 15.0, 6.0, 6.0, 9.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.103271484375, -0.09821319580078125, -0.0931549072265625, -0.08809661865234375, -0.083038330078125, -0.07798004150390625, -0.0729217529296875, -0.06786346435546875, -0.06280517578125, -0.05774688720703125, -0.0526885986328125, -0.04763031005859375, -0.042572021484375, -0.03751373291015625, -0.0324554443359375, -0.02739715576171875, -0.0223388671875, -0.01728057861328125, -0.0122222900390625, -0.00716400146484375, -0.002105712890625, 0.00295257568359375, 0.0080108642578125, 0.01306915283203125, 0.01812744140625, 0.02318572998046875, 0.0282440185546875, 0.03330230712890625, 0.038360595703125, 0.04341888427734375, 0.0484771728515625, 0.05353546142578125, 0.05859375, 0.06365203857421875, 0.0687103271484375, 0.07376861572265625, 0.078826904296875, 0.08388519287109375, 0.0889434814453125, 0.09400177001953125, 0.09906005859375, 0.10411834716796875, 0.1091766357421875, 0.11423492431640625, 0.119293212890625, 0.12435150146484375, 0.1294097900390625, 0.13446807861328125, 0.1395263671875, 0.14458465576171875, 0.1496429443359375, 0.15470123291015625, 0.159759521484375, 0.16481781005859375, 0.1698760986328125, 0.17493438720703125, 0.17999267578125, 0.18505096435546875, 0.1901092529296875, 0.19516754150390625, 0.200225830078125, 0.20528411865234375, 0.2103424072265625, 0.21540069580078125, 0.220458984375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 23.0, 39.0, 150.0, 497.0, 159.0, 65.0, 31.0, 14.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5795183181762695, -3.3853201866149902, -3.191122055053711, -2.9969239234924316, -2.8027257919311523, -2.608527660369873, -2.4143295288085938, -2.2201313972473145, -2.025933265686035, -1.8317351341247559, -1.6375370025634766, -1.4433388710021973, -1.249140739440918, -1.0549426078796387, -0.8607443571090698, -0.6665462255477905, -0.4723479747772217, -0.2781498432159424, -0.0839516818523407, 0.11024647951126099, 0.3044446110725403, 0.4986427426338196, 0.6928409337997437, 0.887039065361023, 1.0812371969223022, 1.2754353284835815, 1.4696334600448608, 1.6638317108154297, 1.858029842376709, 2.0522279739379883, 2.2464261054992676, 2.440624237060547, 2.634822368621826, 2.8290205001831055, 3.0232186317443848, 3.217416763305664, 3.4116148948669434, 3.6058130264282227, 3.800011157989502, 3.9942092895507812, 4.1884074211120605, 4.38260555267334, 4.576803684234619, 4.771001815795898, 4.965199947357178, 5.159398078918457, 5.353596210479736, 5.547794342041016, 5.741992950439453, 5.936191082000732, 6.130389213562012, 6.324587345123291, 6.51878547668457, 6.71298360824585, 6.907181739807129, 7.101379871368408, 7.2955780029296875, 7.489776134490967, 7.683974266052246, 7.878172397613525, 8.072370529174805, 8.266569137573242, 8.460766792297363, 8.6549654006958, 8.849163055419922]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 1.0, 0.0, 4.0, 7.0, 7.0, 6.0, 10.0, 15.0, 22.0, 18.0, 24.0, 26.0, 32.0, 68.0, 83.0, 96.0, 73.0, 98.0, 110.0, 80.0, 50.0, 28.0, 25.0, 17.0, 14.0, 11.0, 11.0, 11.0, 5.0, 11.0, 8.0, 10.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.550352096557617, -2.4510185718536377, -2.351685047149658, -2.2523515224456787, -2.153017997741699, -2.0536844730377197, -1.9543509483337402, -1.8550174236297607, -1.7556838989257812, -1.6563503742218018, -1.5570168495178223, -1.4576833248138428, -1.3583498001098633, -1.2590162754058838, -1.1596827507019043, -1.0603492259979248, -0.9610157012939453, -0.8616821765899658, -0.7623486518859863, -0.6630151271820068, -0.5636816024780273, -0.46434807777404785, -0.36501455307006836, -0.26568102836608887, -0.16634750366210938, -0.06701397895812988, 0.03231954574584961, 0.1316530704498291, 0.2309865951538086, 0.3303201198577881, 0.4296536445617676, 0.5289871692657471, 0.6283206939697266, 0.727654218673706, 0.8269877433776855, 0.926321268081665, 1.0256547927856445, 1.124988317489624, 1.2243218421936035, 1.323655366897583, 1.4229888916015625, 1.522322416305542, 1.6216559410095215, 1.720989465713501, 1.8203229904174805, 1.91965651512146, 2.0189900398254395, 2.118323564529419, 2.2176570892333984, 2.316990613937378, 2.4163241386413574, 2.515657663345337, 2.6149911880493164, 2.714324712753296, 2.8136582374572754, 2.912991762161255, 3.0123252868652344, 3.111658811569214, 3.2109923362731934, 3.310325860977173, 3.4096593856811523, 3.508992910385132, 3.6083264350891113, 3.707659959793091, 3.8069934844970703]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 5.0, 13.0, 5.0, 12.0, 10.0, 9.0, 14.0, 13.0, 18.0, 21.0, 27.0, 24.0, 39.0, 52.0, 168.0, 251.0, 50.0, 33.0, 32.0, 33.0, 22.0, 22.0, 14.0, 11.0, 15.0, 7.0, 7.0, 11.0, 7.0, 3.0, 6.0, 4.0, 4.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.144775390625, -0.14012527465820312, -0.13547515869140625, -0.13082504272460938, -0.1261749267578125, -0.12152481079101562, -0.11687469482421875, -0.11222457885742188, -0.107574462890625, -0.10292434692382812, -0.09827423095703125, -0.09362411499023438, -0.0889739990234375, -0.08432388305664062, -0.07967376708984375, -0.07502365112304688, -0.07037353515625, -0.06572341918945312, -0.06107330322265625, -0.056423187255859375, -0.0517730712890625, -0.047122955322265625, -0.04247283935546875, -0.037822723388671875, -0.033172607421875, -0.028522491455078125, -0.02387237548828125, -0.019222259521484375, -0.0145721435546875, -0.009922027587890625, -0.00527191162109375, -0.000621795654296875, 0.0040283203125, 0.008678436279296875, 0.01332855224609375, 0.017978668212890625, 0.0226287841796875, 0.027278900146484375, 0.03192901611328125, 0.036579132080078125, 0.041229248046875, 0.045879364013671875, 0.05052947998046875, 0.055179595947265625, 0.0598297119140625, 0.06447982788085938, 0.06912994384765625, 0.07378005981445312, 0.07843017578125, 0.08308029174804688, 0.08773040771484375, 0.09238052368164062, 0.0970306396484375, 0.10168075561523438, 0.10633087158203125, 0.11098098754882812, 0.115631103515625, 0.12028121948242188, 0.12493133544921875, 0.12958145141601562, 0.1342315673828125, 0.13888168334960938, 0.14353179931640625, 0.14818191528320312, 0.15283203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [5.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 11.0, 4.0, 18.0, 12.0, 38.0, 26.0, 20.0, 67.0, 116.0, 373.0, 1676.0, 64031.0, 8319340.0, 2116.0, 385.0, 117.0, 71.0, 56.0, 25.0, 8.0, 22.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0], "bins": [-2.3081440925598145, -2.242325782775879, -2.1765074729919434, -2.110689163208008, -2.0448708534240723, -1.9790524244308472, -1.9132341146469116, -1.847415804862976, -1.781597375869751, -1.7157790660858154, -1.6499607563018799, -1.5841424465179443, -1.5183240175247192, -1.4525057077407837, -1.3866873979568481, -1.3208690881729126, -1.255050778388977, -1.1892324686050415, -1.123414158821106, -1.0575957298278809, -0.9917774200439453, -0.9259591102600098, -0.8601408004760742, -0.7943224906921387, -0.7285041213035583, -0.6626858115196228, -0.5968674421310425, -0.5310491323471069, -0.465230792760849, -0.39941245317459106, -0.3335941433906555, -0.2677758038043976, -0.20195746421813965, -0.1361391246318817, -0.07032079994678497, -0.004502475261688232, 0.0613158643245697, 0.12713420391082764, 0.19295251369476318, 0.2587708532810211, 0.32458919286727905, 0.390407532453537, 0.4562258720397949, 0.5220441818237305, 0.587862491607666, 0.6536808609962463, 0.7194991707801819, 0.7853175401687622, 0.8511358499526978, 0.9169541597366333, 0.9827725291252136, 1.048590898513794, 1.1144092082977295, 1.180227518081665, 1.2460458278656006, 1.3118641376495361, 1.3776824474334717, 1.4435007572174072, 1.5093190670013428, 1.5751373767852783, 1.6409558057785034, 1.706774115562439, 1.7725924253463745, 1.83841073513031, 1.9042291641235352]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 6.0, 4.0, 3.0, 8.0, 4.0, 10.0, 6.0, 10.0, 6.0, 6.0, 2.0, 3.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.655138611793518, -1.6143183708190918, -1.573498249053955, -1.5326780080795288, -1.4918577671051025, -1.4510376453399658, -1.4102174043655396, -1.3693971633911133, -1.3285770416259766, -1.2877568006515503, -1.2469366788864136, -1.2061164379119873, -1.165296196937561, -1.1244760751724243, -1.083655834197998, -1.0428357124328613, -1.0020153522491455, -0.961195170879364, -0.9203749299049377, -0.8795547485351562, -0.8387345671653748, -0.7979143857955933, -0.757094144821167, -0.7162739634513855, -0.675453782081604, -0.6346336007118225, -0.5938133597373962, -0.5529931783676147, -0.5121729969978333, -0.47135278582572937, -0.4305325746536255, -0.389712393283844, -0.3488921523094177, -0.30807194113731384, -0.26725175976753235, -0.22643154859542847, -0.18561135232448578, -0.1447911560535431, -0.10397094488143921, -0.06315076351165771, -0.022330552339553833, 0.018489647656679153, 0.05930984765291214, 0.10013005137443542, 0.1409502476453781, 0.1817704439163208, 0.22259065508842468, 0.2634108364582062, 0.30423104763031006, 0.34505125880241394, 0.38587144017219543, 0.4266916513442993, 0.4675118327140808, 0.5083320140838623, 0.5491522550582886, 0.5899724364280701, 0.6307926177978516, 0.6716127991676331, 0.7124330401420593, 0.7532532215118408, 0.7940734028816223, 0.8348935842514038, 0.8757138252258301, 0.9165340065956116, 0.9573542475700378]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 6.0, 2.0, 9.0, 8.0, 11.0, 20.0, 22.0, 26.0, 42.0, 39.0, 80.0, 118.0, 164.0, 306.0, 641.0, 1415.0, 3641.0, 11106.0, 37881.0, 157886.0, 227122.0, 59996.0, 15485.0, 4701.0, 1781.0, 775.0, 369.0, 216.0, 122.0, 72.0, 45.0, 39.0, 37.0, 30.0, 11.0, 8.0, 9.0, 8.0, 4.0, 4.0, 3.0, 5.0, 1.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.84716796875, -0.8199920654296875, -0.792816162109375, -0.7656402587890625, -0.73846435546875, -0.7112884521484375, -0.684112548828125, -0.6569366455078125, -0.6297607421875, -0.6025848388671875, -0.575408935546875, -0.5482330322265625, -0.52105712890625, -0.4938812255859375, -0.466705322265625, -0.4395294189453125, -0.412353515625, -0.3851776123046875, -0.358001708984375, -0.3308258056640625, -0.30364990234375, -0.2764739990234375, -0.249298095703125, -0.2221221923828125, -0.1949462890625, -0.1677703857421875, -0.140594482421875, -0.1134185791015625, -0.08624267578125, -0.0590667724609375, -0.031890869140625, -0.0047149658203125, 0.0224609375, 0.0496368408203125, 0.076812744140625, 0.1039886474609375, 0.13116455078125, 0.1583404541015625, 0.185516357421875, 0.2126922607421875, 0.2398681640625, 0.2670440673828125, 0.294219970703125, 0.3213958740234375, 0.34857177734375, 0.3757476806640625, 0.402923583984375, 0.4300994873046875, 0.457275390625, 0.4844512939453125, 0.511627197265625, 0.5388031005859375, 0.56597900390625, 0.5931549072265625, 0.620330810546875, 0.6475067138671875, 0.6746826171875, 0.7018585205078125, 0.729034423828125, 0.7562103271484375, 0.78338623046875, 0.8105621337890625, 0.837738037109375, 0.8649139404296875, 0.89208984375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 4.0, 9.0, 16.0, 15.0, 39.0, 40.0, 61.0, 75.0, 90.0, 116.0, 122.0, 99.0, 80.0, 64.0, 41.0, 50.0, 20.0, 17.0, 12.0, 10.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.300048828125, -0.2902030944824219, -0.28035736083984375, -0.2705116271972656, -0.2606658935546875, -0.2508201599121094, -0.24097442626953125, -0.23112869262695312, -0.221282958984375, -0.21143722534179688, -0.20159149169921875, -0.19174575805664062, -0.1819000244140625, -0.17205429077148438, -0.16220855712890625, -0.15236282348632812, -0.14251708984375, -0.13267135620117188, -0.12282562255859375, -0.11297988891601562, -0.1031341552734375, -0.09328842163085938, -0.08344268798828125, -0.07359695434570312, -0.063751220703125, -0.053905487060546875, -0.04405975341796875, -0.034214019775390625, -0.0243682861328125, -0.014522552490234375, -0.00467681884765625, 0.005168914794921875, 0.0150146484375, 0.024860382080078125, 0.03470611572265625, 0.044551849365234375, 0.0543975830078125, 0.06424331665039062, 0.07408905029296875, 0.08393478393554688, 0.093780517578125, 0.10362625122070312, 0.11347198486328125, 0.12331771850585938, 0.1331634521484375, 0.14300918579101562, 0.15285491943359375, 0.16270065307617188, 0.17254638671875, 0.18239212036132812, 0.19223785400390625, 0.20208358764648438, 0.2119293212890625, 0.22177505493164062, 0.23162078857421875, 0.24146652221679688, 0.251312255859375, 0.2611579895019531, 0.27100372314453125, 0.2808494567871094, 0.2906951904296875, 0.3005409240722656, 0.31038665771484375, 0.3202323913574219, 0.330078125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 6.0, 5.0, 7.0, 30.0, 68.0, 157.0, 120.0, 45.0, 12.0, 8.0, 11.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2807621955871582, -1.2317323684692383, -1.1827025413513184, -1.1336725950241089, -1.084642767906189, -1.035612940788269, -0.9865831136703491, -0.9375532269477844, -0.8885233402252197, -0.8394935131072998, -0.7904636263847351, -0.7414337992668152, -0.6924039125442505, -0.6433740854263306, -0.5943442583084106, -0.545314371585846, -0.496284544467926, -0.4472546875476837, -0.3982248306274414, -0.3491950035095215, -0.3001651167869568, -0.25113528966903687, -0.20210543274879456, -0.15307557582855225, -0.10404571890830994, -0.055015865713357925, -0.005986012518405914, 0.0430438369512558, 0.09207369387149811, 0.14110355079174042, 0.19013339281082153, 0.23916324973106384, 0.28819310665130615, 0.33722296357154846, 0.38625282049179077, 0.4352826476097107, 0.4843125343322754, 0.5333423614501953, 0.5823721885681152, 0.6314020752906799, 0.6804319620132446, 0.7294617891311646, 0.7784916758537292, 0.8275215029716492, 0.8765513896942139, 0.9255812168121338, 0.9746110439300537, 1.0236408710479736, 1.0726706981658936, 1.1217005252838135, 1.1707303524017334, 1.2197602987289429, 1.2687901258468628, 1.3178199529647827, 1.3668497800827026, 1.415879726409912, 1.464909553527832, 1.513939380645752, 1.5629692077636719, 1.6119991540908813, 1.6610289812088013, 1.7100588083267212, 1.7590886354446411, 1.8081185817718506, 1.8571484088897705]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 5.0, 9.0, 12.0, 32.0, 103.0, 154.0, 81.0, 36.0, 13.0, 7.0, 7.0, 10.0, 3.0, 4.0, 3.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.622973084449768, -1.5557844638824463, -1.4885958433151245, -1.4214072227478027, -1.354218602180481, -1.2870299816131592, -1.219841480255127, -1.1526527404785156, -1.0854642391204834, -1.0182756185531616, -0.9510869979858398, -0.8838983774185181, -0.8167097568511963, -0.7495211362838745, -0.6823325753211975, -0.6151439547538757, -0.5479552745819092, -0.4807666540145874, -0.4135780334472656, -0.34638944268226624, -0.27920082211494446, -0.21201220154762268, -0.1448236107826233, -0.07763499021530151, -0.010446369647979736, 0.056742243468761444, 0.12393085658550262, 0.1911194622516632, 0.258308082818985, 0.32549670338630676, 0.39268529415130615, 0.45987391471862793, 0.5270624160766602, 0.5942510366439819, 0.6614396572113037, 0.7286282777786255, 0.7958168983459473, 0.863005518913269, 0.930194079875946, 0.9973827004432678, 1.0645713806152344, 1.1317600011825562, 1.198948621749878, 1.2661372423171997, 1.3333258628845215, 1.4005144834518433, 1.467703104019165, 1.5348916053771973, 1.602080225944519, 1.6692688465118408, 1.7364574670791626, 1.8036460876464844, 1.8708347082138062, 1.938023328781128, 2.00521183013916, 2.0724005699157715, 2.1395890712738037, 2.206777572631836, 2.2739663124084473, 2.3411548137664795, 2.408343553543091, 2.475532054901123, 2.5427207946777344, 2.6099092960357666, 2.677098035812378]}, "eval/loss": 4.3373589515686035, "eval/wer": 2.4481753272510907, "eval/runtime": 1098.1378, "eval/samples_per_second": 2.406, "eval/steps_per_second": 0.301, "train/train_runtime": 6248.9422, "train/train_samples_per_second": 4.567, "train/train_steps_per_second": 0.143, "train/total_flos": 0.0, "train/train_loss": 4.35051649381227, "_wandb": {"runtime": 7690}} \ No newline at end of file