diff --git "a/wandb/run-20220318_085758-21ccfwts/files/wandb-summary.json" "b/wandb/run-20220318_085758-21ccfwts/files/wandb-summary.json" --- "a/wandb/run-20220318_085758-21ccfwts/files/wandb-summary.json" +++ "b/wandb/run-20220318_085758-21ccfwts/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.8683, "train/learning_rate": 7.627672209026128e-05, "train/epoch": 5.61, "train/global_step": 5000, "_runtime": 32100, "_timestamp": 1647625978, "_step": 5001, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 23.0, 205.0, 516.0, 231.0, 36.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.947040557861328, -20.310117721557617, -16.67319679260254, -13.036273956298828, -9.399352073669434, -5.762430191040039, -2.125507354736328, 1.51141357421875, 5.148336410522461, 8.785258293151855, 12.42218017578125, 16.05910301208496, 19.696025848388672, 23.33294677734375, 26.96986961364746, 30.60679054260254, 34.24371337890625, 37.88063430786133, 41.51755905151367, 45.15447998046875, 48.79140090942383, 52.428321838378906, 56.06524658203125, 59.70216751098633, 63.339088439941406, 66.97601318359375, 70.61293029785156, 74.2498550415039, 77.88677978515625, 81.52369689941406, 85.1606216430664, 88.79754638671875, 92.4344711303711, 96.07139587402344, 99.70831298828125, 103.3452377319336, 106.98216247558594, 110.61907958984375, 114.2560043334961, 117.89292907714844, 121.52984619140625, 125.1667709350586, 128.80369567871094, 132.44061279296875, 136.07752990722656, 139.71446228027344, 143.35137939453125, 146.98829650878906, 150.62522888183594, 154.26214599609375, 157.89907836914062, 161.53599548339844, 165.17291259765625, 168.80984497070312, 172.44676208496094, 176.08367919921875, 179.72059631347656, 183.35751342773438, 186.99444580078125, 190.63136291503906, 194.26828002929688, 197.90521240234375, 201.54212951660156, 205.17904663085938, 208.81597900390625]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 2.0, 6.0, 6.0, 10.0, 9.0, 10.0, 13.0, 9.0, 18.0, 20.0, 31.0, 29.0, 26.0, 37.0, 36.0, 32.0, 44.0, 45.0, 55.0, 48.0, 36.0, 41.0, 39.0, 47.0, 35.0, 33.0, 44.0, 40.0, 20.0, 33.0, 23.0, 35.0, 18.0, 8.0, 8.0, 11.0, 9.0, 6.0, 4.0, 6.0, 1.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.669662475585938, -15.11377239227295, -14.557883262634277, -14.001993179321289, -13.446104049682617, -12.890213966369629, -12.33432388305664, -11.778434753417969, -11.22254467010498, -10.666654586791992, -10.11076545715332, -9.554875373840332, -8.998985290527344, -8.443096160888672, -7.887206077575684, -7.3313164710998535, -6.775426864624023, -6.219537258148193, -5.663647651672363, -5.107757568359375, -4.551867961883545, -3.995978355407715, -3.4400885105133057, -2.8841986656188965, -2.3283090591430664, -1.7724193334579468, -1.2165296077728271, -0.6606398820877075, -0.10475015640258789, 0.4511394500732422, 1.0070292949676514, 1.5629191398620605, 2.118806838989258, 2.674696445465088, 3.230586290359497, 3.7864761352539062, 4.342365741729736, 4.898255348205566, 5.454145431518555, 6.010035037994385, 6.565924644470215, 7.121814250946045, 7.677703857421875, 8.233593940734863, 8.789484024047852, 9.345373153686523, 9.901263236999512, 10.4571533203125, 11.013042449951172, 11.56893253326416, 12.124821662902832, 12.68071174621582, 13.236600875854492, 13.79249095916748, 14.348381042480469, 14.90427017211914, 15.460160255432129, 16.016050338745117, 16.57193946838379, 17.12782859802246, 17.683719635009766, 18.239608764648438, 18.79549789428711, 19.351388931274414, 19.907278060913086]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 6.0, 8.0, 7.0, 7.0, 7.0, 12.0, 12.0, 20.0, 15.0, 25.0, 19.0, 36.0, 36.0, 40.0, 50.0, 39.0, 39.0, 55.0, 43.0, 58.0, 47.0, 56.0, 45.0, 53.0, 43.0, 40.0, 33.0, 31.0, 21.0, 20.0, 17.0, 14.0, 15.0, 9.0, 7.0, 6.0, 5.0, 5.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5048828125, -1.453277587890625, -1.40167236328125, -1.350067138671875, -1.2984619140625, -1.246856689453125, -1.19525146484375, -1.143646240234375, -1.092041015625, -1.040435791015625, -0.98883056640625, -0.937225341796875, -0.8856201171875, -0.834014892578125, -0.78240966796875, -0.730804443359375, -0.67919921875, -0.627593994140625, -0.57598876953125, -0.524383544921875, -0.4727783203125, -0.421173095703125, -0.36956787109375, -0.317962646484375, -0.266357421875, -0.214752197265625, -0.16314697265625, -0.111541748046875, -0.0599365234375, -0.008331298828125, 0.04327392578125, 0.094879150390625, 0.146484375, 0.198089599609375, 0.24969482421875, 0.301300048828125, 0.3529052734375, 0.404510498046875, 0.45611572265625, 0.507720947265625, 0.559326171875, 0.610931396484375, 0.66253662109375, 0.714141845703125, 0.7657470703125, 0.817352294921875, 0.86895751953125, 0.920562744140625, 0.97216796875, 1.023773193359375, 1.07537841796875, 1.126983642578125, 1.1785888671875, 1.230194091796875, 1.28179931640625, 1.333404541015625, 1.385009765625, 1.436614990234375, 1.48822021484375, 1.539825439453125, 1.5914306640625, 1.643035888671875, 1.69464111328125, 1.746246337890625, 1.7978515625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 7.0, 7.0, 6.0, 11.0, 14.0, 20.0, 28.0, 36.0, 54.0, 81.0, 112.0, 171.0, 291.0, 392.0, 689.0, 1202.0, 2689.0, 6676.0, 22918.0, 112416.0, 891414.0, 2731693.0, 345283.0, 56023.0, 13341.0, 4342.0, 1955.0, 917.0, 588.0, 312.0, 195.0, 119.0, 71.0, 46.0, 28.0, 50.0, 27.0, 14.0, 14.0, 5.0, 8.0, 5.0, 5.0, 1.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.40625, -7.18377685546875, -6.9613037109375, -6.73883056640625, -6.516357421875, -6.29388427734375, -6.0714111328125, -5.84893798828125, -5.62646484375, -5.40399169921875, -5.1815185546875, -4.95904541015625, -4.736572265625, -4.51409912109375, -4.2916259765625, -4.06915283203125, -3.8466796875, -3.62420654296875, -3.4017333984375, -3.17926025390625, -2.956787109375, -2.73431396484375, -2.5118408203125, -2.28936767578125, -2.06689453125, -1.84442138671875, -1.6219482421875, -1.39947509765625, -1.177001953125, -0.95452880859375, -0.7320556640625, -0.50958251953125, -0.287109375, -0.06463623046875, 0.1578369140625, 0.38031005859375, 0.602783203125, 0.82525634765625, 1.0477294921875, 1.27020263671875, 1.49267578125, 1.71514892578125, 1.9376220703125, 2.16009521484375, 2.382568359375, 2.60504150390625, 2.8275146484375, 3.04998779296875, 3.2724609375, 3.49493408203125, 3.7174072265625, 3.93988037109375, 4.162353515625, 4.38482666015625, 4.6072998046875, 4.82977294921875, 5.05224609375, 5.27471923828125, 5.4971923828125, 5.71966552734375, 5.942138671875, 6.16461181640625, 6.3870849609375, 6.60955810546875, 6.83203125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 11.0, 12.0, 17.0, 22.0, 59.0, 75.0, 170.0, 312.0, 449.0, 755.0, 832.0, 537.0, 363.0, 212.0, 115.0, 64.0, 36.0, 18.0, 8.0, 7.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.171875, -10.8704833984375, -10.569091796875, -10.2677001953125, -9.96630859375, -9.6649169921875, -9.363525390625, -9.0621337890625, -8.7607421875, -8.4593505859375, -8.157958984375, -7.8565673828125, -7.55517578125, -7.2537841796875, -6.952392578125, -6.6510009765625, -6.349609375, -6.0482177734375, -5.746826171875, -5.4454345703125, -5.14404296875, -4.8426513671875, -4.541259765625, -4.2398681640625, -3.9384765625, -3.6370849609375, -3.335693359375, -3.0343017578125, -2.73291015625, -2.4315185546875, -2.130126953125, -1.8287353515625, -1.52734375, -1.2259521484375, -0.924560546875, -0.6231689453125, -0.32177734375, -0.0203857421875, 0.281005859375, 0.5823974609375, 0.8837890625, 1.1851806640625, 1.486572265625, 1.7879638671875, 2.08935546875, 2.3907470703125, 2.692138671875, 2.9935302734375, 3.294921875, 3.5963134765625, 3.897705078125, 4.1990966796875, 4.50048828125, 4.8018798828125, 5.103271484375, 5.4046630859375, 5.7060546875, 6.0074462890625, 6.308837890625, 6.6102294921875, 6.91162109375, 7.2130126953125, 7.514404296875, 7.8157958984375, 8.1171875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 21.0, 26.0, 72.0, 97.0, 184.0, 397.0, 869.0, 2666.0, 20938.0, 1731087.0, 2405734.0, 27278.0, 2999.0, 1060.0, 427.0, 207.0, 109.0, 44.0, 22.0, 15.0, 11.0, 5.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-34.375, -33.421142578125, -32.46728515625, -31.513427734375, -30.5595703125, -29.605712890625, -28.65185546875, -27.697998046875, -26.744140625, -25.790283203125, -24.83642578125, -23.882568359375, -22.9287109375, -21.974853515625, -21.02099609375, -20.067138671875, -19.11328125, -18.159423828125, -17.20556640625, -16.251708984375, -15.2978515625, -14.343994140625, -13.39013671875, -12.436279296875, -11.482421875, -10.528564453125, -9.57470703125, -8.620849609375, -7.6669921875, -6.713134765625, -5.75927734375, -4.805419921875, -3.8515625, -2.897705078125, -1.94384765625, -0.989990234375, -0.0361328125, 0.917724609375, 1.87158203125, 2.825439453125, 3.779296875, 4.733154296875, 5.68701171875, 6.640869140625, 7.5947265625, 8.548583984375, 9.50244140625, 10.456298828125, 11.41015625, 12.364013671875, 13.31787109375, 14.271728515625, 15.2255859375, 16.179443359375, 17.13330078125, 18.087158203125, 19.041015625, 19.994873046875, 20.94873046875, 21.902587890625, 22.8564453125, 23.810302734375, 24.76416015625, 25.718017578125, 26.671875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 16.0, 206.0, 465.0, 277.0, 50.0, 3.0, 1.0], "bins": [-211.5327606201172, -207.97804260253906, -204.42332458496094, -200.8686065673828, -197.3138885498047, -193.75917053222656, -190.20445251464844, -186.6497344970703, -183.0950164794922, -179.54029846191406, -175.98558044433594, -172.4308624267578, -168.8761444091797, -165.32142639160156, -161.76670837402344, -158.2119903564453, -154.65728759765625, -151.10256958007812, -147.5478515625, -143.99313354492188, -140.43841552734375, -136.88369750976562, -133.3289794921875, -129.77426147460938, -126.21954345703125, -122.66482543945312, -119.110107421875, -115.55538940429688, -112.00067138671875, -108.44595336914062, -104.8912353515625, -101.33651733398438, -97.78179931640625, -94.22708129882812, -90.67236328125, -87.11764526367188, -83.56292724609375, -80.00820922851562, -76.4534912109375, -72.89877319335938, -69.34405517578125, -65.78933715820312, -62.234619140625, -58.679901123046875, -55.12518310546875, -51.570465087890625, -48.015750885009766, -44.46103286743164, -40.90631866455078, -37.351600646972656, -33.79688262939453, -30.24216651916504, -26.687448501586914, -23.13273048400879, -19.578014373779297, -16.023296356201172, -12.468576431274414, -8.913858413696289, -5.3591413497924805, -1.8044242858886719, 1.7502937316894531, 5.305011749267578, 8.85972785949707, 12.414445877075195, 15.96916389465332]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 1.0, 4.0, 5.0, 3.0, 8.0, 14.0, 7.0, 8.0, 10.0, 17.0, 25.0, 24.0, 22.0, 28.0, 27.0, 25.0, 32.0, 37.0, 38.0, 38.0, 37.0, 46.0, 42.0, 43.0, 40.0, 39.0, 30.0, 31.0, 29.0, 35.0, 33.0, 26.0, 28.0, 18.0, 20.0, 21.0, 13.0, 16.0, 13.0, 16.0, 12.0, 11.0, 8.0, 3.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.903553009033203, -16.351224899291992, -15.798894882202148, -15.246566772460938, -14.69423770904541, -14.141908645629883, -13.589579582214355, -13.037250518798828, -12.484922409057617, -11.93259334564209, -11.380264282226562, -10.827936172485352, -10.275607109069824, -9.723278045654297, -9.17094898223877, -8.618619918823242, -8.066290855407715, -7.5139617919921875, -6.961633205413818, -6.409304141998291, -5.856975555419922, -5.3046464920043945, -4.752317428588867, -4.19998836517334, -3.6476597785949707, -3.0953309535980225, -2.543002128601074, -1.9906730651855469, -1.4383442401885986, -0.8860154151916504, -0.33368635177612305, 0.2186424732208252, 0.7709712982177734, 1.3233001232147217, 1.8756290674209595, 2.4279580116271973, 2.9802868366241455, 3.5326156616210938, 4.084944725036621, 4.637273788452148, 5.189602375030518, 5.741931438446045, 6.294260025024414, 6.846589088439941, 7.398918151855469, 7.951246738433838, 8.503576278686523, 9.055904388427734, 9.608233451843262, 10.160562515258789, 10.712891578674316, 11.265220642089844, 11.817548751831055, 12.369877815246582, 12.92220687866211, 13.474535942077637, 14.026865005493164, 14.579194068908691, 15.131523132324219, 15.68385124206543, 16.236181259155273, 16.788509368896484, 17.340839385986328, 17.89316749572754, 18.44549560546875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 3.0, 6.0, 8.0, 20.0, 13.0, 12.0, 17.0, 14.0, 16.0, 21.0, 23.0, 31.0, 27.0, 34.0, 45.0, 53.0, 34.0, 41.0, 41.0, 60.0, 56.0, 43.0, 47.0, 34.0, 48.0, 28.0, 34.0, 34.0, 30.0, 18.0, 16.0, 20.0, 19.0, 13.0, 7.0, 7.0, 5.0, 11.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.685546875, -1.6351470947265625, -1.584747314453125, -1.5343475341796875, -1.48394775390625, -1.4335479736328125, -1.383148193359375, -1.3327484130859375, -1.2823486328125, -1.2319488525390625, -1.181549072265625, -1.1311492919921875, -1.08074951171875, -1.0303497314453125, -0.979949951171875, -0.9295501708984375, -0.879150390625, -0.8287506103515625, -0.778350830078125, -0.7279510498046875, -0.67755126953125, -0.6271514892578125, -0.576751708984375, -0.5263519287109375, -0.4759521484375, -0.4255523681640625, -0.375152587890625, -0.3247528076171875, -0.27435302734375, -0.2239532470703125, -0.173553466796875, -0.1231536865234375, -0.07275390625, -0.0223541259765625, 0.028045654296875, 0.0784454345703125, 0.12884521484375, 0.1792449951171875, 0.229644775390625, 0.2800445556640625, 0.3304443359375, 0.3808441162109375, 0.431243896484375, 0.4816436767578125, 0.53204345703125, 0.5824432373046875, 0.632843017578125, 0.6832427978515625, 0.733642578125, 0.7840423583984375, 0.834442138671875, 0.8848419189453125, 0.93524169921875, 0.9856414794921875, 1.036041259765625, 1.0864410400390625, 1.1368408203125, 1.1872406005859375, 1.237640380859375, 1.2880401611328125, 1.33843994140625, 1.3888397216796875, 1.439239501953125, 1.4896392822265625, 1.5400390625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 6.0, 9.0, 11.0, 14.0, 19.0, 32.0, 35.0, 71.0, 91.0, 202.0, 309.0, 539.0, 890.0, 1589.0, 2689.0, 4399.0, 7478.0, 11919.0, 18650.0, 28131.0, 41366.0, 57565.0, 74988.0, 92675.0, 106185.0, 115400.0, 109723.0, 97209.0, 80679.0, 61582.0, 46003.0, 32026.0, 21141.0, 13704.0, 8612.0, 5150.0, 3115.0, 1781.0, 1052.0, 617.0, 366.0, 213.0, 123.0, 70.0, 45.0, 28.0, 16.0, 14.0, 8.0, 8.0, 5.0, 5.0, 8.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9111328125, -0.8823394775390625, -0.853546142578125, -0.8247528076171875, -0.79595947265625, -0.7671661376953125, -0.738372802734375, -0.7095794677734375, -0.6807861328125, -0.6519927978515625, -0.623199462890625, -0.5944061279296875, -0.56561279296875, -0.5368194580078125, -0.508026123046875, -0.4792327880859375, -0.450439453125, -0.4216461181640625, -0.392852783203125, -0.3640594482421875, -0.33526611328125, -0.3064727783203125, -0.277679443359375, -0.2488861083984375, -0.2200927734375, -0.1912994384765625, -0.162506103515625, -0.1337127685546875, -0.10491943359375, -0.0761260986328125, -0.047332763671875, -0.0185394287109375, 0.01025390625, 0.0390472412109375, 0.067840576171875, 0.0966339111328125, 0.12542724609375, 0.1542205810546875, 0.183013916015625, 0.2118072509765625, 0.2406005859375, 0.2693939208984375, 0.298187255859375, 0.3269805908203125, 0.35577392578125, 0.3845672607421875, 0.413360595703125, 0.4421539306640625, 0.470947265625, 0.4997406005859375, 0.528533935546875, 0.5573272705078125, 0.58612060546875, 0.6149139404296875, 0.643707275390625, 0.6725006103515625, 0.7012939453125, 0.7300872802734375, 0.758880615234375, 0.7876739501953125, 0.81646728515625, 0.8452606201171875, 0.874053955078125, 0.9028472900390625, 0.931640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 5.0, 6.0, 6.0, 6.0, 4.0, 7.0, 9.0, 13.0, 13.0, 11.0, 15.0, 23.0, 22.0, 24.0, 29.0, 32.0, 22.0, 25.0, 31.0, 30.0, 39.0, 25.0, 36.0, 35.0, 44.0, 1065.0, 30.0, 25.0, 41.0, 22.0, 35.0, 26.0, 31.0, 33.0, 28.0, 20.0, 16.0, 22.0, 23.0, 18.0, 14.0, 10.0, 19.0, 8.0, 9.0, 7.0, 4.0, 5.0, 2.0, 3.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.58984375, -1.5384979248046875, -1.487152099609375, -1.4358062744140625, -1.38446044921875, -1.3331146240234375, -1.281768798828125, -1.2304229736328125, -1.1790771484375, -1.1277313232421875, -1.076385498046875, -1.0250396728515625, -0.97369384765625, -0.9223480224609375, -0.871002197265625, -0.8196563720703125, -0.768310546875, -0.7169647216796875, -0.665618896484375, -0.6142730712890625, -0.56292724609375, -0.5115814208984375, -0.460235595703125, -0.4088897705078125, -0.3575439453125, -0.3061981201171875, -0.254852294921875, -0.2035064697265625, -0.15216064453125, -0.1008148193359375, -0.049468994140625, 0.0018768310546875, 0.05322265625, 0.1045684814453125, 0.155914306640625, 0.2072601318359375, 0.25860595703125, 0.3099517822265625, 0.361297607421875, 0.4126434326171875, 0.4639892578125, 0.5153350830078125, 0.566680908203125, 0.6180267333984375, 0.66937255859375, 0.7207183837890625, 0.772064208984375, 0.8234100341796875, 0.874755859375, 0.9261016845703125, 0.977447509765625, 1.0287933349609375, 1.08013916015625, 1.1314849853515625, 1.182830810546875, 1.2341766357421875, 1.2855224609375, 1.3368682861328125, 1.388214111328125, 1.4395599365234375, 1.49090576171875, 1.5422515869140625, 1.593597412109375, 1.6449432373046875, 1.6962890625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 9.0, 16.0, 19.0, 30.0, 64.0, 63.0, 74.0, 124.0, 168.0, 242.0, 335.0, 472.0, 727.0, 993.0, 1445.0, 1922.0, 2841.0, 3966.0, 5547.0, 8004.0, 11319.0, 16792.0, 28700.0, 78190.0, 1707808.0, 133100.0, 33674.0, 18844.0, 12403.0, 8573.0, 6010.0, 4264.0, 3008.0, 2118.0, 1583.0, 1024.0, 809.0, 564.0, 386.0, 274.0, 201.0, 141.0, 77.0, 60.0, 42.0, 32.0, 19.0, 17.0, 13.0, 7.0, 2.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.4716796875, -1.423614501953125, -1.37554931640625, -1.327484130859375, -1.2794189453125, -1.231353759765625, -1.18328857421875, -1.135223388671875, -1.087158203125, -1.039093017578125, -0.99102783203125, -0.942962646484375, -0.8948974609375, -0.846832275390625, -0.79876708984375, -0.750701904296875, -0.70263671875, -0.654571533203125, -0.60650634765625, -0.558441162109375, -0.5103759765625, -0.462310791015625, -0.41424560546875, -0.366180419921875, -0.318115234375, -0.270050048828125, -0.22198486328125, -0.173919677734375, -0.1258544921875, -0.077789306640625, -0.02972412109375, 0.018341064453125, 0.06640625, 0.114471435546875, 0.16253662109375, 0.210601806640625, 0.2586669921875, 0.306732177734375, 0.35479736328125, 0.402862548828125, 0.450927734375, 0.498992919921875, 0.54705810546875, 0.595123291015625, 0.6431884765625, 0.691253662109375, 0.73931884765625, 0.787384033203125, 0.83544921875, 0.883514404296875, 0.93157958984375, 0.979644775390625, 1.0277099609375, 1.075775146484375, 1.12384033203125, 1.171905517578125, 1.219970703125, 1.268035888671875, 1.31610107421875, 1.364166259765625, 1.4122314453125, 1.460296630859375, 1.50836181640625, 1.556427001953125, 1.6044921875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 5.0, 4.0, 2.0, 8.0, 7.0, 13.0, 18.0, 10.0, 28.0, 29.0, 25.0, 29.0, 31.0, 34.0, 37.0, 34.0, 40.0, 40.0, 48.0, 42.0, 32.0, 33.0, 46.0, 39.0, 48.0, 43.0, 50.0, 36.0, 40.0, 30.0, 24.0, 22.0, 16.0, 12.0, 11.0, 16.0, 3.0, 6.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.1878662109375, -0.18210601806640625, -0.1763458251953125, -0.17058563232421875, -0.164825439453125, -0.15906524658203125, -0.1533050537109375, -0.14754486083984375, -0.14178466796875, -0.13602447509765625, -0.1302642822265625, -0.12450408935546875, -0.118743896484375, -0.11298370361328125, -0.1072235107421875, -0.10146331787109375, -0.095703125, -0.08994293212890625, -0.0841827392578125, -0.07842254638671875, -0.072662353515625, -0.06690216064453125, -0.0611419677734375, -0.05538177490234375, -0.04962158203125, -0.04386138916015625, -0.0381011962890625, -0.03234100341796875, -0.026580810546875, -0.02082061767578125, -0.0150604248046875, -0.00930023193359375, -0.0035400390625, 0.00222015380859375, 0.0079803466796875, 0.01374053955078125, 0.019500732421875, 0.02526092529296875, 0.0310211181640625, 0.03678131103515625, 0.04254150390625, 0.04830169677734375, 0.0540618896484375, 0.05982208251953125, 0.065582275390625, 0.07134246826171875, 0.0771026611328125, 0.08286285400390625, 0.088623046875, 0.09438323974609375, 0.1001434326171875, 0.10590362548828125, 0.111663818359375, 0.11742401123046875, 0.1231842041015625, 0.12894439697265625, 0.13470458984375, 0.14046478271484375, 0.1462249755859375, 0.15198516845703125, 0.157745361328125, 0.16350555419921875, 0.1692657470703125, 0.17502593994140625, 0.1807861328125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 4.0, 10.0, 4.0, 12.0, 15.0, 14.0, 26.0, 36.0, 46.0, 48.0, 83.0, 83.0, 96.0, 103.0, 134.0, 149.0, 202.0, 281.0, 426.0, 1272.0, 225181.0, 814667.0, 3696.0, 519.0, 295.0, 236.0, 180.0, 136.0, 121.0, 108.0, 76.0, 69.0, 44.0, 50.0, 35.0, 18.0, 20.0, 16.0, 12.0, 9.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.1640625, -3.065673828125, -2.96728515625, -2.868896484375, -2.7705078125, -2.672119140625, -2.57373046875, -2.475341796875, -2.376953125, -2.278564453125, -2.18017578125, -2.081787109375, -1.9833984375, -1.885009765625, -1.78662109375, -1.688232421875, -1.58984375, -1.491455078125, -1.39306640625, -1.294677734375, -1.1962890625, -1.097900390625, -0.99951171875, -0.901123046875, -0.802734375, -0.704345703125, -0.60595703125, -0.507568359375, -0.4091796875, -0.310791015625, -0.21240234375, -0.114013671875, -0.015625, 0.082763671875, 0.18115234375, 0.279541015625, 0.3779296875, 0.476318359375, 0.57470703125, 0.673095703125, 0.771484375, 0.869873046875, 0.96826171875, 1.066650390625, 1.1650390625, 1.263427734375, 1.36181640625, 1.460205078125, 1.55859375, 1.656982421875, 1.75537109375, 1.853759765625, 1.9521484375, 2.050537109375, 2.14892578125, 2.247314453125, 2.345703125, 2.444091796875, 2.54248046875, 2.640869140625, 2.7392578125, 2.837646484375, 2.93603515625, 3.034423828125, 3.1328125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 11.0, 28.0, 32.0, 79.0, 158.0, 245.0, 221.0, 125.0, 56.0, 28.0, 11.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8361284732818604, -1.7557697296142578, -1.6754109859466553, -1.5950521230697632, -1.5146933794021606, -1.434334635734558, -1.353975772857666, -1.2736170291900635, -1.193258285522461, -1.1128995418548584, -1.0325407981872559, -0.9521819353103638, -0.8718231916427612, -0.7914644479751587, -0.7111056447029114, -0.6307468414306641, -0.5503880977630615, -0.4700293242931366, -0.38967055082321167, -0.30931177735328674, -0.22895300388336182, -0.1485942304134369, -0.06823545694351196, 0.012123346328735352, 0.09248208999633789, 0.17284086346626282, 0.25319963693618774, 0.33355841040611267, 0.4139171838760376, 0.4942759573459625, 0.5746347308158875, 0.6549935340881348, 0.7353525161743164, 0.815711259841919, 0.8960700631141663, 0.9764288663864136, 1.0567876100540161, 1.1371463537216187, 1.2175052165985107, 1.2978639602661133, 1.3782227039337158, 1.4585814476013184, 1.538940191268921, 1.619299054145813, 1.6996577978134155, 1.780016541481018, 1.8603754043579102, 1.9407341480255127, 2.0210928916931152, 2.1014516353607178, 2.1818103790283203, 2.262169122695923, 2.3425278663635254, 2.422886848449707, 2.5032455921173096, 2.583604335784912, 2.6639630794525146, 2.744321823120117, 2.8246805667877197, 2.9050393104553223, 2.985398292541504, 3.0657570362091064, 3.146115779876709, 3.2264745235443115, 3.306833267211914]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 4.0, 6.0, 7.0, 7.0, 11.0, 11.0, 5.0, 15.0, 16.0, 16.0, 18.0, 22.0, 25.0, 27.0, 30.0, 37.0, 22.0, 35.0, 38.0, 46.0, 31.0, 42.0, 39.0, 32.0, 45.0, 38.0, 23.0, 45.0, 35.0, 31.0, 26.0, 24.0, 26.0, 23.0, 20.0, 16.0, 20.0, 17.0, 9.0, 9.0, 13.0, 7.0, 7.0, 1.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0], "bins": [-1.105726957321167, -1.0704123973846436, -1.0350979566574097, -0.999783456325531, -0.9644689559936523, -0.9291544556617737, -0.893839955329895, -0.8585253953933716, -0.8232109546661377, -0.787896454334259, -0.7525819540023804, -0.7172674536705017, -0.681952953338623, -0.6466384530067444, -0.6113239526748657, -0.5760093927383423, -0.5406948924064636, -0.505380392074585, -0.4700658917427063, -0.43475139141082764, -0.399436891078949, -0.3641223907470703, -0.32880786061286926, -0.2934933602809906, -0.25817885994911194, -0.22286435961723328, -0.18754985928535461, -0.15223534405231476, -0.1169208437204361, -0.08160634338855743, -0.04629182815551758, -0.010977327823638916, 0.024337172508239746, 0.05965167656540871, 0.09496618062257767, 0.13028068840503693, 0.1655951887369156, 0.20090968906879425, 0.2362242043018341, 0.27153870463371277, 0.30685320496559143, 0.3421677052974701, 0.37748220562934875, 0.4127967357635498, 0.44811123609542847, 0.48342573642730713, 0.5187402367591858, 0.5540547370910645, 0.5893692374229431, 0.6246837377548218, 0.6599982380867004, 0.6953127384185791, 0.7306272387504578, 0.7659417390823364, 0.8012562990188599, 0.8365707397460938, 0.8718852996826172, 0.9071998000144958, 0.9425143003463745, 0.9778288006782532, 1.0131433010101318, 1.0484578609466553, 1.0837723016738892, 1.1190868616104126, 1.1544013023376465]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 12.0, 9.0, 11.0, 13.0, 9.0, 16.0, 21.0, 31.0, 17.0, 21.0, 41.0, 34.0, 38.0, 41.0, 40.0, 48.0, 31.0, 45.0, 36.0, 45.0, 39.0, 45.0, 47.0, 39.0, 36.0, 34.0, 25.0, 29.0, 25.0, 18.0, 13.0, 20.0, 12.0, 10.0, 8.0, 3.0, 8.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4140625, -1.3670806884765625, -1.320098876953125, -1.2731170654296875, -1.22613525390625, -1.1791534423828125, -1.132171630859375, -1.0851898193359375, -1.0382080078125, -0.9912261962890625, -0.944244384765625, -0.8972625732421875, -0.85028076171875, -0.8032989501953125, -0.756317138671875, -0.7093353271484375, -0.662353515625, -0.6153717041015625, -0.568389892578125, -0.5214080810546875, -0.47442626953125, -0.4274444580078125, -0.380462646484375, -0.3334808349609375, -0.2864990234375, -0.2395172119140625, -0.192535400390625, -0.1455535888671875, -0.09857177734375, -0.0515899658203125, -0.004608154296875, 0.0423736572265625, 0.08935546875, 0.1363372802734375, 0.183319091796875, 0.2303009033203125, 0.27728271484375, 0.3242645263671875, 0.371246337890625, 0.4182281494140625, 0.4652099609375, 0.5121917724609375, 0.559173583984375, 0.6061553955078125, 0.65313720703125, 0.7001190185546875, 0.747100830078125, 0.7940826416015625, 0.841064453125, 0.8880462646484375, 0.935028076171875, 0.9820098876953125, 1.02899169921875, 1.0759735107421875, 1.122955322265625, 1.1699371337890625, 1.2169189453125, 1.2639007568359375, 1.310882568359375, 1.3578643798828125, 1.40484619140625, 1.4518280029296875, 1.498809814453125, 1.5457916259765625, 1.5927734375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 8.0, 11.0, 8.0, 13.0, 17.0, 22.0, 37.0, 61.0, 76.0, 129.0, 186.0, 328.0, 572.0, 997.0, 1575.0, 2740.0, 4836.0, 8164.0, 14701.0, 26092.0, 47663.0, 92927.0, 179411.0, 256292.0, 192374.0, 101996.0, 51996.0, 28262.0, 15747.0, 8834.0, 5179.0, 3006.0, 1685.0, 963.0, 638.0, 353.0, 242.0, 158.0, 102.0, 51.0, 40.0, 21.0, 17.0, 11.0, 6.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.263671875, -3.1634521484375, -3.063232421875, -2.9630126953125, -2.86279296875, -2.7625732421875, -2.662353515625, -2.5621337890625, -2.4619140625, -2.3616943359375, -2.261474609375, -2.1612548828125, -2.06103515625, -1.9608154296875, -1.860595703125, -1.7603759765625, -1.66015625, -1.5599365234375, -1.459716796875, -1.3594970703125, -1.25927734375, -1.1590576171875, -1.058837890625, -0.9586181640625, -0.8583984375, -0.7581787109375, -0.657958984375, -0.5577392578125, -0.45751953125, -0.3572998046875, -0.257080078125, -0.1568603515625, -0.056640625, 0.0435791015625, 0.143798828125, 0.2440185546875, 0.34423828125, 0.4444580078125, 0.544677734375, 0.6448974609375, 0.7451171875, 0.8453369140625, 0.945556640625, 1.0457763671875, 1.14599609375, 1.2462158203125, 1.346435546875, 1.4466552734375, 1.546875, 1.6470947265625, 1.747314453125, 1.8475341796875, 1.94775390625, 2.0479736328125, 2.148193359375, 2.2484130859375, 2.3486328125, 2.4488525390625, 2.549072265625, 2.6492919921875, 2.74951171875, 2.8497314453125, 2.949951171875, 3.0501708984375, 3.150390625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 0.0, 5.0, 9.0, 11.0, 7.0, 4.0, 9.0, 15.0, 13.0, 20.0, 18.0, 20.0, 19.0, 33.0, 33.0, 21.0, 23.0, 48.0, 62.0, 90.0, 123.0, 181.0, 219.0, 1255.0, 193.0, 139.0, 84.0, 65.0, 45.0, 41.0, 36.0, 24.0, 29.0, 10.0, 18.0, 19.0, 24.0, 17.0, 16.0, 10.0, 15.0, 4.0, 7.0, 5.0, 1.0, 4.0, 5.0, 1.0, 1.0, 1.0], "bins": [-6.1171875, -5.9530029296875, -5.788818359375, -5.6246337890625, -5.46044921875, -5.2962646484375, -5.132080078125, -4.9678955078125, -4.8037109375, -4.6395263671875, -4.475341796875, -4.3111572265625, -4.14697265625, -3.9827880859375, -3.818603515625, -3.6544189453125, -3.490234375, -3.3260498046875, -3.161865234375, -2.9976806640625, -2.83349609375, -2.6693115234375, -2.505126953125, -2.3409423828125, -2.1767578125, -2.0125732421875, -1.848388671875, -1.6842041015625, -1.52001953125, -1.3558349609375, -1.191650390625, -1.0274658203125, -0.86328125, -0.6990966796875, -0.534912109375, -0.3707275390625, -0.20654296875, -0.0423583984375, 0.121826171875, 0.2860107421875, 0.4501953125, 0.6143798828125, 0.778564453125, 0.9427490234375, 1.10693359375, 1.2711181640625, 1.435302734375, 1.5994873046875, 1.763671875, 1.9278564453125, 2.092041015625, 2.2562255859375, 2.42041015625, 2.5845947265625, 2.748779296875, 2.9129638671875, 3.0771484375, 3.2413330078125, 3.405517578125, 3.5697021484375, 3.73388671875, 3.8980712890625, 4.062255859375, 4.2264404296875, 4.390625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 6.0, 6.0, 3.0, 6.0, 5.0, 13.0, 10.0, 8.0, 15.0, 19.0, 23.0, 13.0, 22.0, 23.0, 35.0, 63.0, 93.0, 192.0, 447.0, 1875.0, 56830.0, 2863657.0, 216753.0, 4330.0, 565.0, 245.0, 109.0, 90.0, 39.0, 30.0, 24.0, 23.0, 22.0, 21.0, 11.0, 11.0, 10.0, 12.0, 8.0, 7.0, 8.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.609375, -17.981689453125, -17.35400390625, -16.726318359375, -16.0986328125, -15.470947265625, -14.84326171875, -14.215576171875, -13.587890625, -12.960205078125, -12.33251953125, -11.704833984375, -11.0771484375, -10.449462890625, -9.82177734375, -9.194091796875, -8.56640625, -7.938720703125, -7.31103515625, -6.683349609375, -6.0556640625, -5.427978515625, -4.80029296875, -4.172607421875, -3.544921875, -2.917236328125, -2.28955078125, -1.661865234375, -1.0341796875, -0.406494140625, 0.22119140625, 0.848876953125, 1.4765625, 2.104248046875, 2.73193359375, 3.359619140625, 3.9873046875, 4.614990234375, 5.24267578125, 5.870361328125, 6.498046875, 7.125732421875, 7.75341796875, 8.381103515625, 9.0087890625, 9.636474609375, 10.26416015625, 10.891845703125, 11.51953125, 12.147216796875, 12.77490234375, 13.402587890625, 14.0302734375, 14.657958984375, 15.28564453125, 15.913330078125, 16.541015625, 17.168701171875, 17.79638671875, 18.424072265625, 19.0517578125, 19.679443359375, 20.30712890625, 20.934814453125, 21.5625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 8.0, 465.0, 541.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.41594696044922, -22.870834350585938, -18.32572364807129, -13.780611991882324, -9.23550033569336, -4.690387725830078, -0.1452770233154297, 4.399833679199219, 8.9449462890625, 13.490057945251465, 18.03516960144043, 22.580280303955078, 27.12539291381836, 31.67050552368164, 36.215614318847656, 40.76072692871094, 45.30583953857422, 49.8509521484375, 54.39606475830078, 58.9411735534668, 63.48628616333008, 68.03140258789062, 72.57650756835938, 77.12162017822266, 81.66673278808594, 86.21184539794922, 90.7569580078125, 95.30207061767578, 99.84718322753906, 104.39228820800781, 108.9374008178711, 113.48251342773438, 118.02761840820312, 122.5727310180664, 127.11784362792969, 131.66294860839844, 136.20806884765625, 140.753173828125, 145.2982940673828, 149.84339904785156, 154.38851928710938, 158.93362426757812, 163.47874450683594, 168.0238494873047, 172.5689697265625, 177.11407470703125, 181.65919494628906, 186.2042999267578, 190.74940490722656, 195.2945098876953, 199.83963012695312, 204.38473510742188, 208.9298553466797, 213.47496032714844, 218.02008056640625, 222.565185546875, 227.11029052734375, 231.6553955078125, 236.2005157470703, 240.74562072753906, 245.29074096679688, 249.83584594726562, 254.38096618652344, 258.92608642578125, 263.47119140625]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 5.0, 6.0, 6.0, 9.0, 14.0, 16.0, 9.0, 16.0, 22.0, 19.0, 19.0, 25.0, 30.0, 27.0, 38.0, 33.0, 39.0, 50.0, 33.0, 43.0, 46.0, 36.0, 45.0, 43.0, 47.0, 35.0, 29.0, 25.0, 29.0, 30.0, 27.0, 23.0, 24.0, 19.0, 12.0, 16.0, 14.0, 8.0, 4.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.65017318725586, -16.026336669921875, -15.40250015258789, -14.778663635253906, -14.154827117919922, -13.530990600585938, -12.907153129577637, -12.283316612243652, -11.659480094909668, -11.035643577575684, -10.4118070602417, -9.787970542907715, -9.164133071899414, -8.54029655456543, -7.916460037231445, -7.292623519897461, -6.668787002563477, -6.044950485229492, -5.421113967895508, -4.797276973724365, -4.173440456390381, -3.5496039390563965, -2.925767183303833, -2.3019304275512695, -1.6780939102172852, -1.0542572736740112, -0.4304206371307373, 0.19341599941253662, 0.8172526359558105, 1.441089153289795, 2.0649259090423584, 2.688762664794922, 3.312601089477539, 3.9364376068115234, 4.560274124145508, 5.18411111831665, 5.807947635650635, 6.431784152984619, 7.055621147155762, 7.679457664489746, 8.30329418182373, 8.927130699157715, 9.5509672164917, 10.174803733825684, 10.798641204833984, 11.422477722167969, 12.046314239501953, 12.670150756835938, 13.293987274169922, 13.917823791503906, 14.54166030883789, 15.165496826171875, 15.78933334350586, 16.413169860839844, 17.037006378173828, 17.660842895507812, 18.284679412841797, 18.90851593017578, 19.532352447509766, 20.15618896484375, 20.780025482177734, 21.40386199951172, 22.027698516845703, 22.651535034179688, 23.275373458862305]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 5.0, 11.0, 13.0, 14.0, 18.0, 16.0, 21.0, 31.0, 31.0, 26.0, 34.0, 37.0, 38.0, 37.0, 36.0, 42.0, 42.0, 55.0, 51.0, 51.0, 47.0, 41.0, 36.0, 38.0, 29.0, 21.0, 30.0, 19.0, 24.0, 24.0, 16.0, 13.0, 11.0, 6.0, 10.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6904296875, -1.6367034912109375, -1.582977294921875, -1.5292510986328125, -1.47552490234375, -1.4217987060546875, -1.368072509765625, -1.3143463134765625, -1.2606201171875, -1.2068939208984375, -1.153167724609375, -1.0994415283203125, -1.04571533203125, -0.9919891357421875, -0.938262939453125, -0.8845367431640625, -0.830810546875, -0.7770843505859375, -0.723358154296875, -0.6696319580078125, -0.61590576171875, -0.5621795654296875, -0.508453369140625, -0.4547271728515625, -0.4010009765625, -0.3472747802734375, -0.293548583984375, -0.2398223876953125, -0.18609619140625, -0.1323699951171875, -0.078643798828125, -0.0249176025390625, 0.02880859375, 0.0825347900390625, 0.136260986328125, 0.1899871826171875, 0.24371337890625, 0.2974395751953125, 0.351165771484375, 0.4048919677734375, 0.4586181640625, 0.5123443603515625, 0.566070556640625, 0.6197967529296875, 0.67352294921875, 0.7272491455078125, 0.780975341796875, 0.8347015380859375, 0.888427734375, 0.9421539306640625, 0.995880126953125, 1.0496063232421875, 1.10333251953125, 1.1570587158203125, 1.210784912109375, 1.2645111083984375, 1.3182373046875, 1.3719635009765625, 1.425689697265625, 1.4794158935546875, 1.53314208984375, 1.5868682861328125, 1.640594482421875, 1.6943206787109375, 1.748046875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 0.0, 1.0, 5.0, 4.0, 3.0, 7.0, 8.0, 5.0, 13.0, 18.0, 28.0, 27.0, 33.0, 54.0, 68.0, 85.0, 102.0, 139.0, 223.0, 361.0, 653.0, 1132.0, 2535.0, 5772.0, 13823.0, 38998.0, 119575.0, 434581.0, 1677501.0, 1403893.0, 344708.0, 96997.0, 31763.0, 11769.0, 4662.0, 2222.0, 982.0, 538.0, 321.0, 203.0, 136.0, 83.0, 60.0, 47.0, 36.0, 36.0, 22.0, 12.0, 12.0, 10.0, 10.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-3.974609375, -3.846038818359375, -3.71746826171875, -3.588897705078125, -3.4603271484375, -3.331756591796875, -3.20318603515625, -3.074615478515625, -2.946044921875, -2.817474365234375, -2.68890380859375, -2.560333251953125, -2.4317626953125, -2.303192138671875, -2.17462158203125, -2.046051025390625, -1.91748046875, -1.788909912109375, -1.66033935546875, -1.531768798828125, -1.4031982421875, -1.274627685546875, -1.14605712890625, -1.017486572265625, -0.888916015625, -0.760345458984375, -0.63177490234375, -0.503204345703125, -0.3746337890625, -0.246063232421875, -0.11749267578125, 0.011077880859375, 0.1396484375, 0.268218994140625, 0.39678955078125, 0.525360107421875, 0.6539306640625, 0.782501220703125, 0.91107177734375, 1.039642333984375, 1.168212890625, 1.296783447265625, 1.42535400390625, 1.553924560546875, 1.6824951171875, 1.811065673828125, 1.93963623046875, 2.068206787109375, 2.19677734375, 2.325347900390625, 2.45391845703125, 2.582489013671875, 2.7110595703125, 2.839630126953125, 2.96820068359375, 3.096771240234375, 3.225341796875, 3.353912353515625, 3.48248291015625, 3.611053466796875, 3.7396240234375, 3.868194580078125, 3.99676513671875, 4.125335693359375, 4.25390625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 4.0, 7.0, 7.0, 12.0, 13.0, 16.0, 21.0, 42.0, 38.0, 63.0, 87.0, 131.0, 173.0, 257.0, 318.0, 403.0, 422.0, 475.0, 346.0, 284.0, 259.0, 218.0, 141.0, 93.0, 67.0, 46.0, 31.0, 34.0, 22.0, 19.0, 14.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.4453125, -5.25732421875, -5.0693359375, -4.88134765625, -4.693359375, -4.50537109375, -4.3173828125, -4.12939453125, -3.94140625, -3.75341796875, -3.5654296875, -3.37744140625, -3.189453125, -3.00146484375, -2.8134765625, -2.62548828125, -2.4375, -2.24951171875, -2.0615234375, -1.87353515625, -1.685546875, -1.49755859375, -1.3095703125, -1.12158203125, -0.93359375, -0.74560546875, -0.5576171875, -0.36962890625, -0.181640625, 0.00634765625, 0.1943359375, 0.38232421875, 0.5703125, 0.75830078125, 0.9462890625, 1.13427734375, 1.322265625, 1.51025390625, 1.6982421875, 1.88623046875, 2.07421875, 2.26220703125, 2.4501953125, 2.63818359375, 2.826171875, 3.01416015625, 3.2021484375, 3.39013671875, 3.578125, 3.76611328125, 3.9541015625, 4.14208984375, 4.330078125, 4.51806640625, 4.7060546875, 4.89404296875, 5.08203125, 5.27001953125, 5.4580078125, 5.64599609375, 5.833984375, 6.02197265625, 6.2099609375, 6.39794921875, 6.5859375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 8.0, 18.0, 25.0, 37.0, 77.0, 134.0, 283.0, 504.0, 963.0, 2450.0, 10944.0, 110816.0, 1562632.0, 2306261.0, 178106.0, 15855.0, 2998.0, 1063.0, 512.0, 299.0, 136.0, 82.0, 28.0, 26.0, 14.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.375, -10.921630859375, -10.46826171875, -10.014892578125, -9.5615234375, -9.108154296875, -8.65478515625, -8.201416015625, -7.748046875, -7.294677734375, -6.84130859375, -6.387939453125, -5.9345703125, -5.481201171875, -5.02783203125, -4.574462890625, -4.12109375, -3.667724609375, -3.21435546875, -2.760986328125, -2.3076171875, -1.854248046875, -1.40087890625, -0.947509765625, -0.494140625, -0.040771484375, 0.41259765625, 0.865966796875, 1.3193359375, 1.772705078125, 2.22607421875, 2.679443359375, 3.1328125, 3.586181640625, 4.03955078125, 4.492919921875, 4.9462890625, 5.399658203125, 5.85302734375, 6.306396484375, 6.759765625, 7.213134765625, 7.66650390625, 8.119873046875, 8.5732421875, 9.026611328125, 9.47998046875, 9.933349609375, 10.38671875, 10.840087890625, 11.29345703125, 11.746826171875, 12.2001953125, 12.653564453125, 13.10693359375, 13.560302734375, 14.013671875, 14.467041015625, 14.92041015625, 15.373779296875, 15.8271484375, 16.280517578125, 16.73388671875, 17.187255859375, 17.640625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 26.0, 68.0, 145.0, 204.0, 219.0, 191.0, 97.0, 40.0, 15.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.980743408203125, -20.317119598388672, -18.65349578857422, -16.989870071411133, -15.32624626159668, -13.662622451782227, -11.998997688293457, -10.335372924804688, -8.671749114990234, -7.008124828338623, -5.344500541687012, -3.6808762550354004, -2.017251968383789, -0.35362815856933594, 1.3099966049194336, 2.973621368408203, 4.637245178222656, 6.300869464874268, 7.964493751525879, 9.628118515014648, 11.291742324829102, 12.955366134643555, 14.618990898132324, 16.282615661621094, 17.946239471435547, 19.60986328125, 21.273487091064453, 22.93711280822754, 24.600736618041992, 26.264360427856445, 27.92798614501953, 29.591609954833984, 31.255233764648438, 32.91885757446289, 34.582481384277344, 36.2461051940918, 37.90972900390625, 39.57335662841797, 41.23698043823242, 42.900604248046875, 44.56422805786133, 46.22785186767578, 47.891475677490234, 49.55509948730469, 51.218727111816406, 52.882347106933594, 54.54597473144531, 56.209598541259766, 57.87322235107422, 59.53684616088867, 61.200469970703125, 62.86409378051758, 64.52771759033203, 66.19134521484375, 67.85496520996094, 69.51859283447266, 71.18222045898438, 72.8458480834961, 74.50946807861328, 76.173095703125, 77.83671569824219, 79.5003433227539, 81.1639633178711, 82.82759094238281, 84.4912109375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 5.0, 3.0, 5.0, 3.0, 12.0, 9.0, 8.0, 11.0, 16.0, 8.0, 19.0, 21.0, 23.0, 26.0, 28.0, 27.0, 33.0, 29.0, 40.0, 27.0, 39.0, 33.0, 33.0, 42.0, 41.0, 40.0, 22.0, 31.0, 40.0, 27.0, 38.0, 31.0, 25.0, 28.0, 21.0, 23.0, 23.0, 14.0, 16.0, 15.0, 13.0, 17.0, 8.0, 8.0, 5.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0], "bins": [-17.525236129760742, -16.97063636779785, -16.41603660583496, -15.86143684387207, -15.30683708190918, -14.752237319946289, -14.197637557983398, -13.643037796020508, -13.088438034057617, -12.533838272094727, -11.979238510131836, -11.424638748168945, -10.870038986206055, -10.315439224243164, -9.760839462280273, -9.206239700317383, -8.651639938354492, -8.097040176391602, -7.542440414428711, -6.98784065246582, -6.43324089050293, -5.878641128540039, -5.324041366577148, -4.769441604614258, -4.214841842651367, -3.6602420806884766, -3.105642318725586, -2.5510425567626953, -1.9964427947998047, -1.441843032836914, -0.8872432708740234, -0.3326435089111328, 0.221954345703125, 0.7765541076660156, 1.3311538696289062, 1.8857536315917969, 2.4403533935546875, 2.994953155517578, 3.5495529174804688, 4.104152679443359, 4.65875244140625, 5.213352203369141, 5.767951965332031, 6.322551727294922, 6.8771514892578125, 7.431751251220703, 7.986351013183594, 8.540950775146484, 9.095550537109375, 9.650150299072266, 10.204750061035156, 10.759349822998047, 11.313949584960938, 11.868549346923828, 12.423149108886719, 12.97774887084961, 13.5323486328125, 14.08694839477539, 14.641548156738281, 15.196147918701172, 15.750747680664062, 16.305347442626953, 16.859947204589844, 17.414546966552734, 17.969146728515625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 5.0, 13.0, 10.0, 9.0, 6.0, 16.0, 12.0, 33.0, 22.0, 30.0, 34.0, 33.0, 36.0, 42.0, 47.0, 47.0, 35.0, 50.0, 46.0, 57.0, 48.0, 51.0, 46.0, 39.0, 38.0, 28.0, 26.0, 24.0, 19.0, 15.0, 22.0, 10.0, 10.0, 10.0, 12.0, 3.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.67578125, -1.616180419921875, -1.55657958984375, -1.496978759765625, -1.4373779296875, -1.377777099609375, -1.31817626953125, -1.258575439453125, -1.198974609375, -1.139373779296875, -1.07977294921875, -1.020172119140625, -0.9605712890625, -0.900970458984375, -0.84136962890625, -0.781768798828125, -0.72216796875, -0.662567138671875, -0.60296630859375, -0.543365478515625, -0.4837646484375, -0.424163818359375, -0.36456298828125, -0.304962158203125, -0.245361328125, -0.185760498046875, -0.12615966796875, -0.066558837890625, -0.0069580078125, 0.052642822265625, 0.11224365234375, 0.171844482421875, 0.2314453125, 0.291046142578125, 0.35064697265625, 0.410247802734375, 0.4698486328125, 0.529449462890625, 0.58905029296875, 0.648651123046875, 0.708251953125, 0.767852783203125, 0.82745361328125, 0.887054443359375, 0.9466552734375, 1.006256103515625, 1.06585693359375, 1.125457763671875, 1.18505859375, 1.244659423828125, 1.30426025390625, 1.363861083984375, 1.4234619140625, 1.483062744140625, 1.54266357421875, 1.602264404296875, 1.661865234375, 1.721466064453125, 1.78106689453125, 1.840667724609375, 1.9002685546875, 1.959869384765625, 2.01947021484375, 2.079071044921875, 2.138671875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 1.0, 10.0, 17.0, 18.0, 28.0, 49.0, 62.0, 119.0, 192.0, 334.0, 523.0, 866.0, 1441.0, 2404.0, 3733.0, 5979.0, 9104.0, 13716.0, 20108.0, 28000.0, 38692.0, 51096.0, 64265.0, 77270.0, 88244.0, 95568.0, 97318.0, 91473.0, 82670.0, 70236.0, 57062.0, 44620.0, 32750.0, 23553.0, 16302.0, 11141.0, 7198.0, 4769.0, 2928.0, 1883.0, 1083.0, 692.0, 406.0, 242.0, 156.0, 92.0, 57.0, 28.0, 17.0, 22.0, 11.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.93017578125, -0.9021835327148438, -0.8741912841796875, -0.8461990356445312, -0.818206787109375, -0.7902145385742188, -0.7622222900390625, -0.7342300415039062, -0.70623779296875, -0.6782455444335938, -0.6502532958984375, -0.6222610473632812, -0.594268798828125, -0.5662765502929688, -0.5382843017578125, -0.5102920532226562, -0.4822998046875, -0.45430755615234375, -0.4263153076171875, -0.39832305908203125, -0.370330810546875, -0.34233856201171875, -0.3143463134765625, -0.28635406494140625, -0.25836181640625, -0.23036956787109375, -0.2023773193359375, -0.17438507080078125, -0.146392822265625, -0.11840057373046875, -0.0904083251953125, -0.06241607666015625, -0.034423828125, -0.00643157958984375, 0.0215606689453125, 0.04955291748046875, 0.077545166015625, 0.10553741455078125, 0.1335296630859375, 0.16152191162109375, 0.18951416015625, 0.21750640869140625, 0.2454986572265625, 0.27349090576171875, 0.301483154296875, 0.32947540283203125, 0.3574676513671875, 0.38545989990234375, 0.4134521484375, 0.44144439697265625, 0.4694366455078125, 0.49742889404296875, 0.525421142578125, 0.5534133911132812, 0.5814056396484375, 0.6093978881835938, 0.63739013671875, 0.6653823852539062, 0.6933746337890625, 0.7213668823242188, 0.749359130859375, 0.7773513793945312, 0.8053436279296875, 0.8333358764648438, 0.861328125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 9.0, 13.0, 9.0, 13.0, 11.0, 11.0, 19.0, 28.0, 24.0, 36.0, 32.0, 31.0, 26.0, 25.0, 37.0, 44.0, 43.0, 33.0, 38.0, 1056.0, 39.0, 41.0, 39.0, 35.0, 33.0, 36.0, 23.0, 32.0, 27.0, 23.0, 17.0, 15.0, 23.0, 18.0, 16.0, 9.0, 8.0, 9.0, 7.0, 7.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0], "bins": [-1.884765625, -1.8300323486328125, -1.775299072265625, -1.7205657958984375, -1.66583251953125, -1.6110992431640625, -1.556365966796875, -1.5016326904296875, -1.4468994140625, -1.3921661376953125, -1.337432861328125, -1.2826995849609375, -1.22796630859375, -1.1732330322265625, -1.118499755859375, -1.0637664794921875, -1.009033203125, -0.9542999267578125, -0.899566650390625, -0.8448333740234375, -0.79010009765625, -0.7353668212890625, -0.680633544921875, -0.6259002685546875, -0.5711669921875, -0.5164337158203125, -0.461700439453125, -0.4069671630859375, -0.35223388671875, -0.2975006103515625, -0.242767333984375, -0.1880340576171875, -0.13330078125, -0.0785675048828125, -0.023834228515625, 0.0308990478515625, 0.08563232421875, 0.1403656005859375, 0.195098876953125, 0.2498321533203125, 0.3045654296875, 0.3592987060546875, 0.414031982421875, 0.4687652587890625, 0.52349853515625, 0.5782318115234375, 0.632965087890625, 0.6876983642578125, 0.742431640625, 0.7971649169921875, 0.851898193359375, 0.9066314697265625, 0.96136474609375, 1.0160980224609375, 1.070831298828125, 1.1255645751953125, 1.1802978515625, 1.2350311279296875, 1.289764404296875, 1.3444976806640625, 1.39923095703125, 1.4539642333984375, 1.508697509765625, 1.5634307861328125, 1.6181640625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 8.0, 12.0, 21.0, 29.0, 45.0, 57.0, 67.0, 146.0, 183.0, 275.0, 413.0, 654.0, 894.0, 1316.0, 1881.0, 2765.0, 3942.0, 5894.0, 8354.0, 12361.0, 19337.0, 36388.0, 243777.0, 1638282.0, 51505.0, 23261.0, 14384.0, 9687.0, 6624.0, 4549.0, 3144.0, 2179.0, 1496.0, 1031.0, 694.0, 482.0, 303.0, 218.0, 140.0, 111.0, 61.0, 40.0, 31.0, 25.0, 24.0, 15.0, 10.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.724609375, -1.665496826171875, -1.60638427734375, -1.547271728515625, -1.4881591796875, -1.429046630859375, -1.36993408203125, -1.310821533203125, -1.251708984375, -1.192596435546875, -1.13348388671875, -1.074371337890625, -1.0152587890625, -0.956146240234375, -0.89703369140625, -0.837921142578125, -0.77880859375, -0.719696044921875, -0.66058349609375, -0.601470947265625, -0.5423583984375, -0.483245849609375, -0.42413330078125, -0.365020751953125, -0.305908203125, -0.246795654296875, -0.18768310546875, -0.128570556640625, -0.0694580078125, -0.010345458984375, 0.04876708984375, 0.107879638671875, 0.1669921875, 0.226104736328125, 0.28521728515625, 0.344329833984375, 0.4034423828125, 0.462554931640625, 0.52166748046875, 0.580780029296875, 0.639892578125, 0.699005126953125, 0.75811767578125, 0.817230224609375, 0.8763427734375, 0.935455322265625, 0.99456787109375, 1.053680419921875, 1.11279296875, 1.171905517578125, 1.23101806640625, 1.290130615234375, 1.3492431640625, 1.408355712890625, 1.46746826171875, 1.526580810546875, 1.585693359375, 1.644805908203125, 1.70391845703125, 1.763031005859375, 1.8221435546875, 1.881256103515625, 1.94036865234375, 1.999481201171875, 2.05859375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 3.0, 5.0, 1.0, 6.0, 7.0, 10.0, 14.0, 11.0, 17.0, 18.0, 24.0, 20.0, 30.0, 28.0, 15.0, 27.0, 32.0, 20.0, 24.0, 27.0, 22.0, 29.0, 28.0, 20.0, 24.0, 25.0, 24.0, 23.0, 28.0, 25.0, 28.0, 30.0, 27.0, 29.0, 33.0, 28.0, 29.0, 23.0, 27.0, 27.0, 21.0, 19.0, 14.0, 12.0, 13.0, 8.0, 14.0, 6.0, 6.0, 9.0, 1.0, 1.0, 1.0, 6.0, 3.0, 2.0, 3.0, 1.0], "bins": [-0.1497802734375, -0.1450958251953125, -0.140411376953125, -0.1357269287109375, -0.13104248046875, -0.1263580322265625, -0.121673583984375, -0.1169891357421875, -0.1123046875, -0.1076202392578125, -0.102935791015625, -0.0982513427734375, -0.09356689453125, -0.0888824462890625, -0.084197998046875, -0.0795135498046875, -0.0748291015625, -0.0701446533203125, -0.065460205078125, -0.0607757568359375, -0.05609130859375, -0.0514068603515625, -0.046722412109375, -0.0420379638671875, -0.037353515625, -0.0326690673828125, -0.027984619140625, -0.0233001708984375, -0.01861572265625, -0.0139312744140625, -0.009246826171875, -0.0045623779296875, 0.0001220703125, 0.0048065185546875, 0.009490966796875, 0.0141754150390625, 0.01885986328125, 0.0235443115234375, 0.028228759765625, 0.0329132080078125, 0.03759765625, 0.0422821044921875, 0.046966552734375, 0.0516510009765625, 0.05633544921875, 0.0610198974609375, 0.065704345703125, 0.0703887939453125, 0.0750732421875, 0.0797576904296875, 0.084442138671875, 0.0891265869140625, 0.09381103515625, 0.0984954833984375, 0.103179931640625, 0.1078643798828125, 0.112548828125, 0.1172332763671875, 0.121917724609375, 0.1266021728515625, 0.13128662109375, 0.1359710693359375, 0.140655517578125, 0.1453399658203125, 0.1500244140625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 5.0, 8.0, 12.0, 11.0, 6.0, 11.0, 10.0, 5.0, 14.0, 32.0, 35.0, 35.0, 45.0, 56.0, 53.0, 63.0, 70.0, 79.0, 86.0, 107.0, 81.0, 87.0, 145.0, 131.0, 153.0, 193.0, 289.0, 504.0, 2951.0, 395875.0, 638975.0, 5971.0, 553.0, 321.0, 201.0, 179.0, 131.0, 130.0, 104.0, 104.0, 92.0, 92.0, 81.0, 78.0, 66.0, 56.0, 38.0, 50.0, 38.0, 25.0, 24.0, 22.0, 12.0, 16.0, 14.0, 6.0, 4.0, 7.0, 12.0, 9.0, 3.0, 3.0], "bins": [-2.36328125, -2.28961181640625, -2.2159423828125, -2.14227294921875, -2.068603515625, -1.99493408203125, -1.9212646484375, -1.84759521484375, -1.77392578125, -1.70025634765625, -1.6265869140625, -1.55291748046875, -1.479248046875, -1.40557861328125, -1.3319091796875, -1.25823974609375, -1.1845703125, -1.11090087890625, -1.0372314453125, -0.96356201171875, -0.889892578125, -0.81622314453125, -0.7425537109375, -0.66888427734375, -0.59521484375, -0.52154541015625, -0.4478759765625, -0.37420654296875, -0.300537109375, -0.22686767578125, -0.1531982421875, -0.07952880859375, -0.005859375, 0.06781005859375, 0.1414794921875, 0.21514892578125, 0.288818359375, 0.36248779296875, 0.4361572265625, 0.50982666015625, 0.58349609375, 0.65716552734375, 0.7308349609375, 0.80450439453125, 0.878173828125, 0.95184326171875, 1.0255126953125, 1.09918212890625, 1.1728515625, 1.24652099609375, 1.3201904296875, 1.39385986328125, 1.467529296875, 1.54119873046875, 1.6148681640625, 1.68853759765625, 1.76220703125, 1.83587646484375, 1.9095458984375, 1.98321533203125, 2.056884765625, 2.13055419921875, 2.2042236328125, 2.27789306640625, 2.3515625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 16.0, 73.0, 303.0, 501.0, 93.0, 18.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.023780345916748, -4.807290554046631, -4.590800762176514, -4.3743109703063965, -4.157821178436279, -3.941331386566162, -3.724841356277466, -3.5083515644073486, -3.2918617725372314, -3.0753719806671143, -2.858882188796997, -2.642392158508301, -2.4259023666381836, -2.2094125747680664, -1.9929227828979492, -1.776432991027832, -1.5599431991577148, -1.3434534072875977, -1.1269636154174805, -0.9104737043380737, -0.6939839124679565, -0.47749412059783936, -0.2610042095184326, -0.04451441764831543, 0.17197537422180176, 0.38846519589424133, 0.6049550175666809, 0.8214448690414429, 1.03793466091156, 1.2544244527816772, 1.470914363861084, 1.6874041557312012, 1.9038934707641602, 2.1203832626342773, 2.3368730545043945, 2.5533628463745117, 2.769852638244629, 2.986342430114746, 3.2028324604034424, 3.4193222522735596, 3.6358120441436768, 3.852301836013794, 4.06879186630249, 4.285281658172607, 4.501771450042725, 4.718261241912842, 4.934751033782959, 5.151240825653076, 5.367730617523193, 5.5842204093933105, 5.800710201263428, 6.017199993133545, 6.233689785003662, 6.450179576873779, 6.666669845581055, 6.883159637451172, 7.099649429321289, 7.316139221191406, 7.532629013061523, 7.749118804931641, 7.965608596801758, 8.182098388671875, 8.398588180541992, 8.61507797241211, 8.831567764282227]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 10.0, 10.0, 12.0, 12.0, 19.0, 24.0, 16.0, 25.0, 23.0, 32.0, 27.0, 40.0, 41.0, 49.0, 45.0, 61.0, 49.0, 41.0, 48.0, 46.0, 51.0, 41.0, 37.0, 29.0, 34.0, 36.0, 26.0, 28.0, 14.0, 14.0, 15.0, 10.0, 4.0, 11.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7742832899093628, -1.7017157077789307, -1.629148244857788, -1.556580662727356, -1.4840131998062134, -1.4114456176757812, -1.3388781547546387, -1.2663105726242065, -1.1937429904937744, -1.1211754083633423, -1.0486079454421997, -0.9760403633117676, -0.903472900390625, -0.8309053182601929, -0.7583377957344055, -0.6857702732086182, -0.6132028102874756, -0.5406352877616882, -0.4680677652359009, -0.39550021290779114, -0.3229326903820038, -0.25036516785621643, -0.1777976155281067, -0.10523009300231934, -0.03266257047653198, 0.03990495949983597, 0.11247248947620392, 0.18504002690315247, 0.2576075494289398, 0.3301750719547272, 0.4027426242828369, 0.47531014680862427, 0.5478775501251221, 0.6204450726509094, 0.6930125951766968, 0.7655801773071289, 0.8381476402282715, 0.9107152223587036, 0.983282744884491, 1.0558502674102783, 1.128417730331421, 1.200985312461853, 1.2735527753829956, 1.3461203575134277, 1.4186878204345703, 1.4912554025650024, 1.5638229846954346, 1.6363904476165771, 1.7089580297470093, 1.7815256118774414, 1.854093074798584, 1.9266606569290161, 1.9992281198501587, 2.071795701980591, 2.1443631649017334, 2.216930866241455, 2.2894983291625977, 2.3620657920837402, 2.434633493423462, 2.5072009563446045, 2.579768419265747, 2.6523358821868896, 2.7249035835266113, 2.797471046447754, 2.8700385093688965]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 2.0, 6.0, 7.0, 8.0, 13.0, 10.0, 13.0, 18.0, 19.0, 22.0, 23.0, 23.0, 34.0, 24.0, 35.0, 32.0, 31.0, 41.0, 45.0, 49.0, 50.0, 48.0, 36.0, 46.0, 48.0, 44.0, 31.0, 20.0, 37.0, 19.0, 33.0, 21.0, 18.0, 16.0, 15.0, 9.0, 9.0, 14.0, 6.0, 10.0, 1.0, 4.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.740234375, -1.685638427734375, -1.63104248046875, -1.576446533203125, -1.5218505859375, -1.467254638671875, -1.41265869140625, -1.358062744140625, -1.303466796875, -1.248870849609375, -1.19427490234375, -1.139678955078125, -1.0850830078125, -1.030487060546875, -0.97589111328125, -0.921295166015625, -0.86669921875, -0.812103271484375, -0.75750732421875, -0.702911376953125, -0.6483154296875, -0.593719482421875, -0.53912353515625, -0.484527587890625, -0.429931640625, -0.375335693359375, -0.32073974609375, -0.266143798828125, -0.2115478515625, -0.156951904296875, -0.10235595703125, -0.047760009765625, 0.0068359375, 0.061431884765625, 0.11602783203125, 0.170623779296875, 0.2252197265625, 0.279815673828125, 0.33441162109375, 0.389007568359375, 0.443603515625, 0.498199462890625, 0.55279541015625, 0.607391357421875, 0.6619873046875, 0.716583251953125, 0.77117919921875, 0.825775146484375, 0.88037109375, 0.934967041015625, 0.98956298828125, 1.044158935546875, 1.0987548828125, 1.153350830078125, 1.20794677734375, 1.262542724609375, 1.317138671875, 1.371734619140625, 1.42633056640625, 1.480926513671875, 1.5355224609375, 1.590118408203125, 1.64471435546875, 1.699310302734375, 1.75390625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 4.0, 9.0, 15.0, 29.0, 16.0, 33.0, 54.0, 65.0, 113.0, 196.0, 285.0, 422.0, 779.0, 1291.0, 2457.0, 4632.0, 8530.0, 16052.0, 31045.0, 58751.0, 109566.0, 181046.0, 224453.0, 178715.0, 106995.0, 58563.0, 30108.0, 15567.0, 8350.0, 4533.0, 2436.0, 1421.0, 756.0, 469.0, 275.0, 180.0, 105.0, 78.0, 51.0, 29.0, 26.0, 16.0, 14.0, 12.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.81640625, -1.7621612548828125, -1.707916259765625, -1.6536712646484375, -1.59942626953125, -1.5451812744140625, -1.490936279296875, -1.4366912841796875, -1.3824462890625, -1.3282012939453125, -1.273956298828125, -1.2197113037109375, -1.16546630859375, -1.1112213134765625, -1.056976318359375, -1.0027313232421875, -0.948486328125, -0.8942413330078125, -0.839996337890625, -0.7857513427734375, -0.73150634765625, -0.6772613525390625, -0.623016357421875, -0.5687713623046875, -0.5145263671875, -0.4602813720703125, -0.406036376953125, -0.3517913818359375, -0.29754638671875, -0.2433013916015625, -0.189056396484375, -0.1348114013671875, -0.08056640625, -0.0263214111328125, 0.027923583984375, 0.0821685791015625, 0.13641357421875, 0.1906585693359375, 0.244903564453125, 0.2991485595703125, 0.3533935546875, 0.4076385498046875, 0.461883544921875, 0.5161285400390625, 0.57037353515625, 0.6246185302734375, 0.678863525390625, 0.7331085205078125, 0.787353515625, 0.8415985107421875, 0.895843505859375, 0.9500885009765625, 1.00433349609375, 1.0585784912109375, 1.112823486328125, 1.1670684814453125, 1.2213134765625, 1.2755584716796875, 1.329803466796875, 1.3840484619140625, 1.43829345703125, 1.4925384521484375, 1.546783447265625, 1.6010284423828125, 1.6552734375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 1.0, 1.0, 2.0, 5.0, 10.0, 4.0, 10.0, 11.0, 13.0, 11.0, 17.0, 16.0, 16.0, 15.0, 31.0, 30.0, 19.0, 31.0, 45.0, 54.0, 53.0, 78.0, 120.0, 212.0, 1346.0, 261.0, 132.0, 88.0, 68.0, 52.0, 34.0, 28.0, 34.0, 22.0, 23.0, 37.0, 21.0, 21.0, 15.0, 24.0, 13.0, 8.0, 6.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0], "bins": [-7.63671875, -7.42864990234375, -7.2205810546875, -7.01251220703125, -6.804443359375, -6.59637451171875, -6.3883056640625, -6.18023681640625, -5.97216796875, -5.76409912109375, -5.5560302734375, -5.34796142578125, -5.139892578125, -4.93182373046875, -4.7237548828125, -4.51568603515625, -4.3076171875, -4.09954833984375, -3.8914794921875, -3.68341064453125, -3.475341796875, -3.26727294921875, -3.0592041015625, -2.85113525390625, -2.64306640625, -2.43499755859375, -2.2269287109375, -2.01885986328125, -1.810791015625, -1.60272216796875, -1.3946533203125, -1.18658447265625, -0.978515625, -0.77044677734375, -0.5623779296875, -0.35430908203125, -0.146240234375, 0.06182861328125, 0.2698974609375, 0.47796630859375, 0.68603515625, 0.89410400390625, 1.1021728515625, 1.31024169921875, 1.518310546875, 1.72637939453125, 1.9344482421875, 2.14251708984375, 2.3505859375, 2.55865478515625, 2.7667236328125, 2.97479248046875, 3.182861328125, 3.39093017578125, 3.5989990234375, 3.80706787109375, 4.01513671875, 4.22320556640625, 4.4312744140625, 4.63934326171875, 4.847412109375, 5.05548095703125, 5.2635498046875, 5.47161865234375, 5.6796875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 8.0, 4.0, 10.0, 11.0, 18.0, 15.0, 19.0, 27.0, 29.0, 22.0, 31.0, 49.0, 42.0, 78.0, 159.0, 343.0, 799.0, 2366.0, 12366.0, 143860.0, 2410730.0, 538098.0, 29996.0, 4331.0, 1171.0, 462.0, 222.0, 110.0, 62.0, 43.0, 39.0, 24.0, 29.0, 19.0, 19.0, 18.0, 13.0, 12.0, 12.0, 8.0, 6.0, 8.0, 8.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-9.6171875, -9.303955078125, -8.99072265625, -8.677490234375, -8.3642578125, -8.051025390625, -7.73779296875, -7.424560546875, -7.111328125, -6.798095703125, -6.48486328125, -6.171630859375, -5.8583984375, -5.545166015625, -5.23193359375, -4.918701171875, -4.60546875, -4.292236328125, -3.97900390625, -3.665771484375, -3.3525390625, -3.039306640625, -2.72607421875, -2.412841796875, -2.099609375, -1.786376953125, -1.47314453125, -1.159912109375, -0.8466796875, -0.533447265625, -0.22021484375, 0.093017578125, 0.40625, 0.719482421875, 1.03271484375, 1.345947265625, 1.6591796875, 1.972412109375, 2.28564453125, 2.598876953125, 2.912109375, 3.225341796875, 3.53857421875, 3.851806640625, 4.1650390625, 4.478271484375, 4.79150390625, 5.104736328125, 5.41796875, 5.731201171875, 6.04443359375, 6.357666015625, 6.6708984375, 6.984130859375, 7.29736328125, 7.610595703125, 7.923828125, 8.237060546875, 8.55029296875, 8.863525390625, 9.1767578125, 9.489990234375, 9.80322265625, 10.116455078125, 10.4296875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 56.0, 305.0, 434.0, 185.0, 26.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.64113235473633, -31.107921600341797, -29.574710845947266, -28.041500091552734, -26.508289337158203, -24.975078582763672, -23.441865921020508, -21.908655166625977, -20.375444412231445, -18.842233657836914, -17.309022903442383, -15.775811195373535, -14.242600440979004, -12.709389686584473, -11.176177978515625, -9.642967224121094, -8.109756469726562, -6.576545715332031, -5.043334484100342, -3.5101232528686523, -1.976912498474121, -0.44370174407958984, 1.0895099639892578, 2.622720718383789, 4.15593147277832, 5.689142227172852, 7.222353458404541, 8.75556468963623, 10.288775444030762, 11.821986198425293, 13.35519790649414, 14.888408660888672, 16.42162322998047, 17.954833984375, 19.48804473876953, 21.021255493164062, 22.554466247558594, 24.087677001953125, 25.62088966369629, 27.15410041809082, 28.68731117248535, 30.220521926879883, 31.753732681274414, 33.28694534301758, 34.82015609741211, 36.35336685180664, 37.88657760620117, 39.4197883605957, 40.952999114990234, 42.486209869384766, 44.0194206237793, 45.55263137817383, 47.08584213256836, 48.61905288696289, 50.15226745605469, 51.68547821044922, 53.21868896484375, 54.75189971923828, 56.28511047363281, 57.818321228027344, 59.351531982421875, 60.884742736816406, 62.41795349121094, 63.95116424560547, 65.484375]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 7.0, 5.0, 6.0, 7.0, 11.0, 14.0, 12.0, 14.0, 22.0, 29.0, 23.0, 26.0, 41.0, 29.0, 41.0, 27.0, 46.0, 41.0, 56.0, 34.0, 33.0, 50.0, 45.0, 40.0, 43.0, 49.0, 31.0, 25.0, 28.0, 20.0, 15.0, 17.0, 26.0, 13.0, 12.0, 13.0, 7.0, 9.0, 12.0, 9.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.126609802246094, -22.414621353149414, -21.702632904052734, -20.990644454956055, -20.278656005859375, -19.566667556762695, -18.854679107666016, -18.142690658569336, -17.430702209472656, -16.718713760375977, -16.006725311279297, -15.294736862182617, -14.582748413085938, -13.870759963989258, -13.158771514892578, -12.446783065795898, -11.734794616699219, -11.022806167602539, -10.31081771850586, -9.59882926940918, -8.8868408203125, -8.17485237121582, -7.462863922119141, -6.750875473022461, -6.038887023925781, -5.326898574829102, -4.614910125732422, -3.902921676635742, -3.1909332275390625, -2.478944778442383, -1.7669563293457031, -1.0549678802490234, -0.34297943115234375, 0.36900901794433594, 1.0809974670410156, 1.7929859161376953, 2.504974365234375, 3.2169628143310547, 3.9289512634277344, 4.640939712524414, 5.352928161621094, 6.064916610717773, 6.776905059814453, 7.488893508911133, 8.200881958007812, 8.912870407104492, 9.624858856201172, 10.336847305297852, 11.048835754394531, 11.760824203491211, 12.47281265258789, 13.18480110168457, 13.89678955078125, 14.60877799987793, 15.32076644897461, 16.03275489807129, 16.74474334716797, 17.45673179626465, 18.168720245361328, 18.880708694458008, 19.592697143554688, 20.304685592651367, 21.016674041748047, 21.728662490844727, 22.440650939941406]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 6.0, 9.0, 7.0, 19.0, 20.0, 11.0, 24.0, 19.0, 15.0, 23.0, 27.0, 36.0, 37.0, 41.0, 38.0, 43.0, 37.0, 49.0, 43.0, 49.0, 51.0, 41.0, 49.0, 43.0, 34.0, 38.0, 25.0, 21.0, 21.0, 18.0, 22.0, 16.0, 13.0, 9.0, 9.0, 7.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7197265625, -1.6593475341796875, -1.598968505859375, -1.5385894775390625, -1.47821044921875, -1.4178314208984375, -1.357452392578125, -1.2970733642578125, -1.2366943359375, -1.1763153076171875, -1.115936279296875, -1.0555572509765625, -0.99517822265625, -0.9347991943359375, -0.874420166015625, -0.8140411376953125, -0.753662109375, -0.6932830810546875, -0.632904052734375, -0.5725250244140625, -0.51214599609375, -0.4517669677734375, -0.391387939453125, -0.3310089111328125, -0.2706298828125, -0.2102508544921875, -0.149871826171875, -0.0894927978515625, -0.02911376953125, 0.0312652587890625, 0.091644287109375, 0.1520233154296875, 0.21240234375, 0.2727813720703125, 0.333160400390625, 0.3935394287109375, 0.45391845703125, 0.5142974853515625, 0.574676513671875, 0.6350555419921875, 0.6954345703125, 0.7558135986328125, 0.816192626953125, 0.8765716552734375, 0.93695068359375, 0.9973297119140625, 1.057708740234375, 1.1180877685546875, 1.178466796875, 1.2388458251953125, 1.299224853515625, 1.3596038818359375, 1.41998291015625, 1.4803619384765625, 1.540740966796875, 1.6011199951171875, 1.6614990234375, 1.7218780517578125, 1.782257080078125, 1.8426361083984375, 1.90301513671875, 1.9633941650390625, 2.023773193359375, 2.0841522216796875, 2.14453125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 6.0, 7.0, 15.0, 17.0, 17.0, 14.0, 26.0, 28.0, 29.0, 41.0, 37.0, 48.0, 49.0, 53.0, 68.0, 132.0, 293.0, 1008.0, 4345.0, 23140.0, 156361.0, 1592033.0, 2158578.0, 218423.0, 31180.0, 5942.0, 1309.0, 422.0, 160.0, 108.0, 61.0, 67.0, 50.0, 36.0, 30.0, 24.0, 19.0, 16.0, 16.0, 10.0, 11.0, 10.0, 9.0, 12.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.40234375, -6.18218994140625, -5.9620361328125, -5.74188232421875, -5.521728515625, -5.30157470703125, -5.0814208984375, -4.86126708984375, -4.64111328125, -4.42095947265625, -4.2008056640625, -3.98065185546875, -3.760498046875, -3.54034423828125, -3.3201904296875, -3.10003662109375, -2.8798828125, -2.65972900390625, -2.4395751953125, -2.21942138671875, -1.999267578125, -1.77911376953125, -1.5589599609375, -1.33880615234375, -1.11865234375, -0.89849853515625, -0.6783447265625, -0.45819091796875, -0.238037109375, -0.01788330078125, 0.2022705078125, 0.42242431640625, 0.642578125, 0.86273193359375, 1.0828857421875, 1.30303955078125, 1.523193359375, 1.74334716796875, 1.9635009765625, 2.18365478515625, 2.40380859375, 2.62396240234375, 2.8441162109375, 3.06427001953125, 3.284423828125, 3.50457763671875, 3.7247314453125, 3.94488525390625, 4.1650390625, 4.38519287109375, 4.6053466796875, 4.82550048828125, 5.045654296875, 5.26580810546875, 5.4859619140625, 5.70611572265625, 5.92626953125, 6.14642333984375, 6.3665771484375, 6.58673095703125, 6.806884765625, 7.02703857421875, 7.2471923828125, 7.46734619140625, 7.6875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 12.0, 10.0, 27.0, 26.0, 50.0, 58.0, 66.0, 123.0, 156.0, 176.0, 322.0, 391.0, 450.0, 450.0, 454.0, 355.0, 270.0, 194.0, 146.0, 107.0, 70.0, 51.0, 37.0, 22.0, 12.0, 11.0, 6.0, 7.0, 9.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.4609375, -7.2608642578125, -7.060791015625, -6.8607177734375, -6.66064453125, -6.4605712890625, -6.260498046875, -6.0604248046875, -5.8603515625, -5.6602783203125, -5.460205078125, -5.2601318359375, -5.06005859375, -4.8599853515625, -4.659912109375, -4.4598388671875, -4.259765625, -4.0596923828125, -3.859619140625, -3.6595458984375, -3.45947265625, -3.2593994140625, -3.059326171875, -2.8592529296875, -2.6591796875, -2.4591064453125, -2.259033203125, -2.0589599609375, -1.85888671875, -1.6588134765625, -1.458740234375, -1.2586669921875, -1.05859375, -0.8585205078125, -0.658447265625, -0.4583740234375, -0.25830078125, -0.0582275390625, 0.141845703125, 0.3419189453125, 0.5419921875, 0.7420654296875, 0.942138671875, 1.1422119140625, 1.34228515625, 1.5423583984375, 1.742431640625, 1.9425048828125, 2.142578125, 2.3426513671875, 2.542724609375, 2.7427978515625, 2.94287109375, 3.1429443359375, 3.343017578125, 3.5430908203125, 3.7431640625, 3.9432373046875, 4.143310546875, 4.3433837890625, 4.54345703125, 4.7435302734375, 4.943603515625, 5.1436767578125, 5.34375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 10.0, 16.0, 22.0, 45.0, 71.0, 99.0, 156.0, 292.0, 491.0, 1023.0, 2843.0, 13087.0, 88672.0, 714329.0, 2645138.0, 632422.0, 79042.0, 11817.0, 2599.0, 966.0, 448.0, 274.0, 140.0, 105.0, 64.0, 35.0, 26.0, 20.0, 9.0, 8.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.1171875, -13.759521484375, -13.40185546875, -13.044189453125, -12.6865234375, -12.328857421875, -11.97119140625, -11.613525390625, -11.255859375, -10.898193359375, -10.54052734375, -10.182861328125, -9.8251953125, -9.467529296875, -9.10986328125, -8.752197265625, -8.39453125, -8.036865234375, -7.67919921875, -7.321533203125, -6.9638671875, -6.606201171875, -6.24853515625, -5.890869140625, -5.533203125, -5.175537109375, -4.81787109375, -4.460205078125, -4.1025390625, -3.744873046875, -3.38720703125, -3.029541015625, -2.671875, -2.314208984375, -1.95654296875, -1.598876953125, -1.2412109375, -0.883544921875, -0.52587890625, -0.168212890625, 0.189453125, 0.547119140625, 0.90478515625, 1.262451171875, 1.6201171875, 1.977783203125, 2.33544921875, 2.693115234375, 3.05078125, 3.408447265625, 3.76611328125, 4.123779296875, 4.4814453125, 4.839111328125, 5.19677734375, 5.554443359375, 5.912109375, 6.269775390625, 6.62744140625, 6.985107421875, 7.3427734375, 7.700439453125, 8.05810546875, 8.415771484375, 8.7734375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [4.0, 19.0, 76.0, 195.0, 313.0, 268.0, 107.0, 33.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.507125854492188, -9.842357635498047, -7.17758846282959, -4.512819766998291, -1.8480510711669922, 0.8167171478271484, 3.4814863204956055, 6.1462554931640625, 8.811023712158203, 11.475791931152344, 14.1405611038208, 16.805330276489258, 19.4700984954834, 22.13486671447754, 24.799636840820312, 27.464405059814453, 30.129173278808594, 32.793941497802734, 35.458709716796875, 38.123477935791016, 40.788246154785156, 43.45301818847656, 46.1177864074707, 48.782554626464844, 51.447322845458984, 54.112091064453125, 56.776859283447266, 59.441627502441406, 62.10639953613281, 64.77116394042969, 67.4359359741211, 70.1007080078125, 72.76547241210938, 75.43024444580078, 78.09500885009766, 80.75978088378906, 83.42454528808594, 86.08931732177734, 88.75408172607422, 91.41885375976562, 94.0836181640625, 96.7483901977539, 99.41315460205078, 102.07792663574219, 104.74269104003906, 107.40746307373047, 110.07222747802734, 112.73699951171875, 115.40177154541016, 118.06654357910156, 120.73130798339844, 123.39608001708984, 126.06084442138672, 128.72561645507812, 131.390380859375, 134.05514526367188, 136.7199249267578, 139.3846893310547, 142.04946899414062, 144.7142333984375, 147.37899780273438, 150.04376220703125, 152.7085418701172, 155.37330627441406, 158.03807067871094]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 5.0, 5.0, 9.0, 2.0, 10.0, 12.0, 8.0, 11.0, 19.0, 12.0, 15.0, 24.0, 31.0, 20.0, 29.0, 28.0, 30.0, 35.0, 34.0, 38.0, 29.0, 34.0, 36.0, 42.0, 45.0, 37.0, 36.0, 36.0, 34.0, 44.0, 42.0, 29.0, 32.0, 24.0, 26.0, 16.0, 17.0, 16.0, 9.0, 8.0, 6.0, 9.0, 4.0, 5.0, 3.0, 0.0, 9.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-18.418704986572266, -17.847375869750977, -17.27604866027832, -16.70471954345703, -16.133392333984375, -15.562063217163086, -14.990735054016113, -14.41940689086914, -13.848078727722168, -13.276750564575195, -12.705422401428223, -12.13409423828125, -11.562765121459961, -10.991437911987305, -10.420108795166016, -9.848780632019043, -9.27745246887207, -8.706124305725098, -8.134796142578125, -7.563467502593994, -6.9921393394470215, -6.420811176300049, -5.849482536315918, -5.278154373168945, -4.706826210021973, -4.135498046875, -3.5641696453094482, -2.9928412437438965, -2.421513080596924, -1.8501849174499512, -1.2788565158843994, -0.7075281143188477, -0.1362018585205078, 0.4351264238357544, 1.0064547061920166, 1.5777829885482788, 2.149111270904541, 2.7204394340515137, 3.2917678356170654, 3.863096237182617, 4.43442440032959, 5.0057525634765625, 5.577080726623535, 6.148409366607666, 6.719737529754639, 7.291065692901611, 7.862394332885742, 8.433722496032715, 9.005050659179688, 9.57637882232666, 10.147706985473633, 10.719035148620605, 11.290363311767578, 11.861692428588867, 12.43302059173584, 13.004348754882812, 13.575676918029785, 14.147005081176758, 14.71833324432373, 15.289661407470703, 15.860990524291992, 16.43231773376465, 17.003646850585938, 17.574974060058594, 18.146303176879883]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 5.0, 6.0, 4.0, 9.0, 8.0, 8.0, 10.0, 8.0, 14.0, 16.0, 9.0, 19.0, 29.0, 29.0, 28.0, 28.0, 23.0, 31.0, 42.0, 37.0, 40.0, 44.0, 37.0, 37.0, 45.0, 41.0, 41.0, 35.0, 34.0, 41.0, 39.0, 29.0, 24.0, 14.0, 19.0, 17.0, 17.0, 8.0, 17.0, 12.0, 13.0, 7.0, 6.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.6806640625, -1.6252288818359375, -1.569793701171875, -1.5143585205078125, -1.45892333984375, -1.4034881591796875, -1.348052978515625, -1.2926177978515625, -1.2371826171875, -1.1817474365234375, -1.126312255859375, -1.0708770751953125, -1.01544189453125, -0.9600067138671875, -0.904571533203125, -0.8491363525390625, -0.793701171875, -0.7382659912109375, -0.682830810546875, -0.6273956298828125, -0.57196044921875, -0.5165252685546875, -0.461090087890625, -0.4056549072265625, -0.3502197265625, -0.2947845458984375, -0.239349365234375, -0.1839141845703125, -0.12847900390625, -0.0730438232421875, -0.017608642578125, 0.0378265380859375, 0.09326171875, 0.1486968994140625, 0.204132080078125, 0.2595672607421875, 0.31500244140625, 0.3704376220703125, 0.425872802734375, 0.4813079833984375, 0.5367431640625, 0.5921783447265625, 0.647613525390625, 0.7030487060546875, 0.75848388671875, 0.8139190673828125, 0.869354248046875, 0.9247894287109375, 0.980224609375, 1.0356597900390625, 1.091094970703125, 1.1465301513671875, 1.20196533203125, 1.2574005126953125, 1.312835693359375, 1.3682708740234375, 1.4237060546875, 1.4791412353515625, 1.534576416015625, 1.5900115966796875, 1.64544677734375, 1.7008819580078125, 1.756317138671875, 1.8117523193359375, 1.8671875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 8.0, 12.0, 15.0, 15.0, 43.0, 45.0, 96.0, 160.0, 275.0, 376.0, 567.0, 896.0, 1410.0, 2193.0, 3236.0, 4861.0, 7227.0, 10199.0, 14371.0, 19745.0, 25782.0, 33804.0, 42565.0, 51485.0, 60777.0, 69601.0, 75672.0, 80512.0, 82105.0, 78250.0, 72502.0, 64892.0, 55658.0, 46639.0, 37375.0, 29033.0, 22196.0, 16358.0, 11863.0, 8460.0, 5887.0, 3913.0, 2572.0, 1776.0, 1174.0, 717.0, 477.0, 306.0, 183.0, 94.0, 83.0, 40.0, 33.0, 18.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.802734375, -0.7770233154296875, -0.751312255859375, -0.7256011962890625, -0.69989013671875, -0.6741790771484375, -0.648468017578125, -0.6227569580078125, -0.5970458984375, -0.5713348388671875, -0.545623779296875, -0.5199127197265625, -0.49420166015625, -0.4684906005859375, -0.442779541015625, -0.4170684814453125, -0.391357421875, -0.3656463623046875, -0.339935302734375, -0.3142242431640625, -0.28851318359375, -0.2628021240234375, -0.237091064453125, -0.2113800048828125, -0.1856689453125, -0.1599578857421875, -0.134246826171875, -0.1085357666015625, -0.08282470703125, -0.0571136474609375, -0.031402587890625, -0.0056915283203125, 0.02001953125, 0.0457305908203125, 0.071441650390625, 0.0971527099609375, 0.12286376953125, 0.1485748291015625, 0.174285888671875, 0.1999969482421875, 0.2257080078125, 0.2514190673828125, 0.277130126953125, 0.3028411865234375, 0.32855224609375, 0.3542633056640625, 0.379974365234375, 0.4056854248046875, 0.431396484375, 0.4571075439453125, 0.482818603515625, 0.5085296630859375, 0.53424072265625, 0.5599517822265625, 0.585662841796875, 0.6113739013671875, 0.6370849609375, 0.6627960205078125, 0.688507080078125, 0.7142181396484375, 0.73992919921875, 0.7656402587890625, 0.791351318359375, 0.8170623779296875, 0.8427734375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 7.0, 9.0, 10.0, 9.0, 12.0, 13.0, 21.0, 26.0, 30.0, 24.0, 29.0, 34.0, 45.0, 36.0, 32.0, 36.0, 35.0, 41.0, 1067.0, 42.0, 48.0, 34.0, 39.0, 42.0, 37.0, 39.0, 27.0, 30.0, 17.0, 29.0, 24.0, 25.0, 12.0, 6.0, 8.0, 8.0, 6.0, 10.0, 7.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.013671875, -1.9526214599609375, -1.891571044921875, -1.8305206298828125, -1.76947021484375, -1.7084197998046875, -1.647369384765625, -1.5863189697265625, -1.5252685546875, -1.4642181396484375, -1.403167724609375, -1.3421173095703125, -1.28106689453125, -1.2200164794921875, -1.158966064453125, -1.0979156494140625, -1.036865234375, -0.9758148193359375, -0.914764404296875, -0.8537139892578125, -0.79266357421875, -0.7316131591796875, -0.670562744140625, -0.6095123291015625, -0.5484619140625, -0.4874114990234375, -0.426361083984375, -0.3653106689453125, -0.30426025390625, -0.2432098388671875, -0.182159423828125, -0.1211090087890625, -0.06005859375, 0.0009918212890625, 0.062042236328125, 0.1230926513671875, 0.18414306640625, 0.2451934814453125, 0.306243896484375, 0.3672943115234375, 0.4283447265625, 0.4893951416015625, 0.550445556640625, 0.6114959716796875, 0.67254638671875, 0.7335968017578125, 0.794647216796875, 0.8556976318359375, 0.916748046875, 0.9777984619140625, 1.038848876953125, 1.0998992919921875, 1.16094970703125, 1.2220001220703125, 1.283050537109375, 1.3441009521484375, 1.4051513671875, 1.4662017822265625, 1.527252197265625, 1.5883026123046875, 1.64935302734375, 1.7104034423828125, 1.771453857421875, 1.8325042724609375, 1.8935546875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 10.0, 14.0, 24.0, 17.0, 33.0, 59.0, 96.0, 139.0, 188.0, 270.0, 455.0, 689.0, 1092.0, 1524.0, 2286.0, 3507.0, 4969.0, 7331.0, 10711.0, 16732.0, 28303.0, 85872.0, 1770788.0, 83957.0, 28052.0, 16492.0, 10864.0, 7424.0, 4882.0, 3382.0, 2386.0, 1508.0, 1038.0, 697.0, 434.0, 321.0, 197.0, 137.0, 96.0, 51.0, 32.0, 21.0, 15.0, 16.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.130859375, -2.063201904296875, -1.99554443359375, -1.927886962890625, -1.8602294921875, -1.792572021484375, -1.72491455078125, -1.657257080078125, -1.589599609375, -1.521942138671875, -1.45428466796875, -1.386627197265625, -1.3189697265625, -1.251312255859375, -1.18365478515625, -1.115997314453125, -1.04833984375, -0.980682373046875, -0.91302490234375, -0.845367431640625, -0.7777099609375, -0.710052490234375, -0.64239501953125, -0.574737548828125, -0.507080078125, -0.439422607421875, -0.37176513671875, -0.304107666015625, -0.2364501953125, -0.168792724609375, -0.10113525390625, -0.033477783203125, 0.0341796875, 0.101837158203125, 0.16949462890625, 0.237152099609375, 0.3048095703125, 0.372467041015625, 0.44012451171875, 0.507781982421875, 0.575439453125, 0.643096923828125, 0.71075439453125, 0.778411865234375, 0.8460693359375, 0.913726806640625, 0.98138427734375, 1.049041748046875, 1.11669921875, 1.184356689453125, 1.25201416015625, 1.319671630859375, 1.3873291015625, 1.454986572265625, 1.52264404296875, 1.590301513671875, 1.657958984375, 1.725616455078125, 1.79327392578125, 1.860931396484375, 1.9285888671875, 1.996246337890625, 2.06390380859375, 2.131561279296875, 2.19921875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 11.0, 7.0, 11.0, 18.0, 8.0, 17.0, 19.0, 27.0, 40.0, 36.0, 57.0, 48.0, 44.0, 41.0, 33.0, 50.0, 31.0, 28.0, 26.0, 35.0, 23.0, 38.0, 36.0, 45.0, 42.0, 36.0, 41.0, 42.0, 33.0, 20.0, 16.0, 12.0, 9.0, 5.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.201904296875, -0.19572067260742188, -0.18953704833984375, -0.18335342407226562, -0.1771697998046875, -0.17098617553710938, -0.16480255126953125, -0.15861892700195312, -0.152435302734375, -0.14625167846679688, -0.14006805419921875, -0.13388442993164062, -0.1277008056640625, -0.12151718139648438, -0.11533355712890625, -0.10914993286132812, -0.10296630859375, -0.09678268432617188, -0.09059906005859375, -0.08441543579101562, -0.0782318115234375, -0.07204818725585938, -0.06586456298828125, -0.059680938720703125, -0.053497314453125, -0.047313690185546875, -0.04113006591796875, -0.034946441650390625, -0.0287628173828125, -0.022579193115234375, -0.01639556884765625, -0.010211944580078125, -0.0040283203125, 0.002155303955078125, 0.00833892822265625, 0.014522552490234375, 0.0207061767578125, 0.026889801025390625, 0.03307342529296875, 0.039257049560546875, 0.045440673828125, 0.051624298095703125, 0.05780792236328125, 0.06399154663085938, 0.0701751708984375, 0.07635879516601562, 0.08254241943359375, 0.08872604370117188, 0.09490966796875, 0.10109329223632812, 0.10727691650390625, 0.11346054077148438, 0.1196441650390625, 0.12582778930664062, 0.13201141357421875, 0.13819503784179688, 0.144378662109375, 0.15056228637695312, 0.15674591064453125, 0.16292953491210938, 0.1691131591796875, 0.17529678344726562, 0.18148040771484375, 0.18766403198242188, 0.19384765625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 2.0, 7.0, 14.0, 10.0, 13.0, 24.0, 36.0, 43.0, 44.0, 64.0, 90.0, 111.0, 135.0, 184.0, 205.0, 205.0, 288.0, 400.0, 770.0, 26531.0, 978352.0, 38337.0, 845.0, 375.0, 281.0, 233.0, 202.0, 151.0, 136.0, 129.0, 90.0, 64.0, 48.0, 29.0, 23.0, 16.0, 17.0, 13.0, 11.0, 9.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.876953125, -2.78271484375, -2.6884765625, -2.59423828125, -2.5, -2.40576171875, -2.3115234375, -2.21728515625, -2.123046875, -2.02880859375, -1.9345703125, -1.84033203125, -1.74609375, -1.65185546875, -1.5576171875, -1.46337890625, -1.369140625, -1.27490234375, -1.1806640625, -1.08642578125, -0.9921875, -0.89794921875, -0.8037109375, -0.70947265625, -0.615234375, -0.52099609375, -0.4267578125, -0.33251953125, -0.23828125, -0.14404296875, -0.0498046875, 0.04443359375, 0.138671875, 0.23291015625, 0.3271484375, 0.42138671875, 0.515625, 0.60986328125, 0.7041015625, 0.79833984375, 0.892578125, 0.98681640625, 1.0810546875, 1.17529296875, 1.26953125, 1.36376953125, 1.4580078125, 1.55224609375, 1.646484375, 1.74072265625, 1.8349609375, 1.92919921875, 2.0234375, 2.11767578125, 2.2119140625, 2.30615234375, 2.400390625, 2.49462890625, 2.5888671875, 2.68310546875, 2.77734375, 2.87158203125, 2.9658203125, 3.06005859375, 3.154296875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 25.0, 66.0, 321.0, 478.0, 93.0, 19.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.072506427764893, -5.8712968826293945, -5.670086860656738, -5.46887731552124, -5.267667770385742, -5.066458225250244, -4.865248680114746, -4.66403865814209, -4.462829113006592, -4.261619567871094, -4.0604095458984375, -3.8592000007629395, -3.6579904556274414, -3.4567809104919434, -3.255571126937866, -3.054361343383789, -2.853151798248291, -2.651942253112793, -2.450732469558716, -2.2495226860046387, -2.0483131408691406, -1.847103476524353, -1.6458938121795654, -1.4446841478347778, -1.2434744834899902, -1.0422648191452026, -0.841055154800415, -0.6398454904556274, -0.43863582611083984, -0.23742616176605225, -0.03621649742126465, 0.16499316692352295, 0.36620330810546875, 0.5674129724502563, 0.768622636795044, 0.9698323011398315, 1.1710419654846191, 1.3722516298294067, 1.5734612941741943, 1.774670958518982, 1.9758806228637695, 2.1770901679992676, 2.3782999515533447, 2.579509735107422, 2.78071928024292, 2.981928825378418, 3.183138608932495, 3.3843483924865723, 3.5855579376220703, 3.7867674827575684, 3.9879772663116455, 4.189187049865723, 4.390396595001221, 4.591606140136719, 4.792816162109375, 4.994025707244873, 5.195235252380371, 5.396444797515869, 5.597654342651367, 5.798864364624023, 6.0000739097595215, 6.2012834548950195, 6.402493476867676, 6.603703022003174, 6.804912567138672]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 9.0, 8.0, 13.0, 13.0, 12.0, 8.0, 17.0, 25.0, 17.0, 33.0, 26.0, 23.0, 29.0, 28.0, 37.0, 32.0, 30.0, 44.0, 46.0, 45.0, 37.0, 50.0, 30.0, 49.0, 30.0, 34.0, 37.0, 35.0, 10.0, 28.0, 25.0, 23.0, 25.0, 14.0, 10.0, 13.0, 9.0, 10.0, 6.0, 9.0, 6.0, 4.0, 1.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.7944624423980713, -1.7399507761001587, -1.685439109802246, -1.630927562713623, -1.5764158964157104, -1.5219042301177979, -1.4673925638198853, -1.4128808975219727, -1.3583693504333496, -1.303857684135437, -1.2493460178375244, -1.1948344707489014, -1.1403228044509888, -1.0858111381530762, -1.0312994718551636, -0.976787805557251, -0.9222761392593384, -0.8677644729614258, -0.813252866268158, -0.7587411999702454, -0.7042295932769775, -0.6497179269790649, -0.5952062606811523, -0.5406945943832397, -0.4861829876899719, -0.4316713511943817, -0.3771597146987915, -0.3226480484008789, -0.2681364119052887, -0.2136247754096985, -0.1591131091117859, -0.10460147261619568, -0.05008971691131592, 0.004421927034854889, 0.058933570981025696, 0.1134452223777771, 0.1679568588733673, 0.22246849536895752, 0.2769801616668701, 0.3314917981624603, 0.38600343465805054, 0.44051507115364075, 0.49502670764923096, 0.5495383739471436, 0.6040500402450562, 0.658561646938324, 0.7130733132362366, 0.7675849199295044, 0.822096586227417, 0.8766082525253296, 0.9311198592185974, 0.98563152551651, 1.0401431322097778, 1.0946547985076904, 1.149166464805603, 1.2036781311035156, 1.2581896781921387, 1.3127013444900513, 1.3672130107879639, 1.421724557876587, 1.4762362241744995, 1.530747890472412, 1.5852595567703247, 1.6397712230682373, 1.69428288936615]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 6.0, 6.0, 6.0, 8.0, 9.0, 10.0, 14.0, 19.0, 18.0, 20.0, 16.0, 25.0, 21.0, 32.0, 24.0, 26.0, 26.0, 39.0, 41.0, 34.0, 48.0, 41.0, 40.0, 47.0, 40.0, 39.0, 28.0, 39.0, 31.0, 31.0, 28.0, 32.0, 19.0, 22.0, 21.0, 20.0, 13.0, 9.0, 8.0, 7.0, 12.0, 7.0, 5.0, 6.0, 4.0, 3.0, 3.0, 0.0, 4.0, 4.0], "bins": [-2.037109375, -1.9809417724609375, -1.924774169921875, -1.8686065673828125, -1.81243896484375, -1.7562713623046875, -1.700103759765625, -1.6439361572265625, -1.5877685546875, -1.5316009521484375, -1.475433349609375, -1.4192657470703125, -1.36309814453125, -1.3069305419921875, -1.250762939453125, -1.1945953369140625, -1.138427734375, -1.0822601318359375, -1.026092529296875, -0.9699249267578125, -0.91375732421875, -0.8575897216796875, -0.801422119140625, -0.7452545166015625, -0.6890869140625, -0.6329193115234375, -0.576751708984375, -0.5205841064453125, -0.46441650390625, -0.4082489013671875, -0.352081298828125, -0.2959136962890625, -0.23974609375, -0.1835784912109375, -0.127410888671875, -0.0712432861328125, -0.01507568359375, 0.0410919189453125, 0.097259521484375, 0.1534271240234375, 0.2095947265625, 0.2657623291015625, 0.321929931640625, 0.3780975341796875, 0.43426513671875, 0.4904327392578125, 0.546600341796875, 0.6027679443359375, 0.658935546875, 0.7151031494140625, 0.771270751953125, 0.8274383544921875, 0.88360595703125, 0.9397735595703125, 0.995941162109375, 1.0521087646484375, 1.1082763671875, 1.1644439697265625, 1.220611572265625, 1.2767791748046875, 1.33294677734375, 1.3891143798828125, 1.445281982421875, 1.5014495849609375, 1.5576171875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 9.0, 6.0, 12.0, 26.0, 35.0, 62.0, 82.0, 162.0, 218.0, 312.0, 487.0, 789.0, 1164.0, 1740.0, 2636.0, 3908.0, 5744.0, 8684.0, 13260.0, 21410.0, 42181.0, 110373.0, 317292.0, 310192.0, 106807.0, 41245.0, 21014.0, 12782.0, 8527.0, 5777.0, 3868.0, 2609.0, 1764.0, 1170.0, 773.0, 493.0, 321.0, 225.0, 142.0, 88.0, 47.0, 43.0, 26.0, 24.0, 9.0, 10.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.876953125, -2.78973388671875, -2.7025146484375, -2.61529541015625, -2.528076171875, -2.44085693359375, -2.3536376953125, -2.26641845703125, -2.17919921875, -2.09197998046875, -2.0047607421875, -1.91754150390625, -1.830322265625, -1.74310302734375, -1.6558837890625, -1.56866455078125, -1.4814453125, -1.39422607421875, -1.3070068359375, -1.21978759765625, -1.132568359375, -1.04534912109375, -0.9581298828125, -0.87091064453125, -0.78369140625, -0.69647216796875, -0.6092529296875, -0.52203369140625, -0.434814453125, -0.34759521484375, -0.2603759765625, -0.17315673828125, -0.0859375, 0.00128173828125, 0.0885009765625, 0.17572021484375, 0.262939453125, 0.35015869140625, 0.4373779296875, 0.52459716796875, 0.61181640625, 0.69903564453125, 0.7862548828125, 0.87347412109375, 0.960693359375, 1.04791259765625, 1.1351318359375, 1.22235107421875, 1.3095703125, 1.39678955078125, 1.4840087890625, 1.57122802734375, 1.658447265625, 1.74566650390625, 1.8328857421875, 1.92010498046875, 2.00732421875, 2.09454345703125, 2.1817626953125, 2.26898193359375, 2.356201171875, 2.44342041015625, 2.5306396484375, 2.61785888671875, 2.705078125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 6.0, 4.0, 9.0, 12.0, 7.0, 17.0, 16.0, 24.0, 22.0, 21.0, 22.0, 21.0, 24.0, 33.0, 33.0, 38.0, 64.0, 81.0, 123.0, 236.0, 1459.0, 213.0, 127.0, 71.0, 42.0, 44.0, 41.0, 26.0, 22.0, 22.0, 28.0, 20.0, 25.0, 15.0, 18.0, 19.0, 7.0, 8.0, 6.0, 6.0, 5.0, 2.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.796875, -6.57366943359375, -6.3504638671875, -6.12725830078125, -5.904052734375, -5.68084716796875, -5.4576416015625, -5.23443603515625, -5.01123046875, -4.78802490234375, -4.5648193359375, -4.34161376953125, -4.118408203125, -3.89520263671875, -3.6719970703125, -3.44879150390625, -3.2255859375, -3.00238037109375, -2.7791748046875, -2.55596923828125, -2.332763671875, -2.10955810546875, -1.8863525390625, -1.66314697265625, -1.43994140625, -1.21673583984375, -0.9935302734375, -0.77032470703125, -0.547119140625, -0.32391357421875, -0.1007080078125, 0.12249755859375, 0.345703125, 0.56890869140625, 0.7921142578125, 1.01531982421875, 1.238525390625, 1.46173095703125, 1.6849365234375, 1.90814208984375, 2.13134765625, 2.35455322265625, 2.5777587890625, 2.80096435546875, 3.024169921875, 3.24737548828125, 3.4705810546875, 3.69378662109375, 3.9169921875, 4.14019775390625, 4.3634033203125, 4.58660888671875, 4.809814453125, 5.03302001953125, 5.2562255859375, 5.47943115234375, 5.70263671875, 5.92584228515625, 6.1490478515625, 6.37225341796875, 6.595458984375, 6.81866455078125, 7.0418701171875, 7.26507568359375, 7.48828125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 7.0, 10.0, 8.0, 13.0, 11.0, 18.0, 20.0, 29.0, 38.0, 46.0, 68.0, 81.0, 126.0, 182.0, 418.0, 1180.0, 3984.0, 16640.0, 106377.0, 2271568.0, 682666.0, 48718.0, 9314.0, 2475.0, 761.0, 335.0, 153.0, 98.0, 80.0, 58.0, 55.0, 49.0, 33.0, 19.0, 22.0, 11.0, 7.0, 3.0, 7.0, 7.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.6171875, -10.2935791015625, -9.969970703125, -9.6463623046875, -9.32275390625, -8.9991455078125, -8.675537109375, -8.3519287109375, -8.0283203125, -7.7047119140625, -7.381103515625, -7.0574951171875, -6.73388671875, -6.4102783203125, -6.086669921875, -5.7630615234375, -5.439453125, -5.1158447265625, -4.792236328125, -4.4686279296875, -4.14501953125, -3.8214111328125, -3.497802734375, -3.1741943359375, -2.8505859375, -2.5269775390625, -2.203369140625, -1.8797607421875, -1.55615234375, -1.2325439453125, -0.908935546875, -0.5853271484375, -0.26171875, 0.0618896484375, 0.385498046875, 0.7091064453125, 1.03271484375, 1.3563232421875, 1.679931640625, 2.0035400390625, 2.3271484375, 2.6507568359375, 2.974365234375, 3.2979736328125, 3.62158203125, 3.9451904296875, 4.268798828125, 4.5924072265625, 4.916015625, 5.2396240234375, 5.563232421875, 5.8868408203125, 6.21044921875, 6.5340576171875, 6.857666015625, 7.1812744140625, 7.5048828125, 7.8284912109375, 8.152099609375, 8.4757080078125, 8.79931640625, 9.1229248046875, 9.446533203125, 9.7701416015625, 10.09375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [4.0, 15.0, 242.0, 537.0, 210.0, 11.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.515935897827148, -6.057094573974609, -3.598252773284912, -1.1394109725952148, 1.3194303512573242, 3.7782716751098633, 6.237113952636719, 8.695955276489258, 11.154796600341797, 13.613637924194336, 16.072479248046875, 18.531322479248047, 20.990161895751953, 23.449005126953125, 25.907846450805664, 28.366687774658203, 30.825529098510742, 33.28437042236328, 35.74321365356445, 38.20205307006836, 40.66089630126953, 43.11973571777344, 45.57857894897461, 48.03742218017578, 50.49626159667969, 52.95510482788086, 55.413944244384766, 57.87278747558594, 60.331626892089844, 62.790470123291016, 65.24931335449219, 67.7081527709961, 70.16699981689453, 72.62583923339844, 75.08468627929688, 77.54352569580078, 80.00236511230469, 82.4612045288086, 84.92005157470703, 87.37889099121094, 89.83773040771484, 92.29656982421875, 94.75541687011719, 97.2142562866211, 99.673095703125, 102.1319351196289, 104.59078216552734, 107.04962158203125, 109.50846862792969, 111.9673080444336, 114.42615509033203, 116.88499450683594, 119.34383392333984, 121.80267333984375, 124.26152038574219, 126.7203598022461, 129.17919921875, 131.63804626464844, 134.0968780517578, 136.55572509765625, 139.0145721435547, 141.47340393066406, 143.9322509765625, 146.39108276367188, 148.8499298095703]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 6.0, 3.0, 4.0, 10.0, 5.0, 8.0, 11.0, 7.0, 11.0, 14.0, 24.0, 16.0, 30.0, 22.0, 26.0, 26.0, 32.0, 25.0, 34.0, 34.0, 43.0, 46.0, 47.0, 37.0, 43.0, 38.0, 37.0, 33.0, 27.0, 27.0, 40.0, 33.0, 33.0, 24.0, 15.0, 17.0, 31.0, 12.0, 12.0, 13.0, 12.0, 11.0, 12.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.629318237304688, -23.902782440185547, -23.176246643066406, -22.449710845947266, -21.723175048828125, -20.996641159057617, -20.270105361938477, -19.543569564819336, -18.817033767700195, -18.090497970581055, -17.363962173461914, -16.637426376342773, -15.91089153289795, -15.184355735778809, -14.457820892333984, -13.731285095214844, -13.004749298095703, -12.278213500976562, -11.551677703857422, -10.825142860412598, -10.098607063293457, -9.372071266174316, -8.645536422729492, -7.919000625610352, -7.192464828491211, -6.46592903137207, -5.739393711090088, -5.0128583908081055, -4.286322593688965, -3.5597870349884033, -2.833251476287842, -2.1067161560058594, -1.380178451538086, -0.6536428928375244, 0.07289266586303711, 0.7994282245635986, 1.5259637832641602, 2.2524993419647217, 2.979034900665283, 3.7055702209472656, 4.432106018066406, 5.158641815185547, 5.885177135467529, 6.611712455749512, 7.338248252868652, 8.064784049987793, 8.791318893432617, 9.517854690551758, 10.244390487670898, 10.970926284790039, 11.69746208190918, 12.423996925354004, 13.150532722473145, 13.877068519592285, 14.60360336303711, 15.33013916015625, 16.05667495727539, 16.78321075439453, 17.509746551513672, 18.236282348632812, 18.962818145751953, 19.68935203552246, 20.4158878326416, 21.142423629760742, 21.868959426879883]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 8.0, 8.0, 9.0, 13.0, 12.0, 21.0, 24.0, 17.0, 21.0, 22.0, 35.0, 16.0, 25.0, 46.0, 31.0, 31.0, 32.0, 48.0, 44.0, 42.0, 47.0, 37.0, 36.0, 45.0, 43.0, 29.0, 27.0, 31.0, 31.0, 19.0, 24.0, 14.0, 18.0, 21.0, 14.0, 11.0, 3.0, 7.0, 6.0, 5.0, 7.0, 3.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0], "bins": [-2.068359375, -2.004730224609375, -1.94110107421875, -1.877471923828125, -1.8138427734375, -1.750213623046875, -1.68658447265625, -1.622955322265625, -1.559326171875, -1.495697021484375, -1.43206787109375, -1.368438720703125, -1.3048095703125, -1.241180419921875, -1.17755126953125, -1.113922119140625, -1.05029296875, -0.986663818359375, -0.92303466796875, -0.859405517578125, -0.7957763671875, -0.732147216796875, -0.66851806640625, -0.604888916015625, -0.541259765625, -0.477630615234375, -0.41400146484375, -0.350372314453125, -0.2867431640625, -0.223114013671875, -0.15948486328125, -0.095855712890625, -0.0322265625, 0.031402587890625, 0.09503173828125, 0.158660888671875, 0.2222900390625, 0.285919189453125, 0.34954833984375, 0.413177490234375, 0.476806640625, 0.540435791015625, 0.60406494140625, 0.667694091796875, 0.7313232421875, 0.794952392578125, 0.85858154296875, 0.922210693359375, 0.98583984375, 1.049468994140625, 1.11309814453125, 1.176727294921875, 1.2403564453125, 1.303985595703125, 1.36761474609375, 1.431243896484375, 1.494873046875, 1.558502197265625, 1.62213134765625, 1.685760498046875, 1.7493896484375, 1.813018798828125, 1.87664794921875, 1.940277099609375, 2.00390625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 8.0, 4.0, 7.0, 10.0, 12.0, 13.0, 7.0, 13.0, 17.0, 24.0, 45.0, 55.0, 53.0, 81.0, 116.0, 239.0, 778.0, 4015.0, 27835.0, 273025.0, 2842603.0, 958531.0, 74354.0, 9735.0, 1727.0, 427.0, 173.0, 100.0, 46.0, 46.0, 42.0, 21.0, 22.0, 19.0, 21.0, 11.0, 11.0, 10.0, 8.0, 6.0, 3.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.884033203125, -7.62744140625, -7.370849609375, -7.1142578125, -6.857666015625, -6.60107421875, -6.344482421875, -6.087890625, -5.831298828125, -5.57470703125, -5.318115234375, -5.0615234375, -4.804931640625, -4.54833984375, -4.291748046875, -4.03515625, -3.778564453125, -3.52197265625, -3.265380859375, -3.0087890625, -2.752197265625, -2.49560546875, -2.239013671875, -1.982421875, -1.725830078125, -1.46923828125, -1.212646484375, -0.9560546875, -0.699462890625, -0.44287109375, -0.186279296875, 0.0703125, 0.326904296875, 0.58349609375, 0.840087890625, 1.0966796875, 1.353271484375, 1.60986328125, 1.866455078125, 2.123046875, 2.379638671875, 2.63623046875, 2.892822265625, 3.1494140625, 3.406005859375, 3.66259765625, 3.919189453125, 4.17578125, 4.432373046875, 4.68896484375, 4.945556640625, 5.2021484375, 5.458740234375, 5.71533203125, 5.971923828125, 6.228515625, 6.485107421875, 6.74169921875, 6.998291015625, 7.2548828125, 7.511474609375, 7.76806640625, 8.024658203125, 8.28125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 5.0, 7.0, 8.0, 14.0, 9.0, 19.0, 25.0, 27.0, 41.0, 52.0, 91.0, 120.0, 123.0, 228.0, 262.0, 303.0, 399.0, 427.0, 396.0, 378.0, 280.0, 215.0, 159.0, 124.0, 94.0, 74.0, 57.0, 40.0, 27.0, 18.0, 9.0, 6.0, 9.0, 8.0, 9.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.8515625, -5.67205810546875, -5.4925537109375, -5.31304931640625, -5.133544921875, -4.95404052734375, -4.7745361328125, -4.59503173828125, -4.41552734375, -4.23602294921875, -4.0565185546875, -3.87701416015625, -3.697509765625, -3.51800537109375, -3.3385009765625, -3.15899658203125, -2.9794921875, -2.79998779296875, -2.6204833984375, -2.44097900390625, -2.261474609375, -2.08197021484375, -1.9024658203125, -1.72296142578125, -1.54345703125, -1.36395263671875, -1.1844482421875, -1.00494384765625, -0.825439453125, -0.64593505859375, -0.4664306640625, -0.28692626953125, -0.107421875, 0.07208251953125, 0.2515869140625, 0.43109130859375, 0.610595703125, 0.79010009765625, 0.9696044921875, 1.14910888671875, 1.32861328125, 1.50811767578125, 1.6876220703125, 1.86712646484375, 2.046630859375, 2.22613525390625, 2.4056396484375, 2.58514404296875, 2.7646484375, 2.94415283203125, 3.1236572265625, 3.30316162109375, 3.482666015625, 3.66217041015625, 3.8416748046875, 4.02117919921875, 4.20068359375, 4.38018798828125, 4.5596923828125, 4.73919677734375, 4.918701171875, 5.09820556640625, 5.2777099609375, 5.45721435546875, 5.63671875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 10.0, 10.0, 21.0, 19.0, 29.0, 37.0, 71.0, 124.0, 226.0, 364.0, 832.0, 2372.0, 10126.0, 69909.0, 692188.0, 2837269.0, 514773.0, 54053.0, 8248.0, 1996.0, 755.0, 379.0, 194.0, 104.0, 54.0, 41.0, 27.0, 13.0, 9.0, 10.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.265625, -12.868896484375, -12.47216796875, -12.075439453125, -11.6787109375, -11.281982421875, -10.88525390625, -10.488525390625, -10.091796875, -9.695068359375, -9.29833984375, -8.901611328125, -8.5048828125, -8.108154296875, -7.71142578125, -7.314697265625, -6.91796875, -6.521240234375, -6.12451171875, -5.727783203125, -5.3310546875, -4.934326171875, -4.53759765625, -4.140869140625, -3.744140625, -3.347412109375, -2.95068359375, -2.553955078125, -2.1572265625, -1.760498046875, -1.36376953125, -0.967041015625, -0.5703125, -0.173583984375, 0.22314453125, 0.619873046875, 1.0166015625, 1.413330078125, 1.81005859375, 2.206787109375, 2.603515625, 3.000244140625, 3.39697265625, 3.793701171875, 4.1904296875, 4.587158203125, 4.98388671875, 5.380615234375, 5.77734375, 6.174072265625, 6.57080078125, 6.967529296875, 7.3642578125, 7.760986328125, 8.15771484375, 8.554443359375, 8.951171875, 9.347900390625, 9.74462890625, 10.141357421875, 10.5380859375, 10.934814453125, 11.33154296875, 11.728271484375, 12.125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 14.0, 27.0, 40.0, 70.0, 108.0, 144.0, 122.0, 135.0, 117.0, 100.0, 45.0, 41.0, 26.0, 7.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.97478485107422, -17.691471099853516, -16.408157348632812, -15.124842643737793, -13.84152889251709, -12.558215141296387, -11.274900436401367, -9.991586685180664, -8.708272933959961, -7.424959182739258, -6.1416449546813965, -4.858330726623535, -3.575016975402832, -2.291703224182129, -1.0083889961242676, 0.27492523193359375, 1.5582389831542969, 2.841552972793579, 4.124866962432861, 5.408181190490723, 6.691494941711426, 7.974808692932129, 9.258123397827148, 10.541437149047852, 11.824750900268555, 13.108064651489258, 14.391378402709961, 15.67469310760498, 16.9580078125, 18.241321563720703, 19.524635314941406, 20.80794906616211, 22.091262817382812, 23.374576568603516, 24.65789031982422, 25.941204071044922, 27.224517822265625, 28.507831573486328, 29.791147232055664, 31.074460983276367, 32.35777282714844, 33.64108657836914, 34.924400329589844, 36.20771408081055, 37.49102783203125, 38.77434158325195, 40.057655334472656, 41.340972900390625, 42.62428665161133, 43.90760040283203, 45.190914154052734, 46.47422790527344, 47.75754165649414, 49.040855407714844, 50.32416915893555, 51.60748291015625, 52.89080047607422, 54.17411422729492, 55.457427978515625, 56.74074172973633, 58.02405548095703, 59.307369232177734, 60.59068298339844, 61.874000549316406, 63.157310485839844]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 11.0, 7.0, 8.0, 21.0, 13.0, 16.0, 17.0, 31.0, 31.0, 28.0, 29.0, 27.0, 46.0, 36.0, 37.0, 40.0, 38.0, 47.0, 47.0, 52.0, 43.0, 36.0, 44.0, 29.0, 43.0, 30.0, 30.0, 26.0, 24.0, 20.0, 13.0, 15.0, 18.0, 11.0, 8.0, 1.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.27437973022461, -18.631837844848633, -17.98929786682129, -17.346755981445312, -16.70421600341797, -16.061674118041992, -15.419132232666016, -14.776591300964355, -14.134050369262695, -13.491509437561035, -12.848968505859375, -12.206426620483398, -11.563885688781738, -10.921344757080078, -10.278802871704102, -9.636261940002441, -8.993721008300781, -8.351180076599121, -7.708638668060303, -7.066097259521484, -6.423556327819824, -5.781015396118164, -5.138473987579346, -4.495932579040527, -3.853391647338867, -3.210850477218628, -2.5683093070983887, -1.9257681369781494, -1.2832269668579102, -0.6406857967376709, 0.0018553733825683594, 0.6443967819213867, 1.286935806274414, 1.9294769763946533, 2.5720181465148926, 3.214559316635132, 3.857100486755371, 4.499641418457031, 5.14218282699585, 5.784724235534668, 6.427265167236328, 7.069806098937988, 7.712347507476807, 8.354888916015625, 8.997429847717285, 9.639970779418945, 10.282512664794922, 10.925053596496582, 11.567594528198242, 12.210135459899902, 12.852676391601562, 13.495218276977539, 14.1377592086792, 14.78030014038086, 15.422842025756836, 16.065383911132812, 16.707923889160156, 17.350465774536133, 17.993005752563477, 18.635547637939453, 19.278087615966797, 19.920629501342773, 20.56317138671875, 21.205711364746094, 21.84825325012207]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 4.0, 4.0, 8.0, 9.0, 7.0, 9.0, 5.0, 20.0, 21.0, 18.0, 31.0, 21.0, 38.0, 33.0, 42.0, 48.0, 62.0, 47.0, 59.0, 40.0, 44.0, 48.0, 48.0, 45.0, 41.0, 26.0, 48.0, 27.0, 24.0, 20.0, 24.0, 12.0, 12.0, 12.0, 9.0, 11.0, 7.0, 10.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.365234375, -2.287933349609375, -2.21063232421875, -2.133331298828125, -2.0560302734375, -1.978729248046875, -1.90142822265625, -1.824127197265625, -1.746826171875, -1.669525146484375, -1.59222412109375, -1.514923095703125, -1.4376220703125, -1.360321044921875, -1.28302001953125, -1.205718994140625, -1.12841796875, -1.051116943359375, -0.97381591796875, -0.896514892578125, -0.8192138671875, -0.741912841796875, -0.66461181640625, -0.587310791015625, -0.510009765625, -0.432708740234375, -0.35540771484375, -0.278106689453125, -0.2008056640625, -0.123504638671875, -0.04620361328125, 0.031097412109375, 0.1083984375, 0.185699462890625, 0.26300048828125, 0.340301513671875, 0.4176025390625, 0.494903564453125, 0.57220458984375, 0.649505615234375, 0.726806640625, 0.804107666015625, 0.88140869140625, 0.958709716796875, 1.0360107421875, 1.113311767578125, 1.19061279296875, 1.267913818359375, 1.34521484375, 1.422515869140625, 1.49981689453125, 1.577117919921875, 1.6544189453125, 1.731719970703125, 1.80902099609375, 1.886322021484375, 1.963623046875, 2.040924072265625, 2.11822509765625, 2.195526123046875, 2.2728271484375, 2.350128173828125, 2.42742919921875, 2.504730224609375, 2.58203125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 14.0, 17.0, 29.0, 59.0, 91.0, 134.0, 215.0, 319.0, 561.0, 868.0, 1318.0, 2053.0, 3064.0, 4740.0, 7009.0, 9994.0, 14250.0, 19582.0, 26455.0, 34966.0, 44344.0, 54899.0, 65673.0, 75926.0, 83232.0, 88273.0, 87258.0, 81731.0, 72561.0, 62561.0, 51631.0, 41570.0, 31910.0, 24021.0, 17718.0, 12608.0, 9005.0, 6189.0, 4147.0, 2585.0, 1826.0, 1221.0, 743.0, 434.0, 283.0, 182.0, 125.0, 69.0, 43.0, 19.0, 16.0, 13.0, 6.0, 4.0, 0.0, 2.0], "bins": [-1.005859375, -0.97613525390625, -0.9464111328125, -0.91668701171875, -0.886962890625, -0.85723876953125, -0.8275146484375, -0.79779052734375, -0.76806640625, -0.73834228515625, -0.7086181640625, -0.67889404296875, -0.649169921875, -0.61944580078125, -0.5897216796875, -0.55999755859375, -0.5302734375, -0.50054931640625, -0.4708251953125, -0.44110107421875, -0.411376953125, -0.38165283203125, -0.3519287109375, -0.32220458984375, -0.29248046875, -0.26275634765625, -0.2330322265625, -0.20330810546875, -0.173583984375, -0.14385986328125, -0.1141357421875, -0.08441162109375, -0.0546875, -0.02496337890625, 0.0047607421875, 0.03448486328125, 0.064208984375, 0.09393310546875, 0.1236572265625, 0.15338134765625, 0.18310546875, 0.21282958984375, 0.2425537109375, 0.27227783203125, 0.302001953125, 0.33172607421875, 0.3614501953125, 0.39117431640625, 0.4208984375, 0.45062255859375, 0.4803466796875, 0.51007080078125, 0.539794921875, 0.56951904296875, 0.5992431640625, 0.62896728515625, 0.65869140625, 0.68841552734375, 0.7181396484375, 0.74786376953125, 0.777587890625, 0.80731201171875, 0.8370361328125, 0.86676025390625, 0.896484375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 1.0, 9.0, 6.0, 9.0, 7.0, 8.0, 13.0, 12.0, 14.0, 20.0, 16.0, 22.0, 26.0, 29.0, 29.0, 32.0, 39.0, 33.0, 42.0, 37.0, 39.0, 42.0, 1066.0, 30.0, 40.0, 28.0, 42.0, 33.0, 23.0, 31.0, 31.0, 31.0, 21.0, 24.0, 21.0, 23.0, 15.0, 14.0, 12.0, 18.0, 7.0, 11.0, 6.0, 3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.271484375, -2.2039794921875, -2.136474609375, -2.0689697265625, -2.00146484375, -1.9339599609375, -1.866455078125, -1.7989501953125, -1.7314453125, -1.6639404296875, -1.596435546875, -1.5289306640625, -1.46142578125, -1.3939208984375, -1.326416015625, -1.2589111328125, -1.19140625, -1.1239013671875, -1.056396484375, -0.9888916015625, -0.92138671875, -0.8538818359375, -0.786376953125, -0.7188720703125, -0.6513671875, -0.5838623046875, -0.516357421875, -0.4488525390625, -0.38134765625, -0.3138427734375, -0.246337890625, -0.1788330078125, -0.111328125, -0.0438232421875, 0.023681640625, 0.0911865234375, 0.15869140625, 0.2261962890625, 0.293701171875, 0.3612060546875, 0.4287109375, 0.4962158203125, 0.563720703125, 0.6312255859375, 0.69873046875, 0.7662353515625, 0.833740234375, 0.9012451171875, 0.96875, 1.0362548828125, 1.103759765625, 1.1712646484375, 1.23876953125, 1.3062744140625, 1.373779296875, 1.4412841796875, 1.5087890625, 1.5762939453125, 1.643798828125, 1.7113037109375, 1.77880859375, 1.8463134765625, 1.913818359375, 1.9813232421875, 2.048828125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 2.0, 10.0, 13.0, 15.0, 25.0, 42.0, 53.0, 113.0, 139.0, 215.0, 347.0, 504.0, 773.0, 1169.0, 1714.0, 2603.0, 3756.0, 5586.0, 8304.0, 12482.0, 19531.0, 37903.0, 480984.0, 1419191.0, 41507.0, 20577.0, 13111.0, 8718.0, 5760.0, 3927.0, 2609.0, 1847.0, 1223.0, 812.0, 516.0, 341.0, 234.0, 148.0, 103.0, 75.0, 46.0, 39.0, 19.0, 13.0, 11.0, 8.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.26953125, -2.19140625, -2.11328125, -2.03515625, -1.95703125, -1.87890625, -1.80078125, -1.72265625, -1.64453125, -1.56640625, -1.48828125, -1.41015625, -1.33203125, -1.25390625, -1.17578125, -1.09765625, -1.01953125, -0.94140625, -0.86328125, -0.78515625, -0.70703125, -0.62890625, -0.55078125, -0.47265625, -0.39453125, -0.31640625, -0.23828125, -0.16015625, -0.08203125, -0.00390625, 0.07421875, 0.15234375, 0.23046875, 0.30859375, 0.38671875, 0.46484375, 0.54296875, 0.62109375, 0.69921875, 0.77734375, 0.85546875, 0.93359375, 1.01171875, 1.08984375, 1.16796875, 1.24609375, 1.32421875, 1.40234375, 1.48046875, 1.55859375, 1.63671875, 1.71484375, 1.79296875, 1.87109375, 1.94921875, 2.02734375, 2.10546875, 2.18359375, 2.26171875, 2.33984375, 2.41796875, 2.49609375, 2.57421875, 2.65234375, 2.73046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 7.0, 10.0, 9.0, 11.0, 10.0, 13.0, 15.0, 12.0, 23.0, 19.0, 19.0, 18.0, 22.0, 26.0, 23.0, 34.0, 31.0, 31.0, 40.0, 38.0, 18.0, 27.0, 33.0, 37.0, 40.0, 20.0, 24.0, 38.0, 38.0, 17.0, 29.0, 33.0, 21.0, 25.0, 16.0, 23.0, 24.0, 15.0, 17.0, 15.0, 6.0, 10.0, 9.0, 9.0, 10.0, 6.0, 6.0, 4.0, 8.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1380615234375, -0.13366317749023438, -0.12926483154296875, -0.12486648559570312, -0.1204681396484375, -0.11606979370117188, -0.11167144775390625, -0.10727310180664062, -0.102874755859375, -0.09847640991210938, -0.09407806396484375, -0.08967971801757812, -0.0852813720703125, -0.08088302612304688, -0.07648468017578125, -0.07208633422851562, -0.06768798828125, -0.06328964233398438, -0.05889129638671875, -0.054492950439453125, -0.0500946044921875, -0.045696258544921875, -0.04129791259765625, -0.036899566650390625, -0.032501220703125, -0.028102874755859375, -0.02370452880859375, -0.019306182861328125, -0.0149078369140625, -0.010509490966796875, -0.00611114501953125, -0.001712799072265625, 0.002685546875, 0.007083892822265625, 0.01148223876953125, 0.015880584716796875, 0.0202789306640625, 0.024677276611328125, 0.02907562255859375, 0.033473968505859375, 0.037872314453125, 0.042270660400390625, 0.04666900634765625, 0.051067352294921875, 0.0554656982421875, 0.059864044189453125, 0.06426239013671875, 0.06866073608398438, 0.07305908203125, 0.07745742797851562, 0.08185577392578125, 0.08625411987304688, 0.0906524658203125, 0.09505081176757812, 0.09944915771484375, 0.10384750366210938, 0.108245849609375, 0.11264419555664062, 0.11704254150390625, 0.12144088745117188, 0.1258392333984375, 0.13023757934570312, 0.13463592529296875, 0.13903427124023438, 0.1434326171875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 5.0, 7.0, 12.0, 19.0, 19.0, 23.0, 24.0, 25.0, 32.0, 41.0, 49.0, 66.0, 78.0, 75.0, 98.0, 99.0, 132.0, 175.0, 184.0, 221.0, 323.0, 412.0, 894.0, 15543.0, 693409.0, 329228.0, 4751.0, 659.0, 373.0, 266.0, 221.0, 167.0, 153.0, 128.0, 98.0, 85.0, 58.0, 64.0, 66.0, 45.0, 46.0, 36.0, 32.0, 25.0, 22.0, 17.0, 12.0, 8.0, 6.0, 6.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0], "bins": [-2.1796875, -2.11334228515625, -2.0469970703125, -1.98065185546875, -1.914306640625, -1.84796142578125, -1.7816162109375, -1.71527099609375, -1.64892578125, -1.58258056640625, -1.5162353515625, -1.44989013671875, -1.383544921875, -1.31719970703125, -1.2508544921875, -1.18450927734375, -1.1181640625, -1.05181884765625, -0.9854736328125, -0.91912841796875, -0.852783203125, -0.78643798828125, -0.7200927734375, -0.65374755859375, -0.58740234375, -0.52105712890625, -0.4547119140625, -0.38836669921875, -0.322021484375, -0.25567626953125, -0.1893310546875, -0.12298583984375, -0.056640625, 0.00970458984375, 0.0760498046875, 0.14239501953125, 0.208740234375, 0.27508544921875, 0.3414306640625, 0.40777587890625, 0.47412109375, 0.54046630859375, 0.6068115234375, 0.67315673828125, 0.739501953125, 0.80584716796875, 0.8721923828125, 0.93853759765625, 1.0048828125, 1.07122802734375, 1.1375732421875, 1.20391845703125, 1.270263671875, 1.33660888671875, 1.4029541015625, 1.46929931640625, 1.53564453125, 1.60198974609375, 1.6683349609375, 1.73468017578125, 1.801025390625, 1.86737060546875, 1.9337158203125, 2.00006103515625, 2.06640625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 8.0, 37.0, 102.0, 288.0, 378.0, 128.0, 41.0, 14.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8069934844970703, -3.6765167713165283, -3.5460400581359863, -3.4155633449554443, -3.2850866317749023, -3.1546096801757812, -3.0241329669952393, -2.8936562538146973, -2.7631795406341553, -2.6327028274536133, -2.5022261142730713, -2.3717494010925293, -2.241272449493408, -2.1107959747314453, -1.9803190231323242, -1.8498423099517822, -1.7193655967712402, -1.5888888835906982, -1.4584121704101562, -1.3279353380203247, -1.1974586248397827, -1.0669819116592407, -0.936505138874054, -0.8060283660888672, -0.6755516529083252, -0.5450749397277832, -0.41459816694259644, -0.28412142395973206, -0.15364468097686768, -0.023167967796325684, 0.10730880498886108, 0.23778557777404785, 0.36826229095458984, 0.4987390339374542, 0.6292157769203186, 0.7596925497055054, 0.8901692628860474, 1.0206459760665894, 1.151122808456421, 1.281599521636963, 1.4120762348175049, 1.5425529479980469, 1.6730296611785889, 1.8035064935684204, 1.9339832067489624, 2.064459800720215, 2.194936752319336, 2.325413465499878, 2.45589017868042, 2.586366891860962, 2.716843605041504, 2.847320318222046, 2.977797031402588, 3.108273983001709, 3.238750696182251, 3.369227409362793, 3.499704122543335, 3.630180835723877, 3.760657548904419, 3.891134262084961, 4.021611213684082, 4.152087688446045, 4.282564640045166, 4.413041114807129, 4.54351806640625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 7.0, 13.0, 14.0, 11.0, 22.0, 30.0, 35.0, 37.0, 31.0, 51.0, 49.0, 40.0, 54.0, 67.0, 51.0, 46.0, 68.0, 51.0, 44.0, 46.0, 36.0, 35.0, 29.0, 29.0, 28.0, 20.0, 16.0, 10.0, 11.0, 8.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3453744649887085, -1.2809009552001953, -1.2164274454116821, -1.151953935623169, -1.0874805450439453, -1.0230070352554321, -0.958533525466919, -0.8940600156784058, -0.8295865654945374, -0.7651130557060242, -0.7006396055221558, -0.6361660957336426, -0.5716925859451294, -0.507219135761261, -0.4427456259727478, -0.378272145986557, -0.3137986660003662, -0.24932518601417542, -0.18485169112682343, -0.12037819623947144, -0.05590471625328064, 0.008568763732910156, 0.07304227352142334, 0.13751575350761414, 0.20198923349380493, 0.2664627134799957, 0.3309361934661865, 0.3954097032546997, 0.4598831832408905, 0.5243566632270813, 0.5888301730155945, 0.6533036231994629, 0.7177772521972656, 0.7822507619857788, 0.8467242121696472, 0.9111977219581604, 0.9756711721420288, 1.040144681930542, 1.1046181917190552, 1.1690917015075684, 1.233565092086792, 1.2980386018753052, 1.3625121116638184, 1.426985502243042, 1.4914590120315552, 1.5559325218200684, 1.6204060316085815, 1.6848795413970947, 1.749353051185608, 1.813826560974121, 1.8783000707626343, 1.9427735805511475, 2.007246971130371, 2.071720600128174, 2.1361939907073975, 2.200667381286621, 2.265141010284424, 2.3296144008636475, 2.39408802986145, 2.458561420440674, 2.5230350494384766, 2.5875084400177, 2.651981830596924, 2.7164554595947266, 2.78092885017395]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 3.0, 6.0, 8.0, 8.0, 9.0, 16.0, 13.0, 13.0, 10.0, 15.0, 22.0, 18.0, 33.0, 19.0, 30.0, 37.0, 46.0, 45.0, 27.0, 37.0, 40.0, 43.0, 40.0, 35.0, 32.0, 44.0, 38.0, 28.0, 33.0, 40.0, 29.0, 32.0, 20.0, 12.0, 17.0, 14.0, 8.0, 12.0, 10.0, 11.0, 6.0, 11.0, 9.0, 5.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-2.15625, -2.09246826171875, -2.0286865234375, -1.96490478515625, -1.901123046875, -1.83734130859375, -1.7735595703125, -1.70977783203125, -1.64599609375, -1.58221435546875, -1.5184326171875, -1.45465087890625, -1.390869140625, -1.32708740234375, -1.2633056640625, -1.19952392578125, -1.1357421875, -1.07196044921875, -1.0081787109375, -0.94439697265625, -0.880615234375, -0.81683349609375, -0.7530517578125, -0.68927001953125, -0.62548828125, -0.56170654296875, -0.4979248046875, -0.43414306640625, -0.370361328125, -0.30657958984375, -0.2427978515625, -0.17901611328125, -0.115234375, -0.05145263671875, 0.0123291015625, 0.07611083984375, 0.139892578125, 0.20367431640625, 0.2674560546875, 0.33123779296875, 0.39501953125, 0.45880126953125, 0.5225830078125, 0.58636474609375, 0.650146484375, 0.71392822265625, 0.7777099609375, 0.84149169921875, 0.9052734375, 0.96905517578125, 1.0328369140625, 1.09661865234375, 1.160400390625, 1.22418212890625, 1.2879638671875, 1.35174560546875, 1.41552734375, 1.47930908203125, 1.5430908203125, 1.60687255859375, 1.670654296875, 1.73443603515625, 1.7982177734375, 1.86199951171875, 1.92578125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 7.0, 10.0, 18.0, 22.0, 45.0, 57.0, 92.0, 120.0, 176.0, 303.0, 445.0, 678.0, 1134.0, 1713.0, 2614.0, 4117.0, 6463.0, 10631.0, 18389.0, 34788.0, 73479.0, 161484.0, 270012.0, 229870.0, 115791.0, 52566.0, 25731.0, 14376.0, 8648.0, 5235.0, 3397.0, 2206.0, 1379.0, 897.0, 586.0, 385.0, 230.0, 171.0, 103.0, 66.0, 40.0, 29.0, 12.0, 17.0, 7.0, 2.0, 8.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.857421875, -1.8007659912109375, -1.744110107421875, -1.6874542236328125, -1.63079833984375, -1.5741424560546875, -1.517486572265625, -1.4608306884765625, -1.4041748046875, -1.3475189208984375, -1.290863037109375, -1.2342071533203125, -1.17755126953125, -1.1208953857421875, -1.064239501953125, -1.0075836181640625, -0.950927734375, -0.8942718505859375, -0.837615966796875, -0.7809600830078125, -0.72430419921875, -0.6676483154296875, -0.610992431640625, -0.5543365478515625, -0.4976806640625, -0.4410247802734375, -0.384368896484375, -0.3277130126953125, -0.27105712890625, -0.2144012451171875, -0.157745361328125, -0.1010894775390625, -0.04443359375, 0.0122222900390625, 0.068878173828125, 0.1255340576171875, 0.18218994140625, 0.2388458251953125, 0.295501708984375, 0.3521575927734375, 0.4088134765625, 0.4654693603515625, 0.522125244140625, 0.5787811279296875, 0.63543701171875, 0.6920928955078125, 0.748748779296875, 0.8054046630859375, 0.862060546875, 0.9187164306640625, 0.975372314453125, 1.0320281982421875, 1.08868408203125, 1.1453399658203125, 1.201995849609375, 1.2586517333984375, 1.3153076171875, 1.3719635009765625, 1.428619384765625, 1.4852752685546875, 1.54193115234375, 1.5985870361328125, 1.655242919921875, 1.7118988037109375, 1.7685546875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 6.0, 5.0, 10.0, 14.0, 9.0, 19.0, 16.0, 17.0, 21.0, 24.0, 33.0, 22.0, 34.0, 33.0, 41.0, 53.0, 46.0, 53.0, 130.0, 284.0, 1470.0, 192.0, 92.0, 59.0, 44.0, 38.0, 32.0, 29.0, 34.0, 33.0, 20.0, 20.0, 10.0, 21.0, 11.0, 25.0, 8.0, 6.0, 7.0, 7.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.87890625, -7.62713623046875, -7.3753662109375, -7.12359619140625, -6.871826171875, -6.62005615234375, -6.3682861328125, -6.11651611328125, -5.86474609375, -5.61297607421875, -5.3612060546875, -5.10943603515625, -4.857666015625, -4.60589599609375, -4.3541259765625, -4.10235595703125, -3.8505859375, -3.59881591796875, -3.3470458984375, -3.09527587890625, -2.843505859375, -2.59173583984375, -2.3399658203125, -2.08819580078125, -1.83642578125, -1.58465576171875, -1.3328857421875, -1.08111572265625, -0.829345703125, -0.57757568359375, -0.3258056640625, -0.07403564453125, 0.177734375, 0.42950439453125, 0.6812744140625, 0.93304443359375, 1.184814453125, 1.43658447265625, 1.6883544921875, 1.94012451171875, 2.19189453125, 2.44366455078125, 2.6954345703125, 2.94720458984375, 3.198974609375, 3.45074462890625, 3.7025146484375, 3.95428466796875, 4.2060546875, 4.45782470703125, 4.7095947265625, 4.96136474609375, 5.213134765625, 5.46490478515625, 5.7166748046875, 5.96844482421875, 6.22021484375, 6.47198486328125, 6.7237548828125, 6.97552490234375, 7.227294921875, 7.47906494140625, 7.7308349609375, 7.98260498046875, 8.234375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 2.0, 6.0, 8.0, 10.0, 8.0, 21.0, 20.0, 32.0, 40.0, 51.0, 75.0, 147.0, 210.0, 458.0, 1005.0, 3076.0, 17499.0, 386567.0, 2662978.0, 63267.0, 6965.0, 1733.0, 648.0, 324.0, 193.0, 106.0, 68.0, 46.0, 42.0, 34.0, 19.0, 14.0, 14.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-13.609375, -13.212158203125, -12.81494140625, -12.417724609375, -12.0205078125, -11.623291015625, -11.22607421875, -10.828857421875, -10.431640625, -10.034423828125, -9.63720703125, -9.239990234375, -8.8427734375, -8.445556640625, -8.04833984375, -7.651123046875, -7.25390625, -6.856689453125, -6.45947265625, -6.062255859375, -5.6650390625, -5.267822265625, -4.87060546875, -4.473388671875, -4.076171875, -3.678955078125, -3.28173828125, -2.884521484375, -2.4873046875, -2.090087890625, -1.69287109375, -1.295654296875, -0.8984375, -0.501220703125, -0.10400390625, 0.293212890625, 0.6904296875, 1.087646484375, 1.48486328125, 1.882080078125, 2.279296875, 2.676513671875, 3.07373046875, 3.470947265625, 3.8681640625, 4.265380859375, 4.66259765625, 5.059814453125, 5.45703125, 5.854248046875, 6.25146484375, 6.648681640625, 7.0458984375, 7.443115234375, 7.84033203125, 8.237548828125, 8.634765625, 9.031982421875, 9.42919921875, 9.826416015625, 10.2236328125, 10.620849609375, 11.01806640625, 11.415283203125, 11.8125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 472.0, 549.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-319.0098571777344, -313.10003662109375, -307.19024658203125, -301.2804260253906, -295.37060546875, -289.4608154296875, -283.5509948730469, -277.64117431640625, -271.73138427734375, -265.8215637207031, -259.9117736816406, -254.001953125, -248.09214782714844, -242.18234252929688, -236.27252197265625, -230.3627166748047, -224.45291137695312, -218.54310607910156, -212.63328552246094, -206.72348022460938, -200.8136749267578, -194.90386962890625, -188.99404907226562, -183.08424377441406, -177.17442321777344, -171.26461791992188, -165.35479736328125, -159.4449920654297, -153.53518676757812, -147.62538146972656, -141.71556091308594, -135.80575561523438, -129.8959503173828, -123.98613739013672, -118.07633209228516, -112.16651916503906, -106.2567138671875, -100.3469009399414, -94.43708801269531, -88.52728271484375, -82.61747741699219, -76.7076644897461, -70.79785919189453, -64.88804626464844, -58.978240966796875, -53.06842803955078, -47.15861892700195, -41.248809814453125, -35.33899688720703, -29.429187774658203, -23.519378662109375, -17.609567642211914, -11.699758529663086, -5.789949417114258, 0.11986160278320312, 6.029670715332031, 11.93947982788086, 17.849288940429688, 23.759098052978516, 29.668909072875977, 35.57872009277344, 41.488525390625, 47.398338317871094, 53.30814743041992, 59.21795654296875]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 9.0, 7.0, 6.0, 7.0, 12.0, 2.0, 8.0, 20.0, 13.0, 27.0, 21.0, 26.0, 22.0, 34.0, 37.0, 39.0, 45.0, 40.0, 48.0, 46.0, 43.0, 39.0, 47.0, 41.0, 48.0, 50.0, 31.0, 29.0, 28.0, 29.0, 24.0, 25.0, 18.0, 15.0, 13.0, 10.0, 8.0, 8.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.981353759765625, -26.130475997924805, -25.279600143432617, -24.428722381591797, -23.577844619750977, -22.72696876525879, -21.87609100341797, -21.02521514892578, -20.17433738708496, -19.32345962524414, -18.472583770751953, -17.621706008911133, -16.770828247070312, -15.919952392578125, -15.069074630737305, -14.2181978225708, -13.36732006072998, -12.516443252563477, -11.665565490722656, -10.814688682556152, -9.963811874389648, -9.112934112548828, -8.262057304382324, -7.41118049621582, -6.560303211212158, -5.709425926208496, -4.858549118041992, -4.00767183303833, -3.156794786453247, -2.305917739868164, -1.455040454864502, -0.604163646697998, 0.24671363830566406, 1.097590684890747, 1.9484678506851196, 2.799345016479492, 3.650222063064575, 4.501099109649658, 5.35197639465332, 6.202853202819824, 7.053730487823486, 7.904607772827148, 8.755484580993652, 9.606361389160156, 10.457239151000977, 11.30811595916748, 12.158992767333984, 13.009870529174805, 13.860747337341309, 14.711624145507812, 15.562501907348633, 16.413379669189453, 17.26425552368164, 18.11513328552246, 18.96601104736328, 19.81688690185547, 20.66776466369629, 21.51864242553711, 22.369518280029297, 23.220396041870117, 24.071273803710938, 24.922149658203125, 25.773027420043945, 26.623905181884766, 27.474781036376953]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 3.0, 7.0, 11.0, 16.0, 18.0, 16.0, 17.0, 17.0, 17.0, 28.0, 35.0, 36.0, 54.0, 41.0, 43.0, 42.0, 54.0, 42.0, 48.0, 45.0, 42.0, 40.0, 39.0, 53.0, 26.0, 31.0, 25.0, 25.0, 13.0, 17.0, 25.0, 23.0, 18.0, 5.0, 4.0, 7.0, 3.0, 6.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.7578125, -2.678955078125, -2.60009765625, -2.521240234375, -2.4423828125, -2.363525390625, -2.28466796875, -2.205810546875, -2.126953125, -2.048095703125, -1.96923828125, -1.890380859375, -1.8115234375, -1.732666015625, -1.65380859375, -1.574951171875, -1.49609375, -1.417236328125, -1.33837890625, -1.259521484375, -1.1806640625, -1.101806640625, -1.02294921875, -0.944091796875, -0.865234375, -0.786376953125, -0.70751953125, -0.628662109375, -0.5498046875, -0.470947265625, -0.39208984375, -0.313232421875, -0.234375, -0.155517578125, -0.07666015625, 0.002197265625, 0.0810546875, 0.159912109375, 0.23876953125, 0.317626953125, 0.396484375, 0.475341796875, 0.55419921875, 0.633056640625, 0.7119140625, 0.790771484375, 0.86962890625, 0.948486328125, 1.02734375, 1.106201171875, 1.18505859375, 1.263916015625, 1.3427734375, 1.421630859375, 1.50048828125, 1.579345703125, 1.658203125, 1.737060546875, 1.81591796875, 1.894775390625, 1.9736328125, 2.052490234375, 2.13134765625, 2.210205078125, 2.2890625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 12.0, 9.0, 5.0, 17.0, 12.0, 30.0, 38.0, 63.0, 97.0, 195.0, 357.0, 801.0, 1907.0, 4851.0, 13534.0, 40106.0, 130445.0, 514235.0, 1719316.0, 1305489.0, 328352.0, 89205.0, 28382.0, 10036.0, 3787.0, 1522.0, 692.0, 329.0, 169.0, 90.0, 71.0, 35.0, 40.0, 22.0, 7.0, 9.0, 5.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.31640625, -4.18499755859375, -4.0535888671875, -3.92218017578125, -3.790771484375, -3.65936279296875, -3.5279541015625, -3.39654541015625, -3.26513671875, -3.13372802734375, -3.0023193359375, -2.87091064453125, -2.739501953125, -2.60809326171875, -2.4766845703125, -2.34527587890625, -2.2138671875, -2.08245849609375, -1.9510498046875, -1.81964111328125, -1.688232421875, -1.55682373046875, -1.4254150390625, -1.29400634765625, -1.16259765625, -1.03118896484375, -0.8997802734375, -0.76837158203125, -0.636962890625, -0.50555419921875, -0.3741455078125, -0.24273681640625, -0.111328125, 0.02008056640625, 0.1514892578125, 0.28289794921875, 0.414306640625, 0.54571533203125, 0.6771240234375, 0.80853271484375, 0.93994140625, 1.07135009765625, 1.2027587890625, 1.33416748046875, 1.465576171875, 1.59698486328125, 1.7283935546875, 1.85980224609375, 1.9912109375, 2.12261962890625, 2.2540283203125, 2.38543701171875, 2.516845703125, 2.64825439453125, 2.7796630859375, 2.91107177734375, 3.04248046875, 3.17388916015625, 3.3052978515625, 3.43670654296875, 3.568115234375, 3.69952392578125, 3.8309326171875, 3.96234130859375, 4.09375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 15.0, 11.0, 13.0, 27.0, 40.0, 51.0, 75.0, 115.0, 175.0, 241.0, 284.0, 398.0, 467.0, 476.0, 444.0, 350.0, 246.0, 168.0, 146.0, 117.0, 67.0, 44.0, 24.0, 19.0, 18.0, 17.0, 10.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5, -5.29052734375, -5.0810546875, -4.87158203125, -4.662109375, -4.45263671875, -4.2431640625, -4.03369140625, -3.82421875, -3.61474609375, -3.4052734375, -3.19580078125, -2.986328125, -2.77685546875, -2.5673828125, -2.35791015625, -2.1484375, -1.93896484375, -1.7294921875, -1.52001953125, -1.310546875, -1.10107421875, -0.8916015625, -0.68212890625, -0.47265625, -0.26318359375, -0.0537109375, 0.15576171875, 0.365234375, 0.57470703125, 0.7841796875, 0.99365234375, 1.203125, 1.41259765625, 1.6220703125, 1.83154296875, 2.041015625, 2.25048828125, 2.4599609375, 2.66943359375, 2.87890625, 3.08837890625, 3.2978515625, 3.50732421875, 3.716796875, 3.92626953125, 4.1357421875, 4.34521484375, 4.5546875, 4.76416015625, 4.9736328125, 5.18310546875, 5.392578125, 5.60205078125, 5.8115234375, 6.02099609375, 6.23046875, 6.43994140625, 6.6494140625, 6.85888671875, 7.068359375, 7.27783203125, 7.4873046875, 7.69677734375, 7.90625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 12.0, 21.0, 36.0, 36.0, 49.0, 102.0, 160.0, 355.0, 830.0, 2390.0, 9568.0, 48288.0, 286479.0, 1733172.0, 1757986.0, 292252.0, 48830.0, 9590.0, 2526.0, 785.0, 377.0, 172.0, 80.0, 74.0, 41.0, 23.0, 17.0, 10.0, 8.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9921875, -10.6868896484375, -10.381591796875, -10.0762939453125, -9.77099609375, -9.4656982421875, -9.160400390625, -8.8551025390625, -8.5498046875, -8.2445068359375, -7.939208984375, -7.6339111328125, -7.32861328125, -7.0233154296875, -6.718017578125, -6.4127197265625, -6.107421875, -5.8021240234375, -5.496826171875, -5.1915283203125, -4.88623046875, -4.5809326171875, -4.275634765625, -3.9703369140625, -3.6650390625, -3.3597412109375, -3.054443359375, -2.7491455078125, -2.44384765625, -2.1385498046875, -1.833251953125, -1.5279541015625, -1.22265625, -0.9173583984375, -0.612060546875, -0.3067626953125, -0.00146484375, 0.3038330078125, 0.609130859375, 0.9144287109375, 1.2197265625, 1.5250244140625, 1.830322265625, 2.1356201171875, 2.44091796875, 2.7462158203125, 3.051513671875, 3.3568115234375, 3.662109375, 3.9674072265625, 4.272705078125, 4.5780029296875, 4.88330078125, 5.1885986328125, 5.493896484375, 5.7991943359375, 6.1044921875, 6.4097900390625, 6.715087890625, 7.0203857421875, 7.32568359375, 7.6309814453125, 7.936279296875, 8.2415771484375, 8.546875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 6.0, 22.0, 40.0, 58.0, 98.0, 122.0, 113.0, 140.0, 122.0, 97.0, 76.0, 57.0, 30.0, 14.0, 9.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.038944244384766, -35.72954559326172, -34.420143127441406, -33.11074447631836, -31.801342010498047, -30.491943359375, -29.18254280090332, -27.87314224243164, -26.56374168395996, -25.25434112548828, -23.9449405670166, -22.635540008544922, -21.326141357421875, -20.016738891601562, -18.707340240478516, -17.397939682006836, -16.088539123535156, -14.779138565063477, -13.469738006591797, -12.160338401794434, -10.850937843322754, -9.541537284851074, -8.232137680053711, -6.922737121582031, -5.613336563110352, -4.303936004638672, -2.9945359230041504, -1.6851356029510498, -0.3757352828979492, 0.9336652755737305, 2.243065357208252, 3.5524654388427734, 4.8618621826171875, 6.171262741088867, 7.480662822723389, 8.79006290435791, 10.09946346282959, 11.40886402130127, 12.718263626098633, 14.027664184570312, 15.337064743041992, 16.646465301513672, 17.95586585998535, 19.26526641845703, 20.574665069580078, 21.88406753540039, 23.193466186523438, 24.502866744995117, 25.812267303466797, 27.121667861938477, 28.431068420410156, 29.740468978881836, 31.049869537353516, 32.35926818847656, 33.668670654296875, 34.97806930541992, 36.28746795654297, 37.596866607666016, 38.90626907348633, 40.215667724609375, 41.52507019042969, 42.834468841552734, 44.14387130737305, 45.453269958496094, 46.762672424316406]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 2.0, 3.0, 4.0, 7.0, 2.0, 10.0, 11.0, 11.0, 19.0, 15.0, 19.0, 31.0, 25.0, 25.0, 17.0, 21.0, 21.0, 34.0, 35.0, 35.0, 34.0, 40.0, 43.0, 53.0, 35.0, 42.0, 34.0, 34.0, 38.0, 23.0, 35.0, 22.0, 29.0, 28.0, 24.0, 21.0, 15.0, 7.0, 14.0, 15.0, 12.0, 8.0, 12.0, 7.0, 6.0, 1.0, 7.0, 4.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0], "bins": [-18.312238693237305, -17.75177001953125, -17.191301345825195, -16.63083267211914, -16.070363998413086, -15.509895324707031, -14.949426651000977, -14.388957977294922, -13.828489303588867, -13.268020629882812, -12.707551956176758, -12.147083282470703, -11.586614608764648, -11.026145935058594, -10.465677261352539, -9.905208587646484, -9.344738960266113, -8.784270286560059, -8.223801612854004, -7.663332939147949, -7.1028642654418945, -6.54239559173584, -5.981926441192627, -5.421457767486572, -4.860989093780518, -4.300520420074463, -3.740051746368408, -3.1795828342437744, -2.6191141605377197, -2.058645486831665, -1.4981765747070312, -0.9377079010009766, -0.3772392272949219, 0.1832295060157776, 0.743698239326477, 1.3041670322418213, 1.864635705947876, 2.4251043796539307, 2.9855732917785645, 3.546041965484619, 4.106510639190674, 4.6669793128967285, 5.227447986602783, 5.787917137145996, 6.348385810852051, 6.9088544845581055, 7.46932315826416, 8.029791831970215, 8.59026050567627, 9.150729179382324, 9.711197853088379, 10.271666526794434, 10.832135200500488, 11.392603874206543, 11.953073501586914, 12.513542175292969, 13.074010848999023, 13.634479522705078, 14.194948196411133, 14.755416870117188, 15.315885543823242, 15.876354217529297, 16.43682289123535, 16.997291564941406, 17.55776023864746]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 3.0, 15.0, 16.0, 12.0, 20.0, 21.0, 26.0, 29.0, 34.0, 46.0, 49.0, 40.0, 40.0, 43.0, 34.0, 48.0, 47.0, 29.0, 39.0, 53.0, 47.0, 37.0, 33.0, 35.0, 28.0, 36.0, 26.0, 17.0, 13.0, 13.0, 12.0, 16.0, 8.0, 11.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.630859375, -2.552490234375, -2.47412109375, -2.395751953125, -2.3173828125, -2.239013671875, -2.16064453125, -2.082275390625, -2.00390625, -1.925537109375, -1.84716796875, -1.768798828125, -1.6904296875, -1.612060546875, -1.53369140625, -1.455322265625, -1.376953125, -1.298583984375, -1.22021484375, -1.141845703125, -1.0634765625, -0.985107421875, -0.90673828125, -0.828369140625, -0.75, -0.671630859375, -0.59326171875, -0.514892578125, -0.4365234375, -0.358154296875, -0.27978515625, -0.201416015625, -0.123046875, -0.044677734375, 0.03369140625, 0.112060546875, 0.1904296875, 0.268798828125, 0.34716796875, 0.425537109375, 0.50390625, 0.582275390625, 0.66064453125, 0.739013671875, 0.8173828125, 0.895751953125, 0.97412109375, 1.052490234375, 1.130859375, 1.209228515625, 1.28759765625, 1.365966796875, 1.4443359375, 1.522705078125, 1.60107421875, 1.679443359375, 1.7578125, 1.836181640625, 1.91455078125, 1.992919921875, 2.0712890625, 2.149658203125, 2.22802734375, 2.306396484375, 2.384765625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 5.0, 12.0, 23.0, 25.0, 57.0, 85.0, 156.0, 249.0, 374.0, 598.0, 1071.0, 1581.0, 2520.0, 3773.0, 5536.0, 8497.0, 11886.0, 16715.0, 23395.0, 30924.0, 40204.0, 49728.0, 59956.0, 69844.0, 77759.0, 82971.0, 85304.0, 82525.0, 76951.0, 68237.0, 58435.0, 48606.0, 38235.0, 29538.0, 22012.0, 16081.0, 11377.0, 7956.0, 5411.0, 3501.0, 2397.0, 1568.0, 961.0, 638.0, 333.0, 230.0, 132.0, 74.0, 47.0, 34.0, 17.0, 11.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.93896484375, -0.9081039428710938, -0.8772430419921875, -0.8463821411132812, -0.815521240234375, -0.7846603393554688, -0.7537994384765625, -0.7229385375976562, -0.69207763671875, -0.6612167358398438, -0.6303558349609375, -0.5994949340820312, -0.568634033203125, -0.5377731323242188, -0.5069122314453125, -0.47605133056640625, -0.4451904296875, -0.41432952880859375, -0.3834686279296875, -0.35260772705078125, -0.321746826171875, -0.29088592529296875, -0.2600250244140625, -0.22916412353515625, -0.19830322265625, -0.16744232177734375, -0.1365814208984375, -0.10572052001953125, -0.074859619140625, -0.04399871826171875, -0.0131378173828125, 0.01772308349609375, 0.048583984375, 0.07944488525390625, 0.1103057861328125, 0.14116668701171875, 0.172027587890625, 0.20288848876953125, 0.2337493896484375, 0.26461029052734375, 0.29547119140625, 0.32633209228515625, 0.3571929931640625, 0.38805389404296875, 0.418914794921875, 0.44977569580078125, 0.4806365966796875, 0.5114974975585938, 0.5423583984375, 0.5732192993164062, 0.6040802001953125, 0.6349411010742188, 0.665802001953125, 0.6966629028320312, 0.7275238037109375, 0.7583847045898438, 0.78924560546875, 0.8201065063476562, 0.8509674072265625, 0.8818283081054688, 0.912689208984375, 0.9435501098632812, 0.9744110107421875, 1.0052719116210938, 1.0361328125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 4.0, 2.0, 9.0, 9.0, 11.0, 5.0, 16.0, 13.0, 13.0, 20.0, 19.0, 30.0, 31.0, 23.0, 31.0, 32.0, 42.0, 34.0, 37.0, 33.0, 39.0, 41.0, 1056.0, 40.0, 34.0, 39.0, 39.0, 35.0, 33.0, 40.0, 45.0, 31.0, 25.0, 22.0, 13.0, 23.0, 7.0, 10.0, 9.0, 10.0, 6.0, 7.0, 5.0, 6.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.12109375, -2.047393798828125, -1.97369384765625, -1.899993896484375, -1.8262939453125, -1.752593994140625, -1.67889404296875, -1.605194091796875, -1.531494140625, -1.457794189453125, -1.38409423828125, -1.310394287109375, -1.2366943359375, -1.162994384765625, -1.08929443359375, -1.015594482421875, -0.94189453125, -0.868194580078125, -0.79449462890625, -0.720794677734375, -0.6470947265625, -0.573394775390625, -0.49969482421875, -0.425994873046875, -0.352294921875, -0.278594970703125, -0.20489501953125, -0.131195068359375, -0.0574951171875, 0.016204833984375, 0.08990478515625, 0.163604736328125, 0.2373046875, 0.311004638671875, 0.38470458984375, 0.458404541015625, 0.5321044921875, 0.605804443359375, 0.67950439453125, 0.753204345703125, 0.826904296875, 0.900604248046875, 0.97430419921875, 1.048004150390625, 1.1217041015625, 1.195404052734375, 1.26910400390625, 1.342803955078125, 1.41650390625, 1.490203857421875, 1.56390380859375, 1.637603759765625, 1.7113037109375, 1.785003662109375, 1.85870361328125, 1.932403564453125, 2.006103515625, 2.079803466796875, 2.15350341796875, 2.227203369140625, 2.3009033203125, 2.374603271484375, 2.44830322265625, 2.522003173828125, 2.595703125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 11.0, 14.0, 16.0, 39.0, 38.0, 56.0, 116.0, 160.0, 213.0, 322.0, 516.0, 771.0, 1107.0, 1651.0, 2471.0, 3520.0, 5341.0, 7559.0, 11266.0, 17031.0, 30764.0, 107009.0, 1759047.0, 73183.0, 26684.0, 15913.0, 10273.0, 7079.0, 4755.0, 3229.0, 2328.0, 1527.0, 1035.0, 700.0, 462.0, 328.0, 197.0, 140.0, 88.0, 67.0, 27.0, 20.0, 12.0, 7.0, 11.0, 10.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.4296875, -2.34979248046875, -2.2698974609375, -2.19000244140625, -2.110107421875, -2.03021240234375, -1.9503173828125, -1.87042236328125, -1.79052734375, -1.71063232421875, -1.6307373046875, -1.55084228515625, -1.470947265625, -1.39105224609375, -1.3111572265625, -1.23126220703125, -1.1513671875, -1.07147216796875, -0.9915771484375, -0.91168212890625, -0.831787109375, -0.75189208984375, -0.6719970703125, -0.59210205078125, -0.51220703125, -0.43231201171875, -0.3524169921875, -0.27252197265625, -0.192626953125, -0.11273193359375, -0.0328369140625, 0.04705810546875, 0.126953125, 0.20684814453125, 0.2867431640625, 0.36663818359375, 0.446533203125, 0.52642822265625, 0.6063232421875, 0.68621826171875, 0.76611328125, 0.84600830078125, 0.9259033203125, 1.00579833984375, 1.085693359375, 1.16558837890625, 1.2454833984375, 1.32537841796875, 1.4052734375, 1.48516845703125, 1.5650634765625, 1.64495849609375, 1.724853515625, 1.80474853515625, 1.8846435546875, 1.96453857421875, 2.04443359375, 2.12432861328125, 2.2042236328125, 2.28411865234375, 2.364013671875, 2.44390869140625, 2.5238037109375, 2.60369873046875, 2.68359375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 5.0, 8.0, 5.0, 14.0, 21.0, 20.0, 16.0, 23.0, 38.0, 31.0, 27.0, 27.0, 30.0, 25.0, 24.0, 32.0, 35.0, 26.0, 32.0, 22.0, 26.0, 37.0, 29.0, 26.0, 29.0, 27.0, 25.0, 33.0, 42.0, 35.0, 25.0, 36.0, 33.0, 25.0, 18.0, 15.0, 13.0, 12.0, 5.0, 7.0, 10.0, 5.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 3.0], "bins": [-0.18505859375, -0.17985153198242188, -0.17464447021484375, -0.16943740844726562, -0.1642303466796875, -0.15902328491210938, -0.15381622314453125, -0.14860916137695312, -0.143402099609375, -0.13819503784179688, -0.13298797607421875, -0.12778091430664062, -0.1225738525390625, -0.11736679077148438, -0.11215972900390625, -0.10695266723632812, -0.10174560546875, -0.09653854370117188, -0.09133148193359375, -0.08612442016601562, -0.0809173583984375, -0.07571029663085938, -0.07050323486328125, -0.06529617309570312, -0.060089111328125, -0.054882049560546875, -0.04967498779296875, -0.044467926025390625, -0.0392608642578125, -0.034053802490234375, -0.02884674072265625, -0.023639678955078125, -0.0184326171875, -0.013225555419921875, -0.00801849365234375, -0.002811431884765625, 0.0023956298828125, 0.007602691650390625, 0.01280975341796875, 0.018016815185546875, 0.023223876953125, 0.028430938720703125, 0.03363800048828125, 0.038845062255859375, 0.0440521240234375, 0.049259185791015625, 0.05446624755859375, 0.059673309326171875, 0.06488037109375, 0.07008743286132812, 0.07529449462890625, 0.08050155639648438, 0.0857086181640625, 0.09091567993164062, 0.09612274169921875, 0.10132980346679688, 0.106536865234375, 0.11174392700195312, 0.11695098876953125, 0.12215805053710938, 0.1273651123046875, 0.13257217407226562, 0.13777923583984375, 0.14298629760742188, 0.148193359375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 7.0, 3.0, 3.0, 7.0, 13.0, 9.0, 13.0, 12.0, 32.0, 30.0, 36.0, 58.0, 74.0, 98.0, 130.0, 172.0, 201.0, 225.0, 238.0, 309.0, 428.0, 979.0, 27124.0, 917192.0, 97306.0, 1588.0, 494.0, 352.0, 283.0, 235.0, 209.0, 146.0, 122.0, 87.0, 87.0, 67.0, 41.0, 45.0, 34.0, 22.0, 13.0, 11.0, 7.0, 5.0, 6.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.390625, -2.3040771484375, -2.217529296875, -2.1309814453125, -2.04443359375, -1.9578857421875, -1.871337890625, -1.7847900390625, -1.6982421875, -1.6116943359375, -1.525146484375, -1.4385986328125, -1.35205078125, -1.2655029296875, -1.178955078125, -1.0924072265625, -1.005859375, -0.9193115234375, -0.832763671875, -0.7462158203125, -0.65966796875, -0.5731201171875, -0.486572265625, -0.4000244140625, -0.3134765625, -0.2269287109375, -0.140380859375, -0.0538330078125, 0.03271484375, 0.1192626953125, 0.205810546875, 0.2923583984375, 0.37890625, 0.4654541015625, 0.552001953125, 0.6385498046875, 0.72509765625, 0.8116455078125, 0.898193359375, 0.9847412109375, 1.0712890625, 1.1578369140625, 1.244384765625, 1.3309326171875, 1.41748046875, 1.5040283203125, 1.590576171875, 1.6771240234375, 1.763671875, 1.8502197265625, 1.936767578125, 2.0233154296875, 2.10986328125, 2.1964111328125, 2.282958984375, 2.3695068359375, 2.4560546875, 2.5426025390625, 2.629150390625, 2.7156982421875, 2.80224609375, 2.8887939453125, 2.975341796875, 3.0618896484375, 3.1484375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 14.0, 56.0, 157.0, 461.0, 238.0, 54.0, 21.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0047173500061035, -5.820735454559326, -5.636753559112549, -5.4527716636657715, -5.268789768218994, -5.084807872772217, -4.9008259773254395, -4.716844081878662, -4.532862186431885, -4.348880290985107, -4.16489839553833, -3.9809165000915527, -3.7969346046447754, -3.612952709197998, -3.4289708137512207, -3.2449889183044434, -3.061007022857666, -2.8770251274108887, -2.6930432319641113, -2.509061336517334, -2.3250794410705566, -2.1410975456237793, -1.957115650177002, -1.7731337547302246, -1.5891518592834473, -1.40516996383667, -1.2211880683898926, -1.0372061729431152, -0.8532242774963379, -0.6692423820495605, -0.4852604866027832, -0.30127859115600586, -0.11729717254638672, 0.06668472290039062, 0.25066661834716797, 0.4346485137939453, 0.6186304092407227, 0.8026123046875, 0.9865942001342773, 1.1705760955810547, 1.354557991027832, 1.5385398864746094, 1.7225217819213867, 1.906503677368164, 2.0904855728149414, 2.2744674682617188, 2.458449363708496, 2.6424312591552734, 2.826413154602051, 3.010395050048828, 3.1943769454956055, 3.378358840942383, 3.56234073638916, 3.7463226318359375, 3.930304527282715, 4.114286422729492, 4.2982683181762695, 4.482250213623047, 4.666232109069824, 4.850214004516602, 5.034195899963379, 5.218177795410156, 5.402159690856934, 5.586141586303711, 5.770123481750488]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 8.0, 12.0, 10.0, 13.0, 18.0, 11.0, 21.0, 24.0, 31.0, 22.0, 45.0, 47.0, 49.0, 55.0, 46.0, 59.0, 50.0, 49.0, 63.0, 52.0, 50.0, 42.0, 43.0, 25.0, 34.0, 27.0, 26.0, 18.0, 20.0, 12.0, 10.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7321114540100098, -1.6587269306182861, -1.5853424072265625, -1.5119577646255493, -1.4385732412338257, -1.365188717842102, -1.2918040752410889, -1.2184195518493652, -1.1450350284576416, -1.071650505065918, -0.9982659220695496, -0.9248813390731812, -0.8514968156814575, -0.7781122922897339, -0.7047277092933655, -0.6313431262969971, -0.5579586029052734, -0.4845740497112274, -0.4111894965171814, -0.3378049433231354, -0.26442039012908936, -0.19103583693504333, -0.11765128374099731, -0.044266700744628906, 0.029117822647094727, 0.10250237584114075, 0.17588692903518677, 0.2492714822292328, 0.3226560354232788, 0.39604058861732483, 0.46942514181137085, 0.5428097248077393, 0.6161942481994629, 0.6895787715911865, 0.7629633545875549, 0.8363479375839233, 0.909732460975647, 0.9831169843673706, 1.0565016269683838, 1.1298861503601074, 1.203270673751831, 1.2766551971435547, 1.3500397205352783, 1.4234243631362915, 1.4968088865280151, 1.5701934099197388, 1.643578052520752, 1.7169625759124756, 1.7903470993041992, 1.8637316226959229, 1.9371161460876465, 2.01050066947937, 2.0838851928710938, 2.1572699546813965, 2.23065447807312, 2.3040390014648438, 2.3774235248565674, 2.450808048248291, 2.5241925716400146, 2.5975770950317383, 2.670961856842041, 2.7443463802337646, 2.8177309036254883, 2.891115427017212, 2.9644999504089355]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 11.0, 5.0, 11.0, 10.0, 8.0, 13.0, 20.0, 22.0, 24.0, 37.0, 26.0, 32.0, 45.0, 37.0, 46.0, 44.0, 37.0, 44.0, 37.0, 46.0, 48.0, 30.0, 33.0, 34.0, 26.0, 32.0, 27.0, 33.0, 28.0, 28.0, 20.0, 14.0, 11.0, 14.0, 12.0, 9.0, 9.0, 8.0, 4.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-2.37109375, -2.2989501953125, -2.226806640625, -2.1546630859375, -2.08251953125, -2.0103759765625, -1.938232421875, -1.8660888671875, -1.7939453125, -1.7218017578125, -1.649658203125, -1.5775146484375, -1.50537109375, -1.4332275390625, -1.361083984375, -1.2889404296875, -1.216796875, -1.1446533203125, -1.072509765625, -1.0003662109375, -0.92822265625, -0.8560791015625, -0.783935546875, -0.7117919921875, -0.6396484375, -0.5675048828125, -0.495361328125, -0.4232177734375, -0.35107421875, -0.2789306640625, -0.206787109375, -0.1346435546875, -0.0625, 0.0096435546875, 0.081787109375, 0.1539306640625, 0.22607421875, 0.2982177734375, 0.370361328125, 0.4425048828125, 0.5146484375, 0.5867919921875, 0.658935546875, 0.7310791015625, 0.80322265625, 0.8753662109375, 0.947509765625, 1.0196533203125, 1.091796875, 1.1639404296875, 1.236083984375, 1.3082275390625, 1.38037109375, 1.4525146484375, 1.524658203125, 1.5968017578125, 1.6689453125, 1.7410888671875, 1.813232421875, 1.8853759765625, 1.95751953125, 2.0296630859375, 2.101806640625, 2.1739501953125, 2.24609375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 5.0, 3.0, 5.0, 12.0, 24.0, 30.0, 41.0, 77.0, 114.0, 183.0, 319.0, 513.0, 842.0, 1267.0, 2069.0, 3258.0, 5283.0, 8448.0, 14152.0, 25121.0, 45386.0, 87150.0, 167733.0, 256730.0, 198515.0, 105006.0, 54608.0, 29086.0, 16628.0, 9667.0, 6187.0, 3840.0, 2351.0, 1490.0, 905.0, 552.0, 372.0, 219.0, 144.0, 91.0, 58.0, 33.0, 13.0, 13.0, 10.0, 3.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.111328125, -2.0485687255859375, -1.985809326171875, -1.9230499267578125, -1.86029052734375, -1.7975311279296875, -1.734771728515625, -1.6720123291015625, -1.6092529296875, -1.5464935302734375, -1.483734130859375, -1.4209747314453125, -1.35821533203125, -1.2954559326171875, -1.232696533203125, -1.1699371337890625, -1.107177734375, -1.0444183349609375, -0.981658935546875, -0.9188995361328125, -0.85614013671875, -0.7933807373046875, -0.730621337890625, -0.6678619384765625, -0.6051025390625, -0.5423431396484375, -0.479583740234375, -0.4168243408203125, -0.35406494140625, -0.2913055419921875, -0.228546142578125, -0.1657867431640625, -0.10302734375, -0.0402679443359375, 0.022491455078125, 0.0852508544921875, 0.14801025390625, 0.2107696533203125, 0.273529052734375, 0.3362884521484375, 0.3990478515625, 0.4618072509765625, 0.524566650390625, 0.5873260498046875, 0.65008544921875, 0.7128448486328125, 0.775604248046875, 0.8383636474609375, 0.901123046875, 0.9638824462890625, 1.026641845703125, 1.0894012451171875, 1.15216064453125, 1.2149200439453125, 1.277679443359375, 1.3404388427734375, 1.4031982421875, 1.4659576416015625, 1.528717041015625, 1.5914764404296875, 1.65423583984375, 1.7169952392578125, 1.779754638671875, 1.8425140380859375, 1.9052734375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 7.0, 18.0, 20.0, 18.0, 25.0, 31.0, 33.0, 36.0, 36.0, 49.0, 65.0, 73.0, 129.0, 250.0, 1490.0, 203.0, 113.0, 78.0, 58.0, 38.0, 40.0, 37.0, 36.0, 24.0, 25.0, 13.0, 17.0, 15.0, 14.0, 15.0, 5.0, 4.0, 5.0, 0.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.09375, -11.7698974609375, -11.446044921875, -11.1221923828125, -10.79833984375, -10.4744873046875, -10.150634765625, -9.8267822265625, -9.5029296875, -9.1790771484375, -8.855224609375, -8.5313720703125, -8.20751953125, -7.8836669921875, -7.559814453125, -7.2359619140625, -6.912109375, -6.5882568359375, -6.264404296875, -5.9405517578125, -5.61669921875, -5.2928466796875, -4.968994140625, -4.6451416015625, -4.3212890625, -3.9974365234375, -3.673583984375, -3.3497314453125, -3.02587890625, -2.7020263671875, -2.378173828125, -2.0543212890625, -1.73046875, -1.4066162109375, -1.082763671875, -0.7589111328125, -0.43505859375, -0.1112060546875, 0.212646484375, 0.5364990234375, 0.8603515625, 1.1842041015625, 1.508056640625, 1.8319091796875, 2.15576171875, 2.4796142578125, 2.803466796875, 3.1273193359375, 3.451171875, 3.7750244140625, 4.098876953125, 4.4227294921875, 4.74658203125, 5.0704345703125, 5.394287109375, 5.7181396484375, 6.0419921875, 6.3658447265625, 6.689697265625, 7.0135498046875, 7.33740234375, 7.6612548828125, 7.985107421875, 8.3089599609375, 8.6328125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 0.0, 4.0, 7.0, 3.0, 10.0, 8.0, 16.0, 19.0, 18.0, 18.0, 23.0, 43.0, 50.0, 64.0, 93.0, 159.0, 249.0, 463.0, 1057.0, 3299.0, 16182.0, 155278.0, 2566774.0, 367387.0, 26791.0, 4806.0, 1443.0, 570.0, 284.0, 175.0, 104.0, 73.0, 57.0, 44.0, 28.0, 20.0, 28.0, 12.0, 13.0, 8.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0234375, -10.66357421875, -10.3037109375, -9.94384765625, -9.583984375, -9.22412109375, -8.8642578125, -8.50439453125, -8.14453125, -7.78466796875, -7.4248046875, -7.06494140625, -6.705078125, -6.34521484375, -5.9853515625, -5.62548828125, -5.265625, -4.90576171875, -4.5458984375, -4.18603515625, -3.826171875, -3.46630859375, -3.1064453125, -2.74658203125, -2.38671875, -2.02685546875, -1.6669921875, -1.30712890625, -0.947265625, -0.58740234375, -0.2275390625, 0.13232421875, 0.4921875, 0.85205078125, 1.2119140625, 1.57177734375, 1.931640625, 2.29150390625, 2.6513671875, 3.01123046875, 3.37109375, 3.73095703125, 4.0908203125, 4.45068359375, 4.810546875, 5.17041015625, 5.5302734375, 5.89013671875, 6.25, 6.60986328125, 6.9697265625, 7.32958984375, 7.689453125, 8.04931640625, 8.4091796875, 8.76904296875, 9.12890625, 9.48876953125, 9.8486328125, 10.20849609375, 10.568359375, 10.92822265625, 11.2880859375, 11.64794921875, 12.0078125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [33.0, 460.0, 476.0, 47.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1238884925842285, -3.668919563293457, -0.21395063400268555, 3.2410178184509277, 6.695987224578857, 10.150957107543945, 13.605924606323242, 17.060894012451172, 20.5158634185791, 23.97083282470703, 27.425800323486328, 30.880769729614258, 34.33573913574219, 37.79071044921875, 41.24567413330078, 44.700645446777344, 48.15561294555664, 51.61058044433594, 55.0655517578125, 58.5205192565918, 61.975486755371094, 65.43045806884766, 68.88542175292969, 72.34039306640625, 75.79536437988281, 79.25033569335938, 82.7052993774414, 86.16027069091797, 89.61524200439453, 93.07020568847656, 96.52517700195312, 99.98014831542969, 103.43511962890625, 106.89009094238281, 110.34505462646484, 113.8000259399414, 117.25499725341797, 120.7099609375, 124.16493225097656, 127.61990356445312, 131.0748748779297, 134.52984619140625, 137.9848175048828, 141.43978881835938, 144.89474487304688, 148.34971618652344, 151.8046875, 155.25965881347656, 158.71463012695312, 162.1696014404297, 165.62457275390625, 169.07952880859375, 172.5345001220703, 175.98947143554688, 179.44444274902344, 182.8994140625, 186.3543701171875, 189.80934143066406, 193.26431274414062, 196.71926879882812, 200.1742401123047, 203.62921142578125, 207.0841827392578, 210.53915405273438, 213.99412536621094]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 7.0, 5.0, 8.0, 12.0, 7.0, 6.0, 11.0, 10.0, 17.0, 17.0, 20.0, 25.0, 31.0, 21.0, 30.0, 34.0, 28.0, 36.0, 39.0, 32.0, 42.0, 44.0, 36.0, 32.0, 44.0, 36.0, 38.0, 36.0, 40.0, 35.0, 24.0, 29.0, 21.0, 23.0, 27.0, 13.0, 19.0, 8.0, 15.0, 9.0, 5.0, 7.0, 5.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.685508728027344, -24.850847244262695, -24.01618766784668, -23.18152618408203, -22.346866607666016, -21.512205123901367, -20.67754554748535, -19.842884063720703, -19.008224487304688, -18.17356300354004, -17.338903427124023, -16.504241943359375, -15.66958236694336, -14.834920883178711, -14.000261306762695, -13.165599822998047, -12.330939292907715, -11.496278762817383, -10.66161823272705, -9.826957702636719, -8.992297172546387, -8.157636642456055, -7.3229756355285645, -6.488315105438232, -5.6536545753479, -4.818994045257568, -3.9843335151672363, -3.149672746658325, -2.315012216567993, -1.480351448059082, -0.64569091796875, 0.18896961212158203, 1.023630142211914, 1.858290672302246, 2.692951202392578, 3.5276119709014893, 4.362272262573242, 5.196933269500732, 6.0315937995910645, 6.8662543296813965, 7.7009148597717285, 8.535575866699219, 9.37023639678955, 10.204896926879883, 11.039557456970215, 11.874217987060547, 12.708878517150879, 13.543539047241211, 14.378199577331543, 15.212860107421875, 16.047521591186523, 16.88218116760254, 17.716842651367188, 18.551502227783203, 19.38616371154785, 20.220823287963867, 21.055484771728516, 21.890146255493164, 22.72480583190918, 23.559467315673828, 24.394126892089844, 25.228788375854492, 26.063447952270508, 26.898109436035156, 27.732769012451172]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 4.0, 14.0, 8.0, 17.0, 12.0, 16.0, 18.0, 20.0, 20.0, 21.0, 25.0, 36.0, 33.0, 43.0, 44.0, 38.0, 40.0, 41.0, 33.0, 42.0, 42.0, 36.0, 35.0, 34.0, 40.0, 42.0, 39.0, 17.0, 23.0, 29.0, 19.0, 12.0, 17.0, 20.0, 14.0, 13.0, 12.0, 6.0, 5.0, 2.0, 5.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.41015625, -2.33319091796875, -2.2562255859375, -2.17926025390625, -2.102294921875, -2.02532958984375, -1.9483642578125, -1.87139892578125, -1.79443359375, -1.71746826171875, -1.6405029296875, -1.56353759765625, -1.486572265625, -1.40960693359375, -1.3326416015625, -1.25567626953125, -1.1787109375, -1.10174560546875, -1.0247802734375, -0.94781494140625, -0.870849609375, -0.79388427734375, -0.7169189453125, -0.63995361328125, -0.56298828125, -0.48602294921875, -0.4090576171875, -0.33209228515625, -0.255126953125, -0.17816162109375, -0.1011962890625, -0.02423095703125, 0.052734375, 0.12969970703125, 0.2066650390625, 0.28363037109375, 0.360595703125, 0.43756103515625, 0.5145263671875, 0.59149169921875, 0.66845703125, 0.74542236328125, 0.8223876953125, 0.89935302734375, 0.976318359375, 1.05328369140625, 1.1302490234375, 1.20721435546875, 1.2841796875, 1.36114501953125, 1.4381103515625, 1.51507568359375, 1.592041015625, 1.66900634765625, 1.7459716796875, 1.82293701171875, 1.89990234375, 1.97686767578125, 2.0538330078125, 2.13079833984375, 2.207763671875, 2.28472900390625, 2.3616943359375, 2.43865966796875, 2.515625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 1.0, 4.0, 6.0, 3.0, 8.0, 10.0, 11.0, 20.0, 21.0, 26.0, 45.0, 55.0, 150.0, 322.0, 988.0, 3248.0, 12910.0, 58032.0, 306913.0, 1727185.0, 1709715.0, 299806.0, 56764.0, 13031.0, 3310.0, 981.0, 344.0, 132.0, 80.0, 46.0, 28.0, 16.0, 23.0, 10.0, 15.0, 9.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.50390625, -6.31805419921875, -6.1322021484375, -5.94635009765625, -5.760498046875, -5.57464599609375, -5.3887939453125, -5.20294189453125, -5.01708984375, -4.83123779296875, -4.6453857421875, -4.45953369140625, -4.273681640625, -4.08782958984375, -3.9019775390625, -3.71612548828125, -3.5302734375, -3.34442138671875, -3.1585693359375, -2.97271728515625, -2.786865234375, -2.60101318359375, -2.4151611328125, -2.22930908203125, -2.04345703125, -1.85760498046875, -1.6717529296875, -1.48590087890625, -1.300048828125, -1.11419677734375, -0.9283447265625, -0.74249267578125, -0.556640625, -0.37078857421875, -0.1849365234375, 0.00091552734375, 0.186767578125, 0.37261962890625, 0.5584716796875, 0.74432373046875, 0.93017578125, 1.11602783203125, 1.3018798828125, 1.48773193359375, 1.673583984375, 1.85943603515625, 2.0452880859375, 2.23114013671875, 2.4169921875, 2.60284423828125, 2.7886962890625, 2.97454833984375, 3.160400390625, 3.34625244140625, 3.5321044921875, 3.71795654296875, 3.90380859375, 4.08966064453125, 4.2755126953125, 4.46136474609375, 4.647216796875, 4.83306884765625, 5.0189208984375, 5.20477294921875, 5.390625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 7.0, 9.0, 9.0, 18.0, 14.0, 14.0, 24.0, 47.0, 44.0, 51.0, 76.0, 92.0, 114.0, 166.0, 206.0, 258.0, 337.0, 371.0, 360.0, 348.0, 300.0, 261.0, 220.0, 162.0, 121.0, 106.0, 92.0, 54.0, 43.0, 37.0, 28.0, 21.0, 11.0, 16.0, 16.0, 5.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.0234375, -5.8533935546875, -5.683349609375, -5.5133056640625, -5.34326171875, -5.1732177734375, -5.003173828125, -4.8331298828125, -4.6630859375, -4.4930419921875, -4.322998046875, -4.1529541015625, -3.98291015625, -3.8128662109375, -3.642822265625, -3.4727783203125, -3.302734375, -3.1326904296875, -2.962646484375, -2.7926025390625, -2.62255859375, -2.4525146484375, -2.282470703125, -2.1124267578125, -1.9423828125, -1.7723388671875, -1.602294921875, -1.4322509765625, -1.26220703125, -1.0921630859375, -0.922119140625, -0.7520751953125, -0.58203125, -0.4119873046875, -0.241943359375, -0.0718994140625, 0.09814453125, 0.2681884765625, 0.438232421875, 0.6082763671875, 0.7783203125, 0.9483642578125, 1.118408203125, 1.2884521484375, 1.45849609375, 1.6285400390625, 1.798583984375, 1.9686279296875, 2.138671875, 2.3087158203125, 2.478759765625, 2.6488037109375, 2.81884765625, 2.9888916015625, 3.158935546875, 3.3289794921875, 3.4990234375, 3.6690673828125, 3.839111328125, 4.0091552734375, 4.17919921875, 4.3492431640625, 4.519287109375, 4.6893310546875, 4.859375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 14.0, 24.0, 38.0, 57.0, 86.0, 123.0, 184.0, 354.0, 658.0, 1431.0, 4227.0, 15523.0, 69340.0, 335657.0, 1554944.0, 1720592.0, 386177.0, 79047.0, 17818.0, 4674.0, 1636.0, 714.0, 348.0, 231.0, 134.0, 88.0, 38.0, 27.0, 25.0, 10.0, 18.0, 10.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.65625, -8.3861083984375, -8.115966796875, -7.8458251953125, -7.57568359375, -7.3055419921875, -7.035400390625, -6.7652587890625, -6.4951171875, -6.2249755859375, -5.954833984375, -5.6846923828125, -5.41455078125, -5.1444091796875, -4.874267578125, -4.6041259765625, -4.333984375, -4.0638427734375, -3.793701171875, -3.5235595703125, -3.25341796875, -2.9832763671875, -2.713134765625, -2.4429931640625, -2.1728515625, -1.9027099609375, -1.632568359375, -1.3624267578125, -1.09228515625, -0.8221435546875, -0.552001953125, -0.2818603515625, -0.01171875, 0.2584228515625, 0.528564453125, 0.7987060546875, 1.06884765625, 1.3389892578125, 1.609130859375, 1.8792724609375, 2.1494140625, 2.4195556640625, 2.689697265625, 2.9598388671875, 3.22998046875, 3.5001220703125, 3.770263671875, 4.0404052734375, 4.310546875, 4.5806884765625, 4.850830078125, 5.1209716796875, 5.39111328125, 5.6612548828125, 5.931396484375, 6.2015380859375, 6.4716796875, 6.7418212890625, 7.011962890625, 7.2821044921875, 7.55224609375, 7.8223876953125, 8.092529296875, 8.3626708984375, 8.6328125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 6.0, 4.0, 15.0, 17.0, 49.0, 75.0, 89.0, 99.0, 133.0, 146.0, 122.0, 90.0, 79.0, 39.0, 26.0, 15.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.838224411010742, -26.43946075439453, -25.04069709777832, -23.64193344116211, -22.243167877197266, -20.844404220581055, -19.445640563964844, -18.046875, -16.648113250732422, -15.249349594116211, -13.850584983825684, -12.451821327209473, -11.053056716918945, -9.654293060302734, -8.255529403686523, -6.856764793395996, -5.458000183105469, -4.0592360496521, -2.6604721546173096, -1.2617082595825195, 0.1370558738708496, 1.5358200073242188, 2.9345836639404297, 4.333348274230957, 5.732111930847168, 7.130876064300537, 8.529640197753906, 9.928403854370117, 11.327167510986328, 12.725932121276855, 14.124695777893066, 15.523460388183594, 16.922225952148438, 18.32098960876465, 19.71975326538086, 21.118518829345703, 22.517282485961914, 23.916046142578125, 25.314809799194336, 26.713573455810547, 28.11233901977539, 29.5111026763916, 30.909866333007812, 32.308631896972656, 33.707393646240234, 35.10615921020508, 36.504920959472656, 37.9036865234375, 39.302452087402344, 40.70121765136719, 42.099979400634766, 43.49874496459961, 44.89750671386719, 46.29627227783203, 47.695037841796875, 49.09379959106445, 50.49256134033203, 51.891326904296875, 53.29008865356445, 54.6888542175293, 56.087615966796875, 57.48638153076172, 58.88514709472656, 60.28390884399414, 61.682674407958984]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 2.0, 2.0, 6.0, 6.0, 7.0, 9.0, 11.0, 10.0, 24.0, 18.0, 23.0, 24.0, 24.0, 24.0, 22.0, 36.0, 33.0, 42.0, 42.0, 42.0, 39.0, 41.0, 39.0, 40.0, 37.0, 49.0, 47.0, 35.0, 37.0, 28.0, 21.0, 27.0, 15.0, 19.0, 23.0, 19.0, 16.0, 19.0, 12.0, 4.0, 5.0, 9.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.415010452270508, -20.728939056396484, -20.04286766052246, -19.356796264648438, -18.67072296142578, -17.984651565551758, -17.298580169677734, -16.61250877380371, -15.926436424255371, -15.240365028381348, -14.554292678833008, -13.868221282958984, -13.182149887084961, -12.496077537536621, -11.810006141662598, -11.123933792114258, -10.437862396240234, -9.751791000366211, -9.065718650817871, -8.379647254943848, -7.693575382232666, -7.007503509521484, -6.321432113647461, -5.635360240936279, -4.949288368225098, -4.263216495513916, -3.5771448612213135, -2.891073226928711, -2.2050013542175293, -1.5189294815063477, -0.8328580856323242, -0.14678621292114258, 0.5392875671386719, 1.225359320640564, 1.911431074142456, 2.5975027084350586, 3.2835745811462402, 3.969646453857422, 4.655717849731445, 5.341789722442627, 6.027861595153809, 6.71393346786499, 7.400005340576172, 8.086076736450195, 8.772148132324219, 9.458220481872559, 10.144291877746582, 10.830364227294922, 11.516435623168945, 12.202507019042969, 12.888579368591309, 13.574650764465332, 14.260723114013672, 14.946794509887695, 15.632865905761719, 16.318937301635742, 17.005008697509766, 17.69108009338379, 18.377151489257812, 19.06322479248047, 19.749296188354492, 20.435367584228516, 21.12143898010254, 21.807510375976562, 22.49358367919922]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 8.0, 9.0, 14.0, 16.0, 9.0, 18.0, 26.0, 21.0, 23.0, 34.0, 33.0, 30.0, 44.0, 37.0, 53.0, 31.0, 53.0, 52.0, 45.0, 39.0, 47.0, 43.0, 52.0, 39.0, 29.0, 32.0, 34.0, 17.0, 25.0, 16.0, 15.0, 12.0, 6.0, 13.0, 8.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 5.0, 0.0, 2.0], "bins": [-3.41796875, -3.327392578125, -3.23681640625, -3.146240234375, -3.0556640625, -2.965087890625, -2.87451171875, -2.783935546875, -2.693359375, -2.602783203125, -2.51220703125, -2.421630859375, -2.3310546875, -2.240478515625, -2.14990234375, -2.059326171875, -1.96875, -1.878173828125, -1.78759765625, -1.697021484375, -1.6064453125, -1.515869140625, -1.42529296875, -1.334716796875, -1.244140625, -1.153564453125, -1.06298828125, -0.972412109375, -0.8818359375, -0.791259765625, -0.70068359375, -0.610107421875, -0.51953125, -0.428955078125, -0.33837890625, -0.247802734375, -0.1572265625, -0.066650390625, 0.02392578125, 0.114501953125, 0.205078125, 0.295654296875, 0.38623046875, 0.476806640625, 0.5673828125, 0.657958984375, 0.74853515625, 0.839111328125, 0.9296875, 1.020263671875, 1.11083984375, 1.201416015625, 1.2919921875, 1.382568359375, 1.47314453125, 1.563720703125, 1.654296875, 1.744873046875, 1.83544921875, 1.926025390625, 2.0166015625, 2.107177734375, 2.19775390625, 2.288330078125, 2.37890625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 12.0, 14.0, 28.0, 43.0, 74.0, 139.0, 229.0, 439.0, 680.0, 1123.0, 1812.0, 2978.0, 4505.0, 7130.0, 10766.0, 15968.0, 22554.0, 31166.0, 40787.0, 53032.0, 64792.0, 75836.0, 85606.0, 90940.0, 91921.0, 87532.0, 79324.0, 68422.0, 56394.0, 44301.0, 33755.0, 24607.0, 17612.0, 12066.0, 8072.0, 5245.0, 3324.0, 2256.0, 1271.0, 776.0, 429.0, 271.0, 143.0, 80.0, 49.0, 32.0, 17.0, 5.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.236328125, -1.2001190185546875, -1.163909912109375, -1.1277008056640625, -1.09149169921875, -1.0552825927734375, -1.019073486328125, -0.9828643798828125, -0.9466552734375, -0.9104461669921875, -0.874237060546875, -0.8380279541015625, -0.80181884765625, -0.7656097412109375, -0.729400634765625, -0.6931915283203125, -0.656982421875, -0.6207733154296875, -0.584564208984375, -0.5483551025390625, -0.51214599609375, -0.4759368896484375, -0.439727783203125, -0.4035186767578125, -0.3673095703125, -0.3311004638671875, -0.294891357421875, -0.2586822509765625, -0.22247314453125, -0.1862640380859375, -0.150054931640625, -0.1138458251953125, -0.07763671875, -0.0414276123046875, -0.005218505859375, 0.0309906005859375, 0.06719970703125, 0.1034088134765625, 0.139617919921875, 0.1758270263671875, 0.2120361328125, 0.2482452392578125, 0.284454345703125, 0.3206634521484375, 0.35687255859375, 0.3930816650390625, 0.429290771484375, 0.4654998779296875, 0.501708984375, 0.5379180908203125, 0.574127197265625, 0.6103363037109375, 0.64654541015625, 0.6827545166015625, 0.718963623046875, 0.7551727294921875, 0.7913818359375, 0.8275909423828125, 0.863800048828125, 0.9000091552734375, 0.93621826171875, 0.9724273681640625, 1.008636474609375, 1.0448455810546875, 1.0810546875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 9.0, 8.0, 4.0, 14.0, 17.0, 17.0, 12.0, 15.0, 27.0, 34.0, 24.0, 25.0, 32.0, 28.0, 49.0, 35.0, 38.0, 42.0, 37.0, 39.0, 1059.0, 30.0, 27.0, 37.0, 37.0, 34.0, 33.0, 32.0, 14.0, 31.0, 22.0, 15.0, 23.0, 16.0, 14.0, 15.0, 14.0, 7.0, 12.0, 5.0, 4.0, 5.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.708984375, -2.627838134765625, -2.54669189453125, -2.465545654296875, -2.3843994140625, -2.303253173828125, -2.22210693359375, -2.140960693359375, -2.059814453125, -1.978668212890625, -1.89752197265625, -1.816375732421875, -1.7352294921875, -1.654083251953125, -1.57293701171875, -1.491790771484375, -1.41064453125, -1.329498291015625, -1.24835205078125, -1.167205810546875, -1.0860595703125, -1.004913330078125, -0.92376708984375, -0.842620849609375, -0.761474609375, -0.680328369140625, -0.59918212890625, -0.518035888671875, -0.4368896484375, -0.355743408203125, -0.27459716796875, -0.193450927734375, -0.1123046875, -0.031158447265625, 0.04998779296875, 0.131134033203125, 0.2122802734375, 0.293426513671875, 0.37457275390625, 0.455718994140625, 0.536865234375, 0.618011474609375, 0.69915771484375, 0.780303955078125, 0.8614501953125, 0.942596435546875, 1.02374267578125, 1.104888916015625, 1.18603515625, 1.267181396484375, 1.34832763671875, 1.429473876953125, 1.5106201171875, 1.591766357421875, 1.67291259765625, 1.754058837890625, 1.835205078125, 1.916351318359375, 1.99749755859375, 2.078643798828125, 2.1597900390625, 2.240936279296875, 2.32208251953125, 2.403228759765625, 2.484375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 10.0, 8.0, 14.0, 24.0, 46.0, 49.0, 93.0, 140.0, 174.0, 288.0, 410.0, 646.0, 936.0, 1325.0, 1944.0, 2830.0, 4154.0, 6020.0, 8597.0, 12590.0, 18883.0, 34173.0, 278970.0, 1612434.0, 46239.0, 21821.0, 13840.0, 9554.0, 6681.0, 4557.0, 2993.0, 2063.0, 1465.0, 1027.0, 695.0, 471.0, 321.0, 212.0, 159.0, 80.0, 64.0, 46.0, 23.0, 23.0, 10.0, 7.0, 7.0, 3.0, 6.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.5234375, -2.439727783203125, -2.35601806640625, -2.272308349609375, -2.1885986328125, -2.104888916015625, -2.02117919921875, -1.937469482421875, -1.853759765625, -1.770050048828125, -1.68634033203125, -1.602630615234375, -1.5189208984375, -1.435211181640625, -1.35150146484375, -1.267791748046875, -1.18408203125, -1.100372314453125, -1.01666259765625, -0.932952880859375, -0.8492431640625, -0.765533447265625, -0.68182373046875, -0.598114013671875, -0.514404296875, -0.430694580078125, -0.34698486328125, -0.263275146484375, -0.1795654296875, -0.095855712890625, -0.01214599609375, 0.071563720703125, 0.1552734375, 0.238983154296875, 0.32269287109375, 0.406402587890625, 0.4901123046875, 0.573822021484375, 0.65753173828125, 0.741241455078125, 0.824951171875, 0.908660888671875, 0.99237060546875, 1.076080322265625, 1.1597900390625, 1.243499755859375, 1.32720947265625, 1.410919189453125, 1.49462890625, 1.578338623046875, 1.66204833984375, 1.745758056640625, 1.8294677734375, 1.913177490234375, 1.99688720703125, 2.080596923828125, 2.164306640625, 2.248016357421875, 2.33172607421875, 2.415435791015625, 2.4991455078125, 2.582855224609375, 2.66656494140625, 2.750274658203125, 2.833984375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 0.0, 8.0, 12.0, 9.0, 11.0, 12.0, 18.0, 22.0, 16.0, 20.0, 23.0, 31.0, 29.0, 28.0, 32.0, 35.0, 33.0, 35.0, 25.0, 26.0, 25.0, 32.0, 22.0, 24.0, 22.0, 25.0, 22.0, 24.0, 16.0, 15.0, 41.0, 19.0, 33.0, 39.0, 25.0, 19.0, 25.0, 26.0, 14.0, 20.0, 11.0, 10.0, 22.0, 11.0, 14.0, 5.0, 5.0, 5.0, 2.0, 3.0, 5.0, 2.0], "bins": [-0.162353515625, -0.15790939331054688, -0.15346527099609375, -0.14902114868164062, -0.1445770263671875, -0.14013290405273438, -0.13568878173828125, -0.13124465942382812, -0.126800537109375, -0.12235641479492188, -0.11791229248046875, -0.11346817016601562, -0.1090240478515625, -0.10457992553710938, -0.10013580322265625, -0.09569168090820312, -0.09124755859375, -0.08680343627929688, -0.08235931396484375, -0.07791519165039062, -0.0734710693359375, -0.06902694702148438, -0.06458282470703125, -0.060138702392578125, -0.055694580078125, -0.051250457763671875, -0.04680633544921875, -0.042362213134765625, -0.0379180908203125, -0.033473968505859375, -0.02902984619140625, -0.024585723876953125, -0.0201416015625, -0.015697479248046875, -0.01125335693359375, -0.006809234619140625, -0.0023651123046875, 0.002079010009765625, 0.00652313232421875, 0.010967254638671875, 0.015411376953125, 0.019855499267578125, 0.02429962158203125, 0.028743743896484375, 0.0331878662109375, 0.037631988525390625, 0.04207611083984375, 0.046520233154296875, 0.05096435546875, 0.055408477783203125, 0.05985260009765625, 0.06429672241210938, 0.0687408447265625, 0.07318496704101562, 0.07762908935546875, 0.08207321166992188, 0.086517333984375, 0.09096145629882812, 0.09540557861328125, 0.09984970092773438, 0.1042938232421875, 0.10873794555664062, 0.11318206787109375, 0.11762619018554688, 0.1220703125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 5.0, 1.0, 9.0, 11.0, 9.0, 18.0, 17.0, 17.0, 28.0, 30.0, 49.0, 49.0, 63.0, 91.0, 127.0, 162.0, 192.0, 253.0, 283.0, 366.0, 455.0, 775.0, 6032.0, 607709.0, 425179.0, 3796.0, 750.0, 451.0, 346.0, 251.0, 209.0, 187.0, 126.0, 104.0, 79.0, 87.0, 58.0, 35.0, 19.0, 26.0, 25.0, 18.0, 11.0, 14.0, 11.0, 10.0, 5.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0625, -1.988677978515625, -1.91485595703125, -1.841033935546875, -1.7672119140625, -1.693389892578125, -1.61956787109375, -1.545745849609375, -1.471923828125, -1.398101806640625, -1.32427978515625, -1.250457763671875, -1.1766357421875, -1.102813720703125, -1.02899169921875, -0.955169677734375, -0.88134765625, -0.807525634765625, -0.73370361328125, -0.659881591796875, -0.5860595703125, -0.512237548828125, -0.43841552734375, -0.364593505859375, -0.290771484375, -0.216949462890625, -0.14312744140625, -0.069305419921875, 0.0045166015625, 0.078338623046875, 0.15216064453125, 0.225982666015625, 0.2998046875, 0.373626708984375, 0.44744873046875, 0.521270751953125, 0.5950927734375, 0.668914794921875, 0.74273681640625, 0.816558837890625, 0.890380859375, 0.964202880859375, 1.03802490234375, 1.111846923828125, 1.1856689453125, 1.259490966796875, 1.33331298828125, 1.407135009765625, 1.48095703125, 1.554779052734375, 1.62860107421875, 1.702423095703125, 1.7762451171875, 1.850067138671875, 1.92388916015625, 1.997711181640625, 2.071533203125, 2.145355224609375, 2.21917724609375, 2.292999267578125, 2.3668212890625, 2.440643310546875, 2.51446533203125, 2.588287353515625, 2.662109375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 33.0, 143.0, 465.0, 288.0, 46.0, 21.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.301940441131592, -5.135199069976807, -4.9684576988220215, -4.801716327667236, -4.634974956512451, -4.468233585357666, -4.301492214202881, -4.134750843048096, -3.9680094718933105, -3.8012681007385254, -3.6345267295837402, -3.467785358428955, -3.30104398727417, -3.1343026161193848, -2.9675612449645996, -2.8008198738098145, -2.63407826423645, -2.467336893081665, -2.30059552192688, -2.1338541507720947, -1.9671127796173096, -1.8003714084625244, -1.6336299180984497, -1.4668885469436646, -1.3001471757888794, -1.1334058046340942, -0.9666644334793091, -0.7999230027198792, -0.633181631565094, -0.46644026041030884, -0.2996988296508789, -0.13295745849609375, 0.033783912658691406, 0.20052529871463776, 0.3672666847705841, 0.5340080857276917, 0.7007494568824768, 0.867490828037262, 1.034232258796692, 1.200973629951477, 1.3677150011062622, 1.5344563722610474, 1.7011977434158325, 1.8679392337799072, 2.0346806049346924, 2.2014219760894775, 2.3681633472442627, 2.534904718399048, 2.701646089553833, 2.868387460708618, 3.0351288318634033, 3.2018702030181885, 3.3686115741729736, 3.535352945327759, 3.702094554901123, 3.868835926055908, 4.035577297210693, 4.2023186683654785, 4.369060039520264, 4.535801410675049, 4.702542781829834, 4.869284152984619, 5.036025524139404, 5.2027668952941895, 5.369508266448975]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 5.0, 4.0, 8.0, 6.0, 12.0, 7.0, 14.0, 17.0, 19.0, 19.0, 39.0, 37.0, 40.0, 44.0, 44.0, 51.0, 49.0, 51.0, 54.0, 44.0, 56.0, 56.0, 47.0, 44.0, 51.0, 30.0, 16.0, 27.0, 25.0, 30.0, 17.0, 12.0, 13.0, 7.0, 12.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.480533480644226, -1.4155057668685913, -1.350477933883667, -1.2854502201080322, -1.2204225063323975, -1.1553947925567627, -1.090367078781128, -1.0253392457962036, -0.9603115320205688, -0.8952838182449341, -0.8302560448646545, -0.765228271484375, -0.7002005577087402, -0.6351728439331055, -0.5701450705528259, -0.5051172971725464, -0.4400895833969116, -0.37506183981895447, -0.3100340962409973, -0.24500635266304016, -0.179978609085083, -0.11495086550712585, -0.0499231219291687, 0.015104621648788452, 0.0801323652267456, 0.14516010880470276, 0.2101878523826599, 0.27521559596061707, 0.3402433395385742, 0.40527108311653137, 0.4702988266944885, 0.5353266000747681, 0.6003544330596924, 0.6653821468353271, 0.7304099202156067, 0.7954376935958862, 0.860465407371521, 0.9254931211471558, 0.9905208945274353, 1.0555486679077148, 1.1205763816833496, 1.1856040954589844, 1.2506318092346191, 1.3156596422195435, 1.3806873559951782, 1.445715069770813, 1.5107429027557373, 1.575770616531372, 1.6407983303070068, 1.7058260440826416, 1.7708537578582764, 1.8358815908432007, 1.9009093046188354, 1.9659370183944702, 2.0309648513793945, 2.0959925651550293, 2.161020278930664, 2.226047992706299, 2.2910757064819336, 2.3561034202575684, 2.421131134033203, 2.486159086227417, 2.5511868000030518, 2.6162145137786865, 2.6812422275543213]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 15.0, 11.0, 10.0, 15.0, 16.0, 17.0, 27.0, 16.0, 35.0, 27.0, 33.0, 42.0, 43.0, 41.0, 49.0, 31.0, 57.0, 42.0, 47.0, 39.0, 34.0, 47.0, 41.0, 33.0, 29.0, 26.0, 19.0, 23.0, 22.0, 17.0, 19.0, 14.0, 12.0, 15.0, 5.0, 6.0, 6.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-3.126953125, -3.03851318359375, -2.9500732421875, -2.86163330078125, -2.773193359375, -2.68475341796875, -2.5963134765625, -2.50787353515625, -2.41943359375, -2.33099365234375, -2.2425537109375, -2.15411376953125, -2.065673828125, -1.97723388671875, -1.8887939453125, -1.80035400390625, -1.7119140625, -1.62347412109375, -1.5350341796875, -1.44659423828125, -1.358154296875, -1.26971435546875, -1.1812744140625, -1.09283447265625, -1.00439453125, -0.91595458984375, -0.8275146484375, -0.73907470703125, -0.650634765625, -0.56219482421875, -0.4737548828125, -0.38531494140625, -0.296875, -0.20843505859375, -0.1199951171875, -0.03155517578125, 0.056884765625, 0.14532470703125, 0.2337646484375, 0.32220458984375, 0.41064453125, 0.49908447265625, 0.5875244140625, 0.67596435546875, 0.764404296875, 0.85284423828125, 0.9412841796875, 1.02972412109375, 1.1181640625, 1.20660400390625, 1.2950439453125, 1.38348388671875, 1.471923828125, 1.56036376953125, 1.6488037109375, 1.73724365234375, 1.82568359375, 1.91412353515625, 2.0025634765625, 2.09100341796875, 2.179443359375, 2.26788330078125, 2.3563232421875, 2.44476318359375, 2.533203125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 11.0, 5.0, 19.0, 18.0, 38.0, 47.0, 69.0, 126.0, 200.0, 216.0, 367.0, 544.0, 846.0, 1196.0, 1751.0, 2611.0, 4102.0, 6382.0, 10179.0, 17531.0, 31057.0, 57677.0, 113894.0, 270805.0, 275507.0, 117287.0, 58119.0, 31058.0, 17758.0, 10302.0, 6461.0, 4109.0, 2654.0, 1852.0, 1224.0, 823.0, 592.0, 414.0, 282.0, 149.0, 100.0, 81.0, 40.0, 21.0, 19.0, 9.0, 7.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.7734375, -2.69189453125, -2.6103515625, -2.52880859375, -2.447265625, -2.36572265625, -2.2841796875, -2.20263671875, -2.12109375, -2.03955078125, -1.9580078125, -1.87646484375, -1.794921875, -1.71337890625, -1.6318359375, -1.55029296875, -1.46875, -1.38720703125, -1.3056640625, -1.22412109375, -1.142578125, -1.06103515625, -0.9794921875, -0.89794921875, -0.81640625, -0.73486328125, -0.6533203125, -0.57177734375, -0.490234375, -0.40869140625, -0.3271484375, -0.24560546875, -0.1640625, -0.08251953125, -0.0009765625, 0.08056640625, 0.162109375, 0.24365234375, 0.3251953125, 0.40673828125, 0.48828125, 0.56982421875, 0.6513671875, 0.73291015625, 0.814453125, 0.89599609375, 0.9775390625, 1.05908203125, 1.140625, 1.22216796875, 1.3037109375, 1.38525390625, 1.466796875, 1.54833984375, 1.6298828125, 1.71142578125, 1.79296875, 1.87451171875, 1.9560546875, 2.03759765625, 2.119140625, 2.20068359375, 2.2822265625, 2.36376953125, 2.4453125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 2.0, 5.0, 6.0, 6.0, 2.0, 8.0, 10.0, 11.0, 18.0, 15.0, 18.0, 16.0, 28.0, 38.0, 28.0, 35.0, 37.0, 37.0, 44.0, 71.0, 104.0, 225.0, 1451.0, 253.0, 108.0, 49.0, 52.0, 48.0, 42.0, 35.0, 30.0, 26.0, 31.0, 25.0, 23.0, 23.0, 23.0, 13.0, 14.0, 10.0, 9.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.765625, -9.46533203125, -9.1650390625, -8.86474609375, -8.564453125, -8.26416015625, -7.9638671875, -7.66357421875, -7.36328125, -7.06298828125, -6.7626953125, -6.46240234375, -6.162109375, -5.86181640625, -5.5615234375, -5.26123046875, -4.9609375, -4.66064453125, -4.3603515625, -4.06005859375, -3.759765625, -3.45947265625, -3.1591796875, -2.85888671875, -2.55859375, -2.25830078125, -1.9580078125, -1.65771484375, -1.357421875, -1.05712890625, -0.7568359375, -0.45654296875, -0.15625, 0.14404296875, 0.4443359375, 0.74462890625, 1.044921875, 1.34521484375, 1.6455078125, 1.94580078125, 2.24609375, 2.54638671875, 2.8466796875, 3.14697265625, 3.447265625, 3.74755859375, 4.0478515625, 4.34814453125, 4.6484375, 4.94873046875, 5.2490234375, 5.54931640625, 5.849609375, 6.14990234375, 6.4501953125, 6.75048828125, 7.05078125, 7.35107421875, 7.6513671875, 7.95166015625, 8.251953125, 8.55224609375, 8.8525390625, 9.15283203125, 9.453125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 0.0, 4.0, 3.0, 5.0, 10.0, 9.0, 10.0, 19.0, 25.0, 27.0, 53.0, 70.0, 101.0, 133.0, 234.0, 388.0, 1188.0, 7234.0, 190169.0, 2891553.0, 49224.0, 3638.0, 719.0, 323.0, 182.0, 115.0, 78.0, 57.0, 36.0, 22.0, 18.0, 14.0, 15.0, 15.0, 4.0, 5.0, 5.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.140625, -16.513671875, -15.88671875, -15.259765625, -14.6328125, -14.005859375, -13.37890625, -12.751953125, -12.125, -11.498046875, -10.87109375, -10.244140625, -9.6171875, -8.990234375, -8.36328125, -7.736328125, -7.109375, -6.482421875, -5.85546875, -5.228515625, -4.6015625, -3.974609375, -3.34765625, -2.720703125, -2.09375, -1.466796875, -0.83984375, -0.212890625, 0.4140625, 1.041015625, 1.66796875, 2.294921875, 2.921875, 3.548828125, 4.17578125, 4.802734375, 5.4296875, 6.056640625, 6.68359375, 7.310546875, 7.9375, 8.564453125, 9.19140625, 9.818359375, 10.4453125, 11.072265625, 11.69921875, 12.326171875, 12.953125, 13.580078125, 14.20703125, 14.833984375, 15.4609375, 16.087890625, 16.71484375, 17.341796875, 17.96875, 18.595703125, 19.22265625, 19.849609375, 20.4765625, 21.103515625, 21.73046875, 22.357421875, 22.984375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [183.0, 786.0, 45.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.254812240600586, -1.9999918937683105, 3.254828453063965, 8.509649276733398, 13.764469146728516, 19.019289016723633, 24.274110794067383, 29.528928756713867, 34.78375244140625, 40.03857421875, 45.293392181396484, 50.548213958740234, 55.80303192138672, 61.05785369873047, 66.31267547607422, 71.56748962402344, 76.82231140136719, 82.07713317871094, 87.33195495605469, 92.58677673339844, 97.84159088134766, 103.0964126586914, 108.35123443603516, 113.60604858398438, 118.86087799072266, 124.1156997680664, 129.37051391601562, 134.62533569335938, 139.88015747070312, 145.13497924804688, 150.38980102539062, 155.64462280273438, 160.89942932128906, 166.1542510986328, 171.40907287597656, 176.6638946533203, 181.91871643066406, 187.17352294921875, 192.4283447265625, 197.68316650390625, 202.93798828125, 208.19281005859375, 213.4476318359375, 218.70245361328125, 223.957275390625, 229.21209716796875, 234.4669189453125, 239.7217254638672, 244.9765625, 250.23138427734375, 255.4862060546875, 260.74102783203125, 265.995849609375, 271.25067138671875, 276.5054931640625, 281.76031494140625, 287.0151062011719, 292.2699279785156, 297.5247497558594, 302.7795715332031, 308.0343933105469, 313.2892150878906, 318.5440368652344, 323.7988586425781, 329.0536804199219]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 2.0, 3.0, 7.0, 11.0, 7.0, 9.0, 14.0, 14.0, 26.0, 23.0, 19.0, 27.0, 25.0, 32.0, 27.0, 28.0, 26.0, 36.0, 38.0, 40.0, 46.0, 38.0, 41.0, 30.0, 53.0, 37.0, 29.0, 36.0, 27.0, 29.0, 30.0, 26.0, 23.0, 19.0, 23.0, 12.0, 19.0, 8.0, 12.0, 6.0, 9.0, 2.0, 3.0, 10.0, 8.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-28.719524383544922, -27.856754302978516, -26.993986129760742, -26.131216049194336, -25.26844596862793, -24.405677795410156, -23.54290771484375, -22.680137634277344, -21.817367553710938, -20.95459747314453, -20.091829299926758, -19.22905921936035, -18.366289138793945, -17.503520965576172, -16.640750885009766, -15.77798080444336, -14.915212631225586, -14.052443504333496, -13.18967342376709, -12.326904296875, -11.464134216308594, -10.601365089416504, -9.738595962524414, -8.875825881958008, -8.013056755065918, -7.15028715133667, -6.287517547607422, -5.424748420715332, -4.561978816986084, -3.699209213256836, -2.836440086364746, -1.973670482635498, -1.11090087890625, -0.2481313943862915, 0.614638090133667, 1.477407455444336, 2.340177059173584, 3.202946662902832, 4.065715789794922, 4.92848539352417, 5.791254997253418, 6.654024600982666, 7.516794204711914, 8.379563331604004, 9.242332458496094, 10.1051025390625, 10.96787166595459, 11.83064079284668, 12.693410873413086, 13.556180000305176, 14.418950080871582, 15.281719207763672, 16.144489288330078, 17.007259368896484, 17.870027542114258, 18.732797622680664, 19.595565795898438, 20.458335876464844, 21.321104049682617, 22.183874130249023, 23.04664421081543, 23.909412384033203, 24.77218246459961, 25.634952545166016, 26.497722625732422]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 5.0, 9.0, 12.0, 14.0, 5.0, 11.0, 12.0, 28.0, 16.0, 22.0, 30.0, 34.0, 39.0, 32.0, 33.0, 56.0, 45.0, 37.0, 52.0, 43.0, 46.0, 36.0, 40.0, 38.0, 35.0, 38.0, 29.0, 34.0, 25.0, 31.0, 15.0, 19.0, 10.0, 10.0, 13.0, 6.0, 14.0, 6.0, 3.0, 6.0, 4.0, 0.0, 6.0, 2.0, 0.0, 2.0, 3.0], "bins": [-3.32421875, -3.23248291015625, -3.1407470703125, -3.04901123046875, -2.957275390625, -2.86553955078125, -2.7738037109375, -2.68206787109375, -2.59033203125, -2.49859619140625, -2.4068603515625, -2.31512451171875, -2.223388671875, -2.13165283203125, -2.0399169921875, -1.94818115234375, -1.8564453125, -1.76470947265625, -1.6729736328125, -1.58123779296875, -1.489501953125, -1.39776611328125, -1.3060302734375, -1.21429443359375, -1.12255859375, -1.03082275390625, -0.9390869140625, -0.84735107421875, -0.755615234375, -0.66387939453125, -0.5721435546875, -0.48040771484375, -0.388671875, -0.29693603515625, -0.2052001953125, -0.11346435546875, -0.021728515625, 0.07000732421875, 0.1617431640625, 0.25347900390625, 0.34521484375, 0.43695068359375, 0.5286865234375, 0.62042236328125, 0.712158203125, 0.80389404296875, 0.8956298828125, 0.98736572265625, 1.0791015625, 1.17083740234375, 1.2625732421875, 1.35430908203125, 1.446044921875, 1.53778076171875, 1.6295166015625, 1.72125244140625, 1.81298828125, 1.90472412109375, 1.9964599609375, 2.08819580078125, 2.179931640625, 2.27166748046875, 2.3634033203125, 2.45513916015625, 2.546875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 7.0, 3.0, 12.0, 18.0, 22.0, 40.0, 55.0, 79.0, 133.0, 268.0, 558.0, 1374.0, 3497.0, 9978.0, 31237.0, 108729.0, 440150.0, 1522684.0, 1496355.0, 423319.0, 108228.0, 31398.0, 9897.0, 3538.0, 1430.0, 601.0, 284.0, 156.0, 76.0, 61.0, 29.0, 28.0, 16.0, 13.0, 3.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1015625, -4.95147705078125, -4.8013916015625, -4.65130615234375, -4.501220703125, -4.35113525390625, -4.2010498046875, -4.05096435546875, -3.90087890625, -3.75079345703125, -3.6007080078125, -3.45062255859375, -3.300537109375, -3.15045166015625, -3.0003662109375, -2.85028076171875, -2.7001953125, -2.55010986328125, -2.4000244140625, -2.24993896484375, -2.099853515625, -1.94976806640625, -1.7996826171875, -1.64959716796875, -1.49951171875, -1.34942626953125, -1.1993408203125, -1.04925537109375, -0.899169921875, -0.74908447265625, -0.5989990234375, -0.44891357421875, -0.298828125, -0.14874267578125, 0.0013427734375, 0.15142822265625, 0.301513671875, 0.45159912109375, 0.6016845703125, 0.75177001953125, 0.90185546875, 1.05194091796875, 1.2020263671875, 1.35211181640625, 1.502197265625, 1.65228271484375, 1.8023681640625, 1.95245361328125, 2.1025390625, 2.25262451171875, 2.4027099609375, 2.55279541015625, 2.702880859375, 2.85296630859375, 3.0030517578125, 3.15313720703125, 3.30322265625, 3.45330810546875, 3.6033935546875, 3.75347900390625, 3.903564453125, 4.05364990234375, 4.2037353515625, 4.35382080078125, 4.50390625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 6.0, 6.0, 6.0, 7.0, 17.0, 21.0, 29.0, 41.0, 62.0, 90.0, 138.0, 179.0, 272.0, 343.0, 430.0, 488.0, 494.0, 387.0, 302.0, 217.0, 155.0, 117.0, 80.0, 62.0, 40.0, 27.0, 17.0, 16.0, 10.0, 9.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.65625, -8.4140625, -8.171875, -7.9296875, -7.6875, -7.4453125, -7.203125, -6.9609375, -6.71875, -6.4765625, -6.234375, -5.9921875, -5.75, -5.5078125, -5.265625, -5.0234375, -4.78125, -4.5390625, -4.296875, -4.0546875, -3.8125, -3.5703125, -3.328125, -3.0859375, -2.84375, -2.6015625, -2.359375, -2.1171875, -1.875, -1.6328125, -1.390625, -1.1484375, -0.90625, -0.6640625, -0.421875, -0.1796875, 0.0625, 0.3046875, 0.546875, 0.7890625, 1.03125, 1.2734375, 1.515625, 1.7578125, 2.0, 2.2421875, 2.484375, 2.7265625, 2.96875, 3.2109375, 3.453125, 3.6953125, 3.9375, 4.1796875, 4.421875, 4.6640625, 4.90625, 5.1484375, 5.390625, 5.6328125, 5.875, 6.1171875, 6.359375, 6.6015625, 6.84375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 5.0, 17.0, 12.0, 24.0, 24.0, 49.0, 80.0, 129.0, 223.0, 410.0, 790.0, 2010.0, 5601.0, 20067.0, 86971.0, 417543.0, 1780032.0, 1470450.0, 318705.0, 67325.0, 16024.0, 4577.0, 1629.0, 711.0, 386.0, 197.0, 106.0, 59.0, 52.0, 22.0, 19.0, 13.0, 8.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.70703125, -7.44049072265625, -7.1739501953125, -6.90740966796875, -6.640869140625, -6.37432861328125, -6.1077880859375, -5.84124755859375, -5.57470703125, -5.30816650390625, -5.0416259765625, -4.77508544921875, -4.508544921875, -4.24200439453125, -3.9754638671875, -3.70892333984375, -3.4423828125, -3.17584228515625, -2.9093017578125, -2.64276123046875, -2.376220703125, -2.10968017578125, -1.8431396484375, -1.57659912109375, -1.31005859375, -1.04351806640625, -0.7769775390625, -0.51043701171875, -0.243896484375, 0.02264404296875, 0.2891845703125, 0.55572509765625, 0.822265625, 1.08880615234375, 1.3553466796875, 1.62188720703125, 1.888427734375, 2.15496826171875, 2.4215087890625, 2.68804931640625, 2.95458984375, 3.22113037109375, 3.4876708984375, 3.75421142578125, 4.020751953125, 4.28729248046875, 4.5538330078125, 4.82037353515625, 5.0869140625, 5.35345458984375, 5.6199951171875, 5.88653564453125, 6.153076171875, 6.41961669921875, 6.6861572265625, 6.95269775390625, 7.21923828125, 7.48577880859375, 7.7523193359375, 8.01885986328125, 8.285400390625, 8.55194091796875, 8.8184814453125, 9.08502197265625, 9.3515625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 8.0, 25.0, 26.0, 69.0, 88.0, 120.0, 172.0, 154.0, 116.0, 91.0, 56.0, 40.0, 23.0, 12.0, 9.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.068540573120117, -28.49445915222168, -26.920377731323242, -25.346296310424805, -23.772214889526367, -22.19813346862793, -20.624052047729492, -19.049970626831055, -17.475889205932617, -15.90180778503418, -14.327726364135742, -12.753644943237305, -11.179563522338867, -9.60548210144043, -8.031400680541992, -6.457319259643555, -4.883237838745117, -3.3091564178466797, -1.7350749969482422, -0.1609935760498047, 1.4130878448486328, 2.9871692657470703, 4.561250686645508, 6.135332107543945, 7.709413528442383, 9.28349494934082, 10.857576370239258, 12.431657791137695, 14.005739212036133, 15.57982063293457, 17.153902053833008, 18.727983474731445, 20.30206298828125, 21.876144409179688, 23.450225830078125, 25.024307250976562, 26.598388671875, 28.172470092773438, 29.746551513671875, 31.320632934570312, 32.89471435546875, 34.46879577636719, 36.042877197265625, 37.61695861816406, 39.1910400390625, 40.76512145996094, 42.339202880859375, 43.91328430175781, 45.48736572265625, 47.06144714355469, 48.635528564453125, 50.20960998535156, 51.78369140625, 53.35777282714844, 54.931854248046875, 56.50593566894531, 58.08001708984375, 59.65409851074219, 61.228179931640625, 62.80226135253906, 64.3763427734375, 65.95042419433594, 67.52450561523438, 69.09858703613281, 70.67266845703125]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 17.0, 7.0, 14.0, 17.0, 18.0, 17.0, 19.0, 23.0, 24.0, 27.0, 32.0, 31.0, 41.0, 35.0, 36.0, 49.0, 47.0, 36.0, 39.0, 50.0, 41.0, 34.0, 22.0, 27.0, 34.0, 27.0, 29.0, 37.0, 29.0, 22.0, 16.0, 17.0, 13.0, 4.0, 18.0, 6.0, 7.0, 6.0, 5.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.22614097595215, -21.551668167114258, -20.877193450927734, -20.202720642089844, -19.52824592590332, -18.85377311706543, -18.179298400878906, -17.504825592041016, -16.830352783203125, -16.155879974365234, -15.481405258178711, -14.80693244934082, -14.132458686828613, -13.457984924316406, -12.7835111618042, -12.109037399291992, -11.434563636779785, -10.760089874267578, -10.085616111755371, -9.411142349243164, -8.736669540405273, -8.062195777893066, -7.387722015380859, -6.7132487297058105, -6.0387749671936035, -5.3643012046813965, -4.689827919006348, -4.015354156494141, -3.3408806324005127, -2.6664071083068848, -1.9919333457946777, -1.317460060119629, -0.6429862976074219, 0.03148728609085083, 0.7059608697891235, 1.380434513092041, 2.054908037185669, 2.729381561279297, 3.403855323791504, 4.078328609466553, 4.75280237197876, 5.427276134490967, 6.101749420166016, 6.776223182678223, 7.45069694519043, 8.12516975402832, 8.799644470214844, 9.474117279052734, 10.148591041564941, 10.823064804077148, 11.497538566589355, 12.172012329101562, 12.846485137939453, 13.52095890045166, 14.195432662963867, 14.869905471801758, 15.544380187988281, 16.218852996826172, 16.893327713012695, 17.567800521850586, 18.24227523803711, 18.916748046875, 19.59122085571289, 20.265695571899414, 20.940168380737305]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 8.0, 4.0, 14.0, 10.0, 16.0, 22.0, 20.0, 34.0, 20.0, 37.0, 47.0, 41.0, 47.0, 31.0, 52.0, 44.0, 55.0, 52.0, 53.0, 43.0, 52.0, 43.0, 43.0, 37.0, 25.0, 22.0, 21.0, 20.0, 19.0, 16.0, 14.0, 9.0, 7.0, 3.0, 5.0, 4.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.68359375, -3.580291748046875, -3.47698974609375, -3.373687744140625, -3.2703857421875, -3.167083740234375, -3.06378173828125, -2.960479736328125, -2.857177734375, -2.753875732421875, -2.65057373046875, -2.547271728515625, -2.4439697265625, -2.340667724609375, -2.23736572265625, -2.134063720703125, -2.03076171875, -1.927459716796875, -1.82415771484375, -1.720855712890625, -1.6175537109375, -1.514251708984375, -1.41094970703125, -1.307647705078125, -1.204345703125, -1.101043701171875, -0.99774169921875, -0.894439697265625, -0.7911376953125, -0.687835693359375, -0.58453369140625, -0.481231689453125, -0.3779296875, -0.274627685546875, -0.17132568359375, -0.068023681640625, 0.0352783203125, 0.138580322265625, 0.24188232421875, 0.345184326171875, 0.448486328125, 0.551788330078125, 0.65509033203125, 0.758392333984375, 0.8616943359375, 0.964996337890625, 1.06829833984375, 1.171600341796875, 1.27490234375, 1.378204345703125, 1.48150634765625, 1.584808349609375, 1.6881103515625, 1.791412353515625, 1.89471435546875, 1.998016357421875, 2.101318359375, 2.204620361328125, 2.30792236328125, 2.411224365234375, 2.5145263671875, 2.617828369140625, 2.72113037109375, 2.824432373046875, 2.927734375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 10.0, 10.0, 31.0, 43.0, 78.0, 92.0, 178.0, 237.0, 374.0, 595.0, 990.0, 1417.0, 2127.0, 3005.0, 4588.0, 6569.0, 9309.0, 12592.0, 17568.0, 23041.0, 29807.0, 37607.0, 46413.0, 55409.0, 63183.0, 70257.0, 75874.0, 78482.0, 77733.0, 74302.0, 68147.0, 60042.0, 51162.0, 42516.0, 34483.0, 27193.0, 20696.0, 15266.0, 11227.0, 8127.0, 5769.0, 3960.0, 2723.0, 1866.0, 1177.0, 846.0, 530.0, 332.0, 210.0, 153.0, 94.0, 46.0, 33.0, 16.0, 11.0, 7.0, 2.0, 6.0], "bins": [-1.0625, -1.03106689453125, -0.9996337890625, -0.96820068359375, -0.936767578125, -0.90533447265625, -0.8739013671875, -0.84246826171875, -0.81103515625, -0.77960205078125, -0.7481689453125, -0.71673583984375, -0.685302734375, -0.65386962890625, -0.6224365234375, -0.59100341796875, -0.5595703125, -0.52813720703125, -0.4967041015625, -0.46527099609375, -0.433837890625, -0.40240478515625, -0.3709716796875, -0.33953857421875, -0.30810546875, -0.27667236328125, -0.2452392578125, -0.21380615234375, -0.182373046875, -0.15093994140625, -0.1195068359375, -0.08807373046875, -0.056640625, -0.02520751953125, 0.0062255859375, 0.03765869140625, 0.069091796875, 0.10052490234375, 0.1319580078125, 0.16339111328125, 0.19482421875, 0.22625732421875, 0.2576904296875, 0.28912353515625, 0.320556640625, 0.35198974609375, 0.3834228515625, 0.41485595703125, 0.4462890625, 0.47772216796875, 0.5091552734375, 0.54058837890625, 0.572021484375, 0.60345458984375, 0.6348876953125, 0.66632080078125, 0.69775390625, 0.72918701171875, 0.7606201171875, 0.79205322265625, 0.823486328125, 0.85491943359375, 0.8863525390625, 0.91778564453125, 0.94921875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 8.0, 4.0, 6.0, 13.0, 15.0, 9.0, 19.0, 24.0, 20.0, 26.0, 36.0, 20.0, 23.0, 33.0, 42.0, 44.0, 37.0, 35.0, 45.0, 1067.0, 44.0, 35.0, 33.0, 42.0, 41.0, 40.0, 40.0, 17.0, 27.0, 19.0, 20.0, 23.0, 25.0, 16.0, 10.0, 11.0, 8.0, 8.0, 10.0, 7.0, 7.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-3.251953125, -3.1614990234375, -3.071044921875, -2.9805908203125, -2.89013671875, -2.7996826171875, -2.709228515625, -2.6187744140625, -2.5283203125, -2.4378662109375, -2.347412109375, -2.2569580078125, -2.16650390625, -2.0760498046875, -1.985595703125, -1.8951416015625, -1.8046875, -1.7142333984375, -1.623779296875, -1.5333251953125, -1.44287109375, -1.3524169921875, -1.261962890625, -1.1715087890625, -1.0810546875, -0.9906005859375, -0.900146484375, -0.8096923828125, -0.71923828125, -0.6287841796875, -0.538330078125, -0.4478759765625, -0.357421875, -0.2669677734375, -0.176513671875, -0.0860595703125, 0.00439453125, 0.0948486328125, 0.185302734375, 0.2757568359375, 0.3662109375, 0.4566650390625, 0.547119140625, 0.6375732421875, 0.72802734375, 0.8184814453125, 0.908935546875, 0.9993896484375, 1.08984375, 1.1802978515625, 1.270751953125, 1.3612060546875, 1.45166015625, 1.5421142578125, 1.632568359375, 1.7230224609375, 1.8134765625, 1.9039306640625, 1.994384765625, 2.0848388671875, 2.17529296875, 2.2657470703125, 2.356201171875, 2.4466552734375, 2.537109375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 10.0, 10.0, 19.0, 39.0, 52.0, 60.0, 91.0, 158.0, 218.0, 323.0, 525.0, 702.0, 1067.0, 1562.0, 2301.0, 3356.0, 4993.0, 7044.0, 10571.0, 15796.0, 25565.0, 73562.0, 1778632.0, 92336.0, 27285.0, 16405.0, 11038.0, 7374.0, 5008.0, 3580.0, 2373.0, 1706.0, 1124.0, 738.0, 504.0, 329.0, 242.0, 162.0, 100.0, 46.0, 48.0, 20.0, 29.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.947265625, -2.856719970703125, -2.76617431640625, -2.675628662109375, -2.5850830078125, -2.494537353515625, -2.40399169921875, -2.313446044921875, -2.222900390625, -2.132354736328125, -2.04180908203125, -1.951263427734375, -1.8607177734375, -1.770172119140625, -1.67962646484375, -1.589080810546875, -1.49853515625, -1.407989501953125, -1.31744384765625, -1.226898193359375, -1.1363525390625, -1.045806884765625, -0.95526123046875, -0.864715576171875, -0.774169921875, -0.683624267578125, -0.59307861328125, -0.502532958984375, -0.4119873046875, -0.321441650390625, -0.23089599609375, -0.140350341796875, -0.0498046875, 0.040740966796875, 0.13128662109375, 0.221832275390625, 0.3123779296875, 0.402923583984375, 0.49346923828125, 0.584014892578125, 0.674560546875, 0.765106201171875, 0.85565185546875, 0.946197509765625, 1.0367431640625, 1.127288818359375, 1.21783447265625, 1.308380126953125, 1.39892578125, 1.489471435546875, 1.58001708984375, 1.670562744140625, 1.7611083984375, 1.851654052734375, 1.94219970703125, 2.032745361328125, 2.123291015625, 2.213836669921875, 2.30438232421875, 2.394927978515625, 2.4854736328125, 2.576019287109375, 2.66656494140625, 2.757110595703125, 2.84765625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 2.0, 8.0, 9.0, 4.0, 16.0, 16.0, 18.0, 35.0, 22.0, 30.0, 20.0, 29.0, 21.0, 19.0, 27.0, 24.0, 34.0, 31.0, 31.0, 35.0, 28.0, 30.0, 27.0, 33.0, 29.0, 12.0, 28.0, 29.0, 32.0, 31.0, 36.0, 26.0, 39.0, 24.0, 18.0, 18.0, 19.0, 19.0, 23.0, 14.0, 11.0, 9.0, 11.0, 5.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.15771484375, -0.15285873413085938, -0.14800262451171875, -0.14314651489257812, -0.1382904052734375, -0.13343429565429688, -0.12857818603515625, -0.12372207641601562, -0.118865966796875, -0.11400985717773438, -0.10915374755859375, -0.10429763793945312, -0.0994415283203125, -0.09458541870117188, -0.08972930908203125, -0.08487319946289062, -0.08001708984375, -0.07516098022460938, -0.07030487060546875, -0.06544876098632812, -0.0605926513671875, -0.055736541748046875, -0.05088043212890625, -0.046024322509765625, -0.041168212890625, -0.036312103271484375, -0.03145599365234375, -0.026599884033203125, -0.0217437744140625, -0.016887664794921875, -0.01203155517578125, -0.007175445556640625, -0.0023193359375, 0.002536773681640625, 0.00739288330078125, 0.012248992919921875, 0.0171051025390625, 0.021961212158203125, 0.02681732177734375, 0.031673431396484375, 0.036529541015625, 0.041385650634765625, 0.04624176025390625, 0.051097869873046875, 0.0559539794921875, 0.060810089111328125, 0.06566619873046875, 0.07052230834960938, 0.07537841796875, 0.08023452758789062, 0.08509063720703125, 0.08994674682617188, 0.0948028564453125, 0.09965896606445312, 0.10451507568359375, 0.10937118530273438, 0.114227294921875, 0.11908340454101562, 0.12393951416015625, 0.12879562377929688, 0.1336517333984375, 0.13850784301757812, 0.14336395263671875, 0.14822006225585938, 0.153076171875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 1.0, 7.0, 6.0, 9.0, 7.0, 16.0, 11.0, 23.0, 22.0, 35.0, 27.0, 43.0, 47.0, 90.0, 125.0, 150.0, 210.0, 289.0, 354.0, 393.0, 665.0, 1633.0, 188484.0, 843940.0, 8920.0, 943.0, 500.0, 360.0, 329.0, 242.0, 148.0, 118.0, 79.0, 63.0, 47.0, 44.0, 43.0, 36.0, 26.0, 18.0, 16.0, 8.0, 4.0, 10.0, 3.0, 9.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.60546875, -2.52203369140625, -2.4385986328125, -2.35516357421875, -2.271728515625, -2.18829345703125, -2.1048583984375, -2.02142333984375, -1.93798828125, -1.85455322265625, -1.7711181640625, -1.68768310546875, -1.604248046875, -1.52081298828125, -1.4373779296875, -1.35394287109375, -1.2705078125, -1.18707275390625, -1.1036376953125, -1.02020263671875, -0.936767578125, -0.85333251953125, -0.7698974609375, -0.68646240234375, -0.60302734375, -0.51959228515625, -0.4361572265625, -0.35272216796875, -0.269287109375, -0.18585205078125, -0.1024169921875, -0.01898193359375, 0.064453125, 0.14788818359375, 0.2313232421875, 0.31475830078125, 0.398193359375, 0.48162841796875, 0.5650634765625, 0.64849853515625, 0.73193359375, 0.81536865234375, 0.8988037109375, 0.98223876953125, 1.065673828125, 1.14910888671875, 1.2325439453125, 1.31597900390625, 1.3994140625, 1.48284912109375, 1.5662841796875, 1.64971923828125, 1.733154296875, 1.81658935546875, 1.9000244140625, 1.98345947265625, 2.06689453125, 2.15032958984375, 2.2337646484375, 2.31719970703125, 2.400634765625, 2.48406982421875, 2.5675048828125, 2.65093994140625, 2.734375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 15.0, 132.0, 739.0, 114.0, 9.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.678567409515381, -6.381537437438965, -6.084506988525391, -5.787477016448975, -5.490447044372559, -5.193417072296143, -4.896387100219727, -4.599356651306152, -4.302326679229736, -4.00529670715332, -3.708266496658325, -3.41123628616333, -3.114206314086914, -2.817176342010498, -2.520146131515503, -2.223115921020508, -1.9260859489440918, -1.6290558576583862, -1.3320257663726807, -1.034995675086975, -0.7379655838012695, -0.44093549251556396, -0.1439054012298584, 0.15312480926513672, 0.45015478134155273, 0.7471848726272583, 1.0442149639129639, 1.3412450551986694, 1.638275146484375, 1.9353052377700806, 2.232335329055786, 2.5293655395507812, 2.826395034790039, 3.123425006866455, 3.42045521736145, 3.7174854278564453, 4.014515399932861, 4.311545372009277, 4.608575820922852, 4.905605792999268, 5.202635765075684, 5.4996657371521, 5.796695709228516, 6.09372615814209, 6.390756130218506, 6.687786102294922, 6.984816551208496, 7.281846523284912, 7.578876495361328, 7.875906467437744, 8.17293643951416, 8.469966888427734, 8.766996383666992, 9.064026832580566, 9.36105728149414, 9.658086776733398, 9.955117225646973, 10.252147674560547, 10.549177169799805, 10.846207618713379, 11.143238067626953, 11.440267562866211, 11.737298011779785, 12.03432846069336, 12.331357955932617]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 5.0, 11.0, 4.0, 10.0, 14.0, 17.0, 22.0, 25.0, 30.0, 35.0, 39.0, 38.0, 46.0, 56.0, 59.0, 54.0, 46.0, 60.0, 41.0, 56.0, 44.0, 42.0, 43.0, 42.0, 32.0, 25.0, 29.0, 17.0, 19.0, 15.0, 7.0, 11.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.333892345428467, -2.2619309425354004, -2.189969778060913, -2.1180083751678467, -2.0460469722747803, -1.9740856885910034, -1.9021244049072266, -1.8301630020141602, -1.7582017183303833, -1.6862404346466064, -1.61427903175354, -1.5423177480697632, -1.4703564643859863, -1.39839506149292, -1.326433777809143, -1.2544724941253662, -1.1825110912322998, -1.110549807548523, -1.0385884046554565, -0.9666271209716797, -0.8946657776832581, -0.8227044343948364, -0.7507431507110596, -0.6787818074226379, -0.6068204641342163, -0.5348591208457947, -0.46289780735969543, -0.3909364938735962, -0.31897515058517456, -0.24701380729675293, -0.1750524938106537, -0.10309118032455444, -0.031130075454711914, 0.04083125293254852, 0.11279258131980896, 0.1847539097070694, 0.25671523809432983, 0.32867658138275146, 0.4006378948688507, 0.47259920835494995, 0.5445605516433716, 0.6165218949317932, 0.6884832382202148, 0.7604445219039917, 0.8324058651924133, 0.904367208480835, 0.9763284921646118, 1.0482897758483887, 1.120251178741455, 1.192212462425232, 1.2641738653182983, 1.3361351490020752, 1.4080965518951416, 1.4800578355789185, 1.5520191192626953, 1.6239805221557617, 1.6959418058395386, 1.7679030895233154, 1.8398644924163818, 1.9118257761001587, 1.9837870597839355, 2.055748462677002, 2.1277098655700684, 2.1996710300445557, 2.271632432937622]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 7.0, 9.0, 9.0, 7.0, 15.0, 14.0, 21.0, 35.0, 32.0, 36.0, 36.0, 41.0, 39.0, 31.0, 51.0, 53.0, 38.0, 45.0, 53.0, 40.0, 42.0, 41.0, 43.0, 39.0, 30.0, 28.0, 29.0, 31.0, 24.0, 9.0, 13.0, 9.0, 10.0, 6.0, 11.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5546875, -3.45343017578125, -3.3521728515625, -3.25091552734375, -3.149658203125, -3.04840087890625, -2.9471435546875, -2.84588623046875, -2.74462890625, -2.64337158203125, -2.5421142578125, -2.44085693359375, -2.339599609375, -2.23834228515625, -2.1370849609375, -2.03582763671875, -1.9345703125, -1.83331298828125, -1.7320556640625, -1.63079833984375, -1.529541015625, -1.42828369140625, -1.3270263671875, -1.22576904296875, -1.12451171875, -1.02325439453125, -0.9219970703125, -0.82073974609375, -0.719482421875, -0.61822509765625, -0.5169677734375, -0.41571044921875, -0.314453125, -0.21319580078125, -0.1119384765625, -0.01068115234375, 0.090576171875, 0.19183349609375, 0.2930908203125, 0.39434814453125, 0.49560546875, 0.59686279296875, 0.6981201171875, 0.79937744140625, 0.900634765625, 1.00189208984375, 1.1031494140625, 1.20440673828125, 1.3056640625, 1.40692138671875, 1.5081787109375, 1.60943603515625, 1.710693359375, 1.81195068359375, 1.9132080078125, 2.01446533203125, 2.11572265625, 2.21697998046875, 2.3182373046875, 2.41949462890625, 2.520751953125, 2.62200927734375, 2.7232666015625, 2.82452392578125, 2.92578125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 3.0, 5.0, 5.0, 11.0, 14.0, 13.0, 17.0, 24.0, 32.0, 35.0, 96.0, 195.0, 486.0, 1312.0, 3777.0, 10511.0, 29018.0, 95343.0, 400716.0, 375326.0, 88480.0, 27690.0, 9861.0, 3509.0, 1181.0, 453.0, 170.0, 70.0, 41.0, 31.0, 26.0, 12.0, 21.0, 10.0, 13.0, 7.0, 8.0, 6.0, 2.0, 5.0, 2.0, 0.0, 4.0, 1.0, 3.0, 4.0], "bins": [-6.75390625, -6.57122802734375, -6.3885498046875, -6.20587158203125, -6.023193359375, -5.84051513671875, -5.6578369140625, -5.47515869140625, -5.29248046875, -5.10980224609375, -4.9271240234375, -4.74444580078125, -4.561767578125, -4.37908935546875, -4.1964111328125, -4.01373291015625, -3.8310546875, -3.64837646484375, -3.4656982421875, -3.28302001953125, -3.100341796875, -2.91766357421875, -2.7349853515625, -2.55230712890625, -2.36962890625, -2.18695068359375, -2.0042724609375, -1.82159423828125, -1.638916015625, -1.45623779296875, -1.2735595703125, -1.09088134765625, -0.908203125, -0.72552490234375, -0.5428466796875, -0.36016845703125, -0.177490234375, 0.00518798828125, 0.1878662109375, 0.37054443359375, 0.55322265625, 0.73590087890625, 0.9185791015625, 1.10125732421875, 1.283935546875, 1.46661376953125, 1.6492919921875, 1.83197021484375, 2.0146484375, 2.19732666015625, 2.3800048828125, 2.56268310546875, 2.745361328125, 2.92803955078125, 3.1107177734375, 3.29339599609375, 3.47607421875, 3.65875244140625, 3.8414306640625, 4.02410888671875, 4.206787109375, 4.38946533203125, 4.5721435546875, 4.75482177734375, 4.9375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 4.0, 6.0, 8.0, 10.0, 14.0, 7.0, 17.0, 22.0, 28.0, 16.0, 35.0, 47.0, 31.0, 35.0, 51.0, 67.0, 111.0, 281.0, 1469.0, 215.0, 99.0, 80.0, 48.0, 53.0, 45.0, 36.0, 34.0, 28.0, 24.0, 29.0, 26.0, 11.0, 16.0, 7.0, 7.0, 5.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6484375, -10.272705078125, -9.89697265625, -9.521240234375, -9.1455078125, -8.769775390625, -8.39404296875, -8.018310546875, -7.642578125, -7.266845703125, -6.89111328125, -6.515380859375, -6.1396484375, -5.763916015625, -5.38818359375, -5.012451171875, -4.63671875, -4.260986328125, -3.88525390625, -3.509521484375, -3.1337890625, -2.758056640625, -2.38232421875, -2.006591796875, -1.630859375, -1.255126953125, -0.87939453125, -0.503662109375, -0.1279296875, 0.247802734375, 0.62353515625, 0.999267578125, 1.375, 1.750732421875, 2.12646484375, 2.502197265625, 2.8779296875, 3.253662109375, 3.62939453125, 4.005126953125, 4.380859375, 4.756591796875, 5.13232421875, 5.508056640625, 5.8837890625, 6.259521484375, 6.63525390625, 7.010986328125, 7.38671875, 7.762451171875, 8.13818359375, 8.513916015625, 8.8896484375, 9.265380859375, 9.64111328125, 10.016845703125, 10.392578125, 10.768310546875, 11.14404296875, 11.519775390625, 11.8955078125, 12.271240234375, 12.64697265625, 13.022705078125, 13.3984375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 7.0, 8.0, 6.0, 12.0, 9.0, 10.0, 15.0, 15.0, 28.0, 32.0, 40.0, 40.0, 55.0, 80.0, 129.0, 185.0, 259.0, 559.0, 1586.0, 12653.0, 529384.0, 2556797.0, 39243.0, 2862.0, 689.0, 329.0, 183.0, 119.0, 99.0, 68.0, 44.0, 33.0, 32.0, 20.0, 19.0, 14.0, 12.0, 4.0, 8.0, 6.0, 9.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-22.140625, -21.52880859375, -20.9169921875, -20.30517578125, -19.693359375, -19.08154296875, -18.4697265625, -17.85791015625, -17.24609375, -16.63427734375, -16.0224609375, -15.41064453125, -14.798828125, -14.18701171875, -13.5751953125, -12.96337890625, -12.3515625, -11.73974609375, -11.1279296875, -10.51611328125, -9.904296875, -9.29248046875, -8.6806640625, -8.06884765625, -7.45703125, -6.84521484375, -6.2333984375, -5.62158203125, -5.009765625, -4.39794921875, -3.7861328125, -3.17431640625, -2.5625, -1.95068359375, -1.3388671875, -0.72705078125, -0.115234375, 0.49658203125, 1.1083984375, 1.72021484375, 2.33203125, 2.94384765625, 3.5556640625, 4.16748046875, 4.779296875, 5.39111328125, 6.0029296875, 6.61474609375, 7.2265625, 7.83837890625, 8.4501953125, 9.06201171875, 9.673828125, 10.28564453125, 10.8974609375, 11.50927734375, 12.12109375, 12.73291015625, 13.3447265625, 13.95654296875, 14.568359375, 15.18017578125, 15.7919921875, 16.40380859375, 17.015625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [347.0, 670.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.101202964782715, -0.959681510925293, 7.181839942932129, 15.32336139678955, 23.464881896972656, 31.606403350830078, 39.7479248046875, 47.88944625854492, 56.030967712402344, 64.1724853515625, 72.31401062011719, 80.45553588867188, 88.59705352783203, 96.73857116699219, 104.88009643554688, 113.02162170410156, 121.16313934326172, 129.30465698242188, 137.44618225097656, 145.58770751953125, 153.72921752929688, 161.87074279785156, 170.01226806640625, 178.15379333496094, 186.29531860351562, 194.4368438720703, 202.578369140625, 210.71987915039062, 218.8614044189453, 227.0029296875, 235.14443969726562, 243.2859649658203, 251.42745971679688, 259.5689697265625, 267.71051025390625, 275.8520202636719, 283.9935302734375, 292.13507080078125, 300.2765808105469, 308.4181213378906, 316.55963134765625, 324.7011413574219, 332.8426818847656, 340.98419189453125, 349.125732421875, 357.2672424316406, 365.40875244140625, 373.55029296875, 381.6918029785156, 389.83331298828125, 397.974853515625, 406.1163635253906, 414.25787353515625, 422.3994140625, 430.5409240722656, 438.6824645996094, 446.823974609375, 454.9654846191406, 463.1070251464844, 471.24853515625, 479.39007568359375, 487.5315856933594, 495.673095703125, 503.81463623046875, 511.9561462402344]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 3.0, 4.0, 9.0, 8.0, 7.0, 12.0, 14.0, 13.0, 15.0, 17.0, 19.0, 22.0, 23.0, 20.0, 29.0, 25.0, 26.0, 30.0, 41.0, 28.0, 47.0, 37.0, 39.0, 52.0, 38.0, 41.0, 29.0, 34.0, 28.0, 34.0, 39.0, 24.0, 29.0, 22.0, 26.0, 15.0, 14.0, 16.0, 15.0, 14.0, 7.0, 9.0, 3.0, 9.0, 6.0, 3.0, 4.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.543285369873047, -24.68453025817871, -23.825773239135742, -22.967018127441406, -22.108261108398438, -21.2495059967041, -20.390750885009766, -19.531993865966797, -18.673236846923828, -17.814481735229492, -16.955724716186523, -16.096969604492188, -15.238212585449219, -14.379457473754883, -13.52070140838623, -12.661945343017578, -11.803190231323242, -10.94443416595459, -10.085678100585938, -9.226922988891602, -8.368165969848633, -7.509410381317139, -6.6506547927856445, -5.791898727416992, -4.93314266204834, -4.0743865966796875, -3.2156307697296143, -2.356874942779541, -1.4981188774108887, -0.6393628120422363, 0.2193927764892578, 1.0781488418579102, 1.9369068145751953, 2.7956628799438477, 3.654418706893921, 4.513174533843994, 5.3719305992126465, 6.230686664581299, 7.089442253112793, 7.948198318481445, 8.806954383850098, 9.66571044921875, 10.524466514587402, 11.383222579956055, 12.24197769165039, 13.10073471069336, 13.959489822387695, 14.818245887756348, 15.677001953125, 16.535757064819336, 17.394514083862305, 18.25326919555664, 19.11202621459961, 19.970781326293945, 20.82953643798828, 21.68829345703125, 22.54705047607422, 23.405805587768555, 24.264562606811523, 25.12331771850586, 25.982074737548828, 26.840829849243164, 27.6995849609375, 28.55834197998047, 29.417097091674805]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 8.0, 8.0, 6.0, 12.0, 14.0, 18.0, 15.0, 16.0, 16.0, 24.0, 25.0, 29.0, 35.0, 36.0, 40.0, 45.0, 44.0, 38.0, 38.0, 39.0, 38.0, 38.0, 41.0, 44.0, 39.0, 32.0, 35.0, 36.0, 35.0, 18.0, 30.0, 26.0, 16.0, 12.0, 12.0, 10.0, 11.0, 3.0, 3.0, 4.0, 3.0, 4.0, 5.0, 0.0, 1.0, 5.0, 1.0], "bins": [-3.517578125, -3.4219970703125, -3.326416015625, -3.2308349609375, -3.13525390625, -3.0396728515625, -2.944091796875, -2.8485107421875, -2.7529296875, -2.6573486328125, -2.561767578125, -2.4661865234375, -2.37060546875, -2.2750244140625, -2.179443359375, -2.0838623046875, -1.98828125, -1.8927001953125, -1.797119140625, -1.7015380859375, -1.60595703125, -1.5103759765625, -1.414794921875, -1.3192138671875, -1.2236328125, -1.1280517578125, -1.032470703125, -0.9368896484375, -0.84130859375, -0.7457275390625, -0.650146484375, -0.5545654296875, -0.458984375, -0.3634033203125, -0.267822265625, -0.1722412109375, -0.07666015625, 0.0189208984375, 0.114501953125, 0.2100830078125, 0.3056640625, 0.4012451171875, 0.496826171875, 0.5924072265625, 0.68798828125, 0.7835693359375, 0.879150390625, 0.9747314453125, 1.0703125, 1.1658935546875, 1.261474609375, 1.3570556640625, 1.45263671875, 1.5482177734375, 1.643798828125, 1.7393798828125, 1.8349609375, 1.9305419921875, 2.026123046875, 2.1217041015625, 2.21728515625, 2.3128662109375, 2.408447265625, 2.5040283203125, 2.599609375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 6.0, 8.0, 3.0, 11.0, 14.0, 13.0, 18.0, 25.0, 28.0, 29.0, 45.0, 38.0, 39.0, 63.0, 76.0, 93.0, 263.0, 798.0, 4667.0, 37810.0, 507057.0, 2982015.0, 609529.0, 44678.0, 5227.0, 913.0, 268.0, 129.0, 96.0, 71.0, 49.0, 41.0, 34.0, 34.0, 23.0, 16.0, 16.0, 7.0, 10.0, 5.0, 4.0, 4.0, 9.0, 2.0, 1.0, 5.0, 5.0], "bins": [-11.6953125, -11.39178466796875, -11.0882568359375, -10.78472900390625, -10.481201171875, -10.17767333984375, -9.8741455078125, -9.57061767578125, -9.26708984375, -8.96356201171875, -8.6600341796875, -8.35650634765625, -8.052978515625, -7.74945068359375, -7.4459228515625, -7.14239501953125, -6.8388671875, -6.53533935546875, -6.2318115234375, -5.92828369140625, -5.624755859375, -5.32122802734375, -5.0177001953125, -4.71417236328125, -4.41064453125, -4.10711669921875, -3.8035888671875, -3.50006103515625, -3.196533203125, -2.89300537109375, -2.5894775390625, -2.28594970703125, -1.982421875, -1.67889404296875, -1.3753662109375, -1.07183837890625, -0.768310546875, -0.46478271484375, -0.1612548828125, 0.14227294921875, 0.44580078125, 0.74932861328125, 1.0528564453125, 1.35638427734375, 1.659912109375, 1.96343994140625, 2.2669677734375, 2.57049560546875, 2.8740234375, 3.17755126953125, 3.4810791015625, 3.78460693359375, 4.088134765625, 4.39166259765625, 4.6951904296875, 4.99871826171875, 5.30224609375, 5.60577392578125, 5.9093017578125, 6.21282958984375, 6.516357421875, 6.81988525390625, 7.1234130859375, 7.42694091796875, 7.73046875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 4.0, 9.0, 12.0, 10.0, 23.0, 31.0, 39.0, 58.0, 102.0, 135.0, 208.0, 299.0, 418.0, 531.0, 570.0, 455.0, 345.0, 259.0, 180.0, 143.0, 75.0, 57.0, 38.0, 21.0, 20.0, 7.0, 9.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5859375, -6.3140869140625, -6.042236328125, -5.7703857421875, -5.49853515625, -5.2266845703125, -4.954833984375, -4.6829833984375, -4.4111328125, -4.1392822265625, -3.867431640625, -3.5955810546875, -3.32373046875, -3.0518798828125, -2.780029296875, -2.5081787109375, -2.236328125, -1.9644775390625, -1.692626953125, -1.4207763671875, -1.14892578125, -0.8770751953125, -0.605224609375, -0.3333740234375, -0.0615234375, 0.2103271484375, 0.482177734375, 0.7540283203125, 1.02587890625, 1.2977294921875, 1.569580078125, 1.8414306640625, 2.11328125, 2.3851318359375, 2.656982421875, 2.9288330078125, 3.20068359375, 3.4725341796875, 3.744384765625, 4.0162353515625, 4.2880859375, 4.5599365234375, 4.831787109375, 5.1036376953125, 5.37548828125, 5.6473388671875, 5.919189453125, 6.1910400390625, 6.462890625, 6.7347412109375, 7.006591796875, 7.2784423828125, 7.55029296875, 7.8221435546875, 8.093994140625, 8.3658447265625, 8.6376953125, 8.9095458984375, 9.181396484375, 9.4532470703125, 9.72509765625, 9.9969482421875, 10.268798828125, 10.5406494140625, 10.8125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 8.0, 10.0, 12.0, 13.0, 12.0, 32.0, 46.0, 62.0, 105.0, 190.0, 298.0, 696.0, 2713.0, 37777.0, 1541656.0, 2535920.0, 69310.0, 3714.0, 856.0, 336.0, 175.0, 128.0, 73.0, 29.0, 32.0, 27.0, 15.0, 15.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.640625, -23.99365234375, -23.3466796875, -22.69970703125, -22.052734375, -21.40576171875, -20.7587890625, -20.11181640625, -19.46484375, -18.81787109375, -18.1708984375, -17.52392578125, -16.876953125, -16.22998046875, -15.5830078125, -14.93603515625, -14.2890625, -13.64208984375, -12.9951171875, -12.34814453125, -11.701171875, -11.05419921875, -10.4072265625, -9.76025390625, -9.11328125, -8.46630859375, -7.8193359375, -7.17236328125, -6.525390625, -5.87841796875, -5.2314453125, -4.58447265625, -3.9375, -3.29052734375, -2.6435546875, -1.99658203125, -1.349609375, -0.70263671875, -0.0556640625, 0.59130859375, 1.23828125, 1.88525390625, 2.5322265625, 3.17919921875, 3.826171875, 4.47314453125, 5.1201171875, 5.76708984375, 6.4140625, 7.06103515625, 7.7080078125, 8.35498046875, 9.001953125, 9.64892578125, 10.2958984375, 10.94287109375, 11.58984375, 12.23681640625, 12.8837890625, 13.53076171875, 14.177734375, 14.82470703125, 15.4716796875, 16.11865234375, 16.765625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 14.0, 64.0, 204.0, 320.0, 275.0, 109.0, 21.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.72312927246094, -143.0154266357422, -139.30770874023438, -135.60000610351562, -131.8922882080078, -128.18458557128906, -124.47687530517578, -120.7691650390625, -117.06145477294922, -113.35374450683594, -109.64603424072266, -105.93832397460938, -102.23062133789062, -98.52290344238281, -94.81520080566406, -91.10749053955078, -87.3997802734375, -83.69207000732422, -79.98435974121094, -76.27664947509766, -72.56893920898438, -68.86123657226562, -65.15352630615234, -61.44581604003906, -57.73810577392578, -54.0303955078125, -50.32268524169922, -46.6149787902832, -42.90726852416992, -39.19955825805664, -35.491851806640625, -31.784141540527344, -28.076431274414062, -24.36872100830078, -20.661012649536133, -16.953304290771484, -13.245594024658203, -9.537883758544922, -5.830175399780273, -2.122467041015625, 1.5852432250976562, 5.292952537536621, 9.000661849975586, 12.70837116241455, 16.416080474853516, 20.123790740966797, 23.831499099731445, 27.539207458496094, 31.246917724609375, 34.954627990722656, 38.66233825683594, 42.37004470825195, 46.077754974365234, 49.785465240478516, 53.49317169189453, 57.20088195800781, 60.908592224121094, 64.61630249023438, 68.32401275634766, 72.03172302246094, 75.73942565917969, 79.4471435546875, 83.15484619140625, 86.86255645751953, 90.57026672363281]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 7.0, 7.0, 4.0, 12.0, 8.0, 3.0, 9.0, 13.0, 16.0, 13.0, 20.0, 19.0, 33.0, 26.0, 32.0, 26.0, 34.0, 34.0, 30.0, 26.0, 39.0, 36.0, 43.0, 48.0, 47.0, 37.0, 47.0, 41.0, 37.0, 34.0, 32.0, 22.0, 23.0, 31.0, 14.0, 18.0, 11.0, 14.0, 9.0, 12.0, 12.0, 3.0, 3.0, 4.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-21.722326278686523, -21.022445678710938, -20.32256507873535, -19.622684478759766, -18.922801971435547, -18.22292137145996, -17.523040771484375, -16.82316017150879, -16.123279571533203, -15.423398971557617, -14.723518371582031, -14.023636817932129, -13.323756217956543, -12.623875617980957, -11.923994064331055, -11.224113464355469, -10.524232864379883, -9.824352264404297, -9.124471664428711, -8.424590110778809, -7.724709510803223, -7.024828910827637, -6.324947834014893, -5.625066757202148, -4.9251861572265625, -4.225305557250977, -3.5254244804382324, -2.8255436420440674, -2.1256628036499023, -1.4257819652557373, -0.7259011268615723, -0.026020050048828125, 0.6738605499267578, 1.3737413883209229, 2.073622226715088, 2.773503065109253, 3.473383903503418, 4.173264503479004, 4.873145580291748, 5.573026657104492, 6.272907257080078, 6.972787857055664, 7.672668933868408, 8.372550010681152, 9.072430610656738, 9.772311210632324, 10.472192764282227, 11.172073364257812, 11.871953964233398, 12.571834564208984, 13.27171516418457, 13.971596717834473, 14.671477317810059, 15.371357917785645, 16.071239471435547, 16.771120071411133, 17.47100067138672, 18.170881271362305, 18.87076187133789, 19.570642471313477, 20.270523071289062, 20.97040557861328, 21.670286178588867, 22.370166778564453, 23.07004737854004]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 5.0, 6.0, 4.0, 10.0, 9.0, 10.0, 13.0, 20.0, 16.0, 32.0, 25.0, 38.0, 34.0, 38.0, 27.0, 28.0, 32.0, 43.0, 46.0, 49.0, 42.0, 45.0, 50.0, 53.0, 31.0, 41.0, 35.0, 38.0, 29.0, 23.0, 20.0, 18.0, 18.0, 10.0, 10.0, 10.0, 12.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.490234375, -3.39306640625, -3.2958984375, -3.19873046875, -3.1015625, -3.00439453125, -2.9072265625, -2.81005859375, -2.712890625, -2.61572265625, -2.5185546875, -2.42138671875, -2.32421875, -2.22705078125, -2.1298828125, -2.03271484375, -1.935546875, -1.83837890625, -1.7412109375, -1.64404296875, -1.546875, -1.44970703125, -1.3525390625, -1.25537109375, -1.158203125, -1.06103515625, -0.9638671875, -0.86669921875, -0.76953125, -0.67236328125, -0.5751953125, -0.47802734375, -0.380859375, -0.28369140625, -0.1865234375, -0.08935546875, 0.0078125, 0.10498046875, 0.2021484375, 0.29931640625, 0.396484375, 0.49365234375, 0.5908203125, 0.68798828125, 0.78515625, 0.88232421875, 0.9794921875, 1.07666015625, 1.173828125, 1.27099609375, 1.3681640625, 1.46533203125, 1.5625, 1.65966796875, 1.7568359375, 1.85400390625, 1.951171875, 2.04833984375, 2.1455078125, 2.24267578125, 2.33984375, 2.43701171875, 2.5341796875, 2.63134765625, 2.728515625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 5.0, 17.0, 32.0, 57.0, 82.0, 116.0, 237.0, 378.0, 597.0, 1107.0, 1829.0, 2881.0, 4522.0, 7102.0, 10561.0, 15945.0, 22982.0, 32123.0, 43119.0, 55793.0, 68344.0, 80500.0, 89865.0, 96020.0, 95298.0, 87973.0, 78575.0, 65698.0, 53254.0, 40564.0, 29987.0, 21218.0, 14813.0, 9893.0, 6463.0, 4019.0, 2579.0, 1666.0, 984.0, 585.0, 314.0, 197.0, 110.0, 52.0, 46.0, 17.0, 18.0, 7.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.216796875, -1.1774139404296875, -1.138031005859375, -1.0986480712890625, -1.05926513671875, -1.0198822021484375, -0.980499267578125, -0.9411163330078125, -0.9017333984375, -0.8623504638671875, -0.822967529296875, -0.7835845947265625, -0.74420166015625, -0.7048187255859375, -0.665435791015625, -0.6260528564453125, -0.586669921875, -0.5472869873046875, -0.507904052734375, -0.4685211181640625, -0.42913818359375, -0.3897552490234375, -0.350372314453125, -0.3109893798828125, -0.2716064453125, -0.2322235107421875, -0.192840576171875, -0.1534576416015625, -0.11407470703125, -0.0746917724609375, -0.035308837890625, 0.0040740966796875, 0.04345703125, 0.0828399658203125, 0.122222900390625, 0.1616058349609375, 0.20098876953125, 0.2403717041015625, 0.279754638671875, 0.3191375732421875, 0.3585205078125, 0.3979034423828125, 0.437286376953125, 0.4766693115234375, 0.51605224609375, 0.5554351806640625, 0.594818115234375, 0.6342010498046875, 0.673583984375, 0.7129669189453125, 0.752349853515625, 0.7917327880859375, 0.83111572265625, 0.8704986572265625, 0.909881591796875, 0.9492645263671875, 0.9886474609375, 1.0280303955078125, 1.067413330078125, 1.1067962646484375, 1.14617919921875, 1.1855621337890625, 1.224945068359375, 1.2643280029296875, 1.3037109375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 9.0, 4.0, 7.0, 8.0, 10.0, 12.0, 18.0, 22.0, 15.0, 22.0, 33.0, 32.0, 28.0, 32.0, 32.0, 33.0, 38.0, 34.0, 49.0, 50.0, 1009.0, 76.0, 42.0, 41.0, 34.0, 32.0, 34.0, 30.0, 34.0, 25.0, 16.0, 21.0, 23.0, 19.0, 17.0, 9.0, 20.0, 15.0, 9.0, 2.0, 6.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.73828125, -2.647003173828125, -2.55572509765625, -2.464447021484375, -2.3731689453125, -2.281890869140625, -2.19061279296875, -2.099334716796875, -2.008056640625, -1.916778564453125, -1.82550048828125, -1.734222412109375, -1.6429443359375, -1.551666259765625, -1.46038818359375, -1.369110107421875, -1.27783203125, -1.186553955078125, -1.09527587890625, -1.003997802734375, -0.9127197265625, -0.821441650390625, -0.73016357421875, -0.638885498046875, -0.547607421875, -0.456329345703125, -0.36505126953125, -0.273773193359375, -0.1824951171875, -0.091217041015625, 6.103515625e-05, 0.091339111328125, 0.1826171875, 0.273895263671875, 0.36517333984375, 0.456451416015625, 0.5477294921875, 0.639007568359375, 0.73028564453125, 0.821563720703125, 0.912841796875, 1.004119873046875, 1.09539794921875, 1.186676025390625, 1.2779541015625, 1.369232177734375, 1.46051025390625, 1.551788330078125, 1.64306640625, 1.734344482421875, 1.82562255859375, 1.916900634765625, 2.0081787109375, 2.099456787109375, 2.19073486328125, 2.282012939453125, 2.373291015625, 2.464569091796875, 2.55584716796875, 2.647125244140625, 2.7384033203125, 2.829681396484375, 2.92095947265625, 3.012237548828125, 3.103515625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 10.0, 9.0, 23.0, 21.0, 41.0, 66.0, 91.0, 143.0, 211.0, 323.0, 502.0, 768.0, 1169.0, 1732.0, 2587.0, 3762.0, 5492.0, 8368.0, 12318.0, 19237.0, 35147.0, 284784.0, 1609614.0, 46403.0, 22028.0, 14039.0, 9305.0, 6187.0, 4149.0, 2866.0, 1952.0, 1220.0, 865.0, 602.0, 392.0, 247.0, 158.0, 107.0, 79.0, 41.0, 28.0, 17.0, 11.0, 8.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.96875, -2.8734130859375, -2.778076171875, -2.6827392578125, -2.58740234375, -2.4920654296875, -2.396728515625, -2.3013916015625, -2.2060546875, -2.1107177734375, -2.015380859375, -1.9200439453125, -1.82470703125, -1.7293701171875, -1.634033203125, -1.5386962890625, -1.443359375, -1.3480224609375, -1.252685546875, -1.1573486328125, -1.06201171875, -0.9666748046875, -0.871337890625, -0.7760009765625, -0.6806640625, -0.5853271484375, -0.489990234375, -0.3946533203125, -0.29931640625, -0.2039794921875, -0.108642578125, -0.0133056640625, 0.08203125, 0.1773681640625, 0.272705078125, 0.3680419921875, 0.46337890625, 0.5587158203125, 0.654052734375, 0.7493896484375, 0.8447265625, 0.9400634765625, 1.035400390625, 1.1307373046875, 1.22607421875, 1.3214111328125, 1.416748046875, 1.5120849609375, 1.607421875, 1.7027587890625, 1.798095703125, 1.8934326171875, 1.98876953125, 2.0841064453125, 2.179443359375, 2.2747802734375, 2.3701171875, 2.4654541015625, 2.560791015625, 2.6561279296875, 2.75146484375, 2.8468017578125, 2.942138671875, 3.0374755859375, 3.1328125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 1.0, 7.0, 5.0, 8.0, 9.0, 14.0, 17.0, 31.0, 41.0, 52.0, 51.0, 57.0, 59.0, 56.0, 72.0, 72.0, 60.0, 46.0, 57.0, 57.0, 52.0, 43.0, 33.0, 20.0, 18.0, 19.0, 11.0, 10.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2132568359375, -0.20509910583496094, -0.19694137573242188, -0.1887836456298828, -0.18062591552734375, -0.1724681854248047, -0.16431045532226562, -0.15615272521972656, -0.1479949951171875, -0.13983726501464844, -0.13167953491210938, -0.12352180480957031, -0.11536407470703125, -0.10720634460449219, -0.09904861450195312, -0.09089088439941406, -0.082733154296875, -0.07457542419433594, -0.06641769409179688, -0.05825996398925781, -0.05010223388671875, -0.04194450378417969, -0.033786773681640625, -0.025629043579101562, -0.0174713134765625, -0.009313583374023438, -0.001155853271484375, 0.0070018768310546875, 0.01515960693359375, 0.023317337036132812, 0.031475067138671875, 0.03963279724121094, 0.04779052734375, 0.05594825744628906, 0.06410598754882812, 0.07226371765136719, 0.08042144775390625, 0.08857917785644531, 0.09673690795898438, 0.10489463806152344, 0.1130523681640625, 0.12121009826660156, 0.12936782836914062, 0.1375255584716797, 0.14568328857421875, 0.1538410186767578, 0.16199874877929688, 0.17015647888183594, 0.178314208984375, 0.18647193908691406, 0.19462966918945312, 0.2027873992919922, 0.21094512939453125, 0.2191028594970703, 0.22726058959960938, 0.23541831970214844, 0.2435760498046875, 0.25173377990722656, 0.2598915100097656, 0.2680492401123047, 0.27620697021484375, 0.2843647003173828, 0.2925224304199219, 0.30068016052246094, 0.308837890625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 4.0, 5.0, 6.0, 23.0, 16.0, 32.0, 39.0, 67.0, 95.0, 189.0, 317.0, 711.0, 2929.0, 816079.0, 224754.0, 1951.0, 640.0, 292.0, 136.0, 95.0, 58.0, 44.0, 10.0, 17.0, 11.0, 9.0, 5.0, 3.0, 2.0, 5.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 4.0], "bins": [-6.15625, -6.001953125, -5.84765625, -5.693359375, -5.5390625, -5.384765625, -5.23046875, -5.076171875, -4.921875, -4.767578125, -4.61328125, -4.458984375, -4.3046875, -4.150390625, -3.99609375, -3.841796875, -3.6875, -3.533203125, -3.37890625, -3.224609375, -3.0703125, -2.916015625, -2.76171875, -2.607421875, -2.453125, -2.298828125, -2.14453125, -1.990234375, -1.8359375, -1.681640625, -1.52734375, -1.373046875, -1.21875, -1.064453125, -0.91015625, -0.755859375, -0.6015625, -0.447265625, -0.29296875, -0.138671875, 0.015625, 0.169921875, 0.32421875, 0.478515625, 0.6328125, 0.787109375, 0.94140625, 1.095703125, 1.25, 1.404296875, 1.55859375, 1.712890625, 1.8671875, 2.021484375, 2.17578125, 2.330078125, 2.484375, 2.638671875, 2.79296875, 2.947265625, 3.1015625, 3.255859375, 3.41015625, 3.564453125, 3.71875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 4.0, 17.0, 54.0, 207.0, 482.0, 177.0, 44.0, 16.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.186920642852783, -7.032151699066162, -6.877382755279541, -6.722614288330078, -6.567845344543457, -6.413076400756836, -6.258307456970215, -6.103538513183594, -5.948769569396973, -5.794000625610352, -5.6392316818237305, -5.484462738037109, -5.3296942710876465, -5.174925327301025, -5.020156383514404, -4.865387439727783, -4.71061897277832, -4.555850028991699, -4.401081085205078, -4.246312141418457, -4.091543674468994, -3.936774730682373, -3.782005786895752, -3.627236843109131, -3.4724678993225098, -3.3176989555358887, -3.1629302501678467, -3.0081613063812256, -2.8533923625946045, -2.6986236572265625, -2.5438547134399414, -2.3890857696533203, -2.23431658744812, -2.079547643661499, -1.9247788190841675, -1.770009994506836, -1.6152410507202148, -1.4604722261428833, -1.3057034015655518, -1.1509344577789307, -0.9961656332015991, -0.8413967490196228, -0.6866278648376465, -0.5318590402603149, -0.3770901560783386, -0.2223212718963623, -0.06755244731903076, 0.08721649646759033, 0.24198532104492188, 0.3967542052268982, 0.5515230894088745, 0.706291913986206, 0.8610607981681824, 1.0158296823501587, 1.1705985069274902, 1.3253674507141113, 1.4801362752914429, 1.6349050998687744, 1.7896740436553955, 1.944442868232727, 2.0992116928100586, 2.2539806365966797, 2.408749580383301, 2.563518524169922, 2.718287229537964]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 5.0, 6.0, 11.0, 11.0, 14.0, 16.0, 19.0, 21.0, 29.0, 33.0, 32.0, 29.0, 38.0, 38.0, 40.0, 44.0, 48.0, 40.0, 44.0, 46.0, 46.0, 39.0, 39.0, 32.0, 28.0, 35.0, 30.0, 31.0, 29.0, 16.0, 17.0, 20.0, 14.0, 12.0, 15.0, 5.0, 7.0, 8.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3741886615753174, -1.3238097429275513, -1.2734308242797852, -1.223051905632019, -1.172672986984253, -1.1222940683364868, -1.0719151496887207, -1.0215362310409546, -0.9711573123931885, -0.9207783937454224, -0.8703994750976562, -0.8200205564498901, -0.769641637802124, -0.7192627191543579, -0.6688838005065918, -0.6185048818588257, -0.5681259632110596, -0.5177470445632935, -0.46736812591552734, -0.41698920726776123, -0.3666102886199951, -0.316231369972229, -0.2658524513244629, -0.21547353267669678, -0.16509461402893066, -0.11471569538116455, -0.06433677673339844, -0.013957858085632324, 0.03642106056213379, 0.0867999792098999, 0.13717889785766602, 0.18755781650543213, 0.23793673515319824, 0.28831565380096436, 0.33869457244873047, 0.3890734910964966, 0.4394524097442627, 0.4898313283920288, 0.5402102470397949, 0.590589165687561, 0.6409680843353271, 0.6913470029830933, 0.7417259216308594, 0.7921048402786255, 0.8424837589263916, 0.8928626775741577, 0.9432415962219238, 0.9936205148696899, 1.043999433517456, 1.0943783521652222, 1.1447572708129883, 1.1951361894607544, 1.2455151081085205, 1.2958940267562866, 1.3462729454040527, 1.3966518640518188, 1.447030782699585, 1.497409701347351, 1.5477886199951172, 1.5981675386428833, 1.6485464572906494, 1.6989253759384155, 1.7493042945861816, 1.7996832132339478, 1.8500621318817139]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 6.0, 3.0, 4.0, 3.0, 8.0, 9.0, 6.0, 7.0, 11.0, 15.0, 21.0, 20.0, 17.0, 30.0, 25.0, 31.0, 33.0, 34.0, 35.0, 40.0, 38.0, 47.0, 50.0, 47.0, 53.0, 43.0, 41.0, 41.0, 39.0, 44.0, 28.0, 26.0, 23.0, 25.0, 25.0, 14.0, 14.0, 8.0, 7.0, 10.0, 7.0, 5.0, 6.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.634765625, -3.533721923828125, -3.43267822265625, -3.331634521484375, -3.2305908203125, -3.129547119140625, -3.02850341796875, -2.927459716796875, -2.826416015625, -2.725372314453125, -2.62432861328125, -2.523284912109375, -2.4222412109375, -2.321197509765625, -2.22015380859375, -2.119110107421875, -2.01806640625, -1.917022705078125, -1.81597900390625, -1.714935302734375, -1.6138916015625, -1.512847900390625, -1.41180419921875, -1.310760498046875, -1.209716796875, -1.108673095703125, -1.00762939453125, -0.906585693359375, -0.8055419921875, -0.704498291015625, -0.60345458984375, -0.502410888671875, -0.4013671875, -0.300323486328125, -0.19927978515625, -0.098236083984375, 0.0028076171875, 0.103851318359375, 0.20489501953125, 0.305938720703125, 0.406982421875, 0.508026123046875, 0.60906982421875, 0.710113525390625, 0.8111572265625, 0.912200927734375, 1.01324462890625, 1.114288330078125, 1.21533203125, 1.316375732421875, 1.41741943359375, 1.518463134765625, 1.6195068359375, 1.720550537109375, 1.82159423828125, 1.922637939453125, 2.023681640625, 2.124725341796875, 2.22576904296875, 2.326812744140625, 2.4278564453125, 2.528900146484375, 2.62994384765625, 2.730987548828125, 2.83203125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 8.0, 17.0, 24.0, 35.0, 46.0, 84.0, 128.0, 200.0, 329.0, 494.0, 750.0, 1170.0, 1749.0, 2713.0, 4125.0, 6383.0, 9705.0, 15246.0, 24840.0, 41638.0, 77375.0, 155496.0, 262570.0, 205058.0, 102856.0, 53161.0, 30200.0, 18737.0, 11688.0, 7691.0, 4835.0, 3228.0, 2082.0, 1339.0, 887.0, 592.0, 373.0, 209.0, 166.0, 119.0, 72.0, 41.0, 32.0, 20.0, 13.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.1875, -2.113861083984375, -2.04022216796875, -1.966583251953125, -1.8929443359375, -1.819305419921875, -1.74566650390625, -1.672027587890625, -1.598388671875, -1.524749755859375, -1.45111083984375, -1.377471923828125, -1.3038330078125, -1.230194091796875, -1.15655517578125, -1.082916259765625, -1.00927734375, -0.935638427734375, -0.86199951171875, -0.788360595703125, -0.7147216796875, -0.641082763671875, -0.56744384765625, -0.493804931640625, -0.420166015625, -0.346527099609375, -0.27288818359375, -0.199249267578125, -0.1256103515625, -0.051971435546875, 0.02166748046875, 0.095306396484375, 0.1689453125, 0.242584228515625, 0.31622314453125, 0.389862060546875, 0.4635009765625, 0.537139892578125, 0.61077880859375, 0.684417724609375, 0.758056640625, 0.831695556640625, 0.90533447265625, 0.978973388671875, 1.0526123046875, 1.126251220703125, 1.19989013671875, 1.273529052734375, 1.34716796875, 1.420806884765625, 1.49444580078125, 1.568084716796875, 1.6417236328125, 1.715362548828125, 1.78900146484375, 1.862640380859375, 1.936279296875, 2.009918212890625, 2.08355712890625, 2.157196044921875, 2.2308349609375, 2.304473876953125, 2.37811279296875, 2.451751708984375, 2.525390625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 10.0, 7.0, 13.0, 12.0, 8.0, 12.0, 23.0, 17.0, 22.0, 26.0, 38.0, 41.0, 49.0, 39.0, 45.0, 63.0, 118.0, 244.0, 1454.0, 258.0, 110.0, 59.0, 51.0, 34.0, 43.0, 51.0, 23.0, 27.0, 19.0, 25.0, 14.0, 19.0, 16.0, 13.0, 13.0, 4.0, 9.0, 4.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.4765625, -10.094970703125, -9.71337890625, -9.331787109375, -8.9501953125, -8.568603515625, -8.18701171875, -7.805419921875, -7.423828125, -7.042236328125, -6.66064453125, -6.279052734375, -5.8974609375, -5.515869140625, -5.13427734375, -4.752685546875, -4.37109375, -3.989501953125, -3.60791015625, -3.226318359375, -2.8447265625, -2.463134765625, -2.08154296875, -1.699951171875, -1.318359375, -0.936767578125, -0.55517578125, -0.173583984375, 0.2080078125, 0.589599609375, 0.97119140625, 1.352783203125, 1.734375, 2.115966796875, 2.49755859375, 2.879150390625, 3.2607421875, 3.642333984375, 4.02392578125, 4.405517578125, 4.787109375, 5.168701171875, 5.55029296875, 5.931884765625, 6.3134765625, 6.695068359375, 7.07666015625, 7.458251953125, 7.83984375, 8.221435546875, 8.60302734375, 8.984619140625, 9.3662109375, 9.747802734375, 10.12939453125, 10.510986328125, 10.892578125, 11.274169921875, 11.65576171875, 12.037353515625, 12.4189453125, 12.800537109375, 13.18212890625, 13.563720703125, 13.9453125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 2.0, 7.0, 16.0, 29.0, 36.0, 68.0, 87.0, 155.0, 250.0, 561.0, 2935.0, 1840854.0, 1296862.0, 2653.0, 558.0, 248.0, 136.0, 91.0, 48.0, 33.0, 21.0, 19.0, 11.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.15625, -33.89990234375, -32.6435546875, -31.38720703125, -30.130859375, -28.87451171875, -27.6181640625, -26.36181640625, -25.10546875, -23.84912109375, -22.5927734375, -21.33642578125, -20.080078125, -18.82373046875, -17.5673828125, -16.31103515625, -15.0546875, -13.79833984375, -12.5419921875, -11.28564453125, -10.029296875, -8.77294921875, -7.5166015625, -6.26025390625, -5.00390625, -3.74755859375, -2.4912109375, -1.23486328125, 0.021484375, 1.27783203125, 2.5341796875, 3.79052734375, 5.046875, 6.30322265625, 7.5595703125, 8.81591796875, 10.072265625, 11.32861328125, 12.5849609375, 13.84130859375, 15.09765625, 16.35400390625, 17.6103515625, 18.86669921875, 20.123046875, 21.37939453125, 22.6357421875, 23.89208984375, 25.1484375, 26.40478515625, 27.6611328125, 28.91748046875, 30.173828125, 31.43017578125, 32.6865234375, 33.94287109375, 35.19921875, 36.45556640625, 37.7119140625, 38.96826171875, 40.224609375, 41.48095703125, 42.7373046875, 43.99365234375, 45.25]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 120.0, 841.0, 57.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.01042938232422, -49.17369842529297, -43.33696746826172, -37.500240325927734, -31.663509368896484, -25.826778411865234, -19.99005126953125, -14.1533203125, -8.31658935546875, -2.4798593521118164, 3.356870651245117, 9.193599700927734, 15.030330657958984, 20.867061614990234, 26.70378875732422, 32.54051971435547, 38.37725067138672, 44.21398162841797, 50.05071258544922, 55.8874397277832, 61.72417068481445, 67.56089782714844, 73.39762878417969, 79.23435974121094, 85.07109069824219, 90.90782165527344, 96.74455261230469, 102.58128356933594, 108.41801452636719, 114.25474548339844, 120.09146881103516, 125.9281997680664, 131.76492309570312, 137.60165405273438, 143.43838500976562, 149.27511596679688, 155.11184692382812, 160.94857788085938, 166.78530883789062, 172.62203979492188, 178.45877075195312, 184.29550170898438, 190.13223266601562, 195.96896362304688, 201.80569458007812, 207.64242553710938, 213.47915649414062, 219.31588745117188, 225.15260314941406, 230.9893341064453, 236.82606506347656, 242.6627960205078, 248.49952697753906, 254.3362579345703, 260.1729736328125, 266.00970458984375, 271.846435546875, 277.68316650390625, 283.5198974609375, 289.35662841796875, 295.193359375, 301.03009033203125, 306.8668212890625, 312.70355224609375, 318.540283203125]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 7.0, 2.0, 3.0, 6.0, 10.0, 10.0, 15.0, 16.0, 9.0, 19.0, 29.0, 28.0, 21.0, 29.0, 29.0, 31.0, 30.0, 43.0, 41.0, 47.0, 48.0, 40.0, 47.0, 37.0, 41.0, 35.0, 38.0, 44.0, 34.0, 25.0, 26.0, 19.0, 23.0, 23.0, 17.0, 20.0, 13.0, 10.0, 12.0, 5.0, 3.0, 9.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.26657485961914, -32.225852966308594, -31.18513298034668, -30.144412994384766, -29.10369110107422, -28.062969207763672, -27.022249221801758, -25.981529235839844, -24.940807342529297, -23.90008544921875, -22.859365463256836, -21.818645477294922, -20.777923583984375, -19.737201690673828, -18.696481704711914, -17.65576171875, -16.615039825439453, -15.574318885803223, -14.533597946166992, -13.492877006530762, -12.452156066894531, -11.4114351272583, -10.37071418762207, -9.32999324798584, -8.28927230834961, -7.248551368713379, -6.207830429077148, -5.167109489440918, -4.1263885498046875, -3.085667610168457, -2.0449466705322266, -1.004225730895996, 0.0364990234375, 1.0772199630737305, 2.117940902709961, 3.1586618423461914, 4.199382781982422, 5.240103721618652, 6.280824661254883, 7.321545600891113, 8.362266540527344, 9.402987480163574, 10.443708419799805, 11.484429359436035, 12.525150299072266, 13.565871238708496, 14.606592178344727, 15.647313117980957, 16.688034057617188, 17.728755950927734, 18.76947593688965, 19.810195922851562, 20.85091781616211, 21.891639709472656, 22.93235969543457, 23.973079681396484, 25.01380157470703, 26.054523468017578, 27.095243453979492, 28.135963439941406, 29.176685333251953, 30.2174072265625, 31.258127212524414, 32.29884719848633, 33.339569091796875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 5.0, 10.0, 11.0, 8.0, 14.0, 25.0, 17.0, 28.0, 37.0, 29.0, 31.0, 42.0, 33.0, 53.0, 33.0, 51.0, 44.0, 35.0, 67.0, 36.0, 42.0, 38.0, 38.0, 39.0, 33.0, 41.0, 26.0, 23.0, 22.0, 16.0, 20.0, 11.0, 8.0, 7.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-3.91015625, -3.799530029296875, -3.68890380859375, -3.578277587890625, -3.4676513671875, -3.357025146484375, -3.24639892578125, -3.135772705078125, -3.025146484375, -2.914520263671875, -2.80389404296875, -2.693267822265625, -2.5826416015625, -2.472015380859375, -2.36138916015625, -2.250762939453125, -2.14013671875, -2.029510498046875, -1.91888427734375, -1.808258056640625, -1.6976318359375, -1.587005615234375, -1.47637939453125, -1.365753173828125, -1.255126953125, -1.144500732421875, -1.03387451171875, -0.923248291015625, -0.8126220703125, -0.701995849609375, -0.59136962890625, -0.480743408203125, -0.3701171875, -0.259490966796875, -0.14886474609375, -0.038238525390625, 0.0723876953125, 0.183013916015625, 0.29364013671875, 0.404266357421875, 0.514892578125, 0.625518798828125, 0.73614501953125, 0.846771240234375, 0.9573974609375, 1.068023681640625, 1.17864990234375, 1.289276123046875, 1.39990234375, 1.510528564453125, 1.62115478515625, 1.731781005859375, 1.8424072265625, 1.953033447265625, 2.06365966796875, 2.174285888671875, 2.284912109375, 2.395538330078125, 2.50616455078125, 2.616790771484375, 2.7274169921875, 2.838043212890625, 2.94866943359375, 3.059295654296875, 3.169921875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 11.0, 11.0, 17.0, 21.0, 19.0, 36.0, 65.0, 117.0, 194.0, 362.0, 644.0, 1211.0, 2643.0, 6008.0, 13914.0, 34869.0, 88884.0, 242018.0, 661437.0, 1284686.0, 1097669.0, 477414.0, 173240.0, 64876.0, 25094.0, 10370.0, 4417.0, 1992.0, 931.0, 471.0, 226.0, 161.0, 89.0, 62.0, 39.0, 27.0, 14.0, 10.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.958984375, -3.841949462890625, -3.72491455078125, -3.607879638671875, -3.4908447265625, -3.373809814453125, -3.25677490234375, -3.139739990234375, -3.022705078125, -2.905670166015625, -2.78863525390625, -2.671600341796875, -2.5545654296875, -2.437530517578125, -2.32049560546875, -2.203460693359375, -2.08642578125, -1.969390869140625, -1.85235595703125, -1.735321044921875, -1.6182861328125, -1.501251220703125, -1.38421630859375, -1.267181396484375, -1.150146484375, -1.033111572265625, -0.91607666015625, -0.799041748046875, -0.6820068359375, -0.564971923828125, -0.44793701171875, -0.330902099609375, -0.2138671875, -0.096832275390625, 0.02020263671875, 0.137237548828125, 0.2542724609375, 0.371307373046875, 0.48834228515625, 0.605377197265625, 0.722412109375, 0.839447021484375, 0.95648193359375, 1.073516845703125, 1.1905517578125, 1.307586669921875, 1.42462158203125, 1.541656494140625, 1.65869140625, 1.775726318359375, 1.89276123046875, 2.009796142578125, 2.1268310546875, 2.243865966796875, 2.36090087890625, 2.477935791015625, 2.594970703125, 2.712005615234375, 2.82904052734375, 2.946075439453125, 3.0631103515625, 3.180145263671875, 3.29718017578125, 3.414215087890625, 3.53125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 3.0, 10.0, 6.0, 3.0, 9.0, 16.0, 15.0, 29.0, 45.0, 53.0, 70.0, 96.0, 145.0, 183.0, 244.0, 289.0, 396.0, 419.0, 412.0, 386.0, 284.0, 246.0, 191.0, 134.0, 105.0, 81.0, 55.0, 38.0, 31.0, 28.0, 18.0, 9.0, 5.0, 7.0, 7.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 3.0], "bins": [-8.2265625, -8.01544189453125, -7.8043212890625, -7.59320068359375, -7.382080078125, -7.17095947265625, -6.9598388671875, -6.74871826171875, -6.53759765625, -6.32647705078125, -6.1153564453125, -5.90423583984375, -5.693115234375, -5.48199462890625, -5.2708740234375, -5.05975341796875, -4.8486328125, -4.63751220703125, -4.4263916015625, -4.21527099609375, -4.004150390625, -3.79302978515625, -3.5819091796875, -3.37078857421875, -3.15966796875, -2.94854736328125, -2.7374267578125, -2.52630615234375, -2.315185546875, -2.10406494140625, -1.8929443359375, -1.68182373046875, -1.470703125, -1.25958251953125, -1.0484619140625, -0.83734130859375, -0.626220703125, -0.41510009765625, -0.2039794921875, 0.00714111328125, 0.21826171875, 0.42938232421875, 0.6405029296875, 0.85162353515625, 1.062744140625, 1.27386474609375, 1.4849853515625, 1.69610595703125, 1.9072265625, 2.11834716796875, 2.3294677734375, 2.54058837890625, 2.751708984375, 2.96282958984375, 3.1739501953125, 3.38507080078125, 3.59619140625, 3.80731201171875, 4.0184326171875, 4.22955322265625, 4.440673828125, 4.65179443359375, 4.8629150390625, 5.07403564453125, 5.28515625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 11.0, 8.0, 7.0, 26.0, 36.0, 43.0, 67.0, 113.0, 143.0, 224.0, 429.0, 1040.0, 4070.0, 29997.0, 303611.0, 2414840.0, 1297416.0, 124667.0, 13654.0, 2239.0, 710.0, 351.0, 192.0, 123.0, 89.0, 61.0, 32.0, 24.0, 12.0, 13.0, 9.0, 9.0, 6.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3828125, -8.98876953125, -8.5947265625, -8.20068359375, -7.806640625, -7.41259765625, -7.0185546875, -6.62451171875, -6.23046875, -5.83642578125, -5.4423828125, -5.04833984375, -4.654296875, -4.26025390625, -3.8662109375, -3.47216796875, -3.078125, -2.68408203125, -2.2900390625, -1.89599609375, -1.501953125, -1.10791015625, -0.7138671875, -0.31982421875, 0.07421875, 0.46826171875, 0.8623046875, 1.25634765625, 1.650390625, 2.04443359375, 2.4384765625, 2.83251953125, 3.2265625, 3.62060546875, 4.0146484375, 4.40869140625, 4.802734375, 5.19677734375, 5.5908203125, 5.98486328125, 6.37890625, 6.77294921875, 7.1669921875, 7.56103515625, 7.955078125, 8.34912109375, 8.7431640625, 9.13720703125, 9.53125, 9.92529296875, 10.3193359375, 10.71337890625, 11.107421875, 11.50146484375, 11.8955078125, 12.28955078125, 12.68359375, 13.07763671875, 13.4716796875, 13.86572265625, 14.259765625, 14.65380859375, 15.0478515625, 15.44189453125, 15.8359375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 7.0, 21.0, 29.0, 54.0, 88.0, 102.0, 114.0, 116.0, 138.0, 102.0, 80.0, 71.0, 39.0, 21.0, 14.0, 8.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.63648986816406, -58.26636505126953, -56.896240234375, -55.52611541748047, -54.15598678588867, -52.78586196899414, -51.41573715209961, -50.04561233520508, -48.67548751831055, -47.305362701416016, -45.935237884521484, -44.56510925292969, -43.194984436035156, -41.824859619140625, -40.454734802246094, -39.08460998535156, -37.71448516845703, -36.3443603515625, -34.97423553466797, -33.60411071777344, -32.23398208618164, -30.86385726928711, -29.493732452392578, -28.123607635498047, -26.75347900390625, -25.38335418701172, -24.013227462768555, -22.643102645874023, -21.272977828979492, -19.902851104736328, -18.532726287841797, -17.162601470947266, -15.792478561401367, -14.42235279083252, -13.052227973937988, -11.68210220336914, -10.31197738647461, -8.941851615905762, -7.571725845336914, -6.201601028442383, -4.831475257873535, -3.4613499641418457, -2.091224431991577, -0.7210988998413086, 0.6490263938903809, 2.0191516876220703, 3.389277458190918, 4.759402275085449, 6.129528045654297, 7.499653339385986, 8.869778633117676, 10.239904403686523, 11.610029220581055, 12.980154991149902, 14.35028076171875, 15.720405578613281, 17.090530395507812, 18.460655212402344, 19.830781936645508, 21.20090675354004, 22.57103157043457, 23.941158294677734, 25.311283111572266, 26.681407928466797, 28.05153465270996]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 2.0, 8.0, 4.0, 4.0, 7.0, 13.0, 10.0, 9.0, 21.0, 17.0, 14.0, 23.0, 27.0, 13.0, 24.0, 26.0, 33.0, 33.0, 27.0, 29.0, 39.0, 42.0, 39.0, 37.0, 32.0, 47.0, 41.0, 31.0, 28.0, 28.0, 38.0, 27.0, 29.0, 27.0, 26.0, 17.0, 26.0, 13.0, 15.0, 12.0, 15.0, 11.0, 10.0, 10.0, 3.0, 7.0, 3.0, 2.0, 5.0, 1.0, 2.0, 1.0, 4.0], "bins": [-22.758737564086914, -22.10589599609375, -21.45305633544922, -20.800214767456055, -20.147375106811523, -19.49453353881836, -18.841693878173828, -18.188852310180664, -17.5360107421875, -16.883169174194336, -16.230329513549805, -15.577488899230957, -14.92464828491211, -14.271806716918945, -13.618966102600098, -12.96612548828125, -12.313285827636719, -11.660445213317871, -11.007604598999023, -10.354763984680176, -9.701923370361328, -9.049081802368164, -8.396241188049316, -7.743400573730469, -7.090559959411621, -6.437719345092773, -5.784878730773926, -5.13203763961792, -4.479197025299072, -3.8263564109802246, -3.173515558242798, -2.520674705505371, -1.8678359985351562, -1.214995265007019, -0.5621545314788818, 0.09068620204925537, 0.7435269355773926, 1.3963675498962402, 2.049208402633667, 2.7020492553710938, 3.3548898696899414, 4.007730484008789, 4.660571098327637, 5.313412189483643, 5.96625280380249, 6.619093418121338, 7.271934509277344, 7.924775123596191, 8.577615737915039, 9.230456352233887, 9.883296966552734, 10.536137580871582, 11.18897819519043, 11.841819763183594, 12.494660377502441, 13.147500991821289, 13.800341606140137, 14.453182220458984, 15.106022834777832, 15.75886344909668, 16.411705017089844, 17.064544677734375, 17.71738624572754, 18.370227813720703, 19.023067474365234]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 2.0, 10.0, 5.0, 10.0, 10.0, 18.0, 15.0, 17.0, 22.0, 31.0, 34.0, 26.0, 41.0, 24.0, 30.0, 41.0, 34.0, 40.0, 43.0, 55.0, 43.0, 35.0, 40.0, 34.0, 35.0, 47.0, 51.0, 28.0, 27.0, 33.0, 17.0, 19.0, 16.0, 17.0, 7.0, 12.0, 7.0, 3.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.23046875, -3.1287841796875, -3.027099609375, -2.9254150390625, -2.82373046875, -2.7220458984375, -2.620361328125, -2.5186767578125, -2.4169921875, -2.3153076171875, -2.213623046875, -2.1119384765625, -2.01025390625, -1.9085693359375, -1.806884765625, -1.7052001953125, -1.603515625, -1.5018310546875, -1.400146484375, -1.2984619140625, -1.19677734375, -1.0950927734375, -0.993408203125, -0.8917236328125, -0.7900390625, -0.6883544921875, -0.586669921875, -0.4849853515625, -0.38330078125, -0.2816162109375, -0.179931640625, -0.0782470703125, 0.0234375, 0.1251220703125, 0.226806640625, 0.3284912109375, 0.43017578125, 0.5318603515625, 0.633544921875, 0.7352294921875, 0.8369140625, 0.9385986328125, 1.040283203125, 1.1419677734375, 1.24365234375, 1.3453369140625, 1.447021484375, 1.5487060546875, 1.650390625, 1.7520751953125, 1.853759765625, 1.9554443359375, 2.05712890625, 2.1588134765625, 2.260498046875, 2.3621826171875, 2.4638671875, 2.5655517578125, 2.667236328125, 2.7689208984375, 2.87060546875, 2.9722900390625, 3.073974609375, 3.1756591796875, 3.27734375]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 7.0, 23.0, 30.0, 59.0, 96.0, 121.0, 197.0, 388.0, 620.0, 995.0, 1774.0, 2845.0, 4751.0, 7293.0, 11209.0, 16675.0, 24187.0, 34202.0, 46298.0, 59775.0, 73977.0, 86332.0, 96017.0, 100105.0, 96990.0, 88356.0, 75353.0, 61527.0, 47953.0, 35390.0, 25233.0, 17571.0, 11763.0, 7749.0, 4938.0, 2977.0, 1916.0, 1183.0, 705.0, 378.0, 230.0, 146.0, 73.0, 62.0, 34.0, 11.0, 13.0, 13.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.2333984375, -1.1943206787109375, -1.155242919921875, -1.1161651611328125, -1.07708740234375, -1.0380096435546875, -0.998931884765625, -0.9598541259765625, -0.9207763671875, -0.8816986083984375, -0.842620849609375, -0.8035430908203125, -0.76446533203125, -0.7253875732421875, -0.686309814453125, -0.6472320556640625, -0.608154296875, -0.5690765380859375, -0.529998779296875, -0.4909210205078125, -0.45184326171875, -0.4127655029296875, -0.373687744140625, -0.3346099853515625, -0.2955322265625, -0.2564544677734375, -0.217376708984375, -0.1782989501953125, -0.13922119140625, -0.1001434326171875, -0.061065673828125, -0.0219879150390625, 0.01708984375, 0.0561676025390625, 0.095245361328125, 0.1343231201171875, 0.17340087890625, 0.2124786376953125, 0.251556396484375, 0.2906341552734375, 0.3297119140625, 0.3687896728515625, 0.407867431640625, 0.4469451904296875, 0.48602294921875, 0.5251007080078125, 0.564178466796875, 0.6032562255859375, 0.642333984375, 0.6814117431640625, 0.720489501953125, 0.7595672607421875, 0.79864501953125, 0.8377227783203125, 0.876800537109375, 0.9158782958984375, 0.9549560546875, 0.9940338134765625, 1.033111572265625, 1.0721893310546875, 1.11126708984375, 1.1503448486328125, 1.189422607421875, 1.2285003662109375, 1.267578125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 8.0, 8.0, 5.0, 10.0, 13.0, 12.0, 16.0, 14.0, 16.0, 16.0, 24.0, 25.0, 30.0, 21.0, 33.0, 35.0, 32.0, 24.0, 54.0, 49.0, 1073.0, 38.0, 36.0, 44.0, 45.0, 41.0, 39.0, 38.0, 28.0, 28.0, 35.0, 19.0, 17.0, 22.0, 12.0, 12.0, 7.0, 7.0, 8.0, 9.0, 9.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.26171875, -3.16259765625, -3.0634765625, -2.96435546875, -2.865234375, -2.76611328125, -2.6669921875, -2.56787109375, -2.46875, -2.36962890625, -2.2705078125, -2.17138671875, -2.072265625, -1.97314453125, -1.8740234375, -1.77490234375, -1.67578125, -1.57666015625, -1.4775390625, -1.37841796875, -1.279296875, -1.18017578125, -1.0810546875, -0.98193359375, -0.8828125, -0.78369140625, -0.6845703125, -0.58544921875, -0.486328125, -0.38720703125, -0.2880859375, -0.18896484375, -0.08984375, 0.00927734375, 0.1083984375, 0.20751953125, 0.306640625, 0.40576171875, 0.5048828125, 0.60400390625, 0.703125, 0.80224609375, 0.9013671875, 1.00048828125, 1.099609375, 1.19873046875, 1.2978515625, 1.39697265625, 1.49609375, 1.59521484375, 1.6943359375, 1.79345703125, 1.892578125, 1.99169921875, 2.0908203125, 2.18994140625, 2.2890625, 2.38818359375, 2.4873046875, 2.58642578125, 2.685546875, 2.78466796875, 2.8837890625, 2.98291015625, 3.08203125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 5.0, 10.0, 25.0, 32.0, 34.0, 68.0, 128.0, 200.0, 261.0, 445.0, 680.0, 1048.0, 1582.0, 2432.0, 3664.0, 5550.0, 8192.0, 12596.0, 19788.0, 39805.0, 1161359.0, 743649.0, 39072.0, 19723.0, 12591.0, 8285.0, 5353.0, 3570.0, 2357.0, 1681.0, 1064.0, 646.0, 465.0, 292.0, 171.0, 104.0, 74.0, 52.0, 32.0, 19.0, 11.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.623046875, -3.522369384765625, -3.42169189453125, -3.321014404296875, -3.2203369140625, -3.119659423828125, -3.01898193359375, -2.918304443359375, -2.817626953125, -2.716949462890625, -2.61627197265625, -2.515594482421875, -2.4149169921875, -2.314239501953125, -2.21356201171875, -2.112884521484375, -2.01220703125, -1.911529541015625, -1.81085205078125, -1.710174560546875, -1.6094970703125, -1.508819580078125, -1.40814208984375, -1.307464599609375, -1.206787109375, -1.106109619140625, -1.00543212890625, -0.904754638671875, -0.8040771484375, -0.703399658203125, -0.60272216796875, -0.502044677734375, -0.4013671875, -0.300689697265625, -0.20001220703125, -0.099334716796875, 0.0013427734375, 0.102020263671875, 0.20269775390625, 0.303375244140625, 0.404052734375, 0.504730224609375, 0.60540771484375, 0.706085205078125, 0.8067626953125, 0.907440185546875, 1.00811767578125, 1.108795166015625, 1.20947265625, 1.310150146484375, 1.41082763671875, 1.511505126953125, 1.6121826171875, 1.712860107421875, 1.81353759765625, 1.914215087890625, 2.014892578125, 2.115570068359375, 2.21624755859375, 2.316925048828125, 2.4176025390625, 2.518280029296875, 2.61895751953125, 2.719635009765625, 2.8203125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 9.0, 6.0, 7.0, 10.0, 6.0, 19.0, 16.0, 14.0, 22.0, 17.0, 28.0, 39.0, 40.0, 35.0, 41.0, 42.0, 34.0, 37.0, 49.0, 49.0, 45.0, 56.0, 41.0, 43.0, 32.0, 42.0, 40.0, 30.0, 21.0, 21.0, 18.0, 18.0, 15.0, 9.0, 12.0, 9.0, 8.0, 11.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2015380859375, -0.19552040100097656, -0.18950271606445312, -0.1834850311279297, -0.17746734619140625, -0.1714496612548828, -0.16543197631835938, -0.15941429138183594, -0.1533966064453125, -0.14737892150878906, -0.14136123657226562, -0.1353435516357422, -0.12932586669921875, -0.12330818176269531, -0.11729049682617188, -0.11127281188964844, -0.105255126953125, -0.09923744201660156, -0.09321975708007812, -0.08720207214355469, -0.08118438720703125, -0.07516670227050781, -0.06914901733398438, -0.06313133239746094, -0.0571136474609375, -0.05109596252441406, -0.045078277587890625, -0.03906059265136719, -0.03304290771484375, -0.027025222778320312, -0.021007537841796875, -0.014989852905273438, -0.00897216796875, -0.0029544830322265625, 0.003063201904296875, 0.009080886840820312, 0.01509857177734375, 0.021116256713867188, 0.027133941650390625, 0.03315162658691406, 0.0391693115234375, 0.04518699645996094, 0.051204681396484375, 0.05722236633300781, 0.06324005126953125, 0.06925773620605469, 0.07527542114257812, 0.08129310607910156, 0.087310791015625, 0.09332847595214844, 0.09934616088867188, 0.10536384582519531, 0.11138153076171875, 0.11739921569824219, 0.12341690063476562, 0.12943458557128906, 0.1354522705078125, 0.14146995544433594, 0.14748764038085938, 0.1535053253173828, 0.15952301025390625, 0.1655406951904297, 0.17155838012695312, 0.17757606506347656, 0.18359375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 8.0, 12.0, 11.0, 10.0, 8.0, 19.0, 21.0, 32.0, 33.0, 41.0, 87.0, 132.0, 179.0, 293.0, 531.0, 1143.0, 14446.0, 1010382.0, 18497.0, 1197.0, 543.0, 277.0, 193.0, 137.0, 83.0, 49.0, 46.0, 25.0, 27.0, 12.0, 19.0, 9.0, 5.0, 14.0, 4.0, 6.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.427734375, -3.3154296875, -3.203125, -3.0908203125, -2.978515625, -2.8662109375, -2.75390625, -2.6416015625, -2.529296875, -2.4169921875, -2.3046875, -2.1923828125, -2.080078125, -1.9677734375, -1.85546875, -1.7431640625, -1.630859375, -1.5185546875, -1.40625, -1.2939453125, -1.181640625, -1.0693359375, -0.95703125, -0.8447265625, -0.732421875, -0.6201171875, -0.5078125, -0.3955078125, -0.283203125, -0.1708984375, -0.05859375, 0.0537109375, 0.166015625, 0.2783203125, 0.390625, 0.5029296875, 0.615234375, 0.7275390625, 0.83984375, 0.9521484375, 1.064453125, 1.1767578125, 1.2890625, 1.4013671875, 1.513671875, 1.6259765625, 1.73828125, 1.8505859375, 1.962890625, 2.0751953125, 2.1875, 2.2998046875, 2.412109375, 2.5244140625, 2.63671875, 2.7490234375, 2.861328125, 2.9736328125, 3.0859375, 3.1982421875, 3.310546875, 3.4228515625, 3.53515625, 3.6474609375, 3.759765625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 8.0, 14.0, 102.0, 533.0, 301.0, 40.0, 12.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.786763191223145, -9.577709197998047, -9.36865520477295, -9.159601211547852, -8.950547218322754, -8.741493225097656, -8.532439231872559, -8.323385238647461, -8.114331245422363, -7.905277252197266, -7.696223258972168, -7.48716926574707, -7.278115272521973, -7.069061279296875, -6.860007286071777, -6.65095329284668, -6.441899299621582, -6.232845306396484, -6.023791313171387, -5.814737319946289, -5.605683326721191, -5.396629333496094, -5.187575340270996, -4.978521347045898, -4.769467830657959, -4.560413837432861, -4.351359844207764, -4.142305850982666, -3.9332518577575684, -3.7241978645324707, -3.515143871307373, -3.3060898780822754, -3.0970356464385986, -2.887981653213501, -2.6789276599884033, -2.4698736667633057, -2.260819673538208, -2.0517659187316895, -1.8427118062973022, -1.6336578130722046, -1.424603819847107, -1.2155498266220093, -1.0064958333969116, -0.7974418997764587, -0.5883879065513611, -0.3793339729309082, -0.17027997970581055, 0.03877401351928711, 0.24782800674438477, 0.4568819999694824, 0.6659359931945801, 0.874989926815033, 1.0840439796447754, 1.2930978536605835, 1.5021518468856812, 1.7112058401107788, 1.9202598333358765, 2.1293137073516846, 2.3383677005767822, 2.54742169380188, 2.7564756870269775, 2.965529680252075, 3.174583673477173, 3.3836376667022705, 3.592691659927368]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 8.0, 4.0, 19.0, 5.0, 19.0, 14.0, 18.0, 30.0, 29.0, 41.0, 31.0, 38.0, 27.0, 39.0, 38.0, 65.0, 49.0, 46.0, 41.0, 44.0, 41.0, 38.0, 41.0, 32.0, 37.0, 27.0, 21.0, 30.0, 22.0, 23.0, 23.0, 12.0, 11.0, 12.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3281090259552002, -1.278219223022461, -1.2283294200897217, -1.1784396171569824, -1.1285498142242432, -1.0786598920822144, -1.028770089149475, -0.9788802862167358, -0.9289904832839966, -0.8791006803512573, -0.8292108774185181, -0.779321014881134, -0.7294312119483948, -0.6795414090156555, -0.6296515464782715, -0.5797617435455322, -0.529871940612793, -0.4799821376800537, -0.43009230494499207, -0.3802024722099304, -0.33031266927719116, -0.2804228663444519, -0.23053303360939026, -0.1806432008743286, -0.13075339794158936, -0.0808635801076889, -0.030973762273788452, 0.018916055560112, 0.06880587339401245, 0.1186956912279129, 0.16858550906181335, 0.218475341796875, 0.26836514472961426, 0.3182549476623535, 0.36814478039741516, 0.4180346131324768, 0.46792441606521606, 0.5178142189979553, 0.5677040815353394, 0.6175938844680786, 0.6674836874008179, 0.7173734903335571, 0.7672632932662964, 0.8171531558036804, 0.8670429587364197, 0.9169327616691589, 0.966822624206543, 1.0167124271392822, 1.0666022300720215, 1.1164920330047607, 1.1663818359375, 1.2162716388702393, 1.2661614418029785, 1.3160513639450073, 1.3659411668777466, 1.4158309698104858, 1.465720772743225, 1.5156105756759644, 1.5655003786087036, 1.6153901815414429, 1.6652801036834717, 1.715169906616211, 1.7650597095489502, 1.8149495124816895, 1.8648393154144287]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 1.0, 10.0, 4.0, 8.0, 6.0, 15.0, 25.0, 19.0, 22.0, 22.0, 28.0, 32.0, 29.0, 33.0, 37.0, 42.0, 33.0, 43.0, 37.0, 36.0, 48.0, 38.0, 41.0, 39.0, 46.0, 36.0, 43.0, 28.0, 31.0, 23.0, 25.0, 24.0, 18.0, 14.0, 16.0, 14.0, 7.0, 9.0, 6.0, 4.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.388671875, -3.286468505859375, -3.18426513671875, -3.082061767578125, -2.9798583984375, -2.877655029296875, -2.77545166015625, -2.673248291015625, -2.571044921875, -2.468841552734375, -2.36663818359375, -2.264434814453125, -2.1622314453125, -2.060028076171875, -1.95782470703125, -1.855621337890625, -1.75341796875, -1.651214599609375, -1.54901123046875, -1.446807861328125, -1.3446044921875, -1.242401123046875, -1.14019775390625, -1.037994384765625, -0.935791015625, -0.833587646484375, -0.73138427734375, -0.629180908203125, -0.5269775390625, -0.424774169921875, -0.32257080078125, -0.220367431640625, -0.1181640625, -0.015960693359375, 0.08624267578125, 0.188446044921875, 0.2906494140625, 0.392852783203125, 0.49505615234375, 0.597259521484375, 0.699462890625, 0.801666259765625, 0.90386962890625, 1.006072998046875, 1.1082763671875, 1.210479736328125, 1.31268310546875, 1.414886474609375, 1.51708984375, 1.619293212890625, 1.72149658203125, 1.823699951171875, 1.9259033203125, 2.028106689453125, 2.13031005859375, 2.232513427734375, 2.334716796875, 2.436920166015625, 2.53912353515625, 2.641326904296875, 2.7435302734375, 2.845733642578125, 2.94793701171875, 3.050140380859375, 3.15234375]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 8.0, 4.0, 13.0, 9.0, 29.0, 44.0, 60.0, 103.0, 159.0, 277.0, 418.0, 654.0, 1256.0, 2034.0, 3394.0, 5817.0, 10033.0, 17217.0, 28692.0, 47679.0, 79295.0, 135482.0, 220531.0, 200472.0, 119993.0, 70193.0, 42654.0, 24962.0, 15508.0, 8966.0, 5209.0, 2988.0, 1830.0, 1015.0, 628.0, 345.0, 235.0, 123.0, 81.0, 64.0, 37.0, 28.0, 10.0, 6.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.015625, -2.923919677734375, -2.83221435546875, -2.740509033203125, -2.6488037109375, -2.557098388671875, -2.46539306640625, -2.373687744140625, -2.281982421875, -2.190277099609375, -2.09857177734375, -2.006866455078125, -1.9151611328125, -1.823455810546875, -1.73175048828125, -1.640045166015625, -1.54833984375, -1.456634521484375, -1.36492919921875, -1.273223876953125, -1.1815185546875, -1.089813232421875, -0.99810791015625, -0.906402587890625, -0.814697265625, -0.722991943359375, -0.63128662109375, -0.539581298828125, -0.4478759765625, -0.356170654296875, -0.26446533203125, -0.172760009765625, -0.0810546875, 0.010650634765625, 0.10235595703125, 0.194061279296875, 0.2857666015625, 0.377471923828125, 0.46917724609375, 0.560882568359375, 0.652587890625, 0.744293212890625, 0.83599853515625, 0.927703857421875, 1.0194091796875, 1.111114501953125, 1.20281982421875, 1.294525146484375, 1.38623046875, 1.477935791015625, 1.56964111328125, 1.661346435546875, 1.7530517578125, 1.844757080078125, 1.93646240234375, 2.028167724609375, 2.119873046875, 2.211578369140625, 2.30328369140625, 2.394989013671875, 2.4866943359375, 2.578399658203125, 2.67010498046875, 2.761810302734375, 2.853515625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 4.0, 11.0, 3.0, 11.0, 7.0, 9.0, 21.0, 23.0, 27.0, 29.0, 30.0, 37.0, 43.0, 49.0, 70.0, 95.0, 165.0, 288.0, 1366.0, 199.0, 108.0, 70.0, 67.0, 46.0, 48.0, 40.0, 33.0, 28.0, 26.0, 17.0, 15.0, 15.0, 9.0, 9.0, 10.0, 7.0, 4.0, 1.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-14.8828125, -14.4715576171875, -14.060302734375, -13.6490478515625, -13.23779296875, -12.8265380859375, -12.415283203125, -12.0040283203125, -11.5927734375, -11.1815185546875, -10.770263671875, -10.3590087890625, -9.94775390625, -9.5364990234375, -9.125244140625, -8.7139892578125, -8.302734375, -7.8914794921875, -7.480224609375, -7.0689697265625, -6.65771484375, -6.2464599609375, -5.835205078125, -5.4239501953125, -5.0126953125, -4.6014404296875, -4.190185546875, -3.7789306640625, -3.36767578125, -2.9564208984375, -2.545166015625, -2.1339111328125, -1.72265625, -1.3114013671875, -0.900146484375, -0.4888916015625, -0.07763671875, 0.3336181640625, 0.744873046875, 1.1561279296875, 1.5673828125, 1.9786376953125, 2.389892578125, 2.8011474609375, 3.21240234375, 3.6236572265625, 4.034912109375, 4.4461669921875, 4.857421875, 5.2686767578125, 5.679931640625, 6.0911865234375, 6.50244140625, 6.9136962890625, 7.324951171875, 7.7362060546875, 8.1474609375, 8.5587158203125, 8.969970703125, 9.3812255859375, 9.79248046875, 10.2037353515625, 10.614990234375, 11.0262451171875, 11.4375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 8.0, 16.0, 20.0, 45.0, 50.0, 65.0, 126.0, 191.0, 354.0, 776.0, 3352.0, 676463.0, 2456230.0, 6099.0, 954.0, 390.0, 218.0, 128.0, 76.0, 48.0, 31.0, 27.0, 13.0, 9.0, 6.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.59375, -36.4580078125, -35.322265625, -34.1865234375, -33.05078125, -31.9150390625, -30.779296875, -29.6435546875, -28.5078125, -27.3720703125, -26.236328125, -25.1005859375, -23.96484375, -22.8291015625, -21.693359375, -20.5576171875, -19.421875, -18.2861328125, -17.150390625, -16.0146484375, -14.87890625, -13.7431640625, -12.607421875, -11.4716796875, -10.3359375, -9.2001953125, -8.064453125, -6.9287109375, -5.79296875, -4.6572265625, -3.521484375, -2.3857421875, -1.25, -0.1142578125, 1.021484375, 2.1572265625, 3.29296875, 4.4287109375, 5.564453125, 6.7001953125, 7.8359375, 8.9716796875, 10.107421875, 11.2431640625, 12.37890625, 13.5146484375, 14.650390625, 15.7861328125, 16.921875, 18.0576171875, 19.193359375, 20.3291015625, 21.46484375, 22.6005859375, 23.736328125, 24.8720703125, 26.0078125, 27.1435546875, 28.279296875, 29.4150390625, 30.55078125, 31.6865234375, 32.822265625, 33.9580078125, 35.09375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [3.0, 172.0, 839.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.939653396606445, -13.78732967376709, -2.6350059509277344, 8.517316818237305, 19.669641494750977, 30.82196617126465, 41.97428894042969, 53.126617431640625, 64.27893829345703, 75.43125915527344, 86.58358764648438, 97.73590850830078, 108.88822937011719, 120.04055786132812, 131.19287109375, 142.34521484375, 153.49752807617188, 164.6498565673828, 175.8021697998047, 186.95449829101562, 198.10682678222656, 209.2591552734375, 220.41146850585938, 231.5637969970703, 242.7161102294922, 253.86843872070312, 265.020751953125, 276.173095703125, 287.3254089355469, 298.47772216796875, 309.63006591796875, 320.7823791503906, 331.9347229003906, 343.0870361328125, 354.2393798828125, 365.3916931152344, 376.54400634765625, 387.69635009765625, 398.8486633300781, 410.0009765625, 421.1533203125, 432.3056335449219, 443.4579772949219, 454.61029052734375, 465.7626037597656, 476.9149475097656, 488.0672607421875, 499.2196044921875, 510.37188720703125, 521.5242309570312, 532.676513671875, 543.828857421875, 554.981201171875, 566.1334838867188, 577.2858276367188, 588.4381713867188, 599.5905151367188, 610.7428588867188, 621.8951416015625, 633.0474853515625, 644.1998291015625, 655.3521118164062, 666.5044555664062, 677.6567993164062, 688.80908203125]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 3.0, 6.0, 10.0, 8.0, 12.0, 6.0, 12.0, 12.0, 14.0, 17.0, 28.0, 21.0, 31.0, 34.0, 25.0, 33.0, 36.0, 37.0, 37.0, 38.0, 43.0, 39.0, 37.0, 29.0, 44.0, 36.0, 17.0, 37.0, 33.0, 28.0, 35.0, 31.0, 19.0, 28.0, 21.0, 18.0, 16.0, 11.0, 13.0, 4.0, 10.0, 6.0, 5.0, 5.0, 4.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-30.078533172607422, -29.210237503051758, -28.341941833496094, -27.47364616394043, -26.605350494384766, -25.7370548248291, -24.868759155273438, -24.000463485717773, -23.13216781616211, -22.263872146606445, -21.39557647705078, -20.527280807495117, -19.658985137939453, -18.79068946838379, -17.922393798828125, -17.05409812927246, -16.185802459716797, -15.317506790161133, -14.449211120605469, -13.580915451049805, -12.71261978149414, -11.844324111938477, -10.976028442382812, -10.107732772827148, -9.239435195922852, -8.371139526367188, -7.502843856811523, -6.634548187255859, -5.766252517700195, -4.897956371307373, -4.029660701751709, -3.161365032196045, -2.293069839477539, -1.424774169921875, -0.5564783811569214, 0.3118174076080322, 1.1801130771636963, 2.0484089851379395, 2.9167046546936035, 3.7850003242492676, 4.653295993804932, 5.521591663360596, 6.38988733291626, 7.258183479309082, 8.126479148864746, 8.99477481842041, 9.863070487976074, 10.731366157531738, 11.599661827087402, 12.467957496643066, 13.33625316619873, 14.204548835754395, 15.072844505310059, 15.941141128540039, 16.809436798095703, 17.677732467651367, 18.54602813720703, 19.414323806762695, 20.28261947631836, 21.150915145874023, 22.019210815429688, 22.88750648498535, 23.755802154541016, 24.62409782409668, 25.492393493652344]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 10.0, 9.0, 24.0, 11.0, 21.0, 28.0, 18.0, 24.0, 43.0, 31.0, 38.0, 39.0, 20.0, 52.0, 35.0, 40.0, 54.0, 53.0, 41.0, 47.0, 47.0, 36.0, 42.0, 36.0, 40.0, 33.0, 16.0, 17.0, 22.0, 13.0, 15.0, 13.0, 10.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.798828125, -3.678924560546875, -3.55902099609375, -3.439117431640625, -3.3192138671875, -3.199310302734375, -3.07940673828125, -2.959503173828125, -2.839599609375, -2.719696044921875, -2.59979248046875, -2.479888916015625, -2.3599853515625, -2.240081787109375, -2.12017822265625, -2.000274658203125, -1.88037109375, -1.760467529296875, -1.64056396484375, -1.520660400390625, -1.4007568359375, -1.280853271484375, -1.16094970703125, -1.041046142578125, -0.921142578125, -0.801239013671875, -0.68133544921875, -0.561431884765625, -0.4415283203125, -0.321624755859375, -0.20172119140625, -0.081817626953125, 0.0380859375, 0.157989501953125, 0.27789306640625, 0.397796630859375, 0.5177001953125, 0.637603759765625, 0.75750732421875, 0.877410888671875, 0.997314453125, 1.117218017578125, 1.23712158203125, 1.357025146484375, 1.4769287109375, 1.596832275390625, 1.71673583984375, 1.836639404296875, 1.95654296875, 2.076446533203125, 2.19635009765625, 2.316253662109375, 2.4361572265625, 2.556060791015625, 2.67596435546875, 2.795867919921875, 2.915771484375, 3.035675048828125, 3.15557861328125, 3.275482177734375, 3.3953857421875, 3.515289306640625, 3.63519287109375, 3.755096435546875, 3.875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 3.0, 7.0, 7.0, 8.0, 7.0, 13.0, 18.0, 16.0, 19.0, 27.0, 32.0, 54.0, 62.0, 94.0, 194.0, 551.0, 2623.0, 15792.0, 121524.0, 1080785.0, 2430620.0, 476184.0, 55541.0, 7780.0, 1487.0, 385.0, 145.0, 66.0, 47.0, 34.0, 31.0, 28.0, 29.0, 21.0, 14.0, 8.0, 6.0, 10.0, 5.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.625, -9.3524169921875, -9.079833984375, -8.8072509765625, -8.53466796875, -8.2620849609375, -7.989501953125, -7.7169189453125, -7.4443359375, -7.1717529296875, -6.899169921875, -6.6265869140625, -6.35400390625, -6.0814208984375, -5.808837890625, -5.5362548828125, -5.263671875, -4.9910888671875, -4.718505859375, -4.4459228515625, -4.17333984375, -3.9007568359375, -3.628173828125, -3.3555908203125, -3.0830078125, -2.8104248046875, -2.537841796875, -2.2652587890625, -1.99267578125, -1.7200927734375, -1.447509765625, -1.1749267578125, -0.90234375, -0.6297607421875, -0.357177734375, -0.0845947265625, 0.18798828125, 0.4605712890625, 0.733154296875, 1.0057373046875, 1.2783203125, 1.5509033203125, 1.823486328125, 2.0960693359375, 2.36865234375, 2.6412353515625, 2.913818359375, 3.1864013671875, 3.458984375, 3.7315673828125, 4.004150390625, 4.2767333984375, 4.54931640625, 4.8218994140625, 5.094482421875, 5.3670654296875, 5.6396484375, 5.9122314453125, 6.184814453125, 6.4573974609375, 6.72998046875, 7.0025634765625, 7.275146484375, 7.5477294921875, 7.8203125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 5.0, 3.0, 11.0, 12.0, 24.0, 35.0, 39.0, 43.0, 103.0, 143.0, 203.0, 304.0, 432.0, 505.0, 563.0, 453.0, 345.0, 295.0, 167.0, 127.0, 85.0, 67.0, 33.0, 24.0, 22.0, 15.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2265625, -6.9508056640625, -6.675048828125, -6.3992919921875, -6.12353515625, -5.8477783203125, -5.572021484375, -5.2962646484375, -5.0205078125, -4.7447509765625, -4.468994140625, -4.1932373046875, -3.91748046875, -3.6417236328125, -3.365966796875, -3.0902099609375, -2.814453125, -2.5386962890625, -2.262939453125, -1.9871826171875, -1.71142578125, -1.4356689453125, -1.159912109375, -0.8841552734375, -0.6083984375, -0.3326416015625, -0.056884765625, 0.2188720703125, 0.49462890625, 0.7703857421875, 1.046142578125, 1.3218994140625, 1.59765625, 1.8734130859375, 2.149169921875, 2.4249267578125, 2.70068359375, 2.9764404296875, 3.252197265625, 3.5279541015625, 3.8037109375, 4.0794677734375, 4.355224609375, 4.6309814453125, 4.90673828125, 5.1824951171875, 5.458251953125, 5.7340087890625, 6.009765625, 6.2855224609375, 6.561279296875, 6.8370361328125, 7.11279296875, 7.3885498046875, 7.664306640625, 7.9400634765625, 8.2158203125, 8.4915771484375, 8.767333984375, 9.0430908203125, 9.31884765625, 9.5946044921875, 9.870361328125, 10.1461181640625, 10.421875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 7.0, 8.0, 5.0, 13.0, 19.0, 32.0, 30.0, 53.0, 81.0, 129.0, 215.0, 379.0, 769.0, 3086.0, 36387.0, 711834.0, 3092936.0, 327151.0, 17896.0, 1917.0, 578.0, 265.0, 170.0, 96.0, 73.0, 43.0, 42.0, 28.0, 19.0, 6.0, 5.0, 4.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.2481689453125, -16.746337890625, -16.2445068359375, -15.74267578125, -15.2408447265625, -14.739013671875, -14.2371826171875, -13.7353515625, -13.2335205078125, -12.731689453125, -12.2298583984375, -11.72802734375, -11.2261962890625, -10.724365234375, -10.2225341796875, -9.720703125, -9.2188720703125, -8.717041015625, -8.2152099609375, -7.71337890625, -7.2115478515625, -6.709716796875, -6.2078857421875, -5.7060546875, -5.2042236328125, -4.702392578125, -4.2005615234375, -3.69873046875, -3.1968994140625, -2.695068359375, -2.1932373046875, -1.69140625, -1.1895751953125, -0.687744140625, -0.1859130859375, 0.31591796875, 0.8177490234375, 1.319580078125, 1.8214111328125, 2.3232421875, 2.8250732421875, 3.326904296875, 3.8287353515625, 4.33056640625, 4.8323974609375, 5.334228515625, 5.8360595703125, 6.337890625, 6.8397216796875, 7.341552734375, 7.8433837890625, 8.34521484375, 8.8470458984375, 9.348876953125, 9.8507080078125, 10.3525390625, 10.8543701171875, 11.356201171875, 11.8580322265625, 12.35986328125, 12.8616943359375, 13.363525390625, 13.8653564453125, 14.3671875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 19.0, 95.0, 218.0, 306.0, 241.0, 100.0, 27.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.3333740234375, -58.01591110229492, -54.69845199584961, -51.38098907470703, -48.06352996826172, -44.74606704711914, -41.42860412597656, -38.11114501953125, -34.79368591308594, -31.476224899291992, -28.158763885498047, -24.84130096435547, -21.523841857910156, -18.206378936767578, -14.888917922973633, -11.571456909179688, -8.25399398803711, -4.936532974243164, -1.6190714836120605, 1.698390007019043, 5.015851020812988, 8.33331298828125, 11.650774002075195, 14.96823501586914, 18.285696029663086, 21.60315704345703, 24.920618057250977, 28.238079071044922, 31.5555419921875, 34.87300109863281, 38.19046401977539, 41.50792694091797, 44.82538604736328, 48.14284896850586, 51.46030807495117, 54.77777099609375, 58.09523010253906, 61.41269302368164, 64.73015594482422, 68.04761505126953, 71.36507415771484, 74.68253326416016, 78.0, 81.31745910644531, 84.63491821289062, 87.95237731933594, 91.26984405517578, 94.5873031616211, 97.90476989746094, 101.22222900390625, 104.5396957397461, 107.8571548461914, 111.17461395263672, 114.49208068847656, 117.80953979492188, 121.12699890136719, 124.4444580078125, 127.76191711425781, 131.07937622070312, 134.39683532714844, 137.7143096923828, 141.03176879882812, 144.34922790527344, 147.66668701171875, 150.98414611816406]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 6.0, 8.0, 8.0, 7.0, 15.0, 14.0, 20.0, 22.0, 17.0, 29.0, 25.0, 36.0, 27.0, 31.0, 31.0, 32.0, 38.0, 38.0, 32.0, 41.0, 46.0, 48.0, 34.0, 30.0, 32.0, 38.0, 40.0, 26.0, 28.0, 25.0, 21.0, 20.0, 24.0, 16.0, 14.0, 9.0, 10.0, 4.0, 9.0, 6.0, 7.0, 7.0, 8.0, 4.0, 6.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.10610008239746, -21.42341423034668, -20.7407283782959, -20.058042526245117, -19.37535858154297, -18.692672729492188, -18.009986877441406, -17.327301025390625, -16.644615173339844, -15.961929321289062, -15.279243469238281, -14.596558570861816, -13.913872718811035, -13.231186866760254, -12.548501968383789, -11.865816116333008, -11.183130264282227, -10.500444412231445, -9.817758560180664, -9.1350736618042, -8.452387809753418, -7.769701957702637, -7.087016582489014, -6.404331207275391, -5.721645355224609, -5.038959503173828, -4.356274127960205, -3.673588514328003, -2.990902900695801, -2.3082172870635986, -1.6255316734313965, -0.9428462982177734, -0.2601585388183594, 0.4225270748138428, 1.105212688446045, 1.787898302078247, 2.470583915710449, 3.1532695293426514, 3.8359551429748535, 4.518640518188477, 5.201326370239258, 5.884012222290039, 6.566697597503662, 7.249382972717285, 7.932068824768066, 8.614754676818848, 9.297439575195312, 9.980125427246094, 10.662811279296875, 11.345497131347656, 12.028182983398438, 12.710867881774902, 13.393553733825684, 14.076239585876465, 14.75892448425293, 15.441610336303711, 16.124296188354492, 16.806982040405273, 17.489667892456055, 18.172353744506836, 18.855037689208984, 19.537723541259766, 20.220409393310547, 20.903095245361328, 21.58578109741211]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 9.0, 5.0, 7.0, 13.0, 17.0, 23.0, 24.0, 30.0, 30.0, 22.0, 44.0, 36.0, 30.0, 33.0, 36.0, 32.0, 53.0, 50.0, 46.0, 46.0, 55.0, 42.0, 53.0, 40.0, 39.0, 25.0, 22.0, 23.0, 27.0, 19.0, 11.0, 14.0, 6.0, 9.0, 7.0, 9.0, 9.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.88671875, -3.76800537109375, -3.6492919921875, -3.53057861328125, -3.411865234375, -3.29315185546875, -3.1744384765625, -3.05572509765625, -2.93701171875, -2.81829833984375, -2.6995849609375, -2.58087158203125, -2.462158203125, -2.34344482421875, -2.2247314453125, -2.10601806640625, -1.9873046875, -1.86859130859375, -1.7498779296875, -1.63116455078125, -1.512451171875, -1.39373779296875, -1.2750244140625, -1.15631103515625, -1.03759765625, -0.91888427734375, -0.8001708984375, -0.68145751953125, -0.562744140625, -0.44403076171875, -0.3253173828125, -0.20660400390625, -0.087890625, 0.03082275390625, 0.1495361328125, 0.26824951171875, 0.386962890625, 0.50567626953125, 0.6243896484375, 0.74310302734375, 0.86181640625, 0.98052978515625, 1.0992431640625, 1.21795654296875, 1.336669921875, 1.45538330078125, 1.5740966796875, 1.69281005859375, 1.8115234375, 1.93023681640625, 2.0489501953125, 2.16766357421875, 2.286376953125, 2.40509033203125, 2.5238037109375, 2.64251708984375, 2.76123046875, 2.87994384765625, 2.9986572265625, 3.11737060546875, 3.236083984375, 3.35479736328125, 3.4735107421875, 3.59222412109375, 3.7109375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 5.0, 17.0, 15.0, 27.0, 44.0, 72.0, 137.0, 219.0, 412.0, 732.0, 1322.0, 2334.0, 4103.0, 6886.0, 11550.0, 18591.0, 28492.0, 41998.0, 59915.0, 81115.0, 105598.0, 129037.0, 134922.0, 118318.0, 91993.0, 68921.0, 49630.0, 34111.0, 22562.0, 14321.0, 8847.0, 5223.0, 3118.0, 1716.0, 950.0, 565.0, 316.0, 166.0, 106.0, 48.0, 35.0, 27.0, 16.0, 3.0, 6.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3515625, -1.306854248046875, -1.26214599609375, -1.217437744140625, -1.1727294921875, -1.128021240234375, -1.08331298828125, -1.038604736328125, -0.993896484375, -0.949188232421875, -0.90447998046875, -0.859771728515625, -0.8150634765625, -0.770355224609375, -0.72564697265625, -0.680938720703125, -0.63623046875, -0.591522216796875, -0.54681396484375, -0.502105712890625, -0.4573974609375, -0.412689208984375, -0.36798095703125, -0.323272705078125, -0.278564453125, -0.233856201171875, -0.18914794921875, -0.144439697265625, -0.0997314453125, -0.055023193359375, -0.01031494140625, 0.034393310546875, 0.0791015625, 0.123809814453125, 0.16851806640625, 0.213226318359375, 0.2579345703125, 0.302642822265625, 0.34735107421875, 0.392059326171875, 0.436767578125, 0.481475830078125, 0.52618408203125, 0.570892333984375, 0.6156005859375, 0.660308837890625, 0.70501708984375, 0.749725341796875, 0.79443359375, 0.839141845703125, 0.88385009765625, 0.928558349609375, 0.9732666015625, 1.017974853515625, 1.06268310546875, 1.107391357421875, 1.152099609375, 1.196807861328125, 1.24151611328125, 1.286224365234375, 1.3309326171875, 1.375640869140625, 1.42034912109375, 1.465057373046875, 1.509765625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 7.0, 16.0, 11.0, 7.0, 17.0, 16.0, 19.0, 18.0, 20.0, 32.0, 22.0, 30.0, 30.0, 30.0, 38.0, 41.0, 35.0, 41.0, 49.0, 1054.0, 34.0, 33.0, 31.0, 34.0, 38.0, 34.0, 31.0, 29.0, 20.0, 30.0, 26.0, 19.0, 29.0, 16.0, 8.0, 17.0, 7.0, 6.0, 7.0, 6.0, 5.0, 5.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.947265625, -2.855987548828125, -2.76470947265625, -2.673431396484375, -2.5821533203125, -2.490875244140625, -2.39959716796875, -2.308319091796875, -2.217041015625, -2.125762939453125, -2.03448486328125, -1.943206787109375, -1.8519287109375, -1.760650634765625, -1.66937255859375, -1.578094482421875, -1.48681640625, -1.395538330078125, -1.30426025390625, -1.212982177734375, -1.1217041015625, -1.030426025390625, -0.93914794921875, -0.847869873046875, -0.756591796875, -0.665313720703125, -0.57403564453125, -0.482757568359375, -0.3914794921875, -0.300201416015625, -0.20892333984375, -0.117645263671875, -0.0263671875, 0.064910888671875, 0.15618896484375, 0.247467041015625, 0.3387451171875, 0.430023193359375, 0.52130126953125, 0.612579345703125, 0.703857421875, 0.795135498046875, 0.88641357421875, 0.977691650390625, 1.0689697265625, 1.160247802734375, 1.25152587890625, 1.342803955078125, 1.43408203125, 1.525360107421875, 1.61663818359375, 1.707916259765625, 1.7991943359375, 1.890472412109375, 1.98175048828125, 2.073028564453125, 2.164306640625, 2.255584716796875, 2.34686279296875, 2.438140869140625, 2.5294189453125, 2.620697021484375, 2.71197509765625, 2.803253173828125, 2.89453125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 9.0, 14.0, 21.0, 39.0, 56.0, 82.0, 122.0, 185.0, 290.0, 410.0, 659.0, 956.0, 1347.0, 2027.0, 2979.0, 4432.0, 6357.0, 9649.0, 14373.0, 23728.0, 62630.0, 1803909.0, 89858.0, 25745.0, 15787.0, 10157.0, 6750.0, 4730.0, 3176.0, 2211.0, 1421.0, 1008.0, 666.0, 445.0, 271.0, 206.0, 158.0, 86.0, 65.0, 40.0, 31.0, 13.0, 16.0, 5.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.943359375, -2.852996826171875, -2.76263427734375, -2.672271728515625, -2.5819091796875, -2.491546630859375, -2.40118408203125, -2.310821533203125, -2.220458984375, -2.130096435546875, -2.03973388671875, -1.949371337890625, -1.8590087890625, -1.768646240234375, -1.67828369140625, -1.587921142578125, -1.49755859375, -1.407196044921875, -1.31683349609375, -1.226470947265625, -1.1361083984375, -1.045745849609375, -0.95538330078125, -0.865020751953125, -0.774658203125, -0.684295654296875, -0.59393310546875, -0.503570556640625, -0.4132080078125, -0.322845458984375, -0.23248291015625, -0.142120361328125, -0.0517578125, 0.038604736328125, 0.12896728515625, 0.219329833984375, 0.3096923828125, 0.400054931640625, 0.49041748046875, 0.580780029296875, 0.671142578125, 0.761505126953125, 0.85186767578125, 0.942230224609375, 1.0325927734375, 1.122955322265625, 1.21331787109375, 1.303680419921875, 1.39404296875, 1.484405517578125, 1.57476806640625, 1.665130615234375, 1.7554931640625, 1.845855712890625, 1.93621826171875, 2.026580810546875, 2.116943359375, 2.207305908203125, 2.29766845703125, 2.388031005859375, 2.4783935546875, 2.568756103515625, 2.65911865234375, 2.749481201171875, 2.83984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 9.0, 10.0, 18.0, 16.0, 28.0, 26.0, 39.0, 42.0, 46.0, 38.0, 39.0, 58.0, 44.0, 38.0, 44.0, 50.0, 45.0, 48.0, 54.0, 49.0, 40.0, 45.0, 34.0, 29.0, 23.0, 18.0, 11.0, 9.0, 9.0, 8.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1419677734375, -0.13744354248046875, -0.1329193115234375, -0.12839508056640625, -0.123870849609375, -0.11934661865234375, -0.1148223876953125, -0.11029815673828125, -0.10577392578125, -0.10124969482421875, -0.0967254638671875, -0.09220123291015625, -0.087677001953125, -0.08315277099609375, -0.0786285400390625, -0.07410430908203125, -0.069580078125, -0.06505584716796875, -0.0605316162109375, -0.05600738525390625, -0.051483154296875, -0.04695892333984375, -0.0424346923828125, -0.03791046142578125, -0.03338623046875, -0.02886199951171875, -0.0243377685546875, -0.01981353759765625, -0.015289306640625, -0.01076507568359375, -0.0062408447265625, -0.00171661376953125, 0.0028076171875, 0.00733184814453125, 0.0118560791015625, 0.01638031005859375, 0.020904541015625, 0.02542877197265625, 0.0299530029296875, 0.03447723388671875, 0.03900146484375, 0.04352569580078125, 0.0480499267578125, 0.05257415771484375, 0.057098388671875, 0.06162261962890625, 0.0661468505859375, 0.07067108154296875, 0.0751953125, 0.07971954345703125, 0.0842437744140625, 0.08876800537109375, 0.093292236328125, 0.09781646728515625, 0.1023406982421875, 0.10686492919921875, 0.11138916015625, 0.11591339111328125, 0.1204376220703125, 0.12496185302734375, 0.129486083984375, 0.13401031494140625, 0.1385345458984375, 0.14305877685546875, 0.1475830078125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 4.0, 8.0, 9.0, 20.0, 20.0, 31.0, 37.0, 52.0, 69.0, 108.0, 188.0, 364.0, 716.0, 2606.0, 900959.0, 140613.0, 1378.0, 606.0, 278.0, 157.0, 76.0, 61.0, 48.0, 37.0, 20.0, 15.0, 16.0, 14.0, 6.0, 6.0, 4.0, 2.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.134765625, -3.04473876953125, -2.9547119140625, -2.86468505859375, -2.774658203125, -2.68463134765625, -2.5946044921875, -2.50457763671875, -2.41455078125, -2.32452392578125, -2.2344970703125, -2.14447021484375, -2.054443359375, -1.96441650390625, -1.8743896484375, -1.78436279296875, -1.6943359375, -1.60430908203125, -1.5142822265625, -1.42425537109375, -1.334228515625, -1.24420166015625, -1.1541748046875, -1.06414794921875, -0.97412109375, -0.88409423828125, -0.7940673828125, -0.70404052734375, -0.614013671875, -0.52398681640625, -0.4339599609375, -0.34393310546875, -0.25390625, -0.16387939453125, -0.0738525390625, 0.01617431640625, 0.106201171875, 0.19622802734375, 0.2862548828125, 0.37628173828125, 0.46630859375, 0.55633544921875, 0.6463623046875, 0.73638916015625, 0.826416015625, 0.91644287109375, 1.0064697265625, 1.09649658203125, 1.1865234375, 1.27655029296875, 1.3665771484375, 1.45660400390625, 1.546630859375, 1.63665771484375, 1.7266845703125, 1.81671142578125, 1.90673828125, 1.99676513671875, 2.0867919921875, 2.17681884765625, 2.266845703125, 2.35687255859375, 2.4468994140625, 2.53692626953125, 2.626953125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 13.0, 79.0, 571.0, 315.0, 28.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.785524368286133, -5.661980152130127, -5.538435935974121, -5.414891719818115, -5.291347026824951, -5.167802810668945, -5.0442585945129395, -4.920714378356934, -4.797170162200928, -4.673625946044922, -4.550081729888916, -4.42653751373291, -4.302992820739746, -4.17944860458374, -4.055904388427734, -3.9323601722717285, -3.8088159561157227, -3.685271739959717, -3.561727285385132, -3.438183069229126, -3.31463885307312, -3.191094398498535, -3.0675501823425293, -2.9440059661865234, -2.8204615116119385, -2.6969172954559326, -2.5733728408813477, -2.449828624725342, -2.326284408569336, -2.20274019241333, -2.079195737838745, -1.9556515216827393, -1.8321073055267334, -1.708562970161438, -1.5850187540054321, -1.4614744186401367, -1.3379302024841309, -1.2143858671188354, -1.09084153175354, -0.9672973155975342, -0.8437530398368835, -0.7202087640762329, -0.5966644883155823, -0.47312018275260925, -0.3495759069919586, -0.2260316014289856, -0.10248732566833496, 0.021056950092315674, 0.1446012258529663, 0.26814550161361694, 0.3916897773742676, 0.515234112739563, 0.6387783288955688, 0.7623226642608643, 0.8858669400215149, 1.0094112157821655, 1.132955551147461, 1.2564998865127563, 1.3800441026687622, 1.5035884380340576, 1.6271326541900635, 1.7506769895553589, 1.8742213249206543, 1.9977655410766602, 2.121309757232666]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 2.0, 5.0, 7.0, 10.0, 12.0, 13.0, 15.0, 20.0, 19.0, 38.0, 27.0, 44.0, 36.0, 53.0, 31.0, 57.0, 48.0, 60.0, 40.0, 54.0, 48.0, 51.0, 33.0, 50.0, 32.0, 31.0, 42.0, 25.0, 20.0, 26.0, 9.0, 16.0, 10.0, 3.0, 5.0, 6.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8512094616889954, -0.8237989544868469, -0.7963884472846985, -0.76897794008255, -0.7415674328804016, -0.7141569256782532, -0.68674635887146, -0.6593358516693115, -0.6319253444671631, -0.6045148372650146, -0.5771043300628662, -0.5496938228607178, -0.5222833156585693, -0.4948728084564209, -0.4674622714519501, -0.44005176424980164, -0.4126412868499756, -0.38523077964782715, -0.3578202724456787, -0.3304097652435303, -0.30299925804138184, -0.2755887508392334, -0.24817821383476257, -0.22076770663261414, -0.1933571994304657, -0.16594669222831726, -0.13853618502616882, -0.11112566292285919, -0.08371515572071075, -0.05630464851856232, -0.028894126415252686, -0.001483619213104248, 0.025926828384399414, 0.05333733931183815, 0.08074785023927689, 0.10815836489200592, 0.13556887209415436, 0.1629793792963028, 0.19038990139961243, 0.21780040860176086, 0.2452109158039093, 0.27262142300605774, 0.3000319302082062, 0.327442467212677, 0.35485297441482544, 0.3822634816169739, 0.4096739888191223, 0.43708449602127075, 0.4644950032234192, 0.4919055104255676, 0.5193160176277161, 0.5467265248298645, 0.5741370320320129, 0.6015475392341614, 0.6289581060409546, 0.656368613243103, 0.6837791204452515, 0.7111896276473999, 0.7386001348495483, 0.7660106420516968, 0.7934211492538452, 0.8208316564559937, 0.8482421636581421, 0.8756526708602905, 0.903063178062439]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 11.0, 5.0, 9.0, 21.0, 18.0, 14.0, 9.0, 18.0, 32.0, 28.0, 24.0, 38.0, 31.0, 39.0, 35.0, 38.0, 42.0, 32.0, 56.0, 41.0, 50.0, 47.0, 54.0, 35.0, 27.0, 25.0, 42.0, 32.0, 25.0, 26.0, 22.0, 12.0, 11.0, 9.0, 7.0, 10.0, 3.0, 9.0, 3.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.869140625, -3.75714111328125, -3.6451416015625, -3.53314208984375, -3.421142578125, -3.30914306640625, -3.1971435546875, -3.08514404296875, -2.97314453125, -2.86114501953125, -2.7491455078125, -2.63714599609375, -2.525146484375, -2.41314697265625, -2.3011474609375, -2.18914794921875, -2.0771484375, -1.96514892578125, -1.8531494140625, -1.74114990234375, -1.629150390625, -1.51715087890625, -1.4051513671875, -1.29315185546875, -1.18115234375, -1.06915283203125, -0.9571533203125, -0.84515380859375, -0.733154296875, -0.62115478515625, -0.5091552734375, -0.39715576171875, -0.28515625, -0.17315673828125, -0.0611572265625, 0.05084228515625, 0.162841796875, 0.27484130859375, 0.3868408203125, 0.49884033203125, 0.61083984375, 0.72283935546875, 0.8348388671875, 0.94683837890625, 1.058837890625, 1.17083740234375, 1.2828369140625, 1.39483642578125, 1.5068359375, 1.61883544921875, 1.7308349609375, 1.84283447265625, 1.954833984375, 2.06683349609375, 2.1788330078125, 2.29083251953125, 2.40283203125, 2.51483154296875, 2.6268310546875, 2.73883056640625, 2.850830078125, 2.96282958984375, 3.0748291015625, 3.18682861328125, 3.298828125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 8.0, 11.0, 15.0, 31.0, 42.0, 88.0, 178.0, 285.0, 553.0, 932.0, 1748.0, 3467.0, 6311.0, 11854.0, 22449.0, 43194.0, 82967.0, 164334.0, 315763.0, 193694.0, 95364.0, 49665.0, 26290.0, 13746.0, 7235.0, 3872.0, 2015.0, 1113.0, 578.0, 320.0, 172.0, 102.0, 57.0, 41.0, 24.0, 14.0, 9.0, 4.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.47265625, -3.36279296875, -3.2529296875, -3.14306640625, -3.033203125, -2.92333984375, -2.8134765625, -2.70361328125, -2.59375, -2.48388671875, -2.3740234375, -2.26416015625, -2.154296875, -2.04443359375, -1.9345703125, -1.82470703125, -1.71484375, -1.60498046875, -1.4951171875, -1.38525390625, -1.275390625, -1.16552734375, -1.0556640625, -0.94580078125, -0.8359375, -0.72607421875, -0.6162109375, -0.50634765625, -0.396484375, -0.28662109375, -0.1767578125, -0.06689453125, 0.04296875, 0.15283203125, 0.2626953125, 0.37255859375, 0.482421875, 0.59228515625, 0.7021484375, 0.81201171875, 0.921875, 1.03173828125, 1.1416015625, 1.25146484375, 1.361328125, 1.47119140625, 1.5810546875, 1.69091796875, 1.80078125, 1.91064453125, 2.0205078125, 2.13037109375, 2.240234375, 2.35009765625, 2.4599609375, 2.56982421875, 2.6796875, 2.78955078125, 2.8994140625, 3.00927734375, 3.119140625, 3.22900390625, 3.3388671875, 3.44873046875, 3.55859375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 5.0, 8.0, 8.0, 6.0, 18.0, 23.0, 15.0, 21.0, 23.0, 37.0, 30.0, 39.0, 40.0, 51.0, 66.0, 75.0, 216.0, 1438.0, 339.0, 152.0, 69.0, 52.0, 48.0, 50.0, 45.0, 28.0, 23.0, 25.0, 14.0, 17.0, 23.0, 5.0, 9.0, 12.0, 6.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9375, -10.5126953125, -10.087890625, -9.6630859375, -9.23828125, -8.8134765625, -8.388671875, -7.9638671875, -7.5390625, -7.1142578125, -6.689453125, -6.2646484375, -5.83984375, -5.4150390625, -4.990234375, -4.5654296875, -4.140625, -3.7158203125, -3.291015625, -2.8662109375, -2.44140625, -2.0166015625, -1.591796875, -1.1669921875, -0.7421875, -0.3173828125, 0.107421875, 0.5322265625, 0.95703125, 1.3818359375, 1.806640625, 2.2314453125, 2.65625, 3.0810546875, 3.505859375, 3.9306640625, 4.35546875, 4.7802734375, 5.205078125, 5.6298828125, 6.0546875, 6.4794921875, 6.904296875, 7.3291015625, 7.75390625, 8.1787109375, 8.603515625, 9.0283203125, 9.453125, 9.8779296875, 10.302734375, 10.7275390625, 11.15234375, 11.5771484375, 12.001953125, 12.4267578125, 12.8515625, 13.2763671875, 13.701171875, 14.1259765625, 14.55078125, 14.9755859375, 15.400390625, 15.8251953125, 16.25]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 10.0, 27.0, 17.0, 50.0, 88.0, 93.0, 195.0, 329.0, 1117.0, 53910.0, 3083869.0, 4636.0, 635.0, 281.0, 179.0, 91.0, 70.0, 42.0, 24.0, 19.0, 7.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.15625, -38.68603515625, -37.2158203125, -35.74560546875, -34.275390625, -32.80517578125, -31.3349609375, -29.86474609375, -28.39453125, -26.92431640625, -25.4541015625, -23.98388671875, -22.513671875, -21.04345703125, -19.5732421875, -18.10302734375, -16.6328125, -15.16259765625, -13.6923828125, -12.22216796875, -10.751953125, -9.28173828125, -7.8115234375, -6.34130859375, -4.87109375, -3.40087890625, -1.9306640625, -0.46044921875, 1.009765625, 2.47998046875, 3.9501953125, 5.42041015625, 6.890625, 8.36083984375, 9.8310546875, 11.30126953125, 12.771484375, 14.24169921875, 15.7119140625, 17.18212890625, 18.65234375, 20.12255859375, 21.5927734375, 23.06298828125, 24.533203125, 26.00341796875, 27.4736328125, 28.94384765625, 30.4140625, 31.88427734375, 33.3544921875, 34.82470703125, 36.294921875, 37.76513671875, 39.2353515625, 40.70556640625, 42.17578125, 43.64599609375, 45.1162109375, 46.58642578125, 48.056640625, 49.52685546875, 50.9970703125, 52.46728515625, 53.9375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 96.0, 790.0, 125.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.61100196838379, -19.16728973388672, -13.723576545715332, -8.279863357543945, -2.836151123046875, 2.6075611114501953, 8.051275253295898, 13.494985580444336, 18.93869972229004, 24.38241195678711, 29.826126098632812, 35.26983642578125, 40.71355056762695, 46.157264709472656, 51.600975036621094, 57.04468536376953, 62.4884033203125, 67.93211364746094, 73.3758316040039, 78.81954193115234, 84.26325225830078, 89.70697021484375, 95.15068054199219, 100.59439086914062, 106.03810119628906, 111.4818115234375, 116.92552947998047, 122.3692398071289, 127.81295013427734, 133.2566680908203, 138.70037841796875, 144.1440887451172, 149.5878143310547, 155.03152465820312, 160.47523498535156, 165.9189453125, 171.3626708984375, 176.80638122558594, 182.25009155273438, 187.6938018798828, 193.13751220703125, 198.5812225341797, 204.02493286132812, 209.46865844726562, 214.91236877441406, 220.3560791015625, 225.79978942871094, 231.24349975585938, 236.68722534179688, 242.1309356689453, 247.57464599609375, 253.01837158203125, 258.4620666503906, 263.9057922363281, 269.3494873046875, 274.793212890625, 280.2369079589844, 285.6806335449219, 291.12432861328125, 296.56805419921875, 302.0117492675781, 307.4554748535156, 312.899169921875, 318.3428955078125, 323.78662109375]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 8.0, 7.0, 5.0, 4.0, 5.0, 9.0, 10.0, 15.0, 16.0, 13.0, 17.0, 24.0, 40.0, 35.0, 22.0, 50.0, 36.0, 22.0, 50.0, 51.0, 43.0, 37.0, 35.0, 35.0, 47.0, 36.0, 34.0, 33.0, 36.0, 38.0, 34.0, 33.0, 31.0, 24.0, 13.0, 9.0, 6.0, 3.0, 9.0, 7.0, 6.0, 8.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.7557258605957, -32.700504302978516, -31.645282745361328, -30.590059280395508, -29.53483772277832, -28.479616165161133, -27.424392700195312, -26.369171142578125, -25.313949584960938, -24.25872802734375, -23.203506469726562, -22.148283004760742, -21.093061447143555, -20.037839889526367, -18.982616424560547, -17.92739486694336, -16.872173309326172, -15.816951751708984, -14.76172924041748, -13.706506729125977, -12.651285171508789, -11.596063613891602, -10.540841102600098, -9.485618591308594, -8.430397033691406, -7.3751749992370605, -6.319952964782715, -5.264730930328369, -4.209508895874023, -3.1542868614196777, -2.099064826965332, -1.0438427925109863, 0.011379241943359375, 1.066601276397705, 2.121823310852051, 3.1770453453063965, 4.232267379760742, 5.287489414215088, 6.342711448669434, 7.397933483123779, 8.453155517578125, 9.508377075195312, 10.563599586486816, 11.61882209777832, 12.674043655395508, 13.729265213012695, 14.7844877243042, 15.839710235595703, 16.89493179321289, 17.950153350830078, 19.005374908447266, 20.060598373413086, 21.115819931030273, 22.17104148864746, 23.22626495361328, 24.28148651123047, 25.336708068847656, 26.391929626464844, 27.44715118408203, 28.50237464904785, 29.55759620666504, 30.612817764282227, 31.668041229248047, 32.723262786865234, 33.77848434448242]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 9.0, 11.0, 10.0, 13.0, 19.0, 19.0, 24.0, 29.0, 27.0, 33.0, 26.0, 26.0, 38.0, 32.0, 33.0, 43.0, 38.0, 50.0, 35.0, 44.0, 43.0, 54.0, 33.0, 36.0, 45.0, 20.0, 21.0, 24.0, 25.0, 16.0, 19.0, 13.0, 8.0, 12.0, 13.0, 8.0, 6.0, 7.0, 4.0, 4.0, 4.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.734375, -3.62078857421875, -3.5072021484375, -3.39361572265625, -3.280029296875, -3.16644287109375, -3.0528564453125, -2.93927001953125, -2.82568359375, -2.71209716796875, -2.5985107421875, -2.48492431640625, -2.371337890625, -2.25775146484375, -2.1441650390625, -2.03057861328125, -1.9169921875, -1.80340576171875, -1.6898193359375, -1.57623291015625, -1.462646484375, -1.34906005859375, -1.2354736328125, -1.12188720703125, -1.00830078125, -0.89471435546875, -0.7811279296875, -0.66754150390625, -0.553955078125, -0.44036865234375, -0.3267822265625, -0.21319580078125, -0.099609375, 0.01397705078125, 0.1275634765625, 0.24114990234375, 0.354736328125, 0.46832275390625, 0.5819091796875, 0.69549560546875, 0.80908203125, 0.92266845703125, 1.0362548828125, 1.14984130859375, 1.263427734375, 1.37701416015625, 1.4906005859375, 1.60418701171875, 1.7177734375, 1.83135986328125, 1.9449462890625, 2.05853271484375, 2.172119140625, 2.28570556640625, 2.3992919921875, 2.51287841796875, 2.62646484375, 2.74005126953125, 2.8536376953125, 2.96722412109375, 3.080810546875, 3.19439697265625, 3.3079833984375, 3.42156982421875, 3.53515625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 7.0, 8.0, 13.0, 10.0, 15.0, 17.0, 35.0, 43.0, 41.0, 75.0, 91.0, 154.0, 287.0, 716.0, 2363.0, 10904.0, 62914.0, 416663.0, 1944135.0, 1457378.0, 250768.0, 38225.0, 6714.0, 1530.0, 508.0, 217.0, 125.0, 91.0, 46.0, 55.0, 26.0, 19.0, 15.0, 14.0, 11.0, 9.0, 6.0, 8.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-8.9375, -8.695068359375, -8.45263671875, -8.210205078125, -7.9677734375, -7.725341796875, -7.48291015625, -7.240478515625, -6.998046875, -6.755615234375, -6.51318359375, -6.270751953125, -6.0283203125, -5.785888671875, -5.54345703125, -5.301025390625, -5.05859375, -4.816162109375, -4.57373046875, -4.331298828125, -4.0888671875, -3.846435546875, -3.60400390625, -3.361572265625, -3.119140625, -2.876708984375, -2.63427734375, -2.391845703125, -2.1494140625, -1.906982421875, -1.66455078125, -1.422119140625, -1.1796875, -0.937255859375, -0.69482421875, -0.452392578125, -0.2099609375, 0.032470703125, 0.27490234375, 0.517333984375, 0.759765625, 1.002197265625, 1.24462890625, 1.487060546875, 1.7294921875, 1.971923828125, 2.21435546875, 2.456787109375, 2.69921875, 2.941650390625, 3.18408203125, 3.426513671875, 3.6689453125, 3.911376953125, 4.15380859375, 4.396240234375, 4.638671875, 4.881103515625, 5.12353515625, 5.365966796875, 5.6083984375, 5.850830078125, 6.09326171875, 6.335693359375, 6.578125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 8.0, 12.0, 13.0, 12.0, 21.0, 42.0, 55.0, 65.0, 78.0, 114.0, 155.0, 225.0, 273.0, 337.0, 428.0, 500.0, 449.0, 357.0, 225.0, 183.0, 118.0, 106.0, 74.0, 51.0, 49.0, 31.0, 27.0, 20.0, 19.0, 8.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.91015625, -6.67462158203125, -6.4390869140625, -6.20355224609375, -5.968017578125, -5.73248291015625, -5.4969482421875, -5.26141357421875, -5.02587890625, -4.79034423828125, -4.5548095703125, -4.31927490234375, -4.083740234375, -3.84820556640625, -3.6126708984375, -3.37713623046875, -3.1416015625, -2.90606689453125, -2.6705322265625, -2.43499755859375, -2.199462890625, -1.96392822265625, -1.7283935546875, -1.49285888671875, -1.25732421875, -1.02178955078125, -0.7862548828125, -0.55072021484375, -0.315185546875, -0.07965087890625, 0.1558837890625, 0.39141845703125, 0.626953125, 0.86248779296875, 1.0980224609375, 1.33355712890625, 1.569091796875, 1.80462646484375, 2.0401611328125, 2.27569580078125, 2.51123046875, 2.74676513671875, 2.9822998046875, 3.21783447265625, 3.453369140625, 3.68890380859375, 3.9244384765625, 4.15997314453125, 4.3955078125, 4.63104248046875, 4.8665771484375, 5.10211181640625, 5.337646484375, 5.57318115234375, 5.8087158203125, 6.04425048828125, 6.27978515625, 6.51531982421875, 6.7508544921875, 6.98638916015625, 7.221923828125, 7.45745849609375, 7.6929931640625, 7.92852783203125, 8.1640625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 9.0, 8.0, 12.0, 17.0, 23.0, 31.0, 32.0, 47.0, 56.0, 104.0, 138.0, 196.0, 337.0, 717.0, 4354.0, 207390.0, 3705113.0, 268772.0, 5039.0, 776.0, 397.0, 231.0, 137.0, 120.0, 62.0, 47.0, 35.0, 29.0, 14.0, 10.0, 13.0, 7.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.140625, -25.383544921875, -24.62646484375, -23.869384765625, -23.1123046875, -22.355224609375, -21.59814453125, -20.841064453125, -20.083984375, -19.326904296875, -18.56982421875, -17.812744140625, -17.0556640625, -16.298583984375, -15.54150390625, -14.784423828125, -14.02734375, -13.270263671875, -12.51318359375, -11.756103515625, -10.9990234375, -10.241943359375, -9.48486328125, -8.727783203125, -7.970703125, -7.213623046875, -6.45654296875, -5.699462890625, -4.9423828125, -4.185302734375, -3.42822265625, -2.671142578125, -1.9140625, -1.156982421875, -0.39990234375, 0.357177734375, 1.1142578125, 1.871337890625, 2.62841796875, 3.385498046875, 4.142578125, 4.899658203125, 5.65673828125, 6.413818359375, 7.1708984375, 7.927978515625, 8.68505859375, 9.442138671875, 10.19921875, 10.956298828125, 11.71337890625, 12.470458984375, 13.2275390625, 13.984619140625, 14.74169921875, 15.498779296875, 16.255859375, 17.012939453125, 17.77001953125, 18.527099609375, 19.2841796875, 20.041259765625, 20.79833984375, 21.555419921875, 22.3125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 32.0, 155.0, 365.0, 323.0, 116.0, 22.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.3353271484375, -115.04901123046875, -110.76270294189453, -106.47639465332031, -102.19007873535156, -97.90376281738281, -93.6174545288086, -89.33114624023438, -85.04483032226562, -80.75851440429688, -76.47220611572266, -72.18589782714844, -67.89958190917969, -63.6132698059082, -59.32695770263672, -55.040645599365234, -50.75433349609375, -46.468021392822266, -42.18170928955078, -37.8953971862793, -33.60908508300781, -29.322772979736328, -25.036460876464844, -20.75014877319336, -16.463836669921875, -12.17752456665039, -7.891212463378906, -3.604900360107422, 0.6814117431640625, 4.967723846435547, 9.254035949707031, 13.540348052978516, 17.826675415039062, 22.112987518310547, 26.39929962158203, 30.685611724853516, 34.971923828125, 39.258235931396484, 43.54454803466797, 47.83086013793945, 52.11717224121094, 56.40348434448242, 60.689796447753906, 64.97610473632812, 69.26242065429688, 73.54873657226562, 77.83504486083984, 82.12135314941406, 86.40766906738281, 90.69398498535156, 94.98029327392578, 99.2666015625, 103.55291748046875, 107.8392333984375, 112.12554168701172, 116.41184997558594, 120.69816589355469, 124.98448181152344, 129.27078247070312, 133.55709838867188, 137.84341430664062, 142.12973022460938, 146.41604614257812, 150.7023468017578, 154.98866271972656]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 5.0, 0.0, 7.0, 9.0, 9.0, 13.0, 13.0, 17.0, 20.0, 19.0, 18.0, 20.0, 28.0, 22.0, 37.0, 28.0, 28.0, 31.0, 40.0, 46.0, 46.0, 48.0, 40.0, 39.0, 43.0, 42.0, 44.0, 26.0, 38.0, 24.0, 30.0, 26.0, 20.0, 20.0, 15.0, 12.0, 11.0, 13.0, 11.0, 11.0, 6.0, 7.0, 2.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-23.969219207763672, -23.230419158935547, -22.491621017456055, -21.75282096862793, -21.014020919799805, -20.275222778320312, -19.536422729492188, -18.797622680664062, -18.058822631835938, -17.320022583007812, -16.58122444152832, -15.842424392700195, -15.10362434387207, -14.364825248718262, -13.626026153564453, -12.887226104736328, -12.148427963256836, -11.409628868103027, -10.670828819274902, -9.932029724121094, -9.193229675292969, -8.45443058013916, -7.715631484985352, -6.976831912994385, -6.238032341003418, -5.499232769012451, -4.760433197021484, -4.021634101867676, -3.282834529876709, -2.544034957885742, -1.8052358627319336, -1.0664362907409668, -0.32763671875, 0.41116273403167725, 1.1499621868133545, 1.8887615203857422, 2.627561092376709, 3.366360664367676, 4.105159759521484, 4.843959331512451, 5.582758903503418, 6.321558475494385, 7.060358047485352, 7.79915714263916, 8.537956237792969, 9.276756286621094, 10.015555381774902, 10.754354476928711, 11.493154525756836, 12.231953620910645, 12.97075366973877, 13.709552764892578, 14.448352813720703, 15.187151908874512, 15.92595100402832, 16.664751052856445, 17.403549194335938, 18.142349243164062, 18.881147384643555, 19.61994743347168, 20.358747482299805, 21.097545623779297, 21.836345672607422, 22.575145721435547, 23.313945770263672]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 0.0, 4.0, 8.0, 5.0, 8.0, 14.0, 9.0, 18.0, 13.0, 22.0, 21.0, 19.0, 30.0, 18.0, 25.0, 29.0, 36.0, 40.0, 38.0, 30.0, 37.0, 57.0, 40.0, 38.0, 36.0, 40.0, 43.0, 40.0, 43.0, 30.0, 31.0, 24.0, 18.0, 20.0, 26.0, 11.0, 16.0, 12.0, 11.0, 6.0, 12.0, 5.0, 6.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.365234375, -3.258026123046875, -3.15081787109375, -3.043609619140625, -2.9364013671875, -2.829193115234375, -2.72198486328125, -2.614776611328125, -2.507568359375, -2.400360107421875, -2.29315185546875, -2.185943603515625, -2.0787353515625, -1.971527099609375, -1.86431884765625, -1.757110595703125, -1.64990234375, -1.542694091796875, -1.43548583984375, -1.328277587890625, -1.2210693359375, -1.113861083984375, -1.00665283203125, -0.899444580078125, -0.792236328125, -0.685028076171875, -0.57781982421875, -0.470611572265625, -0.3634033203125, -0.256195068359375, -0.14898681640625, -0.041778564453125, 0.0654296875, 0.172637939453125, 0.27984619140625, 0.387054443359375, 0.4942626953125, 0.601470947265625, 0.70867919921875, 0.815887451171875, 0.923095703125, 1.030303955078125, 1.13751220703125, 1.244720458984375, 1.3519287109375, 1.459136962890625, 1.56634521484375, 1.673553466796875, 1.78076171875, 1.887969970703125, 1.99517822265625, 2.102386474609375, 2.2095947265625, 2.316802978515625, 2.42401123046875, 2.531219482421875, 2.638427734375, 2.745635986328125, 2.85284423828125, 2.960052490234375, 3.0672607421875, 3.174468994140625, 3.28167724609375, 3.388885498046875, 3.49609375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 8.0, 4.0, 10.0, 14.0, 35.0, 46.0, 78.0, 126.0, 234.0, 425.0, 672.0, 1252.0, 2123.0, 3516.0, 5853.0, 9451.0, 15035.0, 22822.0, 34057.0, 48015.0, 64637.0, 83059.0, 98653.0, 109556.0, 112020.0, 103795.0, 90150.0, 72745.0, 55291.0, 39619.0, 27402.0, 18064.0, 11680.0, 7265.0, 4410.0, 2655.0, 1580.0, 931.0, 529.0, 310.0, 179.0, 95.0, 57.0, 31.0, 18.0, 15.0, 18.0, 6.0, 4.0, 4.0, 0.0, 3.0, 5.0, 0.0, 2.0], "bins": [-1.435546875, -1.392333984375, -1.34912109375, -1.305908203125, -1.2626953125, -1.219482421875, -1.17626953125, -1.133056640625, -1.08984375, -1.046630859375, -1.00341796875, -0.960205078125, -0.9169921875, -0.873779296875, -0.83056640625, -0.787353515625, -0.744140625, -0.700927734375, -0.65771484375, -0.614501953125, -0.5712890625, -0.528076171875, -0.48486328125, -0.441650390625, -0.3984375, -0.355224609375, -0.31201171875, -0.268798828125, -0.2255859375, -0.182373046875, -0.13916015625, -0.095947265625, -0.052734375, -0.009521484375, 0.03369140625, 0.076904296875, 0.1201171875, 0.163330078125, 0.20654296875, 0.249755859375, 0.29296875, 0.336181640625, 0.37939453125, 0.422607421875, 0.4658203125, 0.509033203125, 0.55224609375, 0.595458984375, 0.638671875, 0.681884765625, 0.72509765625, 0.768310546875, 0.8115234375, 0.854736328125, 0.89794921875, 0.941162109375, 0.984375, 1.027587890625, 1.07080078125, 1.114013671875, 1.1572265625, 1.200439453125, 1.24365234375, 1.286865234375, 1.330078125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 4.0, 7.0, 13.0, 15.0, 16.0, 13.0, 12.0, 25.0, 28.0, 21.0, 36.0, 51.0, 34.0, 46.0, 34.0, 36.0, 41.0, 42.0, 1066.0, 48.0, 56.0, 47.0, 39.0, 50.0, 33.0, 28.0, 32.0, 30.0, 19.0, 27.0, 20.0, 10.0, 15.0, 8.0, 10.0, 5.0, 2.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.25, -4.125518798828125, -4.00103759765625, -3.876556396484375, -3.7520751953125, -3.627593994140625, -3.50311279296875, -3.378631591796875, -3.254150390625, -3.129669189453125, -3.00518798828125, -2.880706787109375, -2.7562255859375, -2.631744384765625, -2.50726318359375, -2.382781982421875, -2.25830078125, -2.133819580078125, -2.00933837890625, -1.884857177734375, -1.7603759765625, -1.635894775390625, -1.51141357421875, -1.386932373046875, -1.262451171875, -1.137969970703125, -1.01348876953125, -0.889007568359375, -0.7645263671875, -0.640045166015625, -0.51556396484375, -0.391082763671875, -0.2666015625, -0.142120361328125, -0.01763916015625, 0.106842041015625, 0.2313232421875, 0.355804443359375, 0.48028564453125, 0.604766845703125, 0.729248046875, 0.853729248046875, 0.97821044921875, 1.102691650390625, 1.2271728515625, 1.351654052734375, 1.47613525390625, 1.600616455078125, 1.72509765625, 1.849578857421875, 1.97406005859375, 2.098541259765625, 2.2230224609375, 2.347503662109375, 2.47198486328125, 2.596466064453125, 2.720947265625, 2.845428466796875, 2.96990966796875, 3.094390869140625, 3.2188720703125, 3.343353271484375, 3.46783447265625, 3.592315673828125, 3.716796875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 7.0, 8.0, 9.0, 4.0, 15.0, 19.0, 25.0, 43.0, 54.0, 96.0, 158.0, 212.0, 314.0, 434.0, 587.0, 876.0, 1200.0, 1718.0, 2505.0, 3488.0, 4857.0, 6747.0, 9728.0, 13938.0, 21234.0, 40790.0, 1581931.0, 312206.0, 31902.0, 18773.0, 12668.0, 9019.0, 6398.0, 4426.0, 3209.0, 2242.0, 1603.0, 1100.0, 785.0, 544.0, 404.0, 286.0, 184.0, 113.0, 91.0, 70.0, 34.0, 26.0, 23.0, 11.0, 10.0, 4.0, 3.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.658203125, -2.572113037109375, -2.48602294921875, -2.399932861328125, -2.3138427734375, -2.227752685546875, -2.14166259765625, -2.055572509765625, -1.969482421875, -1.883392333984375, -1.79730224609375, -1.711212158203125, -1.6251220703125, -1.539031982421875, -1.45294189453125, -1.366851806640625, -1.28076171875, -1.194671630859375, -1.10858154296875, -1.022491455078125, -0.9364013671875, -0.850311279296875, -0.76422119140625, -0.678131103515625, -0.592041015625, -0.505950927734375, -0.41986083984375, -0.333770751953125, -0.2476806640625, -0.161590576171875, -0.07550048828125, 0.010589599609375, 0.0966796875, 0.182769775390625, 0.26885986328125, 0.354949951171875, 0.4410400390625, 0.527130126953125, 0.61322021484375, 0.699310302734375, 0.785400390625, 0.871490478515625, 0.95758056640625, 1.043670654296875, 1.1297607421875, 1.215850830078125, 1.30194091796875, 1.388031005859375, 1.47412109375, 1.560211181640625, 1.64630126953125, 1.732391357421875, 1.8184814453125, 1.904571533203125, 1.99066162109375, 2.076751708984375, 2.162841796875, 2.248931884765625, 2.33502197265625, 2.421112060546875, 2.5072021484375, 2.593292236328125, 2.67938232421875, 2.765472412109375, 2.8515625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 4.0, 8.0, 6.0, 5.0, 12.0, 16.0, 16.0, 21.0, 20.0, 21.0, 32.0, 34.0, 41.0, 38.0, 45.0, 35.0, 42.0, 42.0, 41.0, 45.0, 52.0, 50.0, 44.0, 54.0, 44.0, 43.0, 30.0, 23.0, 26.0, 12.0, 17.0, 9.0, 12.0, 13.0, 10.0, 9.0, 2.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.10430908203125, -0.10097789764404297, -0.09764671325683594, -0.0943155288696289, -0.09098434448242188, -0.08765316009521484, -0.08432197570800781, -0.08099079132080078, -0.07765960693359375, -0.07432842254638672, -0.07099723815917969, -0.06766605377197266, -0.06433486938476562, -0.061003684997558594, -0.05767250061035156, -0.05434131622314453, -0.0510101318359375, -0.04767894744873047, -0.04434776306152344, -0.041016578674316406, -0.037685394287109375, -0.034354209899902344, -0.031023025512695312, -0.02769184112548828, -0.02436065673828125, -0.02102947235107422, -0.017698287963867188, -0.014367103576660156, -0.011035919189453125, -0.007704734802246094, -0.0043735504150390625, -0.0010423660278320312, 0.002288818359375, 0.005620002746582031, 0.008951187133789062, 0.012282371520996094, 0.015613555908203125, 0.018944740295410156, 0.022275924682617188, 0.02560710906982422, 0.02893829345703125, 0.03226947784423828, 0.03560066223144531, 0.038931846618652344, 0.042263031005859375, 0.045594215393066406, 0.04892539978027344, 0.05225658416748047, 0.0555877685546875, 0.05891895294189453, 0.06225013732910156, 0.0655813217163086, 0.06891250610351562, 0.07224369049072266, 0.07557487487792969, 0.07890605926513672, 0.08223724365234375, 0.08556842803955078, 0.08889961242675781, 0.09223079681396484, 0.09556198120117188, 0.0988931655883789, 0.10222434997558594, 0.10555553436279297, 0.10888671875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 5.0, 5.0, 7.0, 16.0, 7.0, 12.0, 13.0, 20.0, 19.0, 27.0, 35.0, 48.0, 71.0, 111.0, 155.0, 277.0, 592.0, 2043.0, 221472.0, 815696.0, 6211.0, 741.0, 379.0, 190.0, 104.0, 55.0, 53.0, 39.0, 31.0, 26.0, 19.0, 14.0, 10.0, 4.0, 11.0, 9.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.244140625, -2.176483154296875, -2.10882568359375, -2.041168212890625, -1.9735107421875, -1.905853271484375, -1.83819580078125, -1.770538330078125, -1.702880859375, -1.635223388671875, -1.56756591796875, -1.499908447265625, -1.4322509765625, -1.364593505859375, -1.29693603515625, -1.229278564453125, -1.16162109375, -1.093963623046875, -1.02630615234375, -0.958648681640625, -0.8909912109375, -0.823333740234375, -0.75567626953125, -0.688018798828125, -0.620361328125, -0.552703857421875, -0.48504638671875, -0.417388916015625, -0.3497314453125, -0.282073974609375, -0.21441650390625, -0.146759033203125, -0.0791015625, -0.011444091796875, 0.05621337890625, 0.123870849609375, 0.1915283203125, 0.259185791015625, 0.32684326171875, 0.394500732421875, 0.462158203125, 0.529815673828125, 0.59747314453125, 0.665130615234375, 0.7327880859375, 0.800445556640625, 0.86810302734375, 0.935760498046875, 1.00341796875, 1.071075439453125, 1.13873291015625, 1.206390380859375, 1.2740478515625, 1.341705322265625, 1.40936279296875, 1.477020263671875, 1.544677734375, 1.612335205078125, 1.67999267578125, 1.747650146484375, 1.8153076171875, 1.882965087890625, 1.95062255859375, 2.018280029296875, 2.0859375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 14.0, 80.0, 486.0, 373.0, 51.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4483866691589355, -4.339649200439453, -4.230912208557129, -4.1221747398376465, -4.013437271118164, -3.90470027923584, -3.7959628105163574, -3.687225580215454, -3.578488349914551, -3.4697511196136475, -3.361013650894165, -3.2522764205932617, -3.1435391902923584, -3.034801959991455, -2.9260644912719727, -2.8173272609710693, -2.708589792251587, -2.5998525619506836, -2.491115093231201, -2.382377862930298, -2.2736406326293945, -2.164903163909912, -2.056165933609009, -1.9474287033081055, -1.8386913537979126, -1.7299540042877197, -1.6212167739868164, -1.5124794244766235, -1.4037420749664307, -1.2950048446655273, -1.1862674951553345, -1.0775301456451416, -0.9687929153442383, -0.8600556254386902, -0.7513183355331421, -0.6425809860229492, -0.5338436961174011, -0.425106406211853, -0.31636905670166016, -0.20763176679611206, -0.09889447689056396, 0.009842827916145325, 0.11858013272285461, 0.2273174524307251, 0.3360547423362732, 0.4447920322418213, 0.5535293817520142, 0.6622666716575623, 0.7710039615631104, 0.8797412514686584, 0.9884785413742065, 1.0972158908843994, 1.2059531211853027, 1.3146904706954956, 1.4234278202056885, 1.5321650505065918, 1.6409024000167847, 1.7496397495269775, 1.8583769798278809, 1.9671143293380737, 2.0758516788482666, 2.18458890914917, 2.2933263778686523, 2.4020636081695557, 2.510800838470459]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 7.0, 19.0, 13.0, 22.0, 31.0, 39.0, 39.0, 55.0, 70.0, 59.0, 57.0, 74.0, 86.0, 70.0, 74.0, 54.0, 47.0, 44.0, 36.0, 28.0, 24.0, 21.0, 17.0, 6.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5316909551620483, -0.5025368928909302, -0.473382830619812, -0.44422876834869385, -0.4150747060775757, -0.3859206438064575, -0.35676658153533936, -0.3276125192642212, -0.298458456993103, -0.26930439472198486, -0.2401503324508667, -0.21099627017974854, -0.18184220790863037, -0.1526881456375122, -0.12353408336639404, -0.09438002109527588, -0.06522595882415771, -0.03607189655303955, -0.006917834281921387, 0.022236227989196777, 0.05139029026031494, 0.0805443525314331, 0.10969841480255127, 0.13885247707366943, 0.1680065393447876, 0.19716060161590576, 0.22631466388702393, 0.2554687261581421, 0.28462278842926025, 0.3137768507003784, 0.3429309129714966, 0.37208497524261475, 0.4012390375137329, 0.4303930997848511, 0.45954716205596924, 0.4887012243270874, 0.5178552865982056, 0.5470093488693237, 0.5761634111404419, 0.6053174734115601, 0.6344715356826782, 0.6636255979537964, 0.6927796602249146, 0.7219337224960327, 0.7510877847671509, 0.780241847038269, 0.8093959093093872, 0.8385499715805054, 0.8677040338516235, 0.8968580961227417, 0.9260121583938599, 0.955166220664978, 0.9843202829360962, 1.0134743452072144, 1.0426284074783325, 1.0717824697494507, 1.1009365320205688, 1.130090594291687, 1.1592446565628052, 1.1883987188339233, 1.2175527811050415, 1.2467068433761597, 1.2758609056472778, 1.305014967918396, 1.3341690301895142]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 13.0, 12.0, 11.0, 23.0, 11.0, 17.0, 22.0, 23.0, 31.0, 35.0, 39.0, 36.0, 37.0, 25.0, 50.0, 46.0, 49.0, 61.0, 48.0, 46.0, 53.0, 41.0, 43.0, 34.0, 34.0, 29.0, 19.0, 21.0, 13.0, 13.0, 12.0, 9.0, 16.0, 6.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.083984375, -2.960113525390625, -2.83624267578125, -2.712371826171875, -2.5885009765625, -2.464630126953125, -2.34075927734375, -2.216888427734375, -2.093017578125, -1.969146728515625, -1.84527587890625, -1.721405029296875, -1.5975341796875, -1.473663330078125, -1.34979248046875, -1.225921630859375, -1.10205078125, -0.978179931640625, -0.85430908203125, -0.730438232421875, -0.6065673828125, -0.482696533203125, -0.35882568359375, -0.234954833984375, -0.111083984375, 0.012786865234375, 0.13665771484375, 0.260528564453125, 0.3843994140625, 0.508270263671875, 0.63214111328125, 0.756011962890625, 0.8798828125, 1.003753662109375, 1.12762451171875, 1.251495361328125, 1.3753662109375, 1.499237060546875, 1.62310791015625, 1.746978759765625, 1.870849609375, 1.994720458984375, 2.11859130859375, 2.242462158203125, 2.3663330078125, 2.490203857421875, 2.61407470703125, 2.737945556640625, 2.86181640625, 2.985687255859375, 3.10955810546875, 3.233428955078125, 3.3572998046875, 3.481170654296875, 3.60504150390625, 3.728912353515625, 3.852783203125, 3.976654052734375, 4.10052490234375, 4.224395751953125, 4.3482666015625, 4.472137451171875, 4.59600830078125, 4.719879150390625, 4.84375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 9.0, 7.0, 11.0, 19.0, 40.0, 70.0, 99.0, 146.0, 291.0, 506.0, 865.0, 1592.0, 2982.0, 5829.0, 10812.0, 20535.0, 40799.0, 80548.0, 159995.0, 316741.0, 201008.0, 100387.0, 50780.0, 25897.0, 13433.0, 7002.0, 3726.0, 1974.0, 1029.0, 618.0, 290.0, 193.0, 107.0, 79.0, 40.0, 25.0, 17.0, 20.0, 7.0, 11.0, 7.0, 6.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.697265625, -3.576690673828125, -3.45611572265625, -3.335540771484375, -3.2149658203125, -3.094390869140625, -2.97381591796875, -2.853240966796875, -2.732666015625, -2.612091064453125, -2.49151611328125, -2.370941162109375, -2.2503662109375, -2.129791259765625, -2.00921630859375, -1.888641357421875, -1.76806640625, -1.647491455078125, -1.52691650390625, -1.406341552734375, -1.2857666015625, -1.165191650390625, -1.04461669921875, -0.924041748046875, -0.803466796875, -0.682891845703125, -0.56231689453125, -0.441741943359375, -0.3211669921875, -0.200592041015625, -0.08001708984375, 0.040557861328125, 0.1611328125, 0.281707763671875, 0.40228271484375, 0.522857666015625, 0.6434326171875, 0.764007568359375, 0.88458251953125, 1.005157470703125, 1.125732421875, 1.246307373046875, 1.36688232421875, 1.487457275390625, 1.6080322265625, 1.728607177734375, 1.84918212890625, 1.969757080078125, 2.09033203125, 2.210906982421875, 2.33148193359375, 2.452056884765625, 2.5726318359375, 2.693206787109375, 2.81378173828125, 2.934356689453125, 3.054931640625, 3.175506591796875, 3.29608154296875, 3.416656494140625, 3.5372314453125, 3.657806396484375, 3.77838134765625, 3.898956298828125, 4.01953125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 1.0, 5.0, 0.0, 5.0, 2.0, 8.0, 6.0, 6.0, 13.0, 9.0, 13.0, 13.0, 20.0, 21.0, 31.0, 25.0, 33.0, 44.0, 51.0, 41.0, 58.0, 75.0, 122.0, 238.0, 1448.0, 168.0, 118.0, 72.0, 65.0, 48.0, 24.0, 47.0, 36.0, 22.0, 26.0, 16.0, 15.0, 19.0, 21.0, 5.0, 10.0, 6.0, 14.0, 6.0, 7.0, 2.0, 7.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 2.0], "bins": [-12.453125, -12.0904541015625, -11.727783203125, -11.3651123046875, -11.00244140625, -10.6397705078125, -10.277099609375, -9.9144287109375, -9.5517578125, -9.1890869140625, -8.826416015625, -8.4637451171875, -8.10107421875, -7.7384033203125, -7.375732421875, -7.0130615234375, -6.650390625, -6.2877197265625, -5.925048828125, -5.5623779296875, -5.19970703125, -4.8370361328125, -4.474365234375, -4.1116943359375, -3.7490234375, -3.3863525390625, -3.023681640625, -2.6610107421875, -2.29833984375, -1.9356689453125, -1.572998046875, -1.2103271484375, -0.84765625, -0.4849853515625, -0.122314453125, 0.2403564453125, 0.60302734375, 0.9656982421875, 1.328369140625, 1.6910400390625, 2.0537109375, 2.4163818359375, 2.779052734375, 3.1417236328125, 3.50439453125, 3.8670654296875, 4.229736328125, 4.5924072265625, 4.955078125, 5.3177490234375, 5.680419921875, 6.0430908203125, 6.40576171875, 6.7684326171875, 7.131103515625, 7.4937744140625, 7.8564453125, 8.2191162109375, 8.581787109375, 8.9444580078125, 9.30712890625, 9.6697998046875, 10.032470703125, 10.3951416015625, 10.7578125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 3.0, 8.0, 23.0, 31.0, 35.0, 54.0, 86.0, 121.0, 223.0, 438.0, 1251.0, 35147.0, 3097663.0, 8825.0, 913.0, 385.0, 179.0, 111.0, 68.0, 38.0, 34.0, 17.0, 19.0, 8.0, 5.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-51.3125, -49.775390625, -48.23828125, -46.701171875, -45.1640625, -43.626953125, -42.08984375, -40.552734375, -39.015625, -37.478515625, -35.94140625, -34.404296875, -32.8671875, -31.330078125, -29.79296875, -28.255859375, -26.71875, -25.181640625, -23.64453125, -22.107421875, -20.5703125, -19.033203125, -17.49609375, -15.958984375, -14.421875, -12.884765625, -11.34765625, -9.810546875, -8.2734375, -6.736328125, -5.19921875, -3.662109375, -2.125, -0.587890625, 0.94921875, 2.486328125, 4.0234375, 5.560546875, 7.09765625, 8.634765625, 10.171875, 11.708984375, 13.24609375, 14.783203125, 16.3203125, 17.857421875, 19.39453125, 20.931640625, 22.46875, 24.005859375, 25.54296875, 27.080078125, 28.6171875, 30.154296875, 31.69140625, 33.228515625, 34.765625, 36.302734375, 37.83984375, 39.376953125, 40.9140625, 42.451171875, 43.98828125, 45.525390625, 47.0625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [2.0, 154.0, 864.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.065074920654297, -15.64610767364502, -2.227140426635742, 11.191825866699219, 24.610794067382812, 38.02975845336914, 51.448726654052734, 64.86769104003906, 78.28666687011719, 91.70563507080078, 105.12460327148438, 118.54356384277344, 131.96253967285156, 145.38150024414062, 158.80047607421875, 172.2194366455078, 185.63839721679688, 199.05735778808594, 212.47633361816406, 225.89529418945312, 239.31427001953125, 252.7332305908203, 266.1521911621094, 279.5711669921875, 292.9901428222656, 306.40911865234375, 319.82806396484375, 333.2470397949219, 346.666015625, 360.0849609375, 373.5039367675781, 386.92291259765625, 400.3418884277344, 413.7608642578125, 427.1798095703125, 440.5987854003906, 454.01776123046875, 467.43670654296875, 480.8556823730469, 494.274658203125, 507.6936340332031, 521.1126098632812, 534.5315551757812, 547.9505615234375, 561.3695068359375, 574.7884521484375, 588.2074584960938, 601.6264038085938, 615.0453491210938, 628.4642944335938, 641.88330078125, 655.30224609375, 668.72119140625, 682.1401977539062, 695.5591430664062, 708.9781494140625, 722.3970947265625, 735.8160400390625, 749.2350463867188, 762.6539916992188, 776.0729370117188, 789.491943359375, 802.910888671875, 816.329833984375, 829.7488403320312]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 7.0, 7.0, 7.0, 10.0, 16.0, 13.0, 16.0, 20.0, 23.0, 31.0, 40.0, 30.0, 42.0, 28.0, 30.0, 33.0, 30.0, 58.0, 41.0, 35.0, 40.0, 40.0, 40.0, 44.0, 36.0, 30.0, 36.0, 34.0, 20.0, 25.0, 24.0, 18.0, 19.0, 15.0, 13.0, 14.0, 10.0, 4.0, 3.0, 3.0, 4.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.10143280029297, -33.0416259765625, -31.9818172454834, -30.922008514404297, -29.862201690673828, -28.802392959594727, -27.742584228515625, -26.682777404785156, -25.622970581054688, -24.563161849975586, -23.503355026245117, -22.443546295166016, -21.383739471435547, -20.323930740356445, -19.264122009277344, -18.204315185546875, -17.144506454467773, -16.084697723388672, -15.024890899658203, -13.965082168579102, -12.905275344848633, -11.845466613769531, -10.785658836364746, -9.725851058959961, -8.666043281555176, -7.606235504150391, -6.5464277267456055, -5.486619472503662, -4.426811695098877, -3.367003917694092, -2.3071956634521484, -1.2473878860473633, -0.18758010864257812, 0.8722277879714966, 1.9320356845855713, 2.9918437004089355, 4.051651477813721, 5.111459255218506, 6.171267509460449, 7.231075286865234, 8.29088306427002, 9.350690841674805, 10.41049861907959, 11.470306396484375, 12.530115127563477, 13.589921951293945, 14.649730682373047, 15.709538459777832, 16.769346237182617, 17.82915496826172, 18.888961791992188, 19.94877052307129, 21.008577346801758, 22.06838607788086, 23.128192901611328, 24.18800163269043, 25.24781036376953, 26.307619094848633, 27.3674259185791, 28.427234649658203, 29.487041473388672, 30.546850204467773, 31.606658935546875, 32.666465759277344, 33.72627258300781]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 6.0, 8.0, 9.0, 8.0, 13.0, 18.0, 24.0, 23.0, 29.0, 37.0, 40.0, 48.0, 51.0, 52.0, 68.0, 48.0, 56.0, 44.0, 66.0, 60.0, 43.0, 57.0, 46.0, 43.0, 23.0, 13.0, 9.0, 21.0, 11.0, 10.0, 6.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.87109375, -3.70477294921875, -3.5384521484375, -3.37213134765625, -3.205810546875, -3.03948974609375, -2.8731689453125, -2.70684814453125, -2.54052734375, -2.37420654296875, -2.2078857421875, -2.04156494140625, -1.875244140625, -1.70892333984375, -1.5426025390625, -1.37628173828125, -1.2099609375, -1.04364013671875, -0.8773193359375, -0.71099853515625, -0.544677734375, -0.37835693359375, -0.2120361328125, -0.04571533203125, 0.12060546875, 0.28692626953125, 0.4532470703125, 0.61956787109375, 0.785888671875, 0.95220947265625, 1.1185302734375, 1.28485107421875, 1.451171875, 1.61749267578125, 1.7838134765625, 1.95013427734375, 2.116455078125, 2.28277587890625, 2.4490966796875, 2.61541748046875, 2.78173828125, 2.94805908203125, 3.1143798828125, 3.28070068359375, 3.447021484375, 3.61334228515625, 3.7796630859375, 3.94598388671875, 4.1123046875, 4.27862548828125, 4.4449462890625, 4.61126708984375, 4.777587890625, 4.94390869140625, 5.1102294921875, 5.27655029296875, 5.44287109375, 5.60919189453125, 5.7755126953125, 5.94183349609375, 6.108154296875, 6.27447509765625, 6.4407958984375, 6.60711669921875, 6.7734375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 3.0, 5.0, 7.0, 16.0, 24.0, 26.0, 34.0, 59.0, 88.0, 120.0, 202.0, 309.0, 615.0, 1427.0, 3953.0, 12001.0, 38305.0, 127898.0, 450614.0, 1295372.0, 1454471.0, 574569.0, 164831.0, 47165.0, 14281.0, 4617.0, 1622.0, 716.0, 332.0, 210.0, 121.0, 68.0, 54.0, 41.0, 33.0, 24.0, 15.0, 12.0, 10.0, 4.0, 5.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.96875, -4.80364990234375, -4.6385498046875, -4.47344970703125, -4.308349609375, -4.14324951171875, -3.9781494140625, -3.81304931640625, -3.64794921875, -3.48284912109375, -3.3177490234375, -3.15264892578125, -2.987548828125, -2.82244873046875, -2.6573486328125, -2.49224853515625, -2.3271484375, -2.16204833984375, -1.9969482421875, -1.83184814453125, -1.666748046875, -1.50164794921875, -1.3365478515625, -1.17144775390625, -1.00634765625, -0.84124755859375, -0.6761474609375, -0.51104736328125, -0.345947265625, -0.18084716796875, -0.0157470703125, 0.14935302734375, 0.314453125, 0.47955322265625, 0.6446533203125, 0.80975341796875, 0.974853515625, 1.13995361328125, 1.3050537109375, 1.47015380859375, 1.63525390625, 1.80035400390625, 1.9654541015625, 2.13055419921875, 2.295654296875, 2.46075439453125, 2.6258544921875, 2.79095458984375, 2.9560546875, 3.12115478515625, 3.2862548828125, 3.45135498046875, 3.616455078125, 3.78155517578125, 3.9466552734375, 4.11175537109375, 4.27685546875, 4.44195556640625, 4.6070556640625, 4.77215576171875, 4.937255859375, 5.10235595703125, 5.2674560546875, 5.43255615234375, 5.59765625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 7.0, 8.0, 4.0, 10.0, 14.0, 14.0, 20.0, 24.0, 37.0, 37.0, 43.0, 53.0, 90.0, 101.0, 125.0, 143.0, 237.0, 294.0, 305.0, 321.0, 343.0, 311.0, 300.0, 231.0, 221.0, 165.0, 127.0, 96.0, 79.0, 61.0, 48.0, 44.0, 42.0, 28.0, 20.0, 7.0, 10.0, 10.0, 7.0, 11.0, 4.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-5.74609375, -5.56915283203125, -5.3922119140625, -5.21527099609375, -5.038330078125, -4.86138916015625, -4.6844482421875, -4.50750732421875, -4.33056640625, -4.15362548828125, -3.9766845703125, -3.79974365234375, -3.622802734375, -3.44586181640625, -3.2689208984375, -3.09197998046875, -2.9150390625, -2.73809814453125, -2.5611572265625, -2.38421630859375, -2.207275390625, -2.03033447265625, -1.8533935546875, -1.67645263671875, -1.49951171875, -1.32257080078125, -1.1456298828125, -0.96868896484375, -0.791748046875, -0.61480712890625, -0.4378662109375, -0.26092529296875, -0.083984375, 0.09295654296875, 0.2698974609375, 0.44683837890625, 0.623779296875, 0.80072021484375, 0.9776611328125, 1.15460205078125, 1.33154296875, 1.50848388671875, 1.6854248046875, 1.86236572265625, 2.039306640625, 2.21624755859375, 2.3931884765625, 2.57012939453125, 2.7470703125, 2.92401123046875, 3.1009521484375, 3.27789306640625, 3.454833984375, 3.63177490234375, 3.8087158203125, 3.98565673828125, 4.16259765625, 4.33953857421875, 4.5164794921875, 4.69342041015625, 4.870361328125, 5.04730224609375, 5.2242431640625, 5.40118408203125, 5.578125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 3.0, 7.0, 14.0, 9.0, 7.0, 15.0, 21.0, 21.0, 39.0, 47.0, 49.0, 69.0, 68.0, 105.0, 137.0, 176.0, 264.0, 477.0, 1470.0, 14477.0, 264978.0, 3051938.0, 813787.0, 41225.0, 2999.0, 644.0, 298.0, 228.0, 170.0, 127.0, 88.0, 69.0, 47.0, 49.0, 31.0, 24.0, 22.0, 19.0, 13.0, 8.0, 11.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0], "bins": [-16.03125, -15.5087890625, -14.986328125, -14.4638671875, -13.94140625, -13.4189453125, -12.896484375, -12.3740234375, -11.8515625, -11.3291015625, -10.806640625, -10.2841796875, -9.76171875, -9.2392578125, -8.716796875, -8.1943359375, -7.671875, -7.1494140625, -6.626953125, -6.1044921875, -5.58203125, -5.0595703125, -4.537109375, -4.0146484375, -3.4921875, -2.9697265625, -2.447265625, -1.9248046875, -1.40234375, -0.8798828125, -0.357421875, 0.1650390625, 0.6875, 1.2099609375, 1.732421875, 2.2548828125, 2.77734375, 3.2998046875, 3.822265625, 4.3447265625, 4.8671875, 5.3896484375, 5.912109375, 6.4345703125, 6.95703125, 7.4794921875, 8.001953125, 8.5244140625, 9.046875, 9.5693359375, 10.091796875, 10.6142578125, 11.13671875, 11.6591796875, 12.181640625, 12.7041015625, 13.2265625, 13.7490234375, 14.271484375, 14.7939453125, 15.31640625, 15.8388671875, 16.361328125, 16.8837890625, 17.40625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 16.0, 72.0, 275.0, 355.0, 239.0, 51.0, 9.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.02243041992188, -111.11607360839844, -107.209716796875, -103.30335998535156, -99.3969955444336, -95.49063873291016, -91.58428192138672, -87.67792510986328, -83.77156066894531, -79.86520385742188, -75.95884704589844, -72.052490234375, -68.14612579345703, -64.2397689819336, -60.333412170410156, -56.42705535888672, -52.52069854736328, -48.614341735839844, -44.70798110961914, -40.8016242980957, -36.895263671875, -32.98890686035156, -29.082550048828125, -25.176191329956055, -21.269832611083984, -17.363473892211914, -13.45711612701416, -9.550758361816406, -5.644399642944336, -1.7380409240722656, 2.168315887451172, 6.074674606323242, 9.981033325195312, 13.887392044067383, 17.793750762939453, 21.70010757446289, 25.60646629333496, 29.51282501220703, 33.41918182373047, 37.325538635253906, 41.23189926147461, 45.13825607299805, 49.04461669921875, 52.95097351074219, 56.857330322265625, 60.76369094848633, 64.6700439453125, 68.57640838623047, 72.4827651977539, 76.38912200927734, 80.29547882080078, 84.20184326171875, 88.10820007324219, 92.01455688476562, 95.92091369628906, 99.8272705078125, 103.73362731933594, 107.63998413085938, 111.54634094238281, 115.45269775390625, 119.35906219482422, 123.26541900634766, 127.1717758178711, 131.07814025878906, 134.9844970703125]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 10.0, 8.0, 12.0, 13.0, 18.0, 20.0, 17.0, 31.0, 22.0, 31.0, 33.0, 38.0, 44.0, 49.0, 40.0, 39.0, 50.0, 46.0, 38.0, 30.0, 37.0, 48.0, 29.0, 44.0, 34.0, 31.0, 24.0, 18.0, 23.0, 30.0, 15.0, 13.0, 19.0, 6.0, 8.0, 5.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.099918365478516, -22.330669403076172, -21.561420440673828, -20.792171478271484, -20.022924423217773, -19.25367546081543, -18.484426498413086, -17.715177536010742, -16.94593048095703, -16.176681518554688, -15.40743350982666, -14.638184547424316, -13.868936538696289, -13.099687576293945, -12.330438613891602, -11.561189651489258, -10.791940689086914, -10.02269172668457, -9.253443717956543, -8.4841947555542, -7.714946269989014, -6.945697784423828, -6.176448822021484, -5.407200336456299, -4.637951850891113, -3.8687033653259277, -3.099454641342163, -2.3302059173583984, -1.560957431793213, -0.7917089462280273, -0.022459983825683594, 0.746788501739502, 1.5160369873046875, 2.285285472869873, 3.0545341968536377, 3.8237829208374023, 4.593031406402588, 5.362279891967773, 6.131528854370117, 6.900777339935303, 7.670025825500488, 8.439274787902832, 9.20852279663086, 9.977771759033203, 10.747020721435547, 11.516268730163574, 12.285517692565918, 13.054765701293945, 13.824014663696289, 14.593263626098633, 15.36251163482666, 16.131759643554688, 16.90100860595703, 17.670257568359375, 18.43950653076172, 19.208755493164062, 19.978004455566406, 20.74725341796875, 21.516502380371094, 22.285751342773438, 23.05499839782715, 23.824247360229492, 24.593496322631836, 25.36274528503418, 26.13199234008789]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 8.0, 4.0, 3.0, 9.0, 14.0, 8.0, 10.0, 23.0, 16.0, 16.0, 19.0, 23.0, 21.0, 25.0, 21.0, 41.0, 37.0, 40.0, 38.0, 30.0, 28.0, 41.0, 55.0, 39.0, 41.0, 41.0, 39.0, 33.0, 32.0, 49.0, 35.0, 29.0, 28.0, 20.0, 21.0, 18.0, 7.0, 6.0, 5.0, 4.0, 9.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.2265625, -3.1153564453125, -3.004150390625, -2.8929443359375, -2.78173828125, -2.6705322265625, -2.559326171875, -2.4481201171875, -2.3369140625, -2.2257080078125, -2.114501953125, -2.0032958984375, -1.89208984375, -1.7808837890625, -1.669677734375, -1.5584716796875, -1.447265625, -1.3360595703125, -1.224853515625, -1.1136474609375, -1.00244140625, -0.8912353515625, -0.780029296875, -0.6688232421875, -0.5576171875, -0.4464111328125, -0.335205078125, -0.2239990234375, -0.11279296875, -0.0015869140625, 0.109619140625, 0.2208251953125, 0.33203125, 0.4432373046875, 0.554443359375, 0.6656494140625, 0.77685546875, 0.8880615234375, 0.999267578125, 1.1104736328125, 1.2216796875, 1.3328857421875, 1.444091796875, 1.5552978515625, 1.66650390625, 1.7777099609375, 1.888916015625, 2.0001220703125, 2.111328125, 2.2225341796875, 2.333740234375, 2.4449462890625, 2.55615234375, 2.6673583984375, 2.778564453125, 2.8897705078125, 3.0009765625, 3.1121826171875, 3.223388671875, 3.3345947265625, 3.44580078125, 3.5570068359375, 3.668212890625, 3.7794189453125, 3.890625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 12.0, 12.0, 17.0, 25.0, 46.0, 42.0, 72.0, 115.0, 145.0, 225.0, 301.0, 483.0, 714.0, 1216.0, 2205.0, 4041.0, 7379.0, 13285.0, 23688.0, 40820.0, 67175.0, 102109.0, 140026.0, 163252.0, 154452.0, 120707.0, 83175.0, 51871.0, 30839.0, 17679.0, 9768.0, 5423.0, 2884.0, 1617.0, 976.0, 580.0, 358.0, 246.0, 176.0, 106.0, 82.0, 56.0, 60.0, 25.0, 28.0, 15.0, 12.0, 8.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.7705078125, -1.7147216796875, -1.658935546875, -1.6031494140625, -1.54736328125, -1.4915771484375, -1.435791015625, -1.3800048828125, -1.32421875, -1.2684326171875, -1.212646484375, -1.1568603515625, -1.10107421875, -1.0452880859375, -0.989501953125, -0.9337158203125, -0.8779296875, -0.8221435546875, -0.766357421875, -0.7105712890625, -0.65478515625, -0.5989990234375, -0.543212890625, -0.4874267578125, -0.431640625, -0.3758544921875, -0.320068359375, -0.2642822265625, -0.20849609375, -0.1527099609375, -0.096923828125, -0.0411376953125, 0.0146484375, 0.0704345703125, 0.126220703125, 0.1820068359375, 0.23779296875, 0.2935791015625, 0.349365234375, 0.4051513671875, 0.4609375, 0.5167236328125, 0.572509765625, 0.6282958984375, 0.68408203125, 0.7398681640625, 0.795654296875, 0.8514404296875, 0.9072265625, 0.9630126953125, 1.018798828125, 1.0745849609375, 1.13037109375, 1.1861572265625, 1.241943359375, 1.2977294921875, 1.353515625, 1.4093017578125, 1.465087890625, 1.5208740234375, 1.57666015625, 1.6324462890625, 1.688232421875, 1.7440185546875, 1.7998046875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 7.0, 4.0, 11.0, 10.0, 10.0, 8.0, 12.0, 17.0, 20.0, 20.0, 21.0, 24.0, 24.0, 24.0, 23.0, 33.0, 26.0, 37.0, 31.0, 38.0, 37.0, 31.0, 1061.0, 41.0, 31.0, 39.0, 30.0, 36.0, 30.0, 23.0, 36.0, 17.0, 23.0, 39.0, 16.0, 14.0, 9.0, 13.0, 22.0, 4.0, 12.0, 13.0, 10.0, 5.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-2.83203125, -2.7430419921875, -2.654052734375, -2.5650634765625, -2.47607421875, -2.3870849609375, -2.298095703125, -2.2091064453125, -2.1201171875, -2.0311279296875, -1.942138671875, -1.8531494140625, -1.76416015625, -1.6751708984375, -1.586181640625, -1.4971923828125, -1.408203125, -1.3192138671875, -1.230224609375, -1.1412353515625, -1.05224609375, -0.9632568359375, -0.874267578125, -0.7852783203125, -0.6962890625, -0.6072998046875, -0.518310546875, -0.4293212890625, -0.34033203125, -0.2513427734375, -0.162353515625, -0.0733642578125, 0.015625, 0.1046142578125, 0.193603515625, 0.2825927734375, 0.37158203125, 0.4605712890625, 0.549560546875, 0.6385498046875, 0.7275390625, 0.8165283203125, 0.905517578125, 0.9945068359375, 1.08349609375, 1.1724853515625, 1.261474609375, 1.3504638671875, 1.439453125, 1.5284423828125, 1.617431640625, 1.7064208984375, 1.79541015625, 1.8843994140625, 1.973388671875, 2.0623779296875, 2.1513671875, 2.2403564453125, 2.329345703125, 2.4183349609375, 2.50732421875, 2.5963134765625, 2.685302734375, 2.7742919921875, 2.86328125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 6.0, 3.0, 14.0, 18.0, 28.0, 41.0, 42.0, 75.0, 136.0, 217.0, 293.0, 487.0, 770.0, 1305.0, 2111.0, 3340.0, 5523.0, 9030.0, 14947.0, 26554.0, 71126.0, 1829822.0, 67428.0, 25975.0, 14828.0, 8744.0, 5467.0, 3312.0, 2080.0, 1231.0, 777.0, 498.0, 344.0, 213.0, 139.0, 79.0, 48.0, 29.0, 21.0, 11.0, 14.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0], "bins": [-4.1171875, -4.007354736328125, -3.89752197265625, -3.787689208984375, -3.6778564453125, -3.568023681640625, -3.45819091796875, -3.348358154296875, -3.238525390625, -3.128692626953125, -3.01885986328125, -2.909027099609375, -2.7991943359375, -2.689361572265625, -2.57952880859375, -2.469696044921875, -2.35986328125, -2.250030517578125, -2.14019775390625, -2.030364990234375, -1.9205322265625, -1.810699462890625, -1.70086669921875, -1.591033935546875, -1.481201171875, -1.371368408203125, -1.26153564453125, -1.151702880859375, -1.0418701171875, -0.932037353515625, -0.82220458984375, -0.712371826171875, -0.6025390625, -0.492706298828125, -0.38287353515625, -0.273040771484375, -0.1632080078125, -0.053375244140625, 0.05645751953125, 0.166290283203125, 0.276123046875, 0.385955810546875, 0.49578857421875, 0.605621337890625, 0.7154541015625, 0.825286865234375, 0.93511962890625, 1.044952392578125, 1.15478515625, 1.264617919921875, 1.37445068359375, 1.484283447265625, 1.5941162109375, 1.703948974609375, 1.81378173828125, 1.923614501953125, 2.033447265625, 2.143280029296875, 2.25311279296875, 2.362945556640625, 2.4727783203125, 2.582611083984375, 2.69244384765625, 2.802276611328125, 2.912109375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 12.0, 12.0, 42.0, 152.0, 295.0, 256.0, 112.0, 60.0, 11.0, 11.0, 5.0, 5.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.59423828125, -0.5743942260742188, -0.5545501708984375, -0.5347061157226562, -0.514862060546875, -0.49501800537109375, -0.4751739501953125, -0.45532989501953125, -0.43548583984375, -0.41564178466796875, -0.3957977294921875, -0.37595367431640625, -0.356109619140625, -0.33626556396484375, -0.3164215087890625, -0.29657745361328125, -0.2767333984375, -0.25688934326171875, -0.2370452880859375, -0.21720123291015625, -0.197357177734375, -0.17751312255859375, -0.1576690673828125, -0.13782501220703125, -0.11798095703125, -0.09813690185546875, -0.0782928466796875, -0.05844879150390625, -0.038604736328125, -0.01876068115234375, 0.0010833740234375, 0.02092742919921875, 0.040771484375, 0.06061553955078125, 0.0804595947265625, 0.10030364990234375, 0.120147705078125, 0.13999176025390625, 0.1598358154296875, 0.17967987060546875, 0.19952392578125, 0.21936798095703125, 0.2392120361328125, 0.25905609130859375, 0.278900146484375, 0.29874420166015625, 0.3185882568359375, 0.33843231201171875, 0.3582763671875, 0.37812042236328125, 0.3979644775390625, 0.41780853271484375, 0.437652587890625, 0.45749664306640625, 0.4773406982421875, 0.49718475341796875, 0.51702880859375, 0.5368728637695312, 0.5567169189453125, 0.5765609741210938, 0.596405029296875, 0.6162490844726562, 0.6360931396484375, 0.6559371948242188, 0.67578125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 3.0, 14.0, 9.0, 22.0, 30.0, 45.0, 134.0, 718.0, 120288.0, 926012.0, 974.0, 142.0, 49.0, 35.0, 12.0, 14.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.7890625, -12.4134521484375, -12.037841796875, -11.6622314453125, -11.28662109375, -10.9110107421875, -10.535400390625, -10.1597900390625, -9.7841796875, -9.4085693359375, -9.032958984375, -8.6573486328125, -8.28173828125, -7.9061279296875, -7.530517578125, -7.1549072265625, -6.779296875, -6.4036865234375, -6.028076171875, -5.6524658203125, -5.27685546875, -4.9012451171875, -4.525634765625, -4.1500244140625, -3.7744140625, -3.3988037109375, -3.023193359375, -2.6475830078125, -2.27197265625, -1.8963623046875, -1.520751953125, -1.1451416015625, -0.76953125, -0.3939208984375, -0.018310546875, 0.3572998046875, 0.73291015625, 1.1085205078125, 1.484130859375, 1.8597412109375, 2.2353515625, 2.6109619140625, 2.986572265625, 3.3621826171875, 3.73779296875, 4.1134033203125, 4.489013671875, 4.8646240234375, 5.240234375, 5.6158447265625, 5.991455078125, 6.3670654296875, 6.74267578125, 7.1182861328125, 7.493896484375, 7.8695068359375, 8.2451171875, 8.6207275390625, 8.996337890625, 9.3719482421875, 9.74755859375, 10.1231689453125, 10.498779296875, 10.8743896484375, 11.25]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 10.0, 87.0, 560.0, 311.0, 34.0, 10.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.219789981842041, -6.063536643981934, -5.907282829284668, -5.7510294914245605, -5.594776153564453, -5.4385223388671875, -5.28226900100708, -5.126015663146973, -4.969761848449707, -4.8135085105896, -4.657254695892334, -4.501001358032227, -4.344747543334961, -4.1884942054748535, -4.032240867614746, -3.8759872913360596, -3.719733715057373, -3.5634801387786865, -3.4072265625, -3.2509732246398926, -3.094719648361206, -2.9384660720825195, -2.782212734222412, -2.6259591579437256, -2.469705581665039, -2.3134520053863525, -2.157198429107666, -2.0009450912475586, -1.844691514968872, -1.6884379386901855, -1.5321844816207886, -1.3759310245513916, -1.2196776866912842, -1.0634241104125977, -0.9071706533432007, -0.7509171366691589, -0.5946636199951172, -0.43841010332107544, -0.2821565866470337, -0.12590312957763672, 0.030350446701049805, 0.18660396337509155, 0.3428574800491333, 0.49911099672317505, 0.6553645133972168, 0.8116180300712585, 0.9678715467453003, 1.1241250038146973, 1.2803785800933838, 1.4366321563720703, 1.5928856134414673, 1.7491390705108643, 1.9053926467895508, 2.0616462230682373, 2.217899799346924, 2.3741531372070312, 2.5304067134857178, 2.6866602897644043, 2.8429136276245117, 2.9991672039031982, 3.1554207801818848, 3.3116743564605713, 3.467927932739258, 3.6241812705993652, 3.7804348468780518]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 12.0, 14.0, 13.0, 23.0, 21.0, 26.0, 40.0, 36.0, 43.0, 47.0, 54.0, 60.0, 48.0, 51.0, 63.0, 50.0, 40.0, 56.0, 41.0, 42.0, 34.0, 36.0, 30.0, 28.0, 18.0, 18.0, 11.0, 6.0, 10.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7579973340034485, -0.7226315140724182, -0.6872656345367432, -0.6518998146057129, -0.6165339946746826, -0.5811681747436523, -0.5458023548126221, -0.510436475276947, -0.47507065534591675, -0.4397048354148865, -0.4043389856815338, -0.36897313594818115, -0.3336073160171509, -0.2982414960861206, -0.26287564635276794, -0.22750981152057648, -0.192143976688385, -0.15677814185619354, -0.12141230702400208, -0.08604647219181061, -0.05068063735961914, -0.015314802527427673, 0.020051032304763794, 0.05541686713695526, 0.09078270196914673, 0.1261485368013382, 0.16151437163352966, 0.19688020646572113, 0.2322460412979126, 0.26761186122894287, 0.30297771096229553, 0.3383435606956482, 0.37370944023132324, 0.4090752601623535, 0.4444411098957062, 0.47980695962905884, 0.5151727795600891, 0.5505385994911194, 0.5859044790267944, 0.6212702989578247, 0.656636118888855, 0.6920019388198853, 0.7273677587509155, 0.7627336382865906, 0.7980994582176208, 0.8334652781486511, 0.8688311576843262, 0.9041969776153564, 0.9395627975463867, 0.974928617477417, 1.0102944374084473, 1.0456602573394775, 1.0810260772705078, 1.1163920164108276, 1.151757836341858, 1.1871236562728882, 1.2224894762039185, 1.2578552961349487, 1.293221116065979, 1.3285869359970093, 1.363952875137329, 1.3993186950683594, 1.4346845149993896, 1.47005033493042, 1.5054161548614502]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 6.0, 13.0, 14.0, 8.0, 15.0, 8.0, 21.0, 24.0, 16.0, 27.0, 20.0, 27.0, 27.0, 29.0, 31.0, 47.0, 29.0, 43.0, 38.0, 39.0, 46.0, 44.0, 47.0, 39.0, 35.0, 38.0, 31.0, 27.0, 25.0, 36.0, 31.0, 25.0, 21.0, 10.0, 14.0, 6.0, 7.0, 2.0, 7.0, 7.0, 2.0, 5.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0], "bins": [-3.52734375, -3.41668701171875, -3.3060302734375, -3.19537353515625, -3.084716796875, -2.97406005859375, -2.8634033203125, -2.75274658203125, -2.64208984375, -2.53143310546875, -2.4207763671875, -2.31011962890625, -2.199462890625, -2.08880615234375, -1.9781494140625, -1.86749267578125, -1.7568359375, -1.64617919921875, -1.5355224609375, -1.42486572265625, -1.314208984375, -1.20355224609375, -1.0928955078125, -0.98223876953125, -0.87158203125, -0.76092529296875, -0.6502685546875, -0.53961181640625, -0.428955078125, -0.31829833984375, -0.2076416015625, -0.09698486328125, 0.013671875, 0.12432861328125, 0.2349853515625, 0.34564208984375, 0.456298828125, 0.56695556640625, 0.6776123046875, 0.78826904296875, 0.89892578125, 1.00958251953125, 1.1202392578125, 1.23089599609375, 1.341552734375, 1.45220947265625, 1.5628662109375, 1.67352294921875, 1.7841796875, 1.89483642578125, 2.0054931640625, 2.11614990234375, 2.226806640625, 2.33746337890625, 2.4481201171875, 2.55877685546875, 2.66943359375, 2.78009033203125, 2.8907470703125, 3.00140380859375, 3.112060546875, 3.22271728515625, 3.3333740234375, 3.44403076171875, 3.5546875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 12.0, 11.0, 28.0, 35.0, 58.0, 137.0, 242.0, 511.0, 994.0, 1990.0, 3927.0, 8097.0, 16856.0, 36579.0, 81622.0, 175537.0, 379947.0, 183986.0, 85609.0, 37823.0, 17872.0, 8365.0, 4092.0, 2094.0, 1083.0, 470.0, 249.0, 134.0, 76.0, 45.0, 17.0, 20.0, 14.0, 3.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.03515625, -4.8934326171875, -4.751708984375, -4.6099853515625, -4.46826171875, -4.3265380859375, -4.184814453125, -4.0430908203125, -3.9013671875, -3.7596435546875, -3.617919921875, -3.4761962890625, -3.33447265625, -3.1927490234375, -3.051025390625, -2.9093017578125, -2.767578125, -2.6258544921875, -2.484130859375, -2.3424072265625, -2.20068359375, -2.0589599609375, -1.917236328125, -1.7755126953125, -1.6337890625, -1.4920654296875, -1.350341796875, -1.2086181640625, -1.06689453125, -0.9251708984375, -0.783447265625, -0.6417236328125, -0.5, -0.3582763671875, -0.216552734375, -0.0748291015625, 0.06689453125, 0.2086181640625, 0.350341796875, 0.4920654296875, 0.6337890625, 0.7755126953125, 0.917236328125, 1.0589599609375, 1.20068359375, 1.3424072265625, 1.484130859375, 1.6258544921875, 1.767578125, 1.9093017578125, 2.051025390625, 2.1927490234375, 2.33447265625, 2.4761962890625, 2.617919921875, 2.7596435546875, 2.9013671875, 3.0430908203125, 3.184814453125, 3.3265380859375, 3.46826171875, 3.6099853515625, 3.751708984375, 3.8934326171875, 4.03515625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 5.0, 5.0, 11.0, 12.0, 13.0, 14.0, 11.0, 14.0, 16.0, 27.0, 30.0, 29.0, 34.0, 34.0, 44.0, 37.0, 47.0, 80.0, 123.0, 201.0, 1413.0, 280.0, 117.0, 62.0, 55.0, 41.0, 39.0, 37.0, 23.0, 23.0, 24.0, 24.0, 15.0, 10.0, 16.0, 15.0, 11.0, 6.0, 9.0, 6.0, 4.0, 7.0, 5.0, 5.0, 5.0, 4.0, 4.0, 0.0, 2.0, 1.0], "bins": [-12.7421875, -12.3746337890625, -12.007080078125, -11.6395263671875, -11.27197265625, -10.9044189453125, -10.536865234375, -10.1693115234375, -9.8017578125, -9.4342041015625, -9.066650390625, -8.6990966796875, -8.33154296875, -7.9639892578125, -7.596435546875, -7.2288818359375, -6.861328125, -6.4937744140625, -6.126220703125, -5.7586669921875, -5.39111328125, -5.0235595703125, -4.656005859375, -4.2884521484375, -3.9208984375, -3.5533447265625, -3.185791015625, -2.8182373046875, -2.45068359375, -2.0831298828125, -1.715576171875, -1.3480224609375, -0.98046875, -0.6129150390625, -0.245361328125, 0.1221923828125, 0.48974609375, 0.8572998046875, 1.224853515625, 1.5924072265625, 1.9599609375, 2.3275146484375, 2.695068359375, 3.0626220703125, 3.43017578125, 3.7977294921875, 4.165283203125, 4.5328369140625, 4.900390625, 5.2679443359375, 5.635498046875, 6.0030517578125, 6.37060546875, 6.7381591796875, 7.105712890625, 7.4732666015625, 7.8408203125, 8.2083740234375, 8.575927734375, 8.9434814453125, 9.31103515625, 9.6785888671875, 10.046142578125, 10.4136962890625, 10.78125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 9.0, 13.0, 17.0, 14.0, 33.0, 22.0, 44.0, 57.0, 58.0, 78.0, 117.0, 214.0, 356.0, 689.0, 1676.0, 6567.0, 800256.0, 2319990.0, 11537.0, 1894.0, 870.0, 380.0, 243.0, 164.0, 117.0, 70.0, 48.0, 51.0, 27.0, 26.0, 16.0, 14.0, 9.0, 6.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.375, -24.4384765625, -23.501953125, -22.5654296875, -21.62890625, -20.6923828125, -19.755859375, -18.8193359375, -17.8828125, -16.9462890625, -16.009765625, -15.0732421875, -14.13671875, -13.2001953125, -12.263671875, -11.3271484375, -10.390625, -9.4541015625, -8.517578125, -7.5810546875, -6.64453125, -5.7080078125, -4.771484375, -3.8349609375, -2.8984375, -1.9619140625, -1.025390625, -0.0888671875, 0.84765625, 1.7841796875, 2.720703125, 3.6572265625, 4.59375, 5.5302734375, 6.466796875, 7.4033203125, 8.33984375, 9.2763671875, 10.212890625, 11.1494140625, 12.0859375, 13.0224609375, 13.958984375, 14.8955078125, 15.83203125, 16.7685546875, 17.705078125, 18.6416015625, 19.578125, 20.5146484375, 21.451171875, 22.3876953125, 23.32421875, 24.2607421875, 25.197265625, 26.1337890625, 27.0703125, 28.0068359375, 28.943359375, 29.8798828125, 30.81640625, 31.7529296875, 32.689453125, 33.6259765625, 34.5625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [30.0, 680.0, 305.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.17264175415039, -4.986987590789795, 1.1986665725708008, 7.384321212768555, 13.569974899291992, 19.75562858581543, 25.9412841796875, 32.12693786621094, 38.312591552734375, 44.49824523925781, 50.68389892578125, 56.86955261230469, 63.055206298828125, 69.24085998535156, 75.426513671875, 81.61216735839844, 87.79782104492188, 93.98347473144531, 100.16912841796875, 106.35478210449219, 112.54043579101562, 118.72608947753906, 124.9117431640625, 131.09739685058594, 137.28305053710938, 143.4687042236328, 149.65435791015625, 155.8400115966797, 162.02566528320312, 168.21131896972656, 174.39697265625, 180.58262634277344, 186.76829528808594, 192.95394897460938, 199.1396026611328, 205.32525634765625, 211.5109100341797, 217.69656372070312, 223.88221740722656, 230.06787109375, 236.25352478027344, 242.43917846679688, 248.6248321533203, 254.81048583984375, 260.99615478515625, 267.1817932128906, 273.3674621582031, 279.5531005859375, 285.73876953125, 291.9244384765625, 298.1100769042969, 304.2957458496094, 310.48138427734375, 316.66705322265625, 322.8526916503906, 329.0383605957031, 335.2239990234375, 341.40966796875, 347.5953063964844, 353.7809753417969, 359.96661376953125, 366.15228271484375, 372.3379211425781, 378.5235900878906, 384.709228515625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 7.0, 3.0, 13.0, 4.0, 8.0, 18.0, 10.0, 14.0, 16.0, 20.0, 16.0, 27.0, 29.0, 35.0, 36.0, 40.0, 40.0, 33.0, 35.0, 38.0, 40.0, 28.0, 51.0, 34.0, 28.0, 40.0, 28.0, 31.0, 43.0, 38.0, 27.0, 27.0, 17.0, 24.0, 17.0, 9.0, 10.0, 14.0, 10.0, 8.0, 6.0, 8.0, 6.0, 4.0, 0.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.199892044067383, -29.228544235229492, -28.25719451904297, -27.285846710205078, -26.314498901367188, -25.343151092529297, -24.371803283691406, -23.400453567504883, -22.429105758666992, -21.4577579498291, -20.486408233642578, -19.515060424804688, -18.543712615966797, -17.572364807128906, -16.601016998291016, -15.629667282104492, -14.658319473266602, -13.686971664428711, -12.715622901916504, -11.744274139404297, -10.772926330566406, -9.801578521728516, -8.830229759216309, -7.85888147354126, -6.887533187866211, -5.916184902191162, -4.944836616516113, -3.9734883308410645, -3.0021400451660156, -2.030791759490967, -1.059443473815918, -0.08809518814086914, 0.8832550048828125, 1.8546032905578613, 2.82595157623291, 3.797299861907959, 4.768648147583008, 5.739996433258057, 6.7113447189331055, 7.682693004608154, 8.654041290283203, 9.625389099121094, 10.5967378616333, 11.568086624145508, 12.539434432983398, 13.510782241821289, 14.482131004333496, 15.453479766845703, 16.424827575683594, 17.396175384521484, 18.367523193359375, 19.3388729095459, 20.31022071838379, 21.28156852722168, 22.252918243408203, 23.224266052246094, 24.195613861083984, 25.166961669921875, 26.138309478759766, 27.10965919494629, 28.08100700378418, 29.05235481262207, 30.023704528808594, 30.995052337646484, 31.966400146484375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 3.0, 5.0, 10.0, 6.0, 12.0, 15.0, 10.0, 18.0, 7.0, 19.0, 24.0, 22.0, 34.0, 31.0, 36.0, 40.0, 44.0, 38.0, 38.0, 55.0, 47.0, 52.0, 39.0, 53.0, 43.0, 51.0, 35.0, 31.0, 28.0, 28.0, 26.0, 26.0, 16.0, 11.0, 6.0, 10.0, 7.0, 4.0, 7.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.58203125, -3.4512939453125, -3.320556640625, -3.1898193359375, -3.05908203125, -2.9283447265625, -2.797607421875, -2.6668701171875, -2.5361328125, -2.4053955078125, -2.274658203125, -2.1439208984375, -2.01318359375, -1.8824462890625, -1.751708984375, -1.6209716796875, -1.490234375, -1.3594970703125, -1.228759765625, -1.0980224609375, -0.96728515625, -0.8365478515625, -0.705810546875, -0.5750732421875, -0.4443359375, -0.3135986328125, -0.182861328125, -0.0521240234375, 0.07861328125, 0.2093505859375, 0.340087890625, 0.4708251953125, 0.6015625, 0.7322998046875, 0.863037109375, 0.9937744140625, 1.12451171875, 1.2552490234375, 1.385986328125, 1.5167236328125, 1.6474609375, 1.7781982421875, 1.908935546875, 2.0396728515625, 2.17041015625, 2.3011474609375, 2.431884765625, 2.5626220703125, 2.693359375, 2.8240966796875, 2.954833984375, 3.0855712890625, 3.21630859375, 3.3470458984375, 3.477783203125, 3.6085205078125, 3.7392578125, 3.8699951171875, 4.000732421875, 4.1314697265625, 4.26220703125, 4.3929443359375, 4.523681640625, 4.6544189453125, 4.78515625]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 6.0, 5.0, 7.0, 15.0, 10.0, 20.0, 22.0, 22.0, 36.0, 47.0, 77.0, 119.0, 197.0, 316.0, 751.0, 1783.0, 5324.0, 17303.0, 65060.0, 257155.0, 959085.0, 1753615.0, 836369.0, 220007.0, 54917.0, 14753.0, 4450.0, 1429.0, 625.0, 290.0, 166.0, 90.0, 57.0, 39.0, 33.0, 21.0, 15.0, 12.0, 10.0, 14.0, 4.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.19921875, -5.01641845703125, -4.8336181640625, -4.65081787109375, -4.468017578125, -4.28521728515625, -4.1024169921875, -3.91961669921875, -3.73681640625, -3.55401611328125, -3.3712158203125, -3.18841552734375, -3.005615234375, -2.82281494140625, -2.6400146484375, -2.45721435546875, -2.2744140625, -2.09161376953125, -1.9088134765625, -1.72601318359375, -1.543212890625, -1.36041259765625, -1.1776123046875, -0.99481201171875, -0.81201171875, -0.62921142578125, -0.4464111328125, -0.26361083984375, -0.080810546875, 0.10198974609375, 0.2847900390625, 0.46759033203125, 0.650390625, 0.83319091796875, 1.0159912109375, 1.19879150390625, 1.381591796875, 1.56439208984375, 1.7471923828125, 1.92999267578125, 2.11279296875, 2.29559326171875, 2.4783935546875, 2.66119384765625, 2.843994140625, 3.02679443359375, 3.2095947265625, 3.39239501953125, 3.5751953125, 3.75799560546875, 3.9407958984375, 4.12359619140625, 4.306396484375, 4.48919677734375, 4.6719970703125, 4.85479736328125, 5.03759765625, 5.22039794921875, 5.4031982421875, 5.58599853515625, 5.768798828125, 5.95159912109375, 6.1343994140625, 6.31719970703125, 6.5]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 10.0, 15.0, 23.0, 27.0, 36.0, 28.0, 41.0, 54.0, 67.0, 99.0, 135.0, 164.0, 234.0, 272.0, 336.0, 376.0, 418.0, 391.0, 297.0, 269.0, 183.0, 147.0, 106.0, 89.0, 55.0, 41.0, 33.0, 35.0, 19.0, 22.0, 12.0, 10.0, 4.0, 6.0, 4.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.8515625, -6.6448974609375, -6.438232421875, -6.2315673828125, -6.02490234375, -5.8182373046875, -5.611572265625, -5.4049072265625, -5.1982421875, -4.9915771484375, -4.784912109375, -4.5782470703125, -4.37158203125, -4.1649169921875, -3.958251953125, -3.7515869140625, -3.544921875, -3.3382568359375, -3.131591796875, -2.9249267578125, -2.71826171875, -2.5115966796875, -2.304931640625, -2.0982666015625, -1.8916015625, -1.6849365234375, -1.478271484375, -1.2716064453125, -1.06494140625, -0.8582763671875, -0.651611328125, -0.4449462890625, -0.23828125, -0.0316162109375, 0.175048828125, 0.3817138671875, 0.58837890625, 0.7950439453125, 1.001708984375, 1.2083740234375, 1.4150390625, 1.6217041015625, 1.828369140625, 2.0350341796875, 2.24169921875, 2.4483642578125, 2.655029296875, 2.8616943359375, 3.068359375, 3.2750244140625, 3.481689453125, 3.6883544921875, 3.89501953125, 4.1016845703125, 4.308349609375, 4.5150146484375, 4.7216796875, 4.9283447265625, 5.135009765625, 5.3416748046875, 5.54833984375, 5.7550048828125, 5.961669921875, 6.1683349609375, 6.375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 6.0, 9.0, 13.0, 23.0, 25.0, 32.0, 36.0, 48.0, 60.0, 80.0, 123.0, 183.0, 284.0, 420.0, 1235.0, 47140.0, 3569209.0, 568937.0, 4716.0, 609.0, 299.0, 204.0, 155.0, 95.0, 73.0, 60.0, 43.0, 33.0, 31.0, 24.0, 20.0, 19.0, 9.0, 10.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.53125, -25.63916015625, -24.7470703125, -23.85498046875, -22.962890625, -22.07080078125, -21.1787109375, -20.28662109375, -19.39453125, -18.50244140625, -17.6103515625, -16.71826171875, -15.826171875, -14.93408203125, -14.0419921875, -13.14990234375, -12.2578125, -11.36572265625, -10.4736328125, -9.58154296875, -8.689453125, -7.79736328125, -6.9052734375, -6.01318359375, -5.12109375, -4.22900390625, -3.3369140625, -2.44482421875, -1.552734375, -0.66064453125, 0.2314453125, 1.12353515625, 2.015625, 2.90771484375, 3.7998046875, 4.69189453125, 5.583984375, 6.47607421875, 7.3681640625, 8.26025390625, 9.15234375, 10.04443359375, 10.9365234375, 11.82861328125, 12.720703125, 13.61279296875, 14.5048828125, 15.39697265625, 16.2890625, 17.18115234375, 18.0732421875, 18.96533203125, 19.857421875, 20.74951171875, 21.6416015625, 22.53369140625, 23.42578125, 24.31787109375, 25.2099609375, 26.10205078125, 26.994140625, 27.88623046875, 28.7783203125, 29.67041015625, 30.5625]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 31.0, 261.0, 523.0, 192.0, 9.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.70713806152344, -151.19044494628906, -145.6737518310547, -140.1570587158203, -134.64035034179688, -129.1236572265625, -123.60696411132812, -118.09027099609375, -112.57357788085938, -107.056884765625, -101.54019165039062, -96.02349090576172, -90.50679779052734, -84.99010467529297, -79.47340393066406, -73.95671081542969, -68.44001770019531, -62.92332458496094, -57.4066276550293, -51.889930725097656, -46.37323760986328, -40.856544494628906, -35.339847564697266, -29.823150634765625, -24.30645751953125, -18.789762496948242, -13.273067474365234, -7.756372451782227, -2.2396774291992188, 3.277017593383789, 8.793712615966797, 14.310409545898438, 19.827117919921875, 25.343812942504883, 30.86050796508789, 36.37720489501953, 41.893898010253906, 47.41059112548828, 52.92728805541992, 58.44398498535156, 63.96067810058594, 69.47737121582031, 74.99406433105469, 80.5107650756836, 86.02745819091797, 91.54415130615234, 97.06085205078125, 102.57754516601562, 108.09423828125, 113.61093139648438, 119.12762451171875, 124.64432525634766, 130.1610107421875, 135.67771911621094, 141.1944122314453, 146.7111053466797, 152.22779846191406, 157.74449157714844, 163.2611846923828, 168.7778778076172, 174.29458618164062, 179.811279296875, 185.32797241210938, 190.84466552734375, 196.36135864257812]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 8.0, 5.0, 10.0, 16.0, 12.0, 15.0, 17.0, 23.0, 30.0, 31.0, 27.0, 31.0, 39.0, 41.0, 44.0, 45.0, 47.0, 50.0, 41.0, 54.0, 36.0, 34.0, 39.0, 34.0, 39.0, 18.0, 43.0, 23.0, 26.0, 15.0, 32.0, 12.0, 17.0, 9.0, 10.0, 11.0, 5.0, 2.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.268800735473633, -25.446353912353516, -24.6239070892334, -23.80146026611328, -22.979015350341797, -22.15656852722168, -21.334121704101562, -20.511674880981445, -19.689228057861328, -18.86678123474121, -18.044334411621094, -17.22188949584961, -16.399442672729492, -15.576995849609375, -14.754549026489258, -13.93210220336914, -13.109657287597656, -12.287210464477539, -11.464764595031738, -10.642317771911621, -9.81987190246582, -8.997425079345703, -8.174978256225586, -7.352531909942627, -6.530085563659668, -5.707639217376709, -4.88519287109375, -4.062746047973633, -3.240299701690674, -2.417853355407715, -1.5954065322875977, -0.7729601860046387, 0.0494842529296875, 0.871930718421936, 1.6943771839141846, 2.5168237686157227, 3.3392701148986816, 4.161716461181641, 4.984163284301758, 5.806609630584717, 6.629055976867676, 7.451502323150635, 8.273948669433594, 9.096395492553711, 9.918842315673828, 10.741288185119629, 11.563735008239746, 12.386180877685547, 13.208627700805664, 14.031074523925781, 14.853520393371582, 15.6759672164917, 16.4984130859375, 17.320859909057617, 18.143306732177734, 18.96575355529785, 19.78820037841797, 20.610647201538086, 21.433094024658203, 22.255538940429688, 23.077985763549805, 23.900432586669922, 24.72287940979004, 25.545326232910156, 26.36777114868164]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 2.0, 3.0, 9.0, 12.0, 10.0, 14.0, 11.0, 15.0, 15.0, 11.0, 17.0, 23.0, 37.0, 26.0, 29.0, 25.0, 28.0, 45.0, 38.0, 22.0, 41.0, 46.0, 49.0, 40.0, 38.0, 37.0, 50.0, 33.0, 26.0, 20.0, 22.0, 27.0, 26.0, 16.0, 21.0, 21.0, 21.0, 13.0, 18.0, 13.0, 8.0, 5.0, 5.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-3.103515625, -2.998382568359375, -2.89324951171875, -2.788116455078125, -2.6829833984375, -2.577850341796875, -2.47271728515625, -2.367584228515625, -2.262451171875, -2.157318115234375, -2.05218505859375, -1.947052001953125, -1.8419189453125, -1.736785888671875, -1.63165283203125, -1.526519775390625, -1.42138671875, -1.316253662109375, -1.21112060546875, -1.105987548828125, -1.0008544921875, -0.895721435546875, -0.79058837890625, -0.685455322265625, -0.580322265625, -0.475189208984375, -0.37005615234375, -0.264923095703125, -0.1597900390625, -0.054656982421875, 0.05047607421875, 0.155609130859375, 0.2607421875, 0.365875244140625, 0.47100830078125, 0.576141357421875, 0.6812744140625, 0.786407470703125, 0.89154052734375, 0.996673583984375, 1.101806640625, 1.206939697265625, 1.31207275390625, 1.417205810546875, 1.5223388671875, 1.627471923828125, 1.73260498046875, 1.837738037109375, 1.94287109375, 2.048004150390625, 2.15313720703125, 2.258270263671875, 2.3634033203125, 2.468536376953125, 2.57366943359375, 2.678802490234375, 2.783935546875, 2.889068603515625, 2.99420166015625, 3.099334716796875, 3.2044677734375, 3.309600830078125, 3.41473388671875, 3.519866943359375, 3.625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 8.0, 12.0, 19.0, 27.0, 36.0, 68.0, 124.0, 199.0, 400.0, 757.0, 1531.0, 2978.0, 5906.0, 11503.0, 21581.0, 39038.0, 67831.0, 109533.0, 157421.0, 186148.0, 163745.0, 115676.0, 72924.0, 42211.0, 23174.0, 12707.0, 6400.0, 3202.0, 1564.0, 876.0, 427.0, 236.0, 128.0, 64.0, 39.0, 24.0, 8.0, 9.0, 10.0, 6.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.7431640625, -1.6927337646484375, -1.642303466796875, -1.5918731689453125, -1.54144287109375, -1.4910125732421875, -1.440582275390625, -1.3901519775390625, -1.3397216796875, -1.2892913818359375, -1.238861083984375, -1.1884307861328125, -1.13800048828125, -1.0875701904296875, -1.037139892578125, -0.9867095947265625, -0.936279296875, -0.8858489990234375, -0.835418701171875, -0.7849884033203125, -0.73455810546875, -0.6841278076171875, -0.633697509765625, -0.5832672119140625, -0.5328369140625, -0.4824066162109375, -0.431976318359375, -0.3815460205078125, -0.33111572265625, -0.2806854248046875, -0.230255126953125, -0.1798248291015625, -0.12939453125, -0.0789642333984375, -0.028533935546875, 0.0218963623046875, 0.07232666015625, 0.1227569580078125, 0.173187255859375, 0.2236175537109375, 0.2740478515625, 0.3244781494140625, 0.374908447265625, 0.4253387451171875, 0.47576904296875, 0.5261993408203125, 0.576629638671875, 0.6270599365234375, 0.677490234375, 0.7279205322265625, 0.778350830078125, 0.8287811279296875, 0.87921142578125, 0.9296417236328125, 0.980072021484375, 1.0305023193359375, 1.0809326171875, 1.1313629150390625, 1.181793212890625, 1.2322235107421875, 1.28265380859375, 1.3330841064453125, 1.383514404296875, 1.4339447021484375, 1.484375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 5.0, 6.0, 11.0, 9.0, 12.0, 18.0, 11.0, 24.0, 28.0, 25.0, 21.0, 35.0, 33.0, 29.0, 53.0, 25.0, 34.0, 41.0, 28.0, 1063.0, 43.0, 52.0, 43.0, 41.0, 30.0, 26.0, 26.0, 42.0, 32.0, 28.0, 23.0, 23.0, 5.0, 19.0, 14.0, 9.0, 21.0, 6.0, 5.0, 3.0, 7.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.974609375, -2.877532958984375, -2.78045654296875, -2.683380126953125, -2.5863037109375, -2.489227294921875, -2.39215087890625, -2.295074462890625, -2.197998046875, -2.100921630859375, -2.00384521484375, -1.906768798828125, -1.8096923828125, -1.712615966796875, -1.61553955078125, -1.518463134765625, -1.42138671875, -1.324310302734375, -1.22723388671875, -1.130157470703125, -1.0330810546875, -0.936004638671875, -0.83892822265625, -0.741851806640625, -0.644775390625, -0.547698974609375, -0.45062255859375, -0.353546142578125, -0.2564697265625, -0.159393310546875, -0.06231689453125, 0.034759521484375, 0.1318359375, 0.228912353515625, 0.32598876953125, 0.423065185546875, 0.5201416015625, 0.617218017578125, 0.71429443359375, 0.811370849609375, 0.908447265625, 1.005523681640625, 1.10260009765625, 1.199676513671875, 1.2967529296875, 1.393829345703125, 1.49090576171875, 1.587982177734375, 1.68505859375, 1.782135009765625, 1.87921142578125, 1.976287841796875, 2.0733642578125, 2.170440673828125, 2.26751708984375, 2.364593505859375, 2.461669921875, 2.558746337890625, 2.65582275390625, 2.752899169921875, 2.8499755859375, 2.947052001953125, 3.04412841796875, 3.141204833984375, 3.23828125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 5.0, 5.0, 12.0, 11.0, 20.0, 27.0, 35.0, 41.0, 75.0, 135.0, 161.0, 247.0, 402.0, 546.0, 836.0, 1215.0, 1828.0, 2783.0, 3945.0, 6285.0, 9363.0, 14338.0, 22688.0, 51148.0, 1760150.0, 140776.0, 29220.0, 17675.0, 11038.0, 7272.0, 4901.0, 3249.0, 2125.0, 1459.0, 1021.0, 687.0, 435.0, 300.0, 216.0, 153.0, 82.0, 84.0, 43.0, 29.0, 24.0, 19.0, 9.0, 6.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.408203125, -2.334564208984375, -2.26092529296875, -2.187286376953125, -2.1136474609375, -2.040008544921875, -1.96636962890625, -1.892730712890625, -1.819091796875, -1.745452880859375, -1.67181396484375, -1.598175048828125, -1.5245361328125, -1.450897216796875, -1.37725830078125, -1.303619384765625, -1.22998046875, -1.156341552734375, -1.08270263671875, -1.009063720703125, -0.9354248046875, -0.861785888671875, -0.78814697265625, -0.714508056640625, -0.640869140625, -0.567230224609375, -0.49359130859375, -0.419952392578125, -0.3463134765625, -0.272674560546875, -0.19903564453125, -0.125396728515625, -0.0517578125, 0.021881103515625, 0.09552001953125, 0.169158935546875, 0.2427978515625, 0.316436767578125, 0.39007568359375, 0.463714599609375, 0.537353515625, 0.610992431640625, 0.68463134765625, 0.758270263671875, 0.8319091796875, 0.905548095703125, 0.97918701171875, 1.052825927734375, 1.12646484375, 1.200103759765625, 1.27374267578125, 1.347381591796875, 1.4210205078125, 1.494659423828125, 1.56829833984375, 1.641937255859375, 1.715576171875, 1.789215087890625, 1.86285400390625, 1.936492919921875, 2.0101318359375, 2.083770751953125, 2.15740966796875, 2.231048583984375, 2.3046875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 4.0, 7.0, 9.0, 8.0, 11.0, 30.0, 32.0, 46.0, 50.0, 69.0, 84.0, 82.0, 78.0, 81.0, 79.0, 54.0, 69.0, 48.0, 40.0, 34.0, 17.0, 18.0, 13.0, 8.0, 10.0, 2.0, 9.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.196533203125, -0.1916055679321289, -0.1866779327392578, -0.18175029754638672, -0.17682266235351562, -0.17189502716064453, -0.16696739196777344, -0.16203975677490234, -0.15711212158203125, -0.15218448638916016, -0.14725685119628906, -0.14232921600341797, -0.13740158081054688, -0.13247394561767578, -0.1275463104248047, -0.1226186752319336, -0.1176910400390625, -0.1127634048461914, -0.10783576965332031, -0.10290813446044922, -0.09798049926757812, -0.09305286407470703, -0.08812522888183594, -0.08319759368896484, -0.07826995849609375, -0.07334232330322266, -0.06841468811035156, -0.06348705291748047, -0.058559417724609375, -0.05363178253173828, -0.04870414733886719, -0.043776512145996094, -0.038848876953125, -0.033921241760253906, -0.028993606567382812, -0.02406597137451172, -0.019138336181640625, -0.014210700988769531, -0.009283065795898438, -0.004355430603027344, 0.00057220458984375, 0.005499839782714844, 0.010427474975585938, 0.015355110168457031, 0.020282745361328125, 0.02521038055419922, 0.030138015747070312, 0.035065650939941406, 0.0399932861328125, 0.044920921325683594, 0.04984855651855469, 0.05477619171142578, 0.059703826904296875, 0.06463146209716797, 0.06955909729003906, 0.07448673248291016, 0.07941436767578125, 0.08434200286865234, 0.08926963806152344, 0.09419727325439453, 0.09912490844726562, 0.10405254364013672, 0.10898017883300781, 0.1139078140258789, 0.11883544921875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 10.0, 11.0, 14.0, 22.0, 21.0, 52.0, 79.0, 101.0, 164.0, 328.0, 950.0, 301921.0, 742837.0, 1127.0, 386.0, 198.0, 100.0, 79.0, 47.0, 33.0, 16.0, 17.0, 11.0, 3.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.32421875, -2.22760009765625, -2.1309814453125, -2.03436279296875, -1.937744140625, -1.84112548828125, -1.7445068359375, -1.64788818359375, -1.55126953125, -1.45465087890625, -1.3580322265625, -1.26141357421875, -1.164794921875, -1.06817626953125, -0.9715576171875, -0.87493896484375, -0.7783203125, -0.68170166015625, -0.5850830078125, -0.48846435546875, -0.391845703125, -0.29522705078125, -0.1986083984375, -0.10198974609375, -0.00537109375, 0.09124755859375, 0.1878662109375, 0.28448486328125, 0.381103515625, 0.47772216796875, 0.5743408203125, 0.67095947265625, 0.767578125, 0.86419677734375, 0.9608154296875, 1.05743408203125, 1.154052734375, 1.25067138671875, 1.3472900390625, 1.44390869140625, 1.54052734375, 1.63714599609375, 1.7337646484375, 1.83038330078125, 1.927001953125, 2.02362060546875, 2.1202392578125, 2.21685791015625, 2.3134765625, 2.41009521484375, 2.5067138671875, 2.60333251953125, 2.699951171875, 2.79656982421875, 2.8931884765625, 2.98980712890625, 3.08642578125, 3.18304443359375, 3.2796630859375, 3.37628173828125, 3.472900390625, 3.56951904296875, 3.6661376953125, 3.76275634765625, 3.859375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 9.0, 68.0, 483.0, 385.0, 52.0, 9.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.3855667114257812, -2.3299570083618164, -2.2743475437164307, -2.218737840652466, -2.163128137588501, -2.1075186729431152, -2.0519089698791504, -1.9962992668151855, -1.9406896829605103, -1.885080099105835, -1.8294703960418701, -1.7738608121871948, -1.7182512283325195, -1.6626415252685547, -1.6070319414138794, -1.551422357559204, -1.4958126544952393, -1.440203070640564, -1.3845933675765991, -1.3289837837219238, -1.273374080657959, -1.2177644968032837, -1.1621549129486084, -1.1065452098846436, -1.0509356260299683, -0.9953259825706482, -0.9397163391113281, -0.8841067552566528, -0.8284971117973328, -0.7728874683380127, -0.7172778844833374, -0.6616682410240173, -0.6060587167739868, -0.5504490733146667, -0.49483945965766907, -0.4392298460006714, -0.3836202025413513, -0.32801055908203125, -0.27240094542503357, -0.2167913317680359, -0.16118168830871582, -0.10557205975055695, -0.04996243119239807, 0.005647197365760803, 0.06125682592391968, 0.11686646938323975, 0.17247608304023743, 0.2280856966972351, 0.2836953401565552, 0.33930498361587524, 0.3949145972728729, 0.4505242109298706, 0.5061338543891907, 0.5617434978485107, 0.617353081703186, 0.6729627251625061, 0.7285723686218262, 0.7841820120811462, 0.8397916555404663, 0.8954012393951416, 0.9510108828544617, 1.0066205263137817, 1.062230110168457, 1.1178398132324219, 1.1734493970870972]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 6.0, 9.0, 7.0, 9.0, 12.0, 12.0, 18.0, 20.0, 21.0, 29.0, 31.0, 40.0, 35.0, 44.0, 36.0, 42.0, 49.0, 39.0, 48.0, 56.0, 42.0, 39.0, 42.0, 29.0, 31.0, 39.0, 36.0, 30.0, 36.0, 19.0, 17.0, 24.0, 12.0, 8.0, 7.0, 6.0, 10.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38053226470947266, -0.36782175302505493, -0.3551112413406372, -0.3424007296562195, -0.32969021797180176, -0.31697970628738403, -0.3042692244052887, -0.29155871272087097, -0.27884820103645325, -0.2661376893520355, -0.2534271776676178, -0.24071668088436127, -0.22800616919994354, -0.21529565751552582, -0.2025851607322693, -0.18987464904785156, -0.17716413736343384, -0.1644536256790161, -0.1517431139945984, -0.13903261721134186, -0.12632210552692413, -0.11361159384250641, -0.10090108960866928, -0.08819058537483215, -0.07548007369041443, -0.0627695620059967, -0.050059057772159576, -0.03734854981303215, -0.024638041853904724, -0.011927530169487, 0.0007829740643501282, 0.013493478298187256, 0.02620398998260498, 0.03891449794173241, 0.05162500590085983, 0.06433551013469696, 0.07704602181911469, 0.08975653350353241, 0.10246703773736954, 0.11517754197120667, 0.1278880536556244, 0.14059856534004211, 0.15330907702445984, 0.16601957380771637, 0.1787300854921341, 0.19144059717655182, 0.20415109395980835, 0.21686160564422607, 0.2295721173286438, 0.24228262901306152, 0.25499314069747925, 0.267703652381897, 0.2804141640663147, 0.2931246757507324, 0.30583515763282776, 0.3185456693172455, 0.3312561810016632, 0.34396669268608093, 0.35667720437049866, 0.3693877160549164, 0.3820981979370117, 0.39480870962142944, 0.40751922130584717, 0.4202297329902649, 0.4329402446746826]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 5.0, 4.0, 3.0, 10.0, 6.0, 12.0, 12.0, 16.0, 19.0, 11.0, 25.0, 23.0, 14.0, 28.0, 32.0, 29.0, 40.0, 34.0, 41.0, 49.0, 36.0, 30.0, 41.0, 50.0, 43.0, 38.0, 30.0, 38.0, 42.0, 31.0, 38.0, 27.0, 11.0, 24.0, 17.0, 13.0, 15.0, 15.0, 12.0, 15.0, 9.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0], "bins": [-3.521484375, -3.4114990234375, -3.301513671875, -3.1915283203125, -3.08154296875, -2.9715576171875, -2.861572265625, -2.7515869140625, -2.6416015625, -2.5316162109375, -2.421630859375, -2.3116455078125, -2.20166015625, -2.0916748046875, -1.981689453125, -1.8717041015625, -1.76171875, -1.6517333984375, -1.541748046875, -1.4317626953125, -1.32177734375, -1.2117919921875, -1.101806640625, -0.9918212890625, -0.8818359375, -0.7718505859375, -0.661865234375, -0.5518798828125, -0.44189453125, -0.3319091796875, -0.221923828125, -0.1119384765625, -0.001953125, 0.1080322265625, 0.218017578125, 0.3280029296875, 0.43798828125, 0.5479736328125, 0.657958984375, 0.7679443359375, 0.8779296875, 0.9879150390625, 1.097900390625, 1.2078857421875, 1.31787109375, 1.4278564453125, 1.537841796875, 1.6478271484375, 1.7578125, 1.8677978515625, 1.977783203125, 2.0877685546875, 2.19775390625, 2.3077392578125, 2.417724609375, 2.5277099609375, 2.6376953125, 2.7476806640625, 2.857666015625, 2.9676513671875, 3.07763671875, 3.1876220703125, 3.297607421875, 3.4075927734375, 3.517578125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 7.0, 3.0, 3.0, 4.0, 7.0, 11.0, 13.0, 17.0, 14.0, 31.0, 49.0, 55.0, 95.0, 173.0, 279.0, 491.0, 938.0, 1691.0, 3179.0, 5711.0, 10294.0, 19448.0, 39053.0, 81246.0, 173679.0, 328586.0, 198926.0, 92700.0, 43894.0, 22005.0, 11713.0, 6482.0, 3364.0, 1938.0, 1038.0, 522.0, 343.0, 218.0, 121.0, 77.0, 40.0, 34.0, 18.0, 15.0, 11.0, 7.0, 4.0, 5.0, 6.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.734375, -3.61614990234375, -3.4979248046875, -3.37969970703125, -3.261474609375, -3.14324951171875, -3.0250244140625, -2.90679931640625, -2.78857421875, -2.67034912109375, -2.5521240234375, -2.43389892578125, -2.315673828125, -2.19744873046875, -2.0792236328125, -1.96099853515625, -1.8427734375, -1.72454833984375, -1.6063232421875, -1.48809814453125, -1.369873046875, -1.25164794921875, -1.1334228515625, -1.01519775390625, -0.89697265625, -0.77874755859375, -0.6605224609375, -0.54229736328125, -0.424072265625, -0.30584716796875, -0.1876220703125, -0.06939697265625, 0.048828125, 0.16705322265625, 0.2852783203125, 0.40350341796875, 0.521728515625, 0.63995361328125, 0.7581787109375, 0.87640380859375, 0.99462890625, 1.11285400390625, 1.2310791015625, 1.34930419921875, 1.467529296875, 1.58575439453125, 1.7039794921875, 1.82220458984375, 1.9404296875, 2.05865478515625, 2.1768798828125, 2.29510498046875, 2.413330078125, 2.53155517578125, 2.6497802734375, 2.76800537109375, 2.88623046875, 3.00445556640625, 3.1226806640625, 3.24090576171875, 3.359130859375, 3.47735595703125, 3.5955810546875, 3.71380615234375, 3.83203125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 4.0, 2.0, 5.0, 6.0, 8.0, 6.0, 9.0, 9.0, 8.0, 11.0, 17.0, 22.0, 21.0, 36.0, 35.0, 27.0, 39.0, 41.0, 47.0, 72.0, 84.0, 211.0, 1420.0, 285.0, 151.0, 96.0, 51.0, 38.0, 41.0, 41.0, 27.0, 36.0, 26.0, 26.0, 14.0, 15.0, 19.0, 16.0, 12.0, 5.0, 6.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.4140625, -13.0059814453125, -12.597900390625, -12.1898193359375, -11.78173828125, -11.3736572265625, -10.965576171875, -10.5574951171875, -10.1494140625, -9.7413330078125, -9.333251953125, -8.9251708984375, -8.51708984375, -8.1090087890625, -7.700927734375, -7.2928466796875, -6.884765625, -6.4766845703125, -6.068603515625, -5.6605224609375, -5.25244140625, -4.8443603515625, -4.436279296875, -4.0281982421875, -3.6201171875, -3.2120361328125, -2.803955078125, -2.3958740234375, -1.98779296875, -1.5797119140625, -1.171630859375, -0.7635498046875, -0.35546875, 0.0526123046875, 0.460693359375, 0.8687744140625, 1.27685546875, 1.6849365234375, 2.093017578125, 2.5010986328125, 2.9091796875, 3.3172607421875, 3.725341796875, 4.1334228515625, 4.54150390625, 4.9495849609375, 5.357666015625, 5.7657470703125, 6.173828125, 6.5819091796875, 6.989990234375, 7.3980712890625, 7.80615234375, 8.2142333984375, 8.622314453125, 9.0303955078125, 9.4384765625, 9.8465576171875, 10.254638671875, 10.6627197265625, 11.07080078125, 11.4788818359375, 11.886962890625, 12.2950439453125, 12.703125]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 12.0, 11.0, 25.0, 33.0, 21.0, 49.0, 66.0, 92.0, 122.0, 187.0, 313.0, 615.0, 2906.0, 497003.0, 2635319.0, 7041.0, 835.0, 333.0, 198.0, 157.0, 96.0, 74.0, 48.0, 40.0, 20.0, 24.0, 12.0, 12.0, 13.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-39.15625, -38.072509765625, -36.98876953125, -35.905029296875, -34.8212890625, -33.737548828125, -32.65380859375, -31.570068359375, -30.486328125, -29.402587890625, -28.31884765625, -27.235107421875, -26.1513671875, -25.067626953125, -23.98388671875, -22.900146484375, -21.81640625, -20.732666015625, -19.64892578125, -18.565185546875, -17.4814453125, -16.397705078125, -15.31396484375, -14.230224609375, -13.146484375, -12.062744140625, -10.97900390625, -9.895263671875, -8.8115234375, -7.727783203125, -6.64404296875, -5.560302734375, -4.4765625, -3.392822265625, -2.30908203125, -1.225341796875, -0.1416015625, 0.942138671875, 2.02587890625, 3.109619140625, 4.193359375, 5.277099609375, 6.36083984375, 7.444580078125, 8.5283203125, 9.612060546875, 10.69580078125, 11.779541015625, 12.86328125, 13.947021484375, 15.03076171875, 16.114501953125, 17.1982421875, 18.281982421875, 19.36572265625, 20.449462890625, 21.533203125, 22.616943359375, 23.70068359375, 24.784423828125, 25.8681640625, 26.951904296875, 28.03564453125, 29.119384765625, 30.203125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 16.0, 866.0, 134.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.810543060302734, -32.789588928222656, -25.768630981445312, -18.7476749420166, -11.72671890258789, -4.705760955810547, 2.3151931762695312, 9.33614730834961, 16.357105255126953, 23.378061294555664, 30.399017333984375, 37.41997528076172, 44.4409294128418, 51.46188735961914, 58.48284149169922, 65.50379943847656, 72.52474975585938, 79.54570770263672, 86.56666564941406, 93.58761596679688, 100.60857391357422, 107.62953186035156, 114.65048217773438, 121.67144012451172, 128.69239807128906, 135.71334838867188, 142.73431396484375, 149.75526428222656, 156.77621459960938, 163.79718017578125, 170.81813049316406, 177.83908081054688, 184.86004638671875, 191.88099670410156, 198.90196228027344, 205.92291259765625, 212.94387817382812, 219.96482849121094, 226.98577880859375, 234.00674438476562, 241.02769470214844, 248.04864501953125, 255.06961059570312, 262.090576171875, 269.11151123046875, 276.1324768066406, 283.1534423828125, 290.17437744140625, 297.1953430175781, 304.21630859375, 311.23724365234375, 318.2582092285156, 325.2791748046875, 332.30010986328125, 339.3210754394531, 346.342041015625, 353.36297607421875, 360.3839416503906, 367.4048767089844, 374.42584228515625, 381.4468078613281, 388.4677734375, 395.48870849609375, 402.5096740722656, 409.5306396484375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 7.0, 6.0, 7.0, 9.0, 9.0, 9.0, 7.0, 11.0, 26.0, 24.0, 24.0, 31.0, 24.0, 30.0, 14.0, 24.0, 30.0, 39.0, 33.0, 45.0, 47.0, 53.0, 48.0, 45.0, 35.0, 34.0, 38.0, 28.0, 38.0, 28.0, 32.0, 29.0, 25.0, 17.0, 16.0, 21.0, 11.0, 21.0, 10.0, 8.0, 5.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.868797302246094, -29.8741512298584, -28.87950325012207, -27.884857177734375, -26.890209197998047, -25.89556312561035, -24.900917053222656, -23.906269073486328, -22.91162109375, -21.916975021362305, -20.922327041625977, -19.92768096923828, -18.933032989501953, -17.938386917114258, -16.943740844726562, -15.949092864990234, -14.954446792602539, -13.959799766540527, -12.965152740478516, -11.97050666809082, -10.975858688354492, -9.981212615966797, -8.986565589904785, -7.991918563842773, -6.997271537780762, -6.00262451171875, -5.007977485656738, -4.013330936431885, -3.018683910369873, -2.0240368843078613, -1.0293903350830078, -0.034743309020996094, 0.9599037170410156, 1.9545506238937378, 2.94919753074646, 3.9438443183898926, 4.938491344451904, 5.933138370513916, 6.9277849197387695, 7.922431945800781, 8.917078971862793, 9.911725997924805, 10.906373023986816, 11.901020050048828, 12.895666122436523, 13.890314102172852, 14.884960174560547, 15.879607200622559, 16.87425422668457, 17.868900299072266, 18.863548278808594, 19.85819435119629, 20.852842330932617, 21.847488403320312, 22.84213638305664, 23.836782455444336, 24.83142852783203, 25.826074600219727, 26.820722579956055, 27.81536865234375, 28.810016632080078, 29.804662704467773, 30.79930877685547, 31.793956756591797, 32.788604736328125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 10.0, 11.0, 8.0, 17.0, 20.0, 16.0, 17.0, 16.0, 21.0, 29.0, 20.0, 36.0, 30.0, 31.0, 35.0, 35.0, 39.0, 36.0, 55.0, 50.0, 42.0, 44.0, 44.0, 30.0, 47.0, 32.0, 21.0, 30.0, 27.0, 13.0, 27.0, 17.0, 15.0, 12.0, 12.0, 10.0, 3.0, 12.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5234375, -3.40533447265625, -3.2872314453125, -3.16912841796875, -3.051025390625, -2.93292236328125, -2.8148193359375, -2.69671630859375, -2.57861328125, -2.46051025390625, -2.3424072265625, -2.22430419921875, -2.106201171875, -1.98809814453125, -1.8699951171875, -1.75189208984375, -1.6337890625, -1.51568603515625, -1.3975830078125, -1.27947998046875, -1.161376953125, -1.04327392578125, -0.9251708984375, -0.80706787109375, -0.68896484375, -0.57086181640625, -0.4527587890625, -0.33465576171875, -0.216552734375, -0.09844970703125, 0.0196533203125, 0.13775634765625, 0.255859375, 0.37396240234375, 0.4920654296875, 0.61016845703125, 0.728271484375, 0.84637451171875, 0.9644775390625, 1.08258056640625, 1.20068359375, 1.31878662109375, 1.4368896484375, 1.55499267578125, 1.673095703125, 1.79119873046875, 1.9093017578125, 2.02740478515625, 2.1455078125, 2.26361083984375, 2.3817138671875, 2.49981689453125, 2.617919921875, 2.73602294921875, 2.8541259765625, 2.97222900390625, 3.09033203125, 3.20843505859375, 3.3265380859375, 3.44464111328125, 3.562744140625, 3.68084716796875, 3.7989501953125, 3.91705322265625, 4.03515625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 6.0, 3.0, 7.0, 16.0, 14.0, 16.0, 23.0, 36.0, 50.0, 68.0, 100.0, 151.0, 273.0, 558.0, 1506.0, 5163.0, 20675.0, 96226.0, 459086.0, 1727040.0, 1441896.0, 346725.0, 72931.0, 15900.0, 3809.0, 1101.0, 401.0, 188.0, 91.0, 61.0, 36.0, 26.0, 26.0, 18.0, 15.0, 9.0, 11.0, 7.0, 2.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.265625, -6.04888916015625, -5.8321533203125, -5.61541748046875, -5.398681640625, -5.18194580078125, -4.9652099609375, -4.74847412109375, -4.53173828125, -4.31500244140625, -4.0982666015625, -3.88153076171875, -3.664794921875, -3.44805908203125, -3.2313232421875, -3.01458740234375, -2.7978515625, -2.58111572265625, -2.3643798828125, -2.14764404296875, -1.930908203125, -1.71417236328125, -1.4974365234375, -1.28070068359375, -1.06396484375, -0.84722900390625, -0.6304931640625, -0.41375732421875, -0.197021484375, 0.01971435546875, 0.2364501953125, 0.45318603515625, 0.669921875, 0.88665771484375, 1.1033935546875, 1.32012939453125, 1.536865234375, 1.75360107421875, 1.9703369140625, 2.18707275390625, 2.40380859375, 2.62054443359375, 2.8372802734375, 3.05401611328125, 3.270751953125, 3.48748779296875, 3.7042236328125, 3.92095947265625, 4.1376953125, 4.35443115234375, 4.5711669921875, 4.78790283203125, 5.004638671875, 5.22137451171875, 5.4381103515625, 5.65484619140625, 5.87158203125, 6.08831787109375, 6.3050537109375, 6.52178955078125, 6.738525390625, 6.95526123046875, 7.1719970703125, 7.38873291015625, 7.60546875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 4.0, 7.0, 10.0, 5.0, 10.0, 18.0, 31.0, 34.0, 34.0, 46.0, 47.0, 88.0, 109.0, 136.0, 166.0, 201.0, 289.0, 323.0, 386.0, 382.0, 359.0, 329.0, 230.0, 188.0, 135.0, 106.0, 94.0, 65.0, 46.0, 33.0, 33.0, 30.0, 16.0, 22.0, 13.0, 9.0, 9.0, 2.0, 3.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.6640625, -5.4765625, -5.2890625, -5.1015625, -4.9140625, -4.7265625, -4.5390625, -4.3515625, -4.1640625, -3.9765625, -3.7890625, -3.6015625, -3.4140625, -3.2265625, -3.0390625, -2.8515625, -2.6640625, -2.4765625, -2.2890625, -2.1015625, -1.9140625, -1.7265625, -1.5390625, -1.3515625, -1.1640625, -0.9765625, -0.7890625, -0.6015625, -0.4140625, -0.2265625, -0.0390625, 0.1484375, 0.3359375, 0.5234375, 0.7109375, 0.8984375, 1.0859375, 1.2734375, 1.4609375, 1.6484375, 1.8359375, 2.0234375, 2.2109375, 2.3984375, 2.5859375, 2.7734375, 2.9609375, 3.1484375, 3.3359375, 3.5234375, 3.7109375, 3.8984375, 4.0859375, 4.2734375, 4.4609375, 4.6484375, 4.8359375, 5.0234375, 5.2109375, 5.3984375, 5.5859375, 5.7734375, 5.9609375, 6.1484375, 6.3359375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 2.0, 3.0, 5.0, 12.0, 8.0, 20.0, 22.0, 20.0, 26.0, 43.0, 42.0, 69.0, 92.0, 103.0, 157.0, 236.0, 340.0, 857.0, 10552.0, 831810.0, 3290313.0, 56146.0, 1884.0, 486.0, 255.0, 199.0, 147.0, 95.0, 68.0, 48.0, 47.0, 34.0, 36.0, 22.0, 23.0, 5.0, 14.0, 7.0, 6.0, 5.0, 5.0, 2.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-25.890625, -25.086669921875, -24.28271484375, -23.478759765625, -22.6748046875, -21.870849609375, -21.06689453125, -20.262939453125, -19.458984375, -18.655029296875, -17.85107421875, -17.047119140625, -16.2431640625, -15.439208984375, -14.63525390625, -13.831298828125, -13.02734375, -12.223388671875, -11.41943359375, -10.615478515625, -9.8115234375, -9.007568359375, -8.20361328125, -7.399658203125, -6.595703125, -5.791748046875, -4.98779296875, -4.183837890625, -3.3798828125, -2.575927734375, -1.77197265625, -0.968017578125, -0.1640625, 0.639892578125, 1.44384765625, 2.247802734375, 3.0517578125, 3.855712890625, 4.65966796875, 5.463623046875, 6.267578125, 7.071533203125, 7.87548828125, 8.679443359375, 9.4833984375, 10.287353515625, 11.09130859375, 11.895263671875, 12.69921875, 13.503173828125, 14.30712890625, 15.111083984375, 15.9150390625, 16.718994140625, 17.52294921875, 18.326904296875, 19.130859375, 19.934814453125, 20.73876953125, 21.542724609375, 22.3466796875, 23.150634765625, 23.95458984375, 24.758544921875, 25.5625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 19.0, 101.0, 270.0, 332.0, 202.0, 73.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.63215637207031, -72.39237976074219, -69.15259552001953, -65.9128189086914, -62.673038482666016, -59.433258056640625, -56.193477630615234, -52.953697204589844, -49.71392059326172, -46.47414016723633, -43.23435974121094, -39.99458312988281, -36.75480270385742, -33.51502227783203, -30.27524185180664, -27.035463333129883, -23.79568099975586, -20.55590057373047, -17.31612205505371, -14.07634162902832, -10.836562156677246, -7.596782684326172, -4.357002258300781, -1.1172237396240234, 2.122556686401367, 5.362336158752441, 8.602115631103516, 11.841896057128906, 15.08167552947998, 18.321455001831055, 21.561235427856445, 24.801013946533203, 28.040794372558594, 31.280574798583984, 34.520355224609375, 37.7601318359375, 40.99991226196289, 44.23969268798828, 47.47947311401367, 50.71925354003906, 53.95903015136719, 57.19881057739258, 60.43859100341797, 63.678367614746094, 66.91815185546875, 70.15792846679688, 73.397705078125, 76.63748931884766, 79.87727355957031, 83.11705017089844, 86.3568344116211, 89.59661102294922, 92.83639526367188, 96.076171875, 99.31594848632812, 102.55573272705078, 105.7955093383789, 109.03528594970703, 112.27507019042969, 115.51484680175781, 118.75463104248047, 121.9944076538086, 125.23419189453125, 128.47396850585938, 131.7137451171875]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 2.0, 5.0, 12.0, 6.0, 6.0, 15.0, 14.0, 19.0, 17.0, 29.0, 24.0, 30.0, 33.0, 30.0, 39.0, 38.0, 37.0, 31.0, 39.0, 45.0, 56.0, 55.0, 48.0, 44.0, 33.0, 38.0, 41.0, 21.0, 34.0, 23.0, 31.0, 17.0, 20.0, 17.0, 10.0, 9.0, 9.0, 10.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.90259552001953, -24.12870216369629, -23.35481071472168, -22.580917358398438, -21.807025909423828, -21.033132553100586, -20.259239196777344, -19.485347747802734, -18.711454391479492, -17.93756103515625, -17.16366958618164, -16.3897762298584, -15.615883827209473, -14.841991424560547, -14.068098068237305, -13.294205665588379, -12.520313262939453, -11.746420860290527, -10.972528457641602, -10.19863510131836, -9.424742698669434, -8.650850296020508, -7.876957416534424, -7.10306453704834, -6.329172134399414, -5.555279731750488, -4.781386852264404, -4.00749397277832, -3.2336015701293945, -2.4597089290618896, -1.6858162879943848, -0.9119234085083008, -0.1380290985107422, 0.6358635425567627, 1.4097561836242676, 2.1836488246917725, 2.9575414657592773, 3.7314341068267822, 4.505326747894287, 5.279219627380371, 6.053112030029297, 6.827004432678223, 7.600897312164307, 8.37479019165039, 9.148682594299316, 9.922574996948242, 10.696468353271484, 11.47036075592041, 12.244253158569336, 13.018145561218262, 13.792037963867188, 14.56593132019043, 15.339823722839355, 16.11371612548828, 16.887609481811523, 17.661502838134766, 18.435394287109375, 19.209287643432617, 19.983179092407227, 20.75707244873047, 21.530963897705078, 22.30485725402832, 23.078750610351562, 23.852642059326172, 24.626535415649414]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 4.0, 7.0, 3.0, 8.0, 9.0, 10.0, 12.0, 20.0, 15.0, 21.0, 17.0, 18.0, 30.0, 26.0, 24.0, 29.0, 26.0, 35.0, 52.0, 42.0, 36.0, 41.0, 52.0, 47.0, 50.0, 45.0, 33.0, 43.0, 24.0, 34.0, 22.0, 26.0, 27.0, 8.0, 14.0, 25.0, 11.0, 15.0, 7.0, 9.0, 6.0, 3.0, 5.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.310546875, -3.196685791015625, -3.08282470703125, -2.968963623046875, -2.8551025390625, -2.741241455078125, -2.62738037109375, -2.513519287109375, -2.399658203125, -2.285797119140625, -2.17193603515625, -2.058074951171875, -1.9442138671875, -1.830352783203125, -1.71649169921875, -1.602630615234375, -1.48876953125, -1.374908447265625, -1.26104736328125, -1.147186279296875, -1.0333251953125, -0.919464111328125, -0.80560302734375, -0.691741943359375, -0.577880859375, -0.464019775390625, -0.35015869140625, -0.236297607421875, -0.1224365234375, -0.008575439453125, 0.10528564453125, 0.219146728515625, 0.3330078125, 0.446868896484375, 0.56072998046875, 0.674591064453125, 0.7884521484375, 0.902313232421875, 1.01617431640625, 1.130035400390625, 1.243896484375, 1.357757568359375, 1.47161865234375, 1.585479736328125, 1.6993408203125, 1.813201904296875, 1.92706298828125, 2.040924072265625, 2.15478515625, 2.268646240234375, 2.38250732421875, 2.496368408203125, 2.6102294921875, 2.724090576171875, 2.83795166015625, 2.951812744140625, 3.065673828125, 3.179534912109375, 3.29339599609375, 3.407257080078125, 3.5211181640625, 3.634979248046875, 3.74884033203125, 3.862701416015625, 3.9765625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 6.0, 2.0, 5.0, 9.0, 20.0, 40.0, 56.0, 102.0, 194.0, 407.0, 814.0, 1423.0, 3069.0, 5729.0, 10648.0, 19889.0, 35001.0, 58684.0, 91194.0, 128181.0, 156261.0, 158817.0, 133861.0, 97186.0, 63154.0, 37648.0, 21411.0, 11742.0, 6259.0, 3298.0, 1638.0, 862.0, 438.0, 239.0, 116.0, 50.0, 37.0, 23.0, 19.0, 8.0, 3.0, 8.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1591796875, -1.120635986328125, -1.08209228515625, -1.043548583984375, -1.0050048828125, -0.966461181640625, -0.92791748046875, -0.889373779296875, -0.850830078125, -0.812286376953125, -0.77374267578125, -0.735198974609375, -0.6966552734375, -0.658111572265625, -0.61956787109375, -0.581024169921875, -0.54248046875, -0.503936767578125, -0.46539306640625, -0.426849365234375, -0.3883056640625, -0.349761962890625, -0.31121826171875, -0.272674560546875, -0.234130859375, -0.195587158203125, -0.15704345703125, -0.118499755859375, -0.0799560546875, -0.041412353515625, -0.00286865234375, 0.035675048828125, 0.07421875, 0.112762451171875, 0.15130615234375, 0.189849853515625, 0.2283935546875, 0.266937255859375, 0.30548095703125, 0.344024658203125, 0.382568359375, 0.421112060546875, 0.45965576171875, 0.498199462890625, 0.5367431640625, 0.575286865234375, 0.61383056640625, 0.652374267578125, 0.69091796875, 0.729461669921875, 0.76800537109375, 0.806549072265625, 0.8450927734375, 0.883636474609375, 0.92218017578125, 0.960723876953125, 0.999267578125, 1.037811279296875, 1.07635498046875, 1.114898681640625, 1.1534423828125, 1.191986083984375, 1.23052978515625, 1.269073486328125, 1.3076171875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 9.0, 8.0, 11.0, 6.0, 20.0, 20.0, 15.0, 17.0, 26.0, 22.0, 18.0, 34.0, 32.0, 27.0, 33.0, 32.0, 37.0, 58.0, 48.0, 1071.0, 49.0, 36.0, 36.0, 39.0, 37.0, 20.0, 34.0, 36.0, 26.0, 25.0, 20.0, 15.0, 18.0, 18.0, 9.0, 9.0, 7.0, 10.0, 4.0, 8.0, 6.0, 1.0, 1.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.857421875, -2.77191162109375, -2.6864013671875, -2.60089111328125, -2.515380859375, -2.42987060546875, -2.3443603515625, -2.25885009765625, -2.17333984375, -2.08782958984375, -2.0023193359375, -1.91680908203125, -1.831298828125, -1.74578857421875, -1.6602783203125, -1.57476806640625, -1.4892578125, -1.40374755859375, -1.3182373046875, -1.23272705078125, -1.147216796875, -1.06170654296875, -0.9761962890625, -0.89068603515625, -0.80517578125, -0.71966552734375, -0.6341552734375, -0.54864501953125, -0.463134765625, -0.37762451171875, -0.2921142578125, -0.20660400390625, -0.12109375, -0.03558349609375, 0.0499267578125, 0.13543701171875, 0.220947265625, 0.30645751953125, 0.3919677734375, 0.47747802734375, 0.56298828125, 0.64849853515625, 0.7340087890625, 0.81951904296875, 0.905029296875, 0.99053955078125, 1.0760498046875, 1.16156005859375, 1.2470703125, 1.33258056640625, 1.4180908203125, 1.50360107421875, 1.589111328125, 1.67462158203125, 1.7601318359375, 1.84564208984375, 1.93115234375, 2.01666259765625, 2.1021728515625, 2.18768310546875, 2.273193359375, 2.35870361328125, 2.4442138671875, 2.52972412109375, 2.615234375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 8.0, 19.0, 21.0, 18.0, 39.0, 42.0, 86.0, 105.0, 145.0, 228.0, 302.0, 414.0, 635.0, 914.0, 1386.0, 1978.0, 2856.0, 4378.0, 6368.0, 9677.0, 14476.0, 22690.0, 46290.0, 1740771.0, 160746.0, 28753.0, 18050.0, 11779.0, 7713.0, 5273.0, 3499.0, 2316.0, 1577.0, 1072.0, 755.0, 525.0, 377.0, 297.0, 172.0, 106.0, 99.0, 56.0, 41.0, 27.0, 17.0, 15.0, 7.0, 11.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.904296875, -1.84234619140625, -1.7803955078125, -1.71844482421875, -1.656494140625, -1.59454345703125, -1.5325927734375, -1.47064208984375, -1.40869140625, -1.34674072265625, -1.2847900390625, -1.22283935546875, -1.160888671875, -1.09893798828125, -1.0369873046875, -0.97503662109375, -0.9130859375, -0.85113525390625, -0.7891845703125, -0.72723388671875, -0.665283203125, -0.60333251953125, -0.5413818359375, -0.47943115234375, -0.41748046875, -0.35552978515625, -0.2935791015625, -0.23162841796875, -0.169677734375, -0.10772705078125, -0.0457763671875, 0.01617431640625, 0.078125, 0.14007568359375, 0.2020263671875, 0.26397705078125, 0.325927734375, 0.38787841796875, 0.4498291015625, 0.51177978515625, 0.57373046875, 0.63568115234375, 0.6976318359375, 0.75958251953125, 0.821533203125, 0.88348388671875, 0.9454345703125, 1.00738525390625, 1.0693359375, 1.13128662109375, 1.1932373046875, 1.25518798828125, 1.317138671875, 1.37908935546875, 1.4410400390625, 1.50299072265625, 1.56494140625, 1.62689208984375, 1.6888427734375, 1.75079345703125, 1.812744140625, 1.87469482421875, 1.9366455078125, 1.99859619140625, 2.060546875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 9.0, 12.0, 18.0, 25.0, 26.0, 33.0, 45.0, 28.0, 49.0, 47.0, 46.0, 59.0, 47.0, 53.0, 72.0, 35.0, 49.0, 48.0, 44.0, 36.0, 31.0, 19.0, 29.0, 25.0, 20.0, 21.0, 11.0, 7.0, 4.0, 5.0, 3.0, 6.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0560302734375, -0.054070472717285156, -0.05211067199707031, -0.05015087127685547, -0.048191070556640625, -0.04623126983642578, -0.04427146911621094, -0.042311668395996094, -0.04035186767578125, -0.038392066955566406, -0.03643226623535156, -0.03447246551513672, -0.032512664794921875, -0.03055286407470703, -0.028593063354492188, -0.026633262634277344, -0.0246734619140625, -0.022713661193847656, -0.020753860473632812, -0.01879405975341797, -0.016834259033203125, -0.014874458312988281, -0.012914657592773438, -0.010954856872558594, -0.00899505615234375, -0.007035255432128906, -0.0050754547119140625, -0.0031156539916992188, -0.001155853271484375, 0.0008039474487304688, 0.0027637481689453125, 0.004723548889160156, 0.006683349609375, 0.008643150329589844, 0.010602951049804688, 0.012562751770019531, 0.014522552490234375, 0.01648235321044922, 0.018442153930664062, 0.020401954650878906, 0.02236175537109375, 0.024321556091308594, 0.026281356811523438, 0.02824115753173828, 0.030200958251953125, 0.03216075897216797, 0.03412055969238281, 0.036080360412597656, 0.0380401611328125, 0.039999961853027344, 0.04195976257324219, 0.04391956329345703, 0.045879364013671875, 0.04783916473388672, 0.04979896545410156, 0.051758766174316406, 0.05371856689453125, 0.055678367614746094, 0.05763816833496094, 0.05959796905517578, 0.061557769775390625, 0.06351757049560547, 0.06547737121582031, 0.06743717193603516, 0.06939697265625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 5.0, 4.0, 6.0, 5.0, 13.0, 14.0, 20.0, 16.0, 26.0, 31.0, 36.0, 36.0, 44.0, 80.0, 159.0, 207.0, 328.0, 740.0, 8010.0, 833374.0, 202044.0, 1934.0, 524.0, 263.0, 185.0, 103.0, 63.0, 59.0, 45.0, 36.0, 30.0, 30.0, 20.0, 9.0, 10.0, 9.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-1.23046875, -1.194061279296875, -1.15765380859375, -1.121246337890625, -1.0848388671875, -1.048431396484375, -1.01202392578125, -0.975616455078125, -0.939208984375, -0.902801513671875, -0.86639404296875, -0.829986572265625, -0.7935791015625, -0.757171630859375, -0.72076416015625, -0.684356689453125, -0.64794921875, -0.611541748046875, -0.57513427734375, -0.538726806640625, -0.5023193359375, -0.465911865234375, -0.42950439453125, -0.393096923828125, -0.356689453125, -0.320281982421875, -0.28387451171875, -0.247467041015625, -0.2110595703125, -0.174652099609375, -0.13824462890625, -0.101837158203125, -0.0654296875, -0.029022216796875, 0.00738525390625, 0.043792724609375, 0.0802001953125, 0.116607666015625, 0.15301513671875, 0.189422607421875, 0.225830078125, 0.262237548828125, 0.29864501953125, 0.335052490234375, 0.3714599609375, 0.407867431640625, 0.44427490234375, 0.480682373046875, 0.51708984375, 0.553497314453125, 0.58990478515625, 0.626312255859375, 0.6627197265625, 0.699127197265625, 0.73553466796875, 0.771942138671875, 0.808349609375, 0.844757080078125, 0.88116455078125, 0.917572021484375, 0.9539794921875, 0.990386962890625, 1.02679443359375, 1.063201904296875, 1.099609375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 13.0, 66.0, 221.0, 441.0, 219.0, 41.0, 11.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6726258397102356, -0.6450998783111572, -0.6175739169120789, -0.5900479555130005, -0.5625219345092773, -0.5349960327148438, -0.5074700117111206, -0.47994405031204224, -0.45241808891296387, -0.4248921275138855, -0.39736616611480713, -0.36984017491340637, -0.342314213514328, -0.31478825211524963, -0.2872622609138489, -0.2597362995147705, -0.23221033811569214, -0.20468437671661377, -0.1771584004163742, -0.14963242411613464, -0.12210646271705627, -0.0945805013179779, -0.06705452501773834, -0.03952854871749878, -0.01200258731842041, 0.015523381531238556, 0.04304935038089752, 0.07057531923055649, 0.09810128808021545, 0.12562724947929382, 0.1531532257795334, 0.18067920207977295, 0.2082052230834961, 0.23573118448257446, 0.26325714588165283, 0.2907831370830536, 0.31830909848213196, 0.3458350598812103, 0.3733610510826111, 0.40088701248168945, 0.4284129738807678, 0.4559389352798462, 0.48346489667892456, 0.5109908580780029, 0.5385168790817261, 0.5660427808761597, 0.5935688018798828, 0.6210947632789612, 0.6486207246780396, 0.6761466860771179, 0.7036726474761963, 0.7311986088752747, 0.758724570274353, 0.7862505912780762, 0.8137765526771545, 0.8413025140762329, 0.8688284754753113, 0.8963544368743896, 0.923880398273468, 0.9514063596725464, 0.9789323806762695, 1.0064582824707031, 1.0339843034744263, 1.0615103244781494, 1.089036226272583]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 9.0, 7.0, 8.0, 8.0, 7.0, 12.0, 18.0, 19.0, 13.0, 27.0, 21.0, 29.0, 24.0, 36.0, 34.0, 31.0, 28.0, 37.0, 42.0, 29.0, 44.0, 41.0, 40.0, 34.0, 34.0, 34.0, 46.0, 30.0, 32.0, 34.0, 24.0, 23.0, 17.0, 21.0, 21.0, 14.0, 14.0, 8.0, 7.0, 14.0, 10.0, 5.0, 7.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.10023313760757446, -0.09730792045593262, -0.09438270330429077, -0.09145748615264893, -0.08853226900100708, -0.08560705184936523, -0.08268183469772339, -0.07975661754608154, -0.0768314003944397, -0.07390618324279785, -0.070980966091156, -0.06805574893951416, -0.06513053178787231, -0.06220531463623047, -0.05928009748458862, -0.05635488033294678, -0.05342966318130493, -0.050504446029663086, -0.04757922887802124, -0.044654011726379395, -0.04172879457473755, -0.0388035774230957, -0.03587836027145386, -0.03295314311981201, -0.030027925968170166, -0.02710270881652832, -0.024177491664886475, -0.02125227451324463, -0.018327057361602783, -0.015401840209960938, -0.012476623058319092, -0.009551405906677246, -0.0066261887550354, -0.0037009716033935547, -0.000775754451751709, 0.0021494626998901367, 0.005074679851531982, 0.007999897003173828, 0.010925114154815674, 0.01385033130645752, 0.016775548458099365, 0.01970076560974121, 0.022625982761383057, 0.025551199913024902, 0.028476417064666748, 0.031401634216308594, 0.03432685136795044, 0.037252068519592285, 0.04017728567123413, 0.04310250282287598, 0.04602771997451782, 0.04895293712615967, 0.051878154277801514, 0.05480337142944336, 0.057728588581085205, 0.06065380573272705, 0.0635790228843689, 0.06650424003601074, 0.06942945718765259, 0.07235467433929443, 0.07527989149093628, 0.07820510864257812, 0.08113032579421997, 0.08405554294586182, 0.08698076009750366]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 13.0, 6.0, 9.0, 6.0, 12.0, 21.0, 17.0, 19.0, 21.0, 17.0, 22.0, 18.0, 28.0, 26.0, 35.0, 36.0, 41.0, 42.0, 36.0, 45.0, 37.0, 39.0, 36.0, 57.0, 43.0, 45.0, 27.0, 29.0, 26.0, 25.0, 32.0, 27.0, 16.0, 10.0, 12.0, 10.0, 9.0, 10.0, 6.0, 12.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.333984375, -3.22418212890625, -3.1143798828125, -3.00457763671875, -2.894775390625, -2.78497314453125, -2.6751708984375, -2.56536865234375, -2.45556640625, -2.34576416015625, -2.2359619140625, -2.12615966796875, -2.016357421875, -1.90655517578125, -1.7967529296875, -1.68695068359375, -1.5771484375, -1.46734619140625, -1.3575439453125, -1.24774169921875, -1.137939453125, -1.02813720703125, -0.9183349609375, -0.80853271484375, -0.69873046875, -0.58892822265625, -0.4791259765625, -0.36932373046875, -0.259521484375, -0.14971923828125, -0.0399169921875, 0.06988525390625, 0.1796875, 0.28948974609375, 0.3992919921875, 0.50909423828125, 0.618896484375, 0.72869873046875, 0.8385009765625, 0.94830322265625, 1.05810546875, 1.16790771484375, 1.2777099609375, 1.38751220703125, 1.497314453125, 1.60711669921875, 1.7169189453125, 1.82672119140625, 1.9365234375, 2.04632568359375, 2.1561279296875, 2.26593017578125, 2.375732421875, 2.48553466796875, 2.5953369140625, 2.70513916015625, 2.81494140625, 2.92474365234375, 3.0345458984375, 3.14434814453125, 3.254150390625, 3.36395263671875, 3.4737548828125, 3.58355712890625, 3.693359375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 9.0, 3.0, 5.0, 8.0, 8.0, 9.0, 28.0, 27.0, 26.0, 47.0, 62.0, 97.0, 153.0, 277.0, 463.0, 766.0, 1275.0, 2321.0, 4025.0, 6839.0, 11923.0, 20441.0, 34863.0, 59375.0, 101441.0, 171557.0, 272690.0, 148475.0, 87535.0, 51595.0, 30190.0, 17469.0, 10293.0, 6013.0, 3421.0, 2013.0, 1084.0, 691.0, 381.0, 214.0, 145.0, 90.0, 65.0, 37.0, 19.0, 26.0, 16.0, 10.0, 9.0, 7.0, 3.0, 4.0, 4.0, 7.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0], "bins": [-3.060546875, -2.959747314453125, -2.85894775390625, -2.758148193359375, -2.6573486328125, -2.556549072265625, -2.45574951171875, -2.354949951171875, -2.254150390625, -2.153350830078125, -2.05255126953125, -1.951751708984375, -1.8509521484375, -1.750152587890625, -1.64935302734375, -1.548553466796875, -1.44775390625, -1.346954345703125, -1.24615478515625, -1.145355224609375, -1.0445556640625, -0.943756103515625, -0.84295654296875, -0.742156982421875, -0.641357421875, -0.540557861328125, -0.43975830078125, -0.338958740234375, -0.2381591796875, -0.137359619140625, -0.03656005859375, 0.064239501953125, 0.1650390625, 0.265838623046875, 0.36663818359375, 0.467437744140625, 0.5682373046875, 0.669036865234375, 0.76983642578125, 0.870635986328125, 0.971435546875, 1.072235107421875, 1.17303466796875, 1.273834228515625, 1.3746337890625, 1.475433349609375, 1.57623291015625, 1.677032470703125, 1.77783203125, 1.878631591796875, 1.97943115234375, 2.080230712890625, 2.1810302734375, 2.281829833984375, 2.38262939453125, 2.483428955078125, 2.584228515625, 2.685028076171875, 2.78582763671875, 2.886627197265625, 2.9874267578125, 3.088226318359375, 3.18902587890625, 3.289825439453125, 3.390625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 7.0, 6.0, 5.0, 11.0, 10.0, 11.0, 15.0, 17.0, 19.0, 13.0, 29.0, 27.0, 51.0, 40.0, 48.0, 60.0, 74.0, 113.0, 248.0, 1454.0, 238.0, 130.0, 58.0, 39.0, 57.0, 43.0, 35.0, 29.0, 30.0, 25.0, 21.0, 14.0, 17.0, 13.0, 14.0, 9.0, 5.0, 8.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-14.3984375, -14.0042724609375, -13.610107421875, -13.2159423828125, -12.82177734375, -12.4276123046875, -12.033447265625, -11.6392822265625, -11.2451171875, -10.8509521484375, -10.456787109375, -10.0626220703125, -9.66845703125, -9.2742919921875, -8.880126953125, -8.4859619140625, -8.091796875, -7.6976318359375, -7.303466796875, -6.9093017578125, -6.51513671875, -6.1209716796875, -5.726806640625, -5.3326416015625, -4.9384765625, -4.5443115234375, -4.150146484375, -3.7559814453125, -3.36181640625, -2.9676513671875, -2.573486328125, -2.1793212890625, -1.78515625, -1.3909912109375, -0.996826171875, -0.6026611328125, -0.20849609375, 0.1856689453125, 0.579833984375, 0.9739990234375, 1.3681640625, 1.7623291015625, 2.156494140625, 2.5506591796875, 2.94482421875, 3.3389892578125, 3.733154296875, 4.1273193359375, 4.521484375, 4.9156494140625, 5.309814453125, 5.7039794921875, 6.09814453125, 6.4923095703125, 6.886474609375, 7.2806396484375, 7.6748046875, 8.0689697265625, 8.463134765625, 8.8572998046875, 9.25146484375, 9.6456298828125, 10.039794921875, 10.4339599609375, 10.828125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 0.0, 3.0, 7.0, 11.0, 6.0, 16.0, 19.0, 37.0, 57.0, 56.0, 83.0, 121.0, 204.0, 309.0, 641.0, 1953.0, 50504.0, 3050149.0, 38153.0, 1855.0, 601.0, 310.0, 175.0, 115.0, 104.0, 55.0, 38.0, 38.0, 27.0, 18.0, 15.0, 7.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.125, -31.07080078125, -30.0166015625, -28.96240234375, -27.908203125, -26.85400390625, -25.7998046875, -24.74560546875, -23.69140625, -22.63720703125, -21.5830078125, -20.52880859375, -19.474609375, -18.42041015625, -17.3662109375, -16.31201171875, -15.2578125, -14.20361328125, -13.1494140625, -12.09521484375, -11.041015625, -9.98681640625, -8.9326171875, -7.87841796875, -6.82421875, -5.77001953125, -4.7158203125, -3.66162109375, -2.607421875, -1.55322265625, -0.4990234375, 0.55517578125, 1.609375, 2.66357421875, 3.7177734375, 4.77197265625, 5.826171875, 6.88037109375, 7.9345703125, 8.98876953125, 10.04296875, 11.09716796875, 12.1513671875, 13.20556640625, 14.259765625, 15.31396484375, 16.3681640625, 17.42236328125, 18.4765625, 19.53076171875, 20.5849609375, 21.63916015625, 22.693359375, 23.74755859375, 24.8017578125, 25.85595703125, 26.91015625, 27.96435546875, 29.0185546875, 30.07275390625, 31.126953125, 32.18115234375, 33.2353515625, 34.28955078125, 35.34375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 207.0, 808.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.94216918945312, -74.82086181640625, -66.6995620727539, -58.5782585144043, -50.45695495605469, -42.33565139770508, -34.21434783935547, -26.09304428100586, -17.97174072265625, -9.85043716430664, -1.7291336059570312, 6.392169952392578, 14.513473510742188, 22.634777069091797, 30.756080627441406, 38.877384185791016, 46.998687744140625, 55.119991302490234, 63.241294860839844, 71.36259460449219, 79.48390197753906, 87.60520935058594, 95.72650909423828, 103.84780883789062, 111.9691162109375, 120.09042358398438, 128.21173095703125, 136.33302307128906, 144.45433044433594, 152.5756378173828, 160.69692993164062, 168.8182373046875, 176.9395751953125, 185.06088256835938, 193.18218994140625, 201.30348205566406, 209.42478942871094, 217.5460968017578, 225.66738891601562, 233.7886962890625, 241.91000366210938, 250.03131103515625, 258.1526184082031, 266.27392578125, 274.39520263671875, 282.5165100097656, 290.6378173828125, 298.7591247558594, 306.88043212890625, 315.0017395019531, 323.123046875, 331.2443542480469, 339.36566162109375, 347.4869384765625, 355.6082458496094, 363.72955322265625, 371.8508605957031, 379.97216796875, 388.0934753417969, 396.21478271484375, 404.3360595703125, 412.4573669433594, 420.57867431640625, 428.6999816894531, 436.8212890625]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 4.0, 3.0, 9.0, 17.0, 17.0, 22.0, 24.0, 32.0, 29.0, 31.0, 44.0, 35.0, 47.0, 42.0, 49.0, 60.0, 56.0, 48.0, 47.0, 43.0, 35.0, 36.0, 53.0, 25.0, 41.0, 29.0, 12.0, 24.0, 14.0, 12.0, 12.0, 8.0, 7.0, 10.0, 3.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-41.40367889404297, -40.222679138183594, -39.04167938232422, -37.860679626464844, -36.67967987060547, -35.498680114746094, -34.31768035888672, -33.136680603027344, -31.9556827545166, -30.774682998657227, -29.59368324279785, -28.412683486938477, -27.231685638427734, -26.05068588256836, -24.869686126708984, -23.68868637084961, -22.507686614990234, -21.32668685913086, -20.145687103271484, -18.96468734741211, -17.783687591552734, -16.60268783569336, -15.421689987182617, -14.240690231323242, -13.059690475463867, -11.878690719604492, -10.697690963745117, -9.516692161560059, -8.335692405700684, -7.154692649841309, -5.973693370819092, -4.792694091796875, -3.6116905212402344, -2.4306910037994385, -1.2496914863586426, -0.06869196891784668, 1.1123075485229492, 2.293307304382324, 3.474306583404541, 4.655305862426758, 5.836305618286133, 7.017305374145508, 8.198305130004883, 9.379303932189941, 10.560303688049316, 11.741303443908691, 12.92230224609375, 14.103302001953125, 15.2843017578125, 16.465301513671875, 17.64630126953125, 18.827301025390625, 20.00830078125, 21.189300537109375, 22.370298385620117, 23.551298141479492, 24.732297897338867, 25.913297653198242, 27.094297409057617, 28.275297164916992, 29.456295013427734, 30.63729476928711, 31.818294525146484, 32.99929428100586, 34.180294036865234]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 6.0, 5.0, 3.0, 14.0, 13.0, 10.0, 12.0, 20.0, 20.0, 18.0, 21.0, 28.0, 26.0, 18.0, 28.0, 35.0, 35.0, 44.0, 39.0, 49.0, 49.0, 40.0, 44.0, 28.0, 51.0, 46.0, 46.0, 37.0, 26.0, 28.0, 28.0, 28.0, 22.0, 17.0, 17.0, 11.0, 10.0, 6.0, 10.0, 6.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.751953125, -3.627349853515625, -3.50274658203125, -3.378143310546875, -3.2535400390625, -3.128936767578125, -3.00433349609375, -2.879730224609375, -2.755126953125, -2.630523681640625, -2.50592041015625, -2.381317138671875, -2.2567138671875, -2.132110595703125, -2.00750732421875, -1.882904052734375, -1.75830078125, -1.633697509765625, -1.50909423828125, -1.384490966796875, -1.2598876953125, -1.135284423828125, -1.01068115234375, -0.886077880859375, -0.761474609375, -0.636871337890625, -0.51226806640625, -0.387664794921875, -0.2630615234375, -0.138458251953125, -0.01385498046875, 0.110748291015625, 0.2353515625, 0.359954833984375, 0.48455810546875, 0.609161376953125, 0.7337646484375, 0.858367919921875, 0.98297119140625, 1.107574462890625, 1.232177734375, 1.356781005859375, 1.48138427734375, 1.605987548828125, 1.7305908203125, 1.855194091796875, 1.97979736328125, 2.104400634765625, 2.22900390625, 2.353607177734375, 2.47821044921875, 2.602813720703125, 2.7274169921875, 2.852020263671875, 2.97662353515625, 3.101226806640625, 3.225830078125, 3.350433349609375, 3.47503662109375, 3.599639892578125, 3.7242431640625, 3.848846435546875, 3.97344970703125, 4.098052978515625, 4.22265625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 1.0, 11.0, 5.0, 7.0, 14.0, 13.0, 15.0, 15.0, 17.0, 30.0, 27.0, 36.0, 55.0, 110.0, 192.0, 381.0, 942.0, 2967.0, 11368.0, 49904.0, 231804.0, 1088162.0, 1995366.0, 639905.0, 134113.0, 28923.0, 6715.0, 1881.0, 626.0, 258.0, 136.0, 74.0, 33.0, 27.0, 26.0, 36.0, 8.0, 18.0, 9.0, 6.0, 8.0, 7.0, 6.0, 6.0, 6.0, 1.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.66015625, -6.447509765625, -6.23486328125, -6.022216796875, -5.8095703125, -5.596923828125, -5.38427734375, -5.171630859375, -4.958984375, -4.746337890625, -4.53369140625, -4.321044921875, -4.1083984375, -3.895751953125, -3.68310546875, -3.470458984375, -3.2578125, -3.045166015625, -2.83251953125, -2.619873046875, -2.4072265625, -2.194580078125, -1.98193359375, -1.769287109375, -1.556640625, -1.343994140625, -1.13134765625, -0.918701171875, -0.7060546875, -0.493408203125, -0.28076171875, -0.068115234375, 0.14453125, 0.357177734375, 0.56982421875, 0.782470703125, 0.9951171875, 1.207763671875, 1.42041015625, 1.633056640625, 1.845703125, 2.058349609375, 2.27099609375, 2.483642578125, 2.6962890625, 2.908935546875, 3.12158203125, 3.334228515625, 3.546875, 3.759521484375, 3.97216796875, 4.184814453125, 4.3974609375, 4.610107421875, 4.82275390625, 5.035400390625, 5.248046875, 5.460693359375, 5.67333984375, 5.885986328125, 6.0986328125, 6.311279296875, 6.52392578125, 6.736572265625, 6.94921875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 7.0, 4.0, 10.0, 14.0, 19.0, 22.0, 32.0, 39.0, 43.0, 62.0, 87.0, 116.0, 153.0, 210.0, 280.0, 361.0, 426.0, 444.0, 355.0, 354.0, 259.0, 202.0, 125.0, 123.0, 90.0, 64.0, 39.0, 18.0, 26.0, 21.0, 13.0, 13.0, 8.0, 11.0, 2.0, 7.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.640625, -6.44744873046875, -6.2542724609375, -6.06109619140625, -5.867919921875, -5.67474365234375, -5.4815673828125, -5.28839111328125, -5.09521484375, -4.90203857421875, -4.7088623046875, -4.51568603515625, -4.322509765625, -4.12933349609375, -3.9361572265625, -3.74298095703125, -3.5498046875, -3.35662841796875, -3.1634521484375, -2.97027587890625, -2.777099609375, -2.58392333984375, -2.3907470703125, -2.19757080078125, -2.00439453125, -1.81121826171875, -1.6180419921875, -1.42486572265625, -1.231689453125, -1.03851318359375, -0.8453369140625, -0.65216064453125, -0.458984375, -0.26580810546875, -0.0726318359375, 0.12054443359375, 0.313720703125, 0.50689697265625, 0.7000732421875, 0.89324951171875, 1.08642578125, 1.27960205078125, 1.4727783203125, 1.66595458984375, 1.859130859375, 2.05230712890625, 2.2454833984375, 2.43865966796875, 2.6318359375, 2.82501220703125, 3.0181884765625, 3.21136474609375, 3.404541015625, 3.59771728515625, 3.7908935546875, 3.98406982421875, 4.17724609375, 4.37042236328125, 4.5635986328125, 4.75677490234375, 4.949951171875, 5.14312744140625, 5.3363037109375, 5.52947998046875, 5.72265625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 8.0, 3.0, 2.0, 11.0, 8.0, 13.0, 11.0, 23.0, 20.0, 31.0, 41.0, 61.0, 85.0, 135.0, 144.0, 230.0, 396.0, 868.0, 35337.0, 3818846.0, 334258.0, 2250.0, 506.0, 281.0, 212.0, 130.0, 98.0, 65.0, 43.0, 38.0, 37.0, 22.0, 18.0, 17.0, 8.0, 7.0, 5.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.21875, -30.20166015625, -29.1845703125, -28.16748046875, -27.150390625, -26.13330078125, -25.1162109375, -24.09912109375, -23.08203125, -22.06494140625, -21.0478515625, -20.03076171875, -19.013671875, -17.99658203125, -16.9794921875, -15.96240234375, -14.9453125, -13.92822265625, -12.9111328125, -11.89404296875, -10.876953125, -9.85986328125, -8.8427734375, -7.82568359375, -6.80859375, -5.79150390625, -4.7744140625, -3.75732421875, -2.740234375, -1.72314453125, -0.7060546875, 0.31103515625, 1.328125, 2.34521484375, 3.3623046875, 4.37939453125, 5.396484375, 6.41357421875, 7.4306640625, 8.44775390625, 9.46484375, 10.48193359375, 11.4990234375, 12.51611328125, 13.533203125, 14.55029296875, 15.5673828125, 16.58447265625, 17.6015625, 18.61865234375, 19.6357421875, 20.65283203125, 21.669921875, 22.68701171875, 23.7041015625, 24.72119140625, 25.73828125, 26.75537109375, 27.7724609375, 28.78955078125, 29.806640625, 30.82373046875, 31.8408203125, 32.85791015625, 33.875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 14.0, 39.0, 94.0, 115.0, 169.0, 179.0, 170.0, 110.0, 67.0, 37.0, 9.0, 4.0, 1.0, 2.0], "bins": [-87.52429962158203, -85.94474792480469, -84.36518859863281, -82.78562927246094, -81.2060775756836, -79.62652587890625, -78.04696655273438, -76.4674072265625, -74.88785552978516, -73.30830383300781, -71.72874450683594, -70.14918518066406, -68.56963348388672, -66.99008178710938, -65.4105224609375, -63.83096694946289, -62.25141143798828, -60.67185592651367, -59.09230041503906, -57.51274490356445, -55.933189392089844, -54.353633880615234, -52.774078369140625, -51.194522857666016, -49.614967346191406, -48.0354118347168, -46.45585632324219, -44.87630081176758, -43.29674530029297, -41.71718978881836, -40.13763427734375, -38.55807876586914, -36.97852325439453, -35.39896774291992, -33.81941223144531, -32.2398567199707, -30.660301208496094, -29.080745697021484, -27.501190185546875, -25.921634674072266, -24.342077255249023, -22.762521743774414, -21.182966232299805, -19.603410720825195, -18.023855209350586, -16.444299697875977, -14.864744186401367, -13.285188674926758, -11.705633163452148, -10.126077651977539, -8.54652214050293, -6.96696662902832, -5.387411117553711, -3.8078556060791016, -2.228300094604492, -0.6487445831298828, 0.9308109283447266, 2.510366439819336, 4.089921951293945, 5.669477462768555, 7.249032974243164, 8.828588485717773, 10.408143997192383, 11.987699508666992, 13.567255020141602]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 9.0, 11.0, 10.0, 9.0, 17.0, 14.0, 14.0, 16.0, 23.0, 19.0, 35.0, 15.0, 20.0, 34.0, 36.0, 38.0, 31.0, 34.0, 40.0, 35.0, 34.0, 32.0, 47.0, 47.0, 26.0, 31.0, 40.0, 30.0, 30.0, 23.0, 23.0, 18.0, 20.0, 13.0, 18.0, 15.0, 14.0, 10.0, 10.0, 10.0, 11.0, 10.0, 4.0, 2.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.190101623535156, -16.613265991210938, -16.03643226623535, -15.459596633911133, -14.88276195526123, -14.305927276611328, -13.72909164428711, -13.152256965637207, -12.575422286987305, -11.998587608337402, -11.4217529296875, -10.844917297363281, -10.268082618713379, -9.691247940063477, -9.114412307739258, -8.537577629089355, -7.960742950439453, -7.383908271789551, -6.80707311630249, -6.23023796081543, -5.653403282165527, -5.076568603515625, -4.4997334480285645, -3.922898292541504, -3.3460636138916016, -2.76922869682312, -2.1923937797546387, -1.6155588626861572, -1.0387239456176758, -0.46188902854919434, 0.11494588851928711, 0.6917810440063477, 1.26861572265625, 1.8454506397247314, 2.422285556793213, 2.9991204738616943, 3.575955390930176, 4.152790069580078, 4.729625225067139, 5.306460380554199, 5.883295059204102, 6.460129737854004, 7.0369648933410645, 7.613800048828125, 8.190634727478027, 8.76746940612793, 9.344305038452148, 9.92113971710205, 10.497974395751953, 11.074809074401855, 11.651643753051758, 12.228479385375977, 12.805314064025879, 13.382148742675781, 13.958984375, 14.535819053649902, 15.112653732299805, 15.689488410949707, 16.26632308959961, 16.843158721923828, 17.419994354248047, 17.996828079223633, 18.57366371154785, 19.150497436523438, 19.727333068847656]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 0.0, 4.0, 7.0, 4.0, 5.0, 8.0, 14.0, 6.0, 18.0, 19.0, 17.0, 22.0, 28.0, 18.0, 29.0, 29.0, 35.0, 35.0, 36.0, 43.0, 43.0, 35.0, 38.0, 47.0, 46.0, 48.0, 33.0, 44.0, 33.0, 30.0, 37.0, 32.0, 20.0, 29.0, 18.0, 15.0, 16.0, 10.0, 8.0, 8.0, 6.0, 8.0, 1.0, 4.0, 5.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.443359375, -3.3310546875, -3.21875, -3.1064453125, -2.994140625, -2.8818359375, -2.76953125, -2.6572265625, -2.544921875, -2.4326171875, -2.3203125, -2.2080078125, -2.095703125, -1.9833984375, -1.87109375, -1.7587890625, -1.646484375, -1.5341796875, -1.421875, -1.3095703125, -1.197265625, -1.0849609375, -0.97265625, -0.8603515625, -0.748046875, -0.6357421875, -0.5234375, -0.4111328125, -0.298828125, -0.1865234375, -0.07421875, 0.0380859375, 0.150390625, 0.2626953125, 0.375, 0.4873046875, 0.599609375, 0.7119140625, 0.82421875, 0.9365234375, 1.048828125, 1.1611328125, 1.2734375, 1.3857421875, 1.498046875, 1.6103515625, 1.72265625, 1.8349609375, 1.947265625, 2.0595703125, 2.171875, 2.2841796875, 2.396484375, 2.5087890625, 2.62109375, 2.7333984375, 2.845703125, 2.9580078125, 3.0703125, 3.1826171875, 3.294921875, 3.4072265625, 3.51953125, 3.6318359375, 3.744140625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 4.0, 8.0, 14.0, 15.0, 40.0, 36.0, 69.0, 106.0, 176.0, 293.0, 434.0, 632.0, 1109.0, 1821.0, 2822.0, 4474.0, 7081.0, 10902.0, 16934.0, 25339.0, 36895.0, 52348.0, 72591.0, 94025.0, 114497.0, 125191.0, 119231.0, 100882.0, 78878.0, 58300.0, 41370.0, 28361.0, 19110.0, 12493.0, 8146.0, 5269.0, 3249.0, 2091.0, 1242.0, 773.0, 472.0, 313.0, 201.0, 127.0, 62.0, 54.0, 25.0, 16.0, 15.0, 12.0, 1.0, 4.0, 7.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.69482421875, -0.6721572875976562, -0.6494903564453125, -0.6268234252929688, -0.604156494140625, -0.5814895629882812, -0.5588226318359375, -0.5361557006835938, -0.51348876953125, -0.49082183837890625, -0.4681549072265625, -0.44548797607421875, -0.422821044921875, -0.40015411376953125, -0.3774871826171875, -0.35482025146484375, -0.3321533203125, -0.30948638916015625, -0.2868194580078125, -0.26415252685546875, -0.241485595703125, -0.21881866455078125, -0.1961517333984375, -0.17348480224609375, -0.15081787109375, -0.12815093994140625, -0.1054840087890625, -0.08281707763671875, -0.060150146484375, -0.03748321533203125, -0.0148162841796875, 0.00785064697265625, 0.030517578125, 0.05318450927734375, 0.0758514404296875, 0.09851837158203125, 0.121185302734375, 0.14385223388671875, 0.1665191650390625, 0.18918609619140625, 0.21185302734375, 0.23451995849609375, 0.2571868896484375, 0.27985382080078125, 0.302520751953125, 0.32518768310546875, 0.3478546142578125, 0.37052154541015625, 0.3931884765625, 0.41585540771484375, 0.4385223388671875, 0.46118927001953125, 0.483856201171875, 0.5065231323242188, 0.5291900634765625, 0.5518569946289062, 0.57452392578125, 0.5971908569335938, 0.6198577880859375, 0.6425247192382812, 0.665191650390625, 0.6878585815429688, 0.7105255126953125, 0.7331924438476562, 0.755859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 6.0, 4.0, 7.0, 5.0, 6.0, 11.0, 7.0, 17.0, 14.0, 19.0, 26.0, 22.0, 21.0, 27.0, 35.0, 35.0, 39.0, 31.0, 41.0, 44.0, 35.0, 47.0, 1072.0, 41.0, 53.0, 40.0, 36.0, 33.0, 37.0, 25.0, 27.0, 28.0, 25.0, 17.0, 11.0, 15.0, 15.0, 11.0, 5.0, 9.0, 6.0, 9.0, 5.0, 5.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.77734375, -2.688873291015625, -2.60040283203125, -2.511932373046875, -2.4234619140625, -2.334991455078125, -2.24652099609375, -2.158050537109375, -2.069580078125, -1.981109619140625, -1.89263916015625, -1.804168701171875, -1.7156982421875, -1.627227783203125, -1.53875732421875, -1.450286865234375, -1.36181640625, -1.273345947265625, -1.18487548828125, -1.096405029296875, -1.0079345703125, -0.919464111328125, -0.83099365234375, -0.742523193359375, -0.654052734375, -0.565582275390625, -0.47711181640625, -0.388641357421875, -0.3001708984375, -0.211700439453125, -0.12322998046875, -0.034759521484375, 0.0537109375, 0.142181396484375, 0.23065185546875, 0.319122314453125, 0.4075927734375, 0.496063232421875, 0.58453369140625, 0.673004150390625, 0.761474609375, 0.849945068359375, 0.93841552734375, 1.026885986328125, 1.1153564453125, 1.203826904296875, 1.29229736328125, 1.380767822265625, 1.46923828125, 1.557708740234375, 1.64617919921875, 1.734649658203125, 1.8231201171875, 1.911590576171875, 2.00006103515625, 2.088531494140625, 2.177001953125, 2.265472412109375, 2.35394287109375, 2.442413330078125, 2.5308837890625, 2.619354248046875, 2.70782470703125, 2.796295166015625, 2.884765625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 10.0, 13.0, 25.0, 44.0, 47.0, 55.0, 86.0, 172.0, 203.0, 328.0, 502.0, 693.0, 1153.0, 1725.0, 2629.0, 4031.0, 6347.0, 10019.0, 16605.0, 27777.0, 111500.0, 1798210.0, 53083.0, 23240.0, 14139.0, 8728.0, 5660.0, 3439.0, 2274.0, 1438.0, 1016.0, 639.0, 410.0, 278.0, 197.0, 134.0, 82.0, 66.0, 50.0, 34.0, 19.0, 6.0, 7.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.94140625, -1.8848876953125, -1.828369140625, -1.7718505859375, -1.71533203125, -1.6588134765625, -1.602294921875, -1.5457763671875, -1.4892578125, -1.4327392578125, -1.376220703125, -1.3197021484375, -1.26318359375, -1.2066650390625, -1.150146484375, -1.0936279296875, -1.037109375, -0.9805908203125, -0.924072265625, -0.8675537109375, -0.81103515625, -0.7545166015625, -0.697998046875, -0.6414794921875, -0.5849609375, -0.5284423828125, -0.471923828125, -0.4154052734375, -0.35888671875, -0.3023681640625, -0.245849609375, -0.1893310546875, -0.1328125, -0.0762939453125, -0.019775390625, 0.0367431640625, 0.09326171875, 0.1497802734375, 0.206298828125, 0.2628173828125, 0.3193359375, 0.3758544921875, 0.432373046875, 0.4888916015625, 0.54541015625, 0.6019287109375, 0.658447265625, 0.7149658203125, 0.771484375, 0.8280029296875, 0.884521484375, 0.9410400390625, 0.99755859375, 1.0540771484375, 1.110595703125, 1.1671142578125, 1.2236328125, 1.2801513671875, 1.336669921875, 1.3931884765625, 1.44970703125, 1.5062255859375, 1.562744140625, 1.6192626953125, 1.67578125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 4.0, 8.0, 8.0, 11.0, 15.0, 13.0, 24.0, 21.0, 22.0, 40.0, 43.0, 58.0, 57.0, 67.0, 61.0, 84.0, 93.0, 59.0, 63.0, 50.0, 39.0, 31.0, 25.0, 26.0, 27.0, 15.0, 11.0, 8.0, 5.0, 8.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06622314453125, -0.06329345703125, -0.06036376953125, -0.05743408203125, -0.05450439453125, -0.05157470703125, -0.04864501953125, -0.04571533203125, -0.04278564453125, -0.03985595703125, -0.03692626953125, -0.03399658203125, -0.03106689453125, -0.02813720703125, -0.02520751953125, -0.02227783203125, -0.01934814453125, -0.01641845703125, -0.01348876953125, -0.01055908203125, -0.00762939453125, -0.00469970703125, -0.00177001953125, 0.00115966796875, 0.00408935546875, 0.00701904296875, 0.00994873046875, 0.01287841796875, 0.01580810546875, 0.01873779296875, 0.02166748046875, 0.02459716796875, 0.02752685546875, 0.03045654296875, 0.03338623046875, 0.03631591796875, 0.03924560546875, 0.04217529296875, 0.04510498046875, 0.04803466796875, 0.05096435546875, 0.05389404296875, 0.05682373046875, 0.05975341796875, 0.06268310546875, 0.06561279296875, 0.06854248046875, 0.07147216796875, 0.07440185546875, 0.07733154296875, 0.08026123046875, 0.08319091796875, 0.08612060546875, 0.08905029296875, 0.09197998046875, 0.09490966796875, 0.09783935546875, 0.10076904296875, 0.10369873046875, 0.10662841796875, 0.10955810546875, 0.11248779296875, 0.11541748046875, 0.11834716796875, 0.12127685546875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 7.0, 1.0, 2.0, 8.0, 9.0, 9.0, 15.0, 23.0, 30.0, 35.0, 41.0, 87.0, 161.0, 268.0, 827.0, 93566.0, 951267.0, 1335.0, 362.0, 161.0, 123.0, 65.0, 41.0, 24.0, 20.0, 24.0, 18.0, 7.0, 8.0, 10.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.748046875, -2.6812896728515625, -2.614532470703125, -2.5477752685546875, -2.48101806640625, -2.4142608642578125, -2.347503662109375, -2.2807464599609375, -2.2139892578125, -2.1472320556640625, -2.080474853515625, -2.0137176513671875, -1.94696044921875, -1.8802032470703125, -1.813446044921875, -1.7466888427734375, -1.679931640625, -1.6131744384765625, -1.546417236328125, -1.4796600341796875, -1.41290283203125, -1.3461456298828125, -1.279388427734375, -1.2126312255859375, -1.1458740234375, -1.0791168212890625, -1.012359619140625, -0.9456024169921875, -0.87884521484375, -0.8120880126953125, -0.745330810546875, -0.6785736083984375, -0.61181640625, -0.5450592041015625, -0.478302001953125, -0.4115447998046875, -0.34478759765625, -0.2780303955078125, -0.211273193359375, -0.1445159912109375, -0.0777587890625, -0.0110015869140625, 0.055755615234375, 0.1225128173828125, 0.18927001953125, 0.2560272216796875, 0.322784423828125, 0.3895416259765625, 0.456298828125, 0.5230560302734375, 0.589813232421875, 0.6565704345703125, 0.72332763671875, 0.7900848388671875, 0.856842041015625, 0.9235992431640625, 0.9903564453125, 1.0571136474609375, 1.123870849609375, 1.1906280517578125, 1.25738525390625, 1.3241424560546875, 1.390899658203125, 1.4576568603515625, 1.5244140625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 24.0, 756.0, 224.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.046271800994873, -1.9934687614440918, -1.9406657218933105, -1.8878625631332397, -1.8350595235824585, -1.7822564840316772, -1.7294533252716064, -1.6766502857208252, -1.623847246170044, -1.5710442066192627, -1.5182411670684814, -1.4654380083084106, -1.4126349687576294, -1.3598319292068481, -1.3070287704467773, -1.254225730895996, -1.2014226913452148, -1.1486196517944336, -1.0958166122436523, -1.0430134534835815, -0.9902104139328003, -0.937407374382019, -0.884604275226593, -0.831801176071167, -0.7789981365203857, -0.7261950969696045, -0.6733919978141785, -0.6205888986587524, -0.5677858591079712, -0.5149828195571899, -0.4621797204017639, -0.4093766510486603, -0.3565737009048462, -0.30377063155174255, -0.2509675621986389, -0.19816449284553528, -0.14536142349243164, -0.092558354139328, -0.039755284786224365, 0.013047784566879272, 0.06585085391998291, 0.11865392327308655, 0.17145699262619019, 0.22426006197929382, 0.27706313133239746, 0.3298662006855011, 0.38266927003860474, 0.4354723393917084, 0.488275408744812, 0.5410784482955933, 0.5938815474510193, 0.6466846466064453, 0.6994876861572266, 0.7522907257080078, 0.8050938248634338, 0.8578969240188599, 0.9106999635696411, 0.9635030031204224, 1.0163061618804932, 1.0691092014312744, 1.1219122409820557, 1.174715280532837, 1.2275183200836182, 1.280321478843689, 1.3331245183944702]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 10.0, 11.0, 17.0, 24.0, 22.0, 35.0, 40.0, 63.0, 70.0, 64.0, 72.0, 56.0, 75.0, 61.0, 70.0, 60.0, 63.0, 51.0, 35.0, 30.0, 28.0, 14.0, 11.0, 7.0, 12.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3676096796989441, -0.356763631105423, -0.34591755270957947, -0.33507150411605835, -0.32422545552253723, -0.3133794069290161, -0.3025333285331726, -0.2916872799396515, -0.28084123134613037, -0.26999518275260925, -0.25914910435676575, -0.24830305576324463, -0.2374570071697235, -0.2266109436750412, -0.2157648801803589, -0.20491883158683777, -0.19407275319099426, -0.18322668969631195, -0.17238064110279083, -0.16153457760810852, -0.1506885290145874, -0.1398424655199051, -0.12899640202522278, -0.11815034598112106, -0.10730428993701935, -0.09645823389291763, -0.08561217784881592, -0.0747661143541336, -0.06392005831003189, -0.053074002265930176, -0.042227938771247864, -0.03138188272714615, -0.020535826683044434, -0.00968976877629757, 0.001156289130449295, 0.012002348899841309, 0.022848404943943024, 0.03369446098804474, 0.04454052448272705, 0.055386580526828766, 0.06623263657093048, 0.0770786926150322, 0.08792474865913391, 0.09877081215381622, 0.10961686819791794, 0.12046292424201965, 0.13130898773670197, 0.14215505123138428, 0.1530010998249054, 0.1638471633195877, 0.17469321191310883, 0.18553927540779114, 0.19638532400131226, 0.20723138749599457, 0.21807745099067688, 0.228923499584198, 0.2397695630788803, 0.2506156265735626, 0.26146167516708374, 0.27230775356292725, 0.28315380215644836, 0.2939998507499695, 0.304845929145813, 0.3156919777393341, 0.3265380263328552]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 7.0, 3.0, 5.0, 4.0, 10.0, 5.0, 11.0, 12.0, 17.0, 20.0, 19.0, 22.0, 31.0, 20.0, 34.0, 30.0, 45.0, 41.0, 36.0, 33.0, 40.0, 43.0, 44.0, 42.0, 48.0, 29.0, 44.0, 39.0, 34.0, 29.0, 34.0, 30.0, 18.0, 16.0, 17.0, 19.0, 9.0, 8.0, 12.0, 10.0, 4.0, 5.0, 3.0, 7.0, 5.0, 2.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0], "bins": [-3.8203125, -3.707672119140625, -3.59503173828125, -3.482391357421875, -3.3697509765625, -3.257110595703125, -3.14447021484375, -3.031829833984375, -2.919189453125, -2.806549072265625, -2.69390869140625, -2.581268310546875, -2.4686279296875, -2.355987548828125, -2.24334716796875, -2.130706787109375, -2.01806640625, -1.905426025390625, -1.79278564453125, -1.680145263671875, -1.5675048828125, -1.454864501953125, -1.34222412109375, -1.229583740234375, -1.116943359375, -1.004302978515625, -0.89166259765625, -0.779022216796875, -0.6663818359375, -0.553741455078125, -0.44110107421875, -0.328460693359375, -0.2158203125, -0.103179931640625, 0.00946044921875, 0.122100830078125, 0.2347412109375, 0.347381591796875, 0.46002197265625, 0.572662353515625, 0.685302734375, 0.797943115234375, 0.91058349609375, 1.023223876953125, 1.1358642578125, 1.248504638671875, 1.36114501953125, 1.473785400390625, 1.58642578125, 1.699066162109375, 1.81170654296875, 1.924346923828125, 2.0369873046875, 2.149627685546875, 2.26226806640625, 2.374908447265625, 2.487548828125, 2.600189208984375, 2.71282958984375, 2.825469970703125, 2.9381103515625, 3.050750732421875, 3.16339111328125, 3.276031494140625, 3.388671875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 8.0, 4.0, 7.0, 7.0, 15.0, 11.0, 16.0, 29.0, 30.0, 51.0, 57.0, 115.0, 171.0, 340.0, 781.0, 1781.0, 4410.0, 11278.0, 27441.0, 67345.0, 187430.0, 427931.0, 199307.0, 70999.0, 28803.0, 11831.0, 4704.0, 1931.0, 824.0, 371.0, 165.0, 115.0, 66.0, 51.0, 28.0, 21.0, 14.0, 11.0, 8.0, 11.0, 7.0, 5.0, 6.0, 4.0, 4.0, 2.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-5.3984375, -5.2374267578125, -5.076416015625, -4.9154052734375, -4.75439453125, -4.5933837890625, -4.432373046875, -4.2713623046875, -4.1103515625, -3.9493408203125, -3.788330078125, -3.6273193359375, -3.46630859375, -3.3052978515625, -3.144287109375, -2.9832763671875, -2.822265625, -2.6612548828125, -2.500244140625, -2.3392333984375, -2.17822265625, -2.0172119140625, -1.856201171875, -1.6951904296875, -1.5341796875, -1.3731689453125, -1.212158203125, -1.0511474609375, -0.89013671875, -0.7291259765625, -0.568115234375, -0.4071044921875, -0.24609375, -0.0850830078125, 0.075927734375, 0.2369384765625, 0.39794921875, 0.5589599609375, 0.719970703125, 0.8809814453125, 1.0419921875, 1.2030029296875, 1.364013671875, 1.5250244140625, 1.68603515625, 1.8470458984375, 2.008056640625, 2.1690673828125, 2.330078125, 2.4910888671875, 2.652099609375, 2.8131103515625, 2.97412109375, 3.1351318359375, 3.296142578125, 3.4571533203125, 3.6181640625, 3.7791748046875, 3.940185546875, 4.1011962890625, 4.26220703125, 4.4232177734375, 4.584228515625, 4.7452392578125, 4.90625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 10.0, 6.0, 7.0, 4.0, 10.0, 14.0, 5.0, 15.0, 12.0, 18.0, 30.0, 20.0, 28.0, 36.0, 41.0, 38.0, 61.0, 72.0, 129.0, 251.0, 1488.0, 223.0, 107.0, 76.0, 60.0, 52.0, 34.0, 35.0, 30.0, 22.0, 19.0, 15.0, 15.0, 17.0, 13.0, 4.0, 6.0, 6.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.3203125, -11.915771484375, -11.51123046875, -11.106689453125, -10.7021484375, -10.297607421875, -9.89306640625, -9.488525390625, -9.083984375, -8.679443359375, -8.27490234375, -7.870361328125, -7.4658203125, -7.061279296875, -6.65673828125, -6.252197265625, -5.84765625, -5.443115234375, -5.03857421875, -4.634033203125, -4.2294921875, -3.824951171875, -3.42041015625, -3.015869140625, -2.611328125, -2.206787109375, -1.80224609375, -1.397705078125, -0.9931640625, -0.588623046875, -0.18408203125, 0.220458984375, 0.625, 1.029541015625, 1.43408203125, 1.838623046875, 2.2431640625, 2.647705078125, 3.05224609375, 3.456787109375, 3.861328125, 4.265869140625, 4.67041015625, 5.074951171875, 5.4794921875, 5.884033203125, 6.28857421875, 6.693115234375, 7.09765625, 7.502197265625, 7.90673828125, 8.311279296875, 8.7158203125, 9.120361328125, 9.52490234375, 9.929443359375, 10.333984375, 10.738525390625, 11.14306640625, 11.547607421875, 11.9521484375, 12.356689453125, 12.76123046875, 13.165771484375, 13.5703125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 9.0, 20.0, 17.0, 35.0, 60.0, 119.0, 188.0, 574.0, 5924.0, 3126994.0, 10555.0, 667.0, 247.0, 120.0, 58.0, 37.0, 26.0, 20.0, 15.0, 6.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-63.15625, -61.27392578125, -59.3916015625, -57.50927734375, -55.626953125, -53.74462890625, -51.8623046875, -49.97998046875, -48.09765625, -46.21533203125, -44.3330078125, -42.45068359375, -40.568359375, -38.68603515625, -36.8037109375, -34.92138671875, -33.0390625, -31.15673828125, -29.2744140625, -27.39208984375, -25.509765625, -23.62744140625, -21.7451171875, -19.86279296875, -17.98046875, -16.09814453125, -14.2158203125, -12.33349609375, -10.451171875, -8.56884765625, -6.6865234375, -4.80419921875, -2.921875, -1.03955078125, 0.8427734375, 2.72509765625, 4.607421875, 6.48974609375, 8.3720703125, 10.25439453125, 12.13671875, 14.01904296875, 15.9013671875, 17.78369140625, 19.666015625, 21.54833984375, 23.4306640625, 25.31298828125, 27.1953125, 29.07763671875, 30.9599609375, 32.84228515625, 34.724609375, 36.60693359375, 38.4892578125, 40.37158203125, 42.25390625, 44.13623046875, 46.0185546875, 47.90087890625, 49.783203125, 51.66552734375, 53.5478515625, 55.43017578125, 57.3125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 987.0, 26.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.11361694335938, -97.85798645019531, -86.60236358642578, -75.34674072265625, -64.09111022949219, -52.83548355102539, -41.579856872558594, -30.324234008789062, -19.068603515625, -7.812976837158203, 3.4426498413085938, 14.69827651977539, 25.953903198242188, 37.209529876708984, 48.46515655517578, 59.72077941894531, 70.97640991210938, 82.23204040527344, 93.48766326904297, 104.7432861328125, 115.99891662597656, 127.25454711914062, 138.51016235351562, 149.7657928466797, 161.02142333984375, 172.2770538330078, 183.53268432617188, 194.78829956054688, 206.04393005371094, 217.299560546875, 228.55517578125, 239.81080627441406, 251.06640625, 262.322021484375, 273.5776672363281, 284.8332824707031, 296.08892822265625, 307.34454345703125, 318.60015869140625, 329.85577392578125, 341.1114196777344, 352.3670349121094, 363.6226806640625, 374.8782958984375, 386.1339111328125, 397.3895568847656, 408.6451721191406, 419.90081787109375, 431.15643310546875, 442.41204833984375, 453.6676940917969, 464.9233093261719, 476.178955078125, 487.4345703125, 498.690185546875, 509.94580078125, 521.201416015625, 532.45703125, 543.712646484375, 554.9683227539062, 566.2239379882812, 577.4795532226562, 588.7351684570312, 599.9907836914062, 611.2464599609375]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 4.0, 5.0, 7.0, 12.0, 15.0, 10.0, 6.0, 20.0, 17.0, 17.0, 16.0, 22.0, 28.0, 32.0, 30.0, 39.0, 26.0, 24.0, 38.0, 40.0, 42.0, 35.0, 45.0, 29.0, 38.0, 32.0, 33.0, 27.0, 27.0, 28.0, 29.0, 26.0, 20.0, 26.0, 23.0, 18.0, 16.0, 13.0, 7.0, 14.0, 9.0, 12.0, 6.0, 3.0, 7.0, 4.0, 4.0, 4.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-28.298845291137695, -27.367408752441406, -26.435972213745117, -25.504535675048828, -24.57309913635254, -23.64166259765625, -22.71022605895996, -21.778789520263672, -20.847352981567383, -19.915916442871094, -18.984479904174805, -18.053043365478516, -17.121606826782227, -16.190170288085938, -15.258733749389648, -14.32729721069336, -13.395859718322754, -12.464423179626465, -11.532986640930176, -10.601550102233887, -9.670113563537598, -8.738676071166992, -7.807240009307861, -6.875803470611572, -5.944366931915283, -5.012930393218994, -4.081493854522705, -3.150057077407837, -2.218620538711548, -1.2871837615966797, -0.3557472229003906, 0.5756893157958984, 1.5071258544921875, 2.4385623931884766, 3.3699989318847656, 4.301435470581055, 5.232872009277344, 6.164309024810791, 7.09574556350708, 8.027181625366211, 8.9586181640625, 9.890054702758789, 10.821491241455078, 11.752927780151367, 12.684364318847656, 13.615800857543945, 14.547237396240234, 15.478673934936523, 16.410110473632812, 17.3415470123291, 18.27298355102539, 19.20442008972168, 20.13585662841797, 21.067293167114258, 21.998729705810547, 22.930166244506836, 23.861604690551758, 24.793041229248047, 25.724477767944336, 26.655914306640625, 27.587350845336914, 28.518787384033203, 29.450223922729492, 30.38166046142578, 31.31309700012207]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 8.0, 7.0, 14.0, 9.0, 12.0, 11.0, 14.0, 15.0, 24.0, 19.0, 19.0, 28.0, 29.0, 42.0, 40.0, 37.0, 31.0, 43.0, 39.0, 45.0, 35.0, 37.0, 46.0, 46.0, 32.0, 43.0, 35.0, 33.0, 28.0, 29.0, 20.0, 21.0, 11.0, 12.0, 17.0, 15.0, 11.0, 9.0, 5.0, 5.0, 4.0, 0.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-4.1796875, -4.05694580078125, -3.9342041015625, -3.81146240234375, -3.688720703125, -3.56597900390625, -3.4432373046875, -3.32049560546875, -3.19775390625, -3.07501220703125, -2.9522705078125, -2.82952880859375, -2.706787109375, -2.58404541015625, -2.4613037109375, -2.33856201171875, -2.2158203125, -2.09307861328125, -1.9703369140625, -1.84759521484375, -1.724853515625, -1.60211181640625, -1.4793701171875, -1.35662841796875, -1.23388671875, -1.11114501953125, -0.9884033203125, -0.86566162109375, -0.742919921875, -0.62017822265625, -0.4974365234375, -0.37469482421875, -0.251953125, -0.12921142578125, -0.0064697265625, 0.11627197265625, 0.239013671875, 0.36175537109375, 0.4844970703125, 0.60723876953125, 0.72998046875, 0.85272216796875, 0.9754638671875, 1.09820556640625, 1.220947265625, 1.34368896484375, 1.4664306640625, 1.58917236328125, 1.7119140625, 1.83465576171875, 1.9573974609375, 2.08013916015625, 2.202880859375, 2.32562255859375, 2.4483642578125, 2.57110595703125, 2.69384765625, 2.81658935546875, 2.9393310546875, 3.06207275390625, 3.184814453125, 3.30755615234375, 3.4302978515625, 3.55303955078125, 3.67578125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 5.0, 5.0, 8.0, 15.0, 20.0, 17.0, 23.0, 44.0, 66.0, 82.0, 158.0, 208.0, 264.0, 489.0, 810.0, 1510.0, 3017.0, 6021.0, 12887.0, 27937.0, 61474.0, 136548.0, 293190.0, 586487.0, 950034.0, 956537.0, 596449.0, 300388.0, 140332.0, 63534.0, 29085.0, 13419.0, 6280.0, 3193.0, 1618.0, 852.0, 466.0, 295.0, 182.0, 108.0, 71.0, 51.0, 44.0, 20.0, 12.0, 7.0, 12.0, 5.0, 4.0, 5.0, 0.0, 0.0, 1.0], "bins": [-3.765625, -3.66107177734375, -3.5565185546875, -3.45196533203125, -3.347412109375, -3.24285888671875, -3.1383056640625, -3.03375244140625, -2.92919921875, -2.82464599609375, -2.7200927734375, -2.61553955078125, -2.510986328125, -2.40643310546875, -2.3018798828125, -2.19732666015625, -2.0927734375, -1.98822021484375, -1.8836669921875, -1.77911376953125, -1.674560546875, -1.57000732421875, -1.4654541015625, -1.36090087890625, -1.25634765625, -1.15179443359375, -1.0472412109375, -0.94268798828125, -0.838134765625, -0.73358154296875, -0.6290283203125, -0.52447509765625, -0.419921875, -0.31536865234375, -0.2108154296875, -0.10626220703125, -0.001708984375, 0.10284423828125, 0.2073974609375, 0.31195068359375, 0.41650390625, 0.52105712890625, 0.6256103515625, 0.73016357421875, 0.834716796875, 0.93927001953125, 1.0438232421875, 1.14837646484375, 1.2529296875, 1.35748291015625, 1.4620361328125, 1.56658935546875, 1.671142578125, 1.77569580078125, 1.8802490234375, 1.98480224609375, 2.08935546875, 2.19390869140625, 2.2984619140625, 2.40301513671875, 2.507568359375, 2.61212158203125, 2.7166748046875, 2.82122802734375, 2.92578125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 13.0, 21.0, 26.0, 51.0, 104.0, 178.0, 297.0, 521.0, 683.0, 738.0, 534.0, 366.0, 195.0, 120.0, 74.0, 60.0, 39.0, 18.0, 6.0, 7.0, 7.0, 8.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.4609375, -13.0880126953125, -12.715087890625, -12.3421630859375, -11.96923828125, -11.5963134765625, -11.223388671875, -10.8504638671875, -10.4775390625, -10.1046142578125, -9.731689453125, -9.3587646484375, -8.98583984375, -8.6129150390625, -8.239990234375, -7.8670654296875, -7.494140625, -7.1212158203125, -6.748291015625, -6.3753662109375, -6.00244140625, -5.6295166015625, -5.256591796875, -4.8836669921875, -4.5107421875, -4.1378173828125, -3.764892578125, -3.3919677734375, -3.01904296875, -2.6461181640625, -2.273193359375, -1.9002685546875, -1.52734375, -1.1544189453125, -0.781494140625, -0.4085693359375, -0.03564453125, 0.3372802734375, 0.710205078125, 1.0831298828125, 1.4560546875, 1.8289794921875, 2.201904296875, 2.5748291015625, 2.94775390625, 3.3206787109375, 3.693603515625, 4.0665283203125, 4.439453125, 4.8123779296875, 5.185302734375, 5.5582275390625, 5.93115234375, 6.3040771484375, 6.677001953125, 7.0499267578125, 7.4228515625, 7.7957763671875, 8.168701171875, 8.5416259765625, 8.91455078125, 9.2874755859375, 9.660400390625, 10.0333251953125, 10.40625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 10.0, 11.0, 21.0, 38.0, 65.0, 100.0, 194.0, 463.0, 1273.0, 16031.0, 4135249.0, 38370.0, 1477.0, 559.0, 208.0, 97.0, 47.0, 28.0, 18.0, 8.0, 3.0, 5.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.625, -43.115234375, -41.60546875, -40.095703125, -38.5859375, -37.076171875, -35.56640625, -34.056640625, -32.546875, -31.037109375, -29.52734375, -28.017578125, -26.5078125, -24.998046875, -23.48828125, -21.978515625, -20.46875, -18.958984375, -17.44921875, -15.939453125, -14.4296875, -12.919921875, -11.41015625, -9.900390625, -8.390625, -6.880859375, -5.37109375, -3.861328125, -2.3515625, -0.841796875, 0.66796875, 2.177734375, 3.6875, 5.197265625, 6.70703125, 8.216796875, 9.7265625, 11.236328125, 12.74609375, 14.255859375, 15.765625, 17.275390625, 18.78515625, 20.294921875, 21.8046875, 23.314453125, 24.82421875, 26.333984375, 27.84375, 29.353515625, 30.86328125, 32.373046875, 33.8828125, 35.392578125, 36.90234375, 38.412109375, 39.921875, 41.431640625, 42.94140625, 44.451171875, 45.9609375, 47.470703125, 48.98046875, 50.490234375, 52.0]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 99.0, 853.0, 61.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-474.0621032714844, -464.0599060058594, -454.0577087402344, -444.0555419921875, -434.0533447265625, -424.0511474609375, -414.0489501953125, -404.0467529296875, -394.0445861816406, -384.0423889160156, -374.0401916503906, -364.03802490234375, -354.03582763671875, -344.03363037109375, -334.03143310546875, -324.02923583984375, -314.02703857421875, -304.02484130859375, -294.02264404296875, -284.0204772949219, -274.0182800292969, -264.0160827636719, -254.01388549804688, -244.01170349121094, -234.009521484375, -224.00732421875, -214.00514221191406, -204.00294494628906, -194.00076293945312, -183.99856567382812, -173.99636840820312, -163.9941864013672, -153.99200439453125, -143.98980712890625, -133.9876251220703, -123.98542785644531, -113.98324584960938, -103.98104858398438, -93.9788589477539, -83.97666931152344, -73.97447967529297, -63.9722900390625, -53.97010040283203, -43.9679069519043, -33.96571731567383, -23.96352767944336, -13.961334228515625, -3.9591445922851562, 6.0430450439453125, 16.04523468017578, 26.047426223754883, 36.049617767333984, 46.05180740356445, 56.05399703979492, 66.05619049072266, 76.05838012695312, 86.0605697631836, 96.06275939941406, 106.06494903564453, 116.067138671875, 126.0693359375, 136.07151794433594, 146.07371520996094, 156.07589721679688, 166.07809448242188]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 7.0, 8.0, 8.0, 11.0, 6.0, 13.0, 24.0, 24.0, 24.0, 35.0, 48.0, 47.0, 40.0, 42.0, 55.0, 56.0, 38.0, 60.0, 63.0, 45.0, 58.0, 48.0, 44.0, 34.0, 29.0, 28.0, 25.0, 23.0, 18.0, 6.0, 15.0, 11.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.591800689697266, -27.50762176513672, -26.42344093322754, -25.339262008666992, -24.255081176757812, -23.170902252197266, -22.08672332763672, -21.002544403076172, -19.918363571166992, -18.834184646606445, -17.750003814697266, -16.66582489013672, -15.581645011901855, -14.497465133666992, -13.413286209106445, -12.329106330871582, -11.244926452636719, -10.160746574401855, -9.076566696166992, -7.992387771606445, -6.908207893371582, -5.824028015136719, -4.739848613739014, -3.6556692123413086, -2.5714893341064453, -1.4873096942901611, -0.40313005447387695, 0.6810495853424072, 1.7652292251586914, 2.8494091033935547, 3.9335885047912598, 5.017767906188965, 6.1019439697265625, 7.186123847961426, 8.270303726196289, 9.354482650756836, 10.4386625289917, 11.522842407226562, 12.60702133178711, 13.691201210021973, 14.775381088256836, 15.8595609664917, 16.943740844726562, 18.02791976928711, 19.112098693847656, 20.196279525756836, 21.280458450317383, 22.364639282226562, 23.44881820678711, 24.532997131347656, 25.617177963256836, 26.701356887817383, 27.785537719726562, 28.86971664428711, 29.953895568847656, 31.038074493408203, 32.12225341796875, 33.2064323425293, 34.290611267089844, 35.374794006347656, 36.4589729309082, 37.54315185546875, 38.6273307800293, 39.711509704589844, 40.795692443847656]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 7.0, 4.0, 1.0, 7.0, 4.0, 8.0, 14.0, 10.0, 11.0, 14.0, 20.0, 23.0, 21.0, 20.0, 24.0, 28.0, 36.0, 34.0, 51.0, 35.0, 51.0, 43.0, 50.0, 44.0, 46.0, 35.0, 41.0, 30.0, 46.0, 37.0, 22.0, 30.0, 30.0, 30.0, 12.0, 19.0, 12.0, 11.0, 14.0, 8.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.79296875, -3.676605224609375, -3.56024169921875, -3.443878173828125, -3.3275146484375, -3.211151123046875, -3.09478759765625, -2.978424072265625, -2.862060546875, -2.745697021484375, -2.62933349609375, -2.512969970703125, -2.3966064453125, -2.280242919921875, -2.16387939453125, -2.047515869140625, -1.93115234375, -1.814788818359375, -1.69842529296875, -1.582061767578125, -1.4656982421875, -1.349334716796875, -1.23297119140625, -1.116607666015625, -1.000244140625, -0.883880615234375, -0.76751708984375, -0.651153564453125, -0.5347900390625, -0.418426513671875, -0.30206298828125, -0.185699462890625, -0.0693359375, 0.047027587890625, 0.16339111328125, 0.279754638671875, 0.3961181640625, 0.512481689453125, 0.62884521484375, 0.745208740234375, 0.861572265625, 0.977935791015625, 1.09429931640625, 1.210662841796875, 1.3270263671875, 1.443389892578125, 1.55975341796875, 1.676116943359375, 1.79248046875, 1.908843994140625, 2.02520751953125, 2.141571044921875, 2.2579345703125, 2.374298095703125, 2.49066162109375, 2.607025146484375, 2.723388671875, 2.839752197265625, 2.95611572265625, 3.072479248046875, 3.1888427734375, 3.305206298828125, 3.42156982421875, 3.537933349609375, 3.654296875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 8.0, 10.0, 16.0, 22.0, 45.0, 71.0, 121.0, 200.0, 368.0, 648.0, 1048.0, 2131.0, 3657.0, 6440.0, 11445.0, 20081.0, 33871.0, 55012.0, 83164.0, 116579.0, 143853.0, 152686.0, 134245.0, 102861.0, 70674.0, 45545.0, 27094.0, 16085.0, 9023.0, 5093.0, 2774.0, 1560.0, 929.0, 506.0, 285.0, 170.0, 104.0, 47.0, 34.0, 27.0, 17.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7578125, -0.7319412231445312, -0.7060699462890625, -0.6801986694335938, -0.654327392578125, -0.6284561157226562, -0.6025848388671875, -0.5767135620117188, -0.55084228515625, -0.5249710083007812, -0.4990997314453125, -0.47322845458984375, -0.447357177734375, -0.42148590087890625, -0.3956146240234375, -0.36974334716796875, -0.3438720703125, -0.31800079345703125, -0.2921295166015625, -0.26625823974609375, -0.240386962890625, -0.21451568603515625, -0.1886444091796875, -0.16277313232421875, -0.13690185546875, -0.11103057861328125, -0.0851593017578125, -0.05928802490234375, -0.033416748046875, -0.00754547119140625, 0.0183258056640625, 0.04419708251953125, 0.070068359375, 0.09593963623046875, 0.1218109130859375, 0.14768218994140625, 0.173553466796875, 0.19942474365234375, 0.2252960205078125, 0.25116729736328125, 0.27703857421875, 0.30290985107421875, 0.3287811279296875, 0.35465240478515625, 0.380523681640625, 0.40639495849609375, 0.4322662353515625, 0.45813751220703125, 0.4840087890625, 0.5098800659179688, 0.5357513427734375, 0.5616226196289062, 0.587493896484375, 0.6133651733398438, 0.6392364501953125, 0.6651077270507812, 0.69097900390625, 0.7168502807617188, 0.7427215576171875, 0.7685928344726562, 0.794464111328125, 0.8203353881835938, 0.8462066650390625, 0.8720779418945312, 0.89794921875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 8.0, 10.0, 13.0, 7.0, 13.0, 17.0, 13.0, 23.0, 27.0, 21.0, 32.0, 29.0, 33.0, 23.0, 28.0, 43.0, 28.0, 29.0, 41.0, 43.0, 1059.0, 35.0, 48.0, 33.0, 40.0, 32.0, 40.0, 27.0, 23.0, 25.0, 28.0, 16.0, 24.0, 20.0, 16.0, 13.0, 9.0, 13.0, 4.0, 6.0, 6.0, 9.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.8046875, -2.7225341796875, -2.640380859375, -2.5582275390625, -2.47607421875, -2.3939208984375, -2.311767578125, -2.2296142578125, -2.1474609375, -2.0653076171875, -1.983154296875, -1.9010009765625, -1.81884765625, -1.7366943359375, -1.654541015625, -1.5723876953125, -1.490234375, -1.4080810546875, -1.325927734375, -1.2437744140625, -1.16162109375, -1.0794677734375, -0.997314453125, -0.9151611328125, -0.8330078125, -0.7508544921875, -0.668701171875, -0.5865478515625, -0.50439453125, -0.4222412109375, -0.340087890625, -0.2579345703125, -0.17578125, -0.0936279296875, -0.011474609375, 0.0706787109375, 0.15283203125, 0.2349853515625, 0.317138671875, 0.3992919921875, 0.4814453125, 0.5635986328125, 0.645751953125, 0.7279052734375, 0.81005859375, 0.8922119140625, 0.974365234375, 1.0565185546875, 1.138671875, 1.2208251953125, 1.302978515625, 1.3851318359375, 1.46728515625, 1.5494384765625, 1.631591796875, 1.7137451171875, 1.7958984375, 1.8780517578125, 1.960205078125, 2.0423583984375, 2.12451171875, 2.2066650390625, 2.288818359375, 2.3709716796875, 2.453125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 9.0, 11.0, 22.0, 18.0, 22.0, 37.0, 58.0, 62.0, 121.0, 183.0, 230.0, 371.0, 571.0, 762.0, 1219.0, 1846.0, 2820.0, 4295.0, 6613.0, 10141.0, 15890.0, 26613.0, 76249.0, 1801386.0, 76020.0, 26240.0, 15947.0, 10153.0, 6616.0, 4296.0, 2733.0, 1875.0, 1211.0, 754.0, 541.0, 355.0, 273.0, 160.0, 122.0, 88.0, 58.0, 35.0, 26.0, 19.0, 13.0, 9.0, 12.0, 9.0, 3.0, 5.0, 3.0], "bins": [-1.6875, -1.641265869140625, -1.59503173828125, -1.548797607421875, -1.5025634765625, -1.456329345703125, -1.41009521484375, -1.363861083984375, -1.317626953125, -1.271392822265625, -1.22515869140625, -1.178924560546875, -1.1326904296875, -1.086456298828125, -1.04022216796875, -0.993988037109375, -0.94775390625, -0.901519775390625, -0.85528564453125, -0.809051513671875, -0.7628173828125, -0.716583251953125, -0.67034912109375, -0.624114990234375, -0.577880859375, -0.531646728515625, -0.48541259765625, -0.439178466796875, -0.3929443359375, -0.346710205078125, -0.30047607421875, -0.254241943359375, -0.2080078125, -0.161773681640625, -0.11553955078125, -0.069305419921875, -0.0230712890625, 0.023162841796875, 0.06939697265625, 0.115631103515625, 0.161865234375, 0.208099365234375, 0.25433349609375, 0.300567626953125, 0.3468017578125, 0.393035888671875, 0.43927001953125, 0.485504150390625, 0.53173828125, 0.577972412109375, 0.62420654296875, 0.670440673828125, 0.7166748046875, 0.762908935546875, 0.80914306640625, 0.855377197265625, 0.901611328125, 0.947845458984375, 0.99407958984375, 1.040313720703125, 1.0865478515625, 1.132781982421875, 1.17901611328125, 1.225250244140625, 1.271484375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 1.0, 6.0, 7.0, 9.0, 20.0, 13.0, 18.0, 25.0, 30.0, 43.0, 72.0, 61.0, 72.0, 75.0, 93.0, 77.0, 77.0, 61.0, 58.0, 46.0, 38.0, 22.0, 22.0, 14.0, 8.0, 7.0, 6.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1016845703125, -0.09835433959960938, -0.09502410888671875, -0.09169387817382812, -0.0883636474609375, -0.08503341674804688, -0.08170318603515625, -0.07837295532226562, -0.075042724609375, -0.07171249389648438, -0.06838226318359375, -0.06505203247070312, -0.0617218017578125, -0.058391571044921875, -0.05506134033203125, -0.051731109619140625, -0.04840087890625, -0.045070648193359375, -0.04174041748046875, -0.038410186767578125, -0.0350799560546875, -0.031749725341796875, -0.02841949462890625, -0.025089263916015625, -0.021759033203125, -0.018428802490234375, -0.01509857177734375, -0.011768341064453125, -0.0084381103515625, -0.005107879638671875, -0.00177764892578125, 0.001552581787109375, 0.0048828125, 0.008213043212890625, 0.01154327392578125, 0.014873504638671875, 0.0182037353515625, 0.021533966064453125, 0.02486419677734375, 0.028194427490234375, 0.031524658203125, 0.034854888916015625, 0.03818511962890625, 0.041515350341796875, 0.0448455810546875, 0.048175811767578125, 0.05150604248046875, 0.054836273193359375, 0.05816650390625, 0.061496734619140625, 0.06482696533203125, 0.06815719604492188, 0.0714874267578125, 0.07481765747070312, 0.07814788818359375, 0.08147811889648438, 0.084808349609375, 0.08813858032226562, 0.09146881103515625, 0.09479904174804688, 0.0981292724609375, 0.10145950317382812, 0.10478973388671875, 0.10811996459960938, 0.1114501953125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 8.0, 8.0, 10.0, 9.0, 20.0, 23.0, 29.0, 52.0, 75.0, 126.0, 209.0, 434.0, 3527.0, 1038237.0, 4688.0, 482.0, 201.0, 136.0, 83.0, 48.0, 42.0, 19.0, 19.0, 14.0, 16.0, 10.0, 9.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.3828125, -2.311737060546875, -2.24066162109375, -2.169586181640625, -2.0985107421875, -2.027435302734375, -1.95635986328125, -1.885284423828125, -1.814208984375, -1.743133544921875, -1.67205810546875, -1.600982666015625, -1.5299072265625, -1.458831787109375, -1.38775634765625, -1.316680908203125, -1.24560546875, -1.174530029296875, -1.10345458984375, -1.032379150390625, -0.9613037109375, -0.890228271484375, -0.81915283203125, -0.748077392578125, -0.677001953125, -0.605926513671875, -0.53485107421875, -0.463775634765625, -0.3927001953125, -0.321624755859375, -0.25054931640625, -0.179473876953125, -0.1083984375, -0.037322998046875, 0.03375244140625, 0.104827880859375, 0.1759033203125, 0.246978759765625, 0.31805419921875, 0.389129638671875, 0.460205078125, 0.531280517578125, 0.60235595703125, 0.673431396484375, 0.7445068359375, 0.815582275390625, 0.88665771484375, 0.957733154296875, 1.02880859375, 1.099884033203125, 1.17095947265625, 1.242034912109375, 1.3131103515625, 1.384185791015625, 1.45526123046875, 1.526336669921875, 1.597412109375, 1.668487548828125, 1.73956298828125, 1.810638427734375, 1.8817138671875, 1.952789306640625, 2.02386474609375, 2.094940185546875, 2.166015625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 21.0, 78.0, 292.0, 381.0, 173.0, 55.0, 7.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3907513916492462, -0.3739166259765625, -0.3570818305015564, -0.3402470350265503, -0.3234122693538666, -0.30657750368118286, -0.28974270820617676, -0.27290791273117065, -0.25607314705848694, -0.23923836648464203, -0.22240358591079712, -0.2055688053369522, -0.1887340247631073, -0.1718992441892624, -0.15506446361541748, -0.13822968304157257, -0.12139490246772766, -0.10456012189388275, -0.08772534132003784, -0.07089056074619293, -0.05405578017234802, -0.03722099959850311, -0.020386219024658203, -0.0035514384508132935, 0.013283342123031616, 0.030118122696876526, 0.046952903270721436, 0.06378768384456635, 0.08062246441841125, 0.09745724499225616, 0.11429202556610107, 0.13112680613994598, 0.14796161651611328, 0.1647963970899582, 0.1816311776638031, 0.198465958237648, 0.21530073881149292, 0.23213551938533783, 0.24897029995918274, 0.26580506563186646, 0.28263986110687256, 0.29947465658187866, 0.3163094222545624, 0.3331441879272461, 0.3499789834022522, 0.3668137788772583, 0.383648544549942, 0.40048331022262573, 0.41731810569763184, 0.43415290117263794, 0.45098766684532166, 0.46782243251800537, 0.4846572279930115, 0.5014920234680176, 0.5183267593383789, 0.535161554813385, 0.5519963502883911, 0.5688311457633972, 0.5856659412384033, 0.6025006771087646, 0.6193354725837708, 0.6361702680587769, 0.6530050039291382, 0.6698397994041443, 0.6866745948791504]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 9.0, 18.0, 17.0, 26.0, 25.0, 43.0, 40.0, 46.0, 40.0, 49.0, 56.0, 60.0, 65.0, 62.0, 53.0, 53.0, 53.0, 54.0, 51.0, 33.0, 31.0, 34.0, 23.0, 15.0, 15.0, 8.0, 9.0, 3.0, 8.0, 5.0, 2.0, 1.0], "bins": [-0.24803680181503296, -0.2424740493297577, -0.23691128194332123, -0.23134852945804596, -0.2257857620716095, -0.22022300958633423, -0.21466025710105896, -0.2090974897146225, -0.20353472232818604, -0.19797196984291077, -0.1924092024564743, -0.18684644997119904, -0.18128368258476257, -0.1757209300994873, -0.17015817761421204, -0.16459541022777557, -0.1590326577425003, -0.15346990525722504, -0.14790713787078857, -0.1423443853855133, -0.13678161799907684, -0.13121886551380157, -0.1256560981273651, -0.12009334564208984, -0.11453058570623398, -0.10896782577037811, -0.10340506583452225, -0.09784230589866638, -0.09227955341339111, -0.08671678602695465, -0.08115403354167938, -0.07559127360582352, -0.07002851366996765, -0.06446575373411179, -0.05890299379825592, -0.05334023758769035, -0.04777747765183449, -0.04221471771597862, -0.036651961505413055, -0.03108920156955719, -0.025526441633701324, -0.01996368169784546, -0.014400923624634743, -0.008838165551424026, -0.003275405615568161, 0.0022873543202877045, 0.007850110530853271, 0.013412870466709137, 0.018975630402565002, 0.024538390338420868, 0.030101148411631584, 0.0356639064848423, 0.041226666420698166, 0.04678942635655403, 0.0523521825671196, 0.057914942502975464, 0.06347770243883133, 0.0690404623746872, 0.07460322231054306, 0.08016598224639893, 0.0857287347316742, 0.09129150211811066, 0.09685425460338593, 0.10241701453924179, 0.10797977447509766]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 12.0, 4.0, 9.0, 9.0, 10.0, 9.0, 10.0, 12.0, 20.0, 25.0, 18.0, 21.0, 22.0, 25.0, 35.0, 37.0, 37.0, 44.0, 53.0, 46.0, 52.0, 43.0, 46.0, 50.0, 45.0, 50.0, 35.0, 30.0, 30.0, 27.0, 30.0, 15.0, 13.0, 16.0, 14.0, 11.0, 9.0, 5.0, 7.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-4.05859375, -3.93817138671875, -3.8177490234375, -3.69732666015625, -3.576904296875, -3.45648193359375, -3.3360595703125, -3.21563720703125, -3.09521484375, -2.97479248046875, -2.8543701171875, -2.73394775390625, -2.613525390625, -2.49310302734375, -2.3726806640625, -2.25225830078125, -2.1318359375, -2.01141357421875, -1.8909912109375, -1.77056884765625, -1.650146484375, -1.52972412109375, -1.4093017578125, -1.28887939453125, -1.16845703125, -1.04803466796875, -0.9276123046875, -0.80718994140625, -0.686767578125, -0.56634521484375, -0.4459228515625, -0.32550048828125, -0.205078125, -0.08465576171875, 0.0357666015625, 0.15618896484375, 0.276611328125, 0.39703369140625, 0.5174560546875, 0.63787841796875, 0.75830078125, 0.87872314453125, 0.9991455078125, 1.11956787109375, 1.239990234375, 1.36041259765625, 1.4808349609375, 1.60125732421875, 1.7216796875, 1.84210205078125, 1.9625244140625, 2.08294677734375, 2.203369140625, 2.32379150390625, 2.4442138671875, 2.56463623046875, 2.68505859375, 2.80548095703125, 2.9259033203125, 3.04632568359375, 3.166748046875, 3.28717041015625, 3.4075927734375, 3.52801513671875, 3.6484375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 13.0, 27.0, 39.0, 85.0, 130.0, 240.0, 393.0, 786.0, 1516.0, 2985.0, 5654.0, 10775.0, 21254.0, 42648.0, 89126.0, 185290.0, 277942.0, 208536.0, 102529.0, 48575.0, 24329.0, 12308.0, 6321.0, 3304.0, 1755.0, 905.0, 514.0, 245.0, 126.0, 87.0, 43.0, 26.0, 18.0, 12.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.91015625, -4.782928466796875, -4.65570068359375, -4.528472900390625, -4.4012451171875, -4.274017333984375, -4.14678955078125, -4.019561767578125, -3.892333984375, -3.765106201171875, -3.63787841796875, -3.510650634765625, -3.3834228515625, -3.256195068359375, -3.12896728515625, -3.001739501953125, -2.87451171875, -2.747283935546875, -2.62005615234375, -2.492828369140625, -2.3656005859375, -2.238372802734375, -2.11114501953125, -1.983917236328125, -1.856689453125, -1.729461669921875, -1.60223388671875, -1.475006103515625, -1.3477783203125, -1.220550537109375, -1.09332275390625, -0.966094970703125, -0.8388671875, -0.711639404296875, -0.58441162109375, -0.457183837890625, -0.3299560546875, -0.202728271484375, -0.07550048828125, 0.051727294921875, 0.178955078125, 0.306182861328125, 0.43341064453125, 0.560638427734375, 0.6878662109375, 0.815093994140625, 0.94232177734375, 1.069549560546875, 1.19677734375, 1.324005126953125, 1.45123291015625, 1.578460693359375, 1.7056884765625, 1.832916259765625, 1.96014404296875, 2.087371826171875, 2.214599609375, 2.341827392578125, 2.46905517578125, 2.596282958984375, 2.7235107421875, 2.850738525390625, 2.97796630859375, 3.105194091796875, 3.232421875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 7.0, 5.0, 3.0, 10.0, 13.0, 19.0, 23.0, 24.0, 27.0, 34.0, 46.0, 54.0, 51.0, 106.0, 172.0, 350.0, 1457.0, 205.0, 85.0, 66.0, 47.0, 47.0, 46.0, 29.0, 29.0, 24.0, 21.0, 12.0, 15.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4296875, -12.9151611328125, -12.400634765625, -11.8861083984375, -11.37158203125, -10.8570556640625, -10.342529296875, -9.8280029296875, -9.3134765625, -8.7989501953125, -8.284423828125, -7.7698974609375, -7.25537109375, -6.7408447265625, -6.226318359375, -5.7117919921875, -5.197265625, -4.6827392578125, -4.168212890625, -3.6536865234375, -3.13916015625, -2.6246337890625, -2.110107421875, -1.5955810546875, -1.0810546875, -0.5665283203125, -0.052001953125, 0.4625244140625, 0.97705078125, 1.4915771484375, 2.006103515625, 2.5206298828125, 3.03515625, 3.5496826171875, 4.064208984375, 4.5787353515625, 5.09326171875, 5.6077880859375, 6.122314453125, 6.6368408203125, 7.1513671875, 7.6658935546875, 8.180419921875, 8.6949462890625, 9.20947265625, 9.7239990234375, 10.238525390625, 10.7530517578125, 11.267578125, 11.7821044921875, 12.296630859375, 12.8111572265625, 13.32568359375, 13.8402099609375, 14.354736328125, 14.8692626953125, 15.3837890625, 15.8983154296875, 16.412841796875, 16.9273681640625, 17.44189453125, 17.9564208984375, 18.470947265625, 18.9854736328125, 19.5]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 2.0, 8.0, 12.0, 29.0, 27.0, 41.0, 65.0, 70.0, 141.0, 196.0, 343.0, 809.0, 4379.0, 234231.0, 2865828.0, 36435.0, 1805.0, 541.0, 265.0, 144.0, 95.0, 74.0, 55.0, 25.0, 19.0, 14.0, 12.0, 7.0, 6.0, 8.0, 5.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.34375, -24.55908203125, -23.7744140625, -22.98974609375, -22.205078125, -21.42041015625, -20.6357421875, -19.85107421875, -19.06640625, -18.28173828125, -17.4970703125, -16.71240234375, -15.927734375, -15.14306640625, -14.3583984375, -13.57373046875, -12.7890625, -12.00439453125, -11.2197265625, -10.43505859375, -9.650390625, -8.86572265625, -8.0810546875, -7.29638671875, -6.51171875, -5.72705078125, -4.9423828125, -4.15771484375, -3.373046875, -2.58837890625, -1.8037109375, -1.01904296875, -0.234375, 0.55029296875, 1.3349609375, 2.11962890625, 2.904296875, 3.68896484375, 4.4736328125, 5.25830078125, 6.04296875, 6.82763671875, 7.6123046875, 8.39697265625, 9.181640625, 9.96630859375, 10.7509765625, 11.53564453125, 12.3203125, 13.10498046875, 13.8896484375, 14.67431640625, 15.458984375, 16.24365234375, 17.0283203125, 17.81298828125, 18.59765625, 19.38232421875, 20.1669921875, 20.95166015625, 21.736328125, 22.52099609375, 23.3056640625, 24.09033203125, 24.875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 22.0, 603.0, 382.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.80795669555664, -18.895423889160156, -13.982892036437988, -9.07036018371582, -4.157827377319336, 0.7547054290771484, 5.667236328125, 10.579769134521484, 15.492301940917969, 20.404834747314453, 25.317367553710938, 30.22989845275879, 35.142433166503906, 40.054962158203125, 44.96749496459961, 49.880027770996094, 54.79256057739258, 59.70509338378906, 64.61762237548828, 69.53015899658203, 74.44268798828125, 79.355224609375, 84.26775360107422, 89.18028259277344, 94.09281921386719, 99.0053482055664, 103.91788482666016, 108.83041381835938, 113.74295043945312, 118.65547943115234, 123.56800842285156, 128.4805450439453, 133.39308166503906, 138.3056182861328, 143.2181396484375, 148.13067626953125, 153.043212890625, 157.95574951171875, 162.86827087402344, 167.7808074951172, 172.69334411621094, 177.6058807373047, 182.51840209960938, 187.43093872070312, 192.34347534179688, 197.25601196289062, 202.1685333251953, 207.08106994628906, 211.99359130859375, 216.9061279296875, 221.8186492919922, 226.73118591308594, 231.6437225341797, 236.55625915527344, 241.46878051757812, 246.38131713867188, 251.29385375976562, 256.2063903808594, 261.1189270019531, 266.0314636230469, 270.9439697265625, 275.85650634765625, 280.76904296875, 285.68157958984375, 290.5941162109375]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 4.0, 10.0, 4.0, 7.0, 11.0, 15.0, 13.0, 29.0, 24.0, 25.0, 18.0, 28.0, 24.0, 38.0, 33.0, 51.0, 53.0, 30.0, 34.0, 43.0, 57.0, 48.0, 57.0, 41.0, 29.0, 35.0, 29.0, 25.0, 29.0, 26.0, 25.0, 19.0, 25.0, 12.0, 11.0, 13.0, 6.0, 2.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.06659698486328, -32.05134201049805, -31.036088943481445, -30.02083396911621, -29.00558090209961, -27.990325927734375, -26.97507095336914, -25.959815979003906, -24.944562911987305, -23.92930793762207, -22.91405487060547, -21.898799896240234, -20.883544921875, -19.8682918548584, -18.853036880493164, -17.837783813476562, -16.822528839111328, -15.80727481842041, -14.792020797729492, -13.776765823364258, -12.76151180267334, -11.746257781982422, -10.731002807617188, -9.71574878692627, -8.700494766235352, -7.685240745544434, -6.669986248016357, -5.654731750488281, -4.639477729797363, -3.6242237091064453, -2.608969211578369, -1.593714714050293, -0.5784568786621094, 0.4367973804473877, 1.4520516395568848, 2.467305898666382, 3.482560157775879, 4.497814178466797, 5.513068675994873, 6.528323173522949, 7.543577194213867, 8.558831214904785, 9.574085235595703, 10.589340209960938, 11.604594230651855, 12.619848251342773, 13.635103225708008, 14.650357246398926, 15.665611267089844, 16.680866241455078, 17.69611930847168, 18.711374282836914, 19.726627349853516, 20.74188232421875, 21.757137298583984, 22.77239227294922, 23.78764533996582, 24.802900314331055, 25.818153381347656, 26.83340835571289, 27.848663330078125, 28.863916397094727, 29.87917137145996, 30.894424438476562, 31.909679412841797]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 5.0, 14.0, 9.0, 16.0, 20.0, 13.0, 14.0, 22.0, 24.0, 22.0, 36.0, 25.0, 47.0, 48.0, 43.0, 51.0, 52.0, 67.0, 55.0, 46.0, 49.0, 46.0, 45.0, 30.0, 30.0, 32.0, 23.0, 24.0, 17.0, 10.0, 14.0, 17.0, 8.0, 5.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52734375, -4.38616943359375, -4.2449951171875, -4.10382080078125, -3.962646484375, -3.82147216796875, -3.6802978515625, -3.53912353515625, -3.39794921875, -3.25677490234375, -3.1156005859375, -2.97442626953125, -2.833251953125, -2.69207763671875, -2.5509033203125, -2.40972900390625, -2.2685546875, -2.12738037109375, -1.9862060546875, -1.84503173828125, -1.703857421875, -1.56268310546875, -1.4215087890625, -1.28033447265625, -1.13916015625, -0.99798583984375, -0.8568115234375, -0.71563720703125, -0.574462890625, -0.43328857421875, -0.2921142578125, -0.15093994140625, -0.009765625, 0.13140869140625, 0.2725830078125, 0.41375732421875, 0.554931640625, 0.69610595703125, 0.8372802734375, 0.97845458984375, 1.11962890625, 1.26080322265625, 1.4019775390625, 1.54315185546875, 1.684326171875, 1.82550048828125, 1.9666748046875, 2.10784912109375, 2.2490234375, 2.39019775390625, 2.5313720703125, 2.67254638671875, 2.813720703125, 2.95489501953125, 3.0960693359375, 3.23724365234375, 3.37841796875, 3.51959228515625, 3.6607666015625, 3.80194091796875, 3.943115234375, 4.08428955078125, 4.2254638671875, 4.36663818359375, 4.5078125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 9.0, 7.0, 5.0, 7.0, 20.0, 6.0, 18.0, 18.0, 23.0, 25.0, 40.0, 59.0, 116.0, 222.0, 685.0, 2209.0, 10275.0, 59793.0, 376484.0, 1931892.0, 1499151.0, 261292.0, 41926.0, 7402.0, 1659.0, 477.0, 165.0, 84.0, 39.0, 35.0, 24.0, 11.0, 19.0, 29.0, 14.0, 6.0, 10.0, 4.0, 7.0, 4.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.203125, -7.96807861328125, -7.7330322265625, -7.49798583984375, -7.262939453125, -7.02789306640625, -6.7928466796875, -6.55780029296875, -6.32275390625, -6.08770751953125, -5.8526611328125, -5.61761474609375, -5.382568359375, -5.14752197265625, -4.9124755859375, -4.67742919921875, -4.4423828125, -4.20733642578125, -3.9722900390625, -3.73724365234375, -3.502197265625, -3.26715087890625, -3.0321044921875, -2.79705810546875, -2.56201171875, -2.32696533203125, -2.0919189453125, -1.85687255859375, -1.621826171875, -1.38677978515625, -1.1517333984375, -0.91668701171875, -0.681640625, -0.44659423828125, -0.2115478515625, 0.02349853515625, 0.258544921875, 0.49359130859375, 0.7286376953125, 0.96368408203125, 1.19873046875, 1.43377685546875, 1.6688232421875, 1.90386962890625, 2.138916015625, 2.37396240234375, 2.6090087890625, 2.84405517578125, 3.0791015625, 3.31414794921875, 3.5491943359375, 3.78424072265625, 4.019287109375, 4.25433349609375, 4.4893798828125, 4.72442626953125, 4.95947265625, 5.19451904296875, 5.4295654296875, 5.66461181640625, 5.899658203125, 6.13470458984375, 6.3697509765625, 6.60479736328125, 6.83984375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 4.0, 9.0, 8.0, 11.0, 17.0, 30.0, 36.0, 39.0, 58.0, 62.0, 129.0, 171.0, 202.0, 303.0, 402.0, 492.0, 504.0, 401.0, 341.0, 269.0, 174.0, 118.0, 82.0, 51.0, 45.0, 30.0, 23.0, 18.0, 13.0, 9.0, 7.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.96484375, -6.76104736328125, -6.5572509765625, -6.35345458984375, -6.149658203125, -5.94586181640625, -5.7420654296875, -5.53826904296875, -5.33447265625, -5.13067626953125, -4.9268798828125, -4.72308349609375, -4.519287109375, -4.31549072265625, -4.1116943359375, -3.90789794921875, -3.7041015625, -3.50030517578125, -3.2965087890625, -3.09271240234375, -2.888916015625, -2.68511962890625, -2.4813232421875, -2.27752685546875, -2.07373046875, -1.86993408203125, -1.6661376953125, -1.46234130859375, -1.258544921875, -1.05474853515625, -0.8509521484375, -0.64715576171875, -0.443359375, -0.23956298828125, -0.0357666015625, 0.16802978515625, 0.371826171875, 0.57562255859375, 0.7794189453125, 0.98321533203125, 1.18701171875, 1.39080810546875, 1.5946044921875, 1.79840087890625, 2.002197265625, 2.20599365234375, 2.4097900390625, 2.61358642578125, 2.8173828125, 3.02117919921875, 3.2249755859375, 3.42877197265625, 3.632568359375, 3.83636474609375, 4.0401611328125, 4.24395751953125, 4.44775390625, 4.65155029296875, 4.8553466796875, 5.05914306640625, 5.262939453125, 5.46673583984375, 5.6705322265625, 5.87432861328125, 6.078125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 7.0, 7.0, 15.0, 21.0, 18.0, 26.0, 43.0, 54.0, 87.0, 125.0, 219.0, 365.0, 722.0, 2533.0, 72164.0, 3429771.0, 674905.0, 10682.0, 1137.0, 483.0, 289.0, 201.0, 114.0, 90.0, 53.0, 41.0, 43.0, 22.0, 14.0, 8.0, 8.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.953125, -20.224365234375, -19.49560546875, -18.766845703125, -18.0380859375, -17.309326171875, -16.58056640625, -15.851806640625, -15.123046875, -14.394287109375, -13.66552734375, -12.936767578125, -12.2080078125, -11.479248046875, -10.75048828125, -10.021728515625, -9.29296875, -8.564208984375, -7.83544921875, -7.106689453125, -6.3779296875, -5.649169921875, -4.92041015625, -4.191650390625, -3.462890625, -2.734130859375, -2.00537109375, -1.276611328125, -0.5478515625, 0.180908203125, 0.90966796875, 1.638427734375, 2.3671875, 3.095947265625, 3.82470703125, 4.553466796875, 5.2822265625, 6.010986328125, 6.73974609375, 7.468505859375, 8.197265625, 8.926025390625, 9.65478515625, 10.383544921875, 11.1123046875, 11.841064453125, 12.56982421875, 13.298583984375, 14.02734375, 14.756103515625, 15.48486328125, 16.213623046875, 16.9423828125, 17.671142578125, 18.39990234375, 19.128662109375, 19.857421875, 20.586181640625, 21.31494140625, 22.043701171875, 22.7724609375, 23.501220703125, 24.22998046875, 24.958740234375, 25.6875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 16.0, 109.0, 409.0, 390.0, 83.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.02190399169922, -34.20477294921875, -30.38764190673828, -26.570512771606445, -22.753381729125977, -18.936250686645508, -15.119121551513672, -11.301990509033203, -7.484859466552734, -3.667728900909424, 0.14940166473388672, 3.966531753540039, 7.783662796020508, 11.600793838500977, 15.417922973632812, 19.23505401611328, 23.05218505859375, 26.86931610107422, 30.686447143554688, 34.503578186035156, 38.320709228515625, 42.137840270996094, 45.9549674987793, 49.772098541259766, 53.589229583740234, 57.4063606262207, 61.22349166870117, 65.04061889648438, 68.85774993896484, 72.67488098144531, 76.49201202392578, 80.30914306640625, 84.12628173828125, 87.94341278076172, 91.76054382324219, 95.57767486572266, 99.39480590820312, 103.2119369506836, 107.02906799316406, 110.84619140625, 114.663330078125, 118.48046112060547, 122.29759216308594, 126.1147232055664, 129.93185424804688, 133.7489776611328, 137.5661163330078, 141.38323974609375, 145.20037841796875, 149.0175018310547, 152.8346405029297, 156.65176391601562, 160.46890258789062, 164.28602600097656, 168.10316467285156, 171.9202880859375, 175.73741149902344, 179.55453491210938, 183.37167358398438, 187.1887969970703, 191.0059356689453, 194.82305908203125, 198.64019775390625, 202.4573211669922, 206.2744598388672]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 4.0, 9.0, 8.0, 8.0, 16.0, 7.0, 13.0, 23.0, 20.0, 22.0, 30.0, 40.0, 29.0, 33.0, 38.0, 51.0, 54.0, 47.0, 48.0, 44.0, 54.0, 41.0, 43.0, 43.0, 39.0, 36.0, 30.0, 30.0, 23.0, 21.0, 22.0, 19.0, 11.0, 13.0, 10.0, 5.0, 6.0, 3.0, 6.0, 1.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.15087890625, -23.43014144897461, -22.709402084350586, -21.988664627075195, -21.267925262451172, -20.54718780517578, -19.82645034790039, -19.105710983276367, -18.384971618652344, -17.664234161376953, -16.94349479675293, -16.22275733947754, -15.502017974853516, -14.781280517578125, -14.060542106628418, -13.339803695678711, -12.61906623840332, -11.898327827453613, -11.177589416503906, -10.456851959228516, -9.736112594604492, -9.015375137329102, -8.294636726379395, -7.5738983154296875, -6.8531599044799805, -6.132421493530273, -5.411683082580566, -4.690945148468018, -3.9702067375183105, -3.2494683265686035, -2.5287303924560547, -1.8079919815063477, -1.0872554779052734, -0.36651718616485596, 0.3542211055755615, 1.0749592781066895, 1.7956976890563965, 2.5164361000061035, 3.2371740341186523, 3.9579124450683594, 4.678650856018066, 5.399389266967773, 6.1201276779174805, 6.840865612030029, 7.561604022979736, 8.282342910766602, 9.003080368041992, 9.7238187789917, 10.444557189941406, 11.165295600891113, 11.88603401184082, 12.606771469116211, 13.327510833740234, 14.048248291015625, 14.768986701965332, 15.489725112915039, 16.210464477539062, 16.931201934814453, 17.651941299438477, 18.372678756713867, 19.09341812133789, 19.81415557861328, 20.534893035888672, 21.255632400512695, 21.976369857788086]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 8.0, 12.0, 13.0, 15.0, 22.0, 15.0, 28.0, 20.0, 24.0, 25.0, 40.0, 48.0, 51.0, 45.0, 43.0, 37.0, 58.0, 47.0, 42.0, 52.0, 44.0, 42.0, 43.0, 31.0, 33.0, 26.0, 25.0, 19.0, 15.0, 18.0, 8.0, 7.0, 6.0, 7.0, 5.0, 5.0, 0.0, 4.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.685546875, -3.560089111328125, -3.43463134765625, -3.309173583984375, -3.1837158203125, -3.058258056640625, -2.93280029296875, -2.807342529296875, -2.681884765625, -2.556427001953125, -2.43096923828125, -2.305511474609375, -2.1800537109375, -2.054595947265625, -1.92913818359375, -1.803680419921875, -1.67822265625, -1.552764892578125, -1.42730712890625, -1.301849365234375, -1.1763916015625, -1.050933837890625, -0.92547607421875, -0.800018310546875, -0.674560546875, -0.549102783203125, -0.42364501953125, -0.298187255859375, -0.1727294921875, -0.047271728515625, 0.07818603515625, 0.203643798828125, 0.3291015625, 0.454559326171875, 0.58001708984375, 0.705474853515625, 0.8309326171875, 0.956390380859375, 1.08184814453125, 1.207305908203125, 1.332763671875, 1.458221435546875, 1.58367919921875, 1.709136962890625, 1.8345947265625, 1.960052490234375, 2.08551025390625, 2.210968017578125, 2.33642578125, 2.461883544921875, 2.58734130859375, 2.712799072265625, 2.8382568359375, 2.963714599609375, 3.08917236328125, 3.214630126953125, 3.340087890625, 3.465545654296875, 3.59100341796875, 3.716461181640625, 3.8419189453125, 3.967376708984375, 4.09283447265625, 4.218292236328125, 4.34375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 15.0, 13.0, 25.0, 31.0, 58.0, 106.0, 170.0, 258.0, 520.0, 781.0, 1393.0, 2493.0, 3927.0, 6636.0, 10884.0, 17328.0, 27580.0, 41994.0, 61387.0, 84765.0, 110052.0, 126897.0, 130762.0, 117682.0, 95002.0, 71012.0, 49377.0, 32994.0, 21252.0, 13068.0, 8166.0, 4781.0, 2937.0, 1722.0, 975.0, 622.0, 380.0, 175.0, 144.0, 78.0, 45.0, 29.0, 11.0, 8.0, 9.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5400390625, -0.5232696533203125, -0.506500244140625, -0.4897308349609375, -0.47296142578125, -0.4561920166015625, -0.439422607421875, -0.4226531982421875, -0.4058837890625, -0.3891143798828125, -0.372344970703125, -0.3555755615234375, -0.33880615234375, -0.3220367431640625, -0.305267333984375, -0.2884979248046875, -0.271728515625, -0.2549591064453125, -0.238189697265625, -0.2214202880859375, -0.20465087890625, -0.1878814697265625, -0.171112060546875, -0.1543426513671875, -0.1375732421875, -0.1208038330078125, -0.104034423828125, -0.0872650146484375, -0.07049560546875, -0.0537261962890625, -0.036956787109375, -0.0201873779296875, -0.00341796875, 0.0133514404296875, 0.030120849609375, 0.0468902587890625, 0.06365966796875, 0.0804290771484375, 0.097198486328125, 0.1139678955078125, 0.1307373046875, 0.1475067138671875, 0.164276123046875, 0.1810455322265625, 0.19781494140625, 0.2145843505859375, 0.231353759765625, 0.2481231689453125, 0.264892578125, 0.2816619873046875, 0.298431396484375, 0.3152008056640625, 0.33197021484375, 0.3487396240234375, 0.365509033203125, 0.3822784423828125, 0.3990478515625, 0.4158172607421875, 0.432586669921875, 0.4493560791015625, 0.46612548828125, 0.4828948974609375, 0.499664306640625, 0.5164337158203125, 0.533203125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 11.0, 7.0, 11.0, 17.0, 12.0, 25.0, 24.0, 25.0, 30.0, 25.0, 31.0, 33.0, 32.0, 33.0, 32.0, 45.0, 53.0, 47.0, 1063.0, 43.0, 44.0, 37.0, 44.0, 33.0, 23.0, 27.0, 30.0, 24.0, 26.0, 27.0, 20.0, 17.0, 15.0, 13.0, 11.0, 5.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.767578125, -2.679656982421875, -2.59173583984375, -2.503814697265625, -2.4158935546875, -2.327972412109375, -2.24005126953125, -2.152130126953125, -2.064208984375, -1.976287841796875, -1.88836669921875, -1.800445556640625, -1.7125244140625, -1.624603271484375, -1.53668212890625, -1.448760986328125, -1.36083984375, -1.272918701171875, -1.18499755859375, -1.097076416015625, -1.0091552734375, -0.921234130859375, -0.83331298828125, -0.745391845703125, -0.657470703125, -0.569549560546875, -0.48162841796875, -0.393707275390625, -0.3057861328125, -0.217864990234375, -0.12994384765625, -0.042022705078125, 0.0458984375, 0.133819580078125, 0.22174072265625, 0.309661865234375, 0.3975830078125, 0.485504150390625, 0.57342529296875, 0.661346435546875, 0.749267578125, 0.837188720703125, 0.92510986328125, 1.013031005859375, 1.1009521484375, 1.188873291015625, 1.27679443359375, 1.364715576171875, 1.45263671875, 1.540557861328125, 1.62847900390625, 1.716400146484375, 1.8043212890625, 1.892242431640625, 1.98016357421875, 2.068084716796875, 2.156005859375, 2.243927001953125, 2.33184814453125, 2.419769287109375, 2.5076904296875, 2.595611572265625, 2.68353271484375, 2.771453857421875, 2.859375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 9.0, 7.0, 16.0, 20.0, 31.0, 53.0, 53.0, 92.0, 124.0, 176.0, 244.0, 384.0, 547.0, 820.0, 1086.0, 1690.0, 2463.0, 3611.0, 5065.0, 7687.0, 11022.0, 16370.0, 24985.0, 68207.0, 1764595.0, 105691.0, 27085.0, 17391.0, 11822.0, 8153.0, 5535.0, 3784.0, 2567.0, 1769.0, 1189.0, 863.0, 578.0, 389.0, 329.0, 179.0, 156.0, 97.0, 67.0, 42.0, 22.0, 23.0, 15.0, 13.0, 5.0, 4.0, 6.0, 2.0, 5.0, 3.0], "bins": [-1.0693359375, -1.0384140014648438, -1.0074920654296875, -0.9765701293945312, -0.945648193359375, -0.9147262573242188, -0.8838043212890625, -0.8528823852539062, -0.82196044921875, -0.7910385131835938, -0.7601165771484375, -0.7291946411132812, -0.698272705078125, -0.6673507690429688, -0.6364288330078125, -0.6055068969726562, -0.5745849609375, -0.5436630249023438, -0.5127410888671875, -0.48181915283203125, -0.450897216796875, -0.41997528076171875, -0.3890533447265625, -0.35813140869140625, -0.32720947265625, -0.29628753662109375, -0.2653656005859375, -0.23444366455078125, -0.203521728515625, -0.17259979248046875, -0.1416778564453125, -0.11075592041015625, -0.079833984375, -0.04891204833984375, -0.0179901123046875, 0.01293182373046875, 0.043853759765625, 0.07477569580078125, 0.1056976318359375, 0.13661956787109375, 0.16754150390625, 0.19846343994140625, 0.2293853759765625, 0.26030731201171875, 0.291229248046875, 0.32215118408203125, 0.3530731201171875, 0.38399505615234375, 0.4149169921875, 0.44583892822265625, 0.4767608642578125, 0.5076828002929688, 0.538604736328125, 0.5695266723632812, 0.6004486083984375, 0.6313705444335938, 0.66229248046875, 0.6932144165039062, 0.7241363525390625, 0.7550582885742188, 0.785980224609375, 0.8169021606445312, 0.8478240966796875, 0.8787460327148438, 0.90966796875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 6.0, 7.0, 6.0, 9.0, 5.0, 7.0, 9.0, 17.0, 16.0, 18.0, 21.0, 24.0, 26.0, 27.0, 39.0, 48.0, 61.0, 66.0, 65.0, 60.0, 53.0, 55.0, 47.0, 48.0, 32.0, 44.0, 38.0, 29.0, 21.0, 20.0, 20.0, 10.0, 6.0, 8.0, 5.0, 6.0, 6.0, 4.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06781005859375, -0.06559944152832031, -0.06338882446289062, -0.06117820739746094, -0.05896759033203125, -0.05675697326660156, -0.054546356201171875, -0.05233573913574219, -0.0501251220703125, -0.04791450500488281, -0.045703887939453125, -0.04349327087402344, -0.04128265380859375, -0.03907203674316406, -0.036861419677734375, -0.03465080261230469, -0.032440185546875, -0.030229568481445312, -0.028018951416015625, -0.025808334350585938, -0.02359771728515625, -0.021387100219726562, -0.019176483154296875, -0.016965866088867188, -0.0147552490234375, -0.012544631958007812, -0.010334014892578125, -0.008123397827148438, -0.00591278076171875, -0.0037021636962890625, -0.001491546630859375, 0.0007190704345703125, 0.0029296875, 0.0051403045654296875, 0.007350921630859375, 0.009561538696289062, 0.01177215576171875, 0.013982772827148438, 0.016193389892578125, 0.018404006958007812, 0.0206146240234375, 0.022825241088867188, 0.025035858154296875, 0.027246475219726562, 0.02945709228515625, 0.03166770935058594, 0.033878326416015625, 0.03608894348144531, 0.038299560546875, 0.04051017761230469, 0.042720794677734375, 0.04493141174316406, 0.04714202880859375, 0.04935264587402344, 0.051563262939453125, 0.05377388000488281, 0.0559844970703125, 0.05819511413574219, 0.060405731201171875, 0.06261634826660156, 0.06482696533203125, 0.06703758239746094, 0.06924819946289062, 0.07145881652832031, 0.07366943359375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 5.0, 6.0, 5.0, 6.0, 5.0, 11.0, 7.0, 1.0, 25.0, 16.0, 33.0, 37.0, 41.0, 65.0, 80.0, 112.0, 201.0, 339.0, 866.0, 91341.0, 952726.0, 1407.0, 471.0, 235.0, 146.0, 80.0, 53.0, 47.0, 40.0, 28.0, 28.0, 20.0, 18.0, 9.0, 7.0, 6.0, 7.0, 8.0, 9.0, 7.0, 0.0, 2.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.546875, -1.5002288818359375, -1.453582763671875, -1.4069366455078125, -1.36029052734375, -1.3136444091796875, -1.266998291015625, -1.2203521728515625, -1.1737060546875, -1.1270599365234375, -1.080413818359375, -1.0337677001953125, -0.98712158203125, -0.9404754638671875, -0.893829345703125, -0.8471832275390625, -0.800537109375, -0.7538909912109375, -0.707244873046875, -0.6605987548828125, -0.61395263671875, -0.5673065185546875, -0.520660400390625, -0.4740142822265625, -0.4273681640625, -0.3807220458984375, -0.334075927734375, -0.2874298095703125, -0.24078369140625, -0.1941375732421875, -0.147491455078125, -0.1008453369140625, -0.05419921875, -0.0075531005859375, 0.039093017578125, 0.0857391357421875, 0.13238525390625, 0.1790313720703125, 0.225677490234375, 0.2723236083984375, 0.3189697265625, 0.3656158447265625, 0.412261962890625, 0.4589080810546875, 0.50555419921875, 0.5522003173828125, 0.598846435546875, 0.6454925537109375, 0.692138671875, 0.7387847900390625, 0.785430908203125, 0.8320770263671875, 0.87872314453125, 0.9253692626953125, 0.972015380859375, 1.0186614990234375, 1.0653076171875, 1.1119537353515625, 1.158599853515625, 1.2052459716796875, 1.25189208984375, 1.2985382080078125, 1.345184326171875, 1.3918304443359375, 1.4384765625]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 33.0, 600.0, 332.0, 41.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15637043118476868, -0.12965568900108337, -0.10294094681739807, -0.07622619718313217, -0.04951145499944687, -0.02279670536518097, 0.0039180368185043335, 0.030632779002189636, 0.05734752118587494, 0.08406226336956024, 0.11077700555324554, 0.13749176263809204, 0.16420650482177734, 0.19092124700546265, 0.21763598918914795, 0.24435073137283325, 0.27106547355651855, 0.29778021574020386, 0.32449495792388916, 0.35120970010757446, 0.37792444229125977, 0.40463918447494507, 0.43135392665863037, 0.4580686688423157, 0.484783411026001, 0.5114981532096863, 0.5382128953933716, 0.5649276375770569, 0.5916423797607422, 0.6183571219444275, 0.6450718641281128, 0.6717866063117981, 0.6985014081001282, 0.7252161502838135, 0.7519308924674988, 0.7786456346511841, 0.8053603768348694, 0.8320751190185547, 0.85878986120224, 0.8855046033859253, 0.9122193455696106, 0.9389340877532959, 0.9656488299369812, 0.9923635721206665, 1.0190783739089966, 1.045793056488037, 1.0725078582763672, 1.0992225408554077, 1.1259373426437378, 1.1526521444320679, 1.1793668270111084, 1.2060816287994385, 1.232796311378479, 1.259511113166809, 1.2862257957458496, 1.3129405975341797, 1.3396552801132202, 1.3663700819015503, 1.3930847644805908, 1.419799566268921, 1.4465142488479614, 1.4732290506362915, 1.499943733215332, 1.526658535003662, 1.5533732175827026]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 9.0, 3.0, 3.0, 7.0, 9.0, 18.0, 22.0, 13.0, 21.0, 17.0, 27.0, 28.0, 29.0, 22.0, 38.0, 38.0, 21.0, 31.0, 32.0, 40.0, 35.0, 41.0, 29.0, 42.0, 31.0, 46.0, 34.0, 39.0, 41.0, 31.0, 23.0, 26.0, 25.0, 11.0, 12.0, 17.0, 17.0, 15.0, 12.0, 9.0, 8.0, 7.0, 6.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.18165600299835205, -0.17578279972076416, -0.16990958154201508, -0.16403637826442719, -0.1581631600856781, -0.1522899568080902, -0.14641675353050232, -0.14054353535175323, -0.13467031717300415, -0.12879711389541626, -0.12292389571666718, -0.11705069243907928, -0.1111774742603302, -0.10530427098274231, -0.09943106025457382, -0.09355784952640533, -0.08768464624881744, -0.08181143552064896, -0.07593822479248047, -0.07006502151489258, -0.0641918033361435, -0.058318596333265305, -0.052445389330387115, -0.04657217860221863, -0.04069896787405014, -0.03482575714588165, -0.028952548280358315, -0.023079339414834976, -0.01720612868666649, -0.011332917958498001, -0.005459710955619812, 0.00041349977254867554, 0.006286710500717163, 0.012159920297563076, 0.01803313009440899, 0.023906338959932327, 0.029779549688100815, 0.0356527604162693, 0.04152596741914749, 0.04739917814731598, 0.05327238887548447, 0.059145599603652954, 0.06501881033182144, 0.07089202105998993, 0.07676522433757782, 0.0826384425163269, 0.0885116457939148, 0.09438485652208328, 0.10025806725025177, 0.10613127797842026, 0.11200448870658875, 0.11787769198417664, 0.12375091016292572, 0.1296241134405136, 0.1354973316192627, 0.14137053489685059, 0.14724373817443848, 0.15311694145202637, 0.15899015963077545, 0.16486336290836334, 0.17073658108711243, 0.17660978436470032, 0.1824829876422882, 0.1883562058210373, 0.19422942399978638]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 11.0, 6.0, 3.0, 15.0, 8.0, 18.0, 13.0, 20.0, 29.0, 25.0, 23.0, 31.0, 50.0, 56.0, 56.0, 55.0, 48.0, 47.0, 52.0, 50.0, 58.0, 45.0, 41.0, 43.0, 36.0, 36.0, 26.0, 14.0, 26.0, 15.0, 13.0, 11.0, 10.0, 5.0, 2.0, 1.0, 3.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.55078125, -4.41094970703125, -4.2711181640625, -4.13128662109375, -3.991455078125, -3.85162353515625, -3.7117919921875, -3.57196044921875, -3.43212890625, -3.29229736328125, -3.1524658203125, -3.01263427734375, -2.872802734375, -2.73297119140625, -2.5931396484375, -2.45330810546875, -2.3134765625, -2.17364501953125, -2.0338134765625, -1.89398193359375, -1.754150390625, -1.61431884765625, -1.4744873046875, -1.33465576171875, -1.19482421875, -1.05499267578125, -0.9151611328125, -0.77532958984375, -0.635498046875, -0.49566650390625, -0.3558349609375, -0.21600341796875, -0.076171875, 0.06365966796875, 0.2034912109375, 0.34332275390625, 0.483154296875, 0.62298583984375, 0.7628173828125, 0.90264892578125, 1.04248046875, 1.18231201171875, 1.3221435546875, 1.46197509765625, 1.601806640625, 1.74163818359375, 1.8814697265625, 2.02130126953125, 2.1611328125, 2.30096435546875, 2.4407958984375, 2.58062744140625, 2.720458984375, 2.86029052734375, 3.0001220703125, 3.13995361328125, 3.27978515625, 3.41961669921875, 3.5594482421875, 3.69927978515625, 3.839111328125, 3.97894287109375, 4.1187744140625, 4.25860595703125, 4.3984375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 11.0, 13.0, 9.0, 14.0, 17.0, 27.0, 31.0, 46.0, 64.0, 104.0, 185.0, 392.0, 906.0, 1967.0, 4636.0, 10700.0, 26130.0, 75736.0, 256233.0, 422863.0, 165595.0, 49924.0, 18626.0, 7932.0, 3540.0, 1450.0, 611.0, 319.0, 149.0, 97.0, 67.0, 49.0, 35.0, 30.0, 13.0, 5.0, 7.0, 5.0, 4.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.3828125, -5.2109375, -5.0390625, -4.8671875, -4.6953125, -4.5234375, -4.3515625, -4.1796875, -4.0078125, -3.8359375, -3.6640625, -3.4921875, -3.3203125, -3.1484375, -2.9765625, -2.8046875, -2.6328125, -2.4609375, -2.2890625, -2.1171875, -1.9453125, -1.7734375, -1.6015625, -1.4296875, -1.2578125, -1.0859375, -0.9140625, -0.7421875, -0.5703125, -0.3984375, -0.2265625, -0.0546875, 0.1171875, 0.2890625, 0.4609375, 0.6328125, 0.8046875, 0.9765625, 1.1484375, 1.3203125, 1.4921875, 1.6640625, 1.8359375, 2.0078125, 2.1796875, 2.3515625, 2.5234375, 2.6953125, 2.8671875, 3.0390625, 3.2109375, 3.3828125, 3.5546875, 3.7265625, 3.8984375, 4.0703125, 4.2421875, 4.4140625, 4.5859375, 4.7578125, 4.9296875, 5.1015625, 5.2734375, 5.4453125, 5.6171875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 8.0, 7.0, 8.0, 5.0, 9.0, 6.0, 16.0, 11.0, 24.0, 19.0, 19.0, 20.0, 37.0, 36.0, 31.0, 40.0, 43.0, 58.0, 84.0, 178.0, 313.0, 1343.0, 192.0, 104.0, 66.0, 47.0, 31.0, 36.0, 29.0, 38.0, 26.0, 30.0, 23.0, 14.0, 13.0, 9.0, 14.0, 13.0, 9.0, 10.0, 9.0, 6.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-10.9765625, -10.6546630859375, -10.332763671875, -10.0108642578125, -9.68896484375, -9.3670654296875, -9.045166015625, -8.7232666015625, -8.4013671875, -8.0794677734375, -7.757568359375, -7.4356689453125, -7.11376953125, -6.7918701171875, -6.469970703125, -6.1480712890625, -5.826171875, -5.5042724609375, -5.182373046875, -4.8604736328125, -4.53857421875, -4.2166748046875, -3.894775390625, -3.5728759765625, -3.2509765625, -2.9290771484375, -2.607177734375, -2.2852783203125, -1.96337890625, -1.6414794921875, -1.319580078125, -0.9976806640625, -0.67578125, -0.3538818359375, -0.031982421875, 0.2899169921875, 0.61181640625, 0.9337158203125, 1.255615234375, 1.5775146484375, 1.8994140625, 2.2213134765625, 2.543212890625, 2.8651123046875, 3.18701171875, 3.5089111328125, 3.830810546875, 4.1527099609375, 4.474609375, 4.7965087890625, 5.118408203125, 5.4403076171875, 5.76220703125, 6.0841064453125, 6.406005859375, 6.7279052734375, 7.0498046875, 7.3717041015625, 7.693603515625, 8.0155029296875, 8.33740234375, 8.6593017578125, 8.981201171875, 9.3031005859375, 9.625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 5.0, 4.0, 8.0, 11.0, 19.0, 18.0, 21.0, 17.0, 25.0, 46.0, 69.0, 76.0, 114.0, 143.0, 231.0, 350.0, 738.0, 2855.0, 28992.0, 1653550.0, 1427713.0, 26227.0, 2577.0, 740.0, 343.0, 210.0, 172.0, 98.0, 68.0, 53.0, 48.0, 29.0, 28.0, 18.0, 16.0, 17.0, 9.0, 7.0, 5.0, 8.0, 6.0, 2.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6875, -14.16259765625, -13.6376953125, -13.11279296875, -12.587890625, -12.06298828125, -11.5380859375, -11.01318359375, -10.48828125, -9.96337890625, -9.4384765625, -8.91357421875, -8.388671875, -7.86376953125, -7.3388671875, -6.81396484375, -6.2890625, -5.76416015625, -5.2392578125, -4.71435546875, -4.189453125, -3.66455078125, -3.1396484375, -2.61474609375, -2.08984375, -1.56494140625, -1.0400390625, -0.51513671875, 0.009765625, 0.53466796875, 1.0595703125, 1.58447265625, 2.109375, 2.63427734375, 3.1591796875, 3.68408203125, 4.208984375, 4.73388671875, 5.2587890625, 5.78369140625, 6.30859375, 6.83349609375, 7.3583984375, 7.88330078125, 8.408203125, 8.93310546875, 9.4580078125, 9.98291015625, 10.5078125, 11.03271484375, 11.5576171875, 12.08251953125, 12.607421875, 13.13232421875, 13.6572265625, 14.18212890625, 14.70703125, 15.23193359375, 15.7568359375, 16.28173828125, 16.806640625, 17.33154296875, 17.8564453125, 18.38134765625, 18.90625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 26.0, 124.0, 349.0, 379.0, 113.0, 22.0, 2.0, 0.0, 0.0, 2.0], "bins": [-107.14595031738281, -105.26579284667969, -103.38563537597656, -101.50547790527344, -99.62532806396484, -97.74517059326172, -95.8650131225586, -93.98485565185547, -92.10469818115234, -90.22454071044922, -88.3443832397461, -86.4642333984375, -84.58407592773438, -82.70391845703125, -80.82376098632812, -78.943603515625, -77.06344604492188, -75.18328857421875, -73.30313110351562, -71.4229736328125, -69.5428237915039, -67.66266632080078, -65.78250885009766, -63.90235137939453, -62.02220153808594, -60.14204406738281, -58.26189041137695, -56.38173294067383, -54.5015754699707, -52.621421813964844, -50.74126434326172, -48.861106872558594, -46.98094940185547, -45.100791931152344, -43.220638275146484, -41.34048080444336, -39.460323333740234, -37.580169677734375, -35.70001220703125, -33.819854736328125, -31.939701080322266, -30.059545516967773, -28.17938804626465, -26.299232482910156, -24.41907501220703, -22.53891944885254, -20.658763885498047, -18.778606414794922, -16.898448944091797, -15.018292427062988, -13.13813591003418, -11.257980346679688, -9.377823829650879, -7.49766731262207, -5.617511749267578, -3.7373552322387695, -1.8571996688842773, 0.02295660972595215, 1.9031128883361816, 3.783268928527832, 5.663425445556641, 7.543581962585449, 9.423737525939941, 11.30389404296875, 13.184050559997559]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 5.0, 11.0, 11.0, 15.0, 11.0, 10.0, 22.0, 25.0, 38.0, 28.0, 36.0, 31.0, 48.0, 31.0, 42.0, 39.0, 44.0, 46.0, 52.0, 47.0, 46.0, 49.0, 45.0, 29.0, 28.0, 29.0, 25.0, 16.0, 26.0, 28.0, 17.0, 16.0, 11.0, 7.0, 7.0, 3.0, 5.0, 1.0, 7.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.771194458007812, -26.84799575805664, -25.92479705810547, -25.00160026550293, -24.078401565551758, -23.155202865600586, -22.232006072998047, -21.308807373046875, -20.385608673095703, -19.46240997314453, -18.53921127319336, -17.61601448059082, -16.69281578063965, -15.769617080688477, -14.846419334411621, -13.923221588134766, -13.000022888183594, -12.076824188232422, -11.153626441955566, -10.230428695678711, -9.307229995727539, -8.384031295776367, -7.460833549499512, -6.537635326385498, -5.614437103271484, -4.691238880157471, -3.768040657043457, -2.8448424339294434, -1.9216442108154297, -0.998445987701416, -0.07524776458740234, 0.8479504585266113, 1.7711505889892578, 2.6943488121032715, 3.617547035217285, 4.540745258331299, 5.4639434814453125, 6.387141704559326, 7.31033992767334, 8.233537673950195, 9.156736373901367, 10.079935073852539, 11.003132820129395, 11.92633056640625, 12.849529266357422, 13.772727966308594, 14.69592571258545, 15.619123458862305, 16.542322158813477, 17.46552085876465, 18.388717651367188, 19.31191635131836, 20.23511505126953, 21.158313751220703, 22.081512451171875, 23.004709243774414, 23.927907943725586, 24.851106643676758, 25.774303436279297, 26.69750213623047, 27.62070083618164, 28.543899536132812, 29.467098236083984, 30.390295028686523, 31.313493728637695]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 11.0, 9.0, 12.0, 23.0, 22.0, 25.0, 27.0, 34.0, 33.0, 42.0, 34.0, 47.0, 53.0, 42.0, 66.0, 46.0, 53.0, 56.0, 54.0, 46.0, 35.0, 37.0, 29.0, 36.0, 25.0, 12.0, 28.0, 13.0, 5.0, 2.0, 10.0, 9.0, 5.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.21875, -4.078369140625, -3.93798828125, -3.797607421875, -3.6572265625, -3.516845703125, -3.37646484375, -3.236083984375, -3.095703125, -2.955322265625, -2.81494140625, -2.674560546875, -2.5341796875, -2.393798828125, -2.25341796875, -2.113037109375, -1.97265625, -1.832275390625, -1.69189453125, -1.551513671875, -1.4111328125, -1.270751953125, -1.13037109375, -0.989990234375, -0.849609375, -0.709228515625, -0.56884765625, -0.428466796875, -0.2880859375, -0.147705078125, -0.00732421875, 0.133056640625, 0.2734375, 0.413818359375, 0.55419921875, 0.694580078125, 0.8349609375, 0.975341796875, 1.11572265625, 1.256103515625, 1.396484375, 1.536865234375, 1.67724609375, 1.817626953125, 1.9580078125, 2.098388671875, 2.23876953125, 2.379150390625, 2.51953125, 2.659912109375, 2.80029296875, 2.940673828125, 3.0810546875, 3.221435546875, 3.36181640625, 3.502197265625, 3.642578125, 3.782958984375, 3.92333984375, 4.063720703125, 4.2041015625, 4.344482421875, 4.48486328125, 4.625244140625, 4.765625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 5.0, 18.0, 12.0, 16.0, 15.0, 27.0, 38.0, 68.0, 108.0, 197.0, 390.0, 808.0, 1965.0, 5466.0, 17070.0, 59822.0, 217821.0, 788248.0, 1740388.0, 977511.0, 278780.0, 74268.0, 20831.0, 6371.0, 2238.0, 846.0, 407.0, 188.0, 106.0, 68.0, 49.0, 22.0, 27.0, 16.0, 18.0, 10.0, 10.0, 3.0, 4.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.09375, -4.9324951171875, -4.771240234375, -4.6099853515625, -4.44873046875, -4.2874755859375, -4.126220703125, -3.9649658203125, -3.8037109375, -3.6424560546875, -3.481201171875, -3.3199462890625, -3.15869140625, -2.9974365234375, -2.836181640625, -2.6749267578125, -2.513671875, -2.3524169921875, -2.191162109375, -2.0299072265625, -1.86865234375, -1.7073974609375, -1.546142578125, -1.3848876953125, -1.2236328125, -1.0623779296875, -0.901123046875, -0.7398681640625, -0.57861328125, -0.4173583984375, -0.256103515625, -0.0948486328125, 0.06640625, 0.2276611328125, 0.388916015625, 0.5501708984375, 0.71142578125, 0.8726806640625, 1.033935546875, 1.1951904296875, 1.3564453125, 1.5177001953125, 1.678955078125, 1.8402099609375, 2.00146484375, 2.1627197265625, 2.323974609375, 2.4852294921875, 2.646484375, 2.8077392578125, 2.968994140625, 3.1302490234375, 3.29150390625, 3.4527587890625, 3.614013671875, 3.7752685546875, 3.9365234375, 4.0977783203125, 4.259033203125, 4.4202880859375, 4.58154296875, 4.7427978515625, 4.904052734375, 5.0653076171875, 5.2265625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 8.0, 4.0, 7.0, 10.0, 3.0, 11.0, 23.0, 24.0, 41.0, 51.0, 79.0, 86.0, 115.0, 178.0, 207.0, 276.0, 336.0, 401.0, 415.0, 386.0, 336.0, 247.0, 208.0, 152.0, 119.0, 84.0, 70.0, 57.0, 30.0, 29.0, 19.0, 15.0, 12.0, 12.0, 6.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.96484375, -4.80218505859375, -4.6395263671875, -4.47686767578125, -4.314208984375, -4.15155029296875, -3.9888916015625, -3.82623291015625, -3.66357421875, -3.50091552734375, -3.3382568359375, -3.17559814453125, -3.012939453125, -2.85028076171875, -2.6876220703125, -2.52496337890625, -2.3623046875, -2.19964599609375, -2.0369873046875, -1.87432861328125, -1.711669921875, -1.54901123046875, -1.3863525390625, -1.22369384765625, -1.06103515625, -0.89837646484375, -0.7357177734375, -0.57305908203125, -0.410400390625, -0.24774169921875, -0.0850830078125, 0.07757568359375, 0.240234375, 0.40289306640625, 0.5655517578125, 0.72821044921875, 0.890869140625, 1.05352783203125, 1.2161865234375, 1.37884521484375, 1.54150390625, 1.70416259765625, 1.8668212890625, 2.02947998046875, 2.192138671875, 2.35479736328125, 2.5174560546875, 2.68011474609375, 2.8427734375, 3.00543212890625, 3.1680908203125, 3.33074951171875, 3.493408203125, 3.65606689453125, 3.8187255859375, 3.98138427734375, 4.14404296875, 4.30670166015625, 4.4693603515625, 4.63201904296875, 4.794677734375, 4.95733642578125, 5.1199951171875, 5.28265380859375, 5.4453125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 12.0, 18.0, 32.0, 45.0, 70.0, 121.0, 195.0, 314.0, 583.0, 1589.0, 16703.0, 851719.0, 3234914.0, 82579.0, 3426.0, 887.0, 411.0, 243.0, 167.0, 97.0, 51.0, 28.0, 20.0, 18.0, 8.0, 9.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-25.21875, -24.60693359375, -23.9951171875, -23.38330078125, -22.771484375, -22.15966796875, -21.5478515625, -20.93603515625, -20.32421875, -19.71240234375, -19.1005859375, -18.48876953125, -17.876953125, -17.26513671875, -16.6533203125, -16.04150390625, -15.4296875, -14.81787109375, -14.2060546875, -13.59423828125, -12.982421875, -12.37060546875, -11.7587890625, -11.14697265625, -10.53515625, -9.92333984375, -9.3115234375, -8.69970703125, -8.087890625, -7.47607421875, -6.8642578125, -6.25244140625, -5.640625, -5.02880859375, -4.4169921875, -3.80517578125, -3.193359375, -2.58154296875, -1.9697265625, -1.35791015625, -0.74609375, -0.13427734375, 0.4775390625, 1.08935546875, 1.701171875, 2.31298828125, 2.9248046875, 3.53662109375, 4.1484375, 4.76025390625, 5.3720703125, 5.98388671875, 6.595703125, 7.20751953125, 7.8193359375, 8.43115234375, 9.04296875, 9.65478515625, 10.2666015625, 10.87841796875, 11.490234375, 12.10205078125, 12.7138671875, 13.32568359375, 13.9375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 65.0, 387.0, 434.0, 120.0, 9.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.4931411743164, -69.65304565429688, -65.81295776367188, -61.972862243652344, -58.13276672363281, -54.29267501831055, -50.45258331298828, -46.61248779296875, -42.772396087646484, -38.93230438232422, -35.09220886230469, -31.252117156982422, -27.412023544311523, -23.571929931640625, -19.73183822631836, -15.891744613647461, -12.051651000976562, -8.211557388305664, -4.371464729309082, -0.5313720703125, 3.3087215423583984, 7.148815155029297, 10.988906860351562, 14.829000473022461, 18.66909408569336, 22.509187698364258, 26.349281311035156, 30.189373016357422, 34.02946472167969, 37.86956024169922, 41.709651947021484, 45.54974365234375, 49.38983154296875, 53.229923248291016, 57.07001876831055, 60.91011047363281, 64.75020599365234, 68.59030151367188, 72.43038940429688, 76.2704849243164, 80.11058044433594, 83.95067596435547, 87.79076385498047, 91.630859375, 95.47095489501953, 99.31105041503906, 103.15113830566406, 106.9912338256836, 110.8313217163086, 114.67141723632812, 118.51150512695312, 122.35160064697266, 126.19169616699219, 130.0317840576172, 133.87188720703125, 137.71197509765625, 141.55206298828125, 145.39215087890625, 149.2322540283203, 153.0723419189453, 156.9124298095703, 160.75253295898438, 164.59262084960938, 168.43270874023438, 172.27281188964844]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 3.0, 8.0, 6.0, 10.0, 7.0, 16.0, 11.0, 20.0, 18.0, 20.0, 32.0, 26.0, 21.0, 32.0, 27.0, 45.0, 37.0, 45.0, 53.0, 46.0, 49.0, 46.0, 35.0, 39.0, 35.0, 43.0, 33.0, 32.0, 26.0, 25.0, 18.0, 25.0, 21.0, 14.0, 10.0, 8.0, 7.0, 12.0, 9.0, 6.0, 11.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0], "bins": [-22.357097625732422, -21.753122329711914, -21.14914894104004, -20.54517364501953, -19.941198348999023, -19.33722496032715, -18.73324966430664, -18.129276275634766, -17.525300979614258, -16.92132568359375, -16.317352294921875, -15.713376998901367, -15.109402656555176, -14.505428314208984, -13.901453018188477, -13.297478675842285, -12.693503379821777, -12.089529037475586, -11.485553741455078, -10.881579399108887, -10.277605056762695, -9.673629760742188, -9.069655418395996, -8.465681076049805, -7.861706256866455, -7.2577314376831055, -6.653757095336914, -6.0497822761535645, -5.445807456970215, -4.841833114624023, -4.237858295440674, -3.6338839530944824, -3.029909133911133, -2.4259345531463623, -1.8219598531723022, -1.2179851531982422, -0.6140105724334717, -0.010035991668701172, 0.5939388275146484, 1.1979131698608398, 1.8018879890441895, 2.40586256980896, 3.0098371505737305, 3.61381196975708, 4.21778678894043, 4.821761131286621, 5.425735950469971, 6.029710292816162, 6.633685111999512, 7.237659931182861, 7.841634273529053, 8.445609092712402, 9.049583435058594, 9.653558731079102, 10.257533073425293, 10.861507415771484, 11.465482711791992, 12.069457054138184, 12.673432350158691, 13.277406692504883, 13.881381034851074, 14.485355377197266, 15.089330673217773, 15.693305015563965, 16.297279357910156]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 4.0, 4.0, 9.0, 9.0, 12.0, 22.0, 18.0, 17.0, 18.0, 43.0, 37.0, 47.0, 48.0, 47.0, 41.0, 65.0, 57.0, 68.0, 51.0, 53.0, 43.0, 45.0, 39.0, 33.0, 41.0, 27.0, 16.0, 19.0, 23.0, 15.0, 14.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7734375, -4.62432861328125, -4.4752197265625, -4.32611083984375, -4.177001953125, -4.02789306640625, -3.8787841796875, -3.72967529296875, -3.58056640625, -3.43145751953125, -3.2823486328125, -3.13323974609375, -2.984130859375, -2.83502197265625, -2.6859130859375, -2.53680419921875, -2.3876953125, -2.23858642578125, -2.0894775390625, -1.94036865234375, -1.791259765625, -1.64215087890625, -1.4930419921875, -1.34393310546875, -1.19482421875, -1.04571533203125, -0.8966064453125, -0.74749755859375, -0.598388671875, -0.44927978515625, -0.3001708984375, -0.15106201171875, -0.001953125, 0.14715576171875, 0.2962646484375, 0.44537353515625, 0.594482421875, 0.74359130859375, 0.8927001953125, 1.04180908203125, 1.19091796875, 1.34002685546875, 1.4891357421875, 1.63824462890625, 1.787353515625, 1.93646240234375, 2.0855712890625, 2.23468017578125, 2.3837890625, 2.53289794921875, 2.6820068359375, 2.83111572265625, 2.980224609375, 3.12933349609375, 3.2784423828125, 3.42755126953125, 3.57666015625, 3.72576904296875, 3.8748779296875, 4.02398681640625, 4.173095703125, 4.32220458984375, 4.4713134765625, 4.62042236328125, 4.76953125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 9.0, 17.0, 24.0, 31.0, 72.0, 109.0, 177.0, 254.0, 390.0, 630.0, 971.0, 1685.0, 2556.0, 3964.0, 6460.0, 9813.0, 14962.0, 22095.0, 32549.0, 46076.0, 62919.0, 81675.0, 99369.0, 112641.0, 115566.0, 105962.0, 89590.0, 70552.0, 52762.0, 37651.0, 26207.0, 17575.0, 11535.0, 7840.0, 5093.0, 3268.0, 2001.0, 1324.0, 789.0, 528.0, 340.0, 204.0, 129.0, 81.0, 44.0, 25.0, 21.0, 5.0, 6.0, 10.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.437744140625, -0.4237213134765625, -0.409698486328125, -0.3956756591796875, -0.38165283203125, -0.3676300048828125, -0.353607177734375, -0.3395843505859375, -0.3255615234375, -0.3115386962890625, -0.297515869140625, -0.2834930419921875, -0.26947021484375, -0.2554473876953125, -0.241424560546875, -0.2274017333984375, -0.21337890625, -0.1993560791015625, -0.185333251953125, -0.1713104248046875, -0.15728759765625, -0.1432647705078125, -0.129241943359375, -0.1152191162109375, -0.1011962890625, -0.0871734619140625, -0.073150634765625, -0.0591278076171875, -0.04510498046875, -0.0310821533203125, -0.017059326171875, -0.0030364990234375, 0.010986328125, 0.0250091552734375, 0.039031982421875, 0.0530548095703125, 0.06707763671875, 0.0811004638671875, 0.095123291015625, 0.1091461181640625, 0.1231689453125, 0.1371917724609375, 0.151214599609375, 0.1652374267578125, 0.17926025390625, 0.1932830810546875, 0.207305908203125, 0.2213287353515625, 0.2353515625, 0.2493743896484375, 0.263397216796875, 0.2774200439453125, 0.29144287109375, 0.3054656982421875, 0.319488525390625, 0.3335113525390625, 0.3475341796875, 0.3615570068359375, 0.375579833984375, 0.3896026611328125, 0.40362548828125, 0.4176483154296875, 0.431671142578125, 0.4456939697265625, 0.459716796875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 2.0, 10.0, 13.0, 12.0, 14.0, 13.0, 14.0, 19.0, 27.0, 27.0, 32.0, 26.0, 36.0, 33.0, 25.0, 37.0, 46.0, 42.0, 34.0, 1064.0, 45.0, 37.0, 36.0, 49.0, 31.0, 37.0, 26.0, 27.0, 23.0, 33.0, 24.0, 17.0, 22.0, 11.0, 16.0, 14.0, 7.0, 11.0, 6.0, 5.0, 3.0, 2.0, 7.0, 3.0, 0.0, 1.0, 1.0, 3.0], "bins": [-3.06640625, -2.9798583984375, -2.893310546875, -2.8067626953125, -2.72021484375, -2.6336669921875, -2.547119140625, -2.4605712890625, -2.3740234375, -2.2874755859375, -2.200927734375, -2.1143798828125, -2.02783203125, -1.9412841796875, -1.854736328125, -1.7681884765625, -1.681640625, -1.5950927734375, -1.508544921875, -1.4219970703125, -1.33544921875, -1.2489013671875, -1.162353515625, -1.0758056640625, -0.9892578125, -0.9027099609375, -0.816162109375, -0.7296142578125, -0.64306640625, -0.5565185546875, -0.469970703125, -0.3834228515625, -0.296875, -0.2103271484375, -0.123779296875, -0.0372314453125, 0.04931640625, 0.1358642578125, 0.222412109375, 0.3089599609375, 0.3955078125, 0.4820556640625, 0.568603515625, 0.6551513671875, 0.74169921875, 0.8282470703125, 0.914794921875, 1.0013427734375, 1.087890625, 1.1744384765625, 1.260986328125, 1.3475341796875, 1.43408203125, 1.5206298828125, 1.607177734375, 1.6937255859375, 1.7802734375, 1.8668212890625, 1.953369140625, 2.0399169921875, 2.12646484375, 2.2130126953125, 2.299560546875, 2.3861083984375, 2.47265625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 7.0, 9.0, 4.0, 9.0, 16.0, 17.0, 40.0, 54.0, 57.0, 112.0, 124.0, 195.0, 248.0, 425.0, 558.0, 807.0, 1109.0, 1715.0, 2425.0, 3440.0, 4842.0, 7009.0, 10077.0, 14818.0, 22036.0, 45103.0, 1545987.0, 336582.0, 34999.0, 19984.0, 13470.0, 9252.0, 6586.0, 4629.0, 3085.0, 2256.0, 1531.0, 1044.0, 750.0, 523.0, 361.0, 283.0, 166.0, 123.0, 83.0, 53.0, 48.0, 31.0, 20.0, 12.0, 7.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.8564453125, -0.8287124633789062, -0.8009796142578125, -0.7732467651367188, -0.745513916015625, -0.7177810668945312, -0.6900482177734375, -0.6623153686523438, -0.63458251953125, -0.6068496704101562, -0.5791168212890625, -0.5513839721679688, -0.523651123046875, -0.49591827392578125, -0.4681854248046875, -0.44045257568359375, -0.4127197265625, -0.38498687744140625, -0.3572540283203125, -0.32952117919921875, -0.301788330078125, -0.27405548095703125, -0.2463226318359375, -0.21858978271484375, -0.19085693359375, -0.16312408447265625, -0.1353912353515625, -0.10765838623046875, -0.079925537109375, -0.05219268798828125, -0.0244598388671875, 0.00327301025390625, 0.031005859375, 0.05873870849609375, 0.0864715576171875, 0.11420440673828125, 0.141937255859375, 0.16967010498046875, 0.1974029541015625, 0.22513580322265625, 0.25286865234375, 0.28060150146484375, 0.3083343505859375, 0.33606719970703125, 0.363800048828125, 0.39153289794921875, 0.4192657470703125, 0.44699859619140625, 0.4747314453125, 0.5024642944335938, 0.5301971435546875, 0.5579299926757812, 0.585662841796875, 0.6133956909179688, 0.6411285400390625, 0.6688613891601562, 0.69659423828125, 0.7243270874023438, 0.7520599365234375, 0.7797927856445312, 0.807525634765625, 0.8352584838867188, 0.8629913330078125, 0.8907241821289062, 0.91845703125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 5.0, 4.0, 4.0, 12.0, 4.0, 17.0, 8.0, 13.0, 16.0, 18.0, 20.0, 21.0, 30.0, 37.0, 39.0, 38.0, 49.0, 57.0, 56.0, 61.0, 60.0, 61.0, 45.0, 62.0, 37.0, 30.0, 26.0, 31.0, 25.0, 18.0, 21.0, 17.0, 12.0, 6.0, 7.0, 7.0, 4.0, 5.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-0.055511474609375, -0.053720951080322266, -0.05193042755126953, -0.0501399040222168, -0.04834938049316406, -0.04655885696411133, -0.044768333435058594, -0.04297780990600586, -0.041187286376953125, -0.03939676284790039, -0.037606239318847656, -0.03581571578979492, -0.03402519226074219, -0.03223466873168945, -0.03044414520263672, -0.028653621673583984, -0.02686309814453125, -0.025072574615478516, -0.02328205108642578, -0.021491527557373047, -0.019701004028320312, -0.017910480499267578, -0.016119956970214844, -0.01432943344116211, -0.012538909912109375, -0.01074838638305664, -0.008957862854003906, -0.007167339324951172, -0.0053768157958984375, -0.003586292266845703, -0.0017957687377929688, -5.245208740234375e-06, 0.0017852783203125, 0.0035758018493652344, 0.005366325378417969, 0.007156848907470703, 0.008947372436523438, 0.010737895965576172, 0.012528419494628906, 0.01431894302368164, 0.016109466552734375, 0.01789999008178711, 0.019690513610839844, 0.021481037139892578, 0.023271560668945312, 0.025062084197998047, 0.02685260772705078, 0.028643131256103516, 0.03043365478515625, 0.032224178314208984, 0.03401470184326172, 0.03580522537231445, 0.03759574890136719, 0.03938627243041992, 0.041176795959472656, 0.04296731948852539, 0.044757843017578125, 0.04654836654663086, 0.048338890075683594, 0.05012941360473633, 0.05191993713378906, 0.0537104606628418, 0.05550098419189453, 0.057291507720947266, 0.05908203125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 4.0, 7.0, 4.0, 8.0, 16.0, 18.0, 27.0, 25.0, 34.0, 44.0, 45.0, 81.0, 133.0, 218.0, 353.0, 1141.0, 667937.0, 376301.0, 1077.0, 388.0, 194.0, 130.0, 86.0, 59.0, 47.0, 25.0, 25.0, 28.0, 14.0, 14.0, 8.0, 12.0, 9.0, 10.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.318359375, -1.2771148681640625, -1.235870361328125, -1.1946258544921875, -1.15338134765625, -1.1121368408203125, -1.070892333984375, -1.0296478271484375, -0.9884033203125, -0.9471588134765625, -0.905914306640625, -0.8646697998046875, -0.82342529296875, -0.7821807861328125, -0.740936279296875, -0.6996917724609375, -0.658447265625, -0.6172027587890625, -0.575958251953125, -0.5347137451171875, -0.49346923828125, -0.4522247314453125, -0.410980224609375, -0.3697357177734375, -0.3284912109375, -0.2872467041015625, -0.246002197265625, -0.2047576904296875, -0.16351318359375, -0.1222686767578125, -0.081024169921875, -0.0397796630859375, 0.00146484375, 0.0427093505859375, 0.083953857421875, 0.1251983642578125, 0.16644287109375, 0.2076873779296875, 0.248931884765625, 0.2901763916015625, 0.3314208984375, 0.3726654052734375, 0.413909912109375, 0.4551544189453125, 0.49639892578125, 0.5376434326171875, 0.578887939453125, 0.6201324462890625, 0.661376953125, 0.7026214599609375, 0.743865966796875, 0.7851104736328125, 0.82635498046875, 0.8675994873046875, 0.908843994140625, 0.9500885009765625, 0.9913330078125, 1.0325775146484375, 1.073822021484375, 1.1150665283203125, 1.15631103515625, 1.1975555419921875, 1.238800048828125, 1.2800445556640625, 1.3212890625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 12.0, 851.0, 153.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09116511791944504, -0.057837069034576416, -0.024509020149707794, 0.008819028735160828, 0.04214707762002945, 0.07547513395547867, 0.1088031753897667, 0.14213120937347412, 0.17545926570892334, 0.20878732204437256, 0.24211536347866058, 0.2754434049129486, 0.3087714612483978, 0.34209951758384705, 0.3754275441169739, 0.4087556004524231, 0.4420836567878723, 0.47541171312332153, 0.5087397694587708, 0.54206782579422, 0.5753958225250244, 0.6087238788604736, 0.6420519351959229, 0.6753799915313721, 0.7087080478668213, 0.7420361042022705, 0.7753641605377197, 0.808692216873169, 0.8420202732086182, 0.8753483295440674, 0.9086763262748718, 0.942004382610321, 0.975332498550415, 1.0086605548858643, 1.0419886112213135, 1.0753166675567627, 1.108644723892212, 1.1419727802276611, 1.1753008365631104, 1.2086288928985596, 1.2419569492340088, 1.275285005569458, 1.3086130619049072, 1.3419411182403564, 1.3752691745758057, 1.4085972309112549, 1.441925287246704, 1.4752533435821533, 1.508581280708313, 1.5419093370437622, 1.5752373933792114, 1.6085654497146606, 1.6418935060501099, 1.675221562385559, 1.7085496187210083, 1.741877555847168, 1.7752056121826172, 1.8085336685180664, 1.8418617248535156, 1.8751897811889648, 1.908517837524414, 1.9418458938598633, 1.9751739501953125, 2.0085020065307617, 2.041830062866211]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 2.0, 1.0, 7.0, 6.0, 5.0, 9.0, 7.0, 18.0, 15.0, 17.0, 28.0, 27.0, 27.0, 32.0, 40.0, 45.0, 53.0, 51.0, 49.0, 49.0, 56.0, 60.0, 35.0, 50.0, 47.0, 45.0, 29.0, 27.0, 30.0, 33.0, 19.0, 16.0, 17.0, 12.0, 12.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.14256954193115234, -0.13848519325256348, -0.13440082967281342, -0.13031648099422455, -0.12623213231563568, -0.12214777618646622, -0.11806342005729675, -0.11397907137870789, -0.10989471524953842, -0.10581035912036896, -0.10172601044178009, -0.09764165431261063, -0.09355729818344116, -0.0894729495048523, -0.08538859337568283, -0.08130423724651337, -0.0772198885679245, -0.07313553243875504, -0.06905118376016617, -0.0649668276309967, -0.06088247522711754, -0.05679812282323837, -0.05271376669406891, -0.04862941429018974, -0.04454506188631058, -0.04046070948243141, -0.036376357078552246, -0.03229200094938278, -0.028207648545503616, -0.02412329614162445, -0.020038941875100136, -0.01595458760857582, -0.011870235204696655, -0.007785881869494915, -0.0037015285342931747, 0.0003828248009085655, 0.004467178136110306, 0.008551530539989471, 0.012635884806513786, 0.0167202390730381, 0.020804591476917267, 0.024888943880796432, 0.028973298147320747, 0.03305765241384506, 0.03714200481772423, 0.041226357221603394, 0.04531071335077286, 0.04939506575465202, 0.05347941815853119, 0.057563770562410355, 0.06164812296628952, 0.06573247909545898, 0.06981682777404785, 0.07390118390321732, 0.07798554003238678, 0.08206988871097565, 0.08615424484014511, 0.09023860096931458, 0.09432294964790344, 0.0984073057770729, 0.10249166190624237, 0.10657601058483124, 0.1106603667140007, 0.11474472284317017, 0.11882907152175903]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 2.0, 4.0, 10.0, 9.0, 9.0, 18.0, 16.0, 11.0, 26.0, 22.0, 39.0, 35.0, 47.0, 43.0, 38.0, 48.0, 43.0, 36.0, 50.0, 50.0, 43.0, 51.0, 45.0, 42.0, 41.0, 58.0, 23.0, 24.0, 17.0, 14.0, 21.0, 14.0, 17.0, 9.0, 8.0, 4.0, 8.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2890625, -4.157470703125, -4.02587890625, -3.894287109375, -3.7626953125, -3.631103515625, -3.49951171875, -3.367919921875, -3.236328125, -3.104736328125, -2.97314453125, -2.841552734375, -2.7099609375, -2.578369140625, -2.44677734375, -2.315185546875, -2.18359375, -2.052001953125, -1.92041015625, -1.788818359375, -1.6572265625, -1.525634765625, -1.39404296875, -1.262451171875, -1.130859375, -0.999267578125, -0.86767578125, -0.736083984375, -0.6044921875, -0.472900390625, -0.34130859375, -0.209716796875, -0.078125, 0.053466796875, 0.18505859375, 0.316650390625, 0.4482421875, 0.579833984375, 0.71142578125, 0.843017578125, 0.974609375, 1.106201171875, 1.23779296875, 1.369384765625, 1.5009765625, 1.632568359375, 1.76416015625, 1.895751953125, 2.02734375, 2.158935546875, 2.29052734375, 2.422119140625, 2.5537109375, 2.685302734375, 2.81689453125, 2.948486328125, 3.080078125, 3.211669921875, 3.34326171875, 3.474853515625, 3.6064453125, 3.738037109375, 3.86962890625, 4.001220703125, 4.1328125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 8.0, 12.0, 10.0, 19.0, 14.0, 30.0, 34.0, 79.0, 83.0, 120.0, 253.0, 619.0, 1935.0, 6222.0, 20610.0, 71315.0, 486641.0, 375151.0, 59352.0, 17950.0, 5237.0, 1683.0, 548.0, 212.0, 126.0, 95.0, 59.0, 37.0, 41.0, 25.0, 10.0, 6.0, 8.0, 9.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6015625, -10.32208251953125, -10.0426025390625, -9.76312255859375, -9.483642578125, -9.20416259765625, -8.9246826171875, -8.64520263671875, -8.36572265625, -8.08624267578125, -7.8067626953125, -7.52728271484375, -7.247802734375, -6.96832275390625, -6.6888427734375, -6.40936279296875, -6.1298828125, -5.85040283203125, -5.5709228515625, -5.29144287109375, -5.011962890625, -4.73248291015625, -4.4530029296875, -4.17352294921875, -3.89404296875, -3.61456298828125, -3.3350830078125, -3.05560302734375, -2.776123046875, -2.49664306640625, -2.2171630859375, -1.93768310546875, -1.658203125, -1.37872314453125, -1.0992431640625, -0.81976318359375, -0.540283203125, -0.26080322265625, 0.0186767578125, 0.29815673828125, 0.57763671875, 0.85711669921875, 1.1365966796875, 1.41607666015625, 1.695556640625, 1.97503662109375, 2.2545166015625, 2.53399658203125, 2.8134765625, 3.09295654296875, 3.3724365234375, 3.65191650390625, 3.931396484375, 4.21087646484375, 4.4903564453125, 4.76983642578125, 5.04931640625, 5.32879638671875, 5.6082763671875, 5.88775634765625, 6.167236328125, 6.44671630859375, 6.7261962890625, 7.00567626953125, 7.28515625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 0.0, 4.0, 4.0, 5.0, 3.0, 3.0, 9.0, 3.0, 10.0, 21.0, 13.0, 23.0, 22.0, 21.0, 29.0, 30.0, 26.0, 49.0, 45.0, 49.0, 68.0, 74.0, 173.0, 1403.0, 334.0, 141.0, 83.0, 68.0, 52.0, 35.0, 36.0, 41.0, 23.0, 19.0, 24.0, 24.0, 18.0, 15.0, 10.0, 8.0, 5.0, 6.0, 3.0, 4.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.0859375, -9.7591552734375, -9.432373046875, -9.1055908203125, -8.77880859375, -8.4520263671875, -8.125244140625, -7.7984619140625, -7.4716796875, -7.1448974609375, -6.818115234375, -6.4913330078125, -6.16455078125, -5.8377685546875, -5.510986328125, -5.1842041015625, -4.857421875, -4.5306396484375, -4.203857421875, -3.8770751953125, -3.55029296875, -3.2235107421875, -2.896728515625, -2.5699462890625, -2.2431640625, -1.9163818359375, -1.589599609375, -1.2628173828125, -0.93603515625, -0.6092529296875, -0.282470703125, 0.0443115234375, 0.37109375, 0.6978759765625, 1.024658203125, 1.3514404296875, 1.67822265625, 2.0050048828125, 2.331787109375, 2.6585693359375, 2.9853515625, 3.3121337890625, 3.638916015625, 3.9656982421875, 4.29248046875, 4.6192626953125, 4.946044921875, 5.2728271484375, 5.599609375, 5.9263916015625, 6.253173828125, 6.5799560546875, 6.90673828125, 7.2335205078125, 7.560302734375, 7.8870849609375, 8.2138671875, 8.5406494140625, 8.867431640625, 9.1942138671875, 9.52099609375, 9.8477783203125, 10.174560546875, 10.5013427734375, 10.828125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 4.0, 5.0, 6.0, 11.0, 7.0, 13.0, 14.0, 14.0, 18.0, 25.0, 41.0, 61.0, 48.0, 71.0, 120.0, 151.0, 232.0, 382.0, 753.0, 2527.0, 14595.0, 181909.0, 2782944.0, 144991.0, 12561.0, 2240.0, 714.0, 341.0, 234.0, 179.0, 106.0, 84.0, 62.0, 47.0, 48.0, 34.0, 19.0, 17.0, 15.0, 7.0, 7.0, 11.0, 3.0, 4.0, 8.0, 6.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-14.984375, -14.5228271484375, -14.061279296875, -13.5997314453125, -13.13818359375, -12.6766357421875, -12.215087890625, -11.7535400390625, -11.2919921875, -10.8304443359375, -10.368896484375, -9.9073486328125, -9.44580078125, -8.9842529296875, -8.522705078125, -8.0611572265625, -7.599609375, -7.1380615234375, -6.676513671875, -6.2149658203125, -5.75341796875, -5.2918701171875, -4.830322265625, -4.3687744140625, -3.9072265625, -3.4456787109375, -2.984130859375, -2.5225830078125, -2.06103515625, -1.5994873046875, -1.137939453125, -0.6763916015625, -0.21484375, 0.2467041015625, 0.708251953125, 1.1697998046875, 1.63134765625, 2.0928955078125, 2.554443359375, 3.0159912109375, 3.4775390625, 3.9390869140625, 4.400634765625, 4.8621826171875, 5.32373046875, 5.7852783203125, 6.246826171875, 6.7083740234375, 7.169921875, 7.6314697265625, 8.093017578125, 8.5545654296875, 9.01611328125, 9.4776611328125, 9.939208984375, 10.4007568359375, 10.8623046875, 11.3238525390625, 11.785400390625, 12.2469482421875, 12.70849609375, 13.1700439453125, 13.631591796875, 14.0931396484375, 14.5546875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 374.0, 631.0, 12.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.249436378479004, -6.529106140136719, -0.8087759017944336, 4.911555290222168, 10.631884574890137, 16.352214813232422, 22.072547912597656, 27.792877197265625, 33.513206481933594, 39.23353576660156, 44.95386505126953, 50.674198150634766, 56.394527435302734, 62.1148567199707, 67.83518981933594, 73.5555191040039, 79.27584838867188, 84.99617767333984, 90.71650695800781, 96.43684387207031, 102.15716552734375, 107.87750244140625, 113.59783172607422, 119.31816101074219, 125.03849029541016, 130.75881958007812, 136.47915649414062, 142.19947814941406, 147.91981506347656, 153.64013671875, 159.3604736328125, 165.080810546875, 170.80111694335938, 176.52145385742188, 182.2417755126953, 187.9621124267578, 193.68243408203125, 199.40277099609375, 205.12310791015625, 210.8434295654297, 216.56375122070312, 222.28408813476562, 228.00440979003906, 233.72474670410156, 239.445068359375, 245.1654052734375, 250.8857421875, 256.6060791015625, 262.326416015625, 268.0467529296875, 273.76708984375, 279.4873962402344, 285.2077331542969, 290.9280700683594, 296.6484069824219, 302.36871337890625, 308.08905029296875, 313.80938720703125, 319.52972412109375, 325.2500305175781, 330.9703674316406, 336.6907043457031, 342.4110412597656, 348.13134765625, 353.8516845703125]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 10.0, 12.0, 11.0, 19.0, 20.0, 22.0, 23.0, 28.0, 25.0, 40.0, 33.0, 46.0, 57.0, 42.0, 48.0, 34.0, 62.0, 53.0, 52.0, 42.0, 43.0, 44.0, 32.0, 30.0, 25.0, 22.0, 25.0, 23.0, 7.0, 14.0, 10.0, 5.0, 11.0, 8.0, 5.0, 10.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.69005012512207, -25.686086654663086, -24.68212127685547, -23.678157806396484, -22.6741943359375, -21.670230865478516, -20.6662654876709, -19.662302017211914, -18.658336639404297, -17.654373168945312, -16.650407791137695, -15.646444320678711, -14.642480850219727, -13.638516426086426, -12.634552001953125, -11.63058853149414, -10.626625061035156, -9.622660636901855, -8.618697166442871, -7.61473274230957, -6.610768795013428, -5.606804847717285, -4.602840423583984, -3.598876476287842, -2.594912528991699, -1.590948462486267, -0.586984395980835, 0.4169797897338867, 1.4209437370300293, 2.424907684326172, 3.4288721084594727, 4.432836055755615, 5.436798095703125, 6.440762042999268, 7.44472599029541, 8.448690414428711, 9.452653884887695, 10.456618309020996, 11.460582733154297, 12.464546203613281, 13.468510627746582, 14.472475051879883, 15.476438522338867, 16.480403900146484, 17.48436737060547, 18.488330841064453, 19.492294311523438, 20.496259689331055, 21.50022315979004, 22.504186630249023, 23.50815200805664, 24.512115478515625, 25.51607894897461, 26.520042419433594, 27.52400779724121, 28.527971267700195, 29.531936645507812, 30.535900115966797, 31.539865493774414, 32.54383087158203, 33.547794342041016, 34.5517578125, 35.555721282958984, 36.55968475341797, 37.56364822387695]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 6.0, 4.0, 6.0, 6.0, 10.0, 16.0, 11.0, 20.0, 19.0, 16.0, 31.0, 31.0, 33.0, 25.0, 30.0, 52.0, 42.0, 49.0, 54.0, 39.0, 48.0, 40.0, 39.0, 40.0, 43.0, 44.0, 38.0, 36.0, 25.0, 27.0, 25.0, 18.0, 12.0, 13.0, 16.0, 10.0, 7.0, 6.0, 10.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.947265625, -3.815643310546875, -3.68402099609375, -3.552398681640625, -3.4207763671875, -3.289154052734375, -3.15753173828125, -3.025909423828125, -2.894287109375, -2.762664794921875, -2.63104248046875, -2.499420166015625, -2.3677978515625, -2.236175537109375, -2.10455322265625, -1.972930908203125, -1.84130859375, -1.709686279296875, -1.57806396484375, -1.446441650390625, -1.3148193359375, -1.183197021484375, -1.05157470703125, -0.919952392578125, -0.788330078125, -0.656707763671875, -0.52508544921875, -0.393463134765625, -0.2618408203125, -0.130218505859375, 0.00140380859375, 0.133026123046875, 0.2646484375, 0.396270751953125, 0.52789306640625, 0.659515380859375, 0.7911376953125, 0.922760009765625, 1.05438232421875, 1.186004638671875, 1.317626953125, 1.449249267578125, 1.58087158203125, 1.712493896484375, 1.8441162109375, 1.975738525390625, 2.10736083984375, 2.238983154296875, 2.37060546875, 2.502227783203125, 2.63385009765625, 2.765472412109375, 2.8970947265625, 3.028717041015625, 3.16033935546875, 3.291961669921875, 3.423583984375, 3.555206298828125, 3.68682861328125, 3.818450927734375, 3.9500732421875, 4.081695556640625, 4.21331787109375, 4.344940185546875, 4.4765625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 4.0, 4.0, 8.0, 11.0, 18.0, 29.0, 61.0, 74.0, 104.0, 213.0, 346.0, 600.0, 1245.0, 2658.0, 6169.0, 15112.0, 40730.0, 116637.0, 344163.0, 932153.0, 1457560.0, 821846.0, 294717.0, 100686.0, 35133.0, 13570.0, 5519.0, 2464.0, 1118.0, 564.0, 316.0, 171.0, 99.0, 65.0, 27.0, 21.0, 20.0, 13.0, 10.0, 3.0, 11.0, 4.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.08984375, -3.959716796875, -3.82958984375, -3.699462890625, -3.5693359375, -3.439208984375, -3.30908203125, -3.178955078125, -3.048828125, -2.918701171875, -2.78857421875, -2.658447265625, -2.5283203125, -2.398193359375, -2.26806640625, -2.137939453125, -2.0078125, -1.877685546875, -1.74755859375, -1.617431640625, -1.4873046875, -1.357177734375, -1.22705078125, -1.096923828125, -0.966796875, -0.836669921875, -0.70654296875, -0.576416015625, -0.4462890625, -0.316162109375, -0.18603515625, -0.055908203125, 0.07421875, 0.204345703125, 0.33447265625, 0.464599609375, 0.5947265625, 0.724853515625, 0.85498046875, 0.985107421875, 1.115234375, 1.245361328125, 1.37548828125, 1.505615234375, 1.6357421875, 1.765869140625, 1.89599609375, 2.026123046875, 2.15625, 2.286376953125, 2.41650390625, 2.546630859375, 2.6767578125, 2.806884765625, 2.93701171875, 3.067138671875, 3.197265625, 3.327392578125, 3.45751953125, 3.587646484375, 3.7177734375, 3.847900390625, 3.97802734375, 4.108154296875, 4.23828125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 8.0, 6.0, 18.0, 18.0, 32.0, 32.0, 55.0, 80.0, 130.0, 148.0, 230.0, 330.0, 387.0, 490.0, 477.0, 390.0, 308.0, 254.0, 199.0, 126.0, 88.0, 62.0, 50.0, 42.0, 32.0, 16.0, 10.0, 12.0, 11.0, 10.0, 6.0, 8.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.95703125, -5.772216796875, -5.58740234375, -5.402587890625, -5.2177734375, -5.032958984375, -4.84814453125, -4.663330078125, -4.478515625, -4.293701171875, -4.10888671875, -3.924072265625, -3.7392578125, -3.554443359375, -3.36962890625, -3.184814453125, -3.0, -2.815185546875, -2.63037109375, -2.445556640625, -2.2607421875, -2.075927734375, -1.89111328125, -1.706298828125, -1.521484375, -1.336669921875, -1.15185546875, -0.967041015625, -0.7822265625, -0.597412109375, -0.41259765625, -0.227783203125, -0.04296875, 0.141845703125, 0.32666015625, 0.511474609375, 0.6962890625, 0.881103515625, 1.06591796875, 1.250732421875, 1.435546875, 1.620361328125, 1.80517578125, 1.989990234375, 2.1748046875, 2.359619140625, 2.54443359375, 2.729248046875, 2.9140625, 3.098876953125, 3.28369140625, 3.468505859375, 3.6533203125, 3.838134765625, 4.02294921875, 4.207763671875, 4.392578125, 4.577392578125, 4.76220703125, 4.947021484375, 5.1318359375, 5.316650390625, 5.50146484375, 5.686279296875, 5.87109375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 12.0, 18.0, 26.0, 44.0, 64.0, 110.0, 173.0, 386.0, 784.0, 3248.0, 105535.0, 3845702.0, 231464.0, 4783.0, 991.0, 415.0, 232.0, 110.0, 66.0, 41.0, 20.0, 15.0, 8.0, 7.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.578125, -28.830810546875, -28.08349609375, -27.336181640625, -26.5888671875, -25.841552734375, -25.09423828125, -24.346923828125, -23.599609375, -22.852294921875, -22.10498046875, -21.357666015625, -20.6103515625, -19.863037109375, -19.11572265625, -18.368408203125, -17.62109375, -16.873779296875, -16.12646484375, -15.379150390625, -14.6318359375, -13.884521484375, -13.13720703125, -12.389892578125, -11.642578125, -10.895263671875, -10.14794921875, -9.400634765625, -8.6533203125, -7.906005859375, -7.15869140625, -6.411376953125, -5.6640625, -4.916748046875, -4.16943359375, -3.422119140625, -2.6748046875, -1.927490234375, -1.18017578125, -0.432861328125, 0.314453125, 1.061767578125, 1.80908203125, 2.556396484375, 3.3037109375, 4.051025390625, 4.79833984375, 5.545654296875, 6.29296875, 7.040283203125, 7.78759765625, 8.534912109375, 9.2822265625, 10.029541015625, 10.77685546875, 11.524169921875, 12.271484375, 13.018798828125, 13.76611328125, 14.513427734375, 15.2607421875, 16.008056640625, 16.75537109375, 17.502685546875, 18.25]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 569.0, 439.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-268.3351745605469, -259.057861328125, -249.78054809570312, -240.50323486328125, -231.22592163085938, -221.9486083984375, -212.6713104248047, -203.3939971923828, -194.11668395996094, -184.83937072753906, -175.5620574951172, -166.2847442626953, -157.0074462890625, -147.73013305664062, -138.45281982421875, -129.17550659179688, -119.898193359375, -110.62088012695312, -101.34356689453125, -92.0662612915039, -82.78894805908203, -73.51163482666016, -64.23432922363281, -54.95701599121094, -45.67970275878906, -36.40238952636719, -27.125080108642578, -17.847768783569336, -8.570457458496094, 0.7068557739257812, 9.98416519165039, 19.261474609375, 28.538818359375, 37.816131591796875, 47.093441009521484, 56.370750427246094, 65.64806365966797, 74.92537689208984, 84.20268249511719, 93.47999572753906, 102.75730895996094, 112.03462219238281, 121.31193542480469, 130.58924865722656, 139.86654663085938, 149.14385986328125, 158.42117309570312, 167.698486328125, 176.97579956054688, 186.25311279296875, 195.53042602539062, 204.8077392578125, 214.08505249023438, 223.36236572265625, 232.63966369628906, 241.91697692871094, 251.1942901611328, 260.4715881347656, 269.7489013671875, 279.0262145996094, 288.30352783203125, 297.5808410644531, 306.858154296875, 316.1354675292969, 325.41278076171875]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 11.0, 12.0, 8.0, 18.0, 15.0, 19.0, 19.0, 27.0, 40.0, 32.0, 41.0, 51.0, 53.0, 50.0, 45.0, 41.0, 56.0, 55.0, 53.0, 48.0, 59.0, 36.0, 48.0, 25.0, 27.0, 16.0, 13.0, 15.0, 18.0, 7.0, 17.0, 7.0, 3.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-27.222604751586914, -26.49002456665039, -25.757444381713867, -25.024864196777344, -24.29228401184082, -23.559703826904297, -22.827123641967773, -22.09454345703125, -21.361963272094727, -20.629383087158203, -19.89680290222168, -19.164222717285156, -18.431642532348633, -17.69906234741211, -16.966482162475586, -16.233901977539062, -15.501321792602539, -14.768741607666016, -14.036161422729492, -13.303581237792969, -12.571001052856445, -11.838420867919922, -11.105840682983398, -10.373260498046875, -9.640680313110352, -8.908100128173828, -8.175519943237305, -7.442939758300781, -6.710359573364258, -5.977779388427734, -5.245199203491211, -4.5126190185546875, -3.7800369262695312, -3.047456741333008, -2.3148765563964844, -1.582296371459961, -0.8497161865234375, -0.11713600158691406, 0.6154441833496094, 1.3480243682861328, 2.0806045532226562, 2.8131847381591797, 3.545764923095703, 4.278345108032227, 5.01092529296875, 5.743505477905273, 6.476085662841797, 7.20866584777832, 7.941246032714844, 8.673826217651367, 9.40640640258789, 10.138986587524414, 10.871566772460938, 11.604146957397461, 12.336727142333984, 13.069307327270508, 13.801887512207031, 14.534467697143555, 15.267047882080078, 15.999628067016602, 16.732208251953125, 17.46478843688965, 18.197368621826172, 18.929948806762695, 19.66252899169922]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 12.0, 10.0, 11.0, 11.0, 15.0, 17.0, 23.0, 22.0, 21.0, 33.0, 24.0, 32.0, 42.0, 40.0, 41.0, 43.0, 45.0, 40.0, 29.0, 43.0, 46.0, 38.0, 51.0, 30.0, 38.0, 33.0, 36.0, 24.0, 28.0, 25.0, 20.0, 16.0, 14.0, 8.0, 7.0, 5.0, 6.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.640625, -3.52044677734375, -3.4002685546875, -3.28009033203125, -3.159912109375, -3.03973388671875, -2.9195556640625, -2.79937744140625, -2.67919921875, -2.55902099609375, -2.4388427734375, -2.31866455078125, -2.198486328125, -2.07830810546875, -1.9581298828125, -1.83795166015625, -1.7177734375, -1.59759521484375, -1.4774169921875, -1.35723876953125, -1.237060546875, -1.11688232421875, -0.9967041015625, -0.87652587890625, -0.75634765625, -0.63616943359375, -0.5159912109375, -0.39581298828125, -0.275634765625, -0.15545654296875, -0.0352783203125, 0.08489990234375, 0.205078125, 0.32525634765625, 0.4454345703125, 0.56561279296875, 0.685791015625, 0.80596923828125, 0.9261474609375, 1.04632568359375, 1.16650390625, 1.28668212890625, 1.4068603515625, 1.52703857421875, 1.647216796875, 1.76739501953125, 1.8875732421875, 2.00775146484375, 2.1279296875, 2.24810791015625, 2.3682861328125, 2.48846435546875, 2.608642578125, 2.72882080078125, 2.8489990234375, 2.96917724609375, 3.08935546875, 3.20953369140625, 3.3297119140625, 3.44989013671875, 3.570068359375, 3.69024658203125, 3.8104248046875, 3.93060302734375, 4.05078125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 18.0, 22.0, 40.0, 79.0, 107.0, 166.0, 298.0, 464.0, 741.0, 1206.0, 1862.0, 3157.0, 5020.0, 7752.0, 12051.0, 18325.0, 27606.0, 39984.0, 56287.0, 76152.0, 97267.0, 114664.0, 122053.0, 114595.0, 96771.0, 76398.0, 56454.0, 39932.0, 27472.0, 18459.0, 11901.0, 7899.0, 4953.0, 3175.0, 1988.0, 1280.0, 768.0, 453.0, 290.0, 168.0, 108.0, 64.0, 42.0, 23.0, 11.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.48193359375, -0.4675483703613281, -0.45316314697265625, -0.4387779235839844, -0.4243927001953125, -0.4100074768066406, -0.39562225341796875, -0.3812370300292969, -0.366851806640625, -0.3524665832519531, -0.33808135986328125, -0.3236961364746094, -0.3093109130859375, -0.2949256896972656, -0.28054046630859375, -0.2661552429199219, -0.25177001953125, -0.23738479614257812, -0.22299957275390625, -0.20861434936523438, -0.1942291259765625, -0.17984390258789062, -0.16545867919921875, -0.15107345581054688, -0.136688232421875, -0.12230300903320312, -0.10791778564453125, -0.09353256225585938, -0.0791473388671875, -0.06476211547851562, -0.05037689208984375, -0.035991668701171875, -0.0216064453125, -0.007221221923828125, 0.00716400146484375, 0.021549224853515625, 0.0359344482421875, 0.050319671630859375, 0.06470489501953125, 0.07909011840820312, 0.093475341796875, 0.10786056518554688, 0.12224578857421875, 0.13663101196289062, 0.1510162353515625, 0.16540145874023438, 0.17978668212890625, 0.19417190551757812, 0.20855712890625, 0.22294235229492188, 0.23732757568359375, 0.2517127990722656, 0.2660980224609375, 0.2804832458496094, 0.29486846923828125, 0.3092536926269531, 0.323638916015625, 0.3380241394042969, 0.35240936279296875, 0.3667945861816406, 0.3811798095703125, 0.3955650329589844, 0.40995025634765625, 0.4243354797363281, 0.438720703125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 4.0, 2.0, 7.0, 9.0, 7.0, 9.0, 15.0, 11.0, 20.0, 11.0, 26.0, 15.0, 30.0, 23.0, 34.0, 29.0, 36.0, 43.0, 38.0, 40.0, 38.0, 48.0, 1079.0, 43.0, 43.0, 33.0, 27.0, 31.0, 25.0, 34.0, 32.0, 31.0, 21.0, 23.0, 22.0, 18.0, 11.0, 9.0, 10.0, 8.0, 10.0, 6.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.58203125, -2.493499755859375, -2.40496826171875, -2.316436767578125, -2.2279052734375, -2.139373779296875, -2.05084228515625, -1.962310791015625, -1.873779296875, -1.785247802734375, -1.69671630859375, -1.608184814453125, -1.5196533203125, -1.431121826171875, -1.34259033203125, -1.254058837890625, -1.16552734375, -1.076995849609375, -0.98846435546875, -0.899932861328125, -0.8114013671875, -0.722869873046875, -0.63433837890625, -0.545806884765625, -0.457275390625, -0.368743896484375, -0.28021240234375, -0.191680908203125, -0.1031494140625, -0.014617919921875, 0.07391357421875, 0.162445068359375, 0.2509765625, 0.339508056640625, 0.42803955078125, 0.516571044921875, 0.6051025390625, 0.693634033203125, 0.78216552734375, 0.870697021484375, 0.959228515625, 1.047760009765625, 1.13629150390625, 1.224822998046875, 1.3133544921875, 1.401885986328125, 1.49041748046875, 1.578948974609375, 1.66748046875, 1.756011962890625, 1.84454345703125, 1.933074951171875, 2.0216064453125, 2.110137939453125, 2.19866943359375, 2.287200927734375, 2.375732421875, 2.464263916015625, 2.55279541015625, 2.641326904296875, 2.7298583984375, 2.818389892578125, 2.90692138671875, 2.995452880859375, 3.083984375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 8.0, 8.0, 15.0, 21.0, 25.0, 50.0, 42.0, 89.0, 139.0, 198.0, 267.0, 405.0, 608.0, 878.0, 1327.0, 1932.0, 2985.0, 4387.0, 6586.0, 9309.0, 14329.0, 22190.0, 43240.0, 1558736.0, 334857.0, 34510.0, 20101.0, 13158.0, 8702.0, 5763.0, 3870.0, 2749.0, 1773.0, 1247.0, 813.0, 601.0, 416.0, 249.0, 189.0, 128.0, 84.0, 59.0, 33.0, 23.0, 14.0, 3.0, 11.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88818359375, -0.8594284057617188, -0.8306732177734375, -0.8019180297851562, -0.773162841796875, -0.7444076538085938, -0.7156524658203125, -0.6868972778320312, -0.65814208984375, -0.6293869018554688, -0.6006317138671875, -0.5718765258789062, -0.543121337890625, -0.5143661499023438, -0.4856109619140625, -0.45685577392578125, -0.4281005859375, -0.39934539794921875, -0.3705902099609375, -0.34183502197265625, -0.313079833984375, -0.28432464599609375, -0.2555694580078125, -0.22681427001953125, -0.19805908203125, -0.16930389404296875, -0.1405487060546875, -0.11179351806640625, -0.083038330078125, -0.05428314208984375, -0.0255279541015625, 0.00322723388671875, 0.031982421875, 0.06073760986328125, 0.0894927978515625, 0.11824798583984375, 0.147003173828125, 0.17575836181640625, 0.2045135498046875, 0.23326873779296875, 0.26202392578125, 0.29077911376953125, 0.3195343017578125, 0.34828948974609375, 0.377044677734375, 0.40579986572265625, 0.4345550537109375, 0.46331024169921875, 0.4920654296875, 0.5208206176757812, 0.5495758056640625, 0.5783309936523438, 0.607086181640625, 0.6358413696289062, 0.6645965576171875, 0.6933517456054688, 0.72210693359375, 0.7508621215820312, 0.7796173095703125, 0.8083724975585938, 0.837127685546875, 0.8658828735351562, 0.8946380615234375, 0.9233932495117188, 0.9521484375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 8.0, 3.0, 8.0, 5.0, 7.0, 12.0, 11.0, 15.0, 11.0, 27.0, 21.0, 28.0, 41.0, 40.0, 43.0, 39.0, 57.0, 54.0, 54.0, 64.0, 56.0, 55.0, 48.0, 45.0, 42.0, 39.0, 21.0, 28.0, 22.0, 16.0, 16.0, 12.0, 16.0, 9.0, 9.0, 4.0, 3.0, 4.0, 0.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049957275390625, -0.048249244689941406, -0.04654121398925781, -0.04483318328857422, -0.043125152587890625, -0.04141712188720703, -0.03970909118652344, -0.038001060485839844, -0.03629302978515625, -0.034584999084472656, -0.03287696838378906, -0.03116893768310547, -0.029460906982421875, -0.02775287628173828, -0.026044845581054688, -0.024336814880371094, -0.0226287841796875, -0.020920753479003906, -0.019212722778320312, -0.01750469207763672, -0.015796661376953125, -0.014088630676269531, -0.012380599975585938, -0.010672569274902344, -0.00896453857421875, -0.007256507873535156, -0.0055484771728515625, -0.0038404464721679688, -0.002132415771484375, -0.00042438507080078125, 0.0012836456298828125, 0.0029916763305664062, 0.00469970703125, 0.006407737731933594, 0.008115768432617188, 0.009823799133300781, 0.011531829833984375, 0.013239860534667969, 0.014947891235351562, 0.016655921936035156, 0.01836395263671875, 0.020071983337402344, 0.021780014038085938, 0.02348804473876953, 0.025196075439453125, 0.02690410614013672, 0.028612136840820312, 0.030320167541503906, 0.0320281982421875, 0.033736228942871094, 0.03544425964355469, 0.03715229034423828, 0.038860321044921875, 0.04056835174560547, 0.04227638244628906, 0.043984413146972656, 0.04569244384765625, 0.047400474548339844, 0.04910850524902344, 0.05081653594970703, 0.052524566650390625, 0.05423259735107422, 0.05594062805175781, 0.057648658752441406, 0.059356689453125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 3.0, 7.0, 3.0, 9.0, 11.0, 17.0, 14.0, 17.0, 27.0, 27.0, 29.0, 46.0, 79.0, 106.0, 131.0, 220.0, 466.0, 1408.0, 913746.0, 130198.0, 879.0, 396.0, 210.0, 118.0, 92.0, 65.0, 42.0, 38.0, 36.0, 19.0, 16.0, 16.0, 9.0, 11.0, 6.0, 8.0, 7.0, 6.0, 5.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.2666015625, -1.2302703857421875, -1.193939208984375, -1.1576080322265625, -1.12127685546875, -1.0849456787109375, -1.048614501953125, -1.0122833251953125, -0.9759521484375, -0.9396209716796875, -0.903289794921875, -0.8669586181640625, -0.83062744140625, -0.7942962646484375, -0.757965087890625, -0.7216339111328125, -0.685302734375, -0.6489715576171875, -0.612640380859375, -0.5763092041015625, -0.53997802734375, -0.5036468505859375, -0.467315673828125, -0.4309844970703125, -0.3946533203125, -0.3583221435546875, -0.321990966796875, -0.2856597900390625, -0.24932861328125, -0.2129974365234375, -0.176666259765625, -0.1403350830078125, -0.10400390625, -0.0676727294921875, -0.031341552734375, 0.0049896240234375, 0.04132080078125, 0.0776519775390625, 0.113983154296875, 0.1503143310546875, 0.1866455078125, 0.2229766845703125, 0.259307861328125, 0.2956390380859375, 0.33197021484375, 0.3683013916015625, 0.404632568359375, 0.4409637451171875, 0.477294921875, 0.5136260986328125, 0.549957275390625, 0.5862884521484375, 0.62261962890625, 0.6589508056640625, 0.695281982421875, 0.7316131591796875, 0.7679443359375, 0.8042755126953125, 0.840606689453125, 0.8769378662109375, 0.91326904296875, 0.9496002197265625, 0.985931396484375, 1.0222625732421875, 1.05859375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 298.0, 683.0, 33.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08759688585996628, -0.07340381294488907, -0.059210747480392456, -0.04501767456531525, -0.030824605375528336, -0.016631536185741425, -0.002438463270664215, 0.011754602193832397, 0.025947675108909607, 0.04014074429869652, 0.05433381348848343, 0.06852688640356064, 0.08271995186805725, 0.09691302478313446, 0.11110609769821167, 0.12529915571212769, 0.1394922435283661, 0.1536853164434433, 0.1678783893585205, 0.18207144737243652, 0.19626452028751373, 0.21045759320259094, 0.22465066611766815, 0.23884373903274536, 0.2530367970466614, 0.2672298550605774, 0.2814229428768158, 0.2956160008907318, 0.3098090887069702, 0.32400214672088623, 0.33819520473480225, 0.35238829255104065, 0.36658135056495667, 0.3807744085788727, 0.3949674963951111, 0.4091605544090271, 0.4233536422252655, 0.4375467002391815, 0.4517397880554199, 0.46593284606933594, 0.48012590408325195, 0.49431896209716797, 0.508512020111084, 0.5227051377296448, 0.5368981957435608, 0.5510912537574768, 0.5652843117713928, 0.5794773697853088, 0.5936704874038696, 0.6078635454177856, 0.6220566034317017, 0.6362497210502625, 0.6504427790641785, 0.6646358370780945, 0.6788288950920105, 0.6930219531059265, 0.7072150111198425, 0.7214080691337585, 0.7356011271476746, 0.7497942447662354, 0.7639873027801514, 0.7781803607940674, 0.7923734188079834, 0.8065664768218994, 0.8207595944404602]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 2.0, 4.0, 3.0, 11.0, 10.0, 6.0, 11.0, 10.0, 19.0, 18.0, 16.0, 22.0, 25.0, 26.0, 29.0, 27.0, 25.0, 35.0, 25.0, 33.0, 33.0, 42.0, 33.0, 39.0, 37.0, 31.0, 32.0, 31.0, 32.0, 31.0, 37.0, 25.0, 29.0, 21.0, 25.0, 23.0, 21.0, 12.0, 13.0, 20.0, 15.0, 18.0, 8.0, 13.0, 6.0, 3.0, 5.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.04950571060180664, -0.047937165945768356, -0.04636862128973007, -0.044800080358982086, -0.0432315357029438, -0.04166299104690552, -0.04009445011615753, -0.03852590546011925, -0.03695736080408096, -0.03538881614804268, -0.033820271492004395, -0.03225173056125641, -0.030683185905218124, -0.02911464124917984, -0.027546098455786705, -0.02597755566239357, -0.024409011006355286, -0.022840466350317, -0.021271923556923866, -0.01970338076353073, -0.018134836107492447, -0.016566291451454163, -0.014997748658061028, -0.013429204933345318, -0.011860661208629608, -0.010292117483913898, -0.008723573759198189, -0.007155030034482479, -0.005586486309766769, -0.00401794258505106, -0.00244939886033535, -0.0008808551356196404, 0.0006876885890960693, 0.002256232313811779, 0.0038247760385274887, 0.005393319763243198, 0.006961863487958908, 0.008530407212674618, 0.010098950937390327, 0.011667494662106037, 0.013236038386821747, 0.014804582111537457, 0.016373125836253166, 0.0179416686296463, 0.019510213285684586, 0.02107875794172287, 0.022647300735116005, 0.02421584352850914, 0.025784388184547424, 0.02735293284058571, 0.028921475633978844, 0.03049001842737198, 0.03205856308341026, 0.03362710773944855, 0.03519564867019653, 0.03676419332623482, 0.0383327379822731, 0.039901282638311386, 0.04146982729434967, 0.043038368225097656, 0.04460691288113594, 0.046175457537174225, 0.04774399846792221, 0.049312543123960495, 0.05088108777999878]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 8.0, 11.0, 10.0, 16.0, 18.0, 14.0, 22.0, 22.0, 25.0, 31.0, 37.0, 34.0, 37.0, 33.0, 34.0, 40.0, 33.0, 45.0, 42.0, 53.0, 53.0, 28.0, 34.0, 49.0, 45.0, 32.0, 22.0, 19.0, 34.0, 28.0, 15.0, 10.0, 13.0, 12.0, 12.0, 6.0, 8.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.75, -3.629241943359375, -3.50848388671875, -3.387725830078125, -3.2669677734375, -3.146209716796875, -3.02545166015625, -2.904693603515625, -2.783935546875, -2.663177490234375, -2.54241943359375, -2.421661376953125, -2.3009033203125, -2.180145263671875, -2.05938720703125, -1.938629150390625, -1.81787109375, -1.697113037109375, -1.57635498046875, -1.455596923828125, -1.3348388671875, -1.214080810546875, -1.09332275390625, -0.972564697265625, -0.851806640625, -0.731048583984375, -0.61029052734375, -0.489532470703125, -0.3687744140625, -0.248016357421875, -0.12725830078125, -0.006500244140625, 0.1142578125, 0.235015869140625, 0.35577392578125, 0.476531982421875, 0.5972900390625, 0.718048095703125, 0.83880615234375, 0.959564208984375, 1.080322265625, 1.201080322265625, 1.32183837890625, 1.442596435546875, 1.5633544921875, 1.684112548828125, 1.80487060546875, 1.925628662109375, 2.04638671875, 2.167144775390625, 2.28790283203125, 2.408660888671875, 2.5294189453125, 2.650177001953125, 2.77093505859375, 2.891693115234375, 3.012451171875, 3.133209228515625, 3.25396728515625, 3.374725341796875, 3.4954833984375, 3.616241455078125, 3.73699951171875, 3.857757568359375, 3.978515625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 9.0, 8.0, 17.0, 39.0, 46.0, 66.0, 93.0, 142.0, 212.0, 351.0, 539.0, 808.0, 1387.0, 2238.0, 3689.0, 6136.0, 10225.0, 17378.0, 28829.0, 48171.0, 83315.0, 153114.0, 236093.0, 195374.0, 108138.0, 60936.0, 36224.0, 21953.0, 13125.0, 7849.0, 4689.0, 2826.0, 1717.0, 1035.0, 625.0, 403.0, 259.0, 172.0, 110.0, 67.0, 45.0, 30.0, 22.0, 14.0, 14.0, 10.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.673828125, -3.568023681640625, -3.46221923828125, -3.356414794921875, -3.2506103515625, -3.144805908203125, -3.03900146484375, -2.933197021484375, -2.827392578125, -2.721588134765625, -2.61578369140625, -2.509979248046875, -2.4041748046875, -2.298370361328125, -2.19256591796875, -2.086761474609375, -1.98095703125, -1.875152587890625, -1.76934814453125, -1.663543701171875, -1.5577392578125, -1.451934814453125, -1.34613037109375, -1.240325927734375, -1.134521484375, -1.028717041015625, -0.92291259765625, -0.817108154296875, -0.7113037109375, -0.605499267578125, -0.49969482421875, -0.393890380859375, -0.2880859375, -0.182281494140625, -0.07647705078125, 0.029327392578125, 0.1351318359375, 0.240936279296875, 0.34674072265625, 0.452545166015625, 0.558349609375, 0.664154052734375, 0.76995849609375, 0.875762939453125, 0.9815673828125, 1.087371826171875, 1.19317626953125, 1.298980712890625, 1.40478515625, 1.510589599609375, 1.61639404296875, 1.722198486328125, 1.8280029296875, 1.933807373046875, 2.03961181640625, 2.145416259765625, 2.251220703125, 2.357025146484375, 2.46282958984375, 2.568634033203125, 2.6744384765625, 2.780242919921875, 2.88604736328125, 2.991851806640625, 3.09765625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 1.0, 2.0, 6.0, 5.0, 7.0, 11.0, 11.0, 8.0, 21.0, 14.0, 17.0, 21.0, 27.0, 26.0, 47.0, 37.0, 34.0, 63.0, 44.0, 73.0, 119.0, 192.0, 1326.0, 263.0, 147.0, 89.0, 58.0, 62.0, 54.0, 30.0, 38.0, 31.0, 24.0, 19.0, 16.0, 20.0, 15.0, 13.0, 10.0, 5.0, 14.0, 11.0, 8.0, 3.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.125, -9.824462890625, -9.52392578125, -9.223388671875, -8.9228515625, -8.622314453125, -8.32177734375, -8.021240234375, -7.720703125, -7.420166015625, -7.11962890625, -6.819091796875, -6.5185546875, -6.218017578125, -5.91748046875, -5.616943359375, -5.31640625, -5.015869140625, -4.71533203125, -4.414794921875, -4.1142578125, -3.813720703125, -3.51318359375, -3.212646484375, -2.912109375, -2.611572265625, -2.31103515625, -2.010498046875, -1.7099609375, -1.409423828125, -1.10888671875, -0.808349609375, -0.5078125, -0.207275390625, 0.09326171875, 0.393798828125, 0.6943359375, 0.994873046875, 1.29541015625, 1.595947265625, 1.896484375, 2.197021484375, 2.49755859375, 2.798095703125, 3.0986328125, 3.399169921875, 3.69970703125, 4.000244140625, 4.30078125, 4.601318359375, 4.90185546875, 5.202392578125, 5.5029296875, 5.803466796875, 6.10400390625, 6.404541015625, 6.705078125, 7.005615234375, 7.30615234375, 7.606689453125, 7.9072265625, 8.207763671875, 8.50830078125, 8.808837890625, 9.109375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 6.0, 4.0, 7.0, 6.0, 13.0, 20.0, 30.0, 50.0, 58.0, 98.0, 130.0, 174.0, 217.0, 339.0, 632.0, 1789.0, 9583.0, 81051.0, 1587212.0, 1378900.0, 72965.0, 8863.0, 1787.0, 650.0, 350.0, 230.0, 150.0, 115.0, 62.0, 55.0, 48.0, 26.0, 24.0, 14.0, 9.0, 16.0, 6.0, 4.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-14.3359375, -13.9681396484375, -13.600341796875, -13.2325439453125, -12.86474609375, -12.4969482421875, -12.129150390625, -11.7613525390625, -11.3935546875, -11.0257568359375, -10.657958984375, -10.2901611328125, -9.92236328125, -9.5545654296875, -9.186767578125, -8.8189697265625, -8.451171875, -8.0833740234375, -7.715576171875, -7.3477783203125, -6.97998046875, -6.6121826171875, -6.244384765625, -5.8765869140625, -5.5087890625, -5.1409912109375, -4.773193359375, -4.4053955078125, -4.03759765625, -3.6697998046875, -3.302001953125, -2.9342041015625, -2.56640625, -2.1986083984375, -1.830810546875, -1.4630126953125, -1.09521484375, -0.7274169921875, -0.359619140625, 0.0081787109375, 0.3759765625, 0.7437744140625, 1.111572265625, 1.4793701171875, 1.84716796875, 2.2149658203125, 2.582763671875, 2.9505615234375, 3.318359375, 3.6861572265625, 4.053955078125, 4.4217529296875, 4.78955078125, 5.1573486328125, 5.525146484375, 5.8929443359375, 6.2607421875, 6.6285400390625, 6.996337890625, 7.3641357421875, 7.73193359375, 8.0997314453125, 8.467529296875, 8.8353271484375, 9.203125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 188.0, 817.0, 11.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-153.61669921875, -146.72955322265625, -139.84242248535156, -132.95529174804688, -126.06814575195312, -119.1810073852539, -112.29386901855469, -105.40673065185547, -98.51959228515625, -91.63245391845703, -84.74531555175781, -77.8581771850586, -70.97103881835938, -64.08390045166016, -57.19676208496094, -50.30962371826172, -43.4224853515625, -36.53534698486328, -29.648208618164062, -22.761070251464844, -15.873931884765625, -8.986793518066406, -2.0996551513671875, 4.787483215332031, 11.67462158203125, 18.56175994873047, 25.448898315429688, 32.336036682128906, 39.223175048828125, 46.110313415527344, 52.99745178222656, 59.88459014892578, 66.771728515625, 73.65886688232422, 80.54600524902344, 87.43314361572266, 94.32028198242188, 101.2074203491211, 108.09455871582031, 114.98169708251953, 121.86883544921875, 128.7559814453125, 135.6431121826172, 142.53024291992188, 149.41738891601562, 156.30453491210938, 163.19166564941406, 170.07879638671875, 176.9659423828125, 183.85308837890625, 190.74021911621094, 197.62734985351562, 204.51449584960938, 211.40164184570312, 218.2887725830078, 225.1759033203125, 232.06304931640625, 238.9501953125, 245.8373260498047, 252.72445678710938, 259.6116027832031, 266.4987487792969, 273.3858642578125, 280.27301025390625, 287.16015625]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 5.0, 11.0, 7.0, 16.0, 9.0, 20.0, 28.0, 30.0, 29.0, 47.0, 47.0, 49.0, 48.0, 40.0, 67.0, 58.0, 51.0, 55.0, 52.0, 58.0, 38.0, 44.0, 42.0, 33.0, 29.0, 18.0, 15.0, 15.0, 13.0, 13.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.56748580932617, -37.49684143066406, -36.42619323730469, -35.35554885864258, -34.2849006652832, -33.214256286621094, -32.14360809326172, -31.07296371459961, -30.0023193359375, -28.931673049926758, -27.861026763916016, -26.790382385253906, -25.719736099243164, -24.649089813232422, -23.57844352722168, -22.507797241210938, -21.437150955200195, -20.366504669189453, -19.29585838317871, -18.22521209716797, -17.15456771850586, -16.083921432495117, -15.013275146484375, -13.942628860473633, -12.871983528137207, -11.801337242126465, -10.730691909790039, -9.660045623779297, -8.589399337768555, -7.518754005432129, -6.448107719421387, -5.377461910247803, -4.306814193725586, -3.236168384552002, -2.165522336959839, -1.0948762893676758, -0.024230480194091797, 1.0464153289794922, 2.1170616149902344, 3.1877074241638184, 4.258353233337402, 5.328999042510986, 6.39964485168457, 7.4702911376953125, 8.540937423706055, 9.61158275604248, 10.682229042053223, 11.752874374389648, 12.82352066040039, 13.894166946411133, 14.964812278747559, 16.035457611083984, 17.106103897094727, 18.17675018310547, 19.24739646911621, 20.318042755126953, 21.388687133789062, 22.459333419799805, 23.529979705810547, 24.600624084472656, 25.6712703704834, 26.74191665649414, 27.812562942504883, 28.883209228515625, 29.953855514526367]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 2.0, 3.0, 11.0, 5.0, 13.0, 9.0, 15.0, 18.0, 29.0, 14.0, 28.0, 27.0, 32.0, 33.0, 38.0, 34.0, 38.0, 47.0, 38.0, 56.0, 44.0, 50.0, 34.0, 45.0, 41.0, 44.0, 50.0, 24.0, 33.0, 30.0, 23.0, 22.0, 17.0, 12.0, 7.0, 12.0, 6.0, 7.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.93890380859375, -3.8074951171875, -3.67608642578125, -3.544677734375, -3.41326904296875, -3.2818603515625, -3.15045166015625, -3.01904296875, -2.88763427734375, -2.7562255859375, -2.62481689453125, -2.493408203125, -2.36199951171875, -2.2305908203125, -2.09918212890625, -1.9677734375, -1.83636474609375, -1.7049560546875, -1.57354736328125, -1.442138671875, -1.31072998046875, -1.1793212890625, -1.04791259765625, -0.91650390625, -0.78509521484375, -0.6536865234375, -0.52227783203125, -0.390869140625, -0.25946044921875, -0.1280517578125, 0.00335693359375, 0.134765625, 0.26617431640625, 0.3975830078125, 0.52899169921875, 0.660400390625, 0.79180908203125, 0.9232177734375, 1.05462646484375, 1.18603515625, 1.31744384765625, 1.4488525390625, 1.58026123046875, 1.711669921875, 1.84307861328125, 1.9744873046875, 2.10589599609375, 2.2373046875, 2.36871337890625, 2.5001220703125, 2.63153076171875, 2.762939453125, 2.89434814453125, 3.0257568359375, 3.15716552734375, 3.28857421875, 3.41998291015625, 3.5513916015625, 3.68280029296875, 3.814208984375, 3.94561767578125, 4.0770263671875, 4.20843505859375, 4.33984375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 1.0, 2.0, 7.0, 2.0, 8.0, 12.0, 7.0, 9.0, 9.0, 16.0, 17.0, 10.0, 24.0, 30.0, 28.0, 41.0, 52.0, 53.0, 66.0, 96.0, 186.0, 413.0, 1616.0, 11763.0, 241679.0, 3258975.0, 649900.0, 25412.0, 2508.0, 608.0, 191.0, 110.0, 81.0, 73.0, 55.0, 32.0, 33.0, 24.0, 19.0, 19.0, 17.0, 19.0, 12.0, 14.0, 9.0, 5.0, 5.0, 8.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-11.7265625, -11.317138671875, -10.90771484375, -10.498291015625, -10.0888671875, -9.679443359375, -9.27001953125, -8.860595703125, -8.451171875, -8.041748046875, -7.63232421875, -7.222900390625, -6.8134765625, -6.404052734375, -5.99462890625, -5.585205078125, -5.17578125, -4.766357421875, -4.35693359375, -3.947509765625, -3.5380859375, -3.128662109375, -2.71923828125, -2.309814453125, -1.900390625, -1.490966796875, -1.08154296875, -0.672119140625, -0.2626953125, 0.146728515625, 0.55615234375, 0.965576171875, 1.375, 1.784423828125, 2.19384765625, 2.603271484375, 3.0126953125, 3.422119140625, 3.83154296875, 4.240966796875, 4.650390625, 5.059814453125, 5.46923828125, 5.878662109375, 6.2880859375, 6.697509765625, 7.10693359375, 7.516357421875, 7.92578125, 8.335205078125, 8.74462890625, 9.154052734375, 9.5634765625, 9.972900390625, 10.38232421875, 10.791748046875, 11.201171875, 11.610595703125, 12.02001953125, 12.429443359375, 12.8388671875, 13.248291015625, 13.65771484375, 14.067138671875, 14.4765625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 4.0, 3.0, 8.0, 6.0, 7.0, 16.0, 25.0, 20.0, 41.0, 62.0, 65.0, 117.0, 165.0, 234.0, 354.0, 448.0, 544.0, 474.0, 387.0, 330.0, 221.0, 157.0, 101.0, 84.0, 47.0, 46.0, 26.0, 19.0, 16.0, 12.0, 13.0, 7.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.984375, -4.80572509765625, -4.6270751953125, -4.44842529296875, -4.269775390625, -4.09112548828125, -3.9124755859375, -3.73382568359375, -3.55517578125, -3.37652587890625, -3.1978759765625, -3.01922607421875, -2.840576171875, -2.66192626953125, -2.4832763671875, -2.30462646484375, -2.1259765625, -1.94732666015625, -1.7686767578125, -1.59002685546875, -1.411376953125, -1.23272705078125, -1.0540771484375, -0.87542724609375, -0.69677734375, -0.51812744140625, -0.3394775390625, -0.16082763671875, 0.017822265625, 0.19647216796875, 0.3751220703125, 0.55377197265625, 0.732421875, 0.91107177734375, 1.0897216796875, 1.26837158203125, 1.447021484375, 1.62567138671875, 1.8043212890625, 1.98297119140625, 2.16162109375, 2.34027099609375, 2.5189208984375, 2.69757080078125, 2.876220703125, 3.05487060546875, 3.2335205078125, 3.41217041015625, 3.5908203125, 3.76947021484375, 3.9481201171875, 4.12677001953125, 4.305419921875, 4.48406982421875, 4.6627197265625, 4.84136962890625, 5.02001953125, 5.19866943359375, 5.3773193359375, 5.55596923828125, 5.734619140625, 5.91326904296875, 6.0919189453125, 6.27056884765625, 6.44921875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 9.0, 9.0, 16.0, 21.0, 37.0, 55.0, 100.0, 255.0, 689.0, 6041.0, 358438.0, 3748082.0, 77115.0, 2421.0, 513.0, 210.0, 111.0, 58.0, 35.0, 23.0, 11.0, 9.0, 6.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.1358642578125, -11.435791015625, -10.7357177734375, -10.03564453125, -9.3355712890625, -8.635498046875, -7.9354248046875, -7.2353515625, -6.5352783203125, -5.835205078125, -5.1351318359375, -4.43505859375, -3.7349853515625, -3.034912109375, -2.3348388671875, -1.634765625, -0.9346923828125, -0.234619140625, 0.4654541015625, 1.16552734375, 1.8656005859375, 2.565673828125, 3.2657470703125, 3.9658203125, 4.6658935546875, 5.365966796875, 6.0660400390625, 6.76611328125, 7.4661865234375, 8.166259765625, 8.8663330078125, 9.56640625, 10.2664794921875, 10.966552734375, 11.6666259765625, 12.36669921875, 13.0667724609375, 13.766845703125, 14.4669189453125, 15.1669921875, 15.8670654296875, 16.567138671875, 17.2672119140625, 17.96728515625, 18.6673583984375, 19.367431640625, 20.0675048828125, 20.767578125, 21.4676513671875, 22.167724609375, 22.8677978515625, 23.56787109375, 24.2679443359375, 24.968017578125, 25.6680908203125, 26.3681640625, 27.0682373046875, 27.768310546875, 28.4683837890625, 29.16845703125, 29.8685302734375, 30.568603515625, 31.2686767578125, 31.96875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 11.0, 36.0, 97.0, 161.0, 208.0, 212.0, 158.0, 91.0, 21.0, 11.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.830326080322266, -57.453983306884766, -56.07764434814453, -54.70130157470703, -53.32495880126953, -51.9486198425293, -50.5722770690918, -49.19593811035156, -47.81959533691406, -46.44325256347656, -45.06691360473633, -43.69057083129883, -42.314231872558594, -40.937889099121094, -39.561546325683594, -38.185203552246094, -36.80886459350586, -35.43252182006836, -34.056182861328125, -32.679840087890625, -31.303499221801758, -29.92715835571289, -28.55081558227539, -27.174474716186523, -25.798133850097656, -24.42179298400879, -23.045452117919922, -21.669109344482422, -20.292768478393555, -18.916427612304688, -17.540084838867188, -16.16374397277832, -14.787399291992188, -13.41105842590332, -12.034716606140137, -10.658374786376953, -9.282033920288086, -7.9056925773620605, -6.529351234436035, -5.153009414672852, -3.7766685485839844, -2.400327205657959, -1.0239858627319336, 0.3523554801940918, 1.7286968231201172, 3.1050381660461426, 4.481379508972168, 5.857721328735352, 7.234062194824219, 8.610403060913086, 9.98674488067627, 11.363086700439453, 12.73942756652832, 14.115768432617188, 15.492110252380371, 16.868452072143555, 18.244792938232422, 19.62113380432129, 20.997474670410156, 22.373817443847656, 23.750158309936523, 25.12649917602539, 26.50284194946289, 27.879182815551758, 29.255523681640625]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 5.0, 1.0, 5.0, 6.0, 6.0, 11.0, 12.0, 14.0, 19.0, 9.0, 23.0, 25.0, 26.0, 22.0, 36.0, 38.0, 45.0, 46.0, 45.0, 36.0, 41.0, 48.0, 41.0, 59.0, 39.0, 44.0, 40.0, 25.0, 21.0, 29.0, 40.0, 20.0, 29.0, 12.0, 23.0, 15.0, 16.0, 16.0, 6.0, 4.0, 8.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.183191299438477, -20.547462463378906, -19.911731719970703, -19.276002883911133, -18.640274047851562, -18.00454330444336, -17.36881446838379, -16.73308563232422, -16.097354888916016, -15.461625099182129, -14.825895309448242, -14.190166473388672, -13.554436683654785, -12.918706893920898, -12.282978057861328, -11.647248268127441, -11.011518478393555, -10.375788688659668, -9.740058898925781, -9.104330062866211, -8.468600273132324, -7.8328704833984375, -7.197141170501709, -6.5614118576049805, -5.925682067871094, -5.289952278137207, -4.6542229652404785, -4.01849365234375, -3.3827638626098633, -2.7470343112945557, -2.111304759979248, -1.4755754470825195, -0.8398475646972656, -0.204118013381958, 0.4316115379333496, 1.0673410892486572, 1.7030706405639648, 2.3388001918792725, 2.97452974319458, 3.6102590560913086, 4.245988845825195, 4.881718635559082, 5.5174479484558105, 6.153177261352539, 6.788907051086426, 7.4246368408203125, 8.060365676879883, 8.69609546661377, 9.331825256347656, 9.967555046081543, 10.60328483581543, 11.239013671875, 11.874743461608887, 12.510473251342773, 13.146202087402344, 13.78193187713623, 14.417661666870117, 15.053391456604004, 15.68912124633789, 16.32485008239746, 16.96057891845703, 17.596309661865234, 18.232038497924805, 18.867767333984375, 19.503498077392578]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 5.0, 6.0, 5.0, 8.0, 8.0, 15.0, 12.0, 12.0, 12.0, 18.0, 21.0, 40.0, 40.0, 39.0, 47.0, 36.0, 45.0, 48.0, 48.0, 57.0, 55.0, 39.0, 47.0, 40.0, 39.0, 40.0, 41.0, 28.0, 27.0, 31.0, 20.0, 17.0, 17.0, 13.0, 12.0, 3.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.27734375, -4.1422119140625, -4.007080078125, -3.8719482421875, -3.73681640625, -3.6016845703125, -3.466552734375, -3.3314208984375, -3.1962890625, -3.0611572265625, -2.926025390625, -2.7908935546875, -2.65576171875, -2.5206298828125, -2.385498046875, -2.2503662109375, -2.115234375, -1.9801025390625, -1.844970703125, -1.7098388671875, -1.57470703125, -1.4395751953125, -1.304443359375, -1.1693115234375, -1.0341796875, -0.8990478515625, -0.763916015625, -0.6287841796875, -0.49365234375, -0.3585205078125, -0.223388671875, -0.0882568359375, 0.046875, 0.1820068359375, 0.317138671875, 0.4522705078125, 0.58740234375, 0.7225341796875, 0.857666015625, 0.9927978515625, 1.1279296875, 1.2630615234375, 1.398193359375, 1.5333251953125, 1.66845703125, 1.8035888671875, 1.938720703125, 2.0738525390625, 2.208984375, 2.3441162109375, 2.479248046875, 2.6143798828125, 2.74951171875, 2.8846435546875, 3.019775390625, 3.1549072265625, 3.2900390625, 3.4251708984375, 3.560302734375, 3.6954345703125, 3.83056640625, 3.9656982421875, 4.100830078125, 4.2359619140625, 4.37109375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 2.0, 5.0, 8.0, 13.0, 23.0, 28.0, 63.0, 99.0, 160.0, 292.0, 469.0, 834.0, 1382.0, 2273.0, 3641.0, 6091.0, 9914.0, 16073.0, 25840.0, 39568.0, 58502.0, 81912.0, 106956.0, 126760.0, 133852.0, 121092.0, 98063.0, 73432.0, 50931.0, 33732.0, 21743.0, 13584.0, 8534.0, 4954.0, 3102.0, 1889.0, 1121.0, 624.0, 411.0, 256.0, 127.0, 91.0, 44.0, 28.0, 15.0, 14.0, 5.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.49365234375, -0.4783782958984375, -0.463104248046875, -0.4478302001953125, -0.43255615234375, -0.4172821044921875, -0.402008056640625, -0.3867340087890625, -0.3714599609375, -0.3561859130859375, -0.340911865234375, -0.3256378173828125, -0.31036376953125, -0.2950897216796875, -0.279815673828125, -0.2645416259765625, -0.249267578125, -0.2339935302734375, -0.218719482421875, -0.2034454345703125, -0.18817138671875, -0.1728973388671875, -0.157623291015625, -0.1423492431640625, -0.1270751953125, -0.1118011474609375, -0.096527099609375, -0.0812530517578125, -0.06597900390625, -0.0507049560546875, -0.035430908203125, -0.0201568603515625, -0.0048828125, 0.0103912353515625, 0.025665283203125, 0.0409393310546875, 0.05621337890625, 0.0714874267578125, 0.086761474609375, 0.1020355224609375, 0.1173095703125, 0.1325836181640625, 0.147857666015625, 0.1631317138671875, 0.17840576171875, 0.1936798095703125, 0.208953857421875, 0.2242279052734375, 0.239501953125, 0.2547760009765625, 0.270050048828125, 0.2853240966796875, 0.30059814453125, 0.3158721923828125, 0.331146240234375, 0.3464202880859375, 0.3616943359375, 0.3769683837890625, 0.392242431640625, 0.4075164794921875, 0.42279052734375, 0.4380645751953125, 0.453338623046875, 0.4686126708984375, 0.48388671875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 6.0, 11.0, 18.0, 13.0, 11.0, 26.0, 21.0, 26.0, 17.0, 28.0, 40.0, 29.0, 45.0, 44.0, 41.0, 38.0, 37.0, 41.0, 1066.0, 33.0, 39.0, 45.0, 35.0, 28.0, 21.0, 33.0, 27.0, 38.0, 20.0, 23.0, 17.0, 11.0, 12.0, 9.0, 13.0, 11.0, 6.0, 13.0, 6.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.6328125, -2.554046630859375, -2.47528076171875, -2.396514892578125, -2.3177490234375, -2.238983154296875, -2.16021728515625, -2.081451416015625, -2.002685546875, -1.923919677734375, -1.84515380859375, -1.766387939453125, -1.6876220703125, -1.608856201171875, -1.53009033203125, -1.451324462890625, -1.37255859375, -1.293792724609375, -1.21502685546875, -1.136260986328125, -1.0574951171875, -0.978729248046875, -0.89996337890625, -0.821197509765625, -0.742431640625, -0.663665771484375, -0.58489990234375, -0.506134033203125, -0.4273681640625, -0.348602294921875, -0.26983642578125, -0.191070556640625, -0.1123046875, -0.033538818359375, 0.04522705078125, 0.123992919921875, 0.2027587890625, 0.281524658203125, 0.36029052734375, 0.439056396484375, 0.517822265625, 0.596588134765625, 0.67535400390625, 0.754119873046875, 0.8328857421875, 0.911651611328125, 0.99041748046875, 1.069183349609375, 1.14794921875, 1.226715087890625, 1.30548095703125, 1.384246826171875, 1.4630126953125, 1.541778564453125, 1.62054443359375, 1.699310302734375, 1.778076171875, 1.856842041015625, 1.93560791015625, 2.014373779296875, 2.0931396484375, 2.171905517578125, 2.25067138671875, 2.329437255859375, 2.408203125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 3.0, 3.0, 14.0, 20.0, 24.0, 38.0, 62.0, 70.0, 104.0, 184.0, 228.0, 359.0, 541.0, 804.0, 1151.0, 1727.0, 2614.0, 3792.0, 5541.0, 8280.0, 12168.0, 18414.0, 30206.0, 166896.0, 1717485.0, 55270.0, 23571.0, 15653.0, 10173.0, 6927.0, 4752.0, 3254.0, 2252.0, 1480.0, 1029.0, 644.0, 434.0, 293.0, 229.0, 132.0, 102.0, 66.0, 40.0, 44.0, 28.0, 7.0, 7.0, 7.0, 1.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.87158203125, -0.8445892333984375, -0.817596435546875, -0.7906036376953125, -0.76361083984375, -0.7366180419921875, -0.709625244140625, -0.6826324462890625, -0.6556396484375, -0.6286468505859375, -0.601654052734375, -0.5746612548828125, -0.54766845703125, -0.5206756591796875, -0.493682861328125, -0.4666900634765625, -0.439697265625, -0.4127044677734375, -0.385711669921875, -0.3587188720703125, -0.33172607421875, -0.3047332763671875, -0.277740478515625, -0.2507476806640625, -0.2237548828125, -0.1967620849609375, -0.169769287109375, -0.1427764892578125, -0.11578369140625, -0.0887908935546875, -0.061798095703125, -0.0348052978515625, -0.0078125, 0.0191802978515625, 0.046173095703125, 0.0731658935546875, 0.10015869140625, 0.1271514892578125, 0.154144287109375, 0.1811370849609375, 0.2081298828125, 0.2351226806640625, 0.262115478515625, 0.2891082763671875, 0.31610107421875, 0.3430938720703125, 0.370086669921875, 0.3970794677734375, 0.424072265625, 0.4510650634765625, 0.478057861328125, 0.5050506591796875, 0.53204345703125, 0.5590362548828125, 0.586029052734375, 0.6130218505859375, 0.6400146484375, 0.6670074462890625, 0.694000244140625, 0.7209930419921875, 0.74798583984375, 0.7749786376953125, 0.801971435546875, 0.8289642333984375, 0.85595703125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 8.0, 7.0, 5.0, 5.0, 14.0, 12.0, 12.0, 22.0, 22.0, 30.0, 38.0, 42.0, 45.0, 53.0, 50.0, 68.0, 60.0, 61.0, 56.0, 47.0, 53.0, 42.0, 45.0, 41.0, 31.0, 18.0, 22.0, 18.0, 21.0, 13.0, 11.0, 7.0, 4.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.045806884765625, -0.04428243637084961, -0.04275798797607422, -0.04123353958129883, -0.03970909118652344, -0.03818464279174805, -0.036660194396972656, -0.035135746002197266, -0.033611297607421875, -0.032086849212646484, -0.030562400817871094, -0.029037952423095703, -0.027513504028320312, -0.025989055633544922, -0.02446460723876953, -0.02294015884399414, -0.02141571044921875, -0.01989126205444336, -0.01836681365966797, -0.016842365264892578, -0.015317916870117188, -0.013793468475341797, -0.012269020080566406, -0.010744571685791016, -0.009220123291015625, -0.007695674896240234, -0.006171226501464844, -0.004646778106689453, -0.0031223297119140625, -0.0015978813171386719, -7.343292236328125e-05, 0.0014510154724121094, 0.0029754638671875, 0.004499912261962891, 0.006024360656738281, 0.007548809051513672, 0.009073257446289062, 0.010597705841064453, 0.012122154235839844, 0.013646602630615234, 0.015171051025390625, 0.016695499420166016, 0.018219947814941406, 0.019744396209716797, 0.021268844604492188, 0.022793292999267578, 0.02431774139404297, 0.02584218978881836, 0.02736663818359375, 0.02889108657836914, 0.03041553497314453, 0.03193998336791992, 0.03346443176269531, 0.0349888801574707, 0.036513328552246094, 0.038037776947021484, 0.039562225341796875, 0.041086673736572266, 0.042611122131347656, 0.04413557052612305, 0.04566001892089844, 0.04718446731567383, 0.04870891571044922, 0.05023336410522461, 0.0517578125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 6.0, 5.0, 5.0, 16.0, 16.0, 25.0, 21.0, 28.0, 41.0, 53.0, 90.0, 95.0, 137.0, 263.0, 502.0, 1573.0, 977104.0, 66654.0, 854.0, 353.0, 213.0, 148.0, 78.0, 71.0, 42.0, 37.0, 26.0, 19.0, 16.0, 15.0, 5.0, 7.0, 11.0, 9.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.107421875, -1.0746612548828125, -1.041900634765625, -1.0091400146484375, -0.97637939453125, -0.9436187744140625, -0.910858154296875, -0.8780975341796875, -0.8453369140625, -0.8125762939453125, -0.779815673828125, -0.7470550537109375, -0.71429443359375, -0.6815338134765625, -0.648773193359375, -0.6160125732421875, -0.583251953125, -0.5504913330078125, -0.517730712890625, -0.4849700927734375, -0.45220947265625, -0.4194488525390625, -0.386688232421875, -0.3539276123046875, -0.3211669921875, -0.2884063720703125, -0.255645751953125, -0.2228851318359375, -0.19012451171875, -0.1573638916015625, -0.124603271484375, -0.0918426513671875, -0.05908203125, -0.0263214111328125, 0.006439208984375, 0.0391998291015625, 0.07196044921875, 0.1047210693359375, 0.137481689453125, 0.1702423095703125, 0.2030029296875, 0.2357635498046875, 0.268524169921875, 0.3012847900390625, 0.33404541015625, 0.3668060302734375, 0.399566650390625, 0.4323272705078125, 0.465087890625, 0.4978485107421875, 0.530609130859375, 0.5633697509765625, 0.59613037109375, 0.6288909912109375, 0.661651611328125, 0.6944122314453125, 0.7271728515625, 0.7599334716796875, 0.792694091796875, 0.8254547119140625, 0.85821533203125, 0.8909759521484375, 0.923736572265625, 0.9564971923828125, 0.9892578125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 17.0, 658.0, 336.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2145560085773468, -0.2025274634361267, -0.1904989331960678, -0.17847038805484772, -0.16644185781478882, -0.15441331267356873, -0.14238476753234863, -0.13035622239112854, -0.11832769215106964, -0.10629915446043015, -0.09427061676979065, -0.08224207162857056, -0.07021353393793106, -0.058184996247291565, -0.04615645110607147, -0.034127913415431976, -0.02209937572479248, -0.010070836171507835, 0.0019577033817768097, 0.013986244797706604, 0.0260147824883461, 0.038043320178985596, 0.05007186532020569, 0.062100403010845184, 0.07412894070148468, 0.08615747839212418, 0.09818601608276367, 0.11021456122398376, 0.12224309891462326, 0.13427163660526276, 0.14630018174648285, 0.15832871198654175, 0.17035728693008423, 0.18238583207130432, 0.19441436231136322, 0.2064429074525833, 0.2184714376926422, 0.2304999828338623, 0.2425285279750824, 0.2545570731163025, 0.2665855884552002, 0.2786141335964203, 0.2906426787376404, 0.3026711940765381, 0.3146997392177582, 0.32672828435897827, 0.33875682950019836, 0.35078537464141846, 0.36281391978263855, 0.37484246492385864, 0.38687101006507874, 0.39889955520629883, 0.41092807054519653, 0.4229566156864166, 0.4349851608276367, 0.4470137059688568, 0.4590422511100769, 0.471070796251297, 0.4830993413925171, 0.4951278567314148, 0.5071564316749573, 0.519184947013855, 0.5312135219573975, 0.5432420372962952, 0.5552705526351929]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 9.0, 9.0, 9.0, 24.0, 19.0, 26.0, 24.0, 39.0, 40.0, 40.0, 51.0, 59.0, 54.0, 66.0, 56.0, 78.0, 55.0, 49.0, 43.0, 41.0, 35.0, 34.0, 28.0, 24.0, 17.0, 18.0, 16.0, 12.0, 11.0, 3.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0], "bins": [-0.07628607749938965, -0.07444486021995544, -0.07260364294052124, -0.07076243311166763, -0.06892121583223343, -0.06707999855279922, -0.06523878872394562, -0.06339757144451141, -0.06155635416507721, -0.059715136885643005, -0.0578739233314991, -0.056032709777355194, -0.05419149249792099, -0.052350275218486786, -0.05050906166434288, -0.048667848110198975, -0.04682663083076477, -0.044985413551330566, -0.04314419999718666, -0.041302986443042755, -0.03946176916360855, -0.03762055188417435, -0.03577933833003044, -0.033938124775886536, -0.03209690749645233, -0.030255692079663277, -0.028414476662874222, -0.026573261246085167, -0.024732045829296112, -0.022890830412507057, -0.021049614995718002, -0.019208399578928947, -0.017367184162139893, -0.015525968745350838, -0.013684753328561783, -0.011843537911772728, -0.010002322494983673, -0.008161107078194618, -0.006319891661405563, -0.0044786762446165085, -0.0026374608278274536, -0.0007962454110383987, 0.0010449700057506561, 0.002886185422539711, 0.004727400839328766, 0.006568616256117821, 0.008409831672906876, 0.01025104708969593, 0.012092262506484985, 0.01393347792327404, 0.015774693340063095, 0.01761590875685215, 0.019457124173641205, 0.02129833959043026, 0.023139555007219315, 0.02498077042400837, 0.026821985840797424, 0.02866320125758648, 0.030504416674375534, 0.03234563022851944, 0.034186847507953644, 0.03602806478738785, 0.037869278341531754, 0.03971049189567566, 0.04155170917510986]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 7.0, 6.0, 7.0, 5.0, 6.0, 12.0, 16.0, 22.0, 23.0, 18.0, 38.0, 38.0, 36.0, 30.0, 43.0, 45.0, 45.0, 37.0, 47.0, 40.0, 52.0, 47.0, 46.0, 33.0, 43.0, 45.0, 23.0, 27.0, 27.0, 30.0, 19.0, 22.0, 14.0, 15.0, 3.0, 8.0, 3.0, 5.0, 3.0, 4.0, 6.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.359375, -3.2353515625, -3.111328125, -2.9873046875, -2.86328125, -2.7392578125, -2.615234375, -2.4912109375, -2.3671875, -2.2431640625, -2.119140625, -1.9951171875, -1.87109375, -1.7470703125, -1.623046875, -1.4990234375, -1.375, -1.2509765625, -1.126953125, -1.0029296875, -0.87890625, -0.7548828125, -0.630859375, -0.5068359375, -0.3828125, -0.2587890625, -0.134765625, -0.0107421875, 0.11328125, 0.2373046875, 0.361328125, 0.4853515625, 0.609375, 0.7333984375, 0.857421875, 0.9814453125, 1.10546875, 1.2294921875, 1.353515625, 1.4775390625, 1.6015625, 1.7255859375, 1.849609375, 1.9736328125, 2.09765625, 2.2216796875, 2.345703125, 2.4697265625, 2.59375, 2.7177734375, 2.841796875, 2.9658203125, 3.08984375, 3.2138671875, 3.337890625, 3.4619140625, 3.5859375, 3.7099609375, 3.833984375, 3.9580078125, 4.08203125, 4.2060546875, 4.330078125, 4.4541015625, 4.578125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 8.0, 9.0, 10.0, 20.0, 26.0, 25.0, 42.0, 65.0, 112.0, 201.0, 348.0, 660.0, 1295.0, 2887.0, 6248.0, 13918.0, 30642.0, 68506.0, 165698.0, 339166.0, 242080.0, 97737.0, 42674.0, 19603.0, 8880.0, 3986.0, 1803.0, 826.0, 463.0, 204.0, 132.0, 88.0, 51.0, 37.0, 34.0, 22.0, 16.0, 10.0, 10.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.578125, -5.41265869140625, -5.2471923828125, -5.08172607421875, -4.916259765625, -4.75079345703125, -4.5853271484375, -4.41986083984375, -4.25439453125, -4.08892822265625, -3.9234619140625, -3.75799560546875, -3.592529296875, -3.42706298828125, -3.2615966796875, -3.09613037109375, -2.9306640625, -2.76519775390625, -2.5997314453125, -2.43426513671875, -2.268798828125, -2.10333251953125, -1.9378662109375, -1.77239990234375, -1.60693359375, -1.44146728515625, -1.2760009765625, -1.11053466796875, -0.945068359375, -0.77960205078125, -0.6141357421875, -0.44866943359375, -0.283203125, -0.11773681640625, 0.0477294921875, 0.21319580078125, 0.378662109375, 0.54412841796875, 0.7095947265625, 0.87506103515625, 1.04052734375, 1.20599365234375, 1.3714599609375, 1.53692626953125, 1.702392578125, 1.86785888671875, 2.0333251953125, 2.19879150390625, 2.3642578125, 2.52972412109375, 2.6951904296875, 2.86065673828125, 3.026123046875, 3.19158935546875, 3.3570556640625, 3.52252197265625, 3.68798828125, 3.85345458984375, 4.0189208984375, 4.18438720703125, 4.349853515625, 4.51531982421875, 4.6807861328125, 4.84625244140625, 5.01171875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 0.0, 3.0, 2.0, 5.0, 5.0, 7.0, 7.0, 6.0, 8.0, 12.0, 18.0, 12.0, 26.0, 26.0, 19.0, 33.0, 26.0, 33.0, 39.0, 36.0, 67.0, 78.0, 102.0, 192.0, 262.0, 1311.0, 163.0, 100.0, 73.0, 58.0, 41.0, 26.0, 28.0, 32.0, 23.0, 34.0, 21.0, 13.0, 17.0, 29.0, 9.0, 10.0, 15.0, 2.0, 6.0, 3.0, 4.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.37890625, -7.11541748046875, -6.8519287109375, -6.58843994140625, -6.324951171875, -6.06146240234375, -5.7979736328125, -5.53448486328125, -5.27099609375, -5.00750732421875, -4.7440185546875, -4.48052978515625, -4.217041015625, -3.95355224609375, -3.6900634765625, -3.42657470703125, -3.1630859375, -2.89959716796875, -2.6361083984375, -2.37261962890625, -2.109130859375, -1.84564208984375, -1.5821533203125, -1.31866455078125, -1.05517578125, -0.79168701171875, -0.5281982421875, -0.26470947265625, -0.001220703125, 0.26226806640625, 0.5257568359375, 0.78924560546875, 1.052734375, 1.31622314453125, 1.5797119140625, 1.84320068359375, 2.106689453125, 2.37017822265625, 2.6336669921875, 2.89715576171875, 3.16064453125, 3.42413330078125, 3.6876220703125, 3.95111083984375, 4.214599609375, 4.47808837890625, 4.7415771484375, 5.00506591796875, 5.2685546875, 5.53204345703125, 5.7955322265625, 6.05902099609375, 6.322509765625, 6.58599853515625, 6.8494873046875, 7.11297607421875, 7.37646484375, 7.63995361328125, 7.9034423828125, 8.16693115234375, 8.430419921875, 8.69390869140625, 8.9573974609375, 9.22088623046875, 9.484375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 6.0, 8.0, 7.0, 10.0, 12.0, 16.0, 19.0, 35.0, 43.0, 60.0, 72.0, 117.0, 145.0, 211.0, 313.0, 417.0, 952.0, 3766.0, 30174.0, 571721.0, 2432588.0, 92453.0, 9215.0, 1542.0, 580.0, 388.0, 229.0, 175.0, 116.0, 78.0, 65.0, 39.0, 33.0, 26.0, 19.0, 16.0, 5.0, 9.0, 9.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.25, -12.8388671875, -12.427734375, -12.0166015625, -11.60546875, -11.1943359375, -10.783203125, -10.3720703125, -9.9609375, -9.5498046875, -9.138671875, -8.7275390625, -8.31640625, -7.9052734375, -7.494140625, -7.0830078125, -6.671875, -6.2607421875, -5.849609375, -5.4384765625, -5.02734375, -4.6162109375, -4.205078125, -3.7939453125, -3.3828125, -2.9716796875, -2.560546875, -2.1494140625, -1.73828125, -1.3271484375, -0.916015625, -0.5048828125, -0.09375, 0.3173828125, 0.728515625, 1.1396484375, 1.55078125, 1.9619140625, 2.373046875, 2.7841796875, 3.1953125, 3.6064453125, 4.017578125, 4.4287109375, 4.83984375, 5.2509765625, 5.662109375, 6.0732421875, 6.484375, 6.8955078125, 7.306640625, 7.7177734375, 8.12890625, 8.5400390625, 8.951171875, 9.3623046875, 9.7734375, 10.1845703125, 10.595703125, 11.0068359375, 11.41796875, 11.8291015625, 12.240234375, 12.6513671875, 13.0625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 36.0, 220.0, 435.0, 262.0, 50.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.3733901977539, -69.93568420410156, -67.49797058105469, -65.06026458740234, -62.622554779052734, -60.184844970703125, -57.74713897705078, -55.30942916870117, -52.87171936035156, -50.43400955200195, -47.996299743652344, -45.55859375, -43.12088394165039, -40.68317413330078, -38.24546813964844, -35.80775833129883, -33.37004852294922, -30.93233871459961, -28.494630813598633, -26.056922912597656, -23.619213104248047, -21.181503295898438, -18.74379539489746, -16.306087493896484, -13.868377685546875, -11.430668830871582, -8.992959976196289, -6.555251121520996, -4.117542266845703, -1.6798334121704102, 0.7578754425048828, 3.1955833435058594, 5.63330078125, 8.071009635925293, 10.508718490600586, 12.946427345275879, 15.384136199951172, 17.82184600830078, 20.259553909301758, 22.697261810302734, 25.134971618652344, 27.572681427001953, 30.01038932800293, 32.448097229003906, 34.885807037353516, 37.323516845703125, 39.76122283935547, 42.19893264770508, 44.63664245605469, 47.0743522644043, 49.512062072753906, 51.94976806640625, 54.38747787475586, 56.82518768310547, 59.26289367675781, 61.70060348510742, 64.13831329345703, 66.57601928710938, 69.01373291015625, 71.4514389038086, 73.88914489746094, 76.32685852050781, 78.76456451416016, 81.2022705078125, 83.63998413085938]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 9.0, 4.0, 3.0, 9.0, 6.0, 6.0, 8.0, 13.0, 13.0, 20.0, 20.0, 18.0, 23.0, 24.0, 24.0, 43.0, 33.0, 28.0, 33.0, 40.0, 36.0, 46.0, 45.0, 42.0, 40.0, 45.0, 34.0, 32.0, 38.0, 33.0, 19.0, 26.0, 20.0, 19.0, 19.0, 18.0, 15.0, 16.0, 11.0, 14.0, 12.0, 8.0, 8.0, 7.0, 10.0, 2.0, 4.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.475048065185547, -20.82901382446289, -20.1829776763916, -19.536943435668945, -18.890907287597656, -18.244873046875, -17.598838806152344, -16.952804565429688, -16.3067684173584, -15.660733222961426, -15.014698028564453, -14.368663787841797, -13.722628593444824, -13.076593399047852, -12.430559158325195, -11.784523963928223, -11.13848876953125, -10.492453575134277, -9.846418380737305, -9.200384140014648, -8.554348945617676, -7.908313751220703, -7.262279033660889, -6.616244316101074, -5.970209121704102, -5.324173927307129, -4.6781392097473145, -4.0321044921875, -3.3860692977905273, -2.740034341812134, -2.0939993858337402, -1.4479646682739258, -0.8019294738769531, -0.15589451789855957, 0.490140438079834, 1.1361753940582275, 1.782210350036621, 2.4282453060150146, 3.074280261993408, 3.7203149795532227, 4.366350173950195, 5.012385368347168, 5.658420085906982, 6.304454803466797, 6.9504899978637695, 7.596525192260742, 8.242559432983398, 8.888594627380371, 9.534629821777344, 10.180665016174316, 10.826700210571289, 11.472734451293945, 12.118769645690918, 12.76480484008789, 13.410839080810547, 14.05687427520752, 14.702909469604492, 15.348944664001465, 15.994979858398438, 16.641014099121094, 17.28704833984375, 17.93308448791504, 18.579118728637695, 19.225154876708984, 19.87118911743164]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 4.0, 8.0, 11.0, 13.0, 13.0, 17.0, 14.0, 18.0, 20.0, 31.0, 36.0, 35.0, 34.0, 45.0, 44.0, 57.0, 40.0, 41.0, 33.0, 46.0, 40.0, 53.0, 39.0, 43.0, 46.0, 36.0, 30.0, 21.0, 28.0, 20.0, 17.0, 14.0, 19.0, 8.0, 7.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.625, -4.4898681640625, -4.354736328125, -4.2196044921875, -4.08447265625, -3.9493408203125, -3.814208984375, -3.6790771484375, -3.5439453125, -3.4088134765625, -3.273681640625, -3.1385498046875, -3.00341796875, -2.8682861328125, -2.733154296875, -2.5980224609375, -2.462890625, -2.3277587890625, -2.192626953125, -2.0574951171875, -1.92236328125, -1.7872314453125, -1.652099609375, -1.5169677734375, -1.3818359375, -1.2467041015625, -1.111572265625, -0.9764404296875, -0.84130859375, -0.7061767578125, -0.571044921875, -0.4359130859375, -0.30078125, -0.1656494140625, -0.030517578125, 0.1046142578125, 0.23974609375, 0.3748779296875, 0.510009765625, 0.6451416015625, 0.7802734375, 0.9154052734375, 1.050537109375, 1.1856689453125, 1.32080078125, 1.4559326171875, 1.591064453125, 1.7261962890625, 1.861328125, 1.9964599609375, 2.131591796875, 2.2667236328125, 2.40185546875, 2.5369873046875, 2.672119140625, 2.8072509765625, 2.9423828125, 3.0775146484375, 3.212646484375, 3.3477783203125, 3.48291015625, 3.6180419921875, 3.753173828125, 3.8883056640625, 4.0234375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 16.0, 20.0, 36.0, 33.0, 52.0, 65.0, 111.0, 165.0, 302.0, 413.0, 748.0, 657363.0, 3532702.0, 906.0, 444.0, 316.0, 184.0, 117.0, 78.0, 51.0, 47.0, 31.0, 21.0, 9.0, 13.0, 11.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.875, -40.9326171875, -38.990234375, -37.0478515625, -35.10546875, -33.1630859375, -31.220703125, -29.2783203125, -27.3359375, -25.3935546875, -23.451171875, -21.5087890625, -19.56640625, -17.6240234375, -15.681640625, -13.7392578125, -11.796875, -9.8544921875, -7.912109375, -5.9697265625, -4.02734375, -2.0849609375, -0.142578125, 1.7998046875, 3.7421875, 5.6845703125, 7.626953125, 9.5693359375, 11.51171875, 13.4541015625, 15.396484375, 17.3388671875, 19.28125, 21.2236328125, 23.166015625, 25.1083984375, 27.05078125, 28.9931640625, 30.935546875, 32.8779296875, 34.8203125, 36.7626953125, 38.705078125, 40.6474609375, 42.58984375, 44.5322265625, 46.474609375, 48.4169921875, 50.359375, 52.3017578125, 54.244140625, 56.1865234375, 58.12890625, 60.0712890625, 62.013671875, 63.9560546875, 65.8984375, 67.8408203125, 69.783203125, 71.7255859375, 73.66796875, 75.6103515625, 77.552734375, 79.4951171875, 81.4375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 5.0, 1.0, 4.0, 11.0, 10.0, 10.0, 15.0, 17.0, 17.0, 22.0, 46.0, 55.0, 60.0, 97.0, 140.0, 201.0, 292.0, 413.0, 530.0, 515.0, 487.0, 336.0, 233.0, 137.0, 107.0, 74.0, 63.0, 44.0, 27.0, 27.0, 21.0, 8.0, 10.0, 11.0, 16.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.171875, -6.00091552734375, -5.8299560546875, -5.65899658203125, -5.488037109375, -5.31707763671875, -5.1461181640625, -4.97515869140625, -4.80419921875, -4.63323974609375, -4.4622802734375, -4.29132080078125, -4.120361328125, -3.94940185546875, -3.7784423828125, -3.60748291015625, -3.4365234375, -3.26556396484375, -3.0946044921875, -2.92364501953125, -2.752685546875, -2.58172607421875, -2.4107666015625, -2.23980712890625, -2.06884765625, -1.89788818359375, -1.7269287109375, -1.55596923828125, -1.385009765625, -1.21405029296875, -1.0430908203125, -0.87213134765625, -0.701171875, -0.53021240234375, -0.3592529296875, -0.18829345703125, -0.017333984375, 0.15362548828125, 0.3245849609375, 0.49554443359375, 0.66650390625, 0.83746337890625, 1.0084228515625, 1.17938232421875, 1.350341796875, 1.52130126953125, 1.6922607421875, 1.86322021484375, 2.0341796875, 2.20513916015625, 2.3760986328125, 2.54705810546875, 2.718017578125, 2.88897705078125, 3.0599365234375, 3.23089599609375, 3.40185546875, 3.57281494140625, 3.7437744140625, 3.91473388671875, 4.085693359375, 4.25665283203125, 4.4276123046875, 4.59857177734375, 4.76953125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 6.0, 13.0, 13.0, 20.0, 34.0, 44.0, 97.0, 214.0, 1108.0, 445688.0, 3743618.0, 2814.0, 329.0, 129.0, 60.0, 32.0, 21.0, 14.0, 14.0, 5.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.8125, -35.4560546875, -34.099609375, -32.7431640625, -31.38671875, -30.0302734375, -28.673828125, -27.3173828125, -25.9609375, -24.6044921875, -23.248046875, -21.8916015625, -20.53515625, -19.1787109375, -17.822265625, -16.4658203125, -15.109375, -13.7529296875, -12.396484375, -11.0400390625, -9.68359375, -8.3271484375, -6.970703125, -5.6142578125, -4.2578125, -2.9013671875, -1.544921875, -0.1884765625, 1.16796875, 2.5244140625, 3.880859375, 5.2373046875, 6.59375, 7.9501953125, 9.306640625, 10.6630859375, 12.01953125, 13.3759765625, 14.732421875, 16.0888671875, 17.4453125, 18.8017578125, 20.158203125, 21.5146484375, 22.87109375, 24.2275390625, 25.583984375, 26.9404296875, 28.296875, 29.6533203125, 31.009765625, 32.3662109375, 33.72265625, 35.0791015625, 36.435546875, 37.7919921875, 39.1484375, 40.5048828125, 41.861328125, 43.2177734375, 44.57421875, 45.9306640625, 47.287109375, 48.6435546875, 50.0]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 23.0, 182.0, 432.0, 295.0, 76.0, 8.0, 0.0, 1.0], "bins": [-166.9603271484375, -164.11468505859375, -161.26902770996094, -158.4233856201172, -155.57774353027344, -152.7321014404297, -149.88644409179688, -147.04080200195312, -144.19515991210938, -141.34951782226562, -138.5038604736328, -135.65821838378906, -132.8125762939453, -129.96693420410156, -127.12128448486328, -124.275634765625, -121.42999267578125, -118.58434295654297, -115.73870086669922, -112.89305114746094, -110.04740905761719, -107.2017593383789, -104.35611724853516, -101.51046752929688, -98.6648178100586, -95.81916809082031, -92.97352600097656, -90.12787628173828, -87.28223419189453, -84.43658447265625, -81.5909423828125, -78.74529266357422, -75.89965057373047, -73.05400085449219, -70.20835876464844, -67.36270904541016, -64.5170669555664, -61.67142105102539, -58.825775146484375, -55.980125427246094, -53.13447952270508, -50.28883361816406, -47.44318771362305, -44.59754180908203, -41.751895904541016, -38.90625, -36.06060028076172, -33.21495819091797, -30.369312286376953, -27.523666381835938, -24.678020477294922, -21.832374572753906, -18.98672866821289, -16.141082763671875, -13.295434951782227, -10.449789047241211, -7.604142189025879, -4.758496284484863, -1.9128499031066895, 0.9327964782714844, 3.7784423828125, 6.624088287353516, 9.469735145568848, 12.315381050109863, 15.161026954650879]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 4.0, 6.0, 13.0, 7.0, 12.0, 17.0, 18.0, 15.0, 22.0, 22.0, 29.0, 28.0, 38.0, 32.0, 32.0, 41.0, 41.0, 37.0, 54.0, 44.0, 43.0, 39.0, 30.0, 49.0, 39.0, 37.0, 33.0, 34.0, 31.0, 24.0, 22.0, 17.0, 17.0, 12.0, 13.0, 13.0, 7.0, 7.0, 3.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-21.367782592773438, -20.78986167907715, -20.21194076538086, -19.634021759033203, -19.056100845336914, -18.478179931640625, -17.900259017944336, -17.322338104248047, -16.74441909790039, -16.1664981842041, -15.588578224182129, -15.01065731048584, -14.432737350463867, -13.854816436767578, -13.276895523071289, -12.698975563049316, -12.121054649353027, -11.543133735656738, -10.965213775634766, -10.387292861938477, -9.809372901916504, -9.231451988220215, -8.653532028198242, -8.075611114501953, -7.497690677642822, -6.919770240783691, -6.3418498039245605, -5.76392936706543, -5.186008453369141, -4.608088493347168, -4.030167579650879, -3.452247142791748, -2.874326705932617, -2.2964062690734863, -1.718485713005066, -1.1405651569366455, -0.5626447200775146, 0.015275716781616211, 0.5931963920593262, 1.171116828918457, 1.749037265777588, 2.3269577026367188, 2.9048781394958496, 3.4827988147735596, 4.0607194900512695, 4.638639450073242, 5.216560363769531, 5.794480800628662, 6.372401237487793, 6.950321674346924, 7.528242111206055, 8.106163024902344, 8.684082984924316, 9.262003898620605, 9.839923858642578, 10.417844772338867, 10.995765686035156, 11.573686599731445, 12.151606559753418, 12.729527473449707, 13.30744743347168, 13.885368347167969, 14.463289260864258, 15.04120922088623, 15.619129180908203]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 1.0, 4.0, 2.0, 6.0, 12.0, 11.0, 17.0, 16.0, 21.0, 18.0, 23.0, 37.0, 29.0, 46.0, 42.0, 47.0, 36.0, 46.0, 57.0, 47.0, 58.0, 55.0, 37.0, 52.0, 44.0, 34.0, 24.0, 25.0, 29.0, 26.0, 21.0, 19.0, 18.0, 12.0, 9.0, 8.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4609375, -4.3272705078125, -4.193603515625, -4.0599365234375, -3.92626953125, -3.7926025390625, -3.658935546875, -3.5252685546875, -3.3916015625, -3.2579345703125, -3.124267578125, -2.9906005859375, -2.85693359375, -2.7232666015625, -2.589599609375, -2.4559326171875, -2.322265625, -2.1885986328125, -2.054931640625, -1.9212646484375, -1.78759765625, -1.6539306640625, -1.520263671875, -1.3865966796875, -1.2529296875, -1.1192626953125, -0.985595703125, -0.8519287109375, -0.71826171875, -0.5845947265625, -0.450927734375, -0.3172607421875, -0.18359375, -0.0499267578125, 0.083740234375, 0.2174072265625, 0.35107421875, 0.4847412109375, 0.618408203125, 0.7520751953125, 0.8857421875, 1.0194091796875, 1.153076171875, 1.2867431640625, 1.42041015625, 1.5540771484375, 1.687744140625, 1.8214111328125, 1.955078125, 2.0887451171875, 2.222412109375, 2.3560791015625, 2.48974609375, 2.6234130859375, 2.757080078125, 2.8907470703125, 3.0244140625, 3.1580810546875, 3.291748046875, 3.4254150390625, 3.55908203125, 3.6927490234375, 3.826416015625, 3.9600830078125, 4.09375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 9.0, 3.0, 10.0, 13.0, 17.0, 38.0, 50.0, 77.0, 113.0, 226.0, 307.0, 548.0, 889.0, 1470.0, 2380.0, 3844.0, 6095.0, 9493.0, 14733.0, 21815.0, 32672.0, 46886.0, 65017.0, 85910.0, 104769.0, 117724.0, 118825.0, 107915.0, 88765.0, 67956.0, 49706.0, 34555.0, 23202.0, 15506.0, 9954.0, 6350.0, 3948.0, 2611.0, 1578.0, 1042.0, 597.0, 349.0, 220.0, 149.0, 83.0, 60.0, 32.0, 13.0, 11.0, 12.0, 9.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.3857421875, -0.37247467041015625, -0.3592071533203125, -0.34593963623046875, -0.332672119140625, -0.31940460205078125, -0.3061370849609375, -0.29286956787109375, -0.27960205078125, -0.26633453369140625, -0.2530670166015625, -0.23979949951171875, -0.226531982421875, -0.21326446533203125, -0.1999969482421875, -0.18672943115234375, -0.1734619140625, -0.16019439697265625, -0.1469268798828125, -0.13365936279296875, -0.120391845703125, -0.10712432861328125, -0.0938568115234375, -0.08058929443359375, -0.06732177734375, -0.05405426025390625, -0.0407867431640625, -0.02751922607421875, -0.014251708984375, -0.00098419189453125, 0.0122833251953125, 0.02555084228515625, 0.038818359375, 0.05208587646484375, 0.0653533935546875, 0.07862091064453125, 0.091888427734375, 0.10515594482421875, 0.1184234619140625, 0.13169097900390625, 0.14495849609375, 0.15822601318359375, 0.1714935302734375, 0.18476104736328125, 0.198028564453125, 0.21129608154296875, 0.2245635986328125, 0.23783111572265625, 0.2510986328125, 0.26436614990234375, 0.2776336669921875, 0.29090118408203125, 0.304168701171875, 0.31743621826171875, 0.3307037353515625, 0.34397125244140625, 0.35723876953125, 0.37050628662109375, 0.3837738037109375, 0.39704132080078125, 0.410308837890625, 0.42357635498046875, 0.4368438720703125, 0.45011138916015625, 0.46337890625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 1.0, 4.0, 4.0, 6.0, 7.0, 7.0, 11.0, 6.0, 12.0, 13.0, 24.0, 21.0, 18.0, 22.0, 31.0, 39.0, 37.0, 31.0, 34.0, 29.0, 41.0, 34.0, 38.0, 1068.0, 52.0, 53.0, 45.0, 35.0, 35.0, 38.0, 33.0, 36.0, 27.0, 19.0, 25.0, 16.0, 12.0, 10.0, 12.0, 12.0, 7.0, 10.0, 5.0, 9.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.841796875, -2.755096435546875, -2.66839599609375, -2.581695556640625, -2.4949951171875, -2.408294677734375, -2.32159423828125, -2.234893798828125, -2.148193359375, -2.061492919921875, -1.97479248046875, -1.888092041015625, -1.8013916015625, -1.714691162109375, -1.62799072265625, -1.541290283203125, -1.45458984375, -1.367889404296875, -1.28118896484375, -1.194488525390625, -1.1077880859375, -1.021087646484375, -0.93438720703125, -0.847686767578125, -0.760986328125, -0.674285888671875, -0.58758544921875, -0.500885009765625, -0.4141845703125, -0.327484130859375, -0.24078369140625, -0.154083251953125, -0.0673828125, 0.019317626953125, 0.10601806640625, 0.192718505859375, 0.2794189453125, 0.366119384765625, 0.45281982421875, 0.539520263671875, 0.626220703125, 0.712921142578125, 0.79962158203125, 0.886322021484375, 0.9730224609375, 1.059722900390625, 1.14642333984375, 1.233123779296875, 1.31982421875, 1.406524658203125, 1.49322509765625, 1.579925537109375, 1.6666259765625, 1.753326416015625, 1.84002685546875, 1.926727294921875, 2.013427734375, 2.100128173828125, 2.18682861328125, 2.273529052734375, 2.3602294921875, 2.446929931640625, 2.53363037109375, 2.620330810546875, 2.70703125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 8.0, 10.0, 12.0, 14.0, 32.0, 43.0, 85.0, 116.0, 212.0, 251.0, 426.0, 659.0, 1028.0, 1479.0, 2328.0, 3563.0, 5347.0, 8296.0, 12638.0, 20091.0, 35434.0, 303602.0, 1591644.0, 46377.0, 22559.0, 13991.0, 9277.0, 6145.0, 3855.0, 2639.0, 1744.0, 1139.0, 710.0, 461.0, 293.0, 244.0, 116.0, 95.0, 47.0, 43.0, 24.0, 22.0, 13.0, 12.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.0126953125, -0.9838714599609375, -0.955047607421875, -0.9262237548828125, -0.89739990234375, -0.8685760498046875, -0.839752197265625, -0.8109283447265625, -0.7821044921875, -0.7532806396484375, -0.724456787109375, -0.6956329345703125, -0.66680908203125, -0.6379852294921875, -0.609161376953125, -0.5803375244140625, -0.551513671875, -0.5226898193359375, -0.493865966796875, -0.4650421142578125, -0.43621826171875, -0.4073944091796875, -0.378570556640625, -0.3497467041015625, -0.3209228515625, -0.2920989990234375, -0.263275146484375, -0.2344512939453125, -0.20562744140625, -0.1768035888671875, -0.147979736328125, -0.1191558837890625, -0.09033203125, -0.0615081787109375, -0.032684326171875, -0.0038604736328125, 0.02496337890625, 0.0537872314453125, 0.082611083984375, 0.1114349365234375, 0.1402587890625, 0.1690826416015625, 0.197906494140625, 0.2267303466796875, 0.25555419921875, 0.2843780517578125, 0.313201904296875, 0.3420257568359375, 0.370849609375, 0.3996734619140625, 0.428497314453125, 0.4573211669921875, 0.48614501953125, 0.5149688720703125, 0.543792724609375, 0.5726165771484375, 0.6014404296875, 0.6302642822265625, 0.659088134765625, 0.6879119873046875, 0.71673583984375, 0.7455596923828125, 0.774383544921875, 0.8032073974609375, 0.83203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 5.0, 5.0, 3.0, 12.0, 12.0, 19.0, 21.0, 27.0, 34.0, 54.0, 43.0, 52.0, 78.0, 83.0, 80.0, 72.0, 61.0, 71.0, 65.0, 43.0, 29.0, 29.0, 27.0, 17.0, 9.0, 16.0, 6.0, 10.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0526123046875, -0.05029869079589844, -0.047985076904296875, -0.04567146301269531, -0.04335784912109375, -0.04104423522949219, -0.038730621337890625, -0.03641700744628906, -0.0341033935546875, -0.03178977966308594, -0.029476165771484375, -0.027162551879882812, -0.02484893798828125, -0.022535324096679688, -0.020221710205078125, -0.017908096313476562, -0.015594482421875, -0.013280868530273438, -0.010967254638671875, -0.008653640747070312, -0.00634002685546875, -0.0040264129638671875, -0.001712799072265625, 0.0006008148193359375, 0.0029144287109375, 0.0052280426025390625, 0.007541656494140625, 0.009855270385742188, 0.01216888427734375, 0.014482498168945312, 0.016796112060546875, 0.019109725952148438, 0.02142333984375, 0.023736953735351562, 0.026050567626953125, 0.028364181518554688, 0.03067779541015625, 0.03299140930175781, 0.035305023193359375, 0.03761863708496094, 0.0399322509765625, 0.04224586486816406, 0.044559478759765625, 0.04687309265136719, 0.04918670654296875, 0.05150032043457031, 0.053813934326171875, 0.05612754821777344, 0.058441162109375, 0.06075477600097656, 0.06306838989257812, 0.06538200378417969, 0.06769561767578125, 0.07000923156738281, 0.07232284545898438, 0.07463645935058594, 0.0769500732421875, 0.07926368713378906, 0.08157730102539062, 0.08389091491699219, 0.08620452880859375, 0.08851814270019531, 0.09083175659179688, 0.09314537048339844, 0.095458984375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 2.0, 8.0, 13.0, 8.0, 15.0, 14.0, 30.0, 35.0, 67.0, 74.0, 109.0, 203.0, 380.0, 941.0, 156586.0, 887732.0, 1271.0, 429.0, 217.0, 116.0, 102.0, 55.0, 36.0, 32.0, 24.0, 20.0, 8.0, 4.0, 6.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.005859375, -1.9570465087890625, -1.908233642578125, -1.8594207763671875, -1.81060791015625, -1.7617950439453125, -1.712982177734375, -1.6641693115234375, -1.6153564453125, -1.5665435791015625, -1.517730712890625, -1.4689178466796875, -1.42010498046875, -1.3712921142578125, -1.322479248046875, -1.2736663818359375, -1.224853515625, -1.1760406494140625, -1.127227783203125, -1.0784149169921875, -1.02960205078125, -0.9807891845703125, -0.931976318359375, -0.8831634521484375, -0.8343505859375, -0.7855377197265625, -0.736724853515625, -0.6879119873046875, -0.63909912109375, -0.5902862548828125, -0.541473388671875, -0.4926605224609375, -0.44384765625, -0.3950347900390625, -0.346221923828125, -0.2974090576171875, -0.24859619140625, -0.1997833251953125, -0.150970458984375, -0.1021575927734375, -0.0533447265625, -0.0045318603515625, 0.044281005859375, 0.0930938720703125, 0.14190673828125, 0.1907196044921875, 0.239532470703125, 0.2883453369140625, 0.337158203125, 0.3859710693359375, 0.434783935546875, 0.4835968017578125, 0.53240966796875, 0.5812225341796875, 0.630035400390625, 0.6788482666015625, 0.7276611328125, 0.7764739990234375, 0.825286865234375, 0.8740997314453125, 0.92291259765625, 0.9717254638671875, 1.020538330078125, 1.0693511962890625, 1.1181640625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 104.0, 775.0, 127.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08783669769763947, -0.07442665100097656, -0.06101659685373306, -0.04760655015707016, -0.03419649973511696, -0.020786449313163757, -0.0073764026165008545, 0.006033651530742645, 0.019443698227405548, 0.03285374864935875, 0.04626379907131195, 0.059673845767974854, 0.07308389246463776, 0.08649394661188126, 0.09990399330854416, 0.11331404745578766, 0.12672409415245056, 0.14013414084911346, 0.15354418754577637, 0.16695424914360046, 0.18036429584026337, 0.19377434253692627, 0.20718438923358917, 0.22059443593025208, 0.23400449752807617, 0.24741454422473907, 0.260824590921402, 0.2742346525192261, 0.2876446843147278, 0.3010547459125519, 0.314464807510376, 0.3278748393058777, 0.3412849009037018, 0.3546949625015259, 0.3681049942970276, 0.3815150558948517, 0.3949250876903534, 0.4083351492881775, 0.4217451810836792, 0.4351552426815033, 0.4485653042793274, 0.4619753658771515, 0.4753853976726532, 0.4887954592704773, 0.502205491065979, 0.5156155824661255, 0.5290256142616272, 0.5424356460571289, 0.5558456778526306, 0.5692557096481323, 0.5826658010482788, 0.5960758328437805, 0.6094858646392822, 0.6228959560394287, 0.6363059878349304, 0.6497160196304321, 0.6631261110305786, 0.6765361428260803, 0.6899462342262268, 0.7033562660217285, 0.7167662978172302, 0.7301763296127319, 0.7435864210128784, 0.7569964528083801, 0.7704064846038818]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 6.0, 2.0, 5.0, 8.0, 10.0, 16.0, 15.0, 18.0, 15.0, 18.0, 24.0, 24.0, 35.0, 36.0, 41.0, 34.0, 48.0, 44.0, 26.0, 33.0, 48.0, 50.0, 31.0, 50.0, 36.0, 43.0, 37.0, 41.0, 26.0, 28.0, 25.0, 20.0, 19.0, 20.0, 17.0, 11.0, 11.0, 10.0, 1.0, 4.0, 1.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.062151432037353516, -0.06006906181573868, -0.05798669159412384, -0.055904321372509, -0.053821951150894165, -0.05173958092927933, -0.04965721070766449, -0.04757484048604965, -0.045492470264434814, -0.04341010004281998, -0.04132772982120514, -0.0392453595995903, -0.037162989377975464, -0.035080619156360626, -0.03299824893474579, -0.03091587871313095, -0.028833508491516113, -0.026751138269901276, -0.024668768048286438, -0.0225863978266716, -0.020504027605056763, -0.018421657383441925, -0.016339287161827087, -0.01425691694021225, -0.012174546718597412, -0.010092176496982574, -0.008009806275367737, -0.005927436053752899, -0.0038450658321380615, -0.0017626956105232239, 0.00031967461109161377, 0.0024020448327064514, 0.004484415054321289, 0.006566785275936127, 0.008649155497550964, 0.010731525719165802, 0.01281389594078064, 0.014896266162395477, 0.016978636384010315, 0.019061006605625153, 0.02114337682723999, 0.023225747048854828, 0.025308117270469666, 0.027390487492084503, 0.02947285771369934, 0.03155522793531418, 0.033637598156929016, 0.035719968378543854, 0.03780233860015869, 0.03988470882177353, 0.04196707904338837, 0.044049449265003204, 0.04613181948661804, 0.04821418970823288, 0.05029655992984772, 0.052378930151462555, 0.05446130037307739, 0.05654367059469223, 0.05862604081630707, 0.060708411037921906, 0.06279078125953674, 0.06487315148115158, 0.06695552170276642, 0.06903789192438126, 0.0711202621459961]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 8.0, 10.0, 12.0, 16.0, 20.0, 24.0, 23.0, 28.0, 33.0, 33.0, 35.0, 53.0, 39.0, 39.0, 62.0, 42.0, 60.0, 53.0, 44.0, 44.0, 41.0, 43.0, 33.0, 37.0, 32.0, 23.0, 29.0, 13.0, 21.0, 12.0, 9.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.11328125, -3.9764404296875, -3.839599609375, -3.7027587890625, -3.56591796875, -3.4290771484375, -3.292236328125, -3.1553955078125, -3.0185546875, -2.8817138671875, -2.744873046875, -2.6080322265625, -2.47119140625, -2.3343505859375, -2.197509765625, -2.0606689453125, -1.923828125, -1.7869873046875, -1.650146484375, -1.5133056640625, -1.37646484375, -1.2396240234375, -1.102783203125, -0.9659423828125, -0.8291015625, -0.6922607421875, -0.555419921875, -0.4185791015625, -0.28173828125, -0.1448974609375, -0.008056640625, 0.1287841796875, 0.265625, 0.4024658203125, 0.539306640625, 0.6761474609375, 0.81298828125, 0.9498291015625, 1.086669921875, 1.2235107421875, 1.3603515625, 1.4971923828125, 1.634033203125, 1.7708740234375, 1.90771484375, 2.0445556640625, 2.181396484375, 2.3182373046875, 2.455078125, 2.5919189453125, 2.728759765625, 2.8656005859375, 3.00244140625, 3.1392822265625, 3.276123046875, 3.4129638671875, 3.5498046875, 3.6866455078125, 3.823486328125, 3.9603271484375, 4.09716796875, 4.2340087890625, 4.370849609375, 4.5076904296875, 4.64453125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 9.0, 6.0, 10.0, 13.0, 21.0, 29.0, 44.0, 74.0, 117.0, 156.0, 216.0, 477.0, 931.0, 2182.0, 5612.0, 14708.0, 39445.0, 107421.0, 302605.0, 358879.0, 135496.0, 49314.0, 18462.0, 7133.0, 2705.0, 1152.0, 530.0, 292.0, 176.0, 113.0, 70.0, 49.0, 35.0, 31.0, 16.0, 8.0, 8.0, 7.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.55078125, -5.3779296875, -5.205078125, -5.0322265625, -4.859375, -4.6865234375, -4.513671875, -4.3408203125, -4.16796875, -3.9951171875, -3.822265625, -3.6494140625, -3.4765625, -3.3037109375, -3.130859375, -2.9580078125, -2.78515625, -2.6123046875, -2.439453125, -2.2666015625, -2.09375, -1.9208984375, -1.748046875, -1.5751953125, -1.40234375, -1.2294921875, -1.056640625, -0.8837890625, -0.7109375, -0.5380859375, -0.365234375, -0.1923828125, -0.01953125, 0.1533203125, 0.326171875, 0.4990234375, 0.671875, 0.8447265625, 1.017578125, 1.1904296875, 1.36328125, 1.5361328125, 1.708984375, 1.8818359375, 2.0546875, 2.2275390625, 2.400390625, 2.5732421875, 2.74609375, 2.9189453125, 3.091796875, 3.2646484375, 3.4375, 3.6103515625, 3.783203125, 3.9560546875, 4.12890625, 4.3017578125, 4.474609375, 4.6474609375, 4.8203125, 4.9931640625, 5.166015625, 5.3388671875, 5.51171875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 6.0, 6.0, 8.0, 10.0, 4.0, 10.0, 20.0, 19.0, 14.0, 21.0, 28.0, 33.0, 42.0, 61.0, 55.0, 72.0, 120.0, 199.0, 1360.0, 301.0, 181.0, 94.0, 58.0, 50.0, 36.0, 33.0, 33.0, 30.0, 20.0, 22.0, 12.0, 22.0, 11.0, 7.0, 7.0, 6.0, 8.0, 5.0, 6.0, 2.0, 8.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.7890625, -8.4952392578125, -8.201416015625, -7.9075927734375, -7.61376953125, -7.3199462890625, -7.026123046875, -6.7322998046875, -6.4384765625, -6.1446533203125, -5.850830078125, -5.5570068359375, -5.26318359375, -4.9693603515625, -4.675537109375, -4.3817138671875, -4.087890625, -3.7940673828125, -3.500244140625, -3.2064208984375, -2.91259765625, -2.6187744140625, -2.324951171875, -2.0311279296875, -1.7373046875, -1.4434814453125, -1.149658203125, -0.8558349609375, -0.56201171875, -0.2681884765625, 0.025634765625, 0.3194580078125, 0.61328125, 0.9071044921875, 1.200927734375, 1.4947509765625, 1.78857421875, 2.0823974609375, 2.376220703125, 2.6700439453125, 2.9638671875, 3.2576904296875, 3.551513671875, 3.8453369140625, 4.13916015625, 4.4329833984375, 4.726806640625, 5.0206298828125, 5.314453125, 5.6082763671875, 5.902099609375, 6.1959228515625, 6.48974609375, 6.7835693359375, 7.077392578125, 7.3712158203125, 7.6650390625, 7.9588623046875, 8.252685546875, 8.5465087890625, 8.84033203125, 9.1341552734375, 9.427978515625, 9.7218017578125, 10.015625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 6.0, 3.0, 6.0, 6.0, 13.0, 18.0, 16.0, 24.0, 27.0, 49.0, 57.0, 105.0, 152.0, 212.0, 328.0, 553.0, 999.0, 2926.0, 2408327.0, 726904.0, 2504.0, 955.0, 555.0, 303.0, 200.0, 131.0, 72.0, 68.0, 51.0, 28.0, 20.0, 20.0, 15.0, 12.0, 12.0, 4.0, 3.0, 2.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.90625, -28.001220703125, -27.09619140625, -26.191162109375, -25.2861328125, -24.381103515625, -23.47607421875, -22.571044921875, -21.666015625, -20.760986328125, -19.85595703125, -18.950927734375, -18.0458984375, -17.140869140625, -16.23583984375, -15.330810546875, -14.42578125, -13.520751953125, -12.61572265625, -11.710693359375, -10.8056640625, -9.900634765625, -8.99560546875, -8.090576171875, -7.185546875, -6.280517578125, -5.37548828125, -4.470458984375, -3.5654296875, -2.660400390625, -1.75537109375, -0.850341796875, 0.0546875, 0.959716796875, 1.86474609375, 2.769775390625, 3.6748046875, 4.579833984375, 5.48486328125, 6.389892578125, 7.294921875, 8.199951171875, 9.10498046875, 10.010009765625, 10.9150390625, 11.820068359375, 12.72509765625, 13.630126953125, 14.53515625, 15.440185546875, 16.34521484375, 17.250244140625, 18.1552734375, 19.060302734375, 19.96533203125, 20.870361328125, 21.775390625, 22.680419921875, 23.58544921875, 24.490478515625, 25.3955078125, 26.300537109375, 27.20556640625, 28.110595703125, 29.015625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 36.0, 233.0, 426.0, 265.0, 48.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.376766204833984, -45.91666030883789, -43.45655059814453, -40.99644470214844, -38.536338806152344, -36.076229095458984, -33.61612319946289, -31.156015396118164, -28.695907592773438, -26.23579978942871, -23.775691986083984, -21.31558609008789, -18.855478286743164, -16.395370483398438, -13.935263633728027, -11.475156784057617, -9.01504898071289, -6.554941654205322, -4.094834327697754, -1.6347270011901855, 0.8253803253173828, 3.2854881286621094, 5.7455949783325195, 8.20570182800293, 10.665809631347656, 13.125917434692383, 15.586024284362793, 18.046131134033203, 20.50623893737793, 22.966346740722656, 25.42645263671875, 27.886560440063477, 30.34667205810547, 32.80677795410156, 35.26688766479492, 37.726993560791016, 40.187103271484375, 42.64720916748047, 45.10731506347656, 47.567420959472656, 50.027530670166016, 52.48763656616211, 54.94774627685547, 57.40785217285156, 59.867958068847656, 62.328067779541016, 64.78817749023438, 67.24828338623047, 69.70838928222656, 72.16849517822266, 74.62860107421875, 77.08871459960938, 79.54882049560547, 82.00892639160156, 84.46903228759766, 86.92913818359375, 89.38925170898438, 91.84935760498047, 94.30946350097656, 96.76957702636719, 99.22968292236328, 101.68978881835938, 104.14989471435547, 106.61000061035156, 109.07010650634766]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 7.0, 4.0, 15.0, 10.0, 17.0, 19.0, 19.0, 28.0, 26.0, 32.0, 35.0, 44.0, 33.0, 40.0, 30.0, 41.0, 38.0, 41.0, 44.0, 35.0, 49.0, 35.0, 27.0, 44.0, 39.0, 34.0, 33.0, 24.0, 31.0, 15.0, 15.0, 26.0, 11.0, 16.0, 5.0, 9.0, 6.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.178943634033203, -28.336078643798828, -27.49321174621582, -26.650346755981445, -25.80748176574707, -24.964614868164062, -24.121749877929688, -23.278884887695312, -22.436019897460938, -21.593154907226562, -20.750288009643555, -19.90742301940918, -19.064558029174805, -18.221691131591797, -17.378826141357422, -16.535961151123047, -15.693095207214355, -14.850229263305664, -14.007364273071289, -13.164498329162598, -12.321633338928223, -11.478767395019531, -10.635902404785156, -9.793036460876465, -8.950170516967773, -8.107304573059082, -7.264439582824707, -6.421573638916016, -5.578708648681641, -4.735842704772949, -3.892977237701416, -3.050111770629883, -2.207246780395508, -1.3643813133239746, -0.5215157270431519, 0.3213498592376709, 1.164215326309204, 2.0070810317993164, 2.8499464988708496, 3.692811965942383, 4.535677433013916, 5.378542900085449, 6.221408367156982, 7.064273834228516, 7.907139778137207, 8.750005722045898, 9.592870712280273, 10.435735702514648, 11.27860164642334, 12.121467590332031, 12.964332580566406, 13.807198524475098, 14.650063514709473, 15.492929458618164, 16.33579444885254, 17.178661346435547, 18.021526336669922, 18.864391326904297, 19.707258224487305, 20.55012321472168, 21.392988204956055, 22.235855102539062, 23.078720092773438, 23.921585083007812, 24.764450073242188]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 9.0, 3.0, 7.0, 6.0, 9.0, 10.0, 12.0, 9.0, 17.0, 24.0, 13.0, 25.0, 29.0, 30.0, 41.0, 30.0, 33.0, 36.0, 50.0, 49.0, 48.0, 43.0, 66.0, 44.0, 41.0, 46.0, 44.0, 39.0, 31.0, 19.0, 26.0, 16.0, 15.0, 14.0, 20.0, 14.0, 8.0, 9.0, 10.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.935546875, -3.808929443359375, -3.68231201171875, -3.555694580078125, -3.4290771484375, -3.302459716796875, -3.17584228515625, -3.049224853515625, -2.922607421875, -2.795989990234375, -2.66937255859375, -2.542755126953125, -2.4161376953125, -2.289520263671875, -2.16290283203125, -2.036285400390625, -1.90966796875, -1.783050537109375, -1.65643310546875, -1.529815673828125, -1.4031982421875, -1.276580810546875, -1.14996337890625, -1.023345947265625, -0.896728515625, -0.770111083984375, -0.64349365234375, -0.516876220703125, -0.3902587890625, -0.263641357421875, -0.13702392578125, -0.010406494140625, 0.1162109375, 0.242828369140625, 0.36944580078125, 0.496063232421875, 0.6226806640625, 0.749298095703125, 0.87591552734375, 1.002532958984375, 1.129150390625, 1.255767822265625, 1.38238525390625, 1.509002685546875, 1.6356201171875, 1.762237548828125, 1.88885498046875, 2.015472412109375, 2.14208984375, 2.268707275390625, 2.39532470703125, 2.521942138671875, 2.6485595703125, 2.775177001953125, 2.90179443359375, 3.028411865234375, 3.155029296875, 3.281646728515625, 3.40826416015625, 3.534881591796875, 3.6614990234375, 3.788116455078125, 3.91473388671875, 4.041351318359375, 4.16796875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 6.0, 13.0, 21.0, 20.0, 41.0, 64.0, 127.0, 230.0, 543.0, 1565.0, 5501.0, 30526.0, 329078.0, 2411849.0, 1272577.0, 122631.0, 14516.0, 3097.0, 1032.0, 394.0, 197.0, 82.0, 58.0, 41.0, 30.0, 10.0, 7.0, 6.0, 6.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.97265625, -7.68585205078125, -7.3990478515625, -7.11224365234375, -6.825439453125, -6.53863525390625, -6.2518310546875, -5.96502685546875, -5.67822265625, -5.39141845703125, -5.1046142578125, -4.81781005859375, -4.531005859375, -4.24420166015625, -3.9573974609375, -3.67059326171875, -3.3837890625, -3.09698486328125, -2.8101806640625, -2.52337646484375, -2.236572265625, -1.94976806640625, -1.6629638671875, -1.37615966796875, -1.08935546875, -0.80255126953125, -0.5157470703125, -0.22894287109375, 0.057861328125, 0.34466552734375, 0.6314697265625, 0.91827392578125, 1.205078125, 1.49188232421875, 1.7786865234375, 2.06549072265625, 2.352294921875, 2.63909912109375, 2.9259033203125, 3.21270751953125, 3.49951171875, 3.78631591796875, 4.0731201171875, 4.35992431640625, 4.646728515625, 4.93353271484375, 5.2203369140625, 5.50714111328125, 5.7939453125, 6.08074951171875, 6.3675537109375, 6.65435791015625, 6.941162109375, 7.22796630859375, 7.5147705078125, 7.80157470703125, 8.08837890625, 8.37518310546875, 8.6619873046875, 8.94879150390625, 9.235595703125, 9.52239990234375, 9.8092041015625, 10.09600830078125, 10.3828125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 8.0, 3.0, 12.0, 14.0, 17.0, 27.0, 31.0, 50.0, 50.0, 65.0, 81.0, 126.0, 139.0, 163.0, 261.0, 343.0, 412.0, 463.0, 379.0, 332.0, 250.0, 174.0, 139.0, 117.0, 82.0, 69.0, 62.0, 43.0, 40.0, 30.0, 25.0, 17.0, 14.0, 9.0, 7.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.69140625, -4.5205078125, -4.349609375, -4.1787109375, -4.0078125, -3.8369140625, -3.666015625, -3.4951171875, -3.32421875, -3.1533203125, -2.982421875, -2.8115234375, -2.640625, -2.4697265625, -2.298828125, -2.1279296875, -1.95703125, -1.7861328125, -1.615234375, -1.4443359375, -1.2734375, -1.1025390625, -0.931640625, -0.7607421875, -0.58984375, -0.4189453125, -0.248046875, -0.0771484375, 0.09375, 0.2646484375, 0.435546875, 0.6064453125, 0.77734375, 0.9482421875, 1.119140625, 1.2900390625, 1.4609375, 1.6318359375, 1.802734375, 1.9736328125, 2.14453125, 2.3154296875, 2.486328125, 2.6572265625, 2.828125, 2.9990234375, 3.169921875, 3.3408203125, 3.51171875, 3.6826171875, 3.853515625, 4.0244140625, 4.1953125, 4.3662109375, 4.537109375, 4.7080078125, 4.87890625, 5.0498046875, 5.220703125, 5.3916015625, 5.5625, 5.7333984375, 5.904296875, 6.0751953125, 6.24609375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 5.0, 4.0, 8.0, 7.0, 12.0, 33.0, 80.0, 272.0, 1125.0, 11205.0, 3589523.0, 587364.0, 3700.0, 617.0, 220.0, 56.0, 29.0, 14.0, 6.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.375, -31.4453125, -30.515625, -29.5859375, -28.65625, -27.7265625, -26.796875, -25.8671875, -24.9375, -24.0078125, -23.078125, -22.1484375, -21.21875, -20.2890625, -19.359375, -18.4296875, -17.5, -16.5703125, -15.640625, -14.7109375, -13.78125, -12.8515625, -11.921875, -10.9921875, -10.0625, -9.1328125, -8.203125, -7.2734375, -6.34375, -5.4140625, -4.484375, -3.5546875, -2.625, -1.6953125, -0.765625, 0.1640625, 1.09375, 2.0234375, 2.953125, 3.8828125, 4.8125, 5.7421875, 6.671875, 7.6015625, 8.53125, 9.4609375, 10.390625, 11.3203125, 12.25, 13.1796875, 14.109375, 15.0390625, 15.96875, 16.8984375, 17.828125, 18.7578125, 19.6875, 20.6171875, 21.546875, 22.4765625, 23.40625, 24.3359375, 25.265625, 26.1953125, 27.125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 33.0, 781.0, 199.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-368.15032958984375, -359.9121398925781, -351.6739196777344, -343.43572998046875, -335.1975402832031, -326.9593505859375, -318.72113037109375, -310.4829406738281, -302.2447509765625, -294.0065612792969, -285.7683410644531, -277.5301513671875, -269.2919616699219, -261.05377197265625, -252.8155517578125, -244.57736206054688, -236.33914184570312, -228.10093688964844, -219.8627471923828, -211.62454223632812, -203.3863525390625, -195.1481475830078, -186.90994262695312, -178.6717529296875, -170.4335479736328, -162.19534301757812, -153.9571533203125, -145.7189483642578, -137.48074340820312, -129.2425537109375, -121.00434875488281, -112.76615142822266, -104.52793884277344, -96.28974151611328, -88.05154418945312, -79.81333923339844, -71.57514190673828, -63.336944580078125, -55.0987434387207, -46.86054229736328, -38.622344970703125, -30.384145736694336, -22.145946502685547, -13.907747268676758, -5.669548034667969, 2.5686492919921875, 10.80685043334961, 19.04505157470703, 27.283248901367188, 35.521446228027344, 43.759647369384766, 51.99784851074219, 60.236045837402344, 68.4742431640625, 76.71244812011719, 84.95064544677734, 93.1888427734375, 101.42704010009766, 109.66523742675781, 117.9034423828125, 126.14163970947266, 134.3798370361328, 142.6180419921875, 150.85623168945312, 159.0944366455078]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 3.0, 6.0, 3.0, 11.0, 8.0, 6.0, 14.0, 15.0, 9.0, 21.0, 19.0, 23.0, 29.0, 28.0, 31.0, 38.0, 44.0, 33.0, 35.0, 41.0, 36.0, 37.0, 38.0, 37.0, 29.0, 34.0, 29.0, 39.0, 36.0, 35.0, 21.0, 27.0, 20.0, 18.0, 23.0, 17.0, 31.0, 16.0, 9.0, 12.0, 4.0, 8.0, 12.0, 4.0, 4.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-20.639530181884766, -19.99694061279297, -19.354352951049805, -18.711763381958008, -18.069175720214844, -17.426586151123047, -16.78399658203125, -16.141408920288086, -15.498819351196289, -14.856230735778809, -14.213642120361328, -13.571052551269531, -12.92846393585205, -12.28587532043457, -11.64328670501709, -11.00069808959961, -10.358109474182129, -9.715520858764648, -9.072932243347168, -8.430343627929688, -7.787754058837891, -7.14516544342041, -6.50257682800293, -5.859987735748291, -5.2173991203308105, -4.57481050491333, -3.9322214126586914, -3.289632797241211, -2.6470439434051514, -2.004455089569092, -1.3618664741516113, -0.7192773818969727, -0.07668876647949219, 0.5659000277519226, 1.2084888219833374, 1.8510775566101074, 2.493666410446167, 3.1362552642822266, 3.778843879699707, 4.421432971954346, 5.064021587371826, 5.706610202789307, 6.349199295043945, 6.991787910461426, 7.634376525878906, 8.276966094970703, 8.919553756713867, 9.562143325805664, 10.204731941223145, 10.847320556640625, 11.489909172058105, 12.132497787475586, 12.775087356567383, 13.417675971984863, 14.060264587402344, 14.70285415649414, 15.345441818237305, 15.988030433654785, 16.630619049072266, 17.273208618164062, 17.915796279907227, 18.558385848999023, 19.200973510742188, 19.843563079833984, 20.48615264892578]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 7.0, 7.0, 8.0, 11.0, 7.0, 18.0, 15.0, 26.0, 28.0, 17.0, 40.0, 43.0, 40.0, 43.0, 47.0, 67.0, 60.0, 43.0, 60.0, 52.0, 52.0, 39.0, 43.0, 40.0, 42.0, 30.0, 27.0, 24.0, 15.0, 19.0, 12.0, 11.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.967620849609375, -3.84539794921875, -3.723175048828125, -3.6009521484375, -3.478729248046875, -3.35650634765625, -3.234283447265625, -3.112060546875, -2.989837646484375, -2.86761474609375, -2.745391845703125, -2.6231689453125, -2.500946044921875, -2.37872314453125, -2.256500244140625, -2.13427734375, -2.012054443359375, -1.88983154296875, -1.767608642578125, -1.6453857421875, -1.523162841796875, -1.40093994140625, -1.278717041015625, -1.156494140625, -1.034271240234375, -0.91204833984375, -0.789825439453125, -0.6676025390625, -0.545379638671875, -0.42315673828125, -0.300933837890625, -0.1787109375, -0.056488037109375, 0.06573486328125, 0.187957763671875, 0.3101806640625, 0.432403564453125, 0.55462646484375, 0.676849365234375, 0.799072265625, 0.921295166015625, 1.04351806640625, 1.165740966796875, 1.2879638671875, 1.410186767578125, 1.53240966796875, 1.654632568359375, 1.77685546875, 1.899078369140625, 2.02130126953125, 2.143524169921875, 2.2657470703125, 2.387969970703125, 2.51019287109375, 2.632415771484375, 2.754638671875, 2.876861572265625, 2.99908447265625, 3.121307373046875, 3.2435302734375, 3.365753173828125, 3.48797607421875, 3.610198974609375, 3.732421875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 3.0, 11.0, 10.0, 25.0, 33.0, 68.0, 102.0, 193.0, 281.0, 551.0, 988.0, 1783.0, 3192.0, 5563.0, 9380.0, 16009.0, 26696.0, 42385.0, 65052.0, 92650.0, 122994.0, 142697.0, 141452.0, 120480.0, 90140.0, 62646.0, 40996.0, 25336.0, 15377.0, 9230.0, 5376.0, 3028.0, 1657.0, 985.0, 527.0, 272.0, 148.0, 103.0, 50.0, 30.0, 21.0, 8.0, 13.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.446044921875, -0.4332847595214844, -0.42052459716796875, -0.4077644348144531, -0.3950042724609375, -0.3822441101074219, -0.36948394775390625, -0.3567237854003906, -0.343963623046875, -0.3312034606933594, -0.31844329833984375, -0.3056831359863281, -0.2929229736328125, -0.2801628112792969, -0.26740264892578125, -0.2546424865722656, -0.24188232421875, -0.22912216186523438, -0.21636199951171875, -0.20360183715820312, -0.1908416748046875, -0.17808151245117188, -0.16532135009765625, -0.15256118774414062, -0.139801025390625, -0.12704086303710938, -0.11428070068359375, -0.10152053833007812, -0.0887603759765625, -0.07600021362304688, -0.06324005126953125, -0.050479888916015625, -0.0377197265625, -0.024959564208984375, -0.01219940185546875, 0.000560760498046875, 0.0133209228515625, 0.026081085205078125, 0.03884124755859375, 0.051601409912109375, 0.064361572265625, 0.07712173461914062, 0.08988189697265625, 0.10264205932617188, 0.1154022216796875, 0.12816238403320312, 0.14092254638671875, 0.15368270874023438, 0.16644287109375, 0.17920303344726562, 0.19196319580078125, 0.20472335815429688, 0.2174835205078125, 0.23024368286132812, 0.24300384521484375, 0.2557640075683594, 0.268524169921875, 0.2812843322753906, 0.29404449462890625, 0.3068046569824219, 0.3195648193359375, 0.3323249816894531, 0.34508514404296875, 0.3578453063964844, 0.37060546875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 3.0, 1.0, 1.0, 6.0, 4.0, 1.0, 5.0, 15.0, 11.0, 10.0, 9.0, 14.0, 12.0, 23.0, 18.0, 28.0, 27.0, 27.0, 31.0, 39.0, 28.0, 37.0, 36.0, 33.0, 45.0, 34.0, 1081.0, 36.0, 38.0, 28.0, 39.0, 41.0, 34.0, 27.0, 28.0, 23.0, 14.0, 20.0, 24.0, 21.0, 9.0, 16.0, 9.0, 10.0, 4.0, 6.0, 8.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-2.458984375, -2.3887939453125, -2.318603515625, -2.2484130859375, -2.17822265625, -2.1080322265625, -2.037841796875, -1.9676513671875, -1.8974609375, -1.8272705078125, -1.757080078125, -1.6868896484375, -1.61669921875, -1.5465087890625, -1.476318359375, -1.4061279296875, -1.3359375, -1.2657470703125, -1.195556640625, -1.1253662109375, -1.05517578125, -0.9849853515625, -0.914794921875, -0.8446044921875, -0.7744140625, -0.7042236328125, -0.634033203125, -0.5638427734375, -0.49365234375, -0.4234619140625, -0.353271484375, -0.2830810546875, -0.212890625, -0.1427001953125, -0.072509765625, -0.0023193359375, 0.06787109375, 0.1380615234375, 0.208251953125, 0.2784423828125, 0.3486328125, 0.4188232421875, 0.489013671875, 0.5592041015625, 0.62939453125, 0.6995849609375, 0.769775390625, 0.8399658203125, 0.91015625, 0.9803466796875, 1.050537109375, 1.1207275390625, 1.19091796875, 1.2611083984375, 1.331298828125, 1.4014892578125, 1.4716796875, 1.5418701171875, 1.612060546875, 1.6822509765625, 1.75244140625, 1.8226318359375, 1.892822265625, 1.9630126953125, 2.033203125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 6.0, 9.0, 4.0, 18.0, 32.0, 49.0, 57.0, 74.0, 130.0, 184.0, 264.0, 355.0, 485.0, 640.0, 947.0, 1361.0, 1912.0, 2714.0, 3759.0, 5235.0, 7562.0, 10944.0, 15963.0, 24559.0, 53331.0, 1514582.0, 342472.0, 39927.0, 21783.0, 14207.0, 9850.0, 6865.0, 5030.0, 3379.0, 2466.0, 1825.0, 1211.0, 866.0, 563.0, 461.0, 317.0, 219.0, 144.0, 106.0, 87.0, 67.0, 36.0, 25.0, 14.0, 10.0, 9.0, 10.0, 6.0, 5.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.62158203125, -0.602081298828125, -0.58258056640625, -0.563079833984375, -0.5435791015625, -0.524078369140625, -0.50457763671875, -0.485076904296875, -0.465576171875, -0.446075439453125, -0.42657470703125, -0.407073974609375, -0.3875732421875, -0.368072509765625, -0.34857177734375, -0.329071044921875, -0.3095703125, -0.290069580078125, -0.27056884765625, -0.251068115234375, -0.2315673828125, -0.212066650390625, -0.19256591796875, -0.173065185546875, -0.153564453125, -0.134063720703125, -0.11456298828125, -0.095062255859375, -0.0755615234375, -0.056060791015625, -0.03656005859375, -0.017059326171875, 0.00244140625, 0.021942138671875, 0.04144287109375, 0.060943603515625, 0.0804443359375, 0.099945068359375, 0.11944580078125, 0.138946533203125, 0.158447265625, 0.177947998046875, 0.19744873046875, 0.216949462890625, 0.2364501953125, 0.255950927734375, 0.27545166015625, 0.294952392578125, 0.314453125, 0.333953857421875, 0.35345458984375, 0.372955322265625, 0.3924560546875, 0.411956787109375, 0.43145751953125, 0.450958251953125, 0.470458984375, 0.489959716796875, 0.50946044921875, 0.528961181640625, 0.5484619140625, 0.567962646484375, 0.58746337890625, 0.606964111328125, 0.62646484375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 7.0, 12.0, 5.0, 10.0, 16.0, 31.0, 38.0, 39.0, 54.0, 70.0, 65.0, 94.0, 107.0, 75.0, 78.0, 77.0, 48.0, 50.0, 32.0, 32.0, 20.0, 6.0, 12.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0806884765625, -0.07814311981201172, -0.07559776306152344, -0.07305240631103516, -0.07050704956054688, -0.0679616928100586, -0.06541633605957031, -0.06287097930908203, -0.06032562255859375, -0.05778026580810547, -0.05523490905761719, -0.052689552307128906, -0.050144195556640625, -0.047598838806152344, -0.04505348205566406, -0.04250812530517578, -0.0399627685546875, -0.03741741180419922, -0.03487205505371094, -0.032326698303222656, -0.029781341552734375, -0.027235984802246094, -0.024690628051757812, -0.02214527130126953, -0.01959991455078125, -0.01705455780029297, -0.014509201049804688, -0.011963844299316406, -0.009418487548828125, -0.006873130798339844, -0.0043277740478515625, -0.0017824172973632812, 0.000762939453125, 0.0033082962036132812, 0.0058536529541015625, 0.008399009704589844, 0.010944366455078125, 0.013489723205566406, 0.016035079956054688, 0.01858043670654297, 0.02112579345703125, 0.02367115020751953, 0.026216506958007812, 0.028761863708496094, 0.031307220458984375, 0.033852577209472656, 0.03639793395996094, 0.03894329071044922, 0.0414886474609375, 0.04403400421142578, 0.04657936096191406, 0.049124717712402344, 0.051670074462890625, 0.054215431213378906, 0.05676078796386719, 0.05930614471435547, 0.06185150146484375, 0.06439685821533203, 0.06694221496582031, 0.0694875717163086, 0.07203292846679688, 0.07457828521728516, 0.07712364196777344, 0.07966899871826172, 0.08221435546875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 1.0, 6.0, 10.0, 13.0, 22.0, 18.0, 39.0, 51.0, 79.0, 140.0, 239.0, 426.0, 1186.0, 1008513.0, 36096.0, 816.0, 340.0, 197.0, 114.0, 87.0, 57.0, 39.0, 17.0, 14.0, 9.0, 9.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6513671875, -1.5995025634765625, -1.547637939453125, -1.4957733154296875, -1.44390869140625, -1.3920440673828125, -1.340179443359375, -1.2883148193359375, -1.2364501953125, -1.1845855712890625, -1.132720947265625, -1.0808563232421875, -1.02899169921875, -0.9771270751953125, -0.925262451171875, -0.8733978271484375, -0.821533203125, -0.7696685791015625, -0.717803955078125, -0.6659393310546875, -0.61407470703125, -0.5622100830078125, -0.510345458984375, -0.4584808349609375, -0.4066162109375, -0.3547515869140625, -0.302886962890625, -0.2510223388671875, -0.19915771484375, -0.1472930908203125, -0.095428466796875, -0.0435638427734375, 0.00830078125, 0.0601654052734375, 0.112030029296875, 0.1638946533203125, 0.21575927734375, 0.2676239013671875, 0.319488525390625, 0.3713531494140625, 0.4232177734375, 0.4750823974609375, 0.526947021484375, 0.5788116455078125, 0.63067626953125, 0.6825408935546875, 0.734405517578125, 0.7862701416015625, 0.838134765625, 0.8899993896484375, 0.941864013671875, 0.9937286376953125, 1.04559326171875, 1.0974578857421875, 1.149322509765625, 1.2011871337890625, 1.2530517578125, 1.3049163818359375, 1.356781005859375, 1.4086456298828125, 1.46051025390625, 1.5123748779296875, 1.564239501953125, 1.6161041259765625, 1.66796875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 74.0, 935.0, 8.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15605765581130981, -0.13125838339328766, -0.1064591184258461, -0.08165985345840454, -0.056860581040382385, -0.03206130862236023, -0.007262051105499268, 0.017537221312522888, 0.042336493730545044, 0.0671357661485672, 0.09193503111600876, 0.11673429608345032, 0.14153356850147247, 0.16633284091949463, 0.1911320984363556, 0.21593137085437775, 0.2407306432723999, 0.26552990078926086, 0.2903291881084442, 0.3151284456253052, 0.3399277329444885, 0.3647269904613495, 0.38952624797821045, 0.4143255352973938, 0.43912479281425476, 0.4639240503311157, 0.4887233376502991, 0.5135226249694824, 0.538321852684021, 0.5631211400032043, 0.5879204273223877, 0.6127196550369263, 0.6375188827514648, 0.6623181700706482, 0.6871173977851868, 0.7119166851043701, 0.7367159724235535, 0.7615152597427368, 0.7863144874572754, 0.8111137747764587, 0.8359130620956421, 0.8607123494148254, 0.885511577129364, 0.9103108644485474, 0.9351101517677307, 0.9599094390869141, 0.9847086668014526, 1.0095078945159912, 1.0343072414398193, 1.059106469154358, 1.083905816078186, 1.1087050437927246, 1.1335042715072632, 1.1583036184310913, 1.1831028461456299, 1.2079020738601685, 1.232701301574707, 1.2575005292892456, 1.2822998762130737, 1.3070991039276123, 1.3318983316421509, 1.356697678565979, 1.3814969062805176, 1.4062961339950562, 1.4310954809188843]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 10.0, 10.0, 16.0, 19.0, 19.0, 26.0, 34.0, 37.0, 46.0, 57.0, 63.0, 49.0, 64.0, 54.0, 52.0, 76.0, 50.0, 49.0, 53.0, 50.0, 38.0, 35.0, 29.0, 20.0, 23.0, 6.0, 5.0, 2.0, 6.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10929155349731445, -0.10621154308319092, -0.10313153266906738, -0.10005152970552444, -0.09697151929140091, -0.09389150887727737, -0.09081150591373444, -0.0877314954996109, -0.08465148508548737, -0.08157147467136383, -0.0784914642572403, -0.07541146129369736, -0.07233145087957382, -0.06925144046545029, -0.06617143750190735, -0.06309142708778381, -0.06001141667366028, -0.05693140625953674, -0.053851399570703506, -0.05077139288187027, -0.047691382467746735, -0.0446113720536232, -0.04153136536478996, -0.038451358675956726, -0.03537134826183319, -0.032291337847709656, -0.02921133115887642, -0.026131322607398033, -0.023051314055919647, -0.01997130550444126, -0.016891296952962875, -0.01381128840148449, -0.010731279850006104, -0.007651271298527718, -0.004571262747049332, -0.0014912541955709457, 0.0015887543559074402, 0.004668762907385826, 0.007748771458864212, 0.010828780010342598, 0.013908788561820984, 0.01698879711329937, 0.020068805664777756, 0.02314881421625614, 0.026228822767734528, 0.029308831319212914, 0.0323888398706913, 0.035468846559524536, 0.03854885697364807, 0.041628867387771606, 0.04470887407660484, 0.04778888076543808, 0.050868891179561615, 0.05394890159368515, 0.05702890828251839, 0.060108914971351624, 0.06318892538547516, 0.0662689357995987, 0.06934894621372223, 0.07242894917726517, 0.0755089595913887, 0.07858897000551224, 0.08166897296905518, 0.08474898338317871, 0.08782899379730225]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 3.0, 2.0, 9.0, 6.0, 16.0, 7.0, 13.0, 23.0, 24.0, 27.0, 19.0, 38.0, 32.0, 35.0, 38.0, 42.0, 36.0, 51.0, 44.0, 50.0, 49.0, 48.0, 42.0, 39.0, 33.0, 42.0, 36.0, 33.0, 25.0, 23.0, 28.0, 21.0, 13.0, 12.0, 12.0, 7.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.169921875, -3.06549072265625, -2.9610595703125, -2.85662841796875, -2.752197265625, -2.64776611328125, -2.5433349609375, -2.43890380859375, -2.33447265625, -2.23004150390625, -2.1256103515625, -2.02117919921875, -1.916748046875, -1.81231689453125, -1.7078857421875, -1.60345458984375, -1.4990234375, -1.39459228515625, -1.2901611328125, -1.18572998046875, -1.081298828125, -0.97686767578125, -0.8724365234375, -0.76800537109375, -0.66357421875, -0.55914306640625, -0.4547119140625, -0.35028076171875, -0.245849609375, -0.14141845703125, -0.0369873046875, 0.06744384765625, 0.171875, 0.27630615234375, 0.3807373046875, 0.48516845703125, 0.589599609375, 0.69403076171875, 0.7984619140625, 0.90289306640625, 1.00732421875, 1.11175537109375, 1.2161865234375, 1.32061767578125, 1.425048828125, 1.52947998046875, 1.6339111328125, 1.73834228515625, 1.8427734375, 1.94720458984375, 2.0516357421875, 2.15606689453125, 2.260498046875, 2.36492919921875, 2.4693603515625, 2.57379150390625, 2.67822265625, 2.78265380859375, 2.8870849609375, 2.99151611328125, 3.095947265625, 3.20037841796875, 3.3048095703125, 3.40924072265625, 3.513671875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 5.0, 7.0, 6.0, 8.0, 11.0, 8.0, 18.0, 20.0, 40.0, 62.0, 83.0, 112.0, 171.0, 288.0, 437.0, 675.0, 1139.0, 2435.0, 5846.0, 15346.0, 43951.0, 147145.0, 512049.0, 223617.0, 60451.0, 20503.0, 7505.0, 3069.0, 1425.0, 763.0, 456.0, 278.0, 210.0, 141.0, 96.0, 53.0, 34.0, 28.0, 22.0, 17.0, 9.0, 9.0, 11.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46484375, -4.2972412109375, -4.129638671875, -3.9620361328125, -3.79443359375, -3.6268310546875, -3.459228515625, -3.2916259765625, -3.1240234375, -2.9564208984375, -2.788818359375, -2.6212158203125, -2.45361328125, -2.2860107421875, -2.118408203125, -1.9508056640625, -1.783203125, -1.6156005859375, -1.447998046875, -1.2803955078125, -1.11279296875, -0.9451904296875, -0.777587890625, -0.6099853515625, -0.4423828125, -0.2747802734375, -0.107177734375, 0.0604248046875, 0.22802734375, 0.3956298828125, 0.563232421875, 0.7308349609375, 0.8984375, 1.0660400390625, 1.233642578125, 1.4012451171875, 1.56884765625, 1.7364501953125, 1.904052734375, 2.0716552734375, 2.2392578125, 2.4068603515625, 2.574462890625, 2.7420654296875, 2.90966796875, 3.0772705078125, 3.244873046875, 3.4124755859375, 3.580078125, 3.7476806640625, 3.915283203125, 4.0828857421875, 4.25048828125, 4.4180908203125, 4.585693359375, 4.7532958984375, 4.9208984375, 5.0885009765625, 5.256103515625, 5.4237060546875, 5.59130859375, 5.7589111328125, 5.926513671875, 6.0941162109375, 6.26171875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 4.0, 6.0, 10.0, 15.0, 13.0, 21.0, 26.0, 22.0, 19.0, 36.0, 34.0, 44.0, 60.0, 71.0, 112.0, 197.0, 1412.0, 316.0, 160.0, 93.0, 74.0, 38.0, 42.0, 35.0, 25.0, 25.0, 17.0, 17.0, 29.0, 9.0, 11.0, 12.0, 10.0, 8.0, 6.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.8046875, -8.54412841796875, -8.2835693359375, -8.02301025390625, -7.762451171875, -7.50189208984375, -7.2413330078125, -6.98077392578125, -6.72021484375, -6.45965576171875, -6.1990966796875, -5.93853759765625, -5.677978515625, -5.41741943359375, -5.1568603515625, -4.89630126953125, -4.6357421875, -4.37518310546875, -4.1146240234375, -3.85406494140625, -3.593505859375, -3.33294677734375, -3.0723876953125, -2.81182861328125, -2.55126953125, -2.29071044921875, -2.0301513671875, -1.76959228515625, -1.509033203125, -1.24847412109375, -0.9879150390625, -0.72735595703125, -0.466796875, -0.20623779296875, 0.0543212890625, 0.31488037109375, 0.575439453125, 0.83599853515625, 1.0965576171875, 1.35711669921875, 1.61767578125, 1.87823486328125, 2.1387939453125, 2.39935302734375, 2.659912109375, 2.92047119140625, 3.1810302734375, 3.44158935546875, 3.7021484375, 3.96270751953125, 4.2232666015625, 4.48382568359375, 4.744384765625, 5.00494384765625, 5.2655029296875, 5.52606201171875, 5.78662109375, 6.04718017578125, 6.3077392578125, 6.56829833984375, 6.828857421875, 7.08941650390625, 7.3499755859375, 7.61053466796875, 7.87109375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 6.0, 8.0, 12.0, 18.0, 18.0, 20.0, 31.0, 37.0, 37.0, 68.0, 83.0, 143.0, 183.0, 259.0, 394.0, 651.0, 1366.0, 6115.0, 2962886.0, 167912.0, 2864.0, 998.0, 516.0, 305.0, 218.0, 144.0, 85.0, 68.0, 67.0, 37.0, 32.0, 29.0, 16.0, 14.0, 16.0, 5.0, 12.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-23.859375, -23.193115234375, -22.52685546875, -21.860595703125, -21.1943359375, -20.528076171875, -19.86181640625, -19.195556640625, -18.529296875, -17.863037109375, -17.19677734375, -16.530517578125, -15.8642578125, -15.197998046875, -14.53173828125, -13.865478515625, -13.19921875, -12.532958984375, -11.86669921875, -11.200439453125, -10.5341796875, -9.867919921875, -9.20166015625, -8.535400390625, -7.869140625, -7.202880859375, -6.53662109375, -5.870361328125, -5.2041015625, -4.537841796875, -3.87158203125, -3.205322265625, -2.5390625, -1.872802734375, -1.20654296875, -0.540283203125, 0.1259765625, 0.792236328125, 1.45849609375, 2.124755859375, 2.791015625, 3.457275390625, 4.12353515625, 4.789794921875, 5.4560546875, 6.122314453125, 6.78857421875, 7.454833984375, 8.12109375, 8.787353515625, 9.45361328125, 10.119873046875, 10.7861328125, 11.452392578125, 12.11865234375, 12.784912109375, 13.451171875, 14.117431640625, 14.78369140625, 15.449951171875, 16.1162109375, 16.782470703125, 17.44873046875, 18.114990234375, 18.78125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 4.0, 155.0, 627.0, 219.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.983757019042969, -9.33194637298584, -5.680135726928711, -2.028325080871582, 1.6234855651855469, 5.275295257568359, 8.927106857299805, 12.57891845703125, 16.230728149414062, 19.882537841796875, 23.53434944152832, 27.186161041259766, 30.837970733642578, 34.48978042602539, 38.14159393310547, 41.79340362548828, 45.445213317871094, 49.097023010253906, 52.74883270263672, 56.4006462097168, 60.05245590209961, 63.70426559448242, 67.3560791015625, 71.00788879394531, 74.65969848632812, 78.31150817871094, 81.96331787109375, 85.61512756347656, 89.26693725585938, 92.91874694824219, 96.57056427001953, 100.22237396240234, 103.87419128417969, 107.5260009765625, 111.17781066894531, 114.82962036132812, 118.48143005371094, 122.13323974609375, 125.7850570678711, 129.43685913085938, 133.08868408203125, 136.74049377441406, 140.39230346679688, 144.0441131591797, 147.6959228515625, 151.3477325439453, 154.99954223632812, 158.6513671875, 162.30316162109375, 165.95497131347656, 169.60678100585938, 173.2585906982422, 176.910400390625, 180.5622100830078, 184.21401977539062, 187.8658447265625, 191.51763916015625, 195.16944885253906, 198.82125854492188, 202.4730682373047, 206.1248779296875, 209.7766876220703, 213.42849731445312, 217.080322265625, 220.7321319580078]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 8.0, 6.0, 13.0, 12.0, 12.0, 16.0, 26.0, 19.0, 22.0, 28.0, 35.0, 38.0, 42.0, 47.0, 44.0, 48.0, 49.0, 51.0, 43.0, 52.0, 56.0, 36.0, 45.0, 29.0, 30.0, 33.0, 35.0, 17.0, 23.0, 20.0, 11.0, 8.0, 10.0, 7.0, 5.0, 6.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-31.48773193359375, -30.65091323852539, -29.8140926361084, -28.97727394104004, -28.14045524597168, -27.303634643554688, -26.466815948486328, -25.62999725341797, -24.79317855834961, -23.95635986328125, -23.119539260864258, -22.2827205657959, -21.44590187072754, -20.609081268310547, -19.772262573242188, -18.935443878173828, -18.098623275756836, -17.261804580688477, -16.424983978271484, -15.588165283203125, -14.751346588134766, -13.91452693939209, -13.077707290649414, -12.240888595581055, -11.404068946838379, -10.567249298095703, -9.730430603027344, -8.893610954284668, -8.056791305541992, -7.219972610473633, -6.383152961730957, -5.5463337898254395, -4.709514617919922, -3.8726954460144043, -3.0358760356903076, -2.199056625366211, -1.3622374534606934, -0.5254182815551758, 0.3114013671875, 1.1482205390930176, 1.9850397109985352, 2.8218588829040527, 3.6586782932281494, 4.495497703552246, 5.332316875457764, 6.169136047363281, 7.005955696105957, 7.842774868011475, 8.679594039916992, 9.516413688659668, 10.353232383728027, 11.190052032470703, 12.026870727539062, 12.863690376281738, 13.700510025024414, 14.537328720092773, 15.37414836883545, 16.210968017578125, 17.047786712646484, 17.884605407714844, 18.721426010131836, 19.558244705200195, 20.395065307617188, 21.231884002685547, 22.068702697753906]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 9.0, 11.0, 7.0, 20.0, 21.0, 20.0, 29.0, 27.0, 39.0, 48.0, 44.0, 49.0, 45.0, 42.0, 72.0, 48.0, 56.0, 46.0, 63.0, 46.0, 49.0, 32.0, 42.0, 30.0, 31.0, 17.0, 13.0, 16.0, 4.0, 6.0, 8.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28125, -4.148193359375, -4.01513671875, -3.882080078125, -3.7490234375, -3.615966796875, -3.48291015625, -3.349853515625, -3.216796875, -3.083740234375, -2.95068359375, -2.817626953125, -2.6845703125, -2.551513671875, -2.41845703125, -2.285400390625, -2.15234375, -2.019287109375, -1.88623046875, -1.753173828125, -1.6201171875, -1.487060546875, -1.35400390625, -1.220947265625, -1.087890625, -0.954833984375, -0.82177734375, -0.688720703125, -0.5556640625, -0.422607421875, -0.28955078125, -0.156494140625, -0.0234375, 0.109619140625, 0.24267578125, 0.375732421875, 0.5087890625, 0.641845703125, 0.77490234375, 0.907958984375, 1.041015625, 1.174072265625, 1.30712890625, 1.440185546875, 1.5732421875, 1.706298828125, 1.83935546875, 1.972412109375, 2.10546875, 2.238525390625, 2.37158203125, 2.504638671875, 2.6376953125, 2.770751953125, 2.90380859375, 3.036865234375, 3.169921875, 3.302978515625, 3.43603515625, 3.569091796875, 3.7021484375, 3.835205078125, 3.96826171875, 4.101318359375, 4.234375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 10.0, 12.0, 10.0, 24.0, 46.0, 83.0, 140.0, 278.0, 506.0, 974.0, 1869.0, 3833.0, 9237.0, 26585.0, 124099.0, 758959.0, 2193138.0, 877476.0, 147919.0, 30562.0, 10166.0, 4151.0, 2067.0, 1006.0, 498.0, 278.0, 135.0, 91.0, 54.0, 26.0, 17.0, 6.0, 8.0, 5.0, 5.0, 4.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.27734375, -6.08447265625, -5.8916015625, -5.69873046875, -5.505859375, -5.31298828125, -5.1201171875, -4.92724609375, -4.734375, -4.54150390625, -4.3486328125, -4.15576171875, -3.962890625, -3.77001953125, -3.5771484375, -3.38427734375, -3.19140625, -2.99853515625, -2.8056640625, -2.61279296875, -2.419921875, -2.22705078125, -2.0341796875, -1.84130859375, -1.6484375, -1.45556640625, -1.2626953125, -1.06982421875, -0.876953125, -0.68408203125, -0.4912109375, -0.29833984375, -0.10546875, 0.08740234375, 0.2802734375, 0.47314453125, 0.666015625, 0.85888671875, 1.0517578125, 1.24462890625, 1.4375, 1.63037109375, 1.8232421875, 2.01611328125, 2.208984375, 2.40185546875, 2.5947265625, 2.78759765625, 2.98046875, 3.17333984375, 3.3662109375, 3.55908203125, 3.751953125, 3.94482421875, 4.1376953125, 4.33056640625, 4.5234375, 4.71630859375, 4.9091796875, 5.10205078125, 5.294921875, 5.48779296875, 5.6806640625, 5.87353515625, 6.06640625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 10.0, 14.0, 10.0, 23.0, 23.0, 40.0, 54.0, 112.0, 132.0, 250.0, 345.0, 543.0, 628.0, 589.0, 438.0, 278.0, 202.0, 149.0, 74.0, 62.0, 30.0, 20.0, 17.0, 9.0, 5.0, 6.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0390625, -8.7930908203125, -8.547119140625, -8.3011474609375, -8.05517578125, -7.8092041015625, -7.563232421875, -7.3172607421875, -7.0712890625, -6.8253173828125, -6.579345703125, -6.3333740234375, -6.08740234375, -5.8414306640625, -5.595458984375, -5.3494873046875, -5.103515625, -4.8575439453125, -4.611572265625, -4.3656005859375, -4.11962890625, -3.8736572265625, -3.627685546875, -3.3817138671875, -3.1357421875, -2.8897705078125, -2.643798828125, -2.3978271484375, -2.15185546875, -1.9058837890625, -1.659912109375, -1.4139404296875, -1.16796875, -0.9219970703125, -0.676025390625, -0.4300537109375, -0.18408203125, 0.0618896484375, 0.307861328125, 0.5538330078125, 0.7998046875, 1.0457763671875, 1.291748046875, 1.5377197265625, 1.78369140625, 2.0296630859375, 2.275634765625, 2.5216064453125, 2.767578125, 3.0135498046875, 3.259521484375, 3.5054931640625, 3.75146484375, 3.9974365234375, 4.243408203125, 4.4893798828125, 4.7353515625, 4.9813232421875, 5.227294921875, 5.4732666015625, 5.71923828125, 5.9652099609375, 6.211181640625, 6.4571533203125, 6.703125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 6.0, 3.0, 6.0, 8.0, 12.0, 22.0, 38.0, 57.0, 97.0, 200.0, 499.0, 1427.0, 6826.0, 279292.0, 3844613.0, 55561.0, 3889.0, 965.0, 361.0, 154.0, 77.0, 51.0, 34.0, 26.0, 19.0, 6.0, 4.0, 7.0, 6.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.359375, -16.7470703125, -16.134765625, -15.5224609375, -14.91015625, -14.2978515625, -13.685546875, -13.0732421875, -12.4609375, -11.8486328125, -11.236328125, -10.6240234375, -10.01171875, -9.3994140625, -8.787109375, -8.1748046875, -7.5625, -6.9501953125, -6.337890625, -5.7255859375, -5.11328125, -4.5009765625, -3.888671875, -3.2763671875, -2.6640625, -2.0517578125, -1.439453125, -0.8271484375, -0.21484375, 0.3974609375, 1.009765625, 1.6220703125, 2.234375, 2.8466796875, 3.458984375, 4.0712890625, 4.68359375, 5.2958984375, 5.908203125, 6.5205078125, 7.1328125, 7.7451171875, 8.357421875, 8.9697265625, 9.58203125, 10.1943359375, 10.806640625, 11.4189453125, 12.03125, 12.6435546875, 13.255859375, 13.8681640625, 14.48046875, 15.0927734375, 15.705078125, 16.3173828125, 16.9296875, 17.5419921875, 18.154296875, 18.7666015625, 19.37890625, 19.9912109375, 20.603515625, 21.2158203125, 21.828125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 217.0, 777.0, 17.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-319.93829345703125, -311.35498046875, -302.7716979980469, -294.1883850097656, -285.6050720214844, -277.0217590332031, -268.4384765625, -259.85516357421875, -251.2718505859375, -242.6885528564453, -234.10523986816406, -225.52194213867188, -216.93862915039062, -208.35533142089844, -199.77203369140625, -191.188720703125, -182.6054229736328, -174.02212524414062, -165.43881225585938, -156.8555145263672, -148.27220153808594, -139.68890380859375, -131.1055908203125, -122.52229309082031, -113.9389877319336, -105.35568237304688, -96.77237701416016, -88.18907165527344, -79.60577392578125, -71.0224609375, -62.43916320800781, -53.855857849121094, -45.27256774902344, -36.68926239013672, -28.105958938598633, -19.522655487060547, -10.939350128173828, -2.3560447692871094, 6.227256774902344, 14.810562133789062, 23.39386749267578, 31.9771728515625, 40.56047821044922, 49.14377975463867, 57.72708511352539, 66.31039428710938, 74.89369201660156, 83.47699737548828, 92.060302734375, 100.64360809326172, 109.22691345214844, 117.81021118164062, 126.39352416992188, 134.97682189941406, 143.56011962890625, 152.1434326171875, 160.72674560546875, 169.31004333496094, 177.8933563232422, 186.47665405273438, 195.05996704101562, 203.6432647705078, 212.2265625, 220.80987548828125, 229.39317321777344]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 9.0, 9.0, 5.0, 15.0, 27.0, 26.0, 36.0, 33.0, 38.0, 42.0, 51.0, 51.0, 46.0, 60.0, 45.0, 47.0, 54.0, 71.0, 47.0, 42.0, 45.0, 36.0, 44.0, 32.0, 16.0, 25.0, 13.0, 14.0, 9.0, 6.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.655248641967773, -28.69641876220703, -27.73758888244629, -26.778759002685547, -25.819931030273438, -24.861101150512695, -23.902271270751953, -22.94344139099121, -21.98461151123047, -21.025781631469727, -20.066951751708984, -19.108123779296875, -18.149293899536133, -17.19046401977539, -16.23163414001465, -15.272804260253906, -14.313976287841797, -13.355146408081055, -12.396317481994629, -11.437487602233887, -10.478658676147461, -9.519828796386719, -8.560998916625977, -7.602169513702393, -6.643340110778809, -5.684510707855225, -4.725681304931641, -3.7668514251708984, -2.8080220222473145, -1.8491926193237305, -0.8903627395629883, 0.0684666633605957, 1.0272979736328125, 1.986127495765686, 2.9449570178985596, 3.9037866592407227, 4.862616062164307, 5.821445465087891, 6.780275344848633, 7.739104747772217, 8.6979341506958, 9.656764030456543, 10.615592956542969, 11.574422836303711, 12.533252716064453, 13.492081642150879, 14.450911521911621, 15.409740447998047, 16.36857032775879, 17.32740020751953, 18.286230087280273, 19.245059967041016, 20.203887939453125, 21.162717819213867, 22.12154769897461, 23.08037757873535, 24.039207458496094, 24.998037338256836, 25.956867218017578, 26.915695190429688, 27.87452507019043, 28.833354949951172, 29.792184829711914, 30.751014709472656, 31.709842681884766]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 10.0, 12.0, 7.0, 11.0, 9.0, 17.0, 16.0, 13.0, 14.0, 16.0, 25.0, 28.0, 34.0, 21.0, 34.0, 36.0, 41.0, 46.0, 36.0, 46.0, 35.0, 45.0, 38.0, 49.0, 39.0, 43.0, 31.0, 34.0, 32.0, 24.0, 13.0, 20.0, 24.0, 20.0, 22.0, 10.0, 12.0, 8.0, 6.0, 4.0, 5.0, 0.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.677734375, -2.59130859375, -2.5048828125, -2.41845703125, -2.33203125, -2.24560546875, -2.1591796875, -2.07275390625, -1.986328125, -1.89990234375, -1.8134765625, -1.72705078125, -1.640625, -1.55419921875, -1.4677734375, -1.38134765625, -1.294921875, -1.20849609375, -1.1220703125, -1.03564453125, -0.94921875, -0.86279296875, -0.7763671875, -0.68994140625, -0.603515625, -0.51708984375, -0.4306640625, -0.34423828125, -0.2578125, -0.17138671875, -0.0849609375, 0.00146484375, 0.087890625, 0.17431640625, 0.2607421875, 0.34716796875, 0.43359375, 0.52001953125, 0.6064453125, 0.69287109375, 0.779296875, 0.86572265625, 0.9521484375, 1.03857421875, 1.125, 1.21142578125, 1.2978515625, 1.38427734375, 1.470703125, 1.55712890625, 1.6435546875, 1.72998046875, 1.81640625, 1.90283203125, 1.9892578125, 2.07568359375, 2.162109375, 2.24853515625, 2.3349609375, 2.42138671875, 2.5078125, 2.59423828125, 2.6806640625, 2.76708984375, 2.853515625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 8.0, 5.0, 13.0, 14.0, 26.0, 37.0, 83.0, 117.0, 209.0, 393.0, 630.0, 1057.0, 1929.0, 3292.0, 5515.0, 9505.0, 15592.0, 25378.0, 39774.0, 60060.0, 85906.0, 115271.0, 136203.0, 139743.0, 122993.0, 96180.0, 68354.0, 45687.0, 29122.0, 18261.0, 11225.0, 6630.0, 3982.0, 2317.0, 1225.0, 752.0, 465.0, 249.0, 144.0, 77.0, 55.0, 35.0, 25.0, 6.0, 11.0, 8.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3271484375, -0.316650390625, -0.30615234375, -0.295654296875, -0.28515625, -0.274658203125, -0.26416015625, -0.253662109375, -0.2431640625, -0.232666015625, -0.22216796875, -0.211669921875, -0.201171875, -0.190673828125, -0.18017578125, -0.169677734375, -0.1591796875, -0.148681640625, -0.13818359375, -0.127685546875, -0.1171875, -0.106689453125, -0.09619140625, -0.085693359375, -0.0751953125, -0.064697265625, -0.05419921875, -0.043701171875, -0.033203125, -0.022705078125, -0.01220703125, -0.001708984375, 0.0087890625, 0.019287109375, 0.02978515625, 0.040283203125, 0.05078125, 0.061279296875, 0.07177734375, 0.082275390625, 0.0927734375, 0.103271484375, 0.11376953125, 0.124267578125, 0.134765625, 0.145263671875, 0.15576171875, 0.166259765625, 0.1767578125, 0.187255859375, 0.19775390625, 0.208251953125, 0.21875, 0.229248046875, 0.23974609375, 0.250244140625, 0.2607421875, 0.271240234375, 0.28173828125, 0.292236328125, 0.302734375, 0.313232421875, 0.32373046875, 0.334228515625, 0.3447265625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 2.0, 1.0, 2.0, 4.0, 6.0, 4.0, 9.0, 10.0, 11.0, 14.0, 15.0, 20.0, 21.0, 28.0, 25.0, 35.0, 31.0, 31.0, 27.0, 32.0, 31.0, 35.0, 42.0, 29.0, 37.0, 1060.0, 42.0, 35.0, 37.0, 29.0, 27.0, 27.0, 33.0, 24.0, 31.0, 18.0, 24.0, 23.0, 20.0, 18.0, 20.0, 11.0, 9.0, 8.0, 9.0, 5.0, 3.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.091796875, -2.0272216796875, -1.962646484375, -1.8980712890625, -1.83349609375, -1.7689208984375, -1.704345703125, -1.6397705078125, -1.5751953125, -1.5106201171875, -1.446044921875, -1.3814697265625, -1.31689453125, -1.2523193359375, -1.187744140625, -1.1231689453125, -1.05859375, -0.9940185546875, -0.929443359375, -0.8648681640625, -0.80029296875, -0.7357177734375, -0.671142578125, -0.6065673828125, -0.5419921875, -0.4774169921875, -0.412841796875, -0.3482666015625, -0.28369140625, -0.2191162109375, -0.154541015625, -0.0899658203125, -0.025390625, 0.0391845703125, 0.103759765625, 0.1683349609375, 0.23291015625, 0.2974853515625, 0.362060546875, 0.4266357421875, 0.4912109375, 0.5557861328125, 0.620361328125, 0.6849365234375, 0.74951171875, 0.8140869140625, 0.878662109375, 0.9432373046875, 1.0078125, 1.0723876953125, 1.136962890625, 1.2015380859375, 1.26611328125, 1.3306884765625, 1.395263671875, 1.4598388671875, 1.5244140625, 1.5889892578125, 1.653564453125, 1.7181396484375, 1.78271484375, 1.8472900390625, 1.911865234375, 1.9764404296875, 2.041015625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 7.0, 14.0, 14.0, 34.0, 31.0, 78.0, 104.0, 117.0, 171.0, 246.0, 357.0, 455.0, 728.0, 954.0, 1459.0, 2045.0, 2741.0, 3995.0, 5717.0, 8266.0, 11654.0, 17090.0, 27348.0, 74000.0, 1661626.0, 178978.0, 34577.0, 20232.0, 13192.0, 9187.0, 6473.0, 4587.0, 3162.0, 2192.0, 1512.0, 1151.0, 768.0, 505.0, 418.0, 269.0, 202.0, 154.0, 108.0, 74.0, 38.0, 34.0, 21.0, 11.0, 10.0, 9.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0], "bins": [-0.5859375, -0.5680084228515625, -0.550079345703125, -0.5321502685546875, -0.51422119140625, -0.4962921142578125, -0.478363037109375, -0.4604339599609375, -0.4425048828125, -0.4245758056640625, -0.406646728515625, -0.3887176513671875, -0.37078857421875, -0.3528594970703125, -0.334930419921875, -0.3170013427734375, -0.299072265625, -0.2811431884765625, -0.263214111328125, -0.2452850341796875, -0.22735595703125, -0.2094268798828125, -0.191497802734375, -0.1735687255859375, -0.1556396484375, -0.1377105712890625, -0.119781494140625, -0.1018524169921875, -0.08392333984375, -0.0659942626953125, -0.048065185546875, -0.0301361083984375, -0.01220703125, 0.0057220458984375, 0.023651123046875, 0.0415802001953125, 0.05950927734375, 0.0774383544921875, 0.095367431640625, 0.1132965087890625, 0.1312255859375, 0.1491546630859375, 0.167083740234375, 0.1850128173828125, 0.20294189453125, 0.2208709716796875, 0.238800048828125, 0.2567291259765625, 0.274658203125, 0.2925872802734375, 0.310516357421875, 0.3284454345703125, 0.34637451171875, 0.3643035888671875, 0.382232666015625, 0.4001617431640625, 0.4180908203125, 0.4360198974609375, 0.453948974609375, 0.4718780517578125, 0.48980712890625, 0.5077362060546875, 0.525665283203125, 0.5435943603515625, 0.5615234375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 0.0, 5.0, 7.0, 3.0, 6.0, 6.0, 6.0, 17.0, 11.0, 10.0, 17.0, 23.0, 20.0, 32.0, 29.0, 37.0, 36.0, 47.0, 55.0, 49.0, 57.0, 55.0, 50.0, 42.0, 63.0, 35.0, 39.0, 43.0, 26.0, 29.0, 34.0, 20.0, 14.0, 12.0, 9.0, 8.0, 12.0, 6.0, 10.0, 4.0, 2.0, 3.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0472412109375, -0.04590177536010742, -0.044562339782714844, -0.043222904205322266, -0.04188346862792969, -0.04054403305053711, -0.03920459747314453, -0.03786516189575195, -0.036525726318359375, -0.0351862907409668, -0.03384685516357422, -0.03250741958618164, -0.031167984008789062, -0.029828548431396484, -0.028489112854003906, -0.027149677276611328, -0.02581024169921875, -0.024470806121826172, -0.023131370544433594, -0.021791934967041016, -0.020452499389648438, -0.01911306381225586, -0.01777362823486328, -0.016434192657470703, -0.015094757080078125, -0.013755321502685547, -0.012415885925292969, -0.01107645034790039, -0.009737014770507812, -0.008397579193115234, -0.007058143615722656, -0.005718708038330078, -0.0043792724609375, -0.003039836883544922, -0.0017004013061523438, -0.0003609657287597656, 0.0009784698486328125, 0.0023179054260253906, 0.0036573410034179688, 0.004996776580810547, 0.006336212158203125, 0.007675647735595703, 0.009015083312988281, 0.01035451889038086, 0.011693954467773438, 0.013033390045166016, 0.014372825622558594, 0.015712261199951172, 0.01705169677734375, 0.018391132354736328, 0.019730567932128906, 0.021070003509521484, 0.022409439086914062, 0.02374887466430664, 0.02508831024169922, 0.026427745819091797, 0.027767181396484375, 0.029106616973876953, 0.03044605255126953, 0.03178548812866211, 0.03312492370605469, 0.034464359283447266, 0.035803794860839844, 0.03714323043823242, 0.038482666015625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 5.0, 10.0, 10.0, 9.0, 12.0, 14.0, 25.0, 17.0, 27.0, 35.0, 46.0, 65.0, 88.0, 103.0, 149.0, 186.0, 273.0, 452.0, 828.0, 2803.0, 1014769.0, 25803.0, 1054.0, 552.0, 334.0, 214.0, 173.0, 106.0, 82.0, 55.0, 50.0, 48.0, 23.0, 30.0, 20.0, 19.0, 12.0, 10.0, 9.0, 7.0, 4.0, 9.0, 3.0, 4.0, 1.0, 0.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.79833984375, -0.7723236083984375, -0.746307373046875, -0.7202911376953125, -0.69427490234375, -0.6682586669921875, -0.642242431640625, -0.6162261962890625, -0.5902099609375, -0.5641937255859375, -0.538177490234375, -0.5121612548828125, -0.48614501953125, -0.4601287841796875, -0.434112548828125, -0.4080963134765625, -0.382080078125, -0.3560638427734375, -0.330047607421875, -0.3040313720703125, -0.27801513671875, -0.2519989013671875, -0.225982666015625, -0.1999664306640625, -0.1739501953125, -0.1479339599609375, -0.121917724609375, -0.0959014892578125, -0.06988525390625, -0.0438690185546875, -0.017852783203125, 0.0081634521484375, 0.0341796875, 0.0601959228515625, 0.086212158203125, 0.1122283935546875, 0.13824462890625, 0.1642608642578125, 0.190277099609375, 0.2162933349609375, 0.2423095703125, 0.2683258056640625, 0.294342041015625, 0.3203582763671875, 0.34637451171875, 0.3723907470703125, 0.398406982421875, 0.4244232177734375, 0.450439453125, 0.4764556884765625, 0.502471923828125, 0.5284881591796875, 0.55450439453125, 0.5805206298828125, 0.606536865234375, 0.6325531005859375, 0.6585693359375, 0.6845855712890625, 0.710601806640625, 0.7366180419921875, 0.76263427734375, 0.7886505126953125, 0.814666748046875, 0.8406829833984375, 0.86669921875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 784.0, 230.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10468485951423645, -0.07773575931787491, -0.050786662846803665, -0.023837566375732422, 0.00311153382062912, 0.03006063401699066, 0.057009726762771606, 0.08395883440971375, 0.11090792715549469, 0.13785701990127563, 0.16480612754821777, 0.19175522029399872, 0.21870431303977966, 0.2456534206867218, 0.27260249853134155, 0.2995516061782837, 0.32650071382522583, 0.35344982147216797, 0.3803988993167877, 0.40734800696372986, 0.434297114610672, 0.46124619245529175, 0.4881953001022339, 0.515144407749176, 0.5420935153961182, 0.5690426230430603, 0.5959917306900024, 0.6229407787322998, 0.6498898863792419, 0.6768389940261841, 0.7037881016731262, 0.7307372093200684, 0.7576863169670105, 0.7846354246139526, 0.8115845322608948, 0.8385336399078369, 0.8654826879501343, 0.8924317955970764, 0.9193809032440186, 0.9463300108909607, 0.9732791185379028, 1.0002281665802002, 1.027177333831787, 1.0541263818740845, 1.0810755491256714, 1.1080245971679688, 1.1349737644195557, 1.161922812461853, 1.1888718605041504, 1.2158209085464478, 1.2427700757980347, 1.269719123840332, 1.296668291091919, 1.3236173391342163, 1.3505663871765137, 1.3775155544281006, 1.4044647216796875, 1.4314137697219849, 1.4583629369735718, 1.4853119850158691, 1.512261152267456, 1.5392102003097534, 1.5661592483520508, 1.5931084156036377, 1.620057463645935]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 5.0, 12.0, 8.0, 10.0, 16.0, 11.0, 18.0, 25.0, 36.0, 38.0, 54.0, 41.0, 59.0, 62.0, 60.0, 55.0, 62.0, 71.0, 54.0, 53.0, 38.0, 40.0, 41.0, 33.0, 28.0, 20.0, 14.0, 14.0, 8.0, 7.0, 4.0, 1.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08601337671279907, -0.08378785848617554, -0.0815623477101326, -0.07933683693408966, -0.07711131870746613, -0.07488580048084259, -0.07266028970479965, -0.07043477892875671, -0.06820926070213318, -0.06598374247550964, -0.0637582316994667, -0.06153271719813347, -0.05930720269680023, -0.057081688195466995, -0.05485617369413376, -0.05263065919280052, -0.050405144691467285, -0.04817963019013405, -0.04595411568880081, -0.043728601187467575, -0.04150308668613434, -0.0392775721848011, -0.037052057683467865, -0.03482654318213463, -0.03260102868080139, -0.030375514179468155, -0.028149999678134918, -0.02592448517680168, -0.023698970675468445, -0.021473456174135208, -0.01924794167280197, -0.017022427171468735, -0.014796912670135498, -0.012571398168802261, -0.010345883667469025, -0.008120369166135788, -0.005894854664802551, -0.0036693401634693146, -0.0014438256621360779, 0.0007816888391971588, 0.0030072033405303955, 0.005232717841863632, 0.007458232343196869, 0.009683746844530106, 0.011909261345863342, 0.014134775847196579, 0.016360290348529816, 0.018585804849863052, 0.02081131935119629, 0.023036833852529526, 0.025262348353862762, 0.027487862855196, 0.029713377356529236, 0.03193889185786247, 0.03416440635919571, 0.036389920860528946, 0.03861543536186218, 0.04084094986319542, 0.043066464364528656, 0.04529197886586189, 0.04751749336719513, 0.049743007868528366, 0.0519685223698616, 0.05419403687119484, 0.056419551372528076]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 2.0, 1.0, 5.0, 9.0, 4.0, 4.0, 3.0, 10.0, 13.0, 15.0, 6.0, 14.0, 9.0, 19.0, 21.0, 20.0, 25.0, 18.0, 26.0, 22.0, 36.0, 29.0, 26.0, 47.0, 31.0, 26.0, 33.0, 44.0, 41.0, 45.0, 38.0, 45.0, 36.0, 32.0, 36.0, 27.0, 18.0, 26.0, 26.0, 18.0, 17.0, 14.0, 19.0, 12.0, 3.0, 7.0, 8.0, 5.0, 7.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.329864501953125, -2.24957275390625, -2.169281005859375, -2.0889892578125, -2.008697509765625, -1.92840576171875, -1.848114013671875, -1.767822265625, -1.687530517578125, -1.60723876953125, -1.526947021484375, -1.4466552734375, -1.366363525390625, -1.28607177734375, -1.205780029296875, -1.12548828125, -1.045196533203125, -0.96490478515625, -0.884613037109375, -0.8043212890625, -0.724029541015625, -0.64373779296875, -0.563446044921875, -0.483154296875, -0.402862548828125, -0.32257080078125, -0.242279052734375, -0.1619873046875, -0.081695556640625, -0.00140380859375, 0.078887939453125, 0.1591796875, 0.239471435546875, 0.31976318359375, 0.400054931640625, 0.4803466796875, 0.560638427734375, 0.64093017578125, 0.721221923828125, 0.801513671875, 0.881805419921875, 0.96209716796875, 1.042388916015625, 1.1226806640625, 1.202972412109375, 1.28326416015625, 1.363555908203125, 1.44384765625, 1.524139404296875, 1.60443115234375, 1.684722900390625, 1.7650146484375, 1.845306396484375, 1.92559814453125, 2.005889892578125, 2.086181640625, 2.166473388671875, 2.24676513671875, 2.327056884765625, 2.4073486328125, 2.487640380859375, 2.56793212890625, 2.648223876953125, 2.728515625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 10.0, 14.0, 16.0, 20.0, 24.0, 36.0, 44.0, 57.0, 70.0, 134.0, 180.0, 237.0, 379.0, 537.0, 1026.0, 1818.0, 4190.0, 11044.0, 37267.0, 161486.0, 484717.0, 260180.0, 57875.0, 16147.0, 5480.0, 2303.0, 1216.0, 697.0, 449.0, 293.0, 202.0, 133.0, 73.0, 57.0, 44.0, 33.0, 32.0, 15.0, 12.0, 3.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.24609375, -4.1160888671875, -3.986083984375, -3.8560791015625, -3.72607421875, -3.5960693359375, -3.466064453125, -3.3360595703125, -3.2060546875, -3.0760498046875, -2.946044921875, -2.8160400390625, -2.68603515625, -2.5560302734375, -2.426025390625, -2.2960205078125, -2.166015625, -2.0360107421875, -1.906005859375, -1.7760009765625, -1.64599609375, -1.5159912109375, -1.385986328125, -1.2559814453125, -1.1259765625, -0.9959716796875, -0.865966796875, -0.7359619140625, -0.60595703125, -0.4759521484375, -0.345947265625, -0.2159423828125, -0.0859375, 0.0440673828125, 0.174072265625, 0.3040771484375, 0.43408203125, 0.5640869140625, 0.694091796875, 0.8240966796875, 0.9541015625, 1.0841064453125, 1.214111328125, 1.3441162109375, 1.47412109375, 1.6041259765625, 1.734130859375, 1.8641357421875, 1.994140625, 2.1241455078125, 2.254150390625, 2.3841552734375, 2.51416015625, 2.6441650390625, 2.774169921875, 2.9041748046875, 3.0341796875, 3.1641845703125, 3.294189453125, 3.4241943359375, 3.55419921875, 3.6842041015625, 3.814208984375, 3.9442138671875, 4.07421875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 8.0, 10.0, 8.0, 17.0, 29.0, 35.0, 39.0, 40.0, 47.0, 53.0, 81.0, 89.0, 238.0, 1425.0, 321.0, 163.0, 94.0, 65.0, 53.0, 49.0, 45.0, 29.0, 26.0, 22.0, 14.0, 10.0, 18.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.9296875, -10.5625, -10.1953125, -9.828125, -9.4609375, -9.09375, -8.7265625, -8.359375, -7.9921875, -7.625, -7.2578125, -6.890625, -6.5234375, -6.15625, -5.7890625, -5.421875, -5.0546875, -4.6875, -4.3203125, -3.953125, -3.5859375, -3.21875, -2.8515625, -2.484375, -2.1171875, -1.75, -1.3828125, -1.015625, -0.6484375, -0.28125, 0.0859375, 0.453125, 0.8203125, 1.1875, 1.5546875, 1.921875, 2.2890625, 2.65625, 3.0234375, 3.390625, 3.7578125, 4.125, 4.4921875, 4.859375, 5.2265625, 5.59375, 5.9609375, 6.328125, 6.6953125, 7.0625, 7.4296875, 7.796875, 8.1640625, 8.53125, 8.8984375, 9.265625, 9.6328125, 10.0, 10.3671875, 10.734375, 11.1015625, 11.46875, 11.8359375, 12.203125, 12.5703125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 12.0, 7.0, 11.0, 32.0, 50.0, 75.0, 98.0, 191.0, 411.0, 1079.0, 32396.0, 3107107.0, 2940.0, 649.0, 277.0, 141.0, 87.0, 53.0, 29.0, 26.0, 21.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.078125, -30.114990234375, -29.15185546875, -28.188720703125, -27.2255859375, -26.262451171875, -25.29931640625, -24.336181640625, -23.373046875, -22.409912109375, -21.44677734375, -20.483642578125, -19.5205078125, -18.557373046875, -17.59423828125, -16.631103515625, -15.66796875, -14.704833984375, -13.74169921875, -12.778564453125, -11.8154296875, -10.852294921875, -9.88916015625, -8.926025390625, -7.962890625, -6.999755859375, -6.03662109375, -5.073486328125, -4.1103515625, -3.147216796875, -2.18408203125, -1.220947265625, -0.2578125, 0.705322265625, 1.66845703125, 2.631591796875, 3.5947265625, 4.557861328125, 5.52099609375, 6.484130859375, 7.447265625, 8.410400390625, 9.37353515625, 10.336669921875, 11.2998046875, 12.262939453125, 13.22607421875, 14.189208984375, 15.15234375, 16.115478515625, 17.07861328125, 18.041748046875, 19.0048828125, 19.968017578125, 20.93115234375, 21.894287109375, 22.857421875, 23.820556640625, 24.78369140625, 25.746826171875, 26.7099609375, 27.673095703125, 28.63623046875, 29.599365234375, 30.5625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 86.0, 852.0, 69.0, 2.0, 1.0], "bins": [-297.0060729980469, -292.09619140625, -287.1863098144531, -282.2763977050781, -277.36651611328125, -272.4566345214844, -267.5467529296875, -262.6368408203125, -257.7269592285156, -252.81707763671875, -247.9071807861328, -242.99729919433594, -238.08740234375, -233.17752075195312, -228.2676239013672, -223.3577423095703, -218.44784545898438, -213.5379638671875, -208.62806701660156, -203.7181854248047, -198.80828857421875, -193.89840698242188, -188.98851013183594, -184.07862854003906, -179.1687469482422, -174.2588653564453, -169.34896850585938, -164.4390869140625, -159.52919006347656, -154.6193084716797, -149.70941162109375, -144.79953002929688, -139.8896484375, -134.97976684570312, -130.0698699951172, -125.15998077392578, -120.25009155273438, -115.34020233154297, -110.43031311035156, -105.52043151855469, -100.61053466796875, -95.70064544677734, -90.79075622558594, -85.88086700439453, -80.97097778320312, -76.06108856201172, -71.15119934082031, -66.24131774902344, -61.3314208984375, -56.421531677246094, -51.51164245605469, -46.60175323486328, -41.691864013671875, -36.78197479248047, -31.872089385986328, -26.962200164794922, -22.05231285095215, -17.142423629760742, -12.232535362243652, -7.3226470947265625, -2.4127578735351562, 2.49713134765625, 7.407018661499023, 12.31690788269043, 17.226797103881836]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 4.0, 7.0, 10.0, 12.0, 12.0, 25.0, 19.0, 35.0, 30.0, 37.0, 44.0, 47.0, 47.0, 44.0, 64.0, 58.0, 46.0, 46.0, 44.0, 46.0, 39.0, 35.0, 41.0, 34.0, 36.0, 26.0, 19.0, 23.0, 17.0, 9.0, 5.0, 8.0, 11.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.6080379486084, -27.630172729492188, -26.652305603027344, -25.674440383911133, -24.696575164794922, -23.71870994567871, -22.7408447265625, -21.762977600097656, -20.785112380981445, -19.807247161865234, -18.82938003540039, -17.85151481628418, -16.87364959716797, -15.895784378051758, -14.91791820526123, -13.940052032470703, -12.962186813354492, -11.984321594238281, -11.006455421447754, -10.028589248657227, -9.050724029541016, -8.072858810424805, -7.094992637634277, -6.117126941680908, -5.139261245727539, -4.16139554977417, -3.183529853820801, -2.2056641578674316, -1.2277984619140625, -0.24993276596069336, 0.7279329299926758, 1.705798625946045, 2.6836624145507812, 3.6615281105041504, 4.6393938064575195, 5.617259502410889, 6.595125198364258, 7.572990894317627, 8.550856590270996, 9.528722763061523, 10.506587982177734, 11.484453201293945, 12.462319374084473, 13.440185546875, 14.418050765991211, 15.395915985107422, 16.373783111572266, 17.351648330688477, 18.329513549804688, 19.3073787689209, 20.28524398803711, 21.263111114501953, 22.240976333618164, 23.218841552734375, 24.19670867919922, 25.17457389831543, 26.15243911743164, 27.13030433654785, 28.108169555664062, 29.086036682128906, 30.063901901245117, 31.041767120361328, 32.01963424682617, 32.99749755859375, 33.975364685058594]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 6.0, 10.0, 13.0, 19.0, 5.0, 17.0, 17.0, 21.0, 23.0, 28.0, 30.0, 42.0, 40.0, 48.0, 49.0, 50.0, 42.0, 35.0, 56.0, 38.0, 45.0, 46.0, 50.0, 40.0, 45.0, 30.0, 29.0, 28.0, 18.0, 17.0, 5.0, 9.0, 13.0, 6.0, 13.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.57421875, -3.44927978515625, -3.3243408203125, -3.19940185546875, -3.074462890625, -2.94952392578125, -2.8245849609375, -2.69964599609375, -2.57470703125, -2.44976806640625, -2.3248291015625, -2.19989013671875, -2.074951171875, -1.95001220703125, -1.8250732421875, -1.70013427734375, -1.5751953125, -1.45025634765625, -1.3253173828125, -1.20037841796875, -1.075439453125, -0.95050048828125, -0.8255615234375, -0.70062255859375, -0.57568359375, -0.45074462890625, -0.3258056640625, -0.20086669921875, -0.075927734375, 0.04901123046875, 0.1739501953125, 0.29888916015625, 0.423828125, 0.54876708984375, 0.6737060546875, 0.79864501953125, 0.923583984375, 1.04852294921875, 1.1734619140625, 1.29840087890625, 1.42333984375, 1.54827880859375, 1.6732177734375, 1.79815673828125, 1.923095703125, 2.04803466796875, 2.1729736328125, 2.29791259765625, 2.4228515625, 2.54779052734375, 2.6727294921875, 2.79766845703125, 2.922607421875, 3.04754638671875, 3.1724853515625, 3.29742431640625, 3.42236328125, 3.54730224609375, 3.6722412109375, 3.79718017578125, 3.922119140625, 4.04705810546875, 4.1719970703125, 4.29693603515625, 4.421875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 11.0, 10.0, 10.0, 19.0, 26.0, 38.0, 45.0, 61.0, 93.0, 128.0, 189.0, 268.0, 423.0, 548.0, 854.0, 1538.0, 4996.0, 99078.0, 3078076.0, 981873.0, 19949.0, 2666.0, 1147.0, 685.0, 458.0, 345.0, 238.0, 182.0, 99.0, 58.0, 49.0, 34.0, 21.0, 16.0, 21.0, 7.0, 11.0, 5.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5, -13.95849609375, -13.4169921875, -12.87548828125, -12.333984375, -11.79248046875, -11.2509765625, -10.70947265625, -10.16796875, -9.62646484375, -9.0849609375, -8.54345703125, -8.001953125, -7.46044921875, -6.9189453125, -6.37744140625, -5.8359375, -5.29443359375, -4.7529296875, -4.21142578125, -3.669921875, -3.12841796875, -2.5869140625, -2.04541015625, -1.50390625, -0.96240234375, -0.4208984375, 0.12060546875, 0.662109375, 1.20361328125, 1.7451171875, 2.28662109375, 2.828125, 3.36962890625, 3.9111328125, 4.45263671875, 4.994140625, 5.53564453125, 6.0771484375, 6.61865234375, 7.16015625, 7.70166015625, 8.2431640625, 8.78466796875, 9.326171875, 9.86767578125, 10.4091796875, 10.95068359375, 11.4921875, 12.03369140625, 12.5751953125, 13.11669921875, 13.658203125, 14.19970703125, 14.7412109375, 15.28271484375, 15.82421875, 16.36572265625, 16.9072265625, 17.44873046875, 17.990234375, 18.53173828125, 19.0732421875, 19.61474609375, 20.15625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 11.0, 17.0, 27.0, 59.0, 106.0, 189.0, 278.0, 463.0, 562.0, 646.0, 561.0, 420.0, 306.0, 188.0, 119.0, 55.0, 27.0, 15.0, 10.0, 8.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.20703125, -5.93096923828125, -5.6549072265625, -5.37884521484375, -5.102783203125, -4.82672119140625, -4.5506591796875, -4.27459716796875, -3.99853515625, -3.72247314453125, -3.4464111328125, -3.17034912109375, -2.894287109375, -2.61822509765625, -2.3421630859375, -2.06610107421875, -1.7900390625, -1.51397705078125, -1.2379150390625, -0.96185302734375, -0.685791015625, -0.40972900390625, -0.1336669921875, 0.14239501953125, 0.41845703125, 0.69451904296875, 0.9705810546875, 1.24664306640625, 1.522705078125, 1.79876708984375, 2.0748291015625, 2.35089111328125, 2.626953125, 2.90301513671875, 3.1790771484375, 3.45513916015625, 3.731201171875, 4.00726318359375, 4.2833251953125, 4.55938720703125, 4.83544921875, 5.11151123046875, 5.3875732421875, 5.66363525390625, 5.939697265625, 6.21575927734375, 6.4918212890625, 6.76788330078125, 7.0439453125, 7.32000732421875, 7.5960693359375, 7.87213134765625, 8.148193359375, 8.42425537109375, 8.7003173828125, 8.97637939453125, 9.25244140625, 9.52850341796875, 9.8045654296875, 10.08062744140625, 10.356689453125, 10.63275146484375, 10.9088134765625, 11.18487548828125, 11.4609375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 8.0, 14.0, 19.0, 39.0, 81.0, 190.0, 375.0, 1018.0, 4062.0, 38481.0, 673459.0, 2952050.0, 491319.0, 28391.0, 3167.0, 860.0, 359.0, 196.0, 78.0, 40.0, 27.0, 21.0, 8.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.4375, -9.1466064453125, -8.855712890625, -8.5648193359375, -8.27392578125, -7.9830322265625, -7.692138671875, -7.4012451171875, -7.1103515625, -6.8194580078125, -6.528564453125, -6.2376708984375, -5.94677734375, -5.6558837890625, -5.364990234375, -5.0740966796875, -4.783203125, -4.4923095703125, -4.201416015625, -3.9105224609375, -3.61962890625, -3.3287353515625, -3.037841796875, -2.7469482421875, -2.4560546875, -2.1651611328125, -1.874267578125, -1.5833740234375, -1.29248046875, -1.0015869140625, -0.710693359375, -0.4197998046875, -0.12890625, 0.1619873046875, 0.452880859375, 0.7437744140625, 1.03466796875, 1.3255615234375, 1.616455078125, 1.9073486328125, 2.1982421875, 2.4891357421875, 2.780029296875, 3.0709228515625, 3.36181640625, 3.6527099609375, 3.943603515625, 4.2344970703125, 4.525390625, 4.8162841796875, 5.107177734375, 5.3980712890625, 5.68896484375, 5.9798583984375, 6.270751953125, 6.5616455078125, 6.8525390625, 7.1434326171875, 7.434326171875, 7.7252197265625, 8.01611328125, 8.3070068359375, 8.597900390625, 8.8887939453125, 9.1796875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 9.0, 19.0, 20.0, 25.0, 37.0, 45.0, 68.0, 91.0, 120.0, 111.0, 107.0, 103.0, 72.0, 47.0, 42.0, 32.0, 25.0, 6.0, 7.0, 6.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-60.47004318237305, -58.965980529785156, -57.461917877197266, -55.957855224609375, -54.453792572021484, -52.949729919433594, -51.4456672668457, -49.94160461425781, -48.43754196166992, -46.93347930908203, -45.42941665649414, -43.92535400390625, -42.42129135131836, -40.91722869873047, -39.41316604614258, -37.90910339355469, -36.4050407409668, -34.900978088378906, -33.396915435791016, -31.892852783203125, -30.388790130615234, -28.884727478027344, -27.380664825439453, -25.876602172851562, -24.372539520263672, -22.86847686767578, -21.36441421508789, -19.8603515625, -18.35628890991211, -16.85222625732422, -15.348163604736328, -13.844100952148438, -12.340034484863281, -10.83597183227539, -9.3319091796875, -7.827846527099609, -6.323783874511719, -4.819721221923828, -3.3156585693359375, -1.8115959167480469, -0.30753326416015625, 1.1965293884277344, 2.700592041015625, 4.204654693603516, 5.708717346191406, 7.212779998779297, 8.716842651367188, 10.220905303955078, 11.724967956542969, 13.22903060913086, 14.73309326171875, 16.23715591430664, 17.74121856689453, 19.245281219482422, 20.749343872070312, 22.253406524658203, 23.757469177246094, 25.261531829833984, 26.765594482421875, 28.269657135009766, 29.773719787597656, 31.277782440185547, 32.78184509277344, 34.28590774536133, 35.78997039794922]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 4.0, 4.0, 5.0, 9.0, 11.0, 11.0, 29.0, 20.0, 22.0, 19.0, 48.0, 47.0, 54.0, 50.0, 66.0, 57.0, 48.0, 57.0, 49.0, 57.0, 59.0, 47.0, 48.0, 44.0, 41.0, 20.0, 23.0, 15.0, 12.0, 10.0, 8.0, 5.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.1828498840332, -31.13653564453125, -30.090221405029297, -29.043909072875977, -27.997594833374023, -26.95128059387207, -25.90496826171875, -24.858654022216797, -23.812339782714844, -22.76602554321289, -21.719711303710938, -20.673398971557617, -19.627084732055664, -18.58077049255371, -17.53445816040039, -16.488143920898438, -15.441829681396484, -14.395515441894531, -13.349202156066895, -12.302888870239258, -11.256574630737305, -10.210260391235352, -9.163947105407715, -8.117633819580078, -7.071319580078125, -6.02500581741333, -4.978692054748535, -3.9323782920837402, -2.8860645294189453, -1.8397507667541504, -0.7934370040893555, 0.25287675857543945, 1.2991867065429688, 2.3455004692077637, 3.3918142318725586, 4.4381279945373535, 5.484441757202148, 6.530755519866943, 7.577069282531738, 8.623382568359375, 9.669696807861328, 10.716011047363281, 11.762324333190918, 12.808637619018555, 13.854951858520508, 14.901266098022461, 15.947579383850098, 16.993892669677734, 18.040206909179688, 19.08652114868164, 20.132835388183594, 21.179147720336914, 22.225461959838867, 23.27177619934082, 24.31808853149414, 25.364402770996094, 26.410717010498047, 27.45703125, 28.503345489501953, 29.549657821655273, 30.595972061157227, 31.64228630065918, 32.6885986328125, 33.73491287231445, 34.781227111816406]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 9.0, 10.0, 5.0, 10.0, 8.0, 10.0, 16.0, 17.0, 16.0, 22.0, 28.0, 22.0, 32.0, 29.0, 39.0, 32.0, 30.0, 40.0, 40.0, 40.0, 29.0, 42.0, 28.0, 43.0, 30.0, 31.0, 37.0, 23.0, 38.0, 31.0, 23.0, 26.0, 29.0, 19.0, 24.0, 17.0, 19.0, 15.0, 8.0, 8.0, 13.0, 4.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-42.09375, -40.7578125, -39.421875, -38.0859375, -36.75, -35.4140625, -34.078125, -32.7421875, -31.40625, -30.0703125, -28.734375, -27.3984375, -26.0625, -24.7265625, -23.390625, -22.0546875, -20.71875, -19.3828125, -18.046875, -16.7109375, -15.375, -14.0390625, -12.703125, -11.3671875, -10.03125, -8.6953125, -7.359375, -6.0234375, -4.6875, -3.3515625, -2.015625, -0.6796875, 0.65625, 1.9921875, 3.328125, 4.6640625, 6.0, 7.3359375, 8.671875, 10.0078125, 11.34375, 12.6796875, 14.015625, 15.3515625, 16.6875, 18.0234375, 19.359375, 20.6953125, 22.03125, 23.3671875, 24.703125, 26.0390625, 27.375, 28.7109375, 30.046875, 31.3828125, 32.71875, 34.0546875, 35.390625, 36.7265625, 38.0625, 39.3984375, 40.734375, 42.0703125, 43.40625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 8.0, 9.0, 23.0, 30.0, 39.0, 80.0, 122.0, 134.0, 240.0, 397.0, 577.0, 876.0, 1458.0, 2252.0, 3416.0, 5396.0, 8322.0, 12664.0, 18448.0, 26754.0, 37990.0, 52658.0, 69851.0, 87942.0, 103353.0, 111799.0, 109059.0, 98362.0, 81428.0, 63807.0, 47144.0, 33625.0, 23484.0, 15838.0, 10824.0, 7118.0, 4545.0, 2993.0, 1990.0, 1227.0, 807.0, 508.0, 347.0, 221.0, 160.0, 90.0, 46.0, 36.0, 21.0, 18.0, 14.0, 8.0, 4.0, 3.0, 1.0], "bins": [-2.9296875, -2.845550537109375, -2.76141357421875, -2.677276611328125, -2.5931396484375, -2.509002685546875, -2.42486572265625, -2.340728759765625, -2.256591796875, -2.172454833984375, -2.08831787109375, -2.004180908203125, -1.9200439453125, -1.835906982421875, -1.75177001953125, -1.667633056640625, -1.58349609375, -1.499359130859375, -1.41522216796875, -1.331085205078125, -1.2469482421875, -1.162811279296875, -1.07867431640625, -0.994537353515625, -0.910400390625, -0.826263427734375, -0.74212646484375, -0.657989501953125, -0.5738525390625, -0.489715576171875, -0.40557861328125, -0.321441650390625, -0.2373046875, -0.153167724609375, -0.06903076171875, 0.015106201171875, 0.0992431640625, 0.183380126953125, 0.26751708984375, 0.351654052734375, 0.435791015625, 0.519927978515625, 0.60406494140625, 0.688201904296875, 0.7723388671875, 0.856475830078125, 0.94061279296875, 1.024749755859375, 1.10888671875, 1.193023681640625, 1.27716064453125, 1.361297607421875, 1.4454345703125, 1.529571533203125, 1.61370849609375, 1.697845458984375, 1.781982421875, 1.866119384765625, 1.95025634765625, 2.034393310546875, 2.1185302734375, 2.202667236328125, 2.28680419921875, 2.370941162109375, 2.455078125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 1.0, 5.0, 4.0, 4.0, 4.0, 5.0, 6.0, 6.0, 4.0, 8.0, 8.0, 13.0, 13.0, 18.0, 17.0, 22.0, 23.0, 18.0, 27.0, 35.0, 41.0, 39.0, 36.0, 37.0, 35.0, 33.0, 38.0, 1052.0, 49.0, 37.0, 33.0, 37.0, 26.0, 29.0, 39.0, 22.0, 25.0, 23.0, 22.0, 23.0, 18.0, 15.0, 20.0, 14.0, 7.0, 6.0, 7.0, 7.0, 6.0, 3.0, 7.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-24.625, -23.808837890625, -22.99267578125, -22.176513671875, -21.3603515625, -20.544189453125, -19.72802734375, -18.911865234375, -18.095703125, -17.279541015625, -16.46337890625, -15.647216796875, -14.8310546875, -14.014892578125, -13.19873046875, -12.382568359375, -11.56640625, -10.750244140625, -9.93408203125, -9.117919921875, -8.3017578125, -7.485595703125, -6.66943359375, -5.853271484375, -5.037109375, -4.220947265625, -3.40478515625, -2.588623046875, -1.7724609375, -0.956298828125, -0.14013671875, 0.676025390625, 1.4921875, 2.308349609375, 3.12451171875, 3.940673828125, 4.7568359375, 5.572998046875, 6.38916015625, 7.205322265625, 8.021484375, 8.837646484375, 9.65380859375, 10.469970703125, 11.2861328125, 12.102294921875, 12.91845703125, 13.734619140625, 14.55078125, 15.366943359375, 16.18310546875, 16.999267578125, 17.8154296875, 18.631591796875, 19.44775390625, 20.263916015625, 21.080078125, 21.896240234375, 22.71240234375, 23.528564453125, 24.3447265625, 25.160888671875, 25.97705078125, 26.793212890625, 27.609375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 8.0, 17.0, 24.0, 30.0, 46.0, 67.0, 123.0, 139.0, 232.0, 335.0, 498.0, 706.0, 1067.0, 1623.0, 2383.0, 3446.0, 5275.0, 7537.0, 11426.0, 16473.0, 25566.0, 64802.0, 1600151.0, 253498.0, 37562.0, 20745.0, 14096.0, 9463.0, 6393.0, 4297.0, 2890.0, 1978.0, 1368.0, 934.0, 650.0, 417.0, 279.0, 194.0, 119.0, 87.0, 63.0, 46.0, 27.0, 14.0, 8.0, 8.0, 6.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0], "bins": [-7.55859375, -7.3280029296875, -7.097412109375, -6.8668212890625, -6.63623046875, -6.4056396484375, -6.175048828125, -5.9444580078125, -5.7138671875, -5.4832763671875, -5.252685546875, -5.0220947265625, -4.79150390625, -4.5609130859375, -4.330322265625, -4.0997314453125, -3.869140625, -3.6385498046875, -3.407958984375, -3.1773681640625, -2.94677734375, -2.7161865234375, -2.485595703125, -2.2550048828125, -2.0244140625, -1.7938232421875, -1.563232421875, -1.3326416015625, -1.10205078125, -0.8714599609375, -0.640869140625, -0.4102783203125, -0.1796875, 0.0509033203125, 0.281494140625, 0.5120849609375, 0.74267578125, 0.9732666015625, 1.203857421875, 1.4344482421875, 1.6650390625, 1.8956298828125, 2.126220703125, 2.3568115234375, 2.58740234375, 2.8179931640625, 3.048583984375, 3.2791748046875, 3.509765625, 3.7403564453125, 3.970947265625, 4.2015380859375, 4.43212890625, 4.6627197265625, 4.893310546875, 5.1239013671875, 5.3544921875, 5.5850830078125, 5.815673828125, 6.0462646484375, 6.27685546875, 6.5074462890625, 6.738037109375, 6.9686279296875, 7.19921875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 10.0, 6.0, 11.0, 8.0, 15.0, 12.0, 10.0, 22.0, 21.0, 28.0, 32.0, 41.0, 30.0, 28.0, 32.0, 50.0, 50.0, 48.0, 50.0, 41.0, 48.0, 41.0, 44.0, 36.0, 40.0, 30.0, 25.0, 27.0, 19.0, 28.0, 22.0, 17.0, 9.0, 11.0, 6.0, 11.0, 9.0, 6.0, 6.0, 6.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.251220703125, -0.24383544921875, -0.2364501953125, -0.22906494140625, -0.2216796875, -0.21429443359375, -0.2069091796875, -0.19952392578125, -0.192138671875, -0.18475341796875, -0.1773681640625, -0.16998291015625, -0.16259765625, -0.15521240234375, -0.1478271484375, -0.14044189453125, -0.133056640625, -0.12567138671875, -0.1182861328125, -0.11090087890625, -0.103515625, -0.09613037109375, -0.0887451171875, -0.08135986328125, -0.073974609375, -0.06658935546875, -0.0592041015625, -0.05181884765625, -0.04443359375, -0.03704833984375, -0.0296630859375, -0.02227783203125, -0.014892578125, -0.00750732421875, -0.0001220703125, 0.00726318359375, 0.0146484375, 0.02203369140625, 0.0294189453125, 0.03680419921875, 0.044189453125, 0.05157470703125, 0.0589599609375, 0.06634521484375, 0.07373046875, 0.08111572265625, 0.0885009765625, 0.09588623046875, 0.103271484375, 0.11065673828125, 0.1180419921875, 0.12542724609375, 0.1328125, 0.14019775390625, 0.1475830078125, 0.15496826171875, 0.162353515625, 0.16973876953125, 0.1771240234375, 0.18450927734375, 0.19189453125, 0.19927978515625, 0.2066650390625, 0.21405029296875, 0.221435546875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 8.0, 10.0, 13.0, 10.0, 23.0, 34.0, 49.0, 67.0, 78.0, 144.0, 189.0, 318.0, 466.0, 835.0, 1351.0, 2868.0, 7162.0, 21501.0, 76398.0, 241378.0, 383231.0, 215561.0, 65965.0, 18672.0, 6260.0, 2606.0, 1277.0, 728.0, 454.0, 257.0, 186.0, 122.0, 94.0, 65.0, 52.0, 33.0, 27.0, 14.0, 20.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0771484375, -1.0417633056640625, -1.006378173828125, -0.9709930419921875, -0.93560791015625, -0.9002227783203125, -0.864837646484375, -0.8294525146484375, -0.7940673828125, -0.7586822509765625, -0.723297119140625, -0.6879119873046875, -0.65252685546875, -0.6171417236328125, -0.581756591796875, -0.5463714599609375, -0.510986328125, -0.4756011962890625, -0.440216064453125, -0.4048309326171875, -0.36944580078125, -0.3340606689453125, -0.298675537109375, -0.2632904052734375, -0.2279052734375, -0.1925201416015625, -0.157135009765625, -0.1217498779296875, -0.08636474609375, -0.0509796142578125, -0.015594482421875, 0.0197906494140625, 0.05517578125, 0.0905609130859375, 0.125946044921875, 0.1613311767578125, 0.19671630859375, 0.2321014404296875, 0.267486572265625, 0.3028717041015625, 0.3382568359375, 0.3736419677734375, 0.409027099609375, 0.4444122314453125, 0.47979736328125, 0.5151824951171875, 0.550567626953125, 0.5859527587890625, 0.621337890625, 0.6567230224609375, 0.692108154296875, 0.7274932861328125, 0.76287841796875, 0.7982635498046875, 0.833648681640625, 0.8690338134765625, 0.9044189453125, 0.9398040771484375, 0.975189208984375, 1.0105743408203125, 1.04595947265625, 1.0813446044921875, 1.116729736328125, 1.1521148681640625, 1.1875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 21.0, 25.0, 51.0, 99.0, 153.0, 161.0, 159.0, 118.0, 92.0, 43.0, 33.0, 15.0, 13.0, 6.0, 5.0, 1.0, 1.0, 6.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4240718185901642, -0.40688422322273254, -0.3896966576576233, -0.37250906229019165, -0.35532146692276, -0.33813387155532837, -0.3209463059902191, -0.3037587106227875, -0.2865711450576782, -0.2693835496902466, -0.25219598412513733, -0.2350083887577057, -0.21782079339027405, -0.2006332129240036, -0.18344563245773315, -0.1662580370903015, -0.14907044172286987, -0.13188286125659943, -0.11469526588916779, -0.09750768542289734, -0.0803200975060463, -0.06313250958919525, -0.045944929122924805, -0.02875734120607376, -0.011569753289222717, 0.005617832764983177, 0.02280541881918907, 0.03999300301074982, 0.05718059092760086, 0.0743681788444519, 0.09155575931072235, 0.1087433472275734, 0.12593090534210205, 0.1431184858083725, 0.16030608117580414, 0.17749366164207458, 0.19468125700950623, 0.21186883747577667, 0.22905641794204712, 0.24624401330947876, 0.2634316086769104, 0.28061920404434204, 0.2978067696094513, 0.31499436497688293, 0.3321819603443146, 0.34936952590942383, 0.36655712127685547, 0.3837447166442871, 0.40093228220939636, 0.418119877576828, 0.43530744314193726, 0.4524950385093689, 0.46968263387680054, 0.4868702292442322, 0.504057765007019, 0.5212453603744507, 0.5384329557418823, 0.555620551109314, 0.5728081464767456, 0.5899957418441772, 0.6071832776069641, 0.6243708729743958, 0.6415584683418274, 0.658746063709259, 0.6759336590766907]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 2.0, 6.0, 9.0, 17.0, 16.0, 18.0, 30.0, 33.0, 37.0, 33.0, 57.0, 37.0, 48.0, 54.0, 61.0, 48.0, 67.0, 61.0, 57.0, 41.0, 52.0, 36.0, 34.0, 34.0, 20.0, 17.0, 14.0, 10.0, 14.0, 12.0, 2.0, 8.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3645206093788147, -0.3522201478481293, -0.33991971611976624, -0.3276192545890808, -0.3153187930583954, -0.30301833152770996, -0.2907178997993469, -0.2784174382686615, -0.2661169767379761, -0.25381651520729065, -0.24151606857776642, -0.2292156219482422, -0.21691516041755676, -0.20461471378803253, -0.1923142671585083, -0.18001380562782288, -0.16771335899829865, -0.15541291236877441, -0.143112450838089, -0.13081200420856476, -0.11851154267787933, -0.1062110960483551, -0.09391064196825027, -0.08161018788814545, -0.06930973380804062, -0.05700927972793579, -0.04470882564783096, -0.032408375293016434, -0.020107921212911606, -0.007807467132806778, 0.0044929832220077515, 0.01679343730211258, 0.029093891382217407, 0.041394345462322235, 0.05369479954242706, 0.0659952461719513, 0.07829570770263672, 0.09059615433216095, 0.10289660841226578, 0.1151970624923706, 0.12749752402305603, 0.13979797065258026, 0.15209843218326569, 0.16439887881278992, 0.17669934034347534, 0.18899978697299957, 0.2013002336025238, 0.21360069513320923, 0.22590114176273346, 0.2382015883922577, 0.2505020499229431, 0.26280251145362854, 0.2751029431819916, 0.287403404712677, 0.2997038662433624, 0.31200432777404785, 0.3243047595024109, 0.3366052210330963, 0.34890565276145935, 0.3612061142921448, 0.3735065758228302, 0.3858070373535156, 0.39810746908187866, 0.4104079306125641, 0.4227083921432495]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 5.0, 9.0, 13.0, 5.0, 7.0, 14.0, 16.0, 18.0, 30.0, 24.0, 29.0, 28.0, 29.0, 30.0, 30.0, 41.0, 29.0, 40.0, 38.0, 34.0, 34.0, 29.0, 48.0, 27.0, 34.0, 36.0, 26.0, 35.0, 16.0, 28.0, 21.0, 37.0, 21.0, 25.0, 19.0, 20.0, 13.0, 10.0, 6.0, 7.0, 10.0, 1.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0], "bins": [-44.875, -43.5703125, -42.265625, -40.9609375, -39.65625, -38.3515625, -37.046875, -35.7421875, -34.4375, -33.1328125, -31.828125, -30.5234375, -29.21875, -27.9140625, -26.609375, -25.3046875, -24.0, -22.6953125, -21.390625, -20.0859375, -18.78125, -17.4765625, -16.171875, -14.8671875, -13.5625, -12.2578125, -10.953125, -9.6484375, -8.34375, -7.0390625, -5.734375, -4.4296875, -3.125, -1.8203125, -0.515625, 0.7890625, 2.09375, 3.3984375, 4.703125, 6.0078125, 7.3125, 8.6171875, 9.921875, 11.2265625, 12.53125, 13.8359375, 15.140625, 16.4453125, 17.75, 19.0546875, 20.359375, 21.6640625, 22.96875, 24.2734375, 25.578125, 26.8828125, 28.1875, 29.4921875, 30.796875, 32.1015625, 33.40625, 34.7109375, 36.015625, 37.3203125, 38.625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 6.0, 10.0, 3.0, 5.0, 11.0, 11.0, 13.0, 20.0, 12.0, 17.0, 25.0, 27.0, 49.0, 53.0, 98.0, 120.0, 219.0, 352.0, 737.0, 1938.0, 12225.0, 111027.0, 545277.0, 327514.0, 41133.0, 5058.0, 1191.0, 539.0, 268.0, 150.0, 116.0, 63.0, 41.0, 36.0, 25.0, 30.0, 26.0, 18.0, 28.0, 15.0, 9.0, 10.0, 2.0, 7.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-8.7265625, -8.4603271484375, -8.194091796875, -7.9278564453125, -7.66162109375, -7.3953857421875, -7.129150390625, -6.8629150390625, -6.5966796875, -6.3304443359375, -6.064208984375, -5.7979736328125, -5.53173828125, -5.2655029296875, -4.999267578125, -4.7330322265625, -4.466796875, -4.2005615234375, -3.934326171875, -3.6680908203125, -3.40185546875, -3.1356201171875, -2.869384765625, -2.6031494140625, -2.3369140625, -2.0706787109375, -1.804443359375, -1.5382080078125, -1.27197265625, -1.0057373046875, -0.739501953125, -0.4732666015625, -0.20703125, 0.0592041015625, 0.325439453125, 0.5916748046875, 0.85791015625, 1.1241455078125, 1.390380859375, 1.6566162109375, 1.9228515625, 2.1890869140625, 2.455322265625, 2.7215576171875, 2.98779296875, 3.2540283203125, 3.520263671875, 3.7864990234375, 4.052734375, 4.3189697265625, 4.585205078125, 4.8514404296875, 5.11767578125, 5.3839111328125, 5.650146484375, 5.9163818359375, 6.1826171875, 6.4488525390625, 6.715087890625, 6.9813232421875, 7.24755859375, 7.5137939453125, 7.780029296875, 8.0462646484375, 8.3125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 8.0, 8.0, 10.0, 22.0, 36.0, 39.0, 59.0, 59.0, 87.0, 93.0, 404.0, 1837.0, 76.0, 83.0, 58.0, 50.0, 32.0, 31.0, 31.0, 7.0, 9.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-144.125, -140.3349609375, -136.544921875, -132.7548828125, -128.96484375, -125.1748046875, -121.384765625, -117.5947265625, -113.8046875, -110.0146484375, -106.224609375, -102.4345703125, -98.64453125, -94.8544921875, -91.064453125, -87.2744140625, -83.484375, -79.6943359375, -75.904296875, -72.1142578125, -68.32421875, -64.5341796875, -60.744140625, -56.9541015625, -53.1640625, -49.3740234375, -45.583984375, -41.7939453125, -38.00390625, -34.2138671875, -30.423828125, -26.6337890625, -22.84375, -19.0537109375, -15.263671875, -11.4736328125, -7.68359375, -3.8935546875, -0.103515625, 3.6865234375, 7.4765625, 11.2666015625, 15.056640625, 18.8466796875, 22.63671875, 26.4267578125, 30.216796875, 34.0068359375, 37.796875, 41.5869140625, 45.376953125, 49.1669921875, 52.95703125, 56.7470703125, 60.537109375, 64.3271484375, 68.1171875, 71.9072265625, 75.697265625, 79.4873046875, 83.27734375, 87.0673828125, 90.857421875, 94.6474609375, 98.4375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 3.0, 10.0, 14.0, 22.0, 36.0, 84.0, 145.0, 282.0, 687.0, 1877.0, 8050.0, 168866.0, 2902266.0, 56145.0, 4749.0, 1402.0, 560.0, 232.0, 111.0, 55.0, 33.0, 24.0, 11.0, 8.0, 8.0, 7.0, 7.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.0859375, -10.708251953125, -10.33056640625, -9.952880859375, -9.5751953125, -9.197509765625, -8.81982421875, -8.442138671875, -8.064453125, -7.686767578125, -7.30908203125, -6.931396484375, -6.5537109375, -6.176025390625, -5.79833984375, -5.420654296875, -5.04296875, -4.665283203125, -4.28759765625, -3.909912109375, -3.5322265625, -3.154541015625, -2.77685546875, -2.399169921875, -2.021484375, -1.643798828125, -1.26611328125, -0.888427734375, -0.5107421875, -0.133056640625, 0.24462890625, 0.622314453125, 1.0, 1.377685546875, 1.75537109375, 2.133056640625, 2.5107421875, 2.888427734375, 3.26611328125, 3.643798828125, 4.021484375, 4.399169921875, 4.77685546875, 5.154541015625, 5.5322265625, 5.909912109375, 6.28759765625, 6.665283203125, 7.04296875, 7.420654296875, 7.79833984375, 8.176025390625, 8.5537109375, 8.931396484375, 9.30908203125, 9.686767578125, 10.064453125, 10.442138671875, 10.81982421875, 11.197509765625, 11.5751953125, 11.952880859375, 12.33056640625, 12.708251953125, 13.0859375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 5.0, 4.0, 10.0, 13.0, 26.0, 57.0, 96.0, 136.0, 182.0, 146.0, 118.0, 71.0, 34.0, 31.0, 16.0, 10.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-99.04679107666016, -95.68722534179688, -92.32765197753906, -88.96808624267578, -85.6085205078125, -82.24895477294922, -78.88938903808594, -75.52981567382812, -72.17024993896484, -68.81068420410156, -65.45111083984375, -62.09154510498047, -58.73197937011719, -55.372413635253906, -52.01284408569336, -48.65327453613281, -45.29370880126953, -41.93414306640625, -38.5745735168457, -35.215003967285156, -31.855438232421875, -28.49587059020996, -25.136302947998047, -21.776735305786133, -18.41716766357422, -15.057600021362305, -11.69803237915039, -8.338464736938477, -4.9788970947265625, -1.6193294525146484, 1.7402381896972656, 5.09980583190918, 8.459373474121094, 11.818941116333008, 15.178508758544922, 18.538076400756836, 21.89764404296875, 25.257211685180664, 28.616779327392578, 31.976346969604492, 35.335914611816406, 38.69548034667969, 42.055049896240234, 45.41461944580078, 48.77418518066406, 52.133750915527344, 55.49332046508789, 58.85289001464844, 62.21245574951172, 65.572021484375, 68.93159484863281, 72.2911605834961, 75.65072631835938, 79.01029205322266, 82.36985778808594, 85.72943115234375, 89.08899688720703, 92.44856262207031, 95.80813598632812, 99.1677017211914, 102.52726745605469, 105.88683319091797, 109.24639892578125, 112.60597229003906, 115.96553802490234]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 9.0, 4.0, 6.0, 7.0, 15.0, 19.0, 17.0, 22.0, 27.0, 14.0, 29.0, 22.0, 22.0, 44.0, 30.0, 32.0, 35.0, 45.0, 38.0, 51.0, 40.0, 43.0, 44.0, 32.0, 29.0, 52.0, 31.0, 34.0, 35.0, 21.0, 26.0, 19.0, 16.0, 12.0, 15.0, 11.0, 11.0, 10.0, 7.0, 7.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-91.53153228759766, -88.742431640625, -85.95333099365234, -83.16423034667969, -80.3751220703125, -77.58602142333984, -74.79692077636719, -72.00782012939453, -69.21871948242188, -66.42961883544922, -63.6405143737793, -60.85141372680664, -58.06230926513672, -55.27320861816406, -52.484107971191406, -49.69500732421875, -46.90589904785156, -44.116798400878906, -41.327693939208984, -38.53859329223633, -35.749488830566406, -32.96038818359375, -30.171287536621094, -27.382184982299805, -24.593082427978516, -21.803979873657227, -19.014877319335938, -16.22577667236328, -13.436674118041992, -10.647571563720703, -7.858470916748047, -5.069368362426758, -2.2802734375, 0.5088286399841309, 3.2979307174682617, 6.087032318115234, 8.876134872436523, 11.665237426757812, 14.454338073730469, 17.243440628051758, 20.032543182373047, 22.821645736694336, 25.610748291015625, 28.39984893798828, 31.18895149230957, 33.97805404663086, 36.767154693603516, 39.55625915527344, 42.345359802246094, 45.13446044921875, 47.92356491088867, 50.71266555786133, 53.50177001953125, 56.290870666503906, 59.07997131347656, 61.86907196044922, 64.65817260742188, 67.44727325439453, 70.23637390136719, 73.02548217773438, 75.81458282470703, 78.60368347167969, 81.39278411865234, 84.181884765625, 86.97099304199219]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 9.0, 1.0, 8.0, 2.0, 12.0, 8.0, 29.0, 34.0, 62.0, 75.0, 137.0, 226.0, 313.0, 526.0, 750.0, 1173.0, 1771.0, 2689.0, 3802.0, 5942.0, 1014552.0, 5400.0, 3578.0, 2552.0, 1691.0, 1135.0, 767.0, 452.0, 290.0, 213.0, 113.0, 83.0, 50.0, 41.0, 20.0, 15.0, 10.0, 8.0, 5.0, 7.0, 3.0, 1.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.844104766845703, -17.257566452026367, -16.6710262298584, -16.084487915039062, -15.49794864654541, -14.911409378051758, -14.324870109558105, -13.738330841064453, -13.151792526245117, -12.565253257751465, -11.978713989257812, -11.392175674438477, -10.805636405944824, -10.219097137451172, -9.63255786895752, -9.046018600463867, -8.459479331970215, -7.8729400634765625, -7.286401271820068, -6.699862003326416, -6.113323211669922, -5.5267839431762695, -4.940244674682617, -4.353705883026123, -3.7671666145324707, -3.1806275844573975, -2.594088554382324, -2.007549285888672, -1.4210102558135986, -0.8344712257385254, -0.24793195724487305, 0.3386068344116211, 0.9251461029052734, 1.5116851329803467, 2.09822416305542, 2.6847634315490723, 3.2713024616241455, 3.8578414916992188, 4.444380760192871, 5.030919551849365, 5.617458820343018, 6.20399808883667, 6.790536880493164, 7.377076148986816, 7.963615417480469, 8.550153732299805, 9.136693954467773, 9.72323226928711, 10.309771537780762, 10.896310806274414, 11.482850074768066, 12.069389343261719, 12.655927658081055, 13.242466926574707, 13.82900619506836, 14.415544509887695, 15.002084732055664, 15.588624000549316, 16.17516326904297, 16.761701583862305, 17.348241806030273, 17.93478012084961, 18.521320343017578, 19.107858657836914, 19.69439697265625]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 9.0, 8.0, 17.0, 26.0, 66.0, 226.0, 51357680.0, 105023.0, 152.0, 47.0, 23.0, 8.0, 12.0, 5.0, 5.0, 8.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1286.7197265625, -1243.8087158203125, -1200.897705078125, -1157.9866943359375, -1115.07568359375, -1072.1646728515625, -1029.253662109375, -986.3425903320312, -943.4315795898438, -900.5205688476562, -857.6095581054688, -814.698486328125, -771.7874755859375, -728.87646484375, -685.9654541015625, -643.054443359375, -600.1434326171875, -557.232421875, -514.3214111328125, -471.4103698730469, -428.4993591308594, -385.5883483886719, -342.67730712890625, -299.76629638671875, -256.85528564453125, -213.94427490234375, -171.0332489013672, -128.12222290039062, -85.21121215820312, -42.300201416015625, 0.61083984375, 43.5218505859375, 86.432861328125, 129.3438720703125, 172.25489807128906, 215.16592407226562, 258.0769348144531, 300.9879455566406, 343.89898681640625, 386.80999755859375, 429.72100830078125, 472.63201904296875, 515.5430297851562, 558.4541015625, 601.3651123046875, 644.276123046875, 687.1871337890625, 730.09814453125, 773.0091552734375, 815.920166015625, 858.8311767578125, 901.7421875, 944.6531982421875, 987.564208984375, 1030.475341796875, 1073.38623046875, 1116.29736328125, 1159.2083740234375, 1202.119384765625, 1245.0303955078125, 1287.94140625, 1330.8524169921875, 1373.763427734375, 1416.674560546875, 1459.58544921875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 7.0, 9.0, 16.0, 11.0, 14.0, 23.0, 32.0, 78.0, 101.0, 140.0, 159.0, 127.0, 101.0, 53.0, 40.0, 21.0, 15.0, 14.0, 3.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-110.87443542480469, -107.54249572753906, -104.21056365966797, -100.87862396240234, -97.54668426513672, -94.21475219726562, -90.8828125, -87.55087280273438, -84.21893310546875, -80.88699340820312, -77.55506134033203, -74.2231216430664, -70.89118194580078, -67.55924987792969, -64.22731018066406, -60.89537048339844, -57.563438415527344, -54.231502532958984, -50.89956283569336, -47.567626953125, -44.235687255859375, -40.903751373291016, -37.571815490722656, -34.23987579345703, -30.907939910888672, -27.57600212097168, -24.244064331054688, -20.912128448486328, -17.580190658569336, -14.248252868652344, -10.916316986083984, -7.584379196166992, -4.25244140625, -0.920504093170166, 2.411433219909668, 5.743370056152344, 9.075307846069336, 12.407245635986328, 15.739181518554688, 19.07111930847168, 22.403057098388672, 25.734994888305664, 29.066932678222656, 32.398868560791016, 35.730804443359375, 39.062744140625, 42.39468002319336, 45.72661590576172, 49.058555603027344, 52.3904914855957, 55.72243118286133, 59.05436706542969, 62.38630676269531, 65.71824645996094, 69.05017852783203, 72.38211822509766, 75.71405029296875, 79.04598999023438, 82.37792205810547, 85.7098617553711, 89.04180145263672, 92.37373352050781, 95.70567321777344, 99.03761291503906, 102.36955261230469]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 9.0, 6.0, 8.0, 14.0, 18.0, 11.0, 20.0, 27.0, 35.0, 35.0, 37.0, 49.0, 71.0, 60.0, 71.0, 69.0, 70.0, 59.0, 49.0, 50.0, 50.0, 35.0, 32.0, 25.0, 30.0, 20.0, 6.0, 11.0, 13.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.3824691772461, -97.91344451904297, -94.44441223144531, -90.97538757324219, -87.50635528564453, -84.0373306274414, -80.56829833984375, -77.09927368164062, -73.6302490234375, -70.16122436523438, -66.69219207763672, -63.223167419433594, -59.7541389465332, -56.28511047363281, -52.81608200073242, -49.34705352783203, -45.87802505493164, -42.40899658203125, -38.93996810913086, -35.47093963623047, -32.001914978027344, -28.532886505126953, -25.063858032226562, -21.594831466674805, -18.125802993774414, -14.65677547454834, -11.187747955322266, -7.718719482421875, -4.249691963195801, -0.7806644439697266, 2.688364028930664, 6.157390594482422, 9.626419067382812, 13.095446586608887, 16.56447410583496, 20.03350257873535, 23.50252914428711, 26.9715576171875, 30.44058609008789, 33.90961456298828, 37.378639221191406, 40.8476676940918, 44.31669616699219, 47.78572082519531, 51.2547492980957, 54.723777770996094, 58.192806243896484, 61.661834716796875, 65.130859375, 68.59988403320312, 72.06891632080078, 75.5379409790039, 79.00697326660156, 82.47599792480469, 85.94502258300781, 89.41405487060547, 92.88308715820312, 96.35211181640625, 99.8211441040039, 103.29016876220703, 106.75920104980469, 110.22822570800781, 113.69725036621094, 117.1662826538086, 120.63530731201172]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 8.0, 13.0, 7.0, 11.0, 21.0, 26.0, 39.0, 74.0, 84.0, 116.0, 169.0, 250.0, 338.0, 417.0, 609.0, 842.0, 1156.0, 1672.0, 2407.0, 3642.0, 5337.0, 8253.0, 13725.0, 26337.0, 68577.0, 525829.0, 3336509.0, 110440.0, 35959.0, 18360.0, 10449.0, 6798.0, 4421.0, 3062.0, 2089.0, 1593.0, 1138.0, 895.0, 668.0, 474.0, 369.0, 300.0, 205.0, 152.0, 117.0, 86.0, 78.0, 49.0, 26.0, 29.0, 21.0, 11.0, 15.0, 5.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.205078125, -3.09527587890625, -2.9854736328125, -2.87567138671875, -2.765869140625, -2.65606689453125, -2.5462646484375, -2.43646240234375, -2.32666015625, -2.21685791015625, -2.1070556640625, -1.99725341796875, -1.887451171875, -1.77764892578125, -1.6678466796875, -1.55804443359375, -1.4482421875, -1.33843994140625, -1.2286376953125, -1.11883544921875, -1.009033203125, -0.89923095703125, -0.7894287109375, -0.67962646484375, -0.56982421875, -0.46002197265625, -0.3502197265625, -0.24041748046875, -0.130615234375, -0.02081298828125, 0.0889892578125, 0.19879150390625, 0.30859375, 0.41839599609375, 0.5281982421875, 0.63800048828125, 0.747802734375, 0.85760498046875, 0.9674072265625, 1.07720947265625, 1.18701171875, 1.29681396484375, 1.4066162109375, 1.51641845703125, 1.626220703125, 1.73602294921875, 1.8458251953125, 1.95562744140625, 2.0654296875, 2.17523193359375, 2.2850341796875, 2.39483642578125, 2.504638671875, 2.61444091796875, 2.7242431640625, 2.83404541015625, 2.94384765625, 3.05364990234375, 3.1634521484375, 3.27325439453125, 3.383056640625, 3.49285888671875, 3.6026611328125, 3.71246337890625, 3.822265625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 2.0, 2.0, 2.0, 4.0, 4.0, 15.0, 10.0, 8.0, 16.0, 17.0, 30.0, 73.0, 201.0, 287.0, 155.0, 59.0, 24.0, 13.0, 10.0, 15.0, 8.0, 5.0, 6.0, 1.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.6826171875, -0.6622085571289062, -0.6417999267578125, -0.6213912963867188, -0.600982666015625, -0.5805740356445312, -0.5601654052734375, -0.5397567749023438, -0.51934814453125, -0.49893951416015625, -0.4785308837890625, -0.45812225341796875, -0.437713623046875, -0.41730499267578125, -0.3968963623046875, -0.37648773193359375, -0.3560791015625, -0.33567047119140625, -0.3152618408203125, -0.29485321044921875, -0.274444580078125, -0.25403594970703125, -0.2336273193359375, -0.21321868896484375, -0.19281005859375, -0.17240142822265625, -0.1519927978515625, -0.13158416748046875, -0.111175537109375, -0.09076690673828125, -0.0703582763671875, -0.04994964599609375, -0.029541015625, -0.00913238525390625, 0.0112762451171875, 0.03168487548828125, 0.052093505859375, 0.07250213623046875, 0.0929107666015625, 0.11331939697265625, 0.13372802734375, 0.15413665771484375, 0.1745452880859375, 0.19495391845703125, 0.215362548828125, 0.23577117919921875, 0.2561798095703125, 0.27658843994140625, 0.2969970703125, 0.31740570068359375, 0.3378143310546875, 0.35822296142578125, 0.378631591796875, 0.39904022216796875, 0.4194488525390625, 0.43985748291015625, 0.46026611328125, 0.48067474365234375, 0.5010833740234375, 0.5214920043945312, 0.541900634765625, 0.5623092651367188, 0.5827178955078125, 0.6031265258789062, 0.62353515625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 5.0, 13.0, 23.0, 25.0, 31.0, 51.0, 72.0, 104.0, 188.0, 275.0, 525.0, 845.0, 1452.0, 2794.0, 5539.0, 12474.0, 33168.0, 111639.0, 665385.0, 2935788.0, 310934.0, 70383.0, 23220.0, 9512.0, 4522.0, 2266.0, 1226.0, 629.0, 453.0, 282.0, 148.0, 90.0, 61.0, 49.0, 35.0, 18.0, 20.0, 11.0, 7.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.380859375, -3.265533447265625, -3.15020751953125, -3.034881591796875, -2.9195556640625, -2.804229736328125, -2.68890380859375, -2.573577880859375, -2.458251953125, -2.342926025390625, -2.22760009765625, -2.112274169921875, -1.9969482421875, -1.881622314453125, -1.76629638671875, -1.650970458984375, -1.53564453125, -1.420318603515625, -1.30499267578125, -1.189666748046875, -1.0743408203125, -0.959014892578125, -0.84368896484375, -0.728363037109375, -0.613037109375, -0.497711181640625, -0.38238525390625, -0.267059326171875, -0.1517333984375, -0.036407470703125, 0.07891845703125, 0.194244384765625, 0.3095703125, 0.424896240234375, 0.54022216796875, 0.655548095703125, 0.7708740234375, 0.886199951171875, 1.00152587890625, 1.116851806640625, 1.232177734375, 1.347503662109375, 1.46282958984375, 1.578155517578125, 1.6934814453125, 1.808807373046875, 1.92413330078125, 2.039459228515625, 2.15478515625, 2.270111083984375, 2.38543701171875, 2.500762939453125, 2.6160888671875, 2.731414794921875, 2.84674072265625, 2.962066650390625, 3.077392578125, 3.192718505859375, 3.30804443359375, 3.423370361328125, 3.5386962890625, 3.654022216796875, 3.76934814453125, 3.884674072265625, 4.0]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 9.0, 8.0, 7.0, 11.0, 27.0, 25.0, 33.0, 31.0, 46.0, 72.0, 77.0, 137.0, 205.0, 310.0, 463.0, 890.0, 548.0, 325.0, 217.0, 152.0, 93.0, 84.0, 51.0, 50.0, 28.0, 45.0, 27.0, 15.0, 14.0, 9.0, 15.0, 11.0, 1.0, 11.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.8486328125, -0.8218612670898438, -0.7950897216796875, -0.7683181762695312, -0.741546630859375, -0.7147750854492188, -0.6880035400390625, -0.6612319946289062, -0.63446044921875, -0.6076889038085938, -0.5809173583984375, -0.5541458129882812, -0.527374267578125, -0.5006027221679688, -0.4738311767578125, -0.44705963134765625, -0.4202880859375, -0.39351654052734375, -0.3667449951171875, -0.33997344970703125, -0.313201904296875, -0.28643035888671875, -0.2596588134765625, -0.23288726806640625, -0.20611572265625, -0.17934417724609375, -0.1525726318359375, -0.12580108642578125, -0.099029541015625, -0.07225799560546875, -0.0454864501953125, -0.01871490478515625, 0.008056640625, 0.03482818603515625, 0.0615997314453125, 0.08837127685546875, 0.115142822265625, 0.14191436767578125, 0.1686859130859375, 0.19545745849609375, 0.22222900390625, 0.24900054931640625, 0.2757720947265625, 0.30254364013671875, 0.329315185546875, 0.35608673095703125, 0.3828582763671875, 0.40962982177734375, 0.4364013671875, 0.46317291259765625, 0.4899444580078125, 0.5167160034179688, 0.543487548828125, 0.5702590942382812, 0.5970306396484375, 0.6238021850585938, 0.65057373046875, 0.6773452758789062, 0.7041168212890625, 0.7308883666992188, 0.757659912109375, 0.7844314575195312, 0.8112030029296875, 0.8379745483398438, 0.86474609375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 9.0, 8.0, 18.0, 25.0, 12.0, 52.0, 43.0, 70.0, 120.0, 120.0, 130.0, 102.0, 106.0, 59.0, 40.0, 21.0, 11.0, 13.0, 13.0, 2.0, 5.0, 5.0, 8.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125276565551758, -5.868943214416504, -5.61260986328125, -5.356276035308838, -5.099942684173584, -4.84360933303833, -4.587275505065918, -4.330942153930664, -4.07460880279541, -3.8182754516601562, -3.5619418621063232, -3.3056082725524902, -3.0492749214172363, -2.7929415702819824, -2.5366079807281494, -2.2802743911743164, -2.0239410400390625, -1.767607569694519, -1.5112740993499756, -1.2549406290054321, -0.9986071586608887, -0.7422736883163452, -0.48594021797180176, -0.2296067476272583, 0.026726722717285156, 0.2830601930618286, 0.5393936634063721, 0.7957271337509155, 1.052060604095459, 1.3083940744400024, 1.564727544784546, 1.8210610151290894, 2.077394485473633, 2.3337278366088867, 2.5900614261627197, 2.8463950157165527, 3.1027283668518066, 3.3590617179870605, 3.6153953075408936, 3.8717288970947266, 4.1280622482299805, 4.384395599365234, 4.640728950500488, 4.8970627784729, 5.153396129608154, 5.409729480743408, 5.66606330871582, 5.922396659851074, 6.178730010986328, 6.435063362121582, 6.691396713256836, 6.947730541229248, 7.204063892364502, 7.460397243499756, 7.716731071472168, 7.973064422607422, 8.229397773742676, 8.48573112487793, 8.742064476013184, 8.998397827148438, 9.254732131958008, 9.511065483093262, 9.767398834228516, 10.02373218536377, 10.280065536499023]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 10.0, 6.0, 18.0, 21.0, 28.0, 19.0, 20.0, 38.0, 45.0, 37.0, 57.0, 46.0, 50.0, 43.0, 60.0, 48.0, 48.0, 47.0, 47.0, 41.0, 45.0, 40.0, 28.0, 30.0, 37.0, 13.0, 12.0, 14.0, 10.0, 10.0, 10.0, 8.0, 2.0, 0.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.141849517822266, -4.988551616668701, -4.835253715515137, -4.681955814361572, -4.528657913208008, -4.375360012054443, -4.222062110900879, -4.068763732910156, -3.915466070175171, -3.7621681690216064, -3.608870267868042, -3.4555723667144775, -3.302274227142334, -3.1489763259887695, -2.995678424835205, -2.8423805236816406, -2.689082622528076, -2.5357847213745117, -2.3824868202209473, -2.229188919067383, -2.0758910179138184, -1.9225929975509644, -1.7692949771881104, -1.615997076034546, -1.4626991748809814, -1.309401273727417, -1.1561033725738525, -1.0028053522109985, -0.8495074510574341, -0.6962095499038696, -0.5429115891456604, -0.38961362838745117, -0.23631525039672852, -0.08301731944084167, 0.07028061151504517, 0.223578542470932, 0.37687647342681885, 0.5301743745803833, 0.6834723353385925, 0.8367702960968018, 0.9900681972503662, 1.1433660984039307, 1.2966639995574951, 1.4499620199203491, 1.6032599210739136, 1.756557822227478, 1.909855842590332, 2.0631537437438965, 2.216451644897461, 2.3697495460510254, 2.52304744720459, 2.6763453483581543, 2.8296432495117188, 2.982941150665283, 3.1362392902374268, 3.289537191390991, 3.4428350925445557, 3.59613299369812, 3.7494308948516846, 3.902728796005249, 4.056026935577393, 4.209324836730957, 4.3626227378845215, 4.515920639038086, 4.66921854019165]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 13.0, 17.0, 36.0, 49.0, 67.0, 81.0, 141.0, 196.0, 300.0, 481.0, 657.0, 974.0, 1422.0, 1983.0, 2850.0, 4281.0, 5928.0, 8617.0, 12696.0, 20712.0, 48055.0, 183081.0, 441562.0, 199763.0, 51513.0, 21381.0, 12993.0, 8705.0, 6090.0, 4256.0, 3013.0, 2097.0, 1429.0, 973.0, 676.0, 475.0, 312.0, 203.0, 156.0, 92.0, 69.0, 40.0, 39.0, 30.0, 18.0, 12.0, 4.0, 5.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.98828125, -1.92315673828125, -1.8580322265625, -1.79290771484375, -1.727783203125, -1.66265869140625, -1.5975341796875, -1.53240966796875, -1.46728515625, -1.40216064453125, -1.3370361328125, -1.27191162109375, -1.206787109375, -1.14166259765625, -1.0765380859375, -1.01141357421875, -0.9462890625, -0.88116455078125, -0.8160400390625, -0.75091552734375, -0.685791015625, -0.62066650390625, -0.5555419921875, -0.49041748046875, -0.42529296875, -0.36016845703125, -0.2950439453125, -0.22991943359375, -0.164794921875, -0.09967041015625, -0.0345458984375, 0.03057861328125, 0.095703125, 0.16082763671875, 0.2259521484375, 0.29107666015625, 0.356201171875, 0.42132568359375, 0.4864501953125, 0.55157470703125, 0.61669921875, 0.68182373046875, 0.7469482421875, 0.81207275390625, 0.877197265625, 0.94232177734375, 1.0074462890625, 1.07257080078125, 1.1376953125, 1.20281982421875, 1.2679443359375, 1.33306884765625, 1.398193359375, 1.46331787109375, 1.5284423828125, 1.59356689453125, 1.65869140625, 1.72381591796875, 1.7889404296875, 1.85406494140625, 1.919189453125, 1.98431396484375, 2.0494384765625, 2.11456298828125, 2.1796875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 3.0, 3.0, 5.0, 10.0, 8.0, 10.0, 25.0, 42.0, 82.0, 160.0, 225.0, 161.0, 85.0, 61.0, 26.0, 15.0, 13.0, 6.0, 10.0, 3.0, 4.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.72314453125, -0.701751708984375, -0.68035888671875, -0.658966064453125, -0.6375732421875, -0.616180419921875, -0.59478759765625, -0.573394775390625, -0.552001953125, -0.530609130859375, -0.50921630859375, -0.487823486328125, -0.4664306640625, -0.445037841796875, -0.42364501953125, -0.402252197265625, -0.380859375, -0.359466552734375, -0.33807373046875, -0.316680908203125, -0.2952880859375, -0.273895263671875, -0.25250244140625, -0.231109619140625, -0.209716796875, -0.188323974609375, -0.16693115234375, -0.145538330078125, -0.1241455078125, -0.102752685546875, -0.08135986328125, -0.059967041015625, -0.03857421875, -0.017181396484375, 0.00421142578125, 0.025604248046875, 0.0469970703125, 0.068389892578125, 0.08978271484375, 0.111175537109375, 0.132568359375, 0.153961181640625, 0.17535400390625, 0.196746826171875, 0.2181396484375, 0.239532470703125, 0.26092529296875, 0.282318115234375, 0.3037109375, 0.325103759765625, 0.34649658203125, 0.367889404296875, 0.3892822265625, 0.410675048828125, 0.43206787109375, 0.453460693359375, 0.474853515625, 0.496246337890625, 0.51763916015625, 0.539031982421875, 0.5604248046875, 0.581817626953125, 0.60321044921875, 0.624603271484375, 0.64599609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 7.0, 5.0, 12.0, 13.0, 18.0, 28.0, 38.0, 57.0, 81.0, 133.0, 199.0, 279.0, 461.0, 762.0, 1236.0, 2029.0, 3373.0, 6043.0, 11106.0, 21888.0, 47783.0, 114403.0, 251536.0, 303278.0, 157187.0, 65358.0, 29000.0, 13999.0, 7545.0, 4219.0, 2466.0, 1493.0, 909.0, 568.0, 362.0, 219.0, 156.0, 110.0, 78.0, 35.0, 26.0, 18.0, 13.0, 8.0, 8.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.095703125, -2.023895263671875, -1.95208740234375, -1.880279541015625, -1.8084716796875, -1.736663818359375, -1.66485595703125, -1.593048095703125, -1.521240234375, -1.449432373046875, -1.37762451171875, -1.305816650390625, -1.2340087890625, -1.162200927734375, -1.09039306640625, -1.018585205078125, -0.94677734375, -0.874969482421875, -0.80316162109375, -0.731353759765625, -0.6595458984375, -0.587738037109375, -0.51593017578125, -0.444122314453125, -0.372314453125, -0.300506591796875, -0.22869873046875, -0.156890869140625, -0.0850830078125, -0.013275146484375, 0.05853271484375, 0.130340576171875, 0.2021484375, 0.273956298828125, 0.34576416015625, 0.417572021484375, 0.4893798828125, 0.561187744140625, 0.63299560546875, 0.704803466796875, 0.776611328125, 0.848419189453125, 0.92022705078125, 0.992034912109375, 1.0638427734375, 1.135650634765625, 1.20745849609375, 1.279266357421875, 1.35107421875, 1.422882080078125, 1.49468994140625, 1.566497802734375, 1.6383056640625, 1.710113525390625, 1.78192138671875, 1.853729248046875, 1.925537109375, 1.997344970703125, 2.06915283203125, 2.140960693359375, 2.2127685546875, 2.284576416015625, 2.35638427734375, 2.428192138671875, 2.5]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 2.0, 6.0, 7.0, 15.0, 13.0, 12.0, 18.0, 13.0, 18.0, 22.0, 26.0, 22.0, 27.0, 45.0, 40.0, 46.0, 45.0, 46.0, 52.0, 34.0, 36.0, 45.0, 42.0, 37.0, 42.0, 43.0, 38.0, 34.0, 20.0, 20.0, 20.0, 23.0, 14.0, 17.0, 9.0, 10.0, 11.0, 11.0, 3.0, 3.0, 8.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.412109375, -2.33538818359375, -2.2586669921875, -2.18194580078125, -2.105224609375, -2.02850341796875, -1.9517822265625, -1.87506103515625, -1.79833984375, -1.72161865234375, -1.6448974609375, -1.56817626953125, -1.491455078125, -1.41473388671875, -1.3380126953125, -1.26129150390625, -1.1845703125, -1.10784912109375, -1.0311279296875, -0.95440673828125, -0.877685546875, -0.80096435546875, -0.7242431640625, -0.64752197265625, -0.57080078125, -0.49407958984375, -0.4173583984375, -0.34063720703125, -0.263916015625, -0.18719482421875, -0.1104736328125, -0.03375244140625, 0.04296875, 0.11968994140625, 0.1964111328125, 0.27313232421875, 0.349853515625, 0.42657470703125, 0.5032958984375, 0.58001708984375, 0.65673828125, 0.73345947265625, 0.8101806640625, 0.88690185546875, 0.963623046875, 1.04034423828125, 1.1170654296875, 1.19378662109375, 1.2705078125, 1.34722900390625, 1.4239501953125, 1.50067138671875, 1.577392578125, 1.65411376953125, 1.7308349609375, 1.80755615234375, 1.88427734375, 1.96099853515625, 2.0377197265625, 2.11444091796875, 2.191162109375, 2.26788330078125, 2.3446044921875, 2.42132568359375, 2.498046875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 9.0, 12.0, 13.0, 10.0, 26.0, 23.0, 27.0, 42.0, 66.0, 90.0, 117.0, 185.0, 256.0, 431.0, 678.0, 1148.0, 2039.0, 4082.0, 8570.0, 21628.0, 88953.0, 621523.0, 234534.0, 38832.0, 12850.0, 5693.0, 2802.0, 1518.0, 810.0, 527.0, 328.0, 227.0, 137.0, 89.0, 74.0, 46.0, 25.0, 27.0, 22.0, 18.0, 15.0, 7.0, 9.0, 6.0, 12.0, 4.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-9.4453125, -9.147705078125, -8.85009765625, -8.552490234375, -8.2548828125, -7.957275390625, -7.65966796875, -7.362060546875, -7.064453125, -6.766845703125, -6.46923828125, -6.171630859375, -5.8740234375, -5.576416015625, -5.27880859375, -4.981201171875, -4.68359375, -4.385986328125, -4.08837890625, -3.790771484375, -3.4931640625, -3.195556640625, -2.89794921875, -2.600341796875, -2.302734375, -2.005126953125, -1.70751953125, -1.409912109375, -1.1123046875, -0.814697265625, -0.51708984375, -0.219482421875, 0.078125, 0.375732421875, 0.67333984375, 0.970947265625, 1.2685546875, 1.566162109375, 1.86376953125, 2.161376953125, 2.458984375, 2.756591796875, 3.05419921875, 3.351806640625, 3.6494140625, 3.947021484375, 4.24462890625, 4.542236328125, 4.83984375, 5.137451171875, 5.43505859375, 5.732666015625, 6.0302734375, 6.327880859375, 6.62548828125, 6.923095703125, 7.220703125, 7.518310546875, 7.81591796875, 8.113525390625, 8.4111328125, 8.708740234375, 9.00634765625, 9.303955078125, 9.6015625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 3.0, 4.0, 3.0, 9.0, 6.0, 8.0, 9.0, 16.0, 21.0, 28.0, 42.0, 55.0, 79.0, 108.0, 132.0, 139.0, 78.0, 67.0, 53.0, 33.0, 26.0, 25.0, 25.0, 10.0, 4.0, 9.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008993148803710938, -0.0008680969476699829, -0.0008368790149688721, -0.0008056610822677612, -0.0007744431495666504, -0.0007432252168655396, -0.0007120072841644287, -0.0006807893514633179, -0.000649571418762207, -0.0006183534860610962, -0.0005871355533599854, -0.0005559176206588745, -0.0005246996879577637, -0.0004934817552566528, -0.000462263822555542, -0.00043104588985443115, -0.0003998279571533203, -0.00036861002445220947, -0.00033739209175109863, -0.0003061741590499878, -0.00027495622634887695, -0.0002437382936477661, -0.00021252036094665527, -0.00018130242824554443, -0.0001500844955444336, -0.00011886656284332275, -8.764863014221191e-05, -5.6430697441101074e-05, -2.5212764739990234e-05, 6.0051679611206055e-06, 3.7223100662231445e-05, 6.844103336334229e-05, 9.965896606445312e-05, 0.00013087689876556396, 0.0001620948314666748, 0.00019331276416778564, 0.00022453069686889648, 0.0002557486295700073, 0.00028696656227111816, 0.000318184494972229, 0.00034940242767333984, 0.0003806203603744507, 0.0004118382930755615, 0.00044305622577667236, 0.0004742741584777832, 0.000505492091178894, 0.0005367100238800049, 0.0005679279565811157, 0.0005991458892822266, 0.0006303638219833374, 0.0006615817546844482, 0.0006927996873855591, 0.0007240176200866699, 0.0007552355527877808, 0.0007864534854888916, 0.0008176714181900024, 0.0008488893508911133, 0.0008801072835922241, 0.000911325216293335, 0.0009425431489944458, 0.0009737610816955566, 0.0010049790143966675, 0.0010361969470977783, 0.0010674148797988892, 0.0010986328125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 10.0, 17.0, 18.0, 17.0, 23.0, 46.0, 68.0, 75.0, 146.0, 288.0, 462.0, 823.0, 1572.0, 3109.0, 6892.0, 17651.0, 61349.0, 380055.0, 465828.0, 75106.0, 20067.0, 7589.0, 3504.0, 1721.0, 882.0, 459.0, 300.0, 171.0, 93.0, 72.0, 38.0, 35.0, 14.0, 13.0, 13.0, 8.0, 4.0, 4.0, 3.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.01953125, -5.82574462890625, -5.6319580078125, -5.43817138671875, -5.244384765625, -5.05059814453125, -4.8568115234375, -4.66302490234375, -4.46923828125, -4.27545166015625, -4.0816650390625, -3.88787841796875, -3.694091796875, -3.50030517578125, -3.3065185546875, -3.11273193359375, -2.9189453125, -2.72515869140625, -2.5313720703125, -2.33758544921875, -2.143798828125, -1.95001220703125, -1.7562255859375, -1.56243896484375, -1.36865234375, -1.17486572265625, -0.9810791015625, -0.78729248046875, -0.593505859375, -0.39971923828125, -0.2059326171875, -0.01214599609375, 0.181640625, 0.37542724609375, 0.5692138671875, 0.76300048828125, 0.956787109375, 1.15057373046875, 1.3443603515625, 1.53814697265625, 1.73193359375, 1.92572021484375, 2.1195068359375, 2.31329345703125, 2.507080078125, 2.70086669921875, 2.8946533203125, 3.08843994140625, 3.2822265625, 3.47601318359375, 3.6697998046875, 3.86358642578125, 4.057373046875, 4.25115966796875, 4.4449462890625, 4.63873291015625, 4.83251953125, 5.02630615234375, 5.2200927734375, 5.41387939453125, 5.607666015625, 5.80145263671875, 5.9952392578125, 6.18902587890625, 6.3828125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 5.0, 2.0, 3.0, 5.0, 11.0, 12.0, 16.0, 20.0, 24.0, 28.0, 29.0, 31.0, 61.0, 71.0, 69.0, 72.0, 74.0, 69.0, 74.0, 66.0, 51.0, 41.0, 32.0, 35.0, 20.0, 26.0, 13.0, 9.0, 7.0, 8.0, 7.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.58203125, -3.471649169921875, -3.36126708984375, -3.250885009765625, -3.1405029296875, -3.030120849609375, -2.91973876953125, -2.809356689453125, -2.698974609375, -2.588592529296875, -2.47821044921875, -2.367828369140625, -2.2574462890625, -2.147064208984375, -2.03668212890625, -1.926300048828125, -1.81591796875, -1.705535888671875, -1.59515380859375, -1.484771728515625, -1.3743896484375, -1.264007568359375, -1.15362548828125, -1.043243408203125, -0.932861328125, -0.822479248046875, -0.71209716796875, -0.601715087890625, -0.4913330078125, -0.380950927734375, -0.27056884765625, -0.160186767578125, -0.0498046875, 0.060577392578125, 0.17095947265625, 0.281341552734375, 0.3917236328125, 0.502105712890625, 0.61248779296875, 0.722869873046875, 0.833251953125, 0.943634033203125, 1.05401611328125, 1.164398193359375, 1.2747802734375, 1.385162353515625, 1.49554443359375, 1.605926513671875, 1.71630859375, 1.826690673828125, 1.93707275390625, 2.047454833984375, 2.1578369140625, 2.268218994140625, 2.37860107421875, 2.488983154296875, 2.599365234375, 2.709747314453125, 2.82012939453125, 2.930511474609375, 3.0408935546875, 3.151275634765625, 3.26165771484375, 3.372039794921875, 3.482421875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 7.0, 7.0, 13.0, 27.0, 74.0, 175.0, 369.0, 211.0, 73.0, 19.0, 16.0, 9.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.4625244140625, -103.82679748535156, -100.19107055664062, -96.55533599853516, -92.91960906982422, -89.28388214111328, -85.64815521240234, -82.01242065429688, -78.37669372558594, -74.740966796875, -71.10523986816406, -67.4695053100586, -63.833778381347656, -60.19805145263672, -56.56232452392578, -52.92659378051758, -49.29086685180664, -45.6551399230957, -42.0194091796875, -38.38368225097656, -34.74795150756836, -31.112224578857422, -27.47649574279785, -23.84076690673828, -20.20503807067871, -16.56930923461914, -12.93358039855957, -9.297852516174316, -5.662123680114746, -2.026395797729492, 1.6093330383300781, 5.245061874389648, 8.880790710449219, 12.516519546508789, 16.15224838256836, 19.787975311279297, 23.4237060546875, 27.059432983398438, 30.695161819458008, 34.33089065551758, 37.96662139892578, 41.60234832763672, 45.23807907104492, 48.87380599975586, 52.50953674316406, 56.145263671875, 59.78099060058594, 63.41672134399414, 67.05244445800781, 70.68817138671875, 74.32389831542969, 77.95963287353516, 81.5953598022461, 85.23108673095703, 88.86681365966797, 92.50254821777344, 96.13827514648438, 99.77400207519531, 103.40972900390625, 107.04546356201172, 110.68119049072266, 114.3169174194336, 117.95264434814453, 121.58837890625, 125.22410583496094]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 1.0, 5.0, 7.0, 1.0, 6.0, 5.0, 18.0, 23.0, 32.0, 61.0, 91.0, 113.0, 158.0, 135.0, 93.0, 75.0, 58.0, 26.0, 14.0, 9.0, 5.0, 10.0, 5.0, 6.0, 4.0, 5.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.16999435424805, -44.762420654296875, -43.35485076904297, -41.9472770690918, -40.539703369140625, -39.13213348388672, -37.72455978393555, -36.316986083984375, -34.90941619873047, -33.5018424987793, -32.09427261352539, -30.68669891357422, -29.27912712097168, -27.87155532836914, -26.46398162841797, -25.05640983581543, -23.64883804321289, -22.24126625061035, -20.833694458007812, -19.42612075805664, -18.0185489654541, -16.610977172851562, -15.203404426574707, -13.795831680297852, -12.388259887695312, -10.980688095092773, -9.573115348815918, -8.165542602539062, -6.757970809936523, -5.350398540496826, -3.942826271057129, -2.5352535247802734, -1.1276779174804688, 0.2798943519592285, 1.6874666213989258, 3.095038890838623, 4.50261116027832, 5.910183429718018, 7.317755699157715, 8.72532844543457, 10.13290023803711, 11.540472030639648, 12.948044776916504, 14.35561752319336, 15.763189315795898, 17.170761108398438, 18.57833480834961, 19.98590660095215, 21.393478393554688, 22.801050186157227, 24.208621978759766, 25.616195678710938, 27.023767471313477, 28.431339263916016, 29.838912963867188, 31.246484756469727, 32.654056549072266, 34.06163024902344, 35.469200134277344, 36.876773834228516, 38.28434753417969, 39.691917419433594, 41.099491119384766, 42.50706481933594, 43.914634704589844]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 12.0, 11.0, 11.0, 24.0, 25.0, 30.0, 37.0, 51.0, 79.0, 109.0, 150.0, 232.0, 341.0, 538.0, 829.0, 1364.0, 2579.0, 5109.0, 11240.0, 33531.0, 224626.0, 3713467.0, 154090.0, 27005.0, 9374.0, 4075.0, 2182.0, 1189.0, 662.0, 404.0, 254.0, 178.0, 125.0, 86.0, 70.0, 46.0, 32.0, 13.0, 22.0, 27.0, 12.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0], "bins": [-8.3828125, -8.14617919921875, -7.9095458984375, -7.67291259765625, -7.436279296875, -7.19964599609375, -6.9630126953125, -6.72637939453125, -6.48974609375, -6.25311279296875, -6.0164794921875, -5.77984619140625, -5.543212890625, -5.30657958984375, -5.0699462890625, -4.83331298828125, -4.5966796875, -4.36004638671875, -4.1234130859375, -3.88677978515625, -3.650146484375, -3.41351318359375, -3.1768798828125, -2.94024658203125, -2.70361328125, -2.46697998046875, -2.2303466796875, -1.99371337890625, -1.757080078125, -1.52044677734375, -1.2838134765625, -1.04718017578125, -0.810546875, -0.57391357421875, -0.3372802734375, -0.10064697265625, 0.135986328125, 0.37261962890625, 0.6092529296875, 0.84588623046875, 1.08251953125, 1.31915283203125, 1.5557861328125, 1.79241943359375, 2.029052734375, 2.26568603515625, 2.5023193359375, 2.73895263671875, 2.9755859375, 3.21221923828125, 3.4488525390625, 3.68548583984375, 3.922119140625, 4.15875244140625, 4.3953857421875, 4.63201904296875, 4.86865234375, 5.10528564453125, 5.3419189453125, 5.57855224609375, 5.815185546875, 6.05181884765625, 6.2884521484375, 6.52508544921875, 6.76171875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 5.0, 5.0, 3.0, 2.0, 8.0, 6.0, 8.0, 4.0, 8.0, 15.0, 17.0, 43.0, 49.0, 72.0, 142.0, 166.0, 132.0, 97.0, 60.0, 54.0, 28.0, 20.0, 5.0, 11.0, 7.0, 8.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.51806640625, -0.499481201171875, -0.48089599609375, -0.462310791015625, -0.4437255859375, -0.425140380859375, -0.40655517578125, -0.387969970703125, -0.369384765625, -0.350799560546875, -0.33221435546875, -0.313629150390625, -0.2950439453125, -0.276458740234375, -0.25787353515625, -0.239288330078125, -0.220703125, -0.202117919921875, -0.18353271484375, -0.164947509765625, -0.1463623046875, -0.127777099609375, -0.10919189453125, -0.090606689453125, -0.072021484375, -0.053436279296875, -0.03485107421875, -0.016265869140625, 0.0023193359375, 0.020904541015625, 0.03948974609375, 0.058074951171875, 0.07666015625, 0.095245361328125, 0.11383056640625, 0.132415771484375, 0.1510009765625, 0.169586181640625, 0.18817138671875, 0.206756591796875, 0.225341796875, 0.243927001953125, 0.26251220703125, 0.281097412109375, 0.2996826171875, 0.318267822265625, 0.33685302734375, 0.355438232421875, 0.3740234375, 0.392608642578125, 0.41119384765625, 0.429779052734375, 0.4483642578125, 0.466949462890625, 0.48553466796875, 0.504119873046875, 0.522705078125, 0.541290283203125, 0.55987548828125, 0.578460693359375, 0.5970458984375, 0.615631103515625, 0.63421630859375, 0.652801513671875, 0.67138671875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 8.0, 6.0, 13.0, 14.0, 18.0, 36.0, 60.0, 92.0, 138.0, 224.0, 450.0, 746.0, 1534.0, 3100.0, 6930.0, 18260.0, 59544.0, 290493.0, 2907022.0, 742481.0, 113289.0, 30083.0, 10725.0, 4590.0, 1995.0, 1095.0, 529.0, 310.0, 182.0, 119.0, 58.0, 38.0, 33.0, 26.0, 13.0, 11.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.90625, -5.73614501953125, -5.5660400390625, -5.39593505859375, -5.225830078125, -5.05572509765625, -4.8856201171875, -4.71551513671875, -4.54541015625, -4.37530517578125, -4.2052001953125, -4.03509521484375, -3.864990234375, -3.69488525390625, -3.5247802734375, -3.35467529296875, -3.1845703125, -3.01446533203125, -2.8443603515625, -2.67425537109375, -2.504150390625, -2.33404541015625, -2.1639404296875, -1.99383544921875, -1.82373046875, -1.65362548828125, -1.4835205078125, -1.31341552734375, -1.143310546875, -0.97320556640625, -0.8031005859375, -0.63299560546875, -0.462890625, -0.29278564453125, -0.1226806640625, 0.04742431640625, 0.217529296875, 0.38763427734375, 0.5577392578125, 0.72784423828125, 0.89794921875, 1.06805419921875, 1.2381591796875, 1.40826416015625, 1.578369140625, 1.74847412109375, 1.9185791015625, 2.08868408203125, 2.2587890625, 2.42889404296875, 2.5989990234375, 2.76910400390625, 2.939208984375, 3.10931396484375, 3.2794189453125, 3.44952392578125, 3.61962890625, 3.78973388671875, 3.9598388671875, 4.12994384765625, 4.300048828125, 4.47015380859375, 4.6402587890625, 4.81036376953125, 4.98046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 4.0, 10.0, 8.0, 14.0, 13.0, 23.0, 29.0, 50.0, 84.0, 96.0, 123.0, 207.0, 305.0, 524.0, 1047.0, 500.0, 328.0, 187.0, 124.0, 86.0, 76.0, 41.0, 44.0, 39.0, 22.0, 14.0, 10.0, 11.0, 8.0, 8.0, 4.0, 4.0, 4.0, 2.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.69482421875, -0.6740875244140625, -0.653350830078125, -0.6326141357421875, -0.61187744140625, -0.5911407470703125, -0.570404052734375, -0.5496673583984375, -0.5289306640625, -0.5081939697265625, -0.487457275390625, -0.4667205810546875, -0.44598388671875, -0.4252471923828125, -0.404510498046875, -0.3837738037109375, -0.363037109375, -0.3423004150390625, -0.321563720703125, -0.3008270263671875, -0.28009033203125, -0.2593536376953125, -0.238616943359375, -0.2178802490234375, -0.1971435546875, -0.1764068603515625, -0.155670166015625, -0.1349334716796875, -0.11419677734375, -0.0934600830078125, -0.072723388671875, -0.0519866943359375, -0.03125, -0.0105133056640625, 0.010223388671875, 0.0309600830078125, 0.05169677734375, 0.0724334716796875, 0.093170166015625, 0.1139068603515625, 0.1346435546875, 0.1553802490234375, 0.176116943359375, 0.1968536376953125, 0.21759033203125, 0.2383270263671875, 0.259063720703125, 0.2798004150390625, 0.300537109375, 0.3212738037109375, 0.342010498046875, 0.3627471923828125, 0.38348388671875, 0.4042205810546875, 0.424957275390625, 0.4456939697265625, 0.4664306640625, 0.4871673583984375, 0.507904052734375, 0.5286407470703125, 0.54937744140625, 0.5701141357421875, 0.590850830078125, 0.6115875244140625, 0.63232421875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 15.0, 63.0, 213.0, 326.0, 251.0, 80.0, 27.0, 15.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-23.600658416748047, -23.09544563293457, -22.590232849121094, -22.085020065307617, -21.57980728149414, -21.074594497680664, -20.569381713867188, -20.06416893005371, -19.558956146240234, -19.053743362426758, -18.54853057861328, -18.043317794799805, -17.538105010986328, -17.03289222717285, -16.527679443359375, -16.0224666595459, -15.517253875732422, -15.012041091918945, -14.506828308105469, -14.001615524291992, -13.496402740478516, -12.991189956665039, -12.485977172851562, -11.980764389038086, -11.47555160522461, -10.970338821411133, -10.465126037597656, -9.95991325378418, -9.454700469970703, -8.949487686157227, -8.44427490234375, -7.939062118530273, -7.433849334716797, -6.92863655090332, -6.423423767089844, -5.918210983276367, -5.412998199462891, -4.907785415649414, -4.4025726318359375, -3.897359848022461, -3.3921470642089844, -2.886934280395508, -2.3817214965820312, -1.8765087127685547, -1.3712959289550781, -0.8660831451416016, -0.360870361328125, 0.14434242248535156, 0.6495552062988281, 1.1547679901123047, 1.6599807739257812, 2.165193557739258, 2.6704063415527344, 3.175619125366211, 3.6808319091796875, 4.186044692993164, 4.691257476806641, 5.196470260620117, 5.701683044433594, 6.20689582824707, 6.712108612060547, 7.217321395874023, 7.7225341796875, 8.227746963500977, 8.732959747314453]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 3.0, 8.0, 12.0, 7.0, 16.0, 9.0, 15.0, 28.0, 22.0, 38.0, 46.0, 66.0, 60.0, 46.0, 70.0, 72.0, 73.0, 73.0, 59.0, 44.0, 43.0, 48.0, 26.0, 21.0, 20.0, 14.0, 14.0, 14.0, 5.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.3469691276550293, -3.228933572769165, -3.110898017883301, -2.9928627014160156, -2.8748271465301514, -2.756791591644287, -2.638756036758423, -2.5207204818725586, -2.4026851654052734, -2.284649610519409, -2.166614055633545, -2.0485787391662598, -1.9305431842803955, -1.8125076293945312, -1.694472074508667, -1.5764366388320923, -1.458401083946228, -1.3403655290603638, -1.222330093383789, -1.1042945384979248, -0.9862591028213501, -0.8682235479354858, -0.7501880526542664, -0.6321525573730469, -0.5141170620918274, -0.3960815668106079, -0.2780460715293884, -0.16001054644584656, -0.041975051164627075, 0.0760604739189148, 0.19409596920013428, 0.31213146448135376, 0.43016695976257324, 0.5482024550437927, 0.6662379503250122, 0.7842735052108765, 0.9023089408874512, 1.0203444957733154, 1.1383800506591797, 1.2564154863357544, 1.374450922012329, 1.4924864768981934, 1.610521912574768, 1.7285574674606323, 1.846592903137207, 1.9646284580230713, 2.0826640129089355, 2.2006993293762207, 2.318735122680664, 2.4367706775665283, 2.5548062324523926, 2.6728415489196777, 2.790877103805542, 2.9089126586914062, 3.0269482135772705, 3.1449837684631348, 3.26301908493042, 3.381054639816284, 3.4990901947021484, 3.6171255111694336, 3.735161066055298, 3.853196620941162, 3.9712321758270264, 4.089267730712891, 4.207303047180176]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 6.0, 8.0, 7.0, 6.0, 20.0, 21.0, 31.0, 48.0, 65.0, 108.0, 142.0, 261.0, 362.0, 627.0, 957.0, 1638.0, 2683.0, 4564.0, 8143.0, 14169.0, 28514.0, 74780.0, 230198.0, 382101.0, 185078.0, 59811.0, 24305.0, 12428.0, 7027.0, 4070.0, 2420.0, 1473.0, 909.0, 559.0, 372.0, 194.0, 131.0, 96.0, 67.0, 57.0, 22.0, 23.0, 13.0, 15.0, 10.0, 8.0, 6.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0], "bins": [-3.181640625, -3.089141845703125, -2.99664306640625, -2.904144287109375, -2.8116455078125, -2.719146728515625, -2.62664794921875, -2.534149169921875, -2.441650390625, -2.349151611328125, -2.25665283203125, -2.164154052734375, -2.0716552734375, -1.979156494140625, -1.88665771484375, -1.794158935546875, -1.70166015625, -1.609161376953125, -1.51666259765625, -1.424163818359375, -1.3316650390625, -1.239166259765625, -1.14666748046875, -1.054168701171875, -0.961669921875, -0.869171142578125, -0.77667236328125, -0.684173583984375, -0.5916748046875, -0.499176025390625, -0.40667724609375, -0.314178466796875, -0.2216796875, -0.129180908203125, -0.03668212890625, 0.055816650390625, 0.1483154296875, 0.240814208984375, 0.33331298828125, 0.425811767578125, 0.518310546875, 0.610809326171875, 0.70330810546875, 0.795806884765625, 0.8883056640625, 0.980804443359375, 1.07330322265625, 1.165802001953125, 1.25830078125, 1.350799560546875, 1.44329833984375, 1.535797119140625, 1.6282958984375, 1.720794677734375, 1.81329345703125, 1.905792236328125, 1.998291015625, 2.090789794921875, 2.18328857421875, 2.275787353515625, 2.3682861328125, 2.460784912109375, 2.55328369140625, 2.645782470703125, 2.73828125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 1.0, 5.0, 7.0, 7.0, 10.0, 6.0, 15.0, 14.0, 36.0, 36.0, 67.0, 107.0, 112.0, 146.0, 118.0, 88.0, 63.0, 43.0, 30.0, 13.0, 10.0, 14.0, 10.0, 8.0, 3.0, 5.0, 5.0, 0.0, 1.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.450439453125, -0.4327964782714844, -0.41515350341796875, -0.3975105285644531, -0.3798675537109375, -0.3622245788574219, -0.34458160400390625, -0.3269386291503906, -0.309295654296875, -0.2916526794433594, -0.27400970458984375, -0.2563667297363281, -0.2387237548828125, -0.22108078002929688, -0.20343780517578125, -0.18579483032226562, -0.16815185546875, -0.15050888061523438, -0.13286590576171875, -0.11522293090820312, -0.0975799560546875, -0.07993698120117188, -0.06229400634765625, -0.044651031494140625, -0.027008056640625, -0.009365081787109375, 0.00827789306640625, 0.025920867919921875, 0.0435638427734375, 0.061206817626953125, 0.07884979248046875, 0.09649276733398438, 0.1141357421875, 0.13177871704101562, 0.14942169189453125, 0.16706466674804688, 0.1847076416015625, 0.20235061645507812, 0.21999359130859375, 0.23763656616210938, 0.255279541015625, 0.2729225158691406, 0.29056549072265625, 0.3082084655761719, 0.3258514404296875, 0.3434944152832031, 0.36113739013671875, 0.3787803649902344, 0.39642333984375, 0.4140663146972656, 0.43170928955078125, 0.4493522644042969, 0.4669952392578125, 0.4846382141113281, 0.5022811889648438, 0.5199241638183594, 0.537567138671875, 0.5552101135253906, 0.5728530883789062, 0.5904960632324219, 0.6081390380859375, 0.6257820129394531, 0.6434249877929688, 0.6610679626464844, 0.6787109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 7.0, 7.0, 11.0, 7.0, 16.0, 33.0, 48.0, 68.0, 112.0, 205.0, 342.0, 531.0, 1073.0, 1899.0, 3468.0, 7106.0, 15294.0, 36133.0, 88639.0, 205624.0, 309190.0, 213232.0, 95079.0, 38197.0, 16439.0, 7496.0, 3723.0, 1910.0, 1101.0, 646.0, 359.0, 192.0, 120.0, 84.0, 48.0, 35.0, 23.0, 16.0, 12.0, 4.0, 4.0, 7.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.416015625, -2.34173583984375, -2.2674560546875, -2.19317626953125, -2.118896484375, -2.04461669921875, -1.9703369140625, -1.89605712890625, -1.82177734375, -1.74749755859375, -1.6732177734375, -1.59893798828125, -1.524658203125, -1.45037841796875, -1.3760986328125, -1.30181884765625, -1.2275390625, -1.15325927734375, -1.0789794921875, -1.00469970703125, -0.930419921875, -0.85614013671875, -0.7818603515625, -0.70758056640625, -0.63330078125, -0.55902099609375, -0.4847412109375, -0.41046142578125, -0.336181640625, -0.26190185546875, -0.1876220703125, -0.11334228515625, -0.0390625, 0.03521728515625, 0.1094970703125, 0.18377685546875, 0.258056640625, 0.33233642578125, 0.4066162109375, 0.48089599609375, 0.55517578125, 0.62945556640625, 0.7037353515625, 0.77801513671875, 0.852294921875, 0.92657470703125, 1.0008544921875, 1.07513427734375, 1.1494140625, 1.22369384765625, 1.2979736328125, 1.37225341796875, 1.446533203125, 1.52081298828125, 1.5950927734375, 1.66937255859375, 1.74365234375, 1.81793212890625, 1.8922119140625, 1.96649169921875, 2.040771484375, 2.11505126953125, 2.1893310546875, 2.26361083984375, 2.337890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 7.0, 9.0, 11.0, 6.0, 7.0, 10.0, 22.0, 26.0, 21.0, 22.0, 38.0, 39.0, 37.0, 47.0, 41.0, 40.0, 42.0, 41.0, 42.0, 34.0, 36.0, 30.0, 44.0, 43.0, 46.0, 37.0, 35.0, 25.0, 25.0, 22.0, 18.0, 16.0, 14.0, 8.0, 11.0, 8.0, 10.0, 5.0, 3.0, 2.0, 0.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.95703125, -1.8983154296875, -1.839599609375, -1.7808837890625, -1.72216796875, -1.6634521484375, -1.604736328125, -1.5460205078125, -1.4873046875, -1.4285888671875, -1.369873046875, -1.3111572265625, -1.25244140625, -1.1937255859375, -1.135009765625, -1.0762939453125, -1.017578125, -0.9588623046875, -0.900146484375, -0.8414306640625, -0.78271484375, -0.7239990234375, -0.665283203125, -0.6065673828125, -0.5478515625, -0.4891357421875, -0.430419921875, -0.3717041015625, -0.31298828125, -0.2542724609375, -0.195556640625, -0.1368408203125, -0.078125, -0.0194091796875, 0.039306640625, 0.0980224609375, 0.15673828125, 0.2154541015625, 0.274169921875, 0.3328857421875, 0.3916015625, 0.4503173828125, 0.509033203125, 0.5677490234375, 0.62646484375, 0.6851806640625, 0.743896484375, 0.8026123046875, 0.861328125, 0.9200439453125, 0.978759765625, 1.0374755859375, 1.09619140625, 1.1549072265625, 1.213623046875, 1.2723388671875, 1.3310546875, 1.3897705078125, 1.448486328125, 1.5072021484375, 1.56591796875, 1.6246337890625, 1.683349609375, 1.7420654296875, 1.80078125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 8.0, 7.0, 20.0, 13.0, 28.0, 46.0, 68.0, 128.0, 183.0, 307.0, 540.0, 1080.0, 2301.0, 5978.0, 18746.0, 86158.0, 515727.0, 341408.0, 54123.0, 13226.0, 4567.0, 1842.0, 885.0, 497.0, 238.0, 136.0, 100.0, 68.0, 34.0, 24.0, 23.0, 16.0, 8.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.88671875, -7.646728515625, -7.40673828125, -7.166748046875, -6.9267578125, -6.686767578125, -6.44677734375, -6.206787109375, -5.966796875, -5.726806640625, -5.48681640625, -5.246826171875, -5.0068359375, -4.766845703125, -4.52685546875, -4.286865234375, -4.046875, -3.806884765625, -3.56689453125, -3.326904296875, -3.0869140625, -2.846923828125, -2.60693359375, -2.366943359375, -2.126953125, -1.886962890625, -1.64697265625, -1.406982421875, -1.1669921875, -0.927001953125, -0.68701171875, -0.447021484375, -0.20703125, 0.032958984375, 0.27294921875, 0.512939453125, 0.7529296875, 0.992919921875, 1.23291015625, 1.472900390625, 1.712890625, 1.952880859375, 2.19287109375, 2.432861328125, 2.6728515625, 2.912841796875, 3.15283203125, 3.392822265625, 3.6328125, 3.872802734375, 4.11279296875, 4.352783203125, 4.5927734375, 4.832763671875, 5.07275390625, 5.312744140625, 5.552734375, 5.792724609375, 6.03271484375, 6.272705078125, 6.5126953125, 6.752685546875, 6.99267578125, 7.232666015625, 7.47265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 7.0, 7.0, 10.0, 6.0, 11.0, 22.0, 25.0, 44.0, 41.0, 60.0, 82.0, 99.0, 106.0, 104.0, 85.0, 82.0, 51.0, 43.0, 26.0, 20.0, 16.0, 12.0, 8.0, 10.0, 9.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006551742553710938, -0.0006363466382026672, -0.0006175190210342407, -0.0005986914038658142, -0.0005798637866973877, -0.0005610361695289612, -0.0005422085523605347, -0.0005233809351921082, -0.0005045533180236816, -0.0004857257008552551, -0.0004668980836868286, -0.0004480704665184021, -0.0004292428493499756, -0.00041041523218154907, -0.00039158761501312256, -0.00037275999784469604, -0.00035393238067626953, -0.000335104763507843, -0.0003162771463394165, -0.00029744952917099, -0.0002786219120025635, -0.00025979429483413696, -0.00024096667766571045, -0.00022213906049728394, -0.00020331144332885742, -0.0001844838261604309, -0.0001656562089920044, -0.00014682859182357788, -0.00012800097465515137, -0.00010917335748672485, -9.034574031829834e-05, -7.151812314987183e-05, -5.269050598144531e-05, -3.38628888130188e-05, -1.5035271644592285e-05, 3.7923455238342285e-06, 2.2619962692260742e-05, 4.1447579860687256e-05, 6.027519702911377e-05, 7.910281419754028e-05, 9.79304313659668e-05, 0.00011675804853439331, 0.00013558566570281982, 0.00015441328287124634, 0.00017324090003967285, 0.00019206851720809937, 0.00021089613437652588, 0.0002297237515449524, 0.0002485513687133789, 0.0002673789858818054, 0.00028620660305023193, 0.00030503422021865845, 0.00032386183738708496, 0.0003426894545555115, 0.000361517071723938, 0.0003803446888923645, 0.000399172306060791, 0.00041799992322921753, 0.00043682754039764404, 0.00045565515756607056, 0.00047448277473449707, 0.0004933103919029236, 0.0005121380090713501, 0.0005309656262397766, 0.0005497932434082031]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 6.0, 10.0, 12.0, 6.0, 13.0, 14.0, 17.0, 36.0, 30.0, 43.0, 68.0, 128.0, 162.0, 309.0, 463.0, 750.0, 1383.0, 2636.0, 5807.0, 13947.0, 40601.0, 144668.0, 423524.0, 289228.0, 80797.0, 25251.0, 9562.0, 4267.0, 2119.0, 1046.0, 583.0, 364.0, 248.0, 132.0, 115.0, 64.0, 40.0, 25.0, 19.0, 15.0, 12.0, 3.0, 6.0, 6.0, 5.0, 2.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.99609375, -3.85723876953125, -3.7183837890625, -3.57952880859375, -3.440673828125, -3.30181884765625, -3.1629638671875, -3.02410888671875, -2.88525390625, -2.74639892578125, -2.6075439453125, -2.46868896484375, -2.329833984375, -2.19097900390625, -2.0521240234375, -1.91326904296875, -1.7744140625, -1.63555908203125, -1.4967041015625, -1.35784912109375, -1.218994140625, -1.08013916015625, -0.9412841796875, -0.80242919921875, -0.66357421875, -0.52471923828125, -0.3858642578125, -0.24700927734375, -0.108154296875, 0.03070068359375, 0.1695556640625, 0.30841064453125, 0.447265625, 0.58612060546875, 0.7249755859375, 0.86383056640625, 1.002685546875, 1.14154052734375, 1.2803955078125, 1.41925048828125, 1.55810546875, 1.69696044921875, 1.8358154296875, 1.97467041015625, 2.113525390625, 2.25238037109375, 2.3912353515625, 2.53009033203125, 2.6689453125, 2.80780029296875, 2.9466552734375, 3.08551025390625, 3.224365234375, 3.36322021484375, 3.5020751953125, 3.64093017578125, 3.77978515625, 3.91864013671875, 4.0574951171875, 4.19635009765625, 4.335205078125, 4.47406005859375, 4.6129150390625, 4.75177001953125, 4.890625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 8.0, 8.0, 10.0, 7.0, 21.0, 23.0, 40.0, 41.0, 43.0, 67.0, 81.0, 97.0, 84.0, 94.0, 79.0, 70.0, 61.0, 37.0, 31.0, 28.0, 11.0, 15.0, 13.0, 10.0, 5.0, 8.0, 4.0, 1.0, 1.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.755859375, -2.65966796875, -2.5634765625, -2.46728515625, -2.37109375, -2.27490234375, -2.1787109375, -2.08251953125, -1.986328125, -1.89013671875, -1.7939453125, -1.69775390625, -1.6015625, -1.50537109375, -1.4091796875, -1.31298828125, -1.216796875, -1.12060546875, -1.0244140625, -0.92822265625, -0.83203125, -0.73583984375, -0.6396484375, -0.54345703125, -0.447265625, -0.35107421875, -0.2548828125, -0.15869140625, -0.0625, 0.03369140625, 0.1298828125, 0.22607421875, 0.322265625, 0.41845703125, 0.5146484375, 0.61083984375, 0.70703125, 0.80322265625, 0.8994140625, 0.99560546875, 1.091796875, 1.18798828125, 1.2841796875, 1.38037109375, 1.4765625, 1.57275390625, 1.6689453125, 1.76513671875, 1.861328125, 1.95751953125, 2.0537109375, 2.14990234375, 2.24609375, 2.34228515625, 2.4384765625, 2.53466796875, 2.630859375, 2.72705078125, 2.8232421875, 2.91943359375, 3.015625, 3.11181640625, 3.2080078125, 3.30419921875, 3.400390625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 8.0, 22.0, 88.0, 260.0, 376.0, 176.0, 35.0, 16.0, 7.0, 9.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.739253997802734, -53.519935607910156, -51.30061721801758, -49.081298828125, -46.86198425292969, -44.642662048339844, -42.42334747314453, -40.20402908325195, -37.984710693359375, -35.7653923034668, -33.54607391357422, -31.326757431030273, -29.107439041137695, -26.888120651245117, -24.668804168701172, -22.449485778808594, -20.230167388916016, -18.010848999023438, -15.791531562805176, -13.572214126586914, -11.352895736694336, -9.133577346801758, -6.914259910583496, -4.694942474365234, -2.4756240844726562, -0.25630617141723633, 1.9630117416381836, 4.1823296546936035, 6.401647567749023, 8.620965957641602, 10.840283393859863, 13.059600830078125, 15.278915405273438, 17.498233795166016, 19.717552185058594, 21.93686866760254, 24.156187057495117, 26.375505447387695, 28.59482192993164, 30.81414031982422, 33.0334587097168, 35.252777099609375, 37.47209548950195, 39.69141387939453, 41.910728454589844, 44.13005065917969, 46.349365234375, 48.56868362426758, 50.788002014160156, 53.007320404052734, 55.22663879394531, 57.44595718383789, 59.66527557373047, 61.88459014892578, 64.10391235351562, 66.32322692871094, 68.54254150390625, 70.76185607910156, 72.9811782836914, 75.20049285888672, 77.41981506347656, 79.63912963867188, 81.85845184326172, 84.07776641845703, 86.29708862304688]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 8.0, 13.0, 11.0, 19.0, 32.0, 39.0, 71.0, 67.0, 97.0, 117.0, 106.0, 96.0, 96.0, 64.0, 46.0, 39.0, 20.0, 9.0, 7.0, 6.0, 5.0, 11.0, 6.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0], "bins": [-43.785804748535156, -42.836490631103516, -41.887176513671875, -40.937862396240234, -39.988548278808594, -39.03923797607422, -38.08992385864258, -37.14060974121094, -36.1912956237793, -35.241981506347656, -34.292667388916016, -33.343353271484375, -32.394039154052734, -31.444726943969727, -30.495412826538086, -29.546100616455078, -28.596786499023438, -27.647472381591797, -26.698158264160156, -25.74884605407715, -24.799531936645508, -23.850217819213867, -22.900903701782227, -21.95159149169922, -21.002275466918945, -20.052961349487305, -19.103647232055664, -18.154335021972656, -17.205020904541016, -16.255706787109375, -15.306392669677734, -14.35707950592041, -13.407766342163086, -12.458452224731445, -11.509139060974121, -10.55982494354248, -9.610511779785156, -8.661197662353516, -7.711884021759033, -6.762570381164551, -5.813256740570068, -4.863943099975586, -3.9146294593811035, -2.965315580368042, -2.0160019397735596, -1.066688060760498, -0.11737442016601562, 0.8319392204284668, 1.7812528610229492, 2.7305665016174316, 3.679880142211914, 4.629194259643555, 5.578507423400879, 6.5278215408325195, 7.477135181427002, 8.426448822021484, 9.375762939453125, 10.325077056884766, 11.27439022064209, 12.22370433807373, 13.173017501831055, 14.122331619262695, 15.071645736694336, 16.020957946777344, 16.970272064208984]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 6.0, 5.0, 9.0, 10.0, 14.0, 32.0, 57.0, 58.0, 98.0, 128.0, 220.0, 340.0, 491.0, 837.0, 1494.0, 2973.0, 6771.0, 18951.0, 78403.0, 1765073.0, 2205889.0, 79269.0, 19254.0, 6900.0, 3065.0, 1550.0, 853.0, 538.0, 295.0, 197.0, 139.0, 96.0, 72.0, 48.0, 36.0, 27.0, 26.0, 19.0, 10.0, 9.0, 8.0, 8.0, 1.0, 2.0, 5.0], "bins": [-8.65625, -8.434326171875, -8.21240234375, -7.990478515625, -7.7685546875, -7.546630859375, -7.32470703125, -7.102783203125, -6.880859375, -6.658935546875, -6.43701171875, -6.215087890625, -5.9931640625, -5.771240234375, -5.54931640625, -5.327392578125, -5.10546875, -4.883544921875, -4.66162109375, -4.439697265625, -4.2177734375, -3.995849609375, -3.77392578125, -3.552001953125, -3.330078125, -3.108154296875, -2.88623046875, -2.664306640625, -2.4423828125, -2.220458984375, -1.99853515625, -1.776611328125, -1.5546875, -1.332763671875, -1.11083984375, -0.888916015625, -0.6669921875, -0.445068359375, -0.22314453125, -0.001220703125, 0.220703125, 0.442626953125, 0.66455078125, 0.886474609375, 1.1083984375, 1.330322265625, 1.55224609375, 1.774169921875, 1.99609375, 2.218017578125, 2.43994140625, 2.661865234375, 2.8837890625, 3.105712890625, 3.32763671875, 3.549560546875, 3.771484375, 3.993408203125, 4.21533203125, 4.437255859375, 4.6591796875, 4.881103515625, 5.10302734375, 5.324951171875, 5.546875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 3.0, 9.0, 13.0, 10.0, 28.0, 36.0, 49.0, 79.0, 110.0, 147.0, 131.0, 117.0, 72.0, 61.0, 44.0, 29.0, 16.0, 14.0, 7.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5205078125, -0.5006027221679688, -0.4806976318359375, -0.46079254150390625, -0.440887451171875, -0.42098236083984375, -0.4010772705078125, -0.38117218017578125, -0.36126708984375, -0.34136199951171875, -0.3214569091796875, -0.30155181884765625, -0.281646728515625, -0.26174163818359375, -0.2418365478515625, -0.22193145751953125, -0.2020263671875, -0.18212127685546875, -0.1622161865234375, -0.14231109619140625, -0.122406005859375, -0.10250091552734375, -0.0825958251953125, -0.06269073486328125, -0.04278564453125, -0.02288055419921875, -0.0029754638671875, 0.01692962646484375, 0.036834716796875, 0.05673980712890625, 0.0766448974609375, 0.09654998779296875, 0.116455078125, 0.13636016845703125, 0.1562652587890625, 0.17617034912109375, 0.196075439453125, 0.21598052978515625, 0.2358856201171875, 0.25579071044921875, 0.27569580078125, 0.29560089111328125, 0.3155059814453125, 0.33541107177734375, 0.355316162109375, 0.37522125244140625, 0.3951263427734375, 0.41503143310546875, 0.4349365234375, 0.45484161376953125, 0.4747467041015625, 0.49465179443359375, 0.514556884765625, 0.5344619750976562, 0.5543670654296875, 0.5742721557617188, 0.59417724609375, 0.6140823364257812, 0.6339874267578125, 0.6538925170898438, 0.673797607421875, 0.6937026977539062, 0.7136077880859375, 0.7335128784179688, 0.75341796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 12.0, 16.0, 23.0, 32.0, 75.0, 119.0, 206.0, 546.0, 1364.0, 3718.0, 13139.0, 75684.0, 1899039.0, 2103273.0, 77680.0, 13185.0, 3783.0, 1312.0, 556.0, 236.0, 107.0, 62.0, 43.0, 17.0, 11.0, 14.0, 7.0, 0.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76171875, -6.48004150390625, -6.1983642578125, -5.91668701171875, -5.635009765625, -5.35333251953125, -5.0716552734375, -4.78997802734375, -4.50830078125, -4.22662353515625, -3.9449462890625, -3.66326904296875, -3.381591796875, -3.09991455078125, -2.8182373046875, -2.53656005859375, -2.2548828125, -1.97320556640625, -1.6915283203125, -1.40985107421875, -1.128173828125, -0.84649658203125, -0.5648193359375, -0.28314208984375, -0.00146484375, 0.28021240234375, 0.5618896484375, 0.84356689453125, 1.125244140625, 1.40692138671875, 1.6885986328125, 1.97027587890625, 2.251953125, 2.53363037109375, 2.8153076171875, 3.09698486328125, 3.378662109375, 3.66033935546875, 3.9420166015625, 4.22369384765625, 4.50537109375, 4.78704833984375, 5.0687255859375, 5.35040283203125, 5.632080078125, 5.91375732421875, 6.1954345703125, 6.47711181640625, 6.7587890625, 7.04046630859375, 7.3221435546875, 7.60382080078125, 7.885498046875, 8.16717529296875, 8.4488525390625, 8.73052978515625, 9.01220703125, 9.29388427734375, 9.5755615234375, 9.85723876953125, 10.138916015625, 10.42059326171875, 10.7022705078125, 10.98394775390625, 11.265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 7.0, 10.0, 8.0, 8.0, 23.0, 26.0, 29.0, 64.0, 94.0, 135.0, 234.0, 378.0, 752.0, 1150.0, 453.0, 244.0, 154.0, 89.0, 59.0, 38.0, 30.0, 24.0, 12.0, 12.0, 8.0, 6.0, 9.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.99267578125, -0.9636459350585938, -0.9346160888671875, -0.9055862426757812, -0.876556396484375, -0.8475265502929688, -0.8184967041015625, -0.7894668579101562, -0.76043701171875, -0.7314071655273438, -0.7023773193359375, -0.6733474731445312, -0.644317626953125, -0.6152877807617188, -0.5862579345703125, -0.5572280883789062, -0.5281982421875, -0.49916839599609375, -0.4701385498046875, -0.44110870361328125, -0.412078857421875, -0.38304901123046875, -0.3540191650390625, -0.32498931884765625, -0.29595947265625, -0.26692962646484375, -0.2378997802734375, -0.20886993408203125, -0.179840087890625, -0.15081024169921875, -0.1217803955078125, -0.09275054931640625, -0.063720703125, -0.03469085693359375, -0.0056610107421875, 0.02336883544921875, 0.052398681640625, 0.08142852783203125, 0.1104583740234375, 0.13948822021484375, 0.16851806640625, 0.19754791259765625, 0.2265777587890625, 0.25560760498046875, 0.284637451171875, 0.31366729736328125, 0.3426971435546875, 0.37172698974609375, 0.4007568359375, 0.42978668212890625, 0.4588165283203125, 0.48784637451171875, 0.516876220703125, 0.5459060668945312, 0.5749359130859375, 0.6039657592773438, 0.63299560546875, 0.6620254516601562, 0.6910552978515625, 0.7200851440429688, 0.749114990234375, 0.7781448364257812, 0.8071746826171875, 0.8362045288085938, 0.865234375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 8.0, 18.0, 20.0, 40.0, 59.0, 95.0, 108.0, 142.0, 138.0, 117.0, 90.0, 66.0, 38.0, 16.0, 13.0, 9.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.022495269775391, -4.814618110656738, -4.606740951538086, -4.398864269256592, -4.1909871101379395, -3.983109951019287, -3.775233030319214, -3.5673561096191406, -3.3594789505004883, -3.151601791381836, -2.9437248706817627, -2.7358479499816895, -2.527970790863037, -2.3200936317443848, -2.1122167110443115, -1.9043396711349487, -1.696462631225586, -1.4885855913162231, -1.2807085514068604, -1.0728315114974976, -0.8649544715881348, -0.657077431678772, -0.4492003917694092, -0.2413233518600464, -0.033446311950683594, 0.1744307279586792, 0.382307767868042, 0.5901848077774048, 0.7980618476867676, 1.0059388875961304, 1.2138159275054932, 1.421692967414856, 1.6295700073242188, 1.8374470472335815, 2.0453240871429443, 2.2532010078430176, 2.46107816696167, 2.6689553260803223, 2.8768322467803955, 3.0847091674804688, 3.292586326599121, 3.5004634857177734, 3.7083404064178467, 3.91621732711792, 4.124094486236572, 4.331971645355225, 4.539848327636719, 4.747725486755371, 4.955602645874023, 5.163479804992676, 5.371356964111328, 5.579233646392822, 5.787110805511475, 5.994987964630127, 6.202864646911621, 6.410741806030273, 6.618618965148926, 6.826496124267578, 7.0343732833862305, 7.242249965667725, 7.450127124786377, 7.658004283905029, 7.865880966186523, 8.073758125305176, 8.281635284423828]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 4.0, 10.0, 8.0, 14.0, 16.0, 17.0, 26.0, 34.0, 42.0, 44.0, 42.0, 67.0, 64.0, 56.0, 57.0, 72.0, 55.0, 66.0, 63.0, 51.0, 35.0, 29.0, 24.0, 24.0, 20.0, 22.0, 20.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4046130180358887, -3.275851249694824, -3.147089719772339, -3.0183279514312744, -2.889566421508789, -2.7608046531677246, -2.63204288482666, -2.5032811164855957, -2.3745195865631104, -2.245757818222046, -2.1169962882995605, -1.988234519958496, -1.8594728708267212, -1.7307112216949463, -1.6019494533538818, -1.473187804222107, -1.344426155090332, -1.2156645059585571, -1.0869028568267822, -0.9581410884857178, -0.8293794393539429, -0.700617790222168, -0.5718560814857483, -0.4430943727493286, -0.3143327236175537, -0.18557104468345642, -0.05680936574935913, 0.07195231318473816, 0.20071399211883545, 0.32947564125061035, 0.45823734998703003, 0.5869990587234497, 0.7157602310180664, 0.8445218801498413, 0.973283588886261, 1.1020452976226807, 1.2308069467544556, 1.3595685958862305, 1.488330364227295, 1.6170920133590698, 1.7458536624908447, 1.8746153116226196, 2.0033769607543945, 2.132138729095459, 2.2609004974365234, 2.389662027359009, 2.5184237957000732, 2.6471853256225586, 2.775947093963623, 2.9047088623046875, 3.033470392227173, 3.1622321605682373, 3.2909936904907227, 3.419755458831787, 3.5485172271728516, 3.677278995513916, 3.8060405254364014, 3.934802293777466, 4.063563823699951, 4.192325592041016, 4.32108736038208, 4.4498491287231445, 4.578610420227051, 4.707372188568115, 4.83613395690918]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 4.0, 2.0, 1.0, 9.0, 12.0, 22.0, 29.0, 43.0, 63.0, 127.0, 177.0, 302.0, 511.0, 959.0, 2130.0, 4792.0, 12888.0, 42771.0, 172346.0, 474206.0, 248350.0, 60478.0, 17023.0, 6205.0, 2434.0, 1205.0, 607.0, 311.0, 187.0, 106.0, 69.0, 61.0, 32.0, 41.0, 14.0, 9.0, 7.0, 8.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3203125, -4.17926025390625, -4.0382080078125, -3.89715576171875, -3.756103515625, -3.61505126953125, -3.4739990234375, -3.33294677734375, -3.19189453125, -3.05084228515625, -2.9097900390625, -2.76873779296875, -2.627685546875, -2.48663330078125, -2.3455810546875, -2.20452880859375, -2.0634765625, -1.92242431640625, -1.7813720703125, -1.64031982421875, -1.499267578125, -1.35821533203125, -1.2171630859375, -1.07611083984375, -0.93505859375, -0.79400634765625, -0.6529541015625, -0.51190185546875, -0.370849609375, -0.22979736328125, -0.0887451171875, 0.05230712890625, 0.193359375, 0.33441162109375, 0.4754638671875, 0.61651611328125, 0.757568359375, 0.89862060546875, 1.0396728515625, 1.18072509765625, 1.32177734375, 1.46282958984375, 1.6038818359375, 1.74493408203125, 1.885986328125, 2.02703857421875, 2.1680908203125, 2.30914306640625, 2.4501953125, 2.59124755859375, 2.7322998046875, 2.87335205078125, 3.014404296875, 3.15545654296875, 3.2965087890625, 3.43756103515625, 3.57861328125, 3.71966552734375, 3.8607177734375, 4.00177001953125, 4.142822265625, 4.28387451171875, 4.4249267578125, 4.56597900390625, 4.70703125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 9.0, 7.0, 8.0, 12.0, 13.0, 41.0, 48.0, 70.0, 79.0, 119.0, 147.0, 131.0, 82.0, 75.0, 57.0, 41.0, 13.0, 17.0, 14.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.59814453125, -0.5779037475585938, -0.5576629638671875, -0.5374221801757812, -0.517181396484375, -0.49694061279296875, -0.4766998291015625, -0.45645904541015625, -0.43621826171875, -0.41597747802734375, -0.3957366943359375, -0.37549591064453125, -0.355255126953125, -0.33501434326171875, -0.3147735595703125, -0.29453277587890625, -0.2742919921875, -0.25405120849609375, -0.2338104248046875, -0.21356964111328125, -0.193328857421875, -0.17308807373046875, -0.1528472900390625, -0.13260650634765625, -0.11236572265625, -0.09212493896484375, -0.0718841552734375, -0.05164337158203125, -0.031402587890625, -0.01116180419921875, 0.0090789794921875, 0.02931976318359375, 0.049560546875, 0.06980133056640625, 0.0900421142578125, 0.11028289794921875, 0.130523681640625, 0.15076446533203125, 0.1710052490234375, 0.19124603271484375, 0.21148681640625, 0.23172760009765625, 0.2519683837890625, 0.27220916748046875, 0.292449951171875, 0.31269073486328125, 0.3329315185546875, 0.35317230224609375, 0.3734130859375, 0.39365386962890625, 0.4138946533203125, 0.43413543701171875, 0.454376220703125, 0.47461700439453125, 0.4948577880859375, 0.5150985717773438, 0.53533935546875, 0.5555801391601562, 0.5758209228515625, 0.5960617065429688, 0.616302490234375, 0.6365432739257812, 0.6567840576171875, 0.6770248413085938, 0.697265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 6.0, 4.0, 3.0, 11.0, 6.0, 18.0, 27.0, 49.0, 64.0, 94.0, 140.0, 229.0, 386.0, 650.0, 1229.0, 2613.0, 7392.0, 28403.0, 131023.0, 431361.0, 334860.0, 81943.0, 18426.0, 5136.0, 1993.0, 1001.0, 579.0, 329.0, 209.0, 113.0, 79.0, 67.0, 36.0, 15.0, 22.0, 11.0, 12.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.04296875, -4.89398193359375, -4.7449951171875, -4.59600830078125, -4.447021484375, -4.29803466796875, -4.1490478515625, -4.00006103515625, -3.85107421875, -3.70208740234375, -3.5531005859375, -3.40411376953125, -3.255126953125, -3.10614013671875, -2.9571533203125, -2.80816650390625, -2.6591796875, -2.51019287109375, -2.3612060546875, -2.21221923828125, -2.063232421875, -1.91424560546875, -1.7652587890625, -1.61627197265625, -1.46728515625, -1.31829833984375, -1.1693115234375, -1.02032470703125, -0.871337890625, -0.72235107421875, -0.5733642578125, -0.42437744140625, -0.275390625, -0.12640380859375, 0.0225830078125, 0.17156982421875, 0.320556640625, 0.46954345703125, 0.6185302734375, 0.76751708984375, 0.91650390625, 1.06549072265625, 1.2144775390625, 1.36346435546875, 1.512451171875, 1.66143798828125, 1.8104248046875, 1.95941162109375, 2.1083984375, 2.25738525390625, 2.4063720703125, 2.55535888671875, 2.704345703125, 2.85333251953125, 3.0023193359375, 3.15130615234375, 3.30029296875, 3.44927978515625, 3.5982666015625, 3.74725341796875, 3.896240234375, 4.04522705078125, 4.1942138671875, 4.34320068359375, 4.4921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 7.0, 3.0, 3.0, 2.0, 6.0, 8.0, 10.0, 20.0, 12.0, 16.0, 16.0, 23.0, 17.0, 34.0, 40.0, 39.0, 45.0, 45.0, 37.0, 48.0, 40.0, 59.0, 54.0, 43.0, 57.0, 47.0, 39.0, 36.0, 34.0, 26.0, 27.0, 26.0, 15.0, 18.0, 7.0, 12.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.443359375, -2.369293212890625, -2.29522705078125, -2.221160888671875, -2.1470947265625, -2.073028564453125, -1.99896240234375, -1.924896240234375, -1.850830078125, -1.776763916015625, -1.70269775390625, -1.628631591796875, -1.5545654296875, -1.480499267578125, -1.40643310546875, -1.332366943359375, -1.25830078125, -1.184234619140625, -1.11016845703125, -1.036102294921875, -0.9620361328125, -0.887969970703125, -0.81390380859375, -0.739837646484375, -0.665771484375, -0.591705322265625, -0.51763916015625, -0.443572998046875, -0.3695068359375, -0.295440673828125, -0.22137451171875, -0.147308349609375, -0.0732421875, 0.000823974609375, 0.07489013671875, 0.148956298828125, 0.2230224609375, 0.297088623046875, 0.37115478515625, 0.445220947265625, 0.519287109375, 0.593353271484375, 0.66741943359375, 0.741485595703125, 0.8155517578125, 0.889617919921875, 0.96368408203125, 1.037750244140625, 1.11181640625, 1.185882568359375, 1.25994873046875, 1.334014892578125, 1.4080810546875, 1.482147216796875, 1.55621337890625, 1.630279541015625, 1.704345703125, 1.778411865234375, 1.85247802734375, 1.926544189453125, 2.0006103515625, 2.074676513671875, 2.14874267578125, 2.222808837890625, 2.296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 7.0, 15.0, 11.0, 10.0, 16.0, 41.0, 53.0, 86.0, 129.0, 243.0, 481.0, 1118.0, 3003.0, 10156.0, 42635.0, 233769.0, 529503.0, 180877.0, 33552.0, 8163.0, 2646.0, 982.0, 438.0, 255.0, 123.0, 72.0, 46.0, 38.0, 25.0, 19.0, 14.0, 13.0, 4.0, 4.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.65625, -3.531982421875, -3.40771484375, -3.283447265625, -3.1591796875, -3.034912109375, -2.91064453125, -2.786376953125, -2.662109375, -2.537841796875, -2.41357421875, -2.289306640625, -2.1650390625, -2.040771484375, -1.91650390625, -1.792236328125, -1.66796875, -1.543701171875, -1.41943359375, -1.295166015625, -1.1708984375, -1.046630859375, -0.92236328125, -0.798095703125, -0.673828125, -0.549560546875, -0.42529296875, -0.301025390625, -0.1767578125, -0.052490234375, 0.07177734375, 0.196044921875, 0.3203125, 0.444580078125, 0.56884765625, 0.693115234375, 0.8173828125, 0.941650390625, 1.06591796875, 1.190185546875, 1.314453125, 1.438720703125, 1.56298828125, 1.687255859375, 1.8115234375, 1.935791015625, 2.06005859375, 2.184326171875, 2.30859375, 2.432861328125, 2.55712890625, 2.681396484375, 2.8056640625, 2.929931640625, 3.05419921875, 3.178466796875, 3.302734375, 3.427001953125, 3.55126953125, 3.675537109375, 3.7998046875, 3.924072265625, 4.04833984375, 4.172607421875, 4.296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 8.0, 7.0, 15.0, 6.0, 16.0, 12.0, 23.0, 22.0, 38.0, 47.0, 41.0, 53.0, 58.0, 73.0, 71.0, 71.0, 59.0, 57.0, 51.0, 53.0, 34.0, 29.0, 40.0, 25.0, 23.0, 13.0, 11.0, 8.0, 9.0, 8.0, 5.0, 5.0, 4.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003960132598876953, -0.0003850683569908142, -0.0003741234540939331, -0.000363178551197052, -0.0003522336483001709, -0.0003412887454032898, -0.0003303438425064087, -0.0003193989396095276, -0.0003084540367126465, -0.0002975091338157654, -0.0002865642309188843, -0.0002756193280220032, -0.00026467442512512207, -0.00025372952222824097, -0.00024278461933135986, -0.00023183971643447876, -0.00022089481353759766, -0.00020994991064071655, -0.00019900500774383545, -0.00018806010484695435, -0.00017711520195007324, -0.00016617029905319214, -0.00015522539615631104, -0.00014428049325942993, -0.00013333559036254883, -0.00012239068746566772, -0.00011144578456878662, -0.00010050088167190552, -8.955597877502441e-05, -7.861107587814331e-05, -6.766617298126221e-05, -5.6721270084381104e-05, -4.57763671875e-05, -3.4831464290618896e-05, -2.3886561393737793e-05, -1.294165849685669e-05, -1.996755599975586e-06, 8.948147296905518e-06, 1.989305019378662e-05, 3.0837953090667725e-05, 4.178285598754883e-05, 5.272775888442993e-05, 6.367266178131104e-05, 7.461756467819214e-05, 8.556246757507324e-05, 9.650737047195435e-05, 0.00010745227336883545, 0.00011839717626571655, 0.00012934207916259766, 0.00014028698205947876, 0.00015123188495635986, 0.00016217678785324097, 0.00017312169075012207, 0.00018406659364700317, 0.00019501149654388428, 0.00020595639944076538, 0.00021690130233764648, 0.0002278462052345276, 0.0002387911081314087, 0.0002497360110282898, 0.0002606809139251709, 0.000271625816822052, 0.0002825707197189331, 0.0002935156226158142, 0.0003044605255126953]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 3.0, 1.0, 4.0, 8.0, 9.0, 9.0, 10.0, 35.0, 21.0, 37.0, 61.0, 81.0, 105.0, 165.0, 263.0, 548.0, 908.0, 1908.0, 4197.0, 11761.0, 40483.0, 190755.0, 541845.0, 193889.0, 41281.0, 11875.0, 4139.0, 1883.0, 915.0, 525.0, 266.0, 183.0, 124.0, 73.0, 48.0, 25.0, 28.0, 18.0, 17.0, 13.0, 10.0, 7.0, 5.0, 3.0, 6.0, 3.0, 1.0, 3.0, 0.0, 5.0, 0.0, 0.0, 2.0], "bins": [-4.61328125, -4.4755859375, -4.337890625, -4.2001953125, -4.0625, -3.9248046875, -3.787109375, -3.6494140625, -3.51171875, -3.3740234375, -3.236328125, -3.0986328125, -2.9609375, -2.8232421875, -2.685546875, -2.5478515625, -2.41015625, -2.2724609375, -2.134765625, -1.9970703125, -1.859375, -1.7216796875, -1.583984375, -1.4462890625, -1.30859375, -1.1708984375, -1.033203125, -0.8955078125, -0.7578125, -0.6201171875, -0.482421875, -0.3447265625, -0.20703125, -0.0693359375, 0.068359375, 0.2060546875, 0.34375, 0.4814453125, 0.619140625, 0.7568359375, 0.89453125, 1.0322265625, 1.169921875, 1.3076171875, 1.4453125, 1.5830078125, 1.720703125, 1.8583984375, 1.99609375, 2.1337890625, 2.271484375, 2.4091796875, 2.546875, 2.6845703125, 2.822265625, 2.9599609375, 3.09765625, 3.2353515625, 3.373046875, 3.5107421875, 3.6484375, 3.7861328125, 3.923828125, 4.0615234375, 4.19921875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 7.0, 5.0, 6.0, 16.0, 16.0, 21.0, 21.0, 42.0, 43.0, 85.0, 70.0, 93.0, 106.0, 102.0, 90.0, 63.0, 56.0, 29.0, 22.0, 20.0, 22.0, 12.0, 7.0, 11.0, 6.0, 9.0, 2.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.681640625, -2.60400390625, -2.5263671875, -2.44873046875, -2.37109375, -2.29345703125, -2.2158203125, -2.13818359375, -2.060546875, -1.98291015625, -1.9052734375, -1.82763671875, -1.75, -1.67236328125, -1.5947265625, -1.51708984375, -1.439453125, -1.36181640625, -1.2841796875, -1.20654296875, -1.12890625, -1.05126953125, -0.9736328125, -0.89599609375, -0.818359375, -0.74072265625, -0.6630859375, -0.58544921875, -0.5078125, -0.43017578125, -0.3525390625, -0.27490234375, -0.197265625, -0.11962890625, -0.0419921875, 0.03564453125, 0.11328125, 0.19091796875, 0.2685546875, 0.34619140625, 0.423828125, 0.50146484375, 0.5791015625, 0.65673828125, 0.734375, 0.81201171875, 0.8896484375, 0.96728515625, 1.044921875, 1.12255859375, 1.2001953125, 1.27783203125, 1.35546875, 1.43310546875, 1.5107421875, 1.58837890625, 1.666015625, 1.74365234375, 1.8212890625, 1.89892578125, 1.9765625, 2.05419921875, 2.1318359375, 2.20947265625, 2.287109375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 12.0, 36.0, 123.0, 308.0, 331.0, 136.0, 34.0, 7.0, 9.0, 6.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-113.63965606689453, -111.45718383789062, -109.27471160888672, -107.09223937988281, -104.9097671508789, -102.727294921875, -100.5448226928711, -98.36235046386719, -96.17987823486328, -93.99740600585938, -91.81493377685547, -89.63246154785156, -87.44998931884766, -85.26751708984375, -83.08504486083984, -80.90257263183594, -78.72010040283203, -76.53762817382812, -74.35515594482422, -72.17268371582031, -69.9902114868164, -67.8077392578125, -65.6252670288086, -63.44279479980469, -61.26032257080078, -59.077850341796875, -56.89537811279297, -54.71290588378906, -52.530433654785156, -50.34796142578125, -48.165489196777344, -45.98301696777344, -43.8005485534668, -41.61807632446289, -39.435604095458984, -37.25313186645508, -35.07065963745117, -32.888187408447266, -30.70571517944336, -28.523242950439453, -26.340770721435547, -24.15829849243164, -21.975826263427734, -19.793354034423828, -17.610881805419922, -15.428409576416016, -13.24593734741211, -11.063465118408203, -8.880992889404297, -6.698520660400391, -4.516048431396484, -2.333576202392578, -0.15110397338867188, 2.0313682556152344, 4.213840484619141, 6.396312713623047, 8.578784942626953, 10.76125717163086, 12.943729400634766, 15.126201629638672, 17.308673858642578, 19.491146087646484, 21.67361831665039, 23.856090545654297, 26.038562774658203]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 7.0, 17.0, 18.0, 12.0, 22.0, 20.0, 36.0, 40.0, 30.0, 41.0, 44.0, 58.0, 64.0, 60.0, 57.0, 60.0, 50.0, 44.0, 48.0, 30.0, 43.0, 31.0, 37.0, 34.0, 28.0, 15.0, 11.0, 9.0, 7.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-24.343381881713867, -23.67071533203125, -22.998048782348633, -22.325382232666016, -21.65271759033203, -20.980051040649414, -20.307384490966797, -19.63471794128418, -18.962051391601562, -18.289384841918945, -17.616718292236328, -16.944053649902344, -16.271387100219727, -15.59872055053711, -14.926054000854492, -14.253387451171875, -13.580721855163574, -12.908055305480957, -12.235389709472656, -11.562723159790039, -10.890056610107422, -10.217390060424805, -9.544724464416504, -8.872057914733887, -8.199392318725586, -7.526726245880127, -6.85405969619751, -6.181393623352051, -5.508727073669434, -4.836061000823975, -4.163394927978516, -3.4907283782958984, -2.8180618286132812, -2.145395517349243, -1.4727293252944946, -0.8000631332397461, -0.127396821975708, 0.5452694892883301, 1.217935562133789, 1.8906021118164062, 2.5632681846618652, 3.2359344959259033, 3.9086008071899414, 4.5812668800354, 5.253932952880859, 5.926599502563477, 6.5992655754089355, 7.271932125091553, 7.944598197937012, 8.617264747619629, 9.28993034362793, 9.962596893310547, 10.635263442993164, 11.307929992675781, 11.980595588684082, 12.6532621383667, 13.325927734375, 13.998594284057617, 14.671259880065918, 15.343926429748535, 16.016592025756836, 16.689258575439453, 17.36192512512207, 18.034591674804688, 18.707258224487305]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 5.0, 3.0, 8.0, 6.0, 20.0, 29.0, 48.0, 89.0, 222.0, 457.0, 1743.0, 17456.0, 4063082.0, 106302.0, 3579.0, 680.0, 287.0, 112.0, 56.0, 43.0, 20.0, 10.0, 12.0, 4.0, 2.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.890625, -16.30224609375, -15.7138671875, -15.12548828125, -14.537109375, -13.94873046875, -13.3603515625, -12.77197265625, -12.18359375, -11.59521484375, -11.0068359375, -10.41845703125, -9.830078125, -9.24169921875, -8.6533203125, -8.06494140625, -7.4765625, -6.88818359375, -6.2998046875, -5.71142578125, -5.123046875, -4.53466796875, -3.9462890625, -3.35791015625, -2.76953125, -2.18115234375, -1.5927734375, -1.00439453125, -0.416015625, 0.17236328125, 0.7607421875, 1.34912109375, 1.9375, 2.52587890625, 3.1142578125, 3.70263671875, 4.291015625, 4.87939453125, 5.4677734375, 6.05615234375, 6.64453125, 7.23291015625, 7.8212890625, 8.40966796875, 8.998046875, 9.58642578125, 10.1748046875, 10.76318359375, 11.3515625, 11.93994140625, 12.5283203125, 13.11669921875, 13.705078125, 14.29345703125, 14.8818359375, 15.47021484375, 16.05859375, 16.64697265625, 17.2353515625, 17.82373046875, 18.412109375, 19.00048828125, 19.5888671875, 20.17724609375, 20.765625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 10.0, 11.0, 18.0, 20.0, 44.0, 65.0, 85.0, 88.0, 119.0, 135.0, 100.0, 94.0, 60.0, 49.0, 33.0, 22.0, 14.0, 8.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78271484375, -0.7558975219726562, -0.7290802001953125, -0.7022628784179688, -0.675445556640625, -0.6486282348632812, -0.6218109130859375, -0.5949935913085938, -0.56817626953125, -0.5413589477539062, -0.5145416259765625, -0.48772430419921875, -0.460906982421875, -0.43408966064453125, -0.4072723388671875, -0.38045501708984375, -0.3536376953125, -0.32682037353515625, -0.3000030517578125, -0.27318572998046875, -0.246368408203125, -0.21955108642578125, -0.1927337646484375, -0.16591644287109375, -0.13909912109375, -0.11228179931640625, -0.0854644775390625, -0.05864715576171875, -0.031829833984375, -0.00501251220703125, 0.0218048095703125, 0.04862213134765625, 0.075439453125, 0.10225677490234375, 0.1290740966796875, 0.15589141845703125, 0.182708740234375, 0.20952606201171875, 0.2363433837890625, 0.26316070556640625, 0.28997802734375, 0.31679534912109375, 0.3436126708984375, 0.37042999267578125, 0.397247314453125, 0.42406463623046875, 0.4508819580078125, 0.47769927978515625, 0.5045166015625, 0.5313339233398438, 0.5581512451171875, 0.5849685668945312, 0.611785888671875, 0.6386032104492188, 0.6654205322265625, 0.6922378540039062, 0.71905517578125, 0.7458724975585938, 0.7726898193359375, 0.7995071411132812, 0.826324462890625, 0.8531417846679688, 0.8799591064453125, 0.9067764282226562, 0.93359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 6.0, 6.0, 5.0, 7.0, 14.0, 18.0, 19.0, 35.0, 54.0, 60.0, 126.0, 180.0, 356.0, 842.0, 2066.0, 6044.0, 22846.0, 113108.0, 1163155.0, 2666950.0, 173899.0, 31995.0, 7991.0, 2552.0, 917.0, 430.0, 195.0, 155.0, 86.0, 35.0, 38.0, 13.0, 25.0, 11.0, 6.0, 9.0, 9.0, 4.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8125, -5.64697265625, -5.4814453125, -5.31591796875, -5.150390625, -4.98486328125, -4.8193359375, -4.65380859375, -4.48828125, -4.32275390625, -4.1572265625, -3.99169921875, -3.826171875, -3.66064453125, -3.4951171875, -3.32958984375, -3.1640625, -2.99853515625, -2.8330078125, -2.66748046875, -2.501953125, -2.33642578125, -2.1708984375, -2.00537109375, -1.83984375, -1.67431640625, -1.5087890625, -1.34326171875, -1.177734375, -1.01220703125, -0.8466796875, -0.68115234375, -0.515625, -0.35009765625, -0.1845703125, -0.01904296875, 0.146484375, 0.31201171875, 0.4775390625, 0.64306640625, 0.80859375, 0.97412109375, 1.1396484375, 1.30517578125, 1.470703125, 1.63623046875, 1.8017578125, 1.96728515625, 2.1328125, 2.29833984375, 2.4638671875, 2.62939453125, 2.794921875, 2.96044921875, 3.1259765625, 3.29150390625, 3.45703125, 3.62255859375, 3.7880859375, 3.95361328125, 4.119140625, 4.28466796875, 4.4501953125, 4.61572265625, 4.78125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 2.0, 9.0, 6.0, 11.0, 21.0, 27.0, 44.0, 63.0, 105.0, 116.0, 253.0, 414.0, 1051.0, 914.0, 384.0, 228.0, 138.0, 87.0, 57.0, 41.0, 19.0, 19.0, 13.0, 9.0, 8.0, 6.0, 5.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2236328125, -1.1913909912109375, -1.159149169921875, -1.1269073486328125, -1.09466552734375, -1.0624237060546875, -1.030181884765625, -0.9979400634765625, -0.9656982421875, -0.9334564208984375, -0.901214599609375, -0.8689727783203125, -0.83673095703125, -0.8044891357421875, -0.772247314453125, -0.7400054931640625, -0.707763671875, -0.6755218505859375, -0.643280029296875, -0.6110382080078125, -0.57879638671875, -0.5465545654296875, -0.514312744140625, -0.4820709228515625, -0.4498291015625, -0.4175872802734375, -0.385345458984375, -0.3531036376953125, -0.32086181640625, -0.2886199951171875, -0.256378173828125, -0.2241363525390625, -0.19189453125, -0.1596527099609375, -0.127410888671875, -0.0951690673828125, -0.06292724609375, -0.0306854248046875, 0.001556396484375, 0.0337982177734375, 0.0660400390625, 0.0982818603515625, 0.130523681640625, 0.1627655029296875, 0.19500732421875, 0.2272491455078125, 0.259490966796875, 0.2917327880859375, 0.323974609375, 0.3562164306640625, 0.388458251953125, 0.4207000732421875, 0.45294189453125, 0.4851837158203125, 0.517425537109375, 0.5496673583984375, 0.5819091796875, 0.6141510009765625, 0.646392822265625, 0.6786346435546875, 0.71087646484375, 0.7431182861328125, 0.775360107421875, 0.8076019287109375, 0.83984375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 9.0, 21.0, 37.0, 82.0, 182.0, 226.0, 217.0, 117.0, 67.0, 19.0, 16.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.13654327392578, -15.759696006774902, -15.38284969329834, -15.006002426147461, -14.629156112670898, -14.25230884552002, -13.87546157836914, -13.498615264892578, -13.121768951416016, -12.744921684265137, -12.368075370788574, -11.991228103637695, -11.614381790161133, -11.237534523010254, -10.860687255859375, -10.483840942382812, -10.106993675231934, -9.730146408081055, -9.353300094604492, -8.976452827453613, -8.59960651397705, -8.222759246826172, -7.845912456512451, -7.4690656661987305, -7.09221887588501, -6.715372085571289, -6.338525295257568, -5.961678504943848, -5.584831237792969, -5.207984924316406, -4.831137657165527, -4.454290866851807, -4.077445030212402, -3.7005982398986816, -3.323751449584961, -2.946904420852661, -2.5700576305389404, -2.1932108402252197, -1.81636381149292, -1.4395170211791992, -1.0626702308654785, -0.685823380947113, -0.30897653102874756, 0.0678703784942627, 0.4447171688079834, 0.8215639591217041, 1.198410987854004, 1.5752577781677246, 1.9521045684814453, 2.328951358795166, 2.7057981491088867, 3.0826451778411865, 3.4594919681549072, 3.836338758468628, 4.213185787200928, 4.590032577514648, 4.966879367828369, 5.34372615814209, 5.7205729484558105, 6.097419738769531, 6.47426700592041, 6.851113319396973, 7.227960586547852, 7.604807376861572, 7.981654167175293]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 4.0, 6.0, 10.0, 10.0, 5.0, 10.0, 10.0, 14.0, 14.0, 25.0, 16.0, 28.0, 28.0, 22.0, 37.0, 37.0, 34.0, 40.0, 41.0, 44.0, 44.0, 41.0, 38.0, 46.0, 32.0, 40.0, 43.0, 28.0, 31.0, 23.0, 25.0, 28.0, 25.0, 19.0, 13.0, 17.0, 17.0, 10.0, 10.0, 4.0, 6.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.8845438957214355, -2.7907845973968506, -2.6970255374908447, -2.6032662391662598, -2.509506940841675, -2.415747880935669, -2.321988582611084, -2.228229522705078, -2.134470224380493, -2.040710926055908, -1.9469517469406128, -1.8531925678253174, -1.759433388710022, -1.6656742095947266, -1.5719149112701416, -1.4781557321548462, -1.3843964338302612, -1.2906372547149658, -1.1968779563903809, -1.1031187772750854, -1.00935959815979, -0.9156003594398499, -0.8218411207199097, -0.7280819416046143, -0.6343227028846741, -0.5405634641647339, -0.4468042850494385, -0.3530450463294983, -0.2592858374118805, -0.1655266284942627, -0.07176738977432251, 0.0219917893409729, 0.11575102806091309, 0.20951023697853088, 0.3032694458961487, 0.39702868461608887, 0.49078789353370667, 0.5845471024513245, 0.6783063411712646, 0.7720655202865601, 0.8658247590065002, 0.9595839977264404, 1.0533431768417358, 1.1471023559570312, 1.2408616542816162, 1.3346208333969116, 1.428380012512207, 1.522139310836792, 1.6158984899520874, 1.7096576690673828, 1.8034169673919678, 1.8971761465072632, 1.9909353256225586, 2.0846946239471436, 2.1784539222717285, 2.2722129821777344, 2.3659722805023193, 2.4597315788269043, 2.55349063873291, 2.647249937057495, 2.74100923538208, 2.834768295288086, 2.928527593612671, 3.022286891937256, 3.1160459518432617]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 13.0, 14.0, 14.0, 16.0, 26.0, 42.0, 49.0, 73.0, 107.0, 192.0, 275.0, 566.0, 1049.0, 2064.0, 4890.0, 14163.0, 53712.0, 210509.0, 427717.0, 242146.0, 64047.0, 16520.0, 5533.0, 2206.0, 1100.0, 599.0, 336.0, 206.0, 105.0, 74.0, 51.0, 37.0, 23.0, 10.0, 18.0, 8.0, 5.0, 7.0, 2.0, 3.0, 5.0, 3.0, 2.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-4.3671875, -4.237060546875, -4.10693359375, -3.976806640625, -3.8466796875, -3.716552734375, -3.58642578125, -3.456298828125, -3.326171875, -3.196044921875, -3.06591796875, -2.935791015625, -2.8056640625, -2.675537109375, -2.54541015625, -2.415283203125, -2.28515625, -2.155029296875, -2.02490234375, -1.894775390625, -1.7646484375, -1.634521484375, -1.50439453125, -1.374267578125, -1.244140625, -1.114013671875, -0.98388671875, -0.853759765625, -0.7236328125, -0.593505859375, -0.46337890625, -0.333251953125, -0.203125, -0.072998046875, 0.05712890625, 0.187255859375, 0.3173828125, 0.447509765625, 0.57763671875, 0.707763671875, 0.837890625, 0.968017578125, 1.09814453125, 1.228271484375, 1.3583984375, 1.488525390625, 1.61865234375, 1.748779296875, 1.87890625, 2.009033203125, 2.13916015625, 2.269287109375, 2.3994140625, 2.529541015625, 2.65966796875, 2.789794921875, 2.919921875, 3.050048828125, 3.18017578125, 3.310302734375, 3.4404296875, 3.570556640625, 3.70068359375, 3.830810546875, 3.9609375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 9.0, 21.0, 23.0, 36.0, 57.0, 66.0, 89.0, 95.0, 113.0, 131.0, 98.0, 79.0, 59.0, 46.0, 18.0, 14.0, 8.0, 13.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.83544921875, -0.8090972900390625, -0.782745361328125, -0.7563934326171875, -0.73004150390625, -0.7036895751953125, -0.677337646484375, -0.6509857177734375, -0.6246337890625, -0.5982818603515625, -0.571929931640625, -0.5455780029296875, -0.51922607421875, -0.4928741455078125, -0.466522216796875, -0.4401702880859375, -0.413818359375, -0.3874664306640625, -0.361114501953125, -0.3347625732421875, -0.30841064453125, -0.2820587158203125, -0.255706787109375, -0.2293548583984375, -0.2030029296875, -0.1766510009765625, -0.150299072265625, -0.1239471435546875, -0.09759521484375, -0.0712432861328125, -0.044891357421875, -0.0185394287109375, 0.0078125, 0.0341644287109375, 0.060516357421875, 0.0868682861328125, 0.11322021484375, 0.1395721435546875, 0.165924072265625, 0.1922760009765625, 0.2186279296875, 0.2449798583984375, 0.271331787109375, 0.2976837158203125, 0.32403564453125, 0.3503875732421875, 0.376739501953125, 0.4030914306640625, 0.429443359375, 0.4557952880859375, 0.482147216796875, 0.5084991455078125, 0.53485107421875, 0.5612030029296875, 0.587554931640625, 0.6139068603515625, 0.6402587890625, 0.6666107177734375, 0.692962646484375, 0.7193145751953125, 0.74566650390625, 0.7720184326171875, 0.798370361328125, 0.8247222900390625, 0.85107421875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 10.0, 12.0, 9.0, 17.0, 22.0, 29.0, 43.0, 55.0, 69.0, 124.0, 134.0, 211.0, 302.0, 407.0, 598.0, 1023.0, 2010.0, 4667.0, 13209.0, 46909.0, 160592.0, 354835.0, 302755.0, 111890.0, 31253.0, 9402.0, 3554.0, 1688.0, 934.0, 513.0, 328.0, 265.0, 205.0, 125.0, 98.0, 69.0, 55.0, 42.0, 20.0, 22.0, 17.0, 9.0, 4.0, 6.0, 1.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.876953125, -3.7589111328125, -3.640869140625, -3.5228271484375, -3.40478515625, -3.2867431640625, -3.168701171875, -3.0506591796875, -2.9326171875, -2.8145751953125, -2.696533203125, -2.5784912109375, -2.46044921875, -2.3424072265625, -2.224365234375, -2.1063232421875, -1.98828125, -1.8702392578125, -1.752197265625, -1.6341552734375, -1.51611328125, -1.3980712890625, -1.280029296875, -1.1619873046875, -1.0439453125, -0.9259033203125, -0.807861328125, -0.6898193359375, -0.57177734375, -0.4537353515625, -0.335693359375, -0.2176513671875, -0.099609375, 0.0184326171875, 0.136474609375, 0.2545166015625, 0.37255859375, 0.4906005859375, 0.608642578125, 0.7266845703125, 0.8447265625, 0.9627685546875, 1.080810546875, 1.1988525390625, 1.31689453125, 1.4349365234375, 1.552978515625, 1.6710205078125, 1.7890625, 1.9071044921875, 2.025146484375, 2.1431884765625, 2.26123046875, 2.3792724609375, 2.497314453125, 2.6153564453125, 2.7333984375, 2.8514404296875, 2.969482421875, 3.0875244140625, 3.20556640625, 3.3236083984375, 3.441650390625, 3.5596923828125, 3.677734375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 0.0, 9.0, 9.0, 7.0, 6.0, 14.0, 14.0, 19.0, 17.0, 17.0, 23.0, 36.0, 44.0, 33.0, 45.0, 38.0, 39.0, 43.0, 54.0, 53.0, 43.0, 60.0, 38.0, 46.0, 28.0, 27.0, 31.0, 36.0, 30.0, 26.0, 18.0, 21.0, 13.0, 16.0, 12.0, 11.0, 7.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.880859375, -2.78985595703125, -2.6988525390625, -2.60784912109375, -2.516845703125, -2.42584228515625, -2.3348388671875, -2.24383544921875, -2.15283203125, -2.06182861328125, -1.9708251953125, -1.87982177734375, -1.788818359375, -1.69781494140625, -1.6068115234375, -1.51580810546875, -1.4248046875, -1.33380126953125, -1.2427978515625, -1.15179443359375, -1.060791015625, -0.96978759765625, -0.8787841796875, -0.78778076171875, -0.69677734375, -0.60577392578125, -0.5147705078125, -0.42376708984375, -0.332763671875, -0.24176025390625, -0.1507568359375, -0.05975341796875, 0.03125, 0.12225341796875, 0.2132568359375, 0.30426025390625, 0.395263671875, 0.48626708984375, 0.5772705078125, 0.66827392578125, 0.75927734375, 0.85028076171875, 0.9412841796875, 1.03228759765625, 1.123291015625, 1.21429443359375, 1.3052978515625, 1.39630126953125, 1.4873046875, 1.57830810546875, 1.6693115234375, 1.76031494140625, 1.851318359375, 1.94232177734375, 2.0333251953125, 2.12432861328125, 2.21533203125, 2.30633544921875, 2.3973388671875, 2.48834228515625, 2.579345703125, 2.67034912109375, 2.7613525390625, 2.85235595703125, 2.943359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 4.0, 6.0, 14.0, 17.0, 25.0, 48.0, 60.0, 99.0, 218.0, 362.0, 699.0, 1536.0, 3834.0, 10565.0, 36716.0, 133366.0, 350371.0, 337706.0, 123062.0, 33514.0, 9882.0, 3558.0, 1414.0, 675.0, 345.0, 158.0, 96.0, 74.0, 39.0, 31.0, 17.0, 10.0, 11.0, 3.0, 8.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5234375, -2.453277587890625, -2.38311767578125, -2.312957763671875, -2.2427978515625, -2.172637939453125, -2.10247802734375, -2.032318115234375, -1.962158203125, -1.891998291015625, -1.82183837890625, -1.751678466796875, -1.6815185546875, -1.611358642578125, -1.54119873046875, -1.471038818359375, -1.40087890625, -1.330718994140625, -1.26055908203125, -1.190399169921875, -1.1202392578125, -1.050079345703125, -0.97991943359375, -0.909759521484375, -0.839599609375, -0.769439697265625, -0.69927978515625, -0.629119873046875, -0.5589599609375, -0.488800048828125, -0.41864013671875, -0.348480224609375, -0.2783203125, -0.208160400390625, -0.13800048828125, -0.067840576171875, 0.0023193359375, 0.072479248046875, 0.14263916015625, 0.212799072265625, 0.282958984375, 0.353118896484375, 0.42327880859375, 0.493438720703125, 0.5635986328125, 0.633758544921875, 0.70391845703125, 0.774078369140625, 0.84423828125, 0.914398193359375, 0.98455810546875, 1.054718017578125, 1.1248779296875, 1.195037841796875, 1.26519775390625, 1.335357666015625, 1.405517578125, 1.475677490234375, 1.54583740234375, 1.615997314453125, 1.6861572265625, 1.756317138671875, 1.82647705078125, 1.896636962890625, 1.966796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 8.0, 17.0, 9.0, 20.0, 17.0, 21.0, 17.0, 24.0, 31.0, 33.0, 36.0, 52.0, 41.0, 51.0, 61.0, 60.0, 55.0, 45.0, 52.0, 44.0, 46.0, 49.0, 33.0, 33.0, 29.0, 27.0, 15.0, 11.0, 18.0, 10.0, 7.0, 4.0, 3.0, 7.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025177001953125, -0.00024315714836120605, -0.0002345442771911621, -0.00022593140602111816, -0.00021731853485107422, -0.00020870566368103027, -0.00020009279251098633, -0.00019147992134094238, -0.00018286705017089844, -0.0001742541790008545, -0.00016564130783081055, -0.0001570284366607666, -0.00014841556549072266, -0.0001398026943206787, -0.00013118982315063477, -0.00012257695198059082, -0.00011396408081054688, -0.00010535120964050293, -9.673833847045898e-05, -8.812546730041504e-05, -7.95125961303711e-05, -7.089972496032715e-05, -6.22868537902832e-05, -5.367398262023926e-05, -4.506111145019531e-05, -3.644824028015137e-05, -2.7835369110107422e-05, -1.9222497940063477e-05, -1.0609626770019531e-05, -1.996755599975586e-06, 6.616115570068359e-06, 1.5228986740112305e-05, 2.384185791015625e-05, 3.2454729080200195e-05, 4.106760025024414e-05, 4.9680471420288086e-05, 5.829334259033203e-05, 6.690621376037598e-05, 7.551908493041992e-05, 8.413195610046387e-05, 9.274482727050781e-05, 0.00010135769844055176, 0.0001099705696105957, 0.00011858344078063965, 0.0001271963119506836, 0.00013580918312072754, 0.00014442205429077148, 0.00015303492546081543, 0.00016164779663085938, 0.00017026066780090332, 0.00017887353897094727, 0.0001874864101409912, 0.00019609928131103516, 0.0002047121524810791, 0.00021332502365112305, 0.000221937894821167, 0.00023055076599121094, 0.00023916363716125488, 0.00024777650833129883, 0.0002563893795013428, 0.0002650022506713867, 0.00027361512184143066, 0.0002822279930114746, 0.00029084086418151855, 0.0002994537353515625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 12.0, 11.0, 22.0, 15.0, 32.0, 50.0, 61.0, 88.0, 116.0, 167.0, 329.0, 559.0, 928.0, 2010.0, 4923.0, 15362.0, 58283.0, 253832.0, 487904.0, 167170.0, 38748.0, 10593.0, 3758.0, 1511.0, 832.0, 446.0, 246.0, 174.0, 94.0, 82.0, 60.0, 47.0, 31.0, 19.0, 9.0, 5.0, 7.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.689453125, -2.600860595703125, -2.51226806640625, -2.423675537109375, -2.3350830078125, -2.246490478515625, -2.15789794921875, -2.069305419921875, -1.980712890625, -1.892120361328125, -1.80352783203125, -1.714935302734375, -1.6263427734375, -1.537750244140625, -1.44915771484375, -1.360565185546875, -1.27197265625, -1.183380126953125, -1.09478759765625, -1.006195068359375, -0.9176025390625, -0.829010009765625, -0.74041748046875, -0.651824951171875, -0.563232421875, -0.474639892578125, -0.38604736328125, -0.297454833984375, -0.2088623046875, -0.120269775390625, -0.03167724609375, 0.056915283203125, 0.1455078125, 0.234100341796875, 0.32269287109375, 0.411285400390625, 0.4998779296875, 0.588470458984375, 0.67706298828125, 0.765655517578125, 0.854248046875, 0.942840576171875, 1.03143310546875, 1.120025634765625, 1.2086181640625, 1.297210693359375, 1.38580322265625, 1.474395751953125, 1.56298828125, 1.651580810546875, 1.74017333984375, 1.828765869140625, 1.9173583984375, 2.005950927734375, 2.09454345703125, 2.183135986328125, 2.271728515625, 2.360321044921875, 2.44891357421875, 2.537506103515625, 2.6260986328125, 2.714691162109375, 2.80328369140625, 2.891876220703125, 2.98046875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 6.0, 4.0, 9.0, 11.0, 16.0, 21.0, 16.0, 24.0, 35.0, 42.0, 50.0, 59.0, 60.0, 79.0, 70.0, 73.0, 61.0, 51.0, 57.0, 54.0, 43.0, 35.0, 20.0, 20.0, 18.0, 15.0, 13.0, 8.0, 10.0, 5.0, 1.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3330078125, -1.2889251708984375, -1.244842529296875, -1.2007598876953125, -1.15667724609375, -1.1125946044921875, -1.068511962890625, -1.0244293212890625, -0.9803466796875, -0.9362640380859375, -0.892181396484375, -0.8480987548828125, -0.80401611328125, -0.7599334716796875, -0.715850830078125, -0.6717681884765625, -0.627685546875, -0.5836029052734375, -0.539520263671875, -0.4954376220703125, -0.45135498046875, -0.4072723388671875, -0.363189697265625, -0.3191070556640625, -0.2750244140625, -0.2309417724609375, -0.186859130859375, -0.1427764892578125, -0.09869384765625, -0.0546112060546875, -0.010528564453125, 0.0335540771484375, 0.07763671875, 0.1217193603515625, 0.165802001953125, 0.2098846435546875, 0.25396728515625, 0.2980499267578125, 0.342132568359375, 0.3862152099609375, 0.4302978515625, 0.4743804931640625, 0.518463134765625, 0.5625457763671875, 0.60662841796875, 0.6507110595703125, 0.694793701171875, 0.7388763427734375, 0.782958984375, 0.8270416259765625, 0.871124267578125, 0.9152069091796875, 0.95928955078125, 1.0033721923828125, 1.047454833984375, 1.0915374755859375, 1.1356201171875, 1.1797027587890625, 1.223785400390625, 1.2678680419921875, 1.31195068359375, 1.3560333251953125, 1.400115966796875, 1.4441986083984375, 1.48828125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 11.0, 36.0, 119.0, 291.0, 319.0, 168.0, 41.0, 12.0, 5.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.31590270996094, -101.12723541259766, -98.93856811523438, -96.7499008178711, -94.56123352050781, -92.37256622314453, -90.18389892578125, -87.9952392578125, -85.80656433105469, -83.6178970336914, -81.42922973632812, -79.24056243896484, -77.05189514160156, -74.86322784423828, -72.674560546875, -70.48590087890625, -68.29723358154297, -66.10856628417969, -63.919898986816406, -61.731231689453125, -59.542564392089844, -57.35389709472656, -55.16523361206055, -52.976566314697266, -50.787899017333984, -48.5992317199707, -46.41056442260742, -44.22189712524414, -42.033233642578125, -39.844566345214844, -37.65589904785156, -35.46723175048828, -33.27857208251953, -31.08990478515625, -28.90123748779297, -26.71257209777832, -24.52390480041504, -22.335237503051758, -20.14657211303711, -17.957904815673828, -15.769237518310547, -13.580570220947266, -11.3919038772583, -9.203237533569336, -7.014570236206055, -4.825902938842773, -2.6372365951538086, -0.44857025146484375, 1.7400970458984375, 3.9287638664245605, 6.117430686950684, 8.306097030639648, 10.49476432800293, 12.683431625366211, 14.872097969055176, 17.06076431274414, 19.249431610107422, 21.438098907470703, 23.626766204833984, 25.815431594848633, 28.004098892211914, 30.192766189575195, 32.381431579589844, 34.570098876953125, 36.758766174316406]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 0.0, 6.0, 5.0, 7.0, 8.0, 7.0, 9.0, 19.0, 16.0, 26.0, 16.0, 26.0, 19.0, 31.0, 28.0, 44.0, 33.0, 29.0, 35.0, 44.0, 38.0, 48.0, 59.0, 39.0, 36.0, 47.0, 35.0, 56.0, 29.0, 36.0, 32.0, 30.0, 13.0, 21.0, 19.0, 12.0, 12.0, 10.0, 5.0, 5.0, 5.0, 6.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.819198608398438, -16.242019653320312, -15.664841651916504, -15.087662696838379, -14.51048469543457, -13.933305740356445, -13.35612678527832, -12.778947830200195, -12.201769828796387, -11.624590873718262, -11.047412872314453, -10.470233917236328, -9.893054962158203, -9.315876960754395, -8.73869800567627, -8.161520004272461, -7.584341049194336, -7.007162570953369, -6.429984092712402, -5.852805137634277, -5.2756266593933105, -4.698448181152344, -4.121269226074219, -3.544090747833252, -2.966912269592285, -2.3897337913513184, -1.8125550746917725, -1.2353764772415161, -0.6581978797912598, -0.08101940155029297, 0.49615931510925293, 1.0733380317687988, 1.6505146026611328, 2.2276930809020996, 2.8048717975616455, 3.3820505142211914, 3.959228992462158, 4.536407470703125, 5.11358642578125, 5.690764904022217, 6.267943382263184, 6.84512186050415, 7.422300338745117, 7.999479293823242, 8.576658248901367, 9.153836250305176, 9.7310152053833, 10.30819320678711, 10.885372161865234, 11.46255111694336, 12.039729118347168, 12.616908073425293, 13.194086074829102, 13.771265029907227, 14.348443984985352, 14.925622940063477, 15.502800941467285, 16.079978942871094, 16.65715789794922, 17.234336853027344, 17.81151580810547, 18.388694763183594, 18.965871810913086, 19.54305076599121, 20.120229721069336]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 3.0, 13.0, 11.0, 14.0, 13.0, 27.0, 46.0, 61.0, 125.0, 183.0, 289.0, 554.0, 1106.0, 2864.0, 10552.0, 69562.0, 3351280.0, 707782.0, 38629.0, 7001.0, 2195.0, 913.0, 420.0, 228.0, 145.0, 84.0, 52.0, 28.0, 22.0, 18.0, 16.0, 8.0, 6.0, 5.0, 2.0, 5.0, 2.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-6.43359375, -6.25421142578125, -6.0748291015625, -5.89544677734375, -5.716064453125, -5.53668212890625, -5.3572998046875, -5.17791748046875, -4.99853515625, -4.81915283203125, -4.6397705078125, -4.46038818359375, -4.281005859375, -4.10162353515625, -3.9222412109375, -3.74285888671875, -3.5634765625, -3.38409423828125, -3.2047119140625, -3.02532958984375, -2.845947265625, -2.66656494140625, -2.4871826171875, -2.30780029296875, -2.12841796875, -1.94903564453125, -1.7696533203125, -1.59027099609375, -1.410888671875, -1.23150634765625, -1.0521240234375, -0.87274169921875, -0.693359375, -0.51397705078125, -0.3345947265625, -0.15521240234375, 0.024169921875, 0.20355224609375, 0.3829345703125, 0.56231689453125, 0.74169921875, 0.92108154296875, 1.1004638671875, 1.27984619140625, 1.459228515625, 1.63861083984375, 1.8179931640625, 1.99737548828125, 2.1767578125, 2.35614013671875, 2.5355224609375, 2.71490478515625, 2.894287109375, 3.07366943359375, 3.2530517578125, 3.43243408203125, 3.61181640625, 3.79119873046875, 3.9705810546875, 4.14996337890625, 4.329345703125, 4.50872802734375, 4.6881103515625, 4.86749267578125, 5.046875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 7.0, 3.0, 7.0, 11.0, 18.0, 29.0, 21.0, 39.0, 57.0, 51.0, 65.0, 99.0, 98.0, 107.0, 76.0, 70.0, 63.0, 56.0, 33.0, 29.0, 13.0, 22.0, 5.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.88232421875, -0.8545913696289062, -0.8268585205078125, -0.7991256713867188, -0.771392822265625, -0.7436599731445312, -0.7159271240234375, -0.6881942749023438, -0.66046142578125, -0.6327285766601562, -0.6049957275390625, -0.5772628784179688, -0.549530029296875, -0.5217971801757812, -0.4940643310546875, -0.46633148193359375, -0.4385986328125, -0.41086578369140625, -0.3831329345703125, -0.35540008544921875, -0.327667236328125, -0.29993438720703125, -0.2722015380859375, -0.24446868896484375, -0.21673583984375, -0.18900299072265625, -0.1612701416015625, -0.13353729248046875, -0.105804443359375, -0.07807159423828125, -0.0503387451171875, -0.02260589599609375, 0.005126953125, 0.03285980224609375, 0.0605926513671875, 0.08832550048828125, 0.116058349609375, 0.14379119873046875, 0.1715240478515625, 0.19925689697265625, 0.22698974609375, 0.25472259521484375, 0.2824554443359375, 0.31018829345703125, 0.337921142578125, 0.36565399169921875, 0.3933868408203125, 0.42111968994140625, 0.4488525390625, 0.47658538818359375, 0.5043182373046875, 0.5320510864257812, 0.559783935546875, 0.5875167846679688, 0.6152496337890625, 0.6429824829101562, 0.67071533203125, 0.6984481811523438, 0.7261810302734375, 0.7539138793945312, 0.781646728515625, 0.8093795776367188, 0.8371124267578125, 0.8648452758789062, 0.892578125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 10.0, 16.0, 37.0, 65.0, 95.0, 228.0, 390.0, 872.0, 2214.0, 7303.0, 32871.0, 232535.0, 3269246.0, 570322.0, 61381.0, 11605.0, 3097.0, 1043.0, 457.0, 230.0, 99.0, 69.0, 38.0, 21.0, 12.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.06903076171875, -3.9271240234375, -3.78521728515625, -3.643310546875, -3.50140380859375, -3.3594970703125, -3.21759033203125, -3.07568359375, -2.93377685546875, -2.7918701171875, -2.64996337890625, -2.508056640625, -2.36614990234375, -2.2242431640625, -2.08233642578125, -1.9404296875, -1.79852294921875, -1.6566162109375, -1.51470947265625, -1.372802734375, -1.23089599609375, -1.0889892578125, -0.94708251953125, -0.80517578125, -0.66326904296875, -0.5213623046875, -0.37945556640625, -0.237548828125, -0.09564208984375, 0.0462646484375, 0.18817138671875, 0.330078125, 0.47198486328125, 0.6138916015625, 0.75579833984375, 0.897705078125, 1.03961181640625, 1.1815185546875, 1.32342529296875, 1.46533203125, 1.60723876953125, 1.7491455078125, 1.89105224609375, 2.032958984375, 2.17486572265625, 2.3167724609375, 2.45867919921875, 2.6005859375, 2.74249267578125, 2.8843994140625, 3.02630615234375, 3.168212890625, 3.31011962890625, 3.4520263671875, 3.59393310546875, 3.73583984375, 3.87774658203125, 4.0196533203125, 4.16156005859375, 4.303466796875, 4.44537353515625, 4.5872802734375, 4.72918701171875, 4.87109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 1.0, 6.0, 11.0, 9.0, 8.0, 26.0, 26.0, 33.0, 40.0, 78.0, 74.0, 161.0, 247.0, 353.0, 928.0, 922.0, 380.0, 234.0, 158.0, 105.0, 72.0, 54.0, 35.0, 26.0, 21.0, 11.0, 15.0, 12.0, 9.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.955078125, -0.9285507202148438, -0.9020233154296875, -0.8754959106445312, -0.848968505859375, -0.8224411010742188, -0.7959136962890625, -0.7693862915039062, -0.74285888671875, -0.7163314819335938, -0.6898040771484375, -0.6632766723632812, -0.636749267578125, -0.6102218627929688, -0.5836944580078125, -0.5571670532226562, -0.5306396484375, -0.5041122436523438, -0.4775848388671875, -0.45105743408203125, -0.424530029296875, -0.39800262451171875, -0.3714752197265625, -0.34494781494140625, -0.31842041015625, -0.29189300537109375, -0.2653656005859375, -0.23883819580078125, -0.212310791015625, -0.18578338623046875, -0.1592559814453125, -0.13272857666015625, -0.106201171875, -0.07967376708984375, -0.0531463623046875, -0.02661895751953125, -9.1552734375e-05, 0.02643585205078125, 0.0529632568359375, 0.07949066162109375, 0.10601806640625, 0.13254547119140625, 0.1590728759765625, 0.18560028076171875, 0.212127685546875, 0.23865509033203125, 0.2651824951171875, 0.29170989990234375, 0.3182373046875, 0.34476470947265625, 0.3712921142578125, 0.39781951904296875, 0.424346923828125, 0.45087432861328125, 0.4774017333984375, 0.5039291381835938, 0.53045654296875, 0.5569839477539062, 0.5835113525390625, 0.6100387573242188, 0.636566162109375, 0.6630935668945312, 0.6896209716796875, 0.7161483764648438, 0.74267578125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 29.0, 28.0, 62.0, 123.0, 188.0, 185.0, 155.0, 114.0, 46.0, 32.0, 11.0, 13.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.376837730407715, -13.099570274353027, -12.822301864624023, -12.545034408569336, -12.267765998840332, -11.990498542785645, -11.71323013305664, -11.435962677001953, -11.158695220947266, -10.881427764892578, -10.604159355163574, -10.326891899108887, -10.049623489379883, -9.772356033325195, -9.495088577270508, -9.217820167541504, -8.9405517578125, -8.663284301757812, -8.386015892028809, -8.108748435974121, -7.831480503082275, -7.55421257019043, -7.276944637298584, -6.999676704406738, -6.722409248352051, -6.445141315460205, -6.167873382568359, -5.890605926513672, -5.613337993621826, -5.3360700607299805, -5.058802127838135, -4.781534194946289, -4.50426721572876, -4.226999282836914, -3.9497315883636475, -3.6724636554718018, -3.395195960998535, -3.1179280281066895, -2.8406600952148438, -2.563392162322998, -2.2861244678497314, -2.0088565349578857, -1.7315888404846191, -1.4543209075927734, -1.1770530939102173, -0.8997852802276611, -0.6225173473358154, -0.3452495336532593, -0.06798171997070312, 0.20928612351417542, 0.48655396699905396, 0.7638218402862549, 1.041089653968811, 1.3183574676513672, 1.595625400543213, 1.872893214225769, 2.150161027908325, 2.427428960800171, 2.7046966552734375, 2.981964588165283, 3.259232521057129, 3.5365002155303955, 3.813768148422241, 4.091035842895508, 4.3683037757873535]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 8.0, 7.0, 5.0, 6.0, 10.0, 6.0, 11.0, 12.0, 24.0, 21.0, 20.0, 24.0, 27.0, 41.0, 33.0, 33.0, 28.0, 38.0, 55.0, 34.0, 39.0, 47.0, 43.0, 36.0, 37.0, 36.0, 36.0, 45.0, 35.0, 31.0, 31.0, 25.0, 22.0, 25.0, 16.0, 10.0, 11.0, 7.0, 8.0, 3.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9113199710845947, -2.8132874965667725, -2.7152552604675293, -2.617222785949707, -2.519190549850464, -2.4211580753326416, -2.3231258392333984, -2.225093364715576, -2.127060890197754, -2.0290284156799316, -1.9309961795806885, -1.8329637050628662, -1.734931468963623, -1.6368989944458008, -1.538866639137268, -1.4408342838287354, -1.3428020477294922, -1.2447696924209595, -1.1467373371124268, -1.0487048625946045, -0.9506725668907166, -0.8526402115821838, -0.7546077966690063, -0.6565754413604736, -0.5585430860519409, -0.4605107307434082, -0.3624783456325531, -0.264445960521698, -0.16641360521316528, -0.06838124990463257, 0.029651165008544922, 0.12768352031707764, 0.22571587562561035, 0.32374823093414307, 0.42178061604499817, 0.5198130011558533, 0.617845356464386, 0.7158777117729187, 0.8139101266860962, 0.9119424819946289, 1.0099748373031616, 1.1080071926116943, 1.206039547920227, 1.3040719032287598, 1.402104377746582, 1.5001366138458252, 1.5981690883636475, 1.6962014436721802, 1.794233798980713, 1.8922661542892456, 1.9902985095977783, 2.0883309841156006, 2.1863632202148438, 2.284395694732666, 2.3824281692504883, 2.4804604053497314, 2.5784926414489746, 2.676525115966797, 2.77455735206604, 2.8725898265838623, 2.9706220626831055, 3.0686545372009277, 3.16668701171875, 3.264719247817993, 3.3627517223358154]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 5.0, 11.0, 19.0, 25.0, 28.0, 41.0, 63.0, 67.0, 120.0, 184.0, 235.0, 378.0, 552.0, 921.0, 1662.0, 2925.0, 5876.0, 12549.0, 27912.0, 63713.0, 135833.0, 236466.0, 254879.0, 161478.0, 77644.0, 34486.0, 15009.0, 7159.0, 3340.0, 1848.0, 1048.0, 687.0, 455.0, 295.0, 185.0, 137.0, 96.0, 53.0, 39.0, 41.0, 32.0, 24.0, 14.0, 4.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.123046875, -2.054840087890625, -1.98663330078125, -1.918426513671875, -1.8502197265625, -1.782012939453125, -1.71380615234375, -1.645599365234375, -1.577392578125, -1.509185791015625, -1.44097900390625, -1.372772216796875, -1.3045654296875, -1.236358642578125, -1.16815185546875, -1.099945068359375, -1.03173828125, -0.963531494140625, -0.89532470703125, -0.827117919921875, -0.7589111328125, -0.690704345703125, -0.62249755859375, -0.554290771484375, -0.486083984375, -0.417877197265625, -0.34967041015625, -0.281463623046875, -0.2132568359375, -0.145050048828125, -0.07684326171875, -0.008636474609375, 0.0595703125, 0.127777099609375, 0.19598388671875, 0.264190673828125, 0.3323974609375, 0.400604248046875, 0.46881103515625, 0.537017822265625, 0.605224609375, 0.673431396484375, 0.74163818359375, 0.809844970703125, 0.8780517578125, 0.946258544921875, 1.01446533203125, 1.082672119140625, 1.15087890625, 1.219085693359375, 1.28729248046875, 1.355499267578125, 1.4237060546875, 1.491912841796875, 1.56011962890625, 1.628326416015625, 1.696533203125, 1.764739990234375, 1.83294677734375, 1.901153564453125, 1.9693603515625, 2.037567138671875, 2.10577392578125, 2.173980712890625, 2.2421875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 12.0, 14.0, 17.0, 35.0, 37.0, 49.0, 57.0, 79.0, 96.0, 97.0, 84.0, 93.0, 75.0, 50.0, 50.0, 44.0, 33.0, 16.0, 12.0, 13.0, 9.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.92236328125, -0.8943099975585938, -0.8662567138671875, -0.8382034301757812, -0.810150146484375, -0.7820968627929688, -0.7540435791015625, -0.7259902954101562, -0.69793701171875, -0.6698837280273438, -0.6418304443359375, -0.6137771606445312, -0.585723876953125, -0.5576705932617188, -0.5296173095703125, -0.5015640258789062, -0.4735107421875, -0.44545745849609375, -0.4174041748046875, -0.38935089111328125, -0.361297607421875, -0.33324432373046875, -0.3051910400390625, -0.27713775634765625, -0.24908447265625, -0.22103118896484375, -0.1929779052734375, -0.16492462158203125, -0.136871337890625, -0.10881805419921875, -0.0807647705078125, -0.05271148681640625, -0.024658203125, 0.00339508056640625, 0.0314483642578125, 0.05950164794921875, 0.087554931640625, 0.11560821533203125, 0.1436614990234375, 0.17171478271484375, 0.19976806640625, 0.22782135009765625, 0.2558746337890625, 0.28392791748046875, 0.311981201171875, 0.34003448486328125, 0.3680877685546875, 0.39614105224609375, 0.4241943359375, 0.45224761962890625, 0.4803009033203125, 0.5083541870117188, 0.536407470703125, 0.5644607543945312, 0.5925140380859375, 0.6205673217773438, 0.64862060546875, 0.6766738891601562, 0.7047271728515625, 0.7327804565429688, 0.760833740234375, 0.7888870239257812, 0.8169403076171875, 0.8449935913085938, 0.873046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 7.0, 12.0, 12.0, 14.0, 29.0, 35.0, 47.0, 67.0, 76.0, 96.0, 166.0, 201.0, 293.0, 457.0, 801.0, 1432.0, 3127.0, 8904.0, 32207.0, 125165.0, 341849.0, 350397.0, 132068.0, 34526.0, 9495.0, 3214.0, 1382.0, 763.0, 488.0, 353.0, 234.0, 166.0, 140.0, 89.0, 65.0, 47.0, 44.0, 21.0, 20.0, 15.0, 18.0, 4.0, 8.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.564453125, -3.459686279296875, -3.35491943359375, -3.250152587890625, -3.1453857421875, -3.040618896484375, -2.93585205078125, -2.831085205078125, -2.726318359375, -2.621551513671875, -2.51678466796875, -2.412017822265625, -2.3072509765625, -2.202484130859375, -2.09771728515625, -1.992950439453125, -1.88818359375, -1.783416748046875, -1.67864990234375, -1.573883056640625, -1.4691162109375, -1.364349365234375, -1.25958251953125, -1.154815673828125, -1.050048828125, -0.945281982421875, -0.84051513671875, -0.735748291015625, -0.6309814453125, -0.526214599609375, -0.42144775390625, -0.316680908203125, -0.2119140625, -0.107147216796875, -0.00238037109375, 0.102386474609375, 0.2071533203125, 0.311920166015625, 0.41668701171875, 0.521453857421875, 0.626220703125, 0.730987548828125, 0.83575439453125, 0.940521240234375, 1.0452880859375, 1.150054931640625, 1.25482177734375, 1.359588623046875, 1.46435546875, 1.569122314453125, 1.67388916015625, 1.778656005859375, 1.8834228515625, 1.988189697265625, 2.09295654296875, 2.197723388671875, 2.302490234375, 2.407257080078125, 2.51202392578125, 2.616790771484375, 2.7215576171875, 2.826324462890625, 2.93109130859375, 3.035858154296875, 3.140625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 7.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 12.0, 3.0, 6.0, 7.0, 11.0, 18.0, 13.0, 18.0, 20.0, 24.0, 24.0, 26.0, 30.0, 35.0, 39.0, 34.0, 45.0, 35.0, 48.0, 41.0, 43.0, 33.0, 36.0, 35.0, 37.0, 35.0, 38.0, 29.0, 31.0, 22.0, 21.0, 18.0, 7.0, 16.0, 15.0, 13.0, 16.0, 12.0, 7.0, 4.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0], "bins": [-2.64453125, -2.5634765625, -2.482421875, -2.4013671875, -2.3203125, -2.2392578125, -2.158203125, -2.0771484375, -1.99609375, -1.9150390625, -1.833984375, -1.7529296875, -1.671875, -1.5908203125, -1.509765625, -1.4287109375, -1.34765625, -1.2666015625, -1.185546875, -1.1044921875, -1.0234375, -0.9423828125, -0.861328125, -0.7802734375, -0.69921875, -0.6181640625, -0.537109375, -0.4560546875, -0.375, -0.2939453125, -0.212890625, -0.1318359375, -0.05078125, 0.0302734375, 0.111328125, 0.1923828125, 0.2734375, 0.3544921875, 0.435546875, 0.5166015625, 0.59765625, 0.6787109375, 0.759765625, 0.8408203125, 0.921875, 1.0029296875, 1.083984375, 1.1650390625, 1.24609375, 1.3271484375, 1.408203125, 1.4892578125, 1.5703125, 1.6513671875, 1.732421875, 1.8134765625, 1.89453125, 1.9755859375, 2.056640625, 2.1376953125, 2.21875, 2.2998046875, 2.380859375, 2.4619140625, 2.54296875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 6.0, 5.0, 3.0, 11.0, 18.0, 19.0, 34.0, 35.0, 99.0, 194.0, 417.0, 1162.0, 4526.0, 33025.0, 494257.0, 476607.0, 31666.0, 4457.0, 1180.0, 442.0, 174.0, 74.0, 48.0, 30.0, 19.0, 14.0, 4.0, 6.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.19140625, -4.074951171875, -3.95849609375, -3.842041015625, -3.7255859375, -3.609130859375, -3.49267578125, -3.376220703125, -3.259765625, -3.143310546875, -3.02685546875, -2.910400390625, -2.7939453125, -2.677490234375, -2.56103515625, -2.444580078125, -2.328125, -2.211669921875, -2.09521484375, -1.978759765625, -1.8623046875, -1.745849609375, -1.62939453125, -1.512939453125, -1.396484375, -1.280029296875, -1.16357421875, -1.047119140625, -0.9306640625, -0.814208984375, -0.69775390625, -0.581298828125, -0.46484375, -0.348388671875, -0.23193359375, -0.115478515625, 0.0009765625, 0.117431640625, 0.23388671875, 0.350341796875, 0.466796875, 0.583251953125, 0.69970703125, 0.816162109375, 0.9326171875, 1.049072265625, 1.16552734375, 1.281982421875, 1.3984375, 1.514892578125, 1.63134765625, 1.747802734375, 1.8642578125, 1.980712890625, 2.09716796875, 2.213623046875, 2.330078125, 2.446533203125, 2.56298828125, 2.679443359375, 2.7958984375, 2.912353515625, 3.02880859375, 3.145263671875, 3.26171875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 8.0, 13.0, 4.0, 12.0, 9.0, 11.0, 15.0, 18.0, 23.0, 23.0, 40.0, 45.0, 43.0, 61.0, 52.0, 74.0, 73.0, 66.0, 66.0, 45.0, 50.0, 45.0, 31.0, 32.0, 17.0, 18.0, 21.0, 21.0, 5.0, 14.0, 8.0, 8.0, 2.0, 3.0, 6.0, 2.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0002613067626953125, -0.00025432929396629333, -0.00024735182523727417, -0.000240374356508255, -0.00023339688777923584, -0.00022641941905021667, -0.0002194419503211975, -0.00021246448159217834, -0.00020548701286315918, -0.00019850954413414001, -0.00019153207540512085, -0.00018455460667610168, -0.00017757713794708252, -0.00017059966921806335, -0.0001636222004890442, -0.00015664473176002502, -0.00014966726303100586, -0.0001426897943019867, -0.00013571232557296753, -0.00012873485684394836, -0.0001217573881149292, -0.00011477991938591003, -0.00010780245065689087, -0.0001008249819278717, -9.384751319885254e-05, -8.687004446983337e-05, -7.989257574081421e-05, -7.291510701179504e-05, -6.593763828277588e-05, -5.8960169553756714e-05, -5.198270082473755e-05, -4.5005232095718384e-05, -3.802776336669922e-05, -3.1050294637680054e-05, -2.407282590866089e-05, -1.7095357179641724e-05, -1.0117888450622559e-05, -3.1404197216033936e-06, 3.8370490074157715e-06, 1.0814517736434937e-05, 1.77919864654541e-05, 2.4769455194473267e-05, 3.174692392349243e-05, 3.87243926525116e-05, 4.570186138153076e-05, 5.267933011054993e-05, 5.965679883956909e-05, 6.663426756858826e-05, 7.361173629760742e-05, 8.058920502662659e-05, 8.756667375564575e-05, 9.454414248466492e-05, 0.00010152161121368408, 0.00010849907994270325, 0.00011547654867172241, 0.00012245401740074158, 0.00012943148612976074, 0.0001364089548587799, 0.00014338642358779907, 0.00015036389231681824, 0.0001573413610458374, 0.00016431882977485657, 0.00017129629850387573, 0.0001782737672328949, 0.00018525123596191406]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 8.0, 9.0, 17.0, 15.0, 25.0, 44.0, 55.0, 89.0, 145.0, 284.0, 551.0, 1230.0, 3263.0, 11226.0, 73712.0, 623246.0, 293957.0, 30459.0, 6315.0, 2103.0, 801.0, 407.0, 222.0, 116.0, 63.0, 48.0, 42.0, 28.0, 22.0, 11.0, 8.0, 6.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.021484375, -2.9200439453125, -2.818603515625, -2.7171630859375, -2.61572265625, -2.5142822265625, -2.412841796875, -2.3114013671875, -2.2099609375, -2.1085205078125, -2.007080078125, -1.9056396484375, -1.80419921875, -1.7027587890625, -1.601318359375, -1.4998779296875, -1.3984375, -1.2969970703125, -1.195556640625, -1.0941162109375, -0.99267578125, -0.8912353515625, -0.789794921875, -0.6883544921875, -0.5869140625, -0.4854736328125, -0.384033203125, -0.2825927734375, -0.18115234375, -0.0797119140625, 0.021728515625, 0.1231689453125, 0.224609375, 0.3260498046875, 0.427490234375, 0.5289306640625, 0.63037109375, 0.7318115234375, 0.833251953125, 0.9346923828125, 1.0361328125, 1.1375732421875, 1.239013671875, 1.3404541015625, 1.44189453125, 1.5433349609375, 1.644775390625, 1.7462158203125, 1.84765625, 1.9490966796875, 2.050537109375, 2.1519775390625, 2.25341796875, 2.3548583984375, 2.456298828125, 2.5577392578125, 2.6591796875, 2.7606201171875, 2.862060546875, 2.9635009765625, 3.06494140625, 3.1663818359375, 3.267822265625, 3.3692626953125, 3.470703125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 2.0, 4.0, 7.0, 11.0, 14.0, 20.0, 19.0, 36.0, 33.0, 38.0, 50.0, 82.0, 65.0, 83.0, 98.0, 72.0, 88.0, 55.0, 51.0, 36.0, 35.0, 17.0, 24.0, 10.0, 11.0, 4.0, 5.0, 4.0, 4.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3056640625, -1.2610321044921875, -1.216400146484375, -1.1717681884765625, -1.12713623046875, -1.0825042724609375, -1.037872314453125, -0.9932403564453125, -0.9486083984375, -0.9039764404296875, -0.859344482421875, -0.8147125244140625, -0.77008056640625, -0.7254486083984375, -0.680816650390625, -0.6361846923828125, -0.591552734375, -0.5469207763671875, -0.502288818359375, -0.4576568603515625, -0.41302490234375, -0.3683929443359375, -0.323760986328125, -0.2791290283203125, -0.2344970703125, -0.1898651123046875, -0.145233154296875, -0.1006011962890625, -0.05596923828125, -0.0113372802734375, 0.033294677734375, 0.0779266357421875, 0.12255859375, 0.1671905517578125, 0.211822509765625, 0.2564544677734375, 0.30108642578125, 0.3457183837890625, 0.390350341796875, 0.4349822998046875, 0.4796142578125, 0.5242462158203125, 0.568878173828125, 0.6135101318359375, 0.65814208984375, 0.7027740478515625, 0.747406005859375, 0.7920379638671875, 0.836669921875, 0.8813018798828125, 0.925933837890625, 0.9705657958984375, 1.01519775390625, 1.0598297119140625, 1.104461669921875, 1.1490936279296875, 1.1937255859375, 1.2383575439453125, 1.282989501953125, 1.3276214599609375, 1.37225341796875, 1.4168853759765625, 1.461517333984375, 1.5061492919921875, 1.55078125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 29.0, 70.0, 204.0, 256.0, 264.0, 111.0, 41.0, 10.0, 10.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.23860168457031, -73.66641998291016, -72.09424591064453, -70.52206420898438, -68.94989013671875, -67.3777084350586, -65.80553436279297, -64.23335266113281, -62.66117477416992, -61.08899688720703, -59.51681900024414, -57.94464111328125, -56.372459411621094, -54.8002815246582, -53.22810363769531, -51.65592575073242, -50.08374786376953, -48.51156997680664, -46.93939208984375, -45.36721420288086, -43.79503631591797, -42.22285461425781, -40.65067672729492, -39.07849884033203, -37.50632095336914, -35.93414306640625, -34.36196517944336, -32.78978729248047, -31.217607498168945, -29.645429611206055, -28.07324981689453, -26.50107192993164, -24.92889404296875, -23.35671615600586, -21.78453826904297, -20.212358474731445, -18.640180587768555, -17.068002700805664, -15.495823860168457, -13.92364501953125, -12.35146713256836, -10.779289245605469, -9.207110404968262, -7.634932041168213, -6.062753677368164, -4.490575313568115, -2.9183969497680664, -1.3462181091308594, 0.22595977783203125, 1.79813814163208, 3.370316505432129, 4.942494869232178, 6.514673233032227, 8.086851119995117, 9.659029960632324, 11.231208801269531, 12.803386688232422, 14.375564575195312, 15.94774341583252, 17.519922256469727, 19.092100143432617, 20.664278030395508, 22.23645782470703, 23.808635711669922, 25.380813598632812]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 7.0, 1.0, 11.0, 3.0, 11.0, 12.0, 15.0, 18.0, 22.0, 19.0, 26.0, 43.0, 28.0, 43.0, 32.0, 40.0, 35.0, 51.0, 62.0, 46.0, 50.0, 56.0, 53.0, 41.0, 42.0, 35.0, 26.0, 19.0, 27.0, 17.0, 19.0, 18.0, 22.0, 5.0, 8.0, 10.0, 10.0, 6.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.612895965576172, -18.032562255859375, -17.452228546142578, -16.87189483642578, -16.291561126708984, -15.711227416992188, -15.130892753601074, -14.550559043884277, -13.97022533416748, -13.389891624450684, -12.809557914733887, -12.22922420501709, -11.648889541625977, -11.06855583190918, -10.488222122192383, -9.907888412475586, -9.327554702758789, -8.747220993041992, -8.166887283325195, -7.58655309677124, -7.006219387054443, -6.4258856773376465, -5.845551490783691, -5.2652177810668945, -4.684884071350098, -4.104550361633301, -3.524216413497925, -2.943882465362549, -2.363548755645752, -1.783215045928955, -1.202881097793579, -0.6225471496582031, -0.04221343994140625, 0.5381203889846802, 1.1184542179107666, 1.698788046836853, 2.2791218757629395, 2.8594555854797363, 3.4397895336151123, 4.020123481750488, 4.600457191467285, 5.180790901184082, 5.761124610900879, 6.341458797454834, 6.921792507171631, 7.502126216888428, 8.082460403442383, 8.66279411315918, 9.243127822875977, 9.823461532592773, 10.40379524230957, 10.984128952026367, 11.564462661743164, 12.144796371459961, 12.725131034851074, 13.305464744567871, 13.885798454284668, 14.466132164001465, 15.046465873718262, 15.626799583435059, 16.207134246826172, 16.78746795654297, 17.367801666259766, 17.948135375976562, 18.52846908569336]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 10.0, 6.0, 9.0, 9.0, 16.0, 22.0, 41.0, 51.0, 83.0, 163.0, 225.0, 383.0, 743.0, 1354.0, 2821.0, 6582.0, 18650.0, 74991.0, 926159.0, 3018111.0, 105761.0, 23597.0, 7901.0, 3146.0, 1607.0, 726.0, 427.0, 240.0, 147.0, 84.0, 59.0, 28.0, 36.0, 27.0, 16.0, 13.0, 3.0, 6.0, 8.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0], "bins": [-3.80078125, -3.701019287109375, -3.60125732421875, -3.501495361328125, -3.4017333984375, -3.301971435546875, -3.20220947265625, -3.102447509765625, -3.002685546875, -2.902923583984375, -2.80316162109375, -2.703399658203125, -2.6036376953125, -2.503875732421875, -2.40411376953125, -2.304351806640625, -2.20458984375, -2.104827880859375, -2.00506591796875, -1.905303955078125, -1.8055419921875, -1.705780029296875, -1.60601806640625, -1.506256103515625, -1.406494140625, -1.306732177734375, -1.20697021484375, -1.107208251953125, -1.0074462890625, -0.907684326171875, -0.80792236328125, -0.708160400390625, -0.6083984375, -0.508636474609375, -0.40887451171875, -0.309112548828125, -0.2093505859375, -0.109588623046875, -0.00982666015625, 0.089935302734375, 0.189697265625, 0.289459228515625, 0.38922119140625, 0.488983154296875, 0.5887451171875, 0.688507080078125, 0.78826904296875, 0.888031005859375, 0.98779296875, 1.087554931640625, 1.18731689453125, 1.287078857421875, 1.3868408203125, 1.486602783203125, 1.58636474609375, 1.686126708984375, 1.785888671875, 1.885650634765625, 1.98541259765625, 2.085174560546875, 2.1849365234375, 2.284698486328125, 2.38446044921875, 2.484222412109375, 2.583984375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 8.0, 12.0, 22.0, 23.0, 26.0, 42.0, 45.0, 46.0, 73.0, 81.0, 73.0, 86.0, 92.0, 79.0, 71.0, 57.0, 36.0, 38.0, 26.0, 16.0, 11.0, 11.0, 5.0, 3.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0224609375, -0.9934463500976562, -0.9644317626953125, -0.9354171752929688, -0.906402587890625, -0.8773880004882812, -0.8483734130859375, -0.8193588256835938, -0.79034423828125, -0.7613296508789062, -0.7323150634765625, -0.7033004760742188, -0.674285888671875, -0.6452713012695312, -0.6162567138671875, -0.5872421264648438, -0.5582275390625, -0.5292129516601562, -0.5001983642578125, -0.47118377685546875, -0.442169189453125, -0.41315460205078125, -0.3841400146484375, -0.35512542724609375, -0.32611083984375, -0.29709625244140625, -0.2680816650390625, -0.23906707763671875, -0.210052490234375, -0.18103790283203125, -0.1520233154296875, -0.12300872802734375, -0.093994140625, -0.06497955322265625, -0.0359649658203125, -0.00695037841796875, 0.022064208984375, 0.05107879638671875, 0.0800933837890625, 0.10910797119140625, 0.13812255859375, 0.16713714599609375, 0.1961517333984375, 0.22516632080078125, 0.254180908203125, 0.28319549560546875, 0.3122100830078125, 0.34122467041015625, 0.3702392578125, 0.39925384521484375, 0.4282684326171875, 0.45728302001953125, 0.486297607421875, 0.5153121948242188, 0.5443267822265625, 0.5733413696289062, 0.60235595703125, 0.6313705444335938, 0.6603851318359375, 0.6893997192382812, 0.718414306640625, 0.7474288940429688, 0.7764434814453125, 0.8054580688476562, 0.83447265625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 12.0, 3.0, 13.0, 18.0, 32.0, 39.0, 65.0, 140.0, 244.0, 451.0, 1053.0, 2556.0, 6785.0, 21556.0, 97249.0, 923963.0, 2899547.0, 190044.0, 34761.0, 9727.0, 3451.0, 1331.0, 609.0, 281.0, 151.0, 88.0, 43.0, 23.0, 17.0, 10.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.74609375, -3.647979736328125, -3.54986572265625, -3.451751708984375, -3.3536376953125, -3.255523681640625, -3.15740966796875, -3.059295654296875, -2.961181640625, -2.863067626953125, -2.76495361328125, -2.666839599609375, -2.5687255859375, -2.470611572265625, -2.37249755859375, -2.274383544921875, -2.17626953125, -2.078155517578125, -1.98004150390625, -1.881927490234375, -1.7838134765625, -1.685699462890625, -1.58758544921875, -1.489471435546875, -1.391357421875, -1.293243408203125, -1.19512939453125, -1.097015380859375, -0.9989013671875, -0.900787353515625, -0.80267333984375, -0.704559326171875, -0.6064453125, -0.508331298828125, -0.41021728515625, -0.312103271484375, -0.2139892578125, -0.115875244140625, -0.01776123046875, 0.080352783203125, 0.178466796875, 0.276580810546875, 0.37469482421875, 0.472808837890625, 0.5709228515625, 0.669036865234375, 0.76715087890625, 0.865264892578125, 0.96337890625, 1.061492919921875, 1.15960693359375, 1.257720947265625, 1.3558349609375, 1.453948974609375, 1.55206298828125, 1.650177001953125, 1.748291015625, 1.846405029296875, 1.94451904296875, 2.042633056640625, 2.1407470703125, 2.238861083984375, 2.33697509765625, 2.435089111328125, 2.533203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 10.0, 4.0, 10.0, 11.0, 13.0, 20.0, 28.0, 38.0, 61.0, 93.0, 131.0, 223.0, 404.0, 1034.0, 964.0, 415.0, 225.0, 114.0, 89.0, 44.0, 29.0, 27.0, 15.0, 14.0, 15.0, 9.0, 10.0, 5.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.87158203125, -0.8459320068359375, -0.820281982421875, -0.7946319580078125, -0.76898193359375, -0.7433319091796875, -0.717681884765625, -0.6920318603515625, -0.6663818359375, -0.6407318115234375, -0.615081787109375, -0.5894317626953125, -0.56378173828125, -0.5381317138671875, -0.512481689453125, -0.4868316650390625, -0.461181640625, -0.4355316162109375, -0.409881591796875, -0.3842315673828125, -0.35858154296875, -0.3329315185546875, -0.307281494140625, -0.2816314697265625, -0.2559814453125, -0.2303314208984375, -0.204681396484375, -0.1790313720703125, -0.15338134765625, -0.1277313232421875, -0.102081298828125, -0.0764312744140625, -0.05078125, -0.0251312255859375, 0.000518798828125, 0.0261688232421875, 0.05181884765625, 0.0774688720703125, 0.103118896484375, 0.1287689208984375, 0.1544189453125, 0.1800689697265625, 0.205718994140625, 0.2313690185546875, 0.25701904296875, 0.2826690673828125, 0.308319091796875, 0.3339691162109375, 0.359619140625, 0.3852691650390625, 0.410919189453125, 0.4365692138671875, 0.46221923828125, 0.4878692626953125, 0.513519287109375, 0.5391693115234375, 0.5648193359375, 0.5904693603515625, 0.616119384765625, 0.6417694091796875, 0.66741943359375, 0.6930694580078125, 0.718719482421875, 0.7443695068359375, 0.77001953125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 7.0, 13.0, 22.0, 51.0, 81.0, 133.0, 155.0, 165.0, 154.0, 99.0, 70.0, 21.0, 15.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.813425064086914, -9.580723762512207, -9.3480224609375, -9.115320205688477, -8.88261890411377, -8.649917602539062, -8.417216300964355, -8.184514999389648, -7.951813220977783, -7.719111919403076, -7.486410140991211, -7.253708839416504, -7.021007537841797, -6.788305759429932, -6.555604457855225, -6.322902679443359, -6.090201377868652, -5.857500076293945, -5.62479829788208, -5.392096996307373, -5.159395694732666, -4.926693916320801, -4.693992614746094, -4.461291313171387, -4.22859001159668, -3.9958884716033936, -3.7631871700286865, -3.5304856300354004, -3.2977840900421143, -3.065082550048828, -2.832381248474121, -2.599679708480835, -2.366978168487549, -2.1342766284942627, -1.9015752077102661, -1.6688737869262695, -1.4361722469329834, -1.2034708261489868, -0.9707694053649902, -0.7380678653717041, -0.5053664445877075, -0.27266496419906616, -0.03996351361274719, 0.19273793697357178, 0.42543941736221313, 0.6581408977508545, 0.8908423185348511, 1.1235438585281372, 1.3562452793121338, 1.5889467000961304, 1.8216482400894165, 2.054349660873413, 2.287051200866699, 2.5197525024414062, 2.7524540424346924, 2.9851555824279785, 3.2178568840026855, 3.4505584239959717, 3.6832597255706787, 3.915961265563965, 4.148662567138672, 4.381364345550537, 4.614065647125244, 4.846767425537109, 5.079468727111816]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 9.0, 5.0, 11.0, 11.0, 11.0, 10.0, 11.0, 18.0, 20.0, 32.0, 32.0, 37.0, 39.0, 43.0, 46.0, 45.0, 55.0, 47.0, 45.0, 56.0, 42.0, 58.0, 45.0, 36.0, 33.0, 25.0, 33.0, 29.0, 9.0, 21.0, 22.0, 15.0, 15.0, 11.0, 10.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.6406936645507812, -3.5346696376800537, -3.428645610809326, -3.3226215839385986, -3.216597557067871, -3.1105735301971436, -3.004549503326416, -2.8985252380371094, -2.792501449584961, -2.6864774227142334, -2.580453395843506, -2.4744293689727783, -2.368405342102051, -2.2623813152313232, -2.1563572883605957, -2.050333023071289, -1.9443089962005615, -1.838284969329834, -1.7322609424591064, -1.626236915588379, -1.5202128887176514, -1.4141888618469238, -1.3081647157669067, -1.2021406888961792, -1.0961166620254517, -0.9900926351547241, -0.8840686082839966, -0.7780445218086243, -0.6720204949378967, -0.5659964680671692, -0.4599723815917969, -0.35394835472106934, -0.2479240894317627, -0.14190004765987396, -0.03587600588798523, 0.0701480507850647, 0.17617207765579224, 0.2821961045265198, 0.3882201910018921, 0.49424421787261963, 0.6002682447433472, 0.7062922716140747, 0.8123162984848022, 0.9183403849601746, 1.0243644714355469, 1.1303884983062744, 1.236412525177002, 1.3424365520477295, 1.448460578918457, 1.5544846057891846, 1.660508632659912, 1.7665326595306396, 1.8725566864013672, 1.9785807132720947, 2.0846047401428223, 2.190629005432129, 2.2966527938842773, 2.402676820755005, 2.5087008476257324, 2.61472487449646, 2.7207489013671875, 2.826772928237915, 2.9327969551086426, 3.038821220397949, 3.1448452472686768]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 8.0, 15.0, 16.0, 15.0, 26.0, 47.0, 80.0, 115.0, 212.0, 369.0, 620.0, 1210.0, 2467.0, 5718.0, 14325.0, 41971.0, 127256.0, 295896.0, 322862.0, 154097.0, 51396.0, 17094.0, 6673.0, 2913.0, 1480.0, 714.0, 382.0, 229.0, 121.0, 73.0, 57.0, 38.0, 23.0, 15.0, 12.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.970703125, -2.88604736328125, -2.8013916015625, -2.71673583984375, -2.632080078125, -2.54742431640625, -2.4627685546875, -2.37811279296875, -2.29345703125, -2.20880126953125, -2.1241455078125, -2.03948974609375, -1.954833984375, -1.87017822265625, -1.7855224609375, -1.70086669921875, -1.6162109375, -1.53155517578125, -1.4468994140625, -1.36224365234375, -1.277587890625, -1.19293212890625, -1.1082763671875, -1.02362060546875, -0.93896484375, -0.85430908203125, -0.7696533203125, -0.68499755859375, -0.600341796875, -0.51568603515625, -0.4310302734375, -0.34637451171875, -0.26171875, -0.17706298828125, -0.0924072265625, -0.00775146484375, 0.076904296875, 0.16156005859375, 0.2462158203125, 0.33087158203125, 0.41552734375, 0.50018310546875, 0.5848388671875, 0.66949462890625, 0.754150390625, 0.83880615234375, 0.9234619140625, 1.00811767578125, 1.0927734375, 1.17742919921875, 1.2620849609375, 1.34674072265625, 1.431396484375, 1.51605224609375, 1.6007080078125, 1.68536376953125, 1.77001953125, 1.85467529296875, 1.9393310546875, 2.02398681640625, 2.108642578125, 2.19329833984375, 2.2779541015625, 2.36260986328125, 2.447265625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 5.0, 4.0, 7.0, 10.0, 23.0, 22.0, 31.0, 39.0, 54.0, 61.0, 63.0, 93.0, 98.0, 85.0, 77.0, 76.0, 66.0, 53.0, 36.0, 35.0, 23.0, 14.0, 6.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0517578125, -1.0206222534179688, -0.9894866943359375, -0.9583511352539062, -0.927215576171875, -0.8960800170898438, -0.8649444580078125, -0.8338088989257812, -0.80267333984375, -0.7715377807617188, -0.7404022216796875, -0.7092666625976562, -0.678131103515625, -0.6469955444335938, -0.6158599853515625, -0.5847244262695312, -0.5535888671875, -0.5224533081054688, -0.4913177490234375, -0.46018218994140625, -0.429046630859375, -0.39791107177734375, -0.3667755126953125, -0.33563995361328125, -0.30450439453125, -0.27336883544921875, -0.2422332763671875, -0.21109771728515625, -0.179962158203125, -0.14882659912109375, -0.1176910400390625, -0.08655548095703125, -0.055419921875, -0.02428436279296875, 0.0068511962890625, 0.03798675537109375, 0.069122314453125, 0.10025787353515625, 0.1313934326171875, 0.16252899169921875, 0.19366455078125, 0.22480010986328125, 0.2559356689453125, 0.28707122802734375, 0.318206787109375, 0.34934234619140625, 0.3804779052734375, 0.41161346435546875, 0.4427490234375, 0.47388458251953125, 0.5050201416015625, 0.5361557006835938, 0.567291259765625, 0.5984268188476562, 0.6295623779296875, 0.6606979370117188, 0.69183349609375, 0.7229690551757812, 0.7541046142578125, 0.7852401733398438, 0.816375732421875, 0.8475112915039062, 0.8786468505859375, 0.9097824096679688, 0.94091796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 5.0, 6.0, 19.0, 11.0, 15.0, 28.0, 25.0, 41.0, 52.0, 76.0, 99.0, 141.0, 199.0, 320.0, 408.0, 585.0, 990.0, 1782.0, 4537.0, 15597.0, 65629.0, 251315.0, 427159.0, 207519.0, 51725.0, 12069.0, 3761.0, 1638.0, 880.0, 525.0, 398.0, 260.0, 202.0, 135.0, 119.0, 73.0, 61.0, 40.0, 34.0, 29.0, 8.0, 13.0, 10.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.26171875, -3.161102294921875, -3.06048583984375, -2.959869384765625, -2.8592529296875, -2.758636474609375, -2.65802001953125, -2.557403564453125, -2.456787109375, -2.356170654296875, -2.25555419921875, -2.154937744140625, -2.0543212890625, -1.953704833984375, -1.85308837890625, -1.752471923828125, -1.65185546875, -1.551239013671875, -1.45062255859375, -1.350006103515625, -1.2493896484375, -1.148773193359375, -1.04815673828125, -0.947540283203125, -0.846923828125, -0.746307373046875, -0.64569091796875, -0.545074462890625, -0.4444580078125, -0.343841552734375, -0.24322509765625, -0.142608642578125, -0.0419921875, 0.058624267578125, 0.15924072265625, 0.259857177734375, 0.3604736328125, 0.461090087890625, 0.56170654296875, 0.662322998046875, 0.762939453125, 0.863555908203125, 0.96417236328125, 1.064788818359375, 1.1654052734375, 1.266021728515625, 1.36663818359375, 1.467254638671875, 1.56787109375, 1.668487548828125, 1.76910400390625, 1.869720458984375, 1.9703369140625, 2.070953369140625, 2.17156982421875, 2.272186279296875, 2.372802734375, 2.473419189453125, 2.57403564453125, 2.674652099609375, 2.7752685546875, 2.875885009765625, 2.97650146484375, 3.077117919921875, 3.177734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 6.0, 6.0, 7.0, 11.0, 10.0, 8.0, 10.0, 12.0, 15.0, 16.0, 16.0, 40.0, 33.0, 37.0, 43.0, 36.0, 39.0, 45.0, 45.0, 55.0, 41.0, 49.0, 33.0, 39.0, 42.0, 49.0, 30.0, 33.0, 26.0, 24.0, 22.0, 22.0, 19.0, 20.0, 18.0, 8.0, 8.0, 11.0, 5.0, 6.0, 2.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7734375, -2.67791748046875, -2.5823974609375, -2.48687744140625, -2.391357421875, -2.29583740234375, -2.2003173828125, -2.10479736328125, -2.00927734375, -1.91375732421875, -1.8182373046875, -1.72271728515625, -1.627197265625, -1.53167724609375, -1.4361572265625, -1.34063720703125, -1.2451171875, -1.14959716796875, -1.0540771484375, -0.95855712890625, -0.863037109375, -0.76751708984375, -0.6719970703125, -0.57647705078125, -0.48095703125, -0.38543701171875, -0.2899169921875, -0.19439697265625, -0.098876953125, -0.00335693359375, 0.0921630859375, 0.18768310546875, 0.283203125, 0.37872314453125, 0.4742431640625, 0.56976318359375, 0.665283203125, 0.76080322265625, 0.8563232421875, 0.95184326171875, 1.04736328125, 1.14288330078125, 1.2384033203125, 1.33392333984375, 1.429443359375, 1.52496337890625, 1.6204833984375, 1.71600341796875, 1.8115234375, 1.90704345703125, 2.0025634765625, 2.09808349609375, 2.193603515625, 2.28912353515625, 2.3846435546875, 2.48016357421875, 2.57568359375, 2.67120361328125, 2.7667236328125, 2.86224365234375, 2.957763671875, 3.05328369140625, 3.1488037109375, 3.24432373046875, 3.33984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 10.0, 10.0, 12.0, 14.0, 26.0, 39.0, 58.0, 110.0, 274.0, 598.0, 2261.0, 13262.0, 153119.0, 751358.0, 113688.0, 10644.0, 1957.0, 555.0, 237.0, 110.0, 70.0, 40.0, 21.0, 22.0, 11.0, 12.0, 5.0, 9.0, 2.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.25390625, -3.14703369140625, -3.0401611328125, -2.93328857421875, -2.826416015625, -2.71954345703125, -2.6126708984375, -2.50579833984375, -2.39892578125, -2.29205322265625, -2.1851806640625, -2.07830810546875, -1.971435546875, -1.86456298828125, -1.7576904296875, -1.65081787109375, -1.5439453125, -1.43707275390625, -1.3302001953125, -1.22332763671875, -1.116455078125, -1.00958251953125, -0.9027099609375, -0.79583740234375, -0.68896484375, -0.58209228515625, -0.4752197265625, -0.36834716796875, -0.261474609375, -0.15460205078125, -0.0477294921875, 0.05914306640625, 0.166015625, 0.27288818359375, 0.3797607421875, 0.48663330078125, 0.593505859375, 0.70037841796875, 0.8072509765625, 0.91412353515625, 1.02099609375, 1.12786865234375, 1.2347412109375, 1.34161376953125, 1.448486328125, 1.55535888671875, 1.6622314453125, 1.76910400390625, 1.8759765625, 1.98284912109375, 2.0897216796875, 2.19659423828125, 2.303466796875, 2.41033935546875, 2.5172119140625, 2.62408447265625, 2.73095703125, 2.83782958984375, 2.9447021484375, 3.05157470703125, 3.158447265625, 3.26531982421875, 3.3721923828125, 3.47906494140625, 3.5859375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 9.0, 7.0, 7.0, 15.0, 12.0, 20.0, 24.0, 25.0, 29.0, 31.0, 29.0, 42.0, 65.0, 67.0, 87.0, 84.0, 66.0, 64.0, 46.0, 49.0, 41.0, 30.0, 27.0, 32.0, 14.0, 11.0, 17.0, 8.0, 8.0, 6.0, 8.0, 5.0, 7.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021123886108398438, -0.00020404160022735596, -0.00019684433937072754, -0.00018964707851409912, -0.0001824498176574707, -0.00017525255680084229, -0.00016805529594421387, -0.00016085803508758545, -0.00015366077423095703, -0.0001464635133743286, -0.0001392662525177002, -0.00013206899166107178, -0.00012487173080444336, -0.00011767446994781494, -0.00011047720909118652, -0.0001032799482345581, -9.608268737792969e-05, -8.888542652130127e-05, -8.168816566467285e-05, -7.449090480804443e-05, -6.729364395141602e-05, -6.00963830947876e-05, -5.289912223815918e-05, -4.570186138153076e-05, -3.8504600524902344e-05, -3.1307339668273926e-05, -2.4110078811645508e-05, -1.691281795501709e-05, -9.715557098388672e-06, -2.518296241760254e-06, 4.678964614868164e-06, 1.1876225471496582e-05, 1.9073486328125e-05, 2.6270747184753418e-05, 3.3468008041381836e-05, 4.0665268898010254e-05, 4.786252975463867e-05, 5.505979061126709e-05, 6.225705146789551e-05, 6.945431232452393e-05, 7.665157318115234e-05, 8.384883403778076e-05, 9.104609489440918e-05, 9.82433557510376e-05, 0.00010544061660766602, 0.00011263787746429443, 0.00011983513832092285, 0.00012703239917755127, 0.0001342296600341797, 0.0001414269208908081, 0.00014862418174743652, 0.00015582144260406494, 0.00016301870346069336, 0.00017021596431732178, 0.0001774132251739502, 0.0001846104860305786, 0.00019180774688720703, 0.00019900500774383545, 0.00020620226860046387, 0.00021339952945709229, 0.0002205967903137207, 0.00022779405117034912, 0.00023499131202697754, 0.00024218857288360596, 0.0002493858337402344]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 3.0, 3.0, 11.0, 11.0, 13.0, 17.0, 20.0, 36.0, 60.0, 81.0, 123.0, 217.0, 370.0, 713.0, 1446.0, 3401.0, 9605.0, 47833.0, 473383.0, 450341.0, 44928.0, 9485.0, 3312.0, 1456.0, 682.0, 414.0, 228.0, 113.0, 76.0, 52.0, 40.0, 27.0, 13.0, 9.0, 11.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.91473388671875, -2.8236083984375, -2.73248291015625, -2.641357421875, -2.55023193359375, -2.4591064453125, -2.36798095703125, -2.27685546875, -2.18572998046875, -2.0946044921875, -2.00347900390625, -1.912353515625, -1.82122802734375, -1.7301025390625, -1.63897705078125, -1.5478515625, -1.45672607421875, -1.3656005859375, -1.27447509765625, -1.183349609375, -1.09222412109375, -1.0010986328125, -0.90997314453125, -0.81884765625, -0.72772216796875, -0.6365966796875, -0.54547119140625, -0.454345703125, -0.36322021484375, -0.2720947265625, -0.18096923828125, -0.08984375, 0.00128173828125, 0.0924072265625, 0.18353271484375, 0.274658203125, 0.36578369140625, 0.4569091796875, 0.54803466796875, 0.63916015625, 0.73028564453125, 0.8214111328125, 0.91253662109375, 1.003662109375, 1.09478759765625, 1.1859130859375, 1.27703857421875, 1.3681640625, 1.45928955078125, 1.5504150390625, 1.64154052734375, 1.732666015625, 1.82379150390625, 1.9149169921875, 2.00604248046875, 2.09716796875, 2.18829345703125, 2.2794189453125, 2.37054443359375, 2.461669921875, 2.55279541015625, 2.6439208984375, 2.73504638671875, 2.826171875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 5.0, 8.0, 8.0, 17.0, 27.0, 23.0, 30.0, 40.0, 66.0, 81.0, 103.0, 100.0, 106.0, 103.0, 73.0, 57.0, 42.0, 23.0, 20.0, 16.0, 10.0, 13.0, 5.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.7333984375, -1.6688385009765625, -1.604278564453125, -1.5397186279296875, -1.47515869140625, -1.4105987548828125, -1.346038818359375, -1.2814788818359375, -1.2169189453125, -1.1523590087890625, -1.087799072265625, -1.0232391357421875, -0.95867919921875, -0.8941192626953125, -0.829559326171875, -0.7649993896484375, -0.700439453125, -0.6358795166015625, -0.571319580078125, -0.5067596435546875, -0.44219970703125, -0.3776397705078125, -0.313079833984375, -0.2485198974609375, -0.1839599609375, -0.1194000244140625, -0.054840087890625, 0.0097198486328125, 0.07427978515625, 0.1388397216796875, 0.203399658203125, 0.2679595947265625, 0.33251953125, 0.3970794677734375, 0.461639404296875, 0.5261993408203125, 0.59075927734375, 0.6553192138671875, 0.719879150390625, 0.7844390869140625, 0.8489990234375, 0.9135589599609375, 0.978118896484375, 1.0426788330078125, 1.10723876953125, 1.1717987060546875, 1.236358642578125, 1.3009185791015625, 1.365478515625, 1.4300384521484375, 1.494598388671875, 1.5591583251953125, 1.62371826171875, 1.6882781982421875, 1.752838134765625, 1.8173980712890625, 1.8819580078125, 1.9465179443359375, 2.011077880859375, 2.0756378173828125, 2.14019775390625, 2.2047576904296875, 2.269317626953125, 2.3338775634765625, 2.3984375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 10.0, 33.0, 106.0, 202.0, 306.0, 213.0, 90.0, 30.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.50049591064453, -61.97401809692383, -60.447540283203125, -58.921058654785156, -57.39458084106445, -55.86810302734375, -54.34162521362305, -52.815147399902344, -51.28866958618164, -49.76219177246094, -48.235713958740234, -46.70923614501953, -45.18275451660156, -43.65627670288086, -42.129798889160156, -40.60332107543945, -39.07684326171875, -37.55036544799805, -36.023887634277344, -34.497406005859375, -32.97092819213867, -31.44445037841797, -29.917972564697266, -28.391494750976562, -26.865013122558594, -25.33853530883789, -23.812055587768555, -22.28557777404785, -20.75909996032715, -19.232620239257812, -17.70614242553711, -16.179664611816406, -14.653186798095703, -13.126708030700684, -11.60023021697998, -10.073751449584961, -8.547273635864258, -7.020794868469238, -5.494316101074219, -3.9678382873535156, -2.441359519958496, -0.9148811101913452, 0.6115972995758057, 2.138075828552246, 3.6645541191101074, 5.191032409667969, 6.717511177062988, 8.243988990783691, 9.770467758178711, 11.29694652557373, 12.823424339294434, 14.349903106689453, 15.876380920410156, 17.40285873413086, 18.929338455200195, 20.4558162689209, 21.982295989990234, 23.508773803710938, 25.035253524780273, 26.561731338500977, 28.08820915222168, 29.614688873291016, 31.14116668701172, 32.66764450073242, 34.194122314453125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 6.0, 6.0, 4.0, 8.0, 11.0, 12.0, 13.0, 13.0, 21.0, 15.0, 34.0, 30.0, 26.0, 50.0, 34.0, 41.0, 38.0, 42.0, 37.0, 45.0, 42.0, 35.0, 41.0, 38.0, 45.0, 35.0, 32.0, 28.0, 28.0, 21.0, 24.0, 23.0, 28.0, 18.0, 10.0, 15.0, 6.0, 9.0, 8.0, 3.0, 5.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.902027130126953, -14.386523246765137, -13.871018409729004, -13.355514526367188, -12.840009689331055, -12.324505805969238, -11.809001922607422, -11.293497085571289, -10.777993202209473, -10.262489318847656, -9.746984481811523, -9.231480598449707, -8.71597671508789, -8.200471878051758, -7.684967994689941, -7.169463634490967, -6.653959274291992, -6.138454914093018, -5.622950553894043, -5.107446670532227, -4.591942310333252, -4.076437950134277, -3.560933828353882, -3.0454297065734863, -2.5299253463745117, -2.014420986175537, -1.4989168643951416, -0.9834126234054565, -0.4679083824157715, 0.047595977783203125, 0.5631000995635986, 1.0786042213439941, 1.5941085815429688, 2.1096129417419434, 2.625117063522339, 3.1406211853027344, 3.656125545501709, 4.171629905700684, 4.6871337890625, 5.202638149261475, 5.718142509460449, 6.233646869659424, 6.749151229858398, 7.264655113220215, 7.7801594734191895, 8.295663833618164, 8.81116771697998, 9.326671600341797, 9.84217643737793, 10.357680320739746, 10.873185157775879, 11.388689041137695, 11.904193878173828, 12.419697761535645, 12.935201644897461, 13.450706481933594, 13.96621036529541, 14.481714248657227, 14.99721908569336, 15.512722969055176, 16.028226852416992, 16.543731689453125, 17.059236526489258, 17.574739456176758, 18.09024429321289]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 6.0, 6.0, 12.0, 3.0, 26.0, 24.0, 35.0, 60.0, 90.0, 111.0, 201.0, 326.0, 527.0, 957.0, 1925.0, 4140.0, 10250.0, 30882.0, 134007.0, 1882241.0, 1943030.0, 136088.0, 31331.0, 10018.0, 3928.0, 1815.0, 917.0, 498.0, 289.0, 178.0, 97.0, 73.0, 51.0, 47.0, 21.0, 23.0, 14.0, 10.0, 4.0, 8.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0], "bins": [-3.09765625, -3.016143798828125, -2.93463134765625, -2.853118896484375, -2.7716064453125, -2.690093994140625, -2.60858154296875, -2.527069091796875, -2.445556640625, -2.364044189453125, -2.28253173828125, -2.201019287109375, -2.1195068359375, -2.037994384765625, -1.95648193359375, -1.874969482421875, -1.79345703125, -1.711944580078125, -1.63043212890625, -1.548919677734375, -1.4674072265625, -1.385894775390625, -1.30438232421875, -1.222869873046875, -1.141357421875, -1.059844970703125, -0.97833251953125, -0.896820068359375, -0.8153076171875, -0.733795166015625, -0.65228271484375, -0.570770263671875, -0.4892578125, -0.407745361328125, -0.32623291015625, -0.244720458984375, -0.1632080078125, -0.081695556640625, -0.00018310546875, 0.081329345703125, 0.162841796875, 0.244354248046875, 0.32586669921875, 0.407379150390625, 0.4888916015625, 0.570404052734375, 0.65191650390625, 0.733428955078125, 0.81494140625, 0.896453857421875, 0.97796630859375, 1.059478759765625, 1.1409912109375, 1.222503662109375, 1.30401611328125, 1.385528564453125, 1.467041015625, 1.548553466796875, 1.63006591796875, 1.711578369140625, 1.7930908203125, 1.874603271484375, 1.95611572265625, 2.037628173828125, 2.119140625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 4.0, 17.0, 14.0, 15.0, 22.0, 29.0, 47.0, 50.0, 57.0, 71.0, 65.0, 88.0, 76.0, 86.0, 87.0, 65.0, 54.0, 44.0, 29.0, 24.0, 14.0, 12.0, 8.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.109375, -1.0775985717773438, -1.0458221435546875, -1.0140457153320312, -0.982269287109375, -0.9504928588867188, -0.9187164306640625, -0.8869400024414062, -0.85516357421875, -0.8233871459960938, -0.7916107177734375, -0.7598342895507812, -0.728057861328125, -0.6962814331054688, -0.6645050048828125, -0.6327285766601562, -0.6009521484375, -0.5691757202148438, -0.5373992919921875, -0.5056228637695312, -0.473846435546875, -0.44207000732421875, -0.4102935791015625, -0.37851715087890625, -0.34674072265625, -0.31496429443359375, -0.2831878662109375, -0.25141143798828125, -0.219635009765625, -0.18785858154296875, -0.1560821533203125, -0.12430572509765625, -0.092529296875, -0.06075286865234375, -0.0289764404296875, 0.00279998779296875, 0.034576416015625, 0.06635284423828125, 0.0981292724609375, 0.12990570068359375, 0.16168212890625, 0.19345855712890625, 0.2252349853515625, 0.25701141357421875, 0.288787841796875, 0.32056427001953125, 0.3523406982421875, 0.38411712646484375, 0.4158935546875, 0.44766998291015625, 0.4794464111328125, 0.5112228393554688, 0.542999267578125, 0.5747756958007812, 0.6065521240234375, 0.6383285522460938, 0.67010498046875, 0.7018814086914062, 0.7336578369140625, 0.7654342651367188, 0.797210693359375, 0.8289871215820312, 0.8607635498046875, 0.8925399780273438, 0.92431640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 8.0, 6.0, 15.0, 15.0, 35.0, 56.0, 102.0, 189.0, 283.0, 624.0, 1304.0, 3398.0, 10145.0, 42397.0, 266611.0, 2821574.0, 916728.0, 101962.0, 19999.0, 5409.0, 1898.0, 760.0, 312.0, 164.0, 95.0, 60.0, 33.0, 19.0, 16.0, 19.0, 9.0, 4.0, 6.0, 5.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.947265625, -2.8572998046875, -2.767333984375, -2.6773681640625, -2.58740234375, -2.4974365234375, -2.407470703125, -2.3175048828125, -2.2275390625, -2.1375732421875, -2.047607421875, -1.9576416015625, -1.86767578125, -1.7777099609375, -1.687744140625, -1.5977783203125, -1.5078125, -1.4178466796875, -1.327880859375, -1.2379150390625, -1.14794921875, -1.0579833984375, -0.968017578125, -0.8780517578125, -0.7880859375, -0.6981201171875, -0.608154296875, -0.5181884765625, -0.42822265625, -0.3382568359375, -0.248291015625, -0.1583251953125, -0.068359375, 0.0216064453125, 0.111572265625, 0.2015380859375, 0.29150390625, 0.3814697265625, 0.471435546875, 0.5614013671875, 0.6513671875, 0.7413330078125, 0.831298828125, 0.9212646484375, 1.01123046875, 1.1011962890625, 1.191162109375, 1.2811279296875, 1.37109375, 1.4610595703125, 1.551025390625, 1.6409912109375, 1.73095703125, 1.8209228515625, 1.910888671875, 2.0008544921875, 2.0908203125, 2.1807861328125, 2.270751953125, 2.3607177734375, 2.45068359375, 2.5406494140625, 2.630615234375, 2.7205810546875, 2.810546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 10.0, 12.0, 17.0, 29.0, 33.0, 41.0, 51.0, 99.0, 183.0, 319.0, 510.0, 950.0, 781.0, 423.0, 212.0, 123.0, 96.0, 64.0, 33.0, 23.0, 20.0, 6.0, 8.0, 8.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4853515625, -1.446075439453125, -1.40679931640625, -1.367523193359375, -1.3282470703125, -1.288970947265625, -1.24969482421875, -1.210418701171875, -1.171142578125, -1.131866455078125, -1.09259033203125, -1.053314208984375, -1.0140380859375, -0.974761962890625, -0.93548583984375, -0.896209716796875, -0.85693359375, -0.817657470703125, -0.77838134765625, -0.739105224609375, -0.6998291015625, -0.660552978515625, -0.62127685546875, -0.582000732421875, -0.542724609375, -0.503448486328125, -0.46417236328125, -0.424896240234375, -0.3856201171875, -0.346343994140625, -0.30706787109375, -0.267791748046875, -0.228515625, -0.189239501953125, -0.14996337890625, -0.110687255859375, -0.0714111328125, -0.032135009765625, 0.00714111328125, 0.046417236328125, 0.085693359375, 0.124969482421875, 0.16424560546875, 0.203521728515625, 0.2427978515625, 0.282073974609375, 0.32135009765625, 0.360626220703125, 0.39990234375, 0.439178466796875, 0.47845458984375, 0.517730712890625, 0.5570068359375, 0.596282958984375, 0.63555908203125, 0.674835205078125, 0.714111328125, 0.753387451171875, 0.79266357421875, 0.831939697265625, 0.8712158203125, 0.910491943359375, 0.94976806640625, 0.989044189453125, 1.0283203125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 7.0, 6.0, 10.0, 12.0, 21.0, 34.0, 58.0, 101.0, 106.0, 108.0, 128.0, 119.0, 98.0, 68.0, 44.0, 32.0, 22.0, 11.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.957284450531006, -6.7126898765563965, -6.468095779418945, -6.223501205444336, -5.978907108306885, -5.734312534332275, -5.489718437194824, -5.245123863220215, -5.0005292892456055, -4.755934715270996, -4.511340618133545, -4.2667460441589355, -4.022151947021484, -3.777557373046875, -3.5329630374908447, -3.2883687019348145, -3.0437746047973633, -2.799180269241333, -2.5545859336853027, -2.3099913597106934, -2.065397262573242, -1.8208028078079224, -1.5762083530426025, -1.3316140174865723, -1.087019681930542, -0.8424253463745117, -0.5978309512138367, -0.3532365560531616, -0.10864222049713135, 0.13595211505889893, 0.38054656982421875, 0.625140905380249, 0.8697347640991211, 1.1143290996551514, 1.3589234352111816, 1.6035178899765015, 1.8481122255325317, 2.0927066802978516, 2.337301015853882, 2.581895351409912, 2.8264896869659424, 3.0710840225219727, 3.315678358078003, 3.560272693634033, 3.8048672676086426, 4.049461364746094, 4.294055938720703, 4.5386505126953125, 4.783244609832764, 5.027839183807373, 5.272433280944824, 5.517027854919434, 5.761621952056885, 6.006216526031494, 6.250810623168945, 6.495405197143555, 6.739999771118164, 6.984594345092773, 7.229188442230225, 7.473783016204834, 7.718377113342285, 7.9629716873168945, 8.207566261291504, 8.452159881591797, 8.696754455566406]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 7.0, 6.0, 7.0, 6.0, 22.0, 16.0, 25.0, 25.0, 33.0, 45.0, 43.0, 41.0, 58.0, 50.0, 53.0, 51.0, 52.0, 77.0, 57.0, 38.0, 51.0, 44.0, 38.0, 34.0, 22.0, 27.0, 14.0, 14.0, 13.0, 12.0, 7.0, 3.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.906486988067627, -5.732168197631836, -5.557848930358887, -5.383530139923096, -5.2092108726501465, -5.0348920822143555, -4.860572814941406, -4.686254024505615, -4.511935234069824, -4.337616443634033, -4.163297176361084, -3.988978385925293, -3.8146591186523438, -3.6403403282165527, -3.4660212993621826, -3.2917022705078125, -3.1173830032348633, -2.943063974380493, -2.768744945526123, -2.594426155090332, -2.420106887817383, -2.245788097381592, -2.0714690685272217, -1.8971500396728516, -1.7228310108184814, -1.5485119819641113, -1.3741929531097412, -1.1998740434646606, -1.0255550146102905, -0.8512359857559204, -0.6769170761108398, -0.5025980472564697, -0.3282785415649414, -0.15395954251289368, 0.020359456539154053, 0.1946784257888794, 0.3689974546432495, 0.5433164834976196, 0.7176353931427002, 0.8919544219970703, 1.0662734508514404, 1.2405924797058105, 1.4149115085601807, 1.5892304182052612, 1.7635494470596313, 1.9378684759140015, 2.112187385559082, 2.286506414413452, 2.4608254432678223, 2.6351444721221924, 2.8094635009765625, 2.9837822914123535, 3.1581015586853027, 3.3324203491210938, 3.506739377975464, 3.681058406829834, 3.855377435684204, 4.029696464538574, 4.204015254974365, 4.3783345222473145, 4.5526533126831055, 4.726972579956055, 4.901291370391846, 5.075610160827637, 5.249929428100586]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 9.0, 10.0, 14.0, 29.0, 40.0, 51.0, 76.0, 112.0, 151.0, 261.0, 472.0, 769.0, 1465.0, 2828.0, 5857.0, 13255.0, 32587.0, 82253.0, 193789.0, 312593.0, 228769.0, 101936.0, 40637.0, 16353.0, 7090.0, 3203.0, 1627.0, 915.0, 520.0, 314.0, 186.0, 112.0, 97.0, 42.0, 41.0, 24.0, 21.0, 11.0, 11.0, 5.0, 4.0, 4.0, 0.0, 1.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.630859375, -2.550201416015625, -2.46954345703125, -2.388885498046875, -2.3082275390625, -2.227569580078125, -2.14691162109375, -2.066253662109375, -1.985595703125, -1.904937744140625, -1.82427978515625, -1.743621826171875, -1.6629638671875, -1.582305908203125, -1.50164794921875, -1.420989990234375, -1.34033203125, -1.259674072265625, -1.17901611328125, -1.098358154296875, -1.0177001953125, -0.937042236328125, -0.85638427734375, -0.775726318359375, -0.695068359375, -0.614410400390625, -0.53375244140625, -0.453094482421875, -0.3724365234375, -0.291778564453125, -0.21112060546875, -0.130462646484375, -0.0498046875, 0.030853271484375, 0.11151123046875, 0.192169189453125, 0.2728271484375, 0.353485107421875, 0.43414306640625, 0.514801025390625, 0.595458984375, 0.676116943359375, 0.75677490234375, 0.837432861328125, 0.9180908203125, 0.998748779296875, 1.07940673828125, 1.160064697265625, 1.24072265625, 1.321380615234375, 1.40203857421875, 1.482696533203125, 1.5633544921875, 1.644012451171875, 1.72467041015625, 1.805328369140625, 1.885986328125, 1.966644287109375, 2.04730224609375, 2.127960205078125, 2.2086181640625, 2.289276123046875, 2.36993408203125, 2.450592041015625, 2.53125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 10.0, 15.0, 13.0, 15.0, 24.0, 43.0, 41.0, 50.0, 64.0, 82.0, 68.0, 80.0, 75.0, 77.0, 73.0, 64.0, 57.0, 35.0, 34.0, 21.0, 15.0, 11.0, 11.0, 1.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.05859375, -1.0281219482421875, -0.997650146484375, -0.9671783447265625, -0.93670654296875, -0.9062347412109375, -0.875762939453125, -0.8452911376953125, -0.8148193359375, -0.7843475341796875, -0.753875732421875, -0.7234039306640625, -0.69293212890625, -0.6624603271484375, -0.631988525390625, -0.6015167236328125, -0.571044921875, -0.5405731201171875, -0.510101318359375, -0.4796295166015625, -0.44915771484375, -0.4186859130859375, -0.388214111328125, -0.3577423095703125, -0.3272705078125, -0.2967987060546875, -0.266326904296875, -0.2358551025390625, -0.20538330078125, -0.1749114990234375, -0.144439697265625, -0.1139678955078125, -0.08349609375, -0.0530242919921875, -0.022552490234375, 0.0079193115234375, 0.03839111328125, 0.0688629150390625, 0.099334716796875, 0.1298065185546875, 0.1602783203125, 0.1907501220703125, 0.221221923828125, 0.2516937255859375, 0.28216552734375, 0.3126373291015625, 0.343109130859375, 0.3735809326171875, 0.404052734375, 0.4345245361328125, 0.464996337890625, 0.4954681396484375, 0.52593994140625, 0.5564117431640625, 0.586883544921875, 0.6173553466796875, 0.6478271484375, 0.6782989501953125, 0.708770751953125, 0.7392425537109375, 0.76971435546875, 0.8001861572265625, 0.830657958984375, 0.8611297607421875, 0.8916015625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 9.0, 8.0, 17.0, 13.0, 27.0, 33.0, 35.0, 57.0, 57.0, 81.0, 113.0, 167.0, 230.0, 340.0, 474.0, 769.0, 1395.0, 2695.0, 6441.0, 16902.0, 49379.0, 135631.0, 297493.0, 306156.0, 144411.0, 53079.0, 18585.0, 6999.0, 2918.0, 1444.0, 802.0, 503.0, 333.0, 230.0, 186.0, 140.0, 109.0, 66.0, 44.0, 56.0, 24.0, 35.0, 11.0, 13.0, 12.0, 12.0, 7.0, 3.0, 5.0, 4.0, 2.0, 2.0], "bins": [-2.81640625, -2.73602294921875, -2.6556396484375, -2.57525634765625, -2.494873046875, -2.41448974609375, -2.3341064453125, -2.25372314453125, -2.17333984375, -2.09295654296875, -2.0125732421875, -1.93218994140625, -1.851806640625, -1.77142333984375, -1.6910400390625, -1.61065673828125, -1.5302734375, -1.44989013671875, -1.3695068359375, -1.28912353515625, -1.208740234375, -1.12835693359375, -1.0479736328125, -0.96759033203125, -0.88720703125, -0.80682373046875, -0.7264404296875, -0.64605712890625, -0.565673828125, -0.48529052734375, -0.4049072265625, -0.32452392578125, -0.244140625, -0.16375732421875, -0.0833740234375, -0.00299072265625, 0.077392578125, 0.15777587890625, 0.2381591796875, 0.31854248046875, 0.39892578125, 0.47930908203125, 0.5596923828125, 0.64007568359375, 0.720458984375, 0.80084228515625, 0.8812255859375, 0.96160888671875, 1.0419921875, 1.12237548828125, 1.2027587890625, 1.28314208984375, 1.363525390625, 1.44390869140625, 1.5242919921875, 1.60467529296875, 1.68505859375, 1.76544189453125, 1.8458251953125, 1.92620849609375, 2.006591796875, 2.08697509765625, 2.1673583984375, 2.24774169921875, 2.328125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 11.0, 8.0, 12.0, 8.0, 15.0, 23.0, 21.0, 31.0, 22.0, 25.0, 24.0, 29.0, 38.0, 36.0, 41.0, 51.0, 44.0, 42.0, 51.0, 52.0, 38.0, 38.0, 39.0, 37.0, 33.0, 34.0, 29.0, 23.0, 23.0, 25.0, 15.0, 13.0, 18.0, 9.0, 7.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.19921875, -3.10614013671875, -3.0130615234375, -2.91998291015625, -2.826904296875, -2.73382568359375, -2.6407470703125, -2.54766845703125, -2.45458984375, -2.36151123046875, -2.2684326171875, -2.17535400390625, -2.082275390625, -1.98919677734375, -1.8961181640625, -1.80303955078125, -1.7099609375, -1.61688232421875, -1.5238037109375, -1.43072509765625, -1.337646484375, -1.24456787109375, -1.1514892578125, -1.05841064453125, -0.96533203125, -0.87225341796875, -0.7791748046875, -0.68609619140625, -0.593017578125, -0.49993896484375, -0.4068603515625, -0.31378173828125, -0.220703125, -0.12762451171875, -0.0345458984375, 0.05853271484375, 0.151611328125, 0.24468994140625, 0.3377685546875, 0.43084716796875, 0.52392578125, 0.61700439453125, 0.7100830078125, 0.80316162109375, 0.896240234375, 0.98931884765625, 1.0823974609375, 1.17547607421875, 1.2685546875, 1.36163330078125, 1.4547119140625, 1.54779052734375, 1.640869140625, 1.73394775390625, 1.8270263671875, 1.92010498046875, 2.01318359375, 2.10626220703125, 2.1993408203125, 2.29241943359375, 2.385498046875, 2.47857666015625, 2.5716552734375, 2.66473388671875, 2.7578125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 11.0, 20.0, 12.0, 21.0, 30.0, 54.0, 115.0, 198.0, 431.0, 1060.0, 2976.0, 12271.0, 80138.0, 594063.0, 312430.0, 34601.0, 6786.0, 1903.0, 735.0, 277.0, 153.0, 72.0, 48.0, 39.0, 22.0, 9.0, 17.0, 7.0, 8.0, 6.0, 1.0, 7.0, 2.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.09375, -2.999420166015625, -2.90509033203125, -2.810760498046875, -2.7164306640625, -2.622100830078125, -2.52777099609375, -2.433441162109375, -2.339111328125, -2.244781494140625, -2.15045166015625, -2.056121826171875, -1.9617919921875, -1.867462158203125, -1.77313232421875, -1.678802490234375, -1.58447265625, -1.490142822265625, -1.39581298828125, -1.301483154296875, -1.2071533203125, -1.112823486328125, -1.01849365234375, -0.924163818359375, -0.829833984375, -0.735504150390625, -0.64117431640625, -0.546844482421875, -0.4525146484375, -0.358184814453125, -0.26385498046875, -0.169525146484375, -0.0751953125, 0.019134521484375, 0.11346435546875, 0.207794189453125, 0.3021240234375, 0.396453857421875, 0.49078369140625, 0.585113525390625, 0.679443359375, 0.773773193359375, 0.86810302734375, 0.962432861328125, 1.0567626953125, 1.151092529296875, 1.24542236328125, 1.339752197265625, 1.43408203125, 1.528411865234375, 1.62274169921875, 1.717071533203125, 1.8114013671875, 1.905731201171875, 2.00006103515625, 2.094390869140625, 2.188720703125, 2.283050537109375, 2.37738037109375, 2.471710205078125, 2.5660400390625, 2.660369873046875, 2.75469970703125, 2.849029541015625, 2.943359375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 6.0, 4.0, 4.0, 5.0, 3.0, 12.0, 18.0, 14.0, 26.0, 21.0, 32.0, 40.0, 50.0, 71.0, 106.0, 114.0, 118.0, 92.0, 51.0, 52.0, 35.0, 31.0, 22.0, 17.0, 15.0, 10.0, 8.0, 14.0, 4.0, 2.0, 2.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00030684471130371094, -0.0002957470715045929, -0.00028464943170547485, -0.0002735517919063568, -0.00026245415210723877, -0.00025135651230812073, -0.00024025887250900269, -0.00022916123270988464, -0.0002180635929107666, -0.00020696595311164856, -0.00019586831331253052, -0.00018477067351341248, -0.00017367303371429443, -0.0001625753939151764, -0.00015147775411605835, -0.0001403801143169403, -0.00012928247451782227, -0.00011818483471870422, -0.00010708719491958618, -9.598955512046814e-05, -8.48919153213501e-05, -7.379427552223206e-05, -6.269663572311401e-05, -5.159899592399597e-05, -4.050135612487793e-05, -2.9403716325759888e-05, -1.8306076526641846e-05, -7.208436727523804e-06, 3.889203071594238e-06, 1.498684287071228e-05, 2.6084482669830322e-05, 3.7182122468948364e-05, 4.8279762268066406e-05, 5.937740206718445e-05, 7.047504186630249e-05, 8.157268166542053e-05, 9.267032146453857e-05, 0.00010376796126365662, 0.00011486560106277466, 0.0001259632408618927, 0.00013706088066101074, 0.00014815852046012878, 0.00015925616025924683, 0.00017035380005836487, 0.0001814514398574829, 0.00019254907965660095, 0.000203646719455719, 0.00021474435925483704, 0.00022584199905395508, 0.00023693963885307312, 0.00024803727865219116, 0.0002591349184513092, 0.00027023255825042725, 0.0002813301980495453, 0.00029242783784866333, 0.00030352547764778137, 0.0003146231174468994, 0.00032572075724601746, 0.0003368183970451355, 0.00034791603684425354, 0.0003590136766433716, 0.0003701113164424896, 0.00038120895624160767, 0.0003923065960407257, 0.00040340423583984375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 5.0, 13.0, 8.0, 8.0, 17.0, 16.0, 26.0, 40.0, 56.0, 99.0, 134.0, 232.0, 384.0, 697.0, 1377.0, 2729.0, 6797.0, 22078.0, 113121.0, 531355.0, 299376.0, 49082.0, 12059.0, 4458.0, 1978.0, 1026.0, 557.0, 283.0, 182.0, 100.0, 72.0, 51.0, 35.0, 17.0, 18.0, 11.0, 10.0, 7.0, 8.0, 9.0, 5.0, 5.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.28125, -2.21368408203125, -2.1461181640625, -2.07855224609375, -2.010986328125, -1.94342041015625, -1.8758544921875, -1.80828857421875, -1.74072265625, -1.67315673828125, -1.6055908203125, -1.53802490234375, -1.470458984375, -1.40289306640625, -1.3353271484375, -1.26776123046875, -1.2001953125, -1.13262939453125, -1.0650634765625, -0.99749755859375, -0.929931640625, -0.86236572265625, -0.7947998046875, -0.72723388671875, -0.65966796875, -0.59210205078125, -0.5245361328125, -0.45697021484375, -0.389404296875, -0.32183837890625, -0.2542724609375, -0.18670654296875, -0.119140625, -0.05157470703125, 0.0159912109375, 0.08355712890625, 0.151123046875, 0.21868896484375, 0.2862548828125, 0.35382080078125, 0.42138671875, 0.48895263671875, 0.5565185546875, 0.62408447265625, 0.691650390625, 0.75921630859375, 0.8267822265625, 0.89434814453125, 0.9619140625, 1.02947998046875, 1.0970458984375, 1.16461181640625, 1.232177734375, 1.29974365234375, 1.3673095703125, 1.43487548828125, 1.50244140625, 1.57000732421875, 1.6375732421875, 1.70513916015625, 1.772705078125, 1.84027099609375, 1.9078369140625, 1.97540283203125, 2.04296875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 7.0, 7.0, 19.0, 13.0, 15.0, 36.0, 74.0, 79.0, 135.0, 137.0, 131.0, 109.0, 92.0, 50.0, 31.0, 22.0, 11.0, 7.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.55859375, -2.47613525390625, -2.3936767578125, -2.31121826171875, -2.228759765625, -2.14630126953125, -2.0638427734375, -1.98138427734375, -1.89892578125, -1.81646728515625, -1.7340087890625, -1.65155029296875, -1.569091796875, -1.48663330078125, -1.4041748046875, -1.32171630859375, -1.2392578125, -1.15679931640625, -1.0743408203125, -0.99188232421875, -0.909423828125, -0.82696533203125, -0.7445068359375, -0.66204833984375, -0.57958984375, -0.49713134765625, -0.4146728515625, -0.33221435546875, -0.249755859375, -0.16729736328125, -0.0848388671875, -0.00238037109375, 0.080078125, 0.16253662109375, 0.2449951171875, 0.32745361328125, 0.409912109375, 0.49237060546875, 0.5748291015625, 0.65728759765625, 0.73974609375, 0.82220458984375, 0.9046630859375, 0.98712158203125, 1.069580078125, 1.15203857421875, 1.2344970703125, 1.31695556640625, 1.3994140625, 1.48187255859375, 1.5643310546875, 1.64678955078125, 1.729248046875, 1.81170654296875, 1.8941650390625, 1.97662353515625, 2.05908203125, 2.14154052734375, 2.2239990234375, 2.30645751953125, 2.388916015625, 2.47137451171875, 2.5538330078125, 2.63629150390625, 2.71875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 9.0, 9.0, 20.0, 23.0, 31.0, 35.0, 60.0, 59.0, 92.0, 96.0, 101.0, 92.0, 80.0, 77.0, 61.0, 43.0, 34.0, 24.0, 21.0, 9.0, 3.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.63901710510254, -22.070018768310547, -21.501020431518555, -20.932022094726562, -20.363025665283203, -19.79402732849121, -19.22502899169922, -18.656030654907227, -18.087032318115234, -17.518033981323242, -16.94903564453125, -16.38003921508789, -15.811039924621582, -15.242042541503906, -14.673044204711914, -14.104045867919922, -13.535048484802246, -12.966050148010254, -12.397052764892578, -11.828054428100586, -11.259056091308594, -10.690057754516602, -10.121060371398926, -9.552062034606934, -8.983064651489258, -8.414066314697266, -7.845068454742432, -7.276070594787598, -6.7070722579956055, -6.1380743980407715, -5.5690765380859375, -5.000078201293945, -4.431078910827637, -3.8620808124542236, -3.2930827140808105, -2.7240848541259766, -2.1550867557525635, -1.5860886573791504, -1.0170907974243164, -0.4480926990509033, 0.12090539932250977, 0.6899034380912781, 1.2589014768600464, 1.82789945602417, 2.396897554397583, 2.965895652770996, 3.53489351272583, 4.103891372680664, 4.672889709472656, 5.24188756942749, 5.810885906219482, 6.379883766174316, 6.948882102966309, 7.517879962921143, 8.086877822875977, 8.655876159667969, 9.224874496459961, 9.793872833251953, 10.362870216369629, 10.931868553161621, 11.500866889953613, 12.069864273071289, 12.638862609863281, 13.207860946655273, 13.77685832977295]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 10.0, 3.0, 10.0, 12.0, 11.0, 15.0, 16.0, 25.0, 13.0, 29.0, 32.0, 28.0, 36.0, 47.0, 50.0, 39.0, 50.0, 56.0, 43.0, 47.0, 55.0, 57.0, 38.0, 38.0, 34.0, 27.0, 32.0, 20.0, 29.0, 19.0, 15.0, 16.0, 9.0, 6.0, 12.0, 8.0, 9.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.48953628540039, -19.90407943725586, -19.31862449645996, -18.73316764831543, -18.1477108001709, -17.562255859375, -16.97679901123047, -16.391342163085938, -15.805886268615723, -15.220430374145508, -14.634973526000977, -14.049517631530762, -13.464061737060547, -12.878604888916016, -12.2931489944458, -11.707693099975586, -11.122236251831055, -10.53678035736084, -9.951323509216309, -9.365867614746094, -8.780410766601562, -8.194954872131348, -7.609498977661133, -7.02404260635376, -6.438586235046387, -5.853129863739014, -5.267673492431641, -4.682217597961426, -4.096761226654053, -3.5113048553466797, -2.9258487224578857, -2.340392589569092, -1.7549381256103516, -1.169481873512268, -0.5840256214141846, 0.0014306306838989258, 0.5868868827819824, 1.1723432540893555, 1.7577993869781494, 2.3432555198669434, 2.9287118911743164, 3.5141682624816895, 4.0996246337890625, 4.685080528259277, 5.27053689956665, 5.855993270874023, 6.441449165344238, 7.026905536651611, 7.612361907958984, 8.1978178024292, 8.78327465057373, 9.368730545043945, 9.954187393188477, 10.539643287658691, 11.125099182128906, 11.710556030273438, 12.296011924743652, 12.881467819213867, 13.466924667358398, 14.052380561828613, 14.637836456298828, 15.22329330444336, 15.808749198913574, 16.39420509338379, 16.97966194152832]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 7.0, 17.0, 18.0, 42.0, 62.0, 121.0, 192.0, 361.0, 789.0, 2167.0, 7361.0, 39807.0, 843745.0, 3226659.0, 59061.0, 9404.0, 2555.0, 976.0, 412.0, 203.0, 110.0, 72.0, 52.0, 30.0, 17.0, 10.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.375, -5.240936279296875, -5.10687255859375, -4.972808837890625, -4.8387451171875, -4.704681396484375, -4.57061767578125, -4.436553955078125, -4.302490234375, -4.168426513671875, -4.03436279296875, -3.900299072265625, -3.7662353515625, -3.632171630859375, -3.49810791015625, -3.364044189453125, -3.22998046875, -3.095916748046875, -2.96185302734375, -2.827789306640625, -2.6937255859375, -2.559661865234375, -2.42559814453125, -2.291534423828125, -2.157470703125, -2.023406982421875, -1.88934326171875, -1.755279541015625, -1.6212158203125, -1.487152099609375, -1.35308837890625, -1.219024658203125, -1.0849609375, -0.950897216796875, -0.81683349609375, -0.682769775390625, -0.5487060546875, -0.414642333984375, -0.28057861328125, -0.146514892578125, -0.012451171875, 0.121612548828125, 0.25567626953125, 0.389739990234375, 0.5238037109375, 0.657867431640625, 0.79193115234375, 0.925994873046875, 1.06005859375, 1.194122314453125, 1.32818603515625, 1.462249755859375, 1.5963134765625, 1.730377197265625, 1.86444091796875, 1.998504638671875, 2.132568359375, 2.266632080078125, 2.40069580078125, 2.534759521484375, 2.6688232421875, 2.802886962890625, 2.93695068359375, 3.071014404296875, 3.205078125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 3.0, 15.0, 14.0, 22.0, 23.0, 40.0, 34.0, 42.0, 57.0, 79.0, 80.0, 72.0, 92.0, 72.0, 69.0, 76.0, 48.0, 40.0, 31.0, 25.0, 19.0, 12.0, 10.0, 5.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1201171875, -1.0861663818359375, -1.052215576171875, -1.0182647705078125, -0.98431396484375, -0.9503631591796875, -0.916412353515625, -0.8824615478515625, -0.8485107421875, -0.8145599365234375, -0.780609130859375, -0.7466583251953125, -0.71270751953125, -0.6787567138671875, -0.644805908203125, -0.6108551025390625, -0.576904296875, -0.5429534912109375, -0.509002685546875, -0.4750518798828125, -0.44110107421875, -0.4071502685546875, -0.373199462890625, -0.3392486572265625, -0.3052978515625, -0.2713470458984375, -0.237396240234375, -0.2034454345703125, -0.16949462890625, -0.1355438232421875, -0.101593017578125, -0.0676422119140625, -0.03369140625, 0.0002593994140625, 0.034210205078125, 0.0681610107421875, 0.10211181640625, 0.1360626220703125, 0.170013427734375, 0.2039642333984375, 0.2379150390625, 0.2718658447265625, 0.305816650390625, 0.3397674560546875, 0.37371826171875, 0.4076690673828125, 0.441619873046875, 0.4755706787109375, 0.509521484375, 0.5434722900390625, 0.577423095703125, 0.6113739013671875, 0.64532470703125, 0.6792755126953125, 0.713226318359375, 0.7471771240234375, 0.7811279296875, 0.8150787353515625, 0.849029541015625, 0.8829803466796875, 0.91693115234375, 0.9508819580078125, 0.984832763671875, 1.0187835693359375, 1.052734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 8.0, 7.0, 9.0, 15.0, 29.0, 53.0, 89.0, 118.0, 221.0, 434.0, 966.0, 2095.0, 5918.0, 22076.0, 105900.0, 1160303.0, 2692757.0, 160610.0, 30168.0, 7835.0, 2520.0, 1015.0, 470.0, 268.0, 162.0, 85.0, 54.0, 41.0, 20.0, 10.0, 8.0, 5.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.19921875, -3.105438232421875, -3.01165771484375, -2.917877197265625, -2.8240966796875, -2.730316162109375, -2.63653564453125, -2.542755126953125, -2.448974609375, -2.355194091796875, -2.26141357421875, -2.167633056640625, -2.0738525390625, -1.980072021484375, -1.88629150390625, -1.792510986328125, -1.69873046875, -1.604949951171875, -1.51116943359375, -1.417388916015625, -1.3236083984375, -1.229827880859375, -1.13604736328125, -1.042266845703125, -0.948486328125, -0.854705810546875, -0.76092529296875, -0.667144775390625, -0.5733642578125, -0.479583740234375, -0.38580322265625, -0.292022705078125, -0.1982421875, -0.104461669921875, -0.01068115234375, 0.083099365234375, 0.1768798828125, 0.270660400390625, 0.36444091796875, 0.458221435546875, 0.552001953125, 0.645782470703125, 0.73956298828125, 0.833343505859375, 0.9271240234375, 1.020904541015625, 1.11468505859375, 1.208465576171875, 1.30224609375, 1.396026611328125, 1.48980712890625, 1.583587646484375, 1.6773681640625, 1.771148681640625, 1.86492919921875, 1.958709716796875, 2.052490234375, 2.146270751953125, 2.24005126953125, 2.333831787109375, 2.4276123046875, 2.521392822265625, 2.61517333984375, 2.708953857421875, 2.802734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 6.0, 21.0, 20.0, 30.0, 43.0, 68.0, 138.0, 271.0, 749.0, 1608.0, 588.0, 235.0, 114.0, 70.0, 40.0, 24.0, 12.0, 5.0, 8.0, 7.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.587890625, -1.541717529296875, -1.49554443359375, -1.449371337890625, -1.4031982421875, -1.357025146484375, -1.31085205078125, -1.264678955078125, -1.218505859375, -1.172332763671875, -1.12615966796875, -1.079986572265625, -1.0338134765625, -0.987640380859375, -0.94146728515625, -0.895294189453125, -0.84912109375, -0.802947998046875, -0.75677490234375, -0.710601806640625, -0.6644287109375, -0.618255615234375, -0.57208251953125, -0.525909423828125, -0.479736328125, -0.433563232421875, -0.38739013671875, -0.341217041015625, -0.2950439453125, -0.248870849609375, -0.20269775390625, -0.156524658203125, -0.1103515625, -0.064178466796875, -0.01800537109375, 0.028167724609375, 0.0743408203125, 0.120513916015625, 0.16668701171875, 0.212860107421875, 0.259033203125, 0.305206298828125, 0.35137939453125, 0.397552490234375, 0.4437255859375, 0.489898681640625, 0.53607177734375, 0.582244873046875, 0.62841796875, 0.674591064453125, 0.72076416015625, 0.766937255859375, 0.8131103515625, 0.859283447265625, 0.90545654296875, 0.951629638671875, 0.997802734375, 1.043975830078125, 1.09014892578125, 1.136322021484375, 1.1824951171875, 1.228668212890625, 1.27484130859375, 1.321014404296875, 1.3671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 6.0, 1.0, 6.0, 22.0, 53.0, 117.0, 189.0, 209.0, 170.0, 126.0, 60.0, 27.0, 15.0, 7.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-19.304763793945312, -18.916412353515625, -18.52806282043457, -18.139711380004883, -17.751359939575195, -17.36301040649414, -16.974658966064453, -16.586307525634766, -16.19795799255371, -15.80960750579834, -15.421256065368652, -15.032905578613281, -14.64455509185791, -14.256204605102539, -13.867853164672852, -13.47950267791748, -13.091151237487793, -12.702800750732422, -12.314449310302734, -11.926098823547363, -11.537748336791992, -11.149396896362305, -10.761046409606934, -10.372695922851562, -9.984344482421875, -9.595993995666504, -9.207642555236816, -8.819292068481445, -8.430941581726074, -8.042591094970703, -7.654239654541016, -7.2658891677856445, -6.877537727355957, -6.489186763763428, -6.100836277008057, -5.712485313415527, -5.324134826660156, -4.935783863067627, -4.547432899475098, -4.159082412719727, -3.7707314491271973, -3.382380723953247, -2.994029998779297, -2.6056790351867676, -2.2173283100128174, -1.8289775848388672, -1.440626621246338, -1.0522758960723877, -0.6639251708984375, -0.27557438611984253, 0.11277639865875244, 0.5011272430419922, 0.8894779682159424, 1.2778286933898926, 1.6661796569824219, 2.054530382156372, 2.4428811073303223, 2.8312318325042725, 3.2195825576782227, 3.607933521270752, 3.996284246444702, 4.384634971618652, 4.772985935211182, 5.161336898803711, 5.549687385559082]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 6.0, 5.0, 7.0, 15.0, 7.0, 17.0, 10.0, 22.0, 25.0, 24.0, 26.0, 40.0, 32.0, 32.0, 41.0, 42.0, 33.0, 52.0, 35.0, 40.0, 35.0, 44.0, 28.0, 31.0, 39.0, 44.0, 25.0, 28.0, 35.0, 33.0, 26.0, 17.0, 16.0, 19.0, 13.0, 12.0, 11.0, 5.0, 5.0, 1.0, 5.0, 2.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3657758235931396, -3.251232862472534, -3.1366899013519287, -3.022146701812744, -2.9076037406921387, -2.793060779571533, -2.6785178184509277, -2.5639748573303223, -2.449431896209717, -2.3348889350891113, -2.220345973968506, -2.1058030128479004, -1.9912599325180054, -1.8767168521881104, -1.7621738910675049, -1.6476309299468994, -1.5330878496170044, -1.418544888496399, -1.304001808166504, -1.1894588470458984, -1.074915885925293, -0.9603728652000427, -0.8458298444747925, -0.731286883354187, -0.6167438626289368, -0.5022008419036865, -0.38765788078308105, -0.2731148600578308, -0.15857186913490295, -0.0440288782119751, 0.07051414251327515, 0.18505710363388062, 0.29960012435913086, 0.4141431152820587, 0.5286861062049866, 0.6432291269302368, 0.7577720880508423, 0.8723151087760925, 0.9868581295013428, 1.1014010906219482, 1.2159440517425537, 1.3304870128631592, 1.4450300931930542, 1.5595730543136597, 1.6741160154342651, 1.7886590957641602, 1.9032020568847656, 2.017745018005371, 2.1322879791259766, 2.246830940246582, 2.3613739013671875, 2.475916862487793, 2.5904600620269775, 2.705003023147583, 2.8195459842681885, 2.934088945388794, 3.0486321449279785, 3.163175106048584, 3.2777180671691895, 3.392261028289795, 3.5068042278289795, 3.621347188949585, 3.7358901500701904, 3.850433111190796, 3.9649760723114014]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 6.0, 6.0, 14.0, 14.0, 33.0, 42.0, 68.0, 147.0, 245.0, 461.0, 897.0, 2080.0, 4864.0, 12326.0, 34863.0, 106403.0, 290242.0, 359559.0, 155552.0, 51501.0, 17476.0, 6465.0, 2699.0, 1250.0, 627.0, 307.0, 170.0, 99.0, 61.0, 26.0, 22.0, 14.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.794921875, -2.688140869140625, -2.58135986328125, -2.474578857421875, -2.3677978515625, -2.261016845703125, -2.15423583984375, -2.047454833984375, -1.940673828125, -1.833892822265625, -1.72711181640625, -1.620330810546875, -1.5135498046875, -1.406768798828125, -1.29998779296875, -1.193206787109375, -1.08642578125, -0.979644775390625, -0.87286376953125, -0.766082763671875, -0.6593017578125, -0.552520751953125, -0.44573974609375, -0.338958740234375, -0.232177734375, -0.125396728515625, -0.01861572265625, 0.088165283203125, 0.1949462890625, 0.301727294921875, 0.40850830078125, 0.515289306640625, 0.6220703125, 0.728851318359375, 0.83563232421875, 0.942413330078125, 1.0491943359375, 1.155975341796875, 1.26275634765625, 1.369537353515625, 1.476318359375, 1.583099365234375, 1.68988037109375, 1.796661376953125, 1.9034423828125, 2.010223388671875, 2.11700439453125, 2.223785400390625, 2.33056640625, 2.437347412109375, 2.54412841796875, 2.650909423828125, 2.7576904296875, 2.864471435546875, 2.97125244140625, 3.078033447265625, 3.184814453125, 3.291595458984375, 3.39837646484375, 3.505157470703125, 3.6119384765625, 3.718719482421875, 3.82550048828125, 3.932281494140625, 4.0390625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 4.0, 10.0, 14.0, 24.0, 15.0, 30.0, 27.0, 36.0, 43.0, 51.0, 68.0, 69.0, 72.0, 65.0, 92.0, 69.0, 55.0, 64.0, 37.0, 40.0, 26.0, 24.0, 14.0, 16.0, 9.0, 9.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.009765625, -0.9784698486328125, -0.947174072265625, -0.9158782958984375, -0.88458251953125, -0.8532867431640625, -0.821990966796875, -0.7906951904296875, -0.7593994140625, -0.7281036376953125, -0.696807861328125, -0.6655120849609375, -0.63421630859375, -0.6029205322265625, -0.571624755859375, -0.5403289794921875, -0.509033203125, -0.4777374267578125, -0.446441650390625, -0.4151458740234375, -0.38385009765625, -0.3525543212890625, -0.321258544921875, -0.2899627685546875, -0.2586669921875, -0.2273712158203125, -0.196075439453125, -0.1647796630859375, -0.13348388671875, -0.1021881103515625, -0.070892333984375, -0.0395965576171875, -0.00830078125, 0.0229949951171875, 0.054290771484375, 0.0855865478515625, 0.11688232421875, 0.1481781005859375, 0.179473876953125, 0.2107696533203125, 0.2420654296875, 0.2733612060546875, 0.304656982421875, 0.3359527587890625, 0.36724853515625, 0.3985443115234375, 0.429840087890625, 0.4611358642578125, 0.492431640625, 0.5237274169921875, 0.555023193359375, 0.5863189697265625, 0.61761474609375, 0.6489105224609375, 0.680206298828125, 0.7115020751953125, 0.7427978515625, 0.7740936279296875, 0.805389404296875, 0.8366851806640625, 0.86798095703125, 0.8992767333984375, 0.930572509765625, 0.9618682861328125, 0.9931640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 6.0, 13.0, 11.0, 15.0, 18.0, 32.0, 33.0, 58.0, 85.0, 120.0, 133.0, 202.0, 306.0, 446.0, 751.0, 1385.0, 3704.0, 17399.0, 111360.0, 483566.0, 349828.0, 63032.0, 10241.0, 2661.0, 1151.0, 641.0, 466.0, 236.0, 208.0, 137.0, 96.0, 67.0, 39.0, 32.0, 25.0, 14.0, 9.0, 8.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.54296875, -4.4046630859375, -4.266357421875, -4.1280517578125, -3.98974609375, -3.8514404296875, -3.713134765625, -3.5748291015625, -3.4365234375, -3.2982177734375, -3.159912109375, -3.0216064453125, -2.88330078125, -2.7449951171875, -2.606689453125, -2.4683837890625, -2.330078125, -2.1917724609375, -2.053466796875, -1.9151611328125, -1.77685546875, -1.6385498046875, -1.500244140625, -1.3619384765625, -1.2236328125, -1.0853271484375, -0.947021484375, -0.8087158203125, -0.67041015625, -0.5321044921875, -0.393798828125, -0.2554931640625, -0.1171875, 0.0211181640625, 0.159423828125, 0.2977294921875, 0.43603515625, 0.5743408203125, 0.712646484375, 0.8509521484375, 0.9892578125, 1.1275634765625, 1.265869140625, 1.4041748046875, 1.54248046875, 1.6807861328125, 1.819091796875, 1.9573974609375, 2.095703125, 2.2340087890625, 2.372314453125, 2.5106201171875, 2.64892578125, 2.7872314453125, 2.925537109375, 3.0638427734375, 3.2021484375, 3.3404541015625, 3.478759765625, 3.6170654296875, 3.75537109375, 3.8936767578125, 4.031982421875, 4.1702880859375, 4.30859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 4.0, 11.0, 7.0, 10.0, 18.0, 21.0, 22.0, 22.0, 19.0, 40.0, 30.0, 31.0, 27.0, 36.0, 50.0, 38.0, 54.0, 44.0, 50.0, 39.0, 51.0, 40.0, 34.0, 32.0, 34.0, 36.0, 26.0, 23.0, 22.0, 20.0, 19.0, 20.0, 14.0, 9.0, 10.0, 7.0, 8.0, 7.0, 6.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.76953125, -2.66717529296875, -2.5648193359375, -2.46246337890625, -2.360107421875, -2.25775146484375, -2.1553955078125, -2.05303955078125, -1.95068359375, -1.84832763671875, -1.7459716796875, -1.64361572265625, -1.541259765625, -1.43890380859375, -1.3365478515625, -1.23419189453125, -1.1318359375, -1.02947998046875, -0.9271240234375, -0.82476806640625, -0.722412109375, -0.62005615234375, -0.5177001953125, -0.41534423828125, -0.31298828125, -0.21063232421875, -0.1082763671875, -0.00592041015625, 0.096435546875, 0.19879150390625, 0.3011474609375, 0.40350341796875, 0.505859375, 0.60821533203125, 0.7105712890625, 0.81292724609375, 0.915283203125, 1.01763916015625, 1.1199951171875, 1.22235107421875, 1.32470703125, 1.42706298828125, 1.5294189453125, 1.63177490234375, 1.734130859375, 1.83648681640625, 1.9388427734375, 2.04119873046875, 2.1435546875, 2.24591064453125, 2.3482666015625, 2.45062255859375, 2.552978515625, 2.65533447265625, 2.7576904296875, 2.86004638671875, 2.96240234375, 3.06475830078125, 3.1671142578125, 3.26947021484375, 3.371826171875, 3.47418212890625, 3.5765380859375, 3.67889404296875, 3.78125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 10.0, 7.0, 18.0, 16.0, 30.0, 39.0, 59.0, 92.0, 109.0, 191.0, 230.0, 412.0, 729.0, 1175.0, 2275.0, 4371.0, 9589.0, 23169.0, 67411.0, 251265.0, 454159.0, 156381.0, 45129.0, 16705.0, 7060.0, 3461.0, 1801.0, 956.0, 636.0, 360.0, 212.0, 155.0, 96.0, 79.0, 48.0, 29.0, 18.0, 24.0, 13.0, 11.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0], "bins": [-1.9677734375, -1.9104461669921875, -1.853118896484375, -1.7957916259765625, -1.73846435546875, -1.6811370849609375, -1.623809814453125, -1.5664825439453125, -1.5091552734375, -1.4518280029296875, -1.394500732421875, -1.3371734619140625, -1.27984619140625, -1.2225189208984375, -1.165191650390625, -1.1078643798828125, -1.050537109375, -0.9932098388671875, -0.935882568359375, -0.8785552978515625, -0.82122802734375, -0.7639007568359375, -0.706573486328125, -0.6492462158203125, -0.5919189453125, -0.5345916748046875, -0.477264404296875, -0.4199371337890625, -0.36260986328125, -0.3052825927734375, -0.247955322265625, -0.1906280517578125, -0.13330078125, -0.0759735107421875, -0.018646240234375, 0.0386810302734375, 0.09600830078125, 0.1533355712890625, 0.210662841796875, 0.2679901123046875, 0.3253173828125, 0.3826446533203125, 0.439971923828125, 0.4972991943359375, 0.55462646484375, 0.6119537353515625, 0.669281005859375, 0.7266082763671875, 0.783935546875, 0.8412628173828125, 0.898590087890625, 0.9559173583984375, 1.01324462890625, 1.0705718994140625, 1.127899169921875, 1.1852264404296875, 1.2425537109375, 1.2998809814453125, 1.357208251953125, 1.4145355224609375, 1.47186279296875, 1.5291900634765625, 1.586517333984375, 1.6438446044921875, 1.701171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 0.0, 7.0, 7.0, 7.0, 13.0, 21.0, 22.0, 25.0, 27.0, 27.0, 53.0, 55.0, 64.0, 87.0, 139.0, 108.0, 94.0, 63.0, 42.0, 32.0, 19.0, 25.0, 13.0, 16.0, 8.0, 7.0, 7.0, 3.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003867149353027344, -0.0003727376461029053, -0.00035876035690307617, -0.00034478306770324707, -0.00033080577850341797, -0.00031682848930358887, -0.00030285120010375977, -0.00028887391090393066, -0.00027489662170410156, -0.00026091933250427246, -0.00024694204330444336, -0.00023296475410461426, -0.00021898746490478516, -0.00020501017570495605, -0.00019103288650512695, -0.00017705559730529785, -0.00016307830810546875, -0.00014910101890563965, -0.00013512372970581055, -0.00012114644050598145, -0.00010716915130615234, -9.319186210632324e-05, -7.921457290649414e-05, -6.523728370666504e-05, -5.125999450683594e-05, -3.7282705307006836e-05, -2.3305416107177734e-05, -9.328126907348633e-06, 4.649162292480469e-06, 1.862645149230957e-05, 3.260374069213867e-05, 4.6581029891967773e-05, 6.0558319091796875e-05, 7.453560829162598e-05, 8.851289749145508e-05, 0.00010249018669128418, 0.00011646747589111328, 0.00013044476509094238, 0.00014442205429077148, 0.00015839934349060059, 0.0001723766326904297, 0.0001863539218902588, 0.0002003312110900879, 0.000214308500289917, 0.0002282857894897461, 0.0002422630786895752, 0.0002562403678894043, 0.0002702176570892334, 0.0002841949462890625, 0.0002981722354888916, 0.0003121495246887207, 0.0003261268138885498, 0.0003401041030883789, 0.000354081392288208, 0.0003680586814880371, 0.0003820359706878662, 0.0003960132598876953, 0.0004099905490875244, 0.0004239678382873535, 0.0004379451274871826, 0.0004519224166870117, 0.0004658997058868408, 0.0004798769950866699, 0.000493854284286499, 0.0005078315734863281]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 9.0, 9.0, 11.0, 16.0, 16.0, 30.0, 45.0, 71.0, 97.0, 163.0, 330.0, 601.0, 1560.0, 5542.0, 34045.0, 448174.0, 510955.0, 37559.0, 6191.0, 1633.0, 627.0, 339.0, 203.0, 126.0, 68.0, 43.0, 30.0, 22.0, 15.0, 3.0, 8.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.421875, -4.29913330078125, -4.1763916015625, -4.05364990234375, -3.930908203125, -3.80816650390625, -3.6854248046875, -3.56268310546875, -3.43994140625, -3.31719970703125, -3.1944580078125, -3.07171630859375, -2.948974609375, -2.82623291015625, -2.7034912109375, -2.58074951171875, -2.4580078125, -2.33526611328125, -2.2125244140625, -2.08978271484375, -1.967041015625, -1.84429931640625, -1.7215576171875, -1.59881591796875, -1.47607421875, -1.35333251953125, -1.2305908203125, -1.10784912109375, -0.985107421875, -0.86236572265625, -0.7396240234375, -0.61688232421875, -0.494140625, -0.37139892578125, -0.2486572265625, -0.12591552734375, -0.003173828125, 0.11956787109375, 0.2423095703125, 0.36505126953125, 0.48779296875, 0.61053466796875, 0.7332763671875, 0.85601806640625, 0.978759765625, 1.10150146484375, 1.2242431640625, 1.34698486328125, 1.4697265625, 1.59246826171875, 1.7152099609375, 1.83795166015625, 1.960693359375, 2.08343505859375, 2.2061767578125, 2.32891845703125, 2.45166015625, 2.57440185546875, 2.6971435546875, 2.81988525390625, 2.942626953125, 3.06536865234375, 3.1881103515625, 3.31085205078125, 3.43359375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 8.0, 11.0, 13.0, 18.0, 13.0, 15.0, 31.0, 53.0, 65.0, 72.0, 75.0, 121.0, 119.0, 106.0, 62.0, 49.0, 31.0, 15.0, 18.0, 21.0, 11.0, 12.0, 12.0, 8.0, 7.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.955078125, -1.893157958984375, -1.83123779296875, -1.769317626953125, -1.7073974609375, -1.645477294921875, -1.58355712890625, -1.521636962890625, -1.459716796875, -1.397796630859375, -1.33587646484375, -1.273956298828125, -1.2120361328125, -1.150115966796875, -1.08819580078125, -1.026275634765625, -0.96435546875, -0.902435302734375, -0.84051513671875, -0.778594970703125, -0.7166748046875, -0.654754638671875, -0.59283447265625, -0.530914306640625, -0.468994140625, -0.407073974609375, -0.34515380859375, -0.283233642578125, -0.2213134765625, -0.159393310546875, -0.09747314453125, -0.035552978515625, 0.0263671875, 0.088287353515625, 0.15020751953125, 0.212127685546875, 0.2740478515625, 0.335968017578125, 0.39788818359375, 0.459808349609375, 0.521728515625, 0.583648681640625, 0.64556884765625, 0.707489013671875, 0.7694091796875, 0.831329345703125, 0.89324951171875, 0.955169677734375, 1.01708984375, 1.079010009765625, 1.14093017578125, 1.202850341796875, 1.2647705078125, 1.326690673828125, 1.38861083984375, 1.450531005859375, 1.512451171875, 1.574371337890625, 1.63629150390625, 1.698211669921875, 1.7601318359375, 1.822052001953125, 1.88397216796875, 1.945892333984375, 2.0078125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 10.0, 10.0, 13.0, 60.0, 107.0, 163.0, 189.0, 165.0, 146.0, 68.0, 37.0, 15.0, 4.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-44.157501220703125, -43.02091598510742, -41.88433074951172, -40.74774169921875, -39.61115646362305, -38.474571228027344, -37.337982177734375, -36.20139694213867, -35.06481170654297, -33.928226470947266, -32.79164123535156, -31.655052185058594, -30.51846694946289, -29.381881713867188, -28.24529457092285, -27.108707427978516, -25.972122192382812, -24.83553695678711, -23.698949813842773, -22.562362670898438, -21.425777435302734, -20.28919219970703, -19.152605056762695, -18.01601791381836, -16.879432678222656, -15.742846488952637, -14.606260299682617, -13.469674110412598, -12.333087921142578, -11.196501731872559, -10.059915542602539, -8.92332935333252, -7.786739349365234, -6.650153160095215, -5.513566970825195, -4.376980781555176, -3.2403945922851562, -2.1038084030151367, -0.9672222137451172, 0.16936397552490234, 1.3059501647949219, 2.4425363540649414, 3.579122543334961, 4.7157087326049805, 5.852294921875, 6.9888811111450195, 8.125467300415039, 9.262053489685059, 10.398639678955078, 11.535225868225098, 12.671812057495117, 13.808398246765137, 14.944984436035156, 16.08156967163086, 17.218156814575195, 18.35474395751953, 19.491329193115234, 20.627914428710938, 21.764501571655273, 22.90108871459961, 24.037673950195312, 25.174259185791016, 26.31084632873535, 27.447433471679688, 28.58401870727539]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 6.0, 9.0, 6.0, 7.0, 5.0, 13.0, 10.0, 15.0, 26.0, 26.0, 28.0, 31.0, 39.0, 33.0, 33.0, 38.0, 46.0, 44.0, 58.0, 48.0, 58.0, 45.0, 39.0, 49.0, 48.0, 47.0, 26.0, 29.0, 26.0, 18.0, 23.0, 11.0, 14.0, 12.0, 9.0, 6.0, 9.0, 3.0, 9.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.459728240966797, -17.80902671813965, -17.1583251953125, -16.50762367248535, -15.856922149658203, -15.206220626831055, -14.555520057678223, -13.904818534851074, -13.254117012023926, -12.603415489196777, -11.952713966369629, -11.30201244354248, -10.651311874389648, -10.0006103515625, -9.349908828735352, -8.699207305908203, -8.048505783081055, -7.397804260253906, -6.747102737426758, -6.096401691436768, -5.445700168609619, -4.794998645782471, -4.1442975997924805, -3.493596076965332, -2.8428945541381836, -2.192193031311035, -1.5414917469024658, -0.8907903432846069, -0.24008893966674805, 0.4106125831604004, 1.0613138675689697, 1.712015151977539, 2.3627166748046875, 3.013418197631836, 3.6641194820404053, 4.314820766448975, 4.965522289276123, 5.6162238121032715, 6.266924858093262, 6.91762638092041, 7.568327903747559, 8.219029426574707, 8.869730949401855, 9.520432472229004, 10.171133041381836, 10.821834564208984, 11.472536087036133, 12.123237609863281, 12.77393913269043, 13.424640655517578, 14.075342178344727, 14.726043701171875, 15.376745223999023, 16.027446746826172, 16.67814826965332, 17.32884979248047, 17.979549407958984, 18.630250930786133, 19.28095245361328, 19.93165397644043, 20.582355499267578, 21.233057022094727, 21.883758544921875, 22.53445816040039, 23.185161590576172]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 12.0, 12.0, 12.0, 27.0, 30.0, 62.0, 74.0, 129.0, 185.0, 414.0, 735.0, 1544.0, 3364.0, 8385.0, 25793.0, 109508.0, 2025343.0, 1869876.0, 108289.0, 25634.0, 8381.0, 3245.0, 1488.0, 695.0, 399.0, 206.0, 144.0, 92.0, 64.0, 40.0, 30.0, 24.0, 7.0, 7.0, 5.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.30078125, -2.218597412109375, -2.13641357421875, -2.054229736328125, -1.9720458984375, -1.889862060546875, -1.80767822265625, -1.725494384765625, -1.643310546875, -1.561126708984375, -1.47894287109375, -1.396759033203125, -1.3145751953125, -1.232391357421875, -1.15020751953125, -1.068023681640625, -0.98583984375, -0.903656005859375, -0.82147216796875, -0.739288330078125, -0.6571044921875, -0.574920654296875, -0.49273681640625, -0.410552978515625, -0.328369140625, -0.246185302734375, -0.16400146484375, -0.081817626953125, 0.0003662109375, 0.082550048828125, 0.16473388671875, 0.246917724609375, 0.3291015625, 0.411285400390625, 0.49346923828125, 0.575653076171875, 0.6578369140625, 0.740020751953125, 0.82220458984375, 0.904388427734375, 0.986572265625, 1.068756103515625, 1.15093994140625, 1.233123779296875, 1.3153076171875, 1.397491455078125, 1.47967529296875, 1.561859130859375, 1.64404296875, 1.726226806640625, 1.80841064453125, 1.890594482421875, 1.9727783203125, 2.054962158203125, 2.13714599609375, 2.219329833984375, 2.301513671875, 2.383697509765625, 2.46588134765625, 2.548065185546875, 2.6302490234375, 2.712432861328125, 2.79461669921875, 2.876800537109375, 2.958984375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 9.0, 9.0, 8.0, 16.0, 17.0, 31.0, 35.0, 35.0, 47.0, 42.0, 84.0, 72.0, 81.0, 61.0, 69.0, 64.0, 72.0, 57.0, 48.0, 38.0, 26.0, 24.0, 11.0, 19.0, 5.0, 3.0, 6.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1005859375, -1.0642242431640625, -1.027862548828125, -0.9915008544921875, -0.95513916015625, -0.9187774658203125, -0.882415771484375, -0.8460540771484375, -0.8096923828125, -0.7733306884765625, -0.736968994140625, -0.7006072998046875, -0.66424560546875, -0.6278839111328125, -0.591522216796875, -0.5551605224609375, -0.518798828125, -0.4824371337890625, -0.446075439453125, -0.4097137451171875, -0.37335205078125, -0.3369903564453125, -0.300628662109375, -0.2642669677734375, -0.2279052734375, -0.1915435791015625, -0.155181884765625, -0.1188201904296875, -0.08245849609375, -0.0460968017578125, -0.009735107421875, 0.0266265869140625, 0.06298828125, 0.0993499755859375, 0.135711669921875, 0.1720733642578125, 0.20843505859375, 0.2447967529296875, 0.281158447265625, 0.3175201416015625, 0.3538818359375, 0.3902435302734375, 0.426605224609375, 0.4629669189453125, 0.49932861328125, 0.5356903076171875, 0.572052001953125, 0.6084136962890625, 0.644775390625, 0.6811370849609375, 0.717498779296875, 0.7538604736328125, 0.79022216796875, 0.8265838623046875, 0.862945556640625, 0.8993072509765625, 0.9356689453125, 0.9720306396484375, 1.008392333984375, 1.0447540283203125, 1.08111572265625, 1.1174774169921875, 1.153839111328125, 1.1902008056640625, 1.2265625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 4.0, 9.0, 14.0, 27.0, 37.0, 77.0, 133.0, 248.0, 467.0, 1102.0, 2863.0, 7806.0, 23555.0, 91526.0, 662371.0, 3058711.0, 270620.0, 51488.0, 14866.0, 5005.0, 1860.0, 748.0, 363.0, 159.0, 92.0, 56.0, 31.0, 16.0, 14.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.009765625, -1.927093505859375, -1.84442138671875, -1.761749267578125, -1.6790771484375, -1.596405029296875, -1.51373291015625, -1.431060791015625, -1.348388671875, -1.265716552734375, -1.18304443359375, -1.100372314453125, -1.0177001953125, -0.935028076171875, -0.85235595703125, -0.769683837890625, -0.68701171875, -0.604339599609375, -0.52166748046875, -0.438995361328125, -0.3563232421875, -0.273651123046875, -0.19097900390625, -0.108306884765625, -0.025634765625, 0.057037353515625, 0.13970947265625, 0.222381591796875, 0.3050537109375, 0.387725830078125, 0.47039794921875, 0.553070068359375, 0.6357421875, 0.718414306640625, 0.80108642578125, 0.883758544921875, 0.9664306640625, 1.049102783203125, 1.13177490234375, 1.214447021484375, 1.297119140625, 1.379791259765625, 1.46246337890625, 1.545135498046875, 1.6278076171875, 1.710479736328125, 1.79315185546875, 1.875823974609375, 1.95849609375, 2.041168212890625, 2.12384033203125, 2.206512451171875, 2.2891845703125, 2.371856689453125, 2.45452880859375, 2.537200927734375, 2.619873046875, 2.702545166015625, 2.78521728515625, 2.867889404296875, 2.9505615234375, 3.033233642578125, 3.11590576171875, 3.198577880859375, 3.28125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 8.0, 13.0, 8.0, 17.0, 24.0, 23.0, 32.0, 56.0, 66.0, 162.0, 262.0, 646.0, 1311.0, 705.0, 302.0, 174.0, 84.0, 53.0, 41.0, 17.0, 18.0, 11.0, 11.0, 6.0, 6.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.28515625, -1.24017333984375, -1.1951904296875, -1.15020751953125, -1.105224609375, -1.06024169921875, -1.0152587890625, -0.97027587890625, -0.92529296875, -0.88031005859375, -0.8353271484375, -0.79034423828125, -0.745361328125, -0.70037841796875, -0.6553955078125, -0.61041259765625, -0.5654296875, -0.52044677734375, -0.4754638671875, -0.43048095703125, -0.385498046875, -0.34051513671875, -0.2955322265625, -0.25054931640625, -0.20556640625, -0.16058349609375, -0.1156005859375, -0.07061767578125, -0.025634765625, 0.01934814453125, 0.0643310546875, 0.10931396484375, 0.154296875, 0.19927978515625, 0.2442626953125, 0.28924560546875, 0.334228515625, 0.37921142578125, 0.4241943359375, 0.46917724609375, 0.51416015625, 0.55914306640625, 0.6041259765625, 0.64910888671875, 0.694091796875, 0.73907470703125, 0.7840576171875, 0.82904052734375, 0.8740234375, 0.91900634765625, 0.9639892578125, 1.00897216796875, 1.053955078125, 1.09893798828125, 1.1439208984375, 1.18890380859375, 1.23388671875, 1.27886962890625, 1.3238525390625, 1.36883544921875, 1.413818359375, 1.45880126953125, 1.5037841796875, 1.54876708984375, 1.59375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 13.0, 22.0, 41.0, 67.0, 87.0, 125.0, 113.0, 141.0, 116.0, 107.0, 57.0, 50.0, 19.0, 14.0, 8.0, 2.0, 2.0, 2.0, 0.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.740456581115723, -9.480880737304688, -9.221304893493652, -8.961729049682617, -8.702153205871582, -8.442577362060547, -8.183001518249512, -7.923425674438477, -7.663849830627441, -7.404273986816406, -7.144698143005371, -6.885122299194336, -6.625546455383301, -6.365970611572266, -6.1063947677612305, -5.846818923950195, -5.587242603302002, -5.327666759490967, -5.068090915679932, -4.8085150718688965, -4.548939228057861, -4.289363384246826, -4.029787063598633, -3.7702114582061768, -3.5106356143951416, -3.2510597705841064, -2.9914839267730713, -2.731907844543457, -2.472332000732422, -2.2127561569213867, -1.9531803131103516, -1.6936044692993164, -1.4340286254882812, -1.174452781677246, -0.9148768782615662, -0.6553009748458862, -0.3957251310348511, -0.13614928722381592, 0.12342667579650879, 0.38300251960754395, 0.6425783634185791, 0.9021542072296143, 1.1617300510406494, 1.4213060140609741, 1.6808818578720093, 1.9404577016830444, 2.200033664703369, 2.4596095085144043, 2.7191853523254395, 2.9787611961364746, 3.2383370399475098, 3.497912883758545, 3.75748872756958, 4.017064571380615, 4.276640892028809, 4.536216735839844, 4.795792579650879, 5.055368423461914, 5.314944267272949, 5.574520111083984, 5.8340959548950195, 6.093671798706055, 6.35324764251709, 6.612823486328125, 6.87239933013916]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 10.0, 5.0, 9.0, 5.0, 13.0, 17.0, 26.0, 24.0, 20.0, 21.0, 36.0, 38.0, 45.0, 49.0, 53.0, 53.0, 46.0, 42.0, 49.0, 55.0, 45.0, 34.0, 35.0, 38.0, 28.0, 42.0, 26.0, 18.0, 24.0, 17.0, 12.0, 11.0, 12.0, 14.0, 3.0, 9.0, 2.0, 2.0, 9.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.8537983894348145, -4.698648452758789, -4.5434980392456055, -4.38834810256958, -4.233198165893555, -4.078047752380371, -3.9228978157043457, -3.767747640609741, -3.6125974655151367, -3.4574472904205322, -3.3022971153259277, -3.1471471786499023, -2.991997003555298, -2.8368468284606934, -2.681696891784668, -2.5265467166900635, -2.371396541595459, -2.2162463665008545, -2.06109619140625, -1.9059462547302246, -1.7507960796356201, -1.5956459045410156, -1.4404958486557007, -1.2853457927703857, -1.1301956176757812, -0.9750455021858215, -0.8198953866958618, -0.6647452712059021, -0.5095951557159424, -0.35444504022598267, -0.19929492473602295, -0.04414486885070801, 0.11100530624389648, 0.2661554217338562, 0.4213055372238159, 0.5764556527137756, 0.7316057682037354, 0.8867558836936951, 1.0419059991836548, 1.1970560550689697, 1.3522062301635742, 1.5073564052581787, 1.6625064611434937, 1.8176565170288086, 1.972806692123413, 2.1279568672180176, 2.283106803894043, 2.4382569789886475, 2.593407154083252, 2.7485573291778564, 2.903707504272461, 3.0588574409484863, 3.214007616043091, 3.3691577911376953, 3.5243077278137207, 3.679457902908325, 3.8346080780029297, 3.989758253097534, 4.144908428192139, 4.300058364868164, 4.455208778381348, 4.610358715057373, 4.765508651733398, 4.920659065246582, 5.075809001922607]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 8.0, 8.0, 23.0, 34.0, 38.0, 54.0, 108.0, 159.0, 213.0, 337.0, 526.0, 848.0, 1489.0, 2501.0, 4583.0, 8702.0, 18043.0, 37851.0, 91515.0, 273874.0, 370011.0, 136901.0, 52057.0, 23444.0, 11425.0, 5974.0, 3210.0, 1807.0, 1058.0, 625.0, 368.0, 240.0, 183.0, 97.0, 78.0, 50.0, 30.0, 16.0, 14.0, 13.0, 12.0, 9.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.484375, -2.40472412109375, -2.3250732421875, -2.24542236328125, -2.165771484375, -2.08612060546875, -2.0064697265625, -1.92681884765625, -1.84716796875, -1.76751708984375, -1.6878662109375, -1.60821533203125, -1.528564453125, -1.44891357421875, -1.3692626953125, -1.28961181640625, -1.2099609375, -1.13031005859375, -1.0506591796875, -0.97100830078125, -0.891357421875, -0.81170654296875, -0.7320556640625, -0.65240478515625, -0.57275390625, -0.49310302734375, -0.4134521484375, -0.33380126953125, -0.254150390625, -0.17449951171875, -0.0948486328125, -0.01519775390625, 0.064453125, 0.14410400390625, 0.2237548828125, 0.30340576171875, 0.383056640625, 0.46270751953125, 0.5423583984375, 0.62200927734375, 0.70166015625, 0.78131103515625, 0.8609619140625, 0.94061279296875, 1.020263671875, 1.09991455078125, 1.1795654296875, 1.25921630859375, 1.3388671875, 1.41851806640625, 1.4981689453125, 1.57781982421875, 1.657470703125, 1.73712158203125, 1.8167724609375, 1.89642333984375, 1.97607421875, 2.05572509765625, 2.1353759765625, 2.21502685546875, 2.294677734375, 2.37432861328125, 2.4539794921875, 2.53363037109375, 2.61328125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 2.0, 5.0, 13.0, 16.0, 15.0, 20.0, 25.0, 25.0, 29.0, 32.0, 50.0, 59.0, 54.0, 62.0, 73.0, 60.0, 60.0, 49.0, 56.0, 56.0, 50.0, 35.0, 36.0, 26.0, 21.0, 17.0, 14.0, 13.0, 6.0, 4.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.98388671875, -0.9525527954101562, -0.9212188720703125, -0.8898849487304688, -0.858551025390625, -0.8272171020507812, -0.7958831787109375, -0.7645492553710938, -0.73321533203125, -0.7018814086914062, -0.6705474853515625, -0.6392135620117188, -0.607879638671875, -0.5765457153320312, -0.5452117919921875, -0.5138778686523438, -0.4825439453125, -0.45121002197265625, -0.4198760986328125, -0.38854217529296875, -0.357208251953125, -0.32587432861328125, -0.2945404052734375, -0.26320648193359375, -0.23187255859375, -0.20053863525390625, -0.1692047119140625, -0.13787078857421875, -0.106536865234375, -0.07520294189453125, -0.0438690185546875, -0.01253509521484375, 0.018798828125, 0.05013275146484375, 0.0814666748046875, 0.11280059814453125, 0.144134521484375, 0.17546844482421875, 0.2068023681640625, 0.23813629150390625, 0.26947021484375, 0.30080413818359375, 0.3321380615234375, 0.36347198486328125, 0.394805908203125, 0.42613983154296875, 0.4574737548828125, 0.48880767822265625, 0.5201416015625, 0.5514755249023438, 0.5828094482421875, 0.6141433715820312, 0.645477294921875, 0.6768112182617188, 0.7081451416015625, 0.7394790649414062, 0.77081298828125, 0.8021469116210938, 0.8334808349609375, 0.8648147583007812, 0.896148681640625, 0.9274826049804688, 0.9588165283203125, 0.9901504516601562, 1.021484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 10.0, 9.0, 17.0, 17.0, 23.0, 26.0, 25.0, 64.0, 60.0, 101.0, 116.0, 180.0, 256.0, 374.0, 585.0, 1109.0, 2617.0, 9249.0, 42828.0, 293667.0, 590684.0, 82446.0, 16121.0, 4189.0, 1535.0, 748.0, 433.0, 282.0, 226.0, 142.0, 99.0, 72.0, 45.0, 36.0, 35.0, 32.0, 19.0, 16.0, 12.0, 9.0, 8.0, 9.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.9140625, -4.76141357421875, -4.6087646484375, -4.45611572265625, -4.303466796875, -4.15081787109375, -3.9981689453125, -3.84552001953125, -3.69287109375, -3.54022216796875, -3.3875732421875, -3.23492431640625, -3.082275390625, -2.92962646484375, -2.7769775390625, -2.62432861328125, -2.4716796875, -2.31903076171875, -2.1663818359375, -2.01373291015625, -1.861083984375, -1.70843505859375, -1.5557861328125, -1.40313720703125, -1.25048828125, -1.09783935546875, -0.9451904296875, -0.79254150390625, -0.639892578125, -0.48724365234375, -0.3345947265625, -0.18194580078125, -0.029296875, 0.12335205078125, 0.2760009765625, 0.42864990234375, 0.581298828125, 0.73394775390625, 0.8865966796875, 1.03924560546875, 1.19189453125, 1.34454345703125, 1.4971923828125, 1.64984130859375, 1.802490234375, 1.95513916015625, 2.1077880859375, 2.26043701171875, 2.4130859375, 2.56573486328125, 2.7183837890625, 2.87103271484375, 3.023681640625, 3.17633056640625, 3.3289794921875, 3.48162841796875, 3.63427734375, 3.78692626953125, 3.9395751953125, 4.09222412109375, 4.244873046875, 4.39752197265625, 4.5501708984375, 4.70281982421875, 4.85546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 3.0, 3.0, 5.0, 5.0, 5.0, 7.0, 7.0, 6.0, 7.0, 8.0, 20.0, 11.0, 21.0, 20.0, 20.0, 33.0, 28.0, 31.0, 49.0, 24.0, 46.0, 31.0, 43.0, 40.0, 42.0, 61.0, 30.0, 44.0, 44.0, 39.0, 34.0, 31.0, 31.0, 25.0, 14.0, 22.0, 20.0, 13.0, 24.0, 14.0, 10.0, 8.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.861328125, -2.7569580078125, -2.652587890625, -2.5482177734375, -2.44384765625, -2.3394775390625, -2.235107421875, -2.1307373046875, -2.0263671875, -1.9219970703125, -1.817626953125, -1.7132568359375, -1.60888671875, -1.5045166015625, -1.400146484375, -1.2957763671875, -1.19140625, -1.0870361328125, -0.982666015625, -0.8782958984375, -0.77392578125, -0.6695556640625, -0.565185546875, -0.4608154296875, -0.3564453125, -0.2520751953125, -0.147705078125, -0.0433349609375, 0.06103515625, 0.1654052734375, 0.269775390625, 0.3741455078125, 0.478515625, 0.5828857421875, 0.687255859375, 0.7916259765625, 0.89599609375, 1.0003662109375, 1.104736328125, 1.2091064453125, 1.3134765625, 1.4178466796875, 1.522216796875, 1.6265869140625, 1.73095703125, 1.8353271484375, 1.939697265625, 2.0440673828125, 2.1484375, 2.2528076171875, 2.357177734375, 2.4615478515625, 2.56591796875, 2.6702880859375, 2.774658203125, 2.8790283203125, 2.9833984375, 3.0877685546875, 3.192138671875, 3.2965087890625, 3.40087890625, 3.5052490234375, 3.609619140625, 3.7139892578125, 3.818359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 7.0, 4.0, 14.0, 20.0, 30.0, 36.0, 84.0, 153.0, 329.0, 884.0, 3483.0, 21439.0, 298853.0, 681267.0, 34729.0, 5284.0, 1095.0, 421.0, 179.0, 105.0, 64.0, 32.0, 15.0, 13.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.875, -3.7371826171875, -3.599365234375, -3.4615478515625, -3.32373046875, -3.1859130859375, -3.048095703125, -2.9102783203125, -2.7724609375, -2.6346435546875, -2.496826171875, -2.3590087890625, -2.22119140625, -2.0833740234375, -1.945556640625, -1.8077392578125, -1.669921875, -1.5321044921875, -1.394287109375, -1.2564697265625, -1.11865234375, -0.9808349609375, -0.843017578125, -0.7052001953125, -0.5673828125, -0.4295654296875, -0.291748046875, -0.1539306640625, -0.01611328125, 0.1217041015625, 0.259521484375, 0.3973388671875, 0.53515625, 0.6729736328125, 0.810791015625, 0.9486083984375, 1.08642578125, 1.2242431640625, 1.362060546875, 1.4998779296875, 1.6376953125, 1.7755126953125, 1.913330078125, 2.0511474609375, 2.18896484375, 2.3267822265625, 2.464599609375, 2.6024169921875, 2.740234375, 2.8780517578125, 3.015869140625, 3.1536865234375, 3.29150390625, 3.4293212890625, 3.567138671875, 3.7049560546875, 3.8427734375, 3.9805908203125, 4.118408203125, 4.2562255859375, 4.39404296875, 4.5318603515625, 4.669677734375, 4.8074951171875, 4.9453125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 7.0, 9.0, 23.0, 21.0, 27.0, 46.0, 121.0, 406.0, 155.0, 54.0, 38.0, 37.0, 17.0, 14.0, 11.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012226104736328125, -0.0011957958340644836, -0.0011689811944961548, -0.001142166554927826, -0.001115351915359497, -0.0010885372757911682, -0.0010617226362228394, -0.0010349079966545105, -0.0010080933570861816, -0.0009812787175178528, -0.0009544640779495239, -0.0009276494383811951, -0.0009008347988128662, -0.0008740201592445374, -0.0008472055196762085, -0.0008203908801078796, -0.0007935762405395508, -0.0007667616009712219, -0.0007399469614028931, -0.0007131323218345642, -0.0006863176822662354, -0.0006595030426979065, -0.0006326884031295776, -0.0006058737635612488, -0.0005790591239929199, -0.0005522444844245911, -0.0005254298448562622, -0.0004986152052879333, -0.0004718005657196045, -0.00044498592615127563, -0.0004181712865829468, -0.0003913566470146179, -0.00036454200744628906, -0.0003377273678779602, -0.00031091272830963135, -0.0002840980887413025, -0.00025728344917297363, -0.00023046880960464478, -0.00020365417003631592, -0.00017683953046798706, -0.0001500248908996582, -0.00012321025133132935, -9.639561176300049e-05, -6.958097219467163e-05, -4.2766332626342773e-05, -1.5951693058013916e-05, 1.0862946510314941e-05, 3.76775860786438e-05, 6.449222564697266e-05, 9.130686521530151e-05, 0.00011812150478363037, 0.00014493614435195923, 0.00017175078392028809, 0.00019856542348861694, 0.0002253800630569458, 0.00025219470262527466, 0.0002790093421936035, 0.0003058239817619324, 0.00033263862133026123, 0.0003594532608985901, 0.00038626790046691895, 0.0004130825400352478, 0.00043989717960357666, 0.0004667118191719055, 0.0004935264587402344]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 7.0, 11.0, 5.0, 11.0, 14.0, 19.0, 44.0, 38.0, 93.0, 132.0, 248.0, 511.0, 1269.0, 4935.0, 36032.0, 833678.0, 154115.0, 13311.0, 2463.0, 806.0, 368.0, 184.0, 77.0, 52.0, 37.0, 31.0, 14.0, 7.0, 7.0, 4.0, 5.0, 5.0, 4.0, 2.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-5.3984375, -5.2431640625, -5.087890625, -4.9326171875, -4.77734375, -4.6220703125, -4.466796875, -4.3115234375, -4.15625, -4.0009765625, -3.845703125, -3.6904296875, -3.53515625, -3.3798828125, -3.224609375, -3.0693359375, -2.9140625, -2.7587890625, -2.603515625, -2.4482421875, -2.29296875, -2.1376953125, -1.982421875, -1.8271484375, -1.671875, -1.5166015625, -1.361328125, -1.2060546875, -1.05078125, -0.8955078125, -0.740234375, -0.5849609375, -0.4296875, -0.2744140625, -0.119140625, 0.0361328125, 0.19140625, 0.3466796875, 0.501953125, 0.6572265625, 0.8125, 0.9677734375, 1.123046875, 1.2783203125, 1.43359375, 1.5888671875, 1.744140625, 1.8994140625, 2.0546875, 2.2099609375, 2.365234375, 2.5205078125, 2.67578125, 2.8310546875, 2.986328125, 3.1416015625, 3.296875, 3.4521484375, 3.607421875, 3.7626953125, 3.91796875, 4.0732421875, 4.228515625, 4.3837890625, 4.5390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 12.0, 17.0, 28.0, 38.0, 76.0, 150.0, 285.0, 183.0, 101.0, 40.0, 18.0, 13.0, 12.0, 4.0, 5.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4453125, -3.31097412109375, -3.1766357421875, -3.04229736328125, -2.907958984375, -2.77362060546875, -2.6392822265625, -2.50494384765625, -2.37060546875, -2.23626708984375, -2.1019287109375, -1.96759033203125, -1.833251953125, -1.69891357421875, -1.5645751953125, -1.43023681640625, -1.2958984375, -1.16156005859375, -1.0272216796875, -0.89288330078125, -0.758544921875, -0.62420654296875, -0.4898681640625, -0.35552978515625, -0.22119140625, -0.08685302734375, 0.0474853515625, 0.18182373046875, 0.316162109375, 0.45050048828125, 0.5848388671875, 0.71917724609375, 0.853515625, 0.98785400390625, 1.1221923828125, 1.25653076171875, 1.390869140625, 1.52520751953125, 1.6595458984375, 1.79388427734375, 1.92822265625, 2.06256103515625, 2.1968994140625, 2.33123779296875, 2.465576171875, 2.59991455078125, 2.7342529296875, 2.86859130859375, 3.0029296875, 3.13726806640625, 3.2716064453125, 3.40594482421875, 3.540283203125, 3.67462158203125, 3.8089599609375, 3.94329833984375, 4.07763671875, 4.21197509765625, 4.3463134765625, 4.48065185546875, 4.614990234375, 4.74932861328125, 4.8836669921875, 5.01800537109375, 5.15234375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 42.0, 209.0, 419.0, 252.0, 63.0, 14.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.46234893798828, -53.84701919555664, -51.231689453125, -48.61635971069336, -46.00102996826172, -43.38570022583008, -40.77037048339844, -38.15504455566406, -35.539710998535156, -32.924381256103516, -30.309051513671875, -27.693721771240234, -25.078392028808594, -22.463062286376953, -19.847734451293945, -17.232404708862305, -14.617076873779297, -12.001747131347656, -9.386417388916016, -6.771088600158691, -4.155758857727051, -1.5404291152954102, 1.074899673461914, 3.6902294158935547, 6.305559158325195, 8.920888900756836, 11.536218643188477, 14.1515474319458, 16.766876220703125, 19.382205963134766, 21.997535705566406, 24.612865447998047, 27.228195190429688, 29.843524932861328, 32.45885467529297, 35.07418441772461, 37.68951416015625, 40.30484390258789, 42.92017364501953, 45.535499572753906, 48.15083312988281, 50.76616287231445, 53.381492614746094, 55.996822357177734, 58.612152099609375, 61.227481842041016, 63.842811584472656, 66.45813751220703, 69.07347106933594, 71.68879699707031, 74.30413055419922, 76.9194564819336, 79.5347900390625, 82.15011596679688, 84.76544952392578, 87.38077545166016, 89.99610137939453, 92.6114273071289, 95.22676086425781, 97.84208679199219, 100.4574203491211, 103.07274627685547, 105.68807983398438, 108.30340576171875, 110.91873931884766]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 7.0, 6.0, 3.0, 3.0, 5.0, 6.0, 5.0, 14.0, 16.0, 9.0, 12.0, 22.0, 24.0, 24.0, 29.0, 36.0, 27.0, 40.0, 34.0, 44.0, 56.0, 62.0, 40.0, 50.0, 34.0, 40.0, 37.0, 47.0, 52.0, 30.0, 24.0, 25.0, 28.0, 20.0, 16.0, 21.0, 14.0, 11.0, 10.0, 8.0, 7.0, 3.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.104515075683594, -16.47117805480957, -15.837839126586914, -15.20450210571289, -14.57116413116455, -13.937826156616211, -13.304489135742188, -12.671151161193848, -12.037813186645508, -11.404475212097168, -10.771137237548828, -10.137800216674805, -9.504462242126465, -8.871124267578125, -8.237787246704102, -7.604449272155762, -6.971111297607422, -6.337773323059082, -5.7044358253479, -5.071098327636719, -4.437760353088379, -3.804422616958618, -3.1710848808288574, -2.537747383117676, -1.904409408569336, -1.2710716724395752, -0.6377339363098145, -0.004396200180053711, 0.628941535949707, 1.2622792720794678, 1.8956170082092285, 2.52895450592041, 3.16229248046875, 3.7956302165985107, 4.4289679527282715, 5.062305450439453, 5.695643424987793, 6.328981399536133, 6.9623188972473145, 7.595656394958496, 8.228994369506836, 8.862332344055176, 9.495670318603516, 10.129007339477539, 10.762345314025879, 11.395683288574219, 12.029020309448242, 12.662358283996582, 13.295696258544922, 13.929034233093262, 14.562372207641602, 15.195709228515625, 15.829047203063965, 16.462385177612305, 17.095722198486328, 17.729061126708984, 18.362398147583008, 18.99573516845703, 19.629074096679688, 20.26241111755371, 20.895748138427734, 21.52908706665039, 22.162424087524414, 22.795761108398438, 23.429100036621094]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 7.0, 13.0, 14.0, 17.0, 24.0, 41.0, 50.0, 94.0, 166.0, 271.0, 486.0, 934.0, 1932.0, 4248.0, 11039.0, 35316.0, 180744.0, 3434044.0, 438885.0, 58631.0, 16138.0, 5883.0, 2546.0, 1251.0, 592.0, 347.0, 191.0, 127.0, 72.0, 41.0, 44.0, 26.0, 25.0, 13.0, 6.0, 10.0, 4.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.044921875, -2.948822021484375, -2.85272216796875, -2.756622314453125, -2.6605224609375, -2.564422607421875, -2.46832275390625, -2.372222900390625, -2.276123046875, -2.180023193359375, -2.08392333984375, -1.987823486328125, -1.8917236328125, -1.795623779296875, -1.69952392578125, -1.603424072265625, -1.50732421875, -1.411224365234375, -1.31512451171875, -1.219024658203125, -1.1229248046875, -1.026824951171875, -0.93072509765625, -0.834625244140625, -0.738525390625, -0.642425537109375, -0.54632568359375, -0.450225830078125, -0.3541259765625, -0.258026123046875, -0.16192626953125, -0.065826416015625, 0.0302734375, 0.126373291015625, 0.22247314453125, 0.318572998046875, 0.4146728515625, 0.510772705078125, 0.60687255859375, 0.702972412109375, 0.799072265625, 0.895172119140625, 0.99127197265625, 1.087371826171875, 1.1834716796875, 1.279571533203125, 1.37567138671875, 1.471771240234375, 1.56787109375, 1.663970947265625, 1.76007080078125, 1.856170654296875, 1.9522705078125, 2.048370361328125, 2.14447021484375, 2.240570068359375, 2.336669921875, 2.432769775390625, 2.52886962890625, 2.624969482421875, 2.7210693359375, 2.817169189453125, 2.91326904296875, 3.009368896484375, 3.10546875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 0.0, 7.0, 6.0, 13.0, 10.0, 17.0, 20.0, 24.0, 18.0, 25.0, 43.0, 50.0, 54.0, 66.0, 67.0, 64.0, 67.0, 61.0, 54.0, 62.0, 47.0, 52.0, 29.0, 35.0, 26.0, 27.0, 18.0, 9.0, 7.0, 8.0, 3.0, 4.0, 6.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.083984375, -1.047088623046875, -1.01019287109375, -0.973297119140625, -0.9364013671875, -0.899505615234375, -0.86260986328125, -0.825714111328125, -0.788818359375, -0.751922607421875, -0.71502685546875, -0.678131103515625, -0.6412353515625, -0.604339599609375, -0.56744384765625, -0.530548095703125, -0.49365234375, -0.456756591796875, -0.41986083984375, -0.382965087890625, -0.3460693359375, -0.309173583984375, -0.27227783203125, -0.235382080078125, -0.198486328125, -0.161590576171875, -0.12469482421875, -0.087799072265625, -0.0509033203125, -0.014007568359375, 0.02288818359375, 0.059783935546875, 0.0966796875, 0.133575439453125, 0.17047119140625, 0.207366943359375, 0.2442626953125, 0.281158447265625, 0.31805419921875, 0.354949951171875, 0.391845703125, 0.428741455078125, 0.46563720703125, 0.502532958984375, 0.5394287109375, 0.576324462890625, 0.61322021484375, 0.650115966796875, 0.68701171875, 0.723907470703125, 0.76080322265625, 0.797698974609375, 0.8345947265625, 0.871490478515625, 0.90838623046875, 0.945281982421875, 0.982177734375, 1.019073486328125, 1.05596923828125, 1.092864990234375, 1.1297607421875, 1.166656494140625, 1.20355224609375, 1.240447998046875, 1.27734375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 12.0, 19.0, 31.0, 42.0, 88.0, 137.0, 223.0, 343.0, 706.0, 1380.0, 3016.0, 6912.0, 17325.0, 54097.0, 271953.0, 3158411.0, 557069.0, 82672.0, 23418.0, 8987.0, 3762.0, 1775.0, 818.0, 432.0, 249.0, 160.0, 81.0, 56.0, 33.0, 17.0, 11.0, 7.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.779296875, -2.691497802734375, -2.60369873046875, -2.515899658203125, -2.4281005859375, -2.340301513671875, -2.25250244140625, -2.164703369140625, -2.076904296875, -1.989105224609375, -1.90130615234375, -1.813507080078125, -1.7257080078125, -1.637908935546875, -1.55010986328125, -1.462310791015625, -1.37451171875, -1.286712646484375, -1.19891357421875, -1.111114501953125, -1.0233154296875, -0.935516357421875, -0.84771728515625, -0.759918212890625, -0.672119140625, -0.584320068359375, -0.49652099609375, -0.408721923828125, -0.3209228515625, -0.233123779296875, -0.14532470703125, -0.057525634765625, 0.0302734375, 0.118072509765625, 0.20587158203125, 0.293670654296875, 0.3814697265625, 0.469268798828125, 0.55706787109375, 0.644866943359375, 0.732666015625, 0.820465087890625, 0.90826416015625, 0.996063232421875, 1.0838623046875, 1.171661376953125, 1.25946044921875, 1.347259521484375, 1.43505859375, 1.522857666015625, 1.61065673828125, 1.698455810546875, 1.7862548828125, 1.874053955078125, 1.96185302734375, 2.049652099609375, 2.137451171875, 2.225250244140625, 2.31304931640625, 2.400848388671875, 2.4886474609375, 2.576446533203125, 2.66424560546875, 2.752044677734375, 2.83984375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 10.0, 5.0, 6.0, 8.0, 8.0, 11.0, 18.0, 20.0, 27.0, 47.0, 63.0, 96.0, 191.0, 315.0, 772.0, 1406.0, 470.0, 235.0, 106.0, 79.0, 56.0, 26.0, 25.0, 15.0, 9.0, 11.0, 10.0, 8.0, 7.0, 3.0, 2.0, 3.0, 7.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.4609375, -1.4206695556640625, -1.380401611328125, -1.3401336669921875, -1.29986572265625, -1.2595977783203125, -1.219329833984375, -1.1790618896484375, -1.1387939453125, -1.0985260009765625, -1.058258056640625, -1.0179901123046875, -0.97772216796875, -0.9374542236328125, -0.897186279296875, -0.8569183349609375, -0.816650390625, -0.7763824462890625, -0.736114501953125, -0.6958465576171875, -0.65557861328125, -0.6153106689453125, -0.575042724609375, -0.5347747802734375, -0.4945068359375, -0.4542388916015625, -0.413970947265625, -0.3737030029296875, -0.33343505859375, -0.2931671142578125, -0.252899169921875, -0.2126312255859375, -0.17236328125, -0.1320953369140625, -0.091827392578125, -0.0515594482421875, -0.01129150390625, 0.0289764404296875, 0.069244384765625, 0.1095123291015625, 0.1497802734375, 0.1900482177734375, 0.230316162109375, 0.2705841064453125, 0.31085205078125, 0.3511199951171875, 0.391387939453125, 0.4316558837890625, 0.471923828125, 0.5121917724609375, 0.552459716796875, 0.5927276611328125, 0.63299560546875, 0.6732635498046875, 0.713531494140625, 0.7537994384765625, 0.7940673828125, 0.8343353271484375, 0.874603271484375, 0.9148712158203125, 0.95513916015625, 0.9954071044921875, 1.035675048828125, 1.0759429931640625, 1.1162109375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 13.0, 25.0, 39.0, 89.0, 114.0, 155.0, 173.0, 149.0, 125.0, 74.0, 25.0, 8.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-15.28591251373291, -14.943406105041504, -14.600898742675781, -14.258392333984375, -13.915885925292969, -13.573378562927246, -13.23087215423584, -12.888364791870117, -12.545858383178711, -12.203351974487305, -11.860844612121582, -11.518338203430176, -11.175830841064453, -10.833324432373047, -10.49081802368164, -10.148311614990234, -9.805804252624512, -9.463297843933105, -9.120790481567383, -8.778284072875977, -8.43577766418457, -8.093270301818848, -7.750763893127441, -7.408257007598877, -7.0657501220703125, -6.723243236541748, -6.380736351013184, -6.038229942321777, -5.695723056793213, -5.353216171264648, -5.010709762573242, -4.668202877044678, -4.325695037841797, -3.9831881523132324, -3.640681505203247, -3.2981748580932617, -2.9556679725646973, -2.613161087036133, -2.2706544399261475, -1.928147792816162, -1.5856409072875977, -1.2431341409683228, -0.9006273746490479, -0.558120608329773, -0.21561384201049805, 0.12689292430877686, 0.46939969062805176, 0.8119063377380371, 1.1544132232666016, 1.4969199895858765, 1.8394267559051514, 2.1819334030151367, 2.524440288543701, 2.8669471740722656, 3.209453821182251, 3.5519604682922363, 3.894467353820801, 4.236974239349365, 4.57948112487793, 4.921987533569336, 5.2644944190979, 5.607001304626465, 5.949507713317871, 6.2920145988464355, 6.634521484375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 6.0, 5.0, 6.0, 7.0, 13.0, 12.0, 20.0, 24.0, 23.0, 22.0, 29.0, 35.0, 38.0, 40.0, 44.0, 41.0, 41.0, 39.0, 45.0, 53.0, 39.0, 60.0, 36.0, 43.0, 48.0, 39.0, 29.0, 32.0, 17.0, 20.0, 29.0, 17.0, 10.0, 7.0, 8.0, 3.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-4.906667709350586, -4.7587385177612305, -4.610809326171875, -4.462879657745361, -4.314950466156006, -4.16702127456665, -4.019091606140137, -3.8711624145507812, -3.723233222961426, -3.5753040313720703, -3.4273746013641357, -3.279445171356201, -3.1315159797668457, -2.9835867881774902, -2.8356573581695557, -2.687727928161621, -2.5397987365722656, -2.39186954498291, -2.2439401149749756, -2.096010684967041, -1.9480814933776855, -1.8001521825790405, -1.6522228717803955, -1.5042935609817505, -1.3563642501831055, -1.2084349393844604, -1.0605056285858154, -0.9125763177871704, -0.7646470069885254, -0.6167176961898804, -0.46878838539123535, -0.32085907459259033, -0.1729297637939453, -0.025000452995300293, 0.12292885780334473, 0.27085816860198975, 0.41878747940063477, 0.5667167901992798, 0.7146461009979248, 0.8625754117965698, 1.0105047225952148, 1.1584340333938599, 1.3063633441925049, 1.45429265499115, 1.602221965789795, 1.75015127658844, 1.898080587387085, 2.0460100173950195, 2.193939208984375, 2.3418684005737305, 2.489797830581665, 2.6377272605895996, 2.785656452178955, 2.9335856437683105, 3.081515073776245, 3.2294445037841797, 3.377373695373535, 3.5253028869628906, 3.673232316970825, 3.8211617469787598, 3.9690909385681152, 4.117020130157471, 4.264949798583984, 4.41287899017334, 4.560808181762695]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 7.0, 12.0, 17.0, 25.0, 41.0, 59.0, 94.0, 134.0, 238.0, 448.0, 937.0, 2002.0, 4835.0, 12629.0, 34233.0, 99925.0, 330064.0, 377261.0, 120312.0, 40692.0, 14690.0, 5584.0, 2199.0, 976.0, 465.0, 260.0, 134.0, 99.0, 55.0, 37.0, 16.0, 19.0, 19.0, 10.0, 8.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.142578125, -2.0535888671875, -1.964599609375, -1.8756103515625, -1.78662109375, -1.6976318359375, -1.608642578125, -1.5196533203125, -1.4306640625, -1.3416748046875, -1.252685546875, -1.1636962890625, -1.07470703125, -0.9857177734375, -0.896728515625, -0.8077392578125, -0.71875, -0.6297607421875, -0.540771484375, -0.4517822265625, -0.36279296875, -0.2738037109375, -0.184814453125, -0.0958251953125, -0.0068359375, 0.0821533203125, 0.171142578125, 0.2601318359375, 0.34912109375, 0.4381103515625, 0.527099609375, 0.6160888671875, 0.705078125, 0.7940673828125, 0.883056640625, 0.9720458984375, 1.06103515625, 1.1500244140625, 1.239013671875, 1.3280029296875, 1.4169921875, 1.5059814453125, 1.594970703125, 1.6839599609375, 1.77294921875, 1.8619384765625, 1.950927734375, 2.0399169921875, 2.12890625, 2.2178955078125, 2.306884765625, 2.3958740234375, 2.48486328125, 2.5738525390625, 2.662841796875, 2.7518310546875, 2.8408203125, 2.9298095703125, 3.018798828125, 3.1077880859375, 3.19677734375, 3.2857666015625, 3.374755859375, 3.4637451171875, 3.552734375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 7.0, 4.0, 7.0, 5.0, 13.0, 20.0, 19.0, 21.0, 24.0, 37.0, 47.0, 55.0, 57.0, 52.0, 52.0, 71.0, 74.0, 66.0, 59.0, 47.0, 59.0, 44.0, 40.0, 26.0, 25.0, 22.0, 16.0, 11.0, 4.0, 5.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2880859375, -1.250335693359375, -1.21258544921875, -1.174835205078125, -1.1370849609375, -1.099334716796875, -1.06158447265625, -1.023834228515625, -0.986083984375, -0.948333740234375, -0.91058349609375, -0.872833251953125, -0.8350830078125, -0.797332763671875, -0.75958251953125, -0.721832275390625, -0.68408203125, -0.646331787109375, -0.60858154296875, -0.570831298828125, -0.5330810546875, -0.495330810546875, -0.45758056640625, -0.419830322265625, -0.382080078125, -0.344329833984375, -0.30657958984375, -0.268829345703125, -0.2310791015625, -0.193328857421875, -0.15557861328125, -0.117828369140625, -0.080078125, -0.042327880859375, -0.00457763671875, 0.033172607421875, 0.0709228515625, 0.108673095703125, 0.14642333984375, 0.184173583984375, 0.221923828125, 0.259674072265625, 0.29742431640625, 0.335174560546875, 0.3729248046875, 0.410675048828125, 0.44842529296875, 0.486175537109375, 0.52392578125, 0.561676025390625, 0.59942626953125, 0.637176513671875, 0.6749267578125, 0.712677001953125, 0.75042724609375, 0.788177490234375, 0.825927734375, 0.863677978515625, 0.90142822265625, 0.939178466796875, 0.9769287109375, 1.014678955078125, 1.05242919921875, 1.090179443359375, 1.1279296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 0.0, 7.0, 5.0, 14.0, 14.0, 17.0, 31.0, 33.0, 65.0, 98.0, 129.0, 181.0, 312.0, 525.0, 952.0, 2368.0, 6843.0, 23141.0, 92521.0, 546597.0, 298816.0, 53284.0, 14464.0, 4508.0, 1737.0, 748.0, 366.0, 237.0, 160.0, 110.0, 60.0, 56.0, 43.0, 30.0, 27.0, 18.0, 12.0, 8.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.87396240234375, -3.7440185546875, -3.61407470703125, -3.484130859375, -3.35418701171875, -3.2242431640625, -3.09429931640625, -2.96435546875, -2.83441162109375, -2.7044677734375, -2.57452392578125, -2.444580078125, -2.31463623046875, -2.1846923828125, -2.05474853515625, -1.9248046875, -1.79486083984375, -1.6649169921875, -1.53497314453125, -1.405029296875, -1.27508544921875, -1.1451416015625, -1.01519775390625, -0.88525390625, -0.75531005859375, -0.6253662109375, -0.49542236328125, -0.365478515625, -0.23553466796875, -0.1055908203125, 0.02435302734375, 0.154296875, 0.28424072265625, 0.4141845703125, 0.54412841796875, 0.674072265625, 0.80401611328125, 0.9339599609375, 1.06390380859375, 1.19384765625, 1.32379150390625, 1.4537353515625, 1.58367919921875, 1.713623046875, 1.84356689453125, 1.9735107421875, 2.10345458984375, 2.2333984375, 2.36334228515625, 2.4932861328125, 2.62322998046875, 2.753173828125, 2.88311767578125, 3.0130615234375, 3.14300537109375, 3.27294921875, 3.40289306640625, 3.5328369140625, 3.66278076171875, 3.792724609375, 3.92266845703125, 4.0526123046875, 4.18255615234375, 4.3125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 6.0, 9.0, 5.0, 5.0, 14.0, 18.0, 19.0, 15.0, 33.0, 39.0, 46.0, 53.0, 41.0, 47.0, 65.0, 63.0, 65.0, 61.0, 71.0, 51.0, 52.0, 49.0, 29.0, 30.0, 26.0, 20.0, 17.0, 13.0, 8.0, 10.0, 5.0, 3.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.85546875, -5.6978759765625, -5.540283203125, -5.3826904296875, -5.22509765625, -5.0675048828125, -4.909912109375, -4.7523193359375, -4.5947265625, -4.4371337890625, -4.279541015625, -4.1219482421875, -3.96435546875, -3.8067626953125, -3.649169921875, -3.4915771484375, -3.333984375, -3.1763916015625, -3.018798828125, -2.8612060546875, -2.70361328125, -2.5460205078125, -2.388427734375, -2.2308349609375, -2.0732421875, -1.9156494140625, -1.758056640625, -1.6004638671875, -1.44287109375, -1.2852783203125, -1.127685546875, -0.9700927734375, -0.8125, -0.6549072265625, -0.497314453125, -0.3397216796875, -0.18212890625, -0.0245361328125, 0.133056640625, 0.2906494140625, 0.4482421875, 0.6058349609375, 0.763427734375, 0.9210205078125, 1.07861328125, 1.2362060546875, 1.393798828125, 1.5513916015625, 1.708984375, 1.8665771484375, 2.024169921875, 2.1817626953125, 2.33935546875, 2.4969482421875, 2.654541015625, 2.8121337890625, 2.9697265625, 3.1273193359375, 3.284912109375, 3.4425048828125, 3.60009765625, 3.7576904296875, 3.915283203125, 4.0728759765625, 4.23046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 13.0, 10.0, 21.0, 35.0, 65.0, 103.0, 223.0, 428.0, 1026.0, 2693.0, 7667.0, 23955.0, 82307.0, 473392.0, 360743.0, 65389.0, 19996.0, 6397.0, 2290.0, 935.0, 419.0, 199.0, 94.0, 70.0, 24.0, 15.0, 12.0, 11.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7685546875, -1.7148284912109375, -1.661102294921875, -1.6073760986328125, -1.55364990234375, -1.4999237060546875, -1.446197509765625, -1.3924713134765625, -1.3387451171875, -1.2850189208984375, -1.231292724609375, -1.1775665283203125, -1.12384033203125, -1.0701141357421875, -1.016387939453125, -0.9626617431640625, -0.908935546875, -0.8552093505859375, -0.801483154296875, -0.7477569580078125, -0.69403076171875, -0.6403045654296875, -0.586578369140625, -0.5328521728515625, -0.4791259765625, -0.4253997802734375, -0.371673583984375, -0.3179473876953125, -0.26422119140625, -0.2104949951171875, -0.156768798828125, -0.1030426025390625, -0.04931640625, 0.0044097900390625, 0.058135986328125, 0.1118621826171875, 0.16558837890625, 0.2193145751953125, 0.273040771484375, 0.3267669677734375, 0.3804931640625, 0.4342193603515625, 0.487945556640625, 0.5416717529296875, 0.59539794921875, 0.6491241455078125, 0.702850341796875, 0.7565765380859375, 0.810302734375, 0.8640289306640625, 0.917755126953125, 0.9714813232421875, 1.02520751953125, 1.0789337158203125, 1.132659912109375, 1.1863861083984375, 1.2401123046875, 1.2938385009765625, 1.347564697265625, 1.4012908935546875, 1.45501708984375, 1.5087432861328125, 1.562469482421875, 1.6161956787109375, 1.669921875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 7.0, 9.0, 4.0, 11.0, 9.0, 15.0, 18.0, 21.0, 20.0, 32.0, 75.0, 160.0, 219.0, 168.0, 72.0, 41.0, 21.0, 19.0, 9.0, 3.0, 9.0, 8.0, 3.0, 8.0, 5.0, 5.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003466606140136719, -0.00033248215913772583, -0.0003183037042617798, -0.00030412524938583374, -0.0002899467945098877, -0.00027576833963394165, -0.0002615898847579956, -0.00024741142988204956, -0.00023323297500610352, -0.00021905452013015747, -0.00020487606525421143, -0.00019069761037826538, -0.00017651915550231934, -0.0001623407006263733, -0.00014816224575042725, -0.0001339837908744812, -0.00011980533599853516, -0.00010562688112258911, -9.144842624664307e-05, -7.726997137069702e-05, -6.309151649475098e-05, -4.891306161880493e-05, -3.473460674285889e-05, -2.0556151866912842e-05, -6.377696990966797e-06, 7.800757884979248e-06, 2.1979212760925293e-05, 3.615766763687134e-05, 5.033612251281738e-05, 6.451457738876343e-05, 7.869303226470947e-05, 9.287148714065552e-05, 0.00010704994201660156, 0.00012122839689254761, 0.00013540685176849365, 0.0001495853066444397, 0.00016376376152038574, 0.0001779422163963318, 0.00019212067127227783, 0.00020629912614822388, 0.00022047758102416992, 0.00023465603590011597, 0.000248834490776062, 0.00026301294565200806, 0.0002771914005279541, 0.00029136985540390015, 0.0003055483102798462, 0.00031972676515579224, 0.0003339052200317383, 0.0003480836749076843, 0.00036226212978363037, 0.0003764405846595764, 0.00039061903953552246, 0.0004047974944114685, 0.00041897594928741455, 0.0004331544041633606, 0.00044733285903930664, 0.0004615113139152527, 0.00047568976879119873, 0.0004898682236671448, 0.0005040466785430908, 0.0005182251334190369, 0.0005324035882949829, 0.000546582043170929, 0.000560760498046875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 9.0, 10.0, 18.0, 23.0, 41.0, 49.0, 78.0, 175.0, 295.0, 539.0, 1220.0, 3489.0, 11255.0, 48272.0, 399013.0, 506891.0, 57399.0, 13412.0, 3656.0, 1404.0, 597.0, 313.0, 147.0, 80.0, 59.0, 37.0, 25.0, 21.0, 6.0, 11.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.146484375, -2.08154296875, -2.0166015625, -1.95166015625, -1.88671875, -1.82177734375, -1.7568359375, -1.69189453125, -1.626953125, -1.56201171875, -1.4970703125, -1.43212890625, -1.3671875, -1.30224609375, -1.2373046875, -1.17236328125, -1.107421875, -1.04248046875, -0.9775390625, -0.91259765625, -0.84765625, -0.78271484375, -0.7177734375, -0.65283203125, -0.587890625, -0.52294921875, -0.4580078125, -0.39306640625, -0.328125, -0.26318359375, -0.1982421875, -0.13330078125, -0.068359375, -0.00341796875, 0.0615234375, 0.12646484375, 0.19140625, 0.25634765625, 0.3212890625, 0.38623046875, 0.451171875, 0.51611328125, 0.5810546875, 0.64599609375, 0.7109375, 0.77587890625, 0.8408203125, 0.90576171875, 0.970703125, 1.03564453125, 1.1005859375, 1.16552734375, 1.23046875, 1.29541015625, 1.3603515625, 1.42529296875, 1.490234375, 1.55517578125, 1.6201171875, 1.68505859375, 1.75, 1.81494140625, 1.8798828125, 1.94482421875, 2.009765625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 7.0, 3.0, 5.0, 6.0, 12.0, 10.0, 9.0, 26.0, 40.0, 54.0, 67.0, 130.0, 130.0, 147.0, 127.0, 72.0, 50.0, 34.0, 25.0, 20.0, 14.0, 5.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.390625, -1.32696533203125, -1.2633056640625, -1.19964599609375, -1.135986328125, -1.07232666015625, -1.0086669921875, -0.94500732421875, -0.88134765625, -0.81768798828125, -0.7540283203125, -0.69036865234375, -0.626708984375, -0.56304931640625, -0.4993896484375, -0.43572998046875, -0.3720703125, -0.30841064453125, -0.2447509765625, -0.18109130859375, -0.117431640625, -0.05377197265625, 0.0098876953125, 0.07354736328125, 0.13720703125, 0.20086669921875, 0.2645263671875, 0.32818603515625, 0.391845703125, 0.45550537109375, 0.5191650390625, 0.58282470703125, 0.646484375, 0.71014404296875, 0.7738037109375, 0.83746337890625, 0.901123046875, 0.96478271484375, 1.0284423828125, 1.09210205078125, 1.15576171875, 1.21942138671875, 1.2830810546875, 1.34674072265625, 1.410400390625, 1.47406005859375, 1.5377197265625, 1.60137939453125, 1.6650390625, 1.72869873046875, 1.7923583984375, 1.85601806640625, 1.919677734375, 1.98333740234375, 2.0469970703125, 2.11065673828125, 2.17431640625, 2.23797607421875, 2.3016357421875, 2.36529541015625, 2.428955078125, 2.49261474609375, 2.5562744140625, 2.61993408203125, 2.68359375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 25.0, 72.0, 104.0, 149.0, 187.0, 198.0, 132.0, 65.0, 31.0, 15.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.85838317871094, -39.75513458251953, -38.651885986328125, -37.54863357543945, -36.44538497924805, -35.34213638305664, -34.238887786865234, -33.13563919067383, -32.032386779785156, -30.92913818359375, -29.82588768005371, -28.722639083862305, -27.619388580322266, -26.51613998413086, -25.412891387939453, -24.309642791748047, -23.20639419555664, -22.103145599365234, -20.999895095825195, -19.89664649963379, -18.79339599609375, -17.690147399902344, -16.586898803710938, -15.483649253845215, -14.380399703979492, -13.27715015411377, -12.173900604248047, -11.07065200805664, -9.967402458190918, -8.864152908325195, -7.760903835296631, -6.657654762268066, -5.554405212402344, -4.451155662536621, -3.3479065895080566, -2.244657278060913, -1.1414079666137695, -0.038158416748046875, 1.0650906562805176, 2.168339729309082, 3.2715892791748047, 4.374838829040527, 5.478087902069092, 6.581336975097656, 7.684586524963379, 8.787836074829102, 9.891084671020508, 10.99433422088623, 12.097583770751953, 13.200833320617676, 14.304082870483398, 15.407331466674805, 16.510581970214844, 17.61383056640625, 18.717079162597656, 19.820327758789062, 20.9235782623291, 22.026826858520508, 23.130077362060547, 24.233325958251953, 25.33657455444336, 26.4398250579834, 27.543073654174805, 28.646324157714844, 29.74957275390625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 11.0, 4.0, 4.0, 7.0, 14.0, 15.0, 9.0, 11.0, 21.0, 28.0, 25.0, 27.0, 42.0, 34.0, 39.0, 45.0, 53.0, 35.0, 43.0, 44.0, 37.0, 46.0, 49.0, 39.0, 28.0, 42.0, 29.0, 36.0, 26.0, 27.0, 20.0, 21.0, 16.0, 14.0, 14.0, 9.0, 6.0, 5.0, 12.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-18.986740112304688, -18.44059181213379, -17.894445419311523, -17.348297119140625, -16.80215072631836, -16.25600242614746, -15.709855079650879, -15.163707733154297, -14.617560386657715, -14.071413040161133, -13.52526569366455, -12.979118347167969, -12.43297004699707, -11.886823654174805, -11.340675354003906, -10.794528007507324, -10.248380661010742, -9.70223331451416, -9.156085968017578, -8.609938621520996, -8.063791275024414, -7.517643451690674, -6.971495628356934, -6.425348281860352, -5.8792009353637695, -5.3330535888671875, -4.7869062423706055, -4.240758419036865, -3.694611072540283, -3.148463726043701, -2.60231614112854, -2.056168556213379, -1.5100231170654297, -0.9638756513595581, -0.4177281856536865, 0.12841928005218506, 0.6745667457580566, 1.2207140922546387, 1.7668616771697998, 2.313009262084961, 2.859156608581543, 3.405303955078125, 3.951451539993286, 4.497599124908447, 5.043746471405029, 5.589893817901611, 6.136041641235352, 6.682188987731934, 7.228336334228516, 7.774483680725098, 8.32063102722168, 8.866778373718262, 9.412925720214844, 9.959074020385742, 10.505221366882324, 11.051368713378906, 11.597516059875488, 12.14366340637207, 12.689810752868652, 13.235958099365234, 13.782106399536133, 14.328252792358398, 14.874401092529297, 15.420548439025879, 15.966695785522461]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 2.0, 7.0, 10.0, 15.0, 26.0, 37.0, 70.0, 104.0, 184.0, 428.0, 934.0, 2264.0, 6693.0, 24259.0, 144406.0, 3577358.0, 377325.0, 43770.0, 10316.0, 3355.0, 1371.0, 633.0, 312.0, 154.0, 87.0, 62.0, 36.0, 19.0, 15.0, 8.0, 10.0, 5.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.849609375, -3.699737548828125, -3.54986572265625, -3.399993896484375, -3.2501220703125, -3.100250244140625, -2.95037841796875, -2.800506591796875, -2.650634765625, -2.500762939453125, -2.35089111328125, -2.201019287109375, -2.0511474609375, -1.901275634765625, -1.75140380859375, -1.601531982421875, -1.45166015625, -1.301788330078125, -1.15191650390625, -1.002044677734375, -0.8521728515625, -0.702301025390625, -0.55242919921875, -0.402557373046875, -0.252685546875, -0.102813720703125, 0.04705810546875, 0.196929931640625, 0.3468017578125, 0.496673583984375, 0.64654541015625, 0.796417236328125, 0.9462890625, 1.096160888671875, 1.24603271484375, 1.395904541015625, 1.5457763671875, 1.695648193359375, 1.84552001953125, 1.995391845703125, 2.145263671875, 2.295135498046875, 2.44500732421875, 2.594879150390625, 2.7447509765625, 2.894622802734375, 3.04449462890625, 3.194366455078125, 3.34423828125, 3.494110107421875, 3.64398193359375, 3.793853759765625, 3.9437255859375, 4.093597412109375, 4.24346923828125, 4.393341064453125, 4.543212890625, 4.693084716796875, 4.84295654296875, 4.992828369140625, 5.1427001953125, 5.292572021484375, 5.44244384765625, 5.592315673828125, 5.7421875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 14.0, 6.0, 10.0, 18.0, 15.0, 17.0, 22.0, 33.0, 40.0, 38.0, 56.0, 60.0, 48.0, 69.0, 70.0, 61.0, 65.0, 54.0, 52.0, 48.0, 34.0, 38.0, 36.0, 31.0, 15.0, 13.0, 15.0, 8.0, 7.0, 4.0, 8.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1396484375, -1.100311279296875, -1.06097412109375, -1.021636962890625, -0.9822998046875, -0.942962646484375, -0.90362548828125, -0.864288330078125, -0.824951171875, -0.785614013671875, -0.74627685546875, -0.706939697265625, -0.6676025390625, -0.628265380859375, -0.58892822265625, -0.549591064453125, -0.51025390625, -0.470916748046875, -0.43157958984375, -0.392242431640625, -0.3529052734375, -0.313568115234375, -0.27423095703125, -0.234893798828125, -0.195556640625, -0.156219482421875, -0.11688232421875, -0.077545166015625, -0.0382080078125, 0.001129150390625, 0.04046630859375, 0.079803466796875, 0.119140625, 0.158477783203125, 0.19781494140625, 0.237152099609375, 0.2764892578125, 0.315826416015625, 0.35516357421875, 0.394500732421875, 0.433837890625, 0.473175048828125, 0.51251220703125, 0.551849365234375, 0.5911865234375, 0.630523681640625, 0.66986083984375, 0.709197998046875, 0.74853515625, 0.787872314453125, 0.82720947265625, 0.866546630859375, 0.9058837890625, 0.945220947265625, 0.98455810546875, 1.023895263671875, 1.063232421875, 1.102569580078125, 1.14190673828125, 1.181243896484375, 1.2205810546875, 1.259918212890625, 1.29925537109375, 1.338592529296875, 1.3779296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 0.0, 4.0, 7.0, 15.0, 23.0, 35.0, 48.0, 75.0, 137.0, 243.0, 402.0, 709.0, 1280.0, 2413.0, 5165.0, 12354.0, 33256.0, 108821.0, 660947.0, 3042792.0, 233034.0, 58027.0, 19579.0, 7606.0, 3430.0, 1676.0, 931.0, 511.0, 297.0, 183.0, 125.0, 63.0, 35.0, 19.0, 13.0, 7.0, 13.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.02734375, -2.916259765625, -2.80517578125, -2.694091796875, -2.5830078125, -2.471923828125, -2.36083984375, -2.249755859375, -2.138671875, -2.027587890625, -1.91650390625, -1.805419921875, -1.6943359375, -1.583251953125, -1.47216796875, -1.361083984375, -1.25, -1.138916015625, -1.02783203125, -0.916748046875, -0.8056640625, -0.694580078125, -0.58349609375, -0.472412109375, -0.361328125, -0.250244140625, -0.13916015625, -0.028076171875, 0.0830078125, 0.194091796875, 0.30517578125, 0.416259765625, 0.52734375, 0.638427734375, 0.74951171875, 0.860595703125, 0.9716796875, 1.082763671875, 1.19384765625, 1.304931640625, 1.416015625, 1.527099609375, 1.63818359375, 1.749267578125, 1.8603515625, 1.971435546875, 2.08251953125, 2.193603515625, 2.3046875, 2.415771484375, 2.52685546875, 2.637939453125, 2.7490234375, 2.860107421875, 2.97119140625, 3.082275390625, 3.193359375, 3.304443359375, 3.41552734375, 3.526611328125, 3.6376953125, 3.748779296875, 3.85986328125, 3.970947265625, 4.08203125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 15.0, 16.0, 16.0, 18.0, 29.0, 25.0, 47.0, 88.0, 119.0, 235.0, 597.0, 1820.0, 510.0, 191.0, 112.0, 68.0, 45.0, 35.0, 24.0, 16.0, 7.0, 7.0, 2.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7763671875, -1.7180023193359375, -1.659637451171875, -1.6012725830078125, -1.54290771484375, -1.4845428466796875, -1.426177978515625, -1.3678131103515625, -1.3094482421875, -1.2510833740234375, -1.192718505859375, -1.1343536376953125, -1.07598876953125, -1.0176239013671875, -0.959259033203125, -0.9008941650390625, -0.842529296875, -0.7841644287109375, -0.725799560546875, -0.6674346923828125, -0.60906982421875, -0.5507049560546875, -0.492340087890625, -0.4339752197265625, -0.3756103515625, -0.3172454833984375, -0.258880615234375, -0.2005157470703125, -0.14215087890625, -0.0837860107421875, -0.025421142578125, 0.0329437255859375, 0.09130859375, 0.1496734619140625, 0.208038330078125, 0.2664031982421875, 0.32476806640625, 0.3831329345703125, 0.441497802734375, 0.4998626708984375, 0.5582275390625, 0.6165924072265625, 0.674957275390625, 0.7333221435546875, 0.79168701171875, 0.8500518798828125, 0.908416748046875, 0.9667816162109375, 1.025146484375, 1.0835113525390625, 1.141876220703125, 1.2002410888671875, 1.25860595703125, 1.3169708251953125, 1.375335693359375, 1.4337005615234375, 1.4920654296875, 1.5504302978515625, 1.608795166015625, 1.6671600341796875, 1.72552490234375, 1.7838897705078125, 1.842254638671875, 1.9006195068359375, 1.958984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 7.0, 21.0, 42.0, 80.0, 132.0, 165.0, 188.0, 171.0, 103.0, 51.0, 16.0, 13.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.179046630859375, -17.65424156188965, -17.129436492919922, -16.604633331298828, -16.0798282623291, -15.555023193359375, -15.030218124389648, -14.505413055419922, -13.980608940124512, -13.455803871154785, -12.930999755859375, -12.406194686889648, -11.881389617919922, -11.356585502624512, -10.831780433654785, -10.306976318359375, -9.782171249389648, -9.257366180419922, -8.732562065124512, -8.207756996154785, -7.682952404022217, -7.158147811889648, -6.633342742919922, -6.1085381507873535, -5.583733558654785, -5.058928966522217, -4.534124374389648, -4.009319305419922, -3.4845147132873535, -2.959710121154785, -2.4349052906036377, -1.9101004600524902, -1.385293960571289, -0.8604892492294312, -0.33568453788757324, 0.18912017345428467, 0.7139248847961426, 1.238729476928711, 1.7635343074798584, 2.288339138031006, 2.813143730163574, 3.3379483222961426, 3.86275315284729, 4.3875579833984375, 4.912362575531006, 5.437167167663574, 5.961972236633301, 6.486776828765869, 7.0115814208984375, 7.536386013031006, 8.061190605163574, 8.5859956741333, 9.110799789428711, 9.635604858398438, 10.160409927368164, 10.68521499633789, 11.2100191116333, 11.734824180603027, 12.259628295898438, 12.784433364868164, 13.30923843383789, 13.8340425491333, 14.358847618103027, 14.883651733398438, 15.408456802368164]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 11.0, 6.0, 14.0, 10.0, 17.0, 23.0, 25.0, 20.0, 25.0, 36.0, 36.0, 40.0, 38.0, 52.0, 40.0, 41.0, 45.0, 44.0, 46.0, 42.0, 48.0, 36.0, 46.0, 39.0, 39.0, 42.0, 32.0, 17.0, 13.0, 16.0, 17.0, 9.0, 9.0, 4.0, 7.0, 3.0, 2.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.886143684387207, -5.685298442840576, -5.4844536781311035, -5.283608436584473, -5.082763195037842, -4.881917953491211, -4.681073188781738, -4.480227947235107, -4.279382705688477, -4.078537464141846, -3.877692461013794, -3.676847457885742, -3.4760022163391113, -3.2751572132110596, -3.074312210083008, -2.873466968536377, -2.6726222038269043, -2.4717772006988525, -2.2709319591522217, -2.07008695602417, -1.8692418336868286, -1.6683967113494873, -1.4675517082214355, -1.2667065858840942, -1.065861463546753, -0.8650163412094116, -0.6641712784767151, -0.46332621574401855, -0.26248109340667725, -0.06163597106933594, 0.13920903205871582, 0.34005415439605713, 0.5408992767333984, 0.7417443990707397, 0.9425894618034363, 1.1434345245361328, 1.3442796468734741, 1.5451247692108154, 1.7459697723388672, 1.9468148946762085, 2.14766001701355, 2.3485050201416016, 2.5493502616882324, 2.750195264816284, 2.951040267944336, 3.151885509490967, 3.3527305126190186, 3.5535755157470703, 3.754420757293701, 3.955265760421753, 4.156110763549805, 4.3569560050964355, 4.557801246643066, 4.758646011352539, 4.95949125289917, 5.160336494445801, 5.361181259155273, 5.562026500701904, 5.762871265411377, 5.963716506958008, 6.164561748504639, 6.3654069900512695, 6.566251754760742, 6.767096996307373, 6.967942237854004]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 6.0, 13.0, 27.0, 22.0, 37.0, 53.0, 92.0, 154.0, 193.0, 410.0, 692.0, 1203.0, 2320.0, 4751.0, 10346.0, 22368.0, 48962.0, 100129.0, 199052.0, 299505.0, 183291.0, 91404.0, 44115.0, 20602.0, 9399.0, 4506.0, 2173.0, 1123.0, 653.0, 380.0, 219.0, 130.0, 78.0, 55.0, 28.0, 25.0, 15.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.150390625, -3.061492919921875, -2.97259521484375, -2.883697509765625, -2.7947998046875, -2.705902099609375, -2.61700439453125, -2.528106689453125, -2.439208984375, -2.350311279296875, -2.26141357421875, -2.172515869140625, -2.0836181640625, -1.994720458984375, -1.90582275390625, -1.816925048828125, -1.72802734375, -1.639129638671875, -1.55023193359375, -1.461334228515625, -1.3724365234375, -1.283538818359375, -1.19464111328125, -1.105743408203125, -1.016845703125, -0.927947998046875, -0.83905029296875, -0.750152587890625, -0.6612548828125, -0.572357177734375, -0.48345947265625, -0.394561767578125, -0.3056640625, -0.216766357421875, -0.12786865234375, -0.038970947265625, 0.0499267578125, 0.138824462890625, 0.22772216796875, 0.316619873046875, 0.405517578125, 0.494415283203125, 0.58331298828125, 0.672210693359375, 0.7611083984375, 0.850006103515625, 0.93890380859375, 1.027801513671875, 1.11669921875, 1.205596923828125, 1.29449462890625, 1.383392333984375, 1.4722900390625, 1.561187744140625, 1.65008544921875, 1.738983154296875, 1.827880859375, 1.916778564453125, 2.00567626953125, 2.094573974609375, 2.1834716796875, 2.272369384765625, 2.36126708984375, 2.450164794921875, 2.5390625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 6.0, 7.0, 17.0, 7.0, 10.0, 16.0, 18.0, 29.0, 28.0, 40.0, 39.0, 46.0, 48.0, 48.0, 67.0, 56.0, 56.0, 52.0, 62.0, 54.0, 45.0, 43.0, 32.0, 41.0, 24.0, 29.0, 19.0, 17.0, 11.0, 11.0, 7.0, 3.0, 6.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2060546875, -1.1688232421875, -1.131591796875, -1.0943603515625, -1.05712890625, -1.0198974609375, -0.982666015625, -0.9454345703125, -0.908203125, -0.8709716796875, -0.833740234375, -0.7965087890625, -0.75927734375, -0.7220458984375, -0.684814453125, -0.6475830078125, -0.6103515625, -0.5731201171875, -0.535888671875, -0.4986572265625, -0.46142578125, -0.4241943359375, -0.386962890625, -0.3497314453125, -0.3125, -0.2752685546875, -0.238037109375, -0.2008056640625, -0.16357421875, -0.1263427734375, -0.089111328125, -0.0518798828125, -0.0146484375, 0.0225830078125, 0.059814453125, 0.0970458984375, 0.13427734375, 0.1715087890625, 0.208740234375, 0.2459716796875, 0.283203125, 0.3204345703125, 0.357666015625, 0.3948974609375, 0.43212890625, 0.4693603515625, 0.506591796875, 0.5438232421875, 0.5810546875, 0.6182861328125, 0.655517578125, 0.6927490234375, 0.72998046875, 0.7672119140625, 0.804443359375, 0.8416748046875, 0.87890625, 0.9161376953125, 0.953369140625, 0.9906005859375, 1.02783203125, 1.0650634765625, 1.102294921875, 1.1395263671875, 1.1767578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 3.0, 7.0, 9.0, 8.0, 16.0, 32.0, 29.0, 46.0, 65.0, 80.0, 101.0, 137.0, 181.0, 276.0, 436.0, 678.0, 1115.0, 2592.0, 10002.0, 56766.0, 353991.0, 514259.0, 86255.0, 14437.0, 3506.0, 1301.0, 735.0, 419.0, 301.0, 199.0, 147.0, 120.0, 87.0, 59.0, 35.0, 23.0, 29.0, 16.0, 19.0, 11.0, 7.0, 9.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.87109375, -5.66943359375, -5.4677734375, -5.26611328125, -5.064453125, -4.86279296875, -4.6611328125, -4.45947265625, -4.2578125, -4.05615234375, -3.8544921875, -3.65283203125, -3.451171875, -3.24951171875, -3.0478515625, -2.84619140625, -2.64453125, -2.44287109375, -2.2412109375, -2.03955078125, -1.837890625, -1.63623046875, -1.4345703125, -1.23291015625, -1.03125, -0.82958984375, -0.6279296875, -0.42626953125, -0.224609375, -0.02294921875, 0.1787109375, 0.38037109375, 0.58203125, 0.78369140625, 0.9853515625, 1.18701171875, 1.388671875, 1.59033203125, 1.7919921875, 1.99365234375, 2.1953125, 2.39697265625, 2.5986328125, 2.80029296875, 3.001953125, 3.20361328125, 3.4052734375, 3.60693359375, 3.80859375, 4.01025390625, 4.2119140625, 4.41357421875, 4.615234375, 4.81689453125, 5.0185546875, 5.22021484375, 5.421875, 5.62353515625, 5.8251953125, 6.02685546875, 6.228515625, 6.43017578125, 6.6318359375, 6.83349609375, 7.03515625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 5.0, 4.0, 10.0, 10.0, 17.0, 13.0, 14.0, 15.0, 18.0, 21.0, 31.0, 25.0, 42.0, 41.0, 41.0, 52.0, 45.0, 55.0, 63.0, 32.0, 64.0, 47.0, 40.0, 49.0, 26.0, 31.0, 35.0, 21.0, 21.0, 15.0, 23.0, 8.0, 14.0, 7.0, 8.0, 9.0, 6.0, 5.0, 2.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.01953125, -4.85162353515625, -4.6837158203125, -4.51580810546875, -4.347900390625, -4.17999267578125, -4.0120849609375, -3.84417724609375, -3.67626953125, -3.50836181640625, -3.3404541015625, -3.17254638671875, -3.004638671875, -2.83673095703125, -2.6688232421875, -2.50091552734375, -2.3330078125, -2.16510009765625, -1.9971923828125, -1.82928466796875, -1.661376953125, -1.49346923828125, -1.3255615234375, -1.15765380859375, -0.98974609375, -0.82183837890625, -0.6539306640625, -0.48602294921875, -0.318115234375, -0.15020751953125, 0.0177001953125, 0.18560791015625, 0.353515625, 0.52142333984375, 0.6893310546875, 0.85723876953125, 1.025146484375, 1.19305419921875, 1.3609619140625, 1.52886962890625, 1.69677734375, 1.86468505859375, 2.0325927734375, 2.20050048828125, 2.368408203125, 2.53631591796875, 2.7042236328125, 2.87213134765625, 3.0400390625, 3.20794677734375, 3.3758544921875, 3.54376220703125, 3.711669921875, 3.87957763671875, 4.0474853515625, 4.21539306640625, 4.38330078125, 4.55120849609375, 4.7191162109375, 4.88702392578125, 5.054931640625, 5.22283935546875, 5.3907470703125, 5.55865478515625, 5.7265625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 12.0, 18.0, 27.0, 39.0, 62.0, 128.0, 269.0, 494.0, 1179.0, 3327.0, 19779.0, 766349.0, 241653.0, 10924.0, 2467.0, 931.0, 415.0, 206.0, 101.0, 71.0, 35.0, 18.0, 15.0, 13.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-12.9296875, -12.61334228515625, -12.2969970703125, -11.98065185546875, -11.664306640625, -11.34796142578125, -11.0316162109375, -10.71527099609375, -10.39892578125, -10.08258056640625, -9.7662353515625, -9.44989013671875, -9.133544921875, -8.81719970703125, -8.5008544921875, -8.18450927734375, -7.8681640625, -7.55181884765625, -7.2354736328125, -6.91912841796875, -6.602783203125, -6.28643798828125, -5.9700927734375, -5.65374755859375, -5.33740234375, -5.02105712890625, -4.7047119140625, -4.38836669921875, -4.072021484375, -3.75567626953125, -3.4393310546875, -3.12298583984375, -2.806640625, -2.49029541015625, -2.1739501953125, -1.85760498046875, -1.541259765625, -1.22491455078125, -0.9085693359375, -0.59222412109375, -0.27587890625, 0.04046630859375, 0.3568115234375, 0.67315673828125, 0.989501953125, 1.30584716796875, 1.6221923828125, 1.93853759765625, 2.2548828125, 2.57122802734375, 2.8875732421875, 3.20391845703125, 3.520263671875, 3.83660888671875, 4.1529541015625, 4.46929931640625, 4.78564453125, 5.10198974609375, 5.4183349609375, 5.73468017578125, 6.051025390625, 6.36737060546875, 6.6837158203125, 7.00006103515625, 7.31640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 7.0, 11.0, 11.0, 12.0, 33.0, 44.0, 46.0, 62.0, 110.0, 312.0, 89.0, 71.0, 50.0, 39.0, 21.0, 22.0, 14.0, 12.0, 8.0, 3.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0013685226440429688, -0.0013363063335418701, -0.0013040900230407715, -0.0012718737125396729, -0.0012396574020385742, -0.0012074410915374756, -0.001175224781036377, -0.0011430084705352783, -0.0011107921600341797, -0.001078575849533081, -0.0010463595390319824, -0.0010141432285308838, -0.0009819269180297852, -0.0009497106075286865, -0.0009174942970275879, -0.0008852779865264893, -0.0008530616760253906, -0.000820845365524292, -0.0007886290550231934, -0.0007564127445220947, -0.0007241964340209961, -0.0006919801235198975, -0.0006597638130187988, -0.0006275475025177002, -0.0005953311920166016, -0.0005631148815155029, -0.0005308985710144043, -0.0004986822605133057, -0.00046646595001220703, -0.0004342496395111084, -0.00040203332901000977, -0.00036981701850891113, -0.0003376007080078125, -0.00030538439750671387, -0.00027316808700561523, -0.0002409517765045166, -0.00020873546600341797, -0.00017651915550231934, -0.0001443028450012207, -0.00011208653450012207, -7.987022399902344e-05, -4.7653913497924805e-05, -1.5437602996826172e-05, 1.677870750427246e-05, 4.8995018005371094e-05, 8.121132850646973e-05, 0.00011342763900756836, 0.000145643949508667, 0.00017786026000976562, 0.00021007657051086426, 0.0002422928810119629, 0.0002745091915130615, 0.00030672550201416016, 0.0003389418125152588, 0.0003711581230163574, 0.00040337443351745605, 0.0004355907440185547, 0.0004678070545196533, 0.000500023365020752, 0.0005322396755218506, 0.0005644559860229492, 0.0005966722965240479, 0.0006288886070251465, 0.0006611049175262451, 0.0006933212280273438]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 6.0, 7.0, 6.0, 15.0, 26.0, 35.0, 117.0, 309.0, 906.0, 5945.0, 692273.0, 342989.0, 4699.0, 763.0, 249.0, 100.0, 46.0, 24.0, 13.0, 5.0, 10.0, 3.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.484375, -15.0283203125, -14.572265625, -14.1162109375, -13.66015625, -13.2041015625, -12.748046875, -12.2919921875, -11.8359375, -11.3798828125, -10.923828125, -10.4677734375, -10.01171875, -9.5556640625, -9.099609375, -8.6435546875, -8.1875, -7.7314453125, -7.275390625, -6.8193359375, -6.36328125, -5.9072265625, -5.451171875, -4.9951171875, -4.5390625, -4.0830078125, -3.626953125, -3.1708984375, -2.71484375, -2.2587890625, -1.802734375, -1.3466796875, -0.890625, -0.4345703125, 0.021484375, 0.4775390625, 0.93359375, 1.3896484375, 1.845703125, 2.3017578125, 2.7578125, 3.2138671875, 3.669921875, 4.1259765625, 4.58203125, 5.0380859375, 5.494140625, 5.9501953125, 6.40625, 6.8623046875, 7.318359375, 7.7744140625, 8.23046875, 8.6865234375, 9.142578125, 9.5986328125, 10.0546875, 10.5107421875, 10.966796875, 11.4228515625, 11.87890625, 12.3349609375, 12.791015625, 13.2470703125, 13.703125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 12.0, 10.0, 19.0, 14.0, 22.0, 40.0, 46.0, 94.0, 193.0, 224.0, 115.0, 66.0, 39.0, 27.0, 11.0, 16.0, 18.0, 7.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.90625, -7.7188720703125, -7.531494140625, -7.3441162109375, -7.15673828125, -6.9693603515625, -6.781982421875, -6.5946044921875, -6.4072265625, -6.2198486328125, -6.032470703125, -5.8450927734375, -5.65771484375, -5.4703369140625, -5.282958984375, -5.0955810546875, -4.908203125, -4.7208251953125, -4.533447265625, -4.3460693359375, -4.15869140625, -3.9713134765625, -3.783935546875, -3.5965576171875, -3.4091796875, -3.2218017578125, -3.034423828125, -2.8470458984375, -2.65966796875, -2.4722900390625, -2.284912109375, -2.0975341796875, -1.91015625, -1.7227783203125, -1.535400390625, -1.3480224609375, -1.16064453125, -0.9732666015625, -0.785888671875, -0.5985107421875, -0.4111328125, -0.2237548828125, -0.036376953125, 0.1510009765625, 0.33837890625, 0.5257568359375, 0.713134765625, 0.9005126953125, 1.087890625, 1.2752685546875, 1.462646484375, 1.6500244140625, 1.83740234375, 2.0247802734375, 2.212158203125, 2.3995361328125, 2.5869140625, 2.7742919921875, 2.961669921875, 3.1490478515625, 3.33642578125, 3.5238037109375, 3.711181640625, 3.8985595703125, 4.0859375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 8.0, 32.0, 56.0, 138.0, 235.0, 251.0, 159.0, 73.0, 28.0, 9.0, 10.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.49754333496094, -98.9023666381836, -96.30718994140625, -93.7120132446289, -91.11683654785156, -88.52165985107422, -85.92648315429688, -83.331298828125, -80.73612976074219, -78.14095306396484, -75.5457763671875, -72.95059967041016, -70.35542297363281, -67.76024627685547, -65.16506958007812, -62.569889068603516, -59.974708557128906, -57.37953186035156, -54.78435516357422, -52.189178466796875, -49.59400177001953, -46.99882507324219, -44.40364456176758, -41.808467864990234, -39.21329116821289, -36.61811447143555, -34.0229377746582, -31.427759170532227, -28.832582473754883, -26.23740577697754, -23.642227172851562, -21.04705047607422, -18.451873779296875, -15.856697082519531, -13.261519432067871, -10.666341781616211, -8.071165084838867, -5.475988388061523, -2.8808107376098633, -0.2856330871582031, 2.3095436096191406, 4.904720783233643, 7.4998979568481445, 10.095075607299805, 12.690252304077148, 15.285429000854492, 17.88060760498047, 20.475784301757812, 23.070960998535156, 25.6661376953125, 28.261314392089844, 30.85649299621582, 33.45166778564453, 36.046844482421875, 38.642024993896484, 41.23720169067383, 43.83237838745117, 46.427555084228516, 49.02273178100586, 51.6179084777832, 54.21308898925781, 56.808265686035156, 59.4034423828125, 61.998619079589844, 64.59379577636719]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 8.0, 5.0, 8.0, 6.0, 12.0, 13.0, 19.0, 22.0, 23.0, 30.0, 28.0, 27.0, 43.0, 38.0, 39.0, 39.0, 43.0, 51.0, 36.0, 39.0, 45.0, 48.0, 44.0, 31.0, 27.0, 26.0, 36.0, 30.0, 25.0, 24.0, 29.0, 15.0, 9.0, 17.0, 13.0, 6.0, 6.0, 5.0, 6.0, 3.0, 5.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.830400466918945, -28.930217742919922, -28.03003692626953, -27.129854202270508, -26.229671478271484, -25.32948875427246, -24.429306030273438, -23.529125213623047, -22.628942489624023, -21.728759765625, -20.82857894897461, -19.928396224975586, -19.028213500976562, -18.12803077697754, -17.227848052978516, -16.327667236328125, -15.427484512329102, -14.527301788330078, -13.627120018005371, -12.726938247680664, -11.82675552368164, -10.926572799682617, -10.02639102935791, -9.126209259033203, -8.22602653503418, -7.3258442878723145, -6.425662040710449, -5.525479793548584, -4.625297546386719, -3.7251152992248535, -2.8249330520629883, -1.924750804901123, -1.0245704650878906, -0.12438821792602539, 0.7757940292358398, 1.675976276397705, 2.5761585235595703, 3.4763407707214355, 4.376523017883301, 5.276705265045166, 6.176887512207031, 7.0770697593688965, 7.977252006530762, 8.877433776855469, 9.777616500854492, 10.677799224853516, 11.577980995178223, 12.47816276550293, 13.378345489501953, 14.278528213500977, 15.178709983825684, 16.07889175415039, 16.979074478149414, 17.879257202148438, 18.779438018798828, 19.67962074279785, 20.579803466796875, 21.4799861907959, 22.380168914794922, 23.280349731445312, 24.180532455444336, 25.08071517944336, 25.98089599609375, 26.881078720092773, 27.781261444091797]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 2.0, 6.0, 8.0, 8.0, 11.0, 12.0, 16.0, 20.0, 29.0, 51.0, 87.0, 147.0, 275.0, 595.0, 1280.0, 3222.0, 8968.0, 32575.0, 178641.0, 3217370.0, 652322.0, 72434.0, 17045.0, 5370.0, 2034.0, 846.0, 375.0, 199.0, 109.0, 84.0, 52.0, 24.0, 23.0, 14.0, 6.0, 4.0, 9.0, 5.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65625, -4.5096435546875, -4.363037109375, -4.2164306640625, -4.06982421875, -3.9232177734375, -3.776611328125, -3.6300048828125, -3.4833984375, -3.3367919921875, -3.190185546875, -3.0435791015625, -2.89697265625, -2.7503662109375, -2.603759765625, -2.4571533203125, -2.310546875, -2.1639404296875, -2.017333984375, -1.8707275390625, -1.72412109375, -1.5775146484375, -1.430908203125, -1.2843017578125, -1.1376953125, -0.9910888671875, -0.844482421875, -0.6978759765625, -0.55126953125, -0.4046630859375, -0.258056640625, -0.1114501953125, 0.03515625, 0.1817626953125, 0.328369140625, 0.4749755859375, 0.62158203125, 0.7681884765625, 0.914794921875, 1.0614013671875, 1.2080078125, 1.3546142578125, 1.501220703125, 1.6478271484375, 1.79443359375, 1.9410400390625, 2.087646484375, 2.2342529296875, 2.380859375, 2.5274658203125, 2.674072265625, 2.8206787109375, 2.96728515625, 3.1138916015625, 3.260498046875, 3.4071044921875, 3.5537109375, 3.7003173828125, 3.846923828125, 3.9935302734375, 4.14013671875, 4.2867431640625, 4.433349609375, 4.5799560546875, 4.7265625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 6.0, 12.0, 8.0, 13.0, 16.0, 14.0, 19.0, 27.0, 33.0, 34.0, 30.0, 33.0, 47.0, 53.0, 52.0, 53.0, 50.0, 60.0, 50.0, 42.0, 38.0, 54.0, 31.0, 41.0, 31.0, 29.0, 17.0, 18.0, 16.0, 19.0, 18.0, 10.0, 3.0, 5.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1982421875, -1.1595306396484375, -1.120819091796875, -1.0821075439453125, -1.04339599609375, -1.0046844482421875, -0.965972900390625, -0.9272613525390625, -0.8885498046875, -0.8498382568359375, -0.811126708984375, -0.7724151611328125, -0.73370361328125, -0.6949920654296875, -0.656280517578125, -0.6175689697265625, -0.578857421875, -0.5401458740234375, -0.501434326171875, -0.4627227783203125, -0.42401123046875, -0.3852996826171875, -0.346588134765625, -0.3078765869140625, -0.2691650390625, -0.2304534912109375, -0.191741943359375, -0.1530303955078125, -0.11431884765625, -0.0756072998046875, -0.036895751953125, 0.0018157958984375, 0.04052734375, 0.0792388916015625, 0.117950439453125, 0.1566619873046875, 0.19537353515625, 0.2340850830078125, 0.272796630859375, 0.3115081787109375, 0.3502197265625, 0.3889312744140625, 0.427642822265625, 0.4663543701171875, 0.50506591796875, 0.5437774658203125, 0.582489013671875, 0.6212005615234375, 0.659912109375, 0.6986236572265625, 0.737335205078125, 0.7760467529296875, 0.81475830078125, 0.8534698486328125, 0.892181396484375, 0.9308929443359375, 0.9696044921875, 1.0083160400390625, 1.047027587890625, 1.0857391357421875, 1.12445068359375, 1.1631622314453125, 1.201873779296875, 1.2405853271484375, 1.279296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 5.0, 9.0, 17.0, 23.0, 30.0, 33.0, 49.0, 78.0, 115.0, 165.0, 246.0, 464.0, 822.0, 1453.0, 2991.0, 6088.0, 14488.0, 37734.0, 119615.0, 596982.0, 2887924.0, 383377.0, 89501.0, 29770.0, 11623.0, 5094.0, 2438.0, 1240.0, 697.0, 427.0, 271.0, 163.0, 123.0, 68.0, 53.0, 25.0, 24.0, 11.0, 14.0, 13.0, 9.0, 4.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0], "bins": [-4.68359375, -4.55487060546875, -4.4261474609375, -4.29742431640625, -4.168701171875, -4.03997802734375, -3.9112548828125, -3.78253173828125, -3.65380859375, -3.52508544921875, -3.3963623046875, -3.26763916015625, -3.138916015625, -3.01019287109375, -2.8814697265625, -2.75274658203125, -2.6240234375, -2.49530029296875, -2.3665771484375, -2.23785400390625, -2.109130859375, -1.98040771484375, -1.8516845703125, -1.72296142578125, -1.59423828125, -1.46551513671875, -1.3367919921875, -1.20806884765625, -1.079345703125, -0.95062255859375, -0.8218994140625, -0.69317626953125, -0.564453125, -0.43572998046875, -0.3070068359375, -0.17828369140625, -0.049560546875, 0.07916259765625, 0.2078857421875, 0.33660888671875, 0.46533203125, 0.59405517578125, 0.7227783203125, 0.85150146484375, 0.980224609375, 1.10894775390625, 1.2376708984375, 1.36639404296875, 1.4951171875, 1.62384033203125, 1.7525634765625, 1.88128662109375, 2.010009765625, 2.13873291015625, 2.2674560546875, 2.39617919921875, 2.52490234375, 2.65362548828125, 2.7823486328125, 2.91107177734375, 3.039794921875, 3.16851806640625, 3.2972412109375, 3.42596435546875, 3.5546875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 5.0, 2.0, 5.0, 4.0, 13.0, 22.0, 14.0, 22.0, 22.0, 53.0, 52.0, 89.0, 136.0, 230.0, 401.0, 1030.0, 962.0, 369.0, 219.0, 133.0, 108.0, 46.0, 42.0, 23.0, 17.0, 13.0, 10.0, 13.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.26171875, -2.18365478515625, -2.1055908203125, -2.02752685546875, -1.949462890625, -1.87139892578125, -1.7933349609375, -1.71527099609375, -1.63720703125, -1.55914306640625, -1.4810791015625, -1.40301513671875, -1.324951171875, -1.24688720703125, -1.1688232421875, -1.09075927734375, -1.0126953125, -0.93463134765625, -0.8565673828125, -0.77850341796875, -0.700439453125, -0.62237548828125, -0.5443115234375, -0.46624755859375, -0.38818359375, -0.31011962890625, -0.2320556640625, -0.15399169921875, -0.075927734375, 0.00213623046875, 0.0802001953125, 0.15826416015625, 0.236328125, 0.31439208984375, 0.3924560546875, 0.47052001953125, 0.548583984375, 0.62664794921875, 0.7047119140625, 0.78277587890625, 0.86083984375, 0.93890380859375, 1.0169677734375, 1.09503173828125, 1.173095703125, 1.25115966796875, 1.3292236328125, 1.40728759765625, 1.4853515625, 1.56341552734375, 1.6414794921875, 1.71954345703125, 1.797607421875, 1.87567138671875, 1.9537353515625, 2.03179931640625, 2.10986328125, 2.18792724609375, 2.2659912109375, 2.34405517578125, 2.422119140625, 2.50018310546875, 2.5782470703125, 2.65631103515625, 2.734375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 13.0, 9.0, 53.0, 92.0, 136.0, 197.0, 197.0, 133.0, 93.0, 59.0, 16.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.233524322509766, -45.31840515136719, -44.403282165527344, -43.488162994384766, -42.57304000854492, -41.657920837402344, -40.7427978515625, -39.82767868041992, -38.912559509277344, -37.997440338134766, -37.08231735229492, -36.167198181152344, -35.2520751953125, -34.33695602416992, -33.421836853027344, -32.5067138671875, -31.59159278869629, -30.676471710205078, -29.761350631713867, -28.846229553222656, -27.931110382080078, -27.015989303588867, -26.100868225097656, -25.185747146606445, -24.270626068115234, -23.355504989624023, -22.440383911132812, -21.525264739990234, -20.610143661499023, -19.695022583007812, -18.7799015045166, -17.86478042602539, -16.949661254882812, -16.0345401763916, -15.119420051574707, -14.204298973083496, -13.289178848266602, -12.37405776977539, -11.45893669128418, -10.543815612792969, -9.62869644165039, -8.71357536315918, -7.798455238342285, -6.883334159851074, -5.9682135581970215, -5.053092956542969, -4.137971878051758, -3.222851276397705, -2.3077306747436523, -1.39260995388031, -0.4774892330169678, 0.43763160705566406, 1.3527522087097168, 2.2678728103637695, 3.1829938888549805, 4.098114490509033, 5.013235092163086, 5.928355693817139, 6.843476295471191, 7.758597373962402, 8.673717498779297, 9.588838577270508, 10.503959655761719, 11.41908073425293, 12.334200859069824]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 6.0, 6.0, 14.0, 17.0, 15.0, 18.0, 23.0, 33.0, 30.0, 42.0, 46.0, 53.0, 44.0, 42.0, 50.0, 65.0, 76.0, 49.0, 54.0, 56.0, 50.0, 36.0, 29.0, 30.0, 27.0, 27.0, 19.0, 10.0, 11.0, 9.0, 9.0, 5.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.575841903686523, -10.180875778198242, -9.785910606384277, -9.390944480895996, -8.995979309082031, -8.60101318359375, -8.206047058105469, -7.811081886291504, -7.416115760803223, -7.0211501121521, -6.626184463500977, -6.231218338012695, -5.836252689361572, -5.441287040710449, -5.046321392059326, -4.651355743408203, -4.25639009475708, -3.861424446105957, -3.466458559036255, -3.071492910385132, -2.6765270233154297, -2.2815613746643066, -1.8865957260131836, -1.4916298389434814, -1.0966641902923584, -0.7016984224319458, -0.306732714176178, 0.08823299407958984, 0.48319876194000244, 0.878164529800415, 1.273130178451538, 1.6680960655212402, 2.0630617141723633, 2.4580273628234863, 2.8529932498931885, 3.2479588985443115, 3.6429247856140137, 4.037890434265137, 4.43285608291626, 4.827821731567383, 5.222787857055664, 5.617753505706787, 6.01271915435791, 6.407685279846191, 6.8026509284973145, 7.1976165771484375, 7.5925822257995605, 7.987547874450684, 8.382513046264648, 8.77747917175293, 9.172444343566895, 9.567410469055176, 9.96237564086914, 10.357341766357422, 10.752307891845703, 11.147273063659668, 11.54223918914795, 11.93720531463623, 12.332170486450195, 12.727136611938477, 13.122101783752441, 13.517067909240723, 13.912033081054688, 14.306999206542969, 14.70196533203125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 3.0, 9.0, 11.0, 10.0, 26.0, 15.0, 35.0, 47.0, 76.0, 85.0, 144.0, 210.0, 377.0, 713.0, 1274.0, 2420.0, 5149.0, 10448.0, 22489.0, 48262.0, 98723.0, 174245.0, 229001.0, 203176.0, 127326.0, 65057.0, 31007.0, 14366.0, 6645.0, 3268.0, 1682.0, 943.0, 509.0, 284.0, 179.0, 122.0, 71.0, 46.0, 21.0, 23.0, 17.0, 13.0, 10.0, 4.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0], "bins": [-3.69140625, -3.5880126953125, -3.484619140625, -3.3812255859375, -3.27783203125, -3.1744384765625, -3.071044921875, -2.9676513671875, -2.8642578125, -2.7608642578125, -2.657470703125, -2.5540771484375, -2.45068359375, -2.3472900390625, -2.243896484375, -2.1405029296875, -2.037109375, -1.9337158203125, -1.830322265625, -1.7269287109375, -1.62353515625, -1.5201416015625, -1.416748046875, -1.3133544921875, -1.2099609375, -1.1065673828125, -1.003173828125, -0.8997802734375, -0.79638671875, -0.6929931640625, -0.589599609375, -0.4862060546875, -0.3828125, -0.2794189453125, -0.176025390625, -0.0726318359375, 0.03076171875, 0.1341552734375, 0.237548828125, 0.3409423828125, 0.4443359375, 0.5477294921875, 0.651123046875, 0.7545166015625, 0.85791015625, 0.9613037109375, 1.064697265625, 1.1680908203125, 1.271484375, 1.3748779296875, 1.478271484375, 1.5816650390625, 1.68505859375, 1.7884521484375, 1.891845703125, 1.9952392578125, 2.0986328125, 2.2020263671875, 2.305419921875, 2.4088134765625, 2.51220703125, 2.6156005859375, 2.718994140625, 2.8223876953125, 2.92578125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 7.0, 9.0, 6.0, 14.0, 8.0, 9.0, 15.0, 21.0, 30.0, 39.0, 35.0, 42.0, 41.0, 43.0, 56.0, 51.0, 49.0, 54.0, 51.0, 72.0, 41.0, 43.0, 38.0, 29.0, 30.0, 35.0, 20.0, 30.0, 23.0, 22.0, 10.0, 9.0, 6.0, 3.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2646484375, -1.2232818603515625, -1.181915283203125, -1.1405487060546875, -1.09918212890625, -1.0578155517578125, -1.016448974609375, -0.9750823974609375, -0.9337158203125, -0.8923492431640625, -0.850982666015625, -0.8096160888671875, -0.76824951171875, -0.7268829345703125, -0.685516357421875, -0.6441497802734375, -0.602783203125, -0.5614166259765625, -0.520050048828125, -0.4786834716796875, -0.43731689453125, -0.3959503173828125, -0.354583740234375, -0.3132171630859375, -0.2718505859375, -0.2304840087890625, -0.189117431640625, -0.1477508544921875, -0.10638427734375, -0.0650177001953125, -0.023651123046875, 0.0177154541015625, 0.05908203125, 0.1004486083984375, 0.141815185546875, 0.1831817626953125, 0.22454833984375, 0.2659149169921875, 0.307281494140625, 0.3486480712890625, 0.3900146484375, 0.4313812255859375, 0.472747802734375, 0.5141143798828125, 0.55548095703125, 0.5968475341796875, 0.638214111328125, 0.6795806884765625, 0.720947265625, 0.7623138427734375, 0.803680419921875, 0.8450469970703125, 0.88641357421875, 0.9277801513671875, 0.969146728515625, 1.0105133056640625, 1.0518798828125, 1.0932464599609375, 1.134613037109375, 1.1759796142578125, 1.21734619140625, 1.2587127685546875, 1.300079345703125, 1.3414459228515625, 1.3828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 9.0, 11.0, 15.0, 21.0, 37.0, 46.0, 57.0, 84.0, 126.0, 158.0, 214.0, 331.0, 497.0, 744.0, 1190.0, 2751.0, 10318.0, 62106.0, 366053.0, 481515.0, 99716.0, 15134.0, 3473.0, 1372.0, 787.0, 565.0, 340.0, 247.0, 159.0, 126.0, 91.0, 68.0, 43.0, 46.0, 26.0, 20.0, 13.0, 9.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.4296875, -8.1588134765625, -7.887939453125, -7.6170654296875, -7.34619140625, -7.0753173828125, -6.804443359375, -6.5335693359375, -6.2626953125, -5.9918212890625, -5.720947265625, -5.4500732421875, -5.17919921875, -4.9083251953125, -4.637451171875, -4.3665771484375, -4.095703125, -3.8248291015625, -3.553955078125, -3.2830810546875, -3.01220703125, -2.7413330078125, -2.470458984375, -2.1995849609375, -1.9287109375, -1.6578369140625, -1.386962890625, -1.1160888671875, -0.84521484375, -0.5743408203125, -0.303466796875, -0.0325927734375, 0.23828125, 0.5091552734375, 0.780029296875, 1.0509033203125, 1.32177734375, 1.5926513671875, 1.863525390625, 2.1343994140625, 2.4052734375, 2.6761474609375, 2.947021484375, 3.2178955078125, 3.48876953125, 3.7596435546875, 4.030517578125, 4.3013916015625, 4.572265625, 4.8431396484375, 5.114013671875, 5.3848876953125, 5.65576171875, 5.9266357421875, 6.197509765625, 6.4683837890625, 6.7392578125, 7.0101318359375, 7.281005859375, 7.5518798828125, 7.82275390625, 8.0936279296875, 8.364501953125, 8.6353759765625, 8.90625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 10.0, 7.0, 8.0, 6.0, 6.0, 12.0, 13.0, 21.0, 22.0, 26.0, 28.0, 24.0, 25.0, 27.0, 32.0, 37.0, 42.0, 47.0, 47.0, 48.0, 42.0, 56.0, 36.0, 34.0, 43.0, 41.0, 41.0, 37.0, 27.0, 25.0, 21.0, 15.0, 17.0, 18.0, 12.0, 11.0, 11.0, 2.0, 12.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-7.5078125, -7.2847900390625, -7.061767578125, -6.8387451171875, -6.61572265625, -6.3927001953125, -6.169677734375, -5.9466552734375, -5.7236328125, -5.5006103515625, -5.277587890625, -5.0545654296875, -4.83154296875, -4.6085205078125, -4.385498046875, -4.1624755859375, -3.939453125, -3.7164306640625, -3.493408203125, -3.2703857421875, -3.04736328125, -2.8243408203125, -2.601318359375, -2.3782958984375, -2.1552734375, -1.9322509765625, -1.709228515625, -1.4862060546875, -1.26318359375, -1.0401611328125, -0.817138671875, -0.5941162109375, -0.37109375, -0.1480712890625, 0.074951171875, 0.2979736328125, 0.52099609375, 0.7440185546875, 0.967041015625, 1.1900634765625, 1.4130859375, 1.6361083984375, 1.859130859375, 2.0821533203125, 2.30517578125, 2.5281982421875, 2.751220703125, 2.9742431640625, 3.197265625, 3.4202880859375, 3.643310546875, 3.8663330078125, 4.08935546875, 4.3123779296875, 4.535400390625, 4.7584228515625, 4.9814453125, 5.2044677734375, 5.427490234375, 5.6505126953125, 5.87353515625, 6.0965576171875, 6.319580078125, 6.5426025390625, 6.765625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 8.0, 7.0, 16.0, 14.0, 18.0, 35.0, 41.0, 60.0, 101.0, 127.0, 215.0, 315.0, 522.0, 979.0, 2022.0, 4771.0, 12836.0, 39363.0, 126193.0, 351673.0, 333846.0, 117705.0, 36310.0, 12215.0, 4610.0, 1983.0, 1033.0, 572.0, 328.0, 231.0, 118.0, 87.0, 59.0, 38.0, 36.0, 19.0, 15.0, 7.0, 9.0, 6.0, 5.0, 3.0, 3.0, 5.0], "bins": [-4.32421875, -4.216033935546875, -4.10784912109375, -3.999664306640625, -3.8914794921875, -3.783294677734375, -3.67510986328125, -3.566925048828125, -3.458740234375, -3.350555419921875, -3.24237060546875, -3.134185791015625, -3.0260009765625, -2.917816162109375, -2.80963134765625, -2.701446533203125, -2.59326171875, -2.485076904296875, -2.37689208984375, -2.268707275390625, -2.1605224609375, -2.052337646484375, -1.94415283203125, -1.835968017578125, -1.727783203125, -1.619598388671875, -1.51141357421875, -1.403228759765625, -1.2950439453125, -1.186859130859375, -1.07867431640625, -0.970489501953125, -0.8623046875, -0.754119873046875, -0.64593505859375, -0.537750244140625, -0.4295654296875, -0.321380615234375, -0.21319580078125, -0.105010986328125, 0.003173828125, 0.111358642578125, 0.21954345703125, 0.327728271484375, 0.4359130859375, 0.544097900390625, 0.65228271484375, 0.760467529296875, 0.86865234375, 0.976837158203125, 1.08502197265625, 1.193206787109375, 1.3013916015625, 1.409576416015625, 1.51776123046875, 1.625946044921875, 1.734130859375, 1.842315673828125, 1.95050048828125, 2.058685302734375, 2.1668701171875, 2.275054931640625, 2.38323974609375, 2.491424560546875, 2.599609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 8.0, 1.0, 8.0, 12.0, 22.0, 30.0, 29.0, 40.0, 73.0, 63.0, 76.0, 106.0, 103.0, 85.0, 84.0, 49.0, 56.0, 36.0, 33.0, 32.0, 16.0, 14.0, 10.0, 6.0, 4.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0010852813720703125, -0.0010568499565124512, -0.0010284185409545898, -0.0009999871253967285, -0.0009715557098388672, -0.0009431242942810059, -0.0009146928787231445, -0.0008862614631652832, -0.0008578300476074219, -0.0008293986320495605, -0.0008009672164916992, -0.0007725358009338379, -0.0007441043853759766, -0.0007156729698181152, -0.0006872415542602539, -0.0006588101387023926, -0.0006303787231445312, -0.0006019473075866699, -0.0005735158920288086, -0.0005450844764709473, -0.0005166530609130859, -0.0004882216453552246, -0.0004597902297973633, -0.00043135881423950195, -0.0004029273986816406, -0.0003744959831237793, -0.00034606456756591797, -0.00031763315200805664, -0.0002892017364501953, -0.000260770320892334, -0.00023233890533447266, -0.00020390748977661133, -0.00017547607421875, -0.00014704465866088867, -0.00011861324310302734, -9.018182754516602e-05, -6.175041198730469e-05, -3.331899642944336e-05, -4.887580871582031e-06, 2.3543834686279297e-05, 5.1975250244140625e-05, 8.040666580200195e-05, 0.00010883808135986328, 0.0001372694969177246, 0.00016570091247558594, 0.00019413232803344727, 0.0002225637435913086, 0.0002509951591491699, 0.00027942657470703125, 0.0003078579902648926, 0.0003362894058227539, 0.00036472082138061523, 0.00039315223693847656, 0.0004215836524963379, 0.0004500150680541992, 0.00047844648361206055, 0.0005068778991699219, 0.0005353093147277832, 0.0005637407302856445, 0.0005921721458435059, 0.0006206035614013672, 0.0006490349769592285, 0.0006774663925170898, 0.0007058978080749512, 0.0007343292236328125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 6.0, 5.0, 15.0, 15.0, 19.0, 32.0, 35.0, 78.0, 95.0, 137.0, 216.0, 340.0, 591.0, 1047.0, 2373.0, 7156.0, 33818.0, 202658.0, 580403.0, 178680.0, 29516.0, 6573.0, 2286.0, 983.0, 545.0, 312.0, 200.0, 125.0, 84.0, 70.0, 46.0, 28.0, 16.0, 15.0, 8.0, 6.0, 2.0, 5.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91796875, -4.75653076171875, -4.5950927734375, -4.43365478515625, -4.272216796875, -4.11077880859375, -3.9493408203125, -3.78790283203125, -3.62646484375, -3.46502685546875, -3.3035888671875, -3.14215087890625, -2.980712890625, -2.81927490234375, -2.6578369140625, -2.49639892578125, -2.3349609375, -2.17352294921875, -2.0120849609375, -1.85064697265625, -1.689208984375, -1.52777099609375, -1.3663330078125, -1.20489501953125, -1.04345703125, -0.88201904296875, -0.7205810546875, -0.55914306640625, -0.397705078125, -0.23626708984375, -0.0748291015625, 0.08660888671875, 0.248046875, 0.40948486328125, 0.5709228515625, 0.73236083984375, 0.893798828125, 1.05523681640625, 1.2166748046875, 1.37811279296875, 1.53955078125, 1.70098876953125, 1.8624267578125, 2.02386474609375, 2.185302734375, 2.34674072265625, 2.5081787109375, 2.66961669921875, 2.8310546875, 2.99249267578125, 3.1539306640625, 3.31536865234375, 3.476806640625, 3.63824462890625, 3.7996826171875, 3.96112060546875, 4.12255859375, 4.28399658203125, 4.4454345703125, 4.60687255859375, 4.768310546875, 4.92974853515625, 5.0911865234375, 5.25262451171875, 5.4140625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 3.0, 7.0, 8.0, 9.0, 8.0, 10.0, 21.0, 27.0, 25.0, 30.0, 33.0, 42.0, 49.0, 66.0, 51.0, 73.0, 65.0, 76.0, 62.0, 57.0, 49.0, 33.0, 37.0, 23.0, 34.0, 27.0, 19.0, 7.0, 6.0, 9.0, 9.0, 3.0, 3.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -4.000091552734375, -3.89080810546875, -3.781524658203125, -3.6722412109375, -3.562957763671875, -3.45367431640625, -3.344390869140625, -3.235107421875, -3.125823974609375, -3.01654052734375, -2.907257080078125, -2.7979736328125, -2.688690185546875, -2.57940673828125, -2.470123291015625, -2.36083984375, -2.251556396484375, -2.14227294921875, -2.032989501953125, -1.9237060546875, -1.814422607421875, -1.70513916015625, -1.595855712890625, -1.486572265625, -1.377288818359375, -1.26800537109375, -1.158721923828125, -1.0494384765625, -0.940155029296875, -0.83087158203125, -0.721588134765625, -0.6123046875, -0.503021240234375, -0.39373779296875, -0.284454345703125, -0.1751708984375, -0.065887451171875, 0.04339599609375, 0.152679443359375, 0.261962890625, 0.371246337890625, 0.48052978515625, 0.589813232421875, 0.6990966796875, 0.808380126953125, 0.91766357421875, 1.026947021484375, 1.13623046875, 1.245513916015625, 1.35479736328125, 1.464080810546875, 1.5733642578125, 1.682647705078125, 1.79193115234375, 1.901214599609375, 2.010498046875, 2.119781494140625, 2.22906494140625, 2.338348388671875, 2.4476318359375, 2.556915283203125, 2.66619873046875, 2.775482177734375, 2.884765625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 11.0, 52.0, 180.0, 342.0, 268.0, 111.0, 31.0, 9.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.76200103759766, -99.18781280517578, -94.6136245727539, -90.03943634033203, -85.46524810791016, -80.89105987548828, -76.3168716430664, -71.74268341064453, -67.16849517822266, -62.59430694580078, -58.020118713378906, -53.44593048095703, -48.871742248535156, -44.29755401611328, -39.723365783691406, -35.14917755126953, -30.574989318847656, -26.00080108642578, -21.426612854003906, -16.85242462158203, -12.278236389160156, -7.704048156738281, -3.1298599243164062, 1.4443283081054688, 6.018516540527344, 10.592704772949219, 15.166893005371094, 19.74108123779297, 24.315269470214844, 28.88945770263672, 33.463645935058594, 38.03783416748047, 42.612030029296875, 47.18621826171875, 51.760406494140625, 56.3345947265625, 60.908782958984375, 65.48297119140625, 70.05715942382812, 74.63134765625, 79.20553588867188, 83.77972412109375, 88.35391235351562, 92.9281005859375, 97.50228881835938, 102.07647705078125, 106.65066528320312, 111.224853515625, 115.79904174804688, 120.37322998046875, 124.94741821289062, 129.5216064453125, 134.09579467773438, 138.66998291015625, 143.24417114257812, 147.818359375, 152.39254760742188, 156.96673583984375, 161.54092407226562, 166.1151123046875, 170.68930053710938, 175.26348876953125, 179.83767700195312, 184.411865234375, 188.98605346679688]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 1.0, 5.0, 5.0, 7.0, 6.0, 10.0, 7.0, 16.0, 22.0, 25.0, 22.0, 24.0, 23.0, 38.0, 43.0, 38.0, 47.0, 37.0, 36.0, 61.0, 61.0, 33.0, 49.0, 48.0, 35.0, 39.0, 34.0, 36.0, 30.0, 23.0, 23.0, 18.0, 26.0, 14.0, 12.0, 9.0, 16.0, 7.0, 3.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.330036163330078, -30.151119232177734, -28.97220230102539, -27.793283462524414, -26.61436653137207, -25.435449600219727, -24.25653076171875, -23.077613830566406, -21.898696899414062, -20.71977996826172, -19.540863037109375, -18.3619441986084, -17.183027267456055, -16.00411033630371, -14.82519245147705, -13.64627456665039, -12.467357635498047, -11.288440704345703, -10.109522819519043, -8.930604934692383, -7.751688003540039, -6.572770595550537, -5.393853187561035, -4.214935302734375, -3.0360183715820312, -1.8571009635925293, -0.6781835556030273, 0.5007338523864746, 1.6796512603759766, 2.8585686683654785, 4.0374860763549805, 5.216403961181641, 6.39532470703125, 7.574242115020752, 8.753159523010254, 9.932077407836914, 11.110994338989258, 12.289911270141602, 13.468829154968262, 14.647747039794922, 15.826663970947266, 17.00558090209961, 18.184497833251953, 19.36341667175293, 20.542333602905273, 21.721250534057617, 22.900169372558594, 24.079086303710938, 25.25800323486328, 26.436920166015625, 27.61583709716797, 28.794755935668945, 29.97367286682129, 31.152589797973633, 32.33150863647461, 33.51042556762695, 34.6893424987793, 35.86825942993164, 37.047176361083984, 38.22609329223633, 39.40501403808594, 40.58393096923828, 41.762847900390625, 42.94176483154297, 44.12068176269531]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 6.0, 2.0, 3.0, 7.0, 8.0, 22.0, 19.0, 28.0, 45.0, 64.0, 77.0, 117.0, 178.0, 248.0, 402.0, 595.0, 1066.0, 1841.0, 3504.0, 7228.0, 17678.0, 56529.0, 432038.0, 3553032.0, 79629.0, 21900.0, 8538.0, 4098.0, 2137.0, 1204.0, 689.0, 475.0, 274.0, 187.0, 120.0, 99.0, 61.0, 31.0, 28.0, 21.0, 19.0, 19.0, 3.0, 7.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.0706787109375, -3.914794921875, -3.7589111328125, -3.60302734375, -3.4471435546875, -3.291259765625, -3.1353759765625, -2.9794921875, -2.8236083984375, -2.667724609375, -2.5118408203125, -2.35595703125, -2.2000732421875, -2.044189453125, -1.8883056640625, -1.732421875, -1.5765380859375, -1.420654296875, -1.2647705078125, -1.10888671875, -0.9530029296875, -0.797119140625, -0.6412353515625, -0.4853515625, -0.3294677734375, -0.173583984375, -0.0177001953125, 0.13818359375, 0.2940673828125, 0.449951171875, 0.6058349609375, 0.76171875, 0.9176025390625, 1.073486328125, 1.2293701171875, 1.38525390625, 1.5411376953125, 1.697021484375, 1.8529052734375, 2.0087890625, 2.1646728515625, 2.320556640625, 2.4764404296875, 2.63232421875, 2.7882080078125, 2.944091796875, 3.0999755859375, 3.255859375, 3.4117431640625, 3.567626953125, 3.7235107421875, 3.87939453125, 4.0352783203125, 4.191162109375, 4.3470458984375, 4.5029296875, 4.6588134765625, 4.814697265625, 4.9705810546875, 5.12646484375, 5.2823486328125, 5.438232421875, 5.5941162109375, 5.75]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 7.0, 13.0, 6.0, 11.0, 16.0, 10.0, 22.0, 16.0, 16.0, 30.0, 28.0, 33.0, 42.0, 48.0, 46.0, 63.0, 67.0, 57.0, 39.0, 56.0, 46.0, 39.0, 48.0, 36.0, 31.0, 34.0, 21.0, 29.0, 20.0, 12.0, 10.0, 12.0, 9.0, 6.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.4580078125, -1.4091033935546875, -1.360198974609375, -1.3112945556640625, -1.26239013671875, -1.2134857177734375, -1.164581298828125, -1.1156768798828125, -1.0667724609375, -1.0178680419921875, -0.968963623046875, -0.9200592041015625, -0.87115478515625, -0.8222503662109375, -0.773345947265625, -0.7244415283203125, -0.675537109375, -0.6266326904296875, -0.577728271484375, -0.5288238525390625, -0.47991943359375, -0.4310150146484375, -0.382110595703125, -0.3332061767578125, -0.2843017578125, -0.2353973388671875, -0.186492919921875, -0.1375885009765625, -0.08868408203125, -0.0397796630859375, 0.009124755859375, 0.0580291748046875, 0.10693359375, 0.1558380126953125, 0.204742431640625, 0.2536468505859375, 0.30255126953125, 0.3514556884765625, 0.400360107421875, 0.4492645263671875, 0.4981689453125, 0.5470733642578125, 0.595977783203125, 0.6448822021484375, 0.69378662109375, 0.7426910400390625, 0.791595458984375, 0.8404998779296875, 0.889404296875, 0.9383087158203125, 0.987213134765625, 1.0361175537109375, 1.08502197265625, 1.1339263916015625, 1.182830810546875, 1.2317352294921875, 1.2806396484375, 1.3295440673828125, 1.378448486328125, 1.4273529052734375, 1.47625732421875, 1.5251617431640625, 1.574066162109375, 1.6229705810546875, 1.671875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 10.0, 12.0, 11.0, 13.0, 17.0, 21.0, 32.0, 56.0, 79.0, 108.0, 155.0, 248.0, 459.0, 833.0, 1627.0, 3437.0, 8771.0, 32061.0, 410464.0, 3666430.0, 49281.0, 11682.0, 4269.0, 1953.0, 930.0, 494.0, 283.0, 178.0, 111.0, 95.0, 43.0, 47.0, 23.0, 22.0, 8.0, 9.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.78125, -10.4456787109375, -10.110107421875, -9.7745361328125, -9.43896484375, -9.1033935546875, -8.767822265625, -8.4322509765625, -8.0966796875, -7.7611083984375, -7.425537109375, -7.0899658203125, -6.75439453125, -6.4188232421875, -6.083251953125, -5.7476806640625, -5.412109375, -5.0765380859375, -4.740966796875, -4.4053955078125, -4.06982421875, -3.7342529296875, -3.398681640625, -3.0631103515625, -2.7275390625, -2.3919677734375, -2.056396484375, -1.7208251953125, -1.38525390625, -1.0496826171875, -0.714111328125, -0.3785400390625, -0.04296875, 0.2926025390625, 0.628173828125, 0.9637451171875, 1.29931640625, 1.6348876953125, 1.970458984375, 2.3060302734375, 2.6416015625, 2.9771728515625, 3.312744140625, 3.6483154296875, 3.98388671875, 4.3194580078125, 4.655029296875, 4.9906005859375, 5.326171875, 5.6617431640625, 5.997314453125, 6.3328857421875, 6.66845703125, 7.0040283203125, 7.339599609375, 7.6751708984375, 8.0107421875, 8.3463134765625, 8.681884765625, 9.0174560546875, 9.35302734375, 9.6885986328125, 10.024169921875, 10.3597412109375, 10.6953125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 7.0, 4.0, 3.0, 6.0, 5.0, 10.0, 14.0, 13.0, 39.0, 47.0, 130.0, 526.0, 2819.0, 226.0, 87.0, 47.0, 34.0, 15.0, 6.0, 13.0, 9.0, 5.0, 5.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.328125, -2.263916015625, -2.19970703125, -2.135498046875, -2.0712890625, -2.007080078125, -1.94287109375, -1.878662109375, -1.814453125, -1.750244140625, -1.68603515625, -1.621826171875, -1.5576171875, -1.493408203125, -1.42919921875, -1.364990234375, -1.30078125, -1.236572265625, -1.17236328125, -1.108154296875, -1.0439453125, -0.979736328125, -0.91552734375, -0.851318359375, -0.787109375, -0.722900390625, -0.65869140625, -0.594482421875, -0.5302734375, -0.466064453125, -0.40185546875, -0.337646484375, -0.2734375, -0.209228515625, -0.14501953125, -0.080810546875, -0.0166015625, 0.047607421875, 0.11181640625, 0.176025390625, 0.240234375, 0.304443359375, 0.36865234375, 0.432861328125, 0.4970703125, 0.561279296875, 0.62548828125, 0.689697265625, 0.75390625, 0.818115234375, 0.88232421875, 0.946533203125, 1.0107421875, 1.074951171875, 1.13916015625, 1.203369140625, 1.267578125, 1.331787109375, 1.39599609375, 1.460205078125, 1.5244140625, 1.588623046875, 1.65283203125, 1.717041015625, 1.78125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 12.0, 10.0, 22.0, 31.0, 41.0, 49.0, 86.0, 123.0, 118.0, 145.0, 103.0, 77.0, 61.0, 52.0, 19.0, 23.0, 7.0, 10.0, 3.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.26930046081543, -9.9465970993042, -9.623892784118652, -9.301189422607422, -8.978485107421875, -8.655781745910645, -8.333078384399414, -8.010374069213867, -7.687670707702637, -7.364966869354248, -7.042263031005859, -6.719559669494629, -6.39685583114624, -6.074151992797852, -5.751448631286621, -5.428744792938232, -5.106040954589844, -4.783337116241455, -4.460633277893066, -4.137929916381836, -3.8152260780334473, -3.4925222396850586, -3.169818639755249, -2.8471150398254395, -2.524411201477051, -2.201707363128662, -1.8790037631988525, -1.5563000440597534, -1.2335963249206543, -0.9108926057815552, -0.588188886642456, -0.2654852867126465, 0.05721855163574219, 0.3799222707748413, 0.7026259899139404, 1.0253297090530396, 1.3480334281921387, 1.6707371473312378, 1.993440866470337, 2.3161444664001465, 2.638848304748535, 2.961552143096924, 3.2842557430267334, 3.606959342956543, 3.9296631813049316, 4.25236701965332, 4.575070381164551, 4.8977742195129395, 5.220478057861328, 5.543181896209717, 5.8658857345581055, 6.188589096069336, 6.511292934417725, 6.833996772766113, 7.156700134277344, 7.479403972625732, 7.802107810974121, 8.124811172485352, 8.447515487670898, 8.770218849182129, 9.09292221069336, 9.415626525878906, 9.738329887390137, 10.061033248901367, 10.383737564086914]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 5.0, 6.0, 7.0, 8.0, 9.0, 8.0, 10.0, 15.0, 19.0, 21.0, 17.0, 23.0, 17.0, 20.0, 18.0, 25.0, 26.0, 33.0, 40.0, 33.0, 37.0, 34.0, 47.0, 33.0, 36.0, 29.0, 30.0, 35.0, 40.0, 30.0, 29.0, 19.0, 31.0, 26.0, 26.0, 24.0, 21.0, 20.0, 14.0, 15.0, 9.0, 12.0, 14.0, 12.0, 4.0, 4.0, 5.0, 5.0, 3.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.5464162826538086, -3.432985782623291, -3.3195555210113525, -3.206125020980835, -3.0926945209503174, -2.979264259338379, -2.8658337593078613, -2.7524032592773438, -2.6389729976654053, -2.5255424976348877, -2.412112236022949, -2.2986817359924316, -2.185251235961914, -2.0718209743499756, -1.958390474319458, -1.84496009349823, -1.7315295934677124, -1.6180992126464844, -1.5046687126159668, -1.3912383317947388, -1.2778079509735107, -1.1643774509429932, -1.0509470701217651, -0.9375166893005371, -0.8240862488746643, -0.7106558084487915, -0.5972254276275635, -0.4837949872016907, -0.37036457657814026, -0.25693416595458984, -0.14350372552871704, -0.030073344707489014, 0.08335709571838379, 0.1967875063419342, 0.3102179169654846, 0.4236483573913574, 0.5370787382125854, 0.6505091786384583, 0.763939619064331, 0.8773699998855591, 0.9908004403114319, 1.1042308807373047, 1.2176612615585327, 1.3310916423797607, 1.4445221424102783, 1.5579525232315063, 1.6713829040527344, 1.784813404083252, 1.89824378490448, 2.011674165725708, 2.1251046657562256, 2.238534927368164, 2.3519654273986816, 2.465395927429199, 2.578826427459717, 2.6922566890716553, 2.805687189102173, 2.9191176891326904, 3.032547950744629, 3.1459784507751465, 3.259408950805664, 3.3728392124176025, 3.48626971244812, 3.5996999740600586, 3.713130474090576]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 10.0, 12.0, 9.0, 14.0, 25.0, 45.0, 56.0, 95.0, 138.0, 270.0, 557.0, 1360.0, 3321.0, 8974.0, 24946.0, 69513.0, 177119.0, 303254.0, 261738.0, 124334.0, 46380.0, 16208.0, 5878.0, 2294.0, 1017.0, 435.0, 214.0, 117.0, 78.0, 39.0, 33.0, 16.0, 15.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.89453125, -4.7406005859375, -4.586669921875, -4.4327392578125, -4.27880859375, -4.1248779296875, -3.970947265625, -3.8170166015625, -3.6630859375, -3.5091552734375, -3.355224609375, -3.2012939453125, -3.04736328125, -2.8934326171875, -2.739501953125, -2.5855712890625, -2.431640625, -2.2777099609375, -2.123779296875, -1.9698486328125, -1.81591796875, -1.6619873046875, -1.508056640625, -1.3541259765625, -1.2001953125, -1.0462646484375, -0.892333984375, -0.7384033203125, -0.58447265625, -0.4305419921875, -0.276611328125, -0.1226806640625, 0.03125, 0.1851806640625, 0.339111328125, 0.4930419921875, 0.64697265625, 0.8009033203125, 0.954833984375, 1.1087646484375, 1.2626953125, 1.4166259765625, 1.570556640625, 1.7244873046875, 1.87841796875, 2.0323486328125, 2.186279296875, 2.3402099609375, 2.494140625, 2.6480712890625, 2.802001953125, 2.9559326171875, 3.10986328125, 3.2637939453125, 3.417724609375, 3.5716552734375, 3.7255859375, 3.8795166015625, 4.033447265625, 4.1873779296875, 4.34130859375, 4.4952392578125, 4.649169921875, 4.8031005859375, 4.95703125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 8.0, 6.0, 9.0, 17.0, 11.0, 16.0, 24.0, 15.0, 23.0, 29.0, 27.0, 46.0, 50.0, 33.0, 49.0, 49.0, 62.0, 49.0, 54.0, 55.0, 49.0, 47.0, 39.0, 30.0, 29.0, 30.0, 26.0, 19.0, 15.0, 9.0, 22.0, 10.0, 7.0, 7.0, 8.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-1.65625, -1.6050567626953125, -1.553863525390625, -1.5026702880859375, -1.45147705078125, -1.4002838134765625, -1.349090576171875, -1.2978973388671875, -1.2467041015625, -1.1955108642578125, -1.144317626953125, -1.0931243896484375, -1.04193115234375, -0.9907379150390625, -0.939544677734375, -0.8883514404296875, -0.837158203125, -0.7859649658203125, -0.734771728515625, -0.6835784912109375, -0.63238525390625, -0.5811920166015625, -0.529998779296875, -0.4788055419921875, -0.4276123046875, -0.3764190673828125, -0.325225830078125, -0.2740325927734375, -0.22283935546875, -0.1716461181640625, -0.120452880859375, -0.0692596435546875, -0.01806640625, 0.0331268310546875, 0.084320068359375, 0.1355133056640625, 0.18670654296875, 0.2378997802734375, 0.289093017578125, 0.3402862548828125, 0.3914794921875, 0.4426727294921875, 0.493865966796875, 0.5450592041015625, 0.59625244140625, 0.6474456787109375, 0.698638916015625, 0.7498321533203125, 0.801025390625, 0.8522186279296875, 0.903411865234375, 0.9546051025390625, 1.00579833984375, 1.0569915771484375, 1.108184814453125, 1.1593780517578125, 1.2105712890625, 1.2617645263671875, 1.312957763671875, 1.3641510009765625, 1.41534423828125, 1.4665374755859375, 1.517730712890625, 1.5689239501953125, 1.6201171875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 11.0, 6.0, 11.0, 15.0, 20.0, 31.0, 58.0, 74.0, 141.0, 222.0, 373.0, 586.0, 1161.0, 2723.0, 16723.0, 368792.0, 620874.0, 30063.0, 3552.0, 1392.0, 700.0, 448.0, 211.0, 112.0, 88.0, 67.0, 38.0, 26.0, 10.0, 10.0, 9.0, 4.0, 8.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0546875, -14.5374755859375, -14.020263671875, -13.5030517578125, -12.98583984375, -12.4686279296875, -11.951416015625, -11.4342041015625, -10.9169921875, -10.3997802734375, -9.882568359375, -9.3653564453125, -8.84814453125, -8.3309326171875, -7.813720703125, -7.2965087890625, -6.779296875, -6.2620849609375, -5.744873046875, -5.2276611328125, -4.71044921875, -4.1932373046875, -3.676025390625, -3.1588134765625, -2.6416015625, -2.1243896484375, -1.607177734375, -1.0899658203125, -0.57275390625, -0.0555419921875, 0.461669921875, 0.9788818359375, 1.49609375, 2.0133056640625, 2.530517578125, 3.0477294921875, 3.56494140625, 4.0821533203125, 4.599365234375, 5.1165771484375, 5.6337890625, 6.1510009765625, 6.668212890625, 7.1854248046875, 7.70263671875, 8.2198486328125, 8.737060546875, 9.2542724609375, 9.771484375, 10.2886962890625, 10.805908203125, 11.3231201171875, 11.84033203125, 12.3575439453125, 12.874755859375, 13.3919677734375, 13.9091796875, 14.4263916015625, 14.943603515625, 15.4608154296875, 15.97802734375, 16.4952392578125, 17.012451171875, 17.5296630859375, 18.046875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 11.0, 10.0, 11.0, 17.0, 21.0, 18.0, 24.0, 37.0, 31.0, 34.0, 47.0, 45.0, 62.0, 50.0, 61.0, 57.0, 54.0, 69.0, 48.0, 41.0, 36.0, 41.0, 37.0, 24.0, 17.0, 20.0, 12.0, 15.0, 19.0, 6.0, 9.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.03125, -10.665771484375, -10.30029296875, -9.934814453125, -9.5693359375, -9.203857421875, -8.83837890625, -8.472900390625, -8.107421875, -7.741943359375, -7.37646484375, -7.010986328125, -6.6455078125, -6.280029296875, -5.91455078125, -5.549072265625, -5.18359375, -4.818115234375, -4.45263671875, -4.087158203125, -3.7216796875, -3.356201171875, -2.99072265625, -2.625244140625, -2.259765625, -1.894287109375, -1.52880859375, -1.163330078125, -0.7978515625, -0.432373046875, -0.06689453125, 0.298583984375, 0.6640625, 1.029541015625, 1.39501953125, 1.760498046875, 2.1259765625, 2.491455078125, 2.85693359375, 3.222412109375, 3.587890625, 3.953369140625, 4.31884765625, 4.684326171875, 5.0498046875, 5.415283203125, 5.78076171875, 6.146240234375, 6.51171875, 6.877197265625, 7.24267578125, 7.608154296875, 7.9736328125, 8.339111328125, 8.70458984375, 9.070068359375, 9.435546875, 9.801025390625, 10.16650390625, 10.531982421875, 10.8974609375, 11.262939453125, 11.62841796875, 11.993896484375, 12.359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 4.0, 9.0, 8.0, 8.0, 17.0, 26.0, 41.0, 69.0, 110.0, 192.0, 339.0, 652.0, 1368.0, 3489.0, 11511.0, 72408.0, 670298.0, 252260.0, 25774.0, 5880.0, 2148.0, 856.0, 453.0, 238.0, 154.0, 89.0, 52.0, 25.0, 21.0, 14.0, 11.0, 7.0, 7.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6171875, -7.37725830078125, -7.1373291015625, -6.89739990234375, -6.657470703125, -6.41754150390625, -6.1776123046875, -5.93768310546875, -5.69775390625, -5.45782470703125, -5.2178955078125, -4.97796630859375, -4.738037109375, -4.49810791015625, -4.2581787109375, -4.01824951171875, -3.7783203125, -3.53839111328125, -3.2984619140625, -3.05853271484375, -2.818603515625, -2.57867431640625, -2.3387451171875, -2.09881591796875, -1.85888671875, -1.61895751953125, -1.3790283203125, -1.13909912109375, -0.899169921875, -0.65924072265625, -0.4193115234375, -0.17938232421875, 0.060546875, 0.30047607421875, 0.5404052734375, 0.78033447265625, 1.020263671875, 1.26019287109375, 1.5001220703125, 1.74005126953125, 1.97998046875, 2.21990966796875, 2.4598388671875, 2.69976806640625, 2.939697265625, 3.17962646484375, 3.4195556640625, 3.65948486328125, 3.8994140625, 4.13934326171875, 4.3792724609375, 4.61920166015625, 4.859130859375, 5.09906005859375, 5.3389892578125, 5.57891845703125, 5.81884765625, 6.05877685546875, 6.2987060546875, 6.53863525390625, 6.778564453125, 7.01849365234375, 7.2584228515625, 7.49835205078125, 7.73828125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 1.0, 6.0, 12.0, 17.0, 15.0, 35.0, 34.0, 61.0, 78.0, 97.0, 104.0, 98.0, 116.0, 89.0, 69.0, 58.0, 31.0, 17.0, 18.0, 16.0, 11.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0014638900756835938, -0.0014266595244407654, -0.001389428973197937, -0.0013521984219551086, -0.0013149678707122803, -0.001277737319469452, -0.0012405067682266235, -0.0012032762169837952, -0.0011660456657409668, -0.0011288151144981384, -0.00109158456325531, -0.0010543540120124817, -0.0010171234607696533, -0.000979892909526825, -0.0009426623582839966, -0.0009054318070411682, -0.0008682012557983398, -0.0008309707045555115, -0.0007937401533126831, -0.0007565096020698547, -0.0007192790508270264, -0.000682048499584198, -0.0006448179483413696, -0.0006075873970985413, -0.0005703568458557129, -0.0005331262946128845, -0.0004958957433700562, -0.0004586651921272278, -0.0004214346408843994, -0.00038420408964157104, -0.0003469735383987427, -0.0003097429871559143, -0.00027251243591308594, -0.00023528188467025757, -0.0001980513334274292, -0.00016082078218460083, -0.00012359023094177246, -8.635967969894409e-05, -4.912912845611572e-05, -1.1898577213287354e-05, 2.5331974029541016e-05, 6.256252527236938e-05, 9.979307651519775e-05, 0.00013702362775802612, 0.0001742541790008545, 0.00021148473024368286, 0.00024871528148651123, 0.0002859458327293396, 0.00032317638397216797, 0.00036040693521499634, 0.0003976374864578247, 0.0004348680377006531, 0.00047209858894348145, 0.0005093291401863098, 0.0005465596914291382, 0.0005837902426719666, 0.0006210207939147949, 0.0006582513451576233, 0.0006954818964004517, 0.00073271244764328, 0.0007699429988861084, 0.0008071735501289368, 0.0008444041013717651, 0.0008816346526145935, 0.0009188652038574219]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 2.0, 7.0, 12.0, 12.0, 8.0, 25.0, 16.0, 28.0, 33.0, 66.0, 94.0, 149.0, 308.0, 726.0, 2119.0, 8633.0, 130387.0, 856187.0, 41639.0, 5337.0, 1581.0, 518.0, 241.0, 141.0, 67.0, 47.0, 36.0, 32.0, 27.0, 23.0, 10.0, 8.0, 8.0, 6.0, 2.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0], "bins": [-12.2890625, -11.950927734375, -11.61279296875, -11.274658203125, -10.9365234375, -10.598388671875, -10.26025390625, -9.922119140625, -9.583984375, -9.245849609375, -8.90771484375, -8.569580078125, -8.2314453125, -7.893310546875, -7.55517578125, -7.217041015625, -6.87890625, -6.540771484375, -6.20263671875, -5.864501953125, -5.5263671875, -5.188232421875, -4.85009765625, -4.511962890625, -4.173828125, -3.835693359375, -3.49755859375, -3.159423828125, -2.8212890625, -2.483154296875, -2.14501953125, -1.806884765625, -1.46875, -1.130615234375, -0.79248046875, -0.454345703125, -0.1162109375, 0.221923828125, 0.56005859375, 0.898193359375, 1.236328125, 1.574462890625, 1.91259765625, 2.250732421875, 2.5888671875, 2.927001953125, 3.26513671875, 3.603271484375, 3.94140625, 4.279541015625, 4.61767578125, 4.955810546875, 5.2939453125, 5.632080078125, 5.97021484375, 6.308349609375, 6.646484375, 6.984619140625, 7.32275390625, 7.660888671875, 7.9990234375, 8.337158203125, 8.67529296875, 9.013427734375, 9.3515625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 4.0, 4.0, 9.0, 18.0, 18.0, 29.0, 37.0, 75.0, 97.0, 112.0, 126.0, 131.0, 110.0, 75.0, 43.0, 47.0, 19.0, 11.0, 10.0, 8.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.140625, -7.90533447265625, -7.6700439453125, -7.43475341796875, -7.199462890625, -6.96417236328125, -6.7288818359375, -6.49359130859375, -6.25830078125, -6.02301025390625, -5.7877197265625, -5.55242919921875, -5.317138671875, -5.08184814453125, -4.8465576171875, -4.61126708984375, -4.3759765625, -4.14068603515625, -3.9053955078125, -3.67010498046875, -3.434814453125, -3.19952392578125, -2.9642333984375, -2.72894287109375, -2.49365234375, -2.25836181640625, -2.0230712890625, -1.78778076171875, -1.552490234375, -1.31719970703125, -1.0819091796875, -0.84661865234375, -0.611328125, -0.37603759765625, -0.1407470703125, 0.09454345703125, 0.329833984375, 0.56512451171875, 0.8004150390625, 1.03570556640625, 1.27099609375, 1.50628662109375, 1.7415771484375, 1.97686767578125, 2.212158203125, 2.44744873046875, 2.6827392578125, 2.91802978515625, 3.1533203125, 3.38861083984375, 3.6239013671875, 3.85919189453125, 4.094482421875, 4.32977294921875, 4.5650634765625, 4.80035400390625, 5.03564453125, 5.27093505859375, 5.5062255859375, 5.74151611328125, 5.976806640625, 6.21209716796875, 6.4473876953125, 6.68267822265625, 6.91796875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 26.0, 83.0, 183.0, 299.0, 240.0, 111.0, 33.0, 11.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-157.500732421875, -152.3770294189453, -147.25332641601562, -142.12960815429688, -137.0059051513672, -131.8822021484375, -126.75849151611328, -121.63478088378906, -116.51107788085938, -111.38737487792969, -106.26366424560547, -101.13995361328125, -96.01625061035156, -90.89254760742188, -85.76883697509766, -80.64512634277344, -75.52142333984375, -70.39772033691406, -65.27400970458984, -60.15030288696289, -55.02659606933594, -49.902889251708984, -44.77918243408203, -39.65547561645508, -34.531768798828125, -29.408061981201172, -24.28435516357422, -19.160648345947266, -14.036941528320312, -8.91323471069336, -3.7895278930664062, 1.3341789245605469, 6.4578857421875, 11.581592559814453, 16.705299377441406, 21.82900619506836, 26.952713012695312, 32.076419830322266, 37.20012664794922, 42.32383346557617, 47.447540283203125, 52.57124710083008, 57.69495391845703, 62.818660736083984, 67.94236755371094, 73.06607055664062, 78.18978118896484, 83.31349182128906, 88.43719482421875, 93.56089782714844, 98.68460845947266, 103.80831909179688, 108.93202209472656, 114.05572509765625, 119.17943572998047, 124.30314636230469, 129.42684936523438, 134.55055236816406, 139.67425537109375, 144.7979736328125, 149.9216766357422, 155.04537963867188, 160.16909790039062, 165.2928009033203, 170.41650390625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 7.0, 6.0, 12.0, 9.0, 16.0, 12.0, 27.0, 34.0, 32.0, 46.0, 40.0, 40.0, 46.0, 62.0, 61.0, 47.0, 77.0, 58.0, 61.0, 39.0, 44.0, 32.0, 26.0, 23.0, 26.0, 16.0, 18.0, 17.0, 13.0, 9.0, 13.0, 5.0, 6.0, 3.0, 6.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-56.25861358642578, -54.5308723449707, -52.80312728881836, -51.07538604736328, -49.3476448059082, -47.61989974975586, -45.89215850830078, -44.16441345214844, -42.43667221069336, -40.70893096923828, -38.98118591308594, -37.25344467163086, -35.52570343017578, -33.79795837402344, -32.07021713256836, -30.34247398376465, -28.61473274230957, -26.88698959350586, -25.15924835205078, -23.43150520324707, -21.70376205444336, -19.97602081298828, -18.24827766418457, -16.52053451538086, -14.792792320251465, -13.06505012512207, -11.33730697631836, -9.609564781188965, -7.881822109222412, -6.154079437255859, -4.426337242126465, -2.698594093322754, -0.9708518981933594, 0.7568906545639038, 2.484633207321167, 4.212375640869141, 5.940118312835693, 7.667860984802246, 9.39560317993164, 11.123346328735352, 12.851088523864746, 14.57883071899414, 16.30657386779785, 18.034317016601562, 19.76205825805664, 21.48980140686035, 23.217544555664062, 24.94528579711914, 26.67302894592285, 28.400772094726562, 30.12851333618164, 31.85625648498535, 33.58399963378906, 35.31174087524414, 37.03948211669922, 38.76722717285156, 40.49496841430664, 42.22270965576172, 43.95045471191406, 45.67819595336914, 47.40593719482422, 49.13368225097656, 50.86142349243164, 52.58916473388672, 54.31690979003906]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 11.0, 13.0, 7.0, 9.0, 20.0, 28.0, 40.0, 55.0, 62.0, 100.0, 148.0, 207.0, 300.0, 431.0, 765.0, 1308.0, 2301.0, 4334.0, 9241.0, 22268.0, 73452.0, 3396134.0, 583366.0, 61600.0, 19718.0, 8670.0, 4160.0, 2169.0, 1284.0, 712.0, 433.0, 294.0, 197.0, 142.0, 80.0, 57.0, 46.0, 24.0, 35.0, 22.0, 9.0, 5.0, 7.0, 1.0, 6.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.25390625, -5.0841064453125, -4.914306640625, -4.7445068359375, -4.57470703125, -4.4049072265625, -4.235107421875, -4.0653076171875, -3.8955078125, -3.7257080078125, -3.555908203125, -3.3861083984375, -3.21630859375, -3.0465087890625, -2.876708984375, -2.7069091796875, -2.537109375, -2.3673095703125, -2.197509765625, -2.0277099609375, -1.85791015625, -1.6881103515625, -1.518310546875, -1.3485107421875, -1.1787109375, -1.0089111328125, -0.839111328125, -0.6693115234375, -0.49951171875, -0.3297119140625, -0.159912109375, 0.0098876953125, 0.1796875, 0.3494873046875, 0.519287109375, 0.6890869140625, 0.85888671875, 1.0286865234375, 1.198486328125, 1.3682861328125, 1.5380859375, 1.7078857421875, 1.877685546875, 2.0474853515625, 2.21728515625, 2.3870849609375, 2.556884765625, 2.7266845703125, 2.896484375, 3.0662841796875, 3.236083984375, 3.4058837890625, 3.57568359375, 3.7454833984375, 3.915283203125, 4.0850830078125, 4.2548828125, 4.4246826171875, 4.594482421875, 4.7642822265625, 4.93408203125, 5.1038818359375, 5.273681640625, 5.4434814453125, 5.61328125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 8.0, 8.0, 15.0, 16.0, 17.0, 27.0, 36.0, 43.0, 50.0, 71.0, 62.0, 68.0, 77.0, 83.0, 64.0, 69.0, 52.0, 46.0, 35.0, 31.0, 25.0, 23.0, 8.0, 18.0, 8.0, 7.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.287109375, -2.207855224609375, -2.12860107421875, -2.049346923828125, -1.9700927734375, -1.890838623046875, -1.81158447265625, -1.732330322265625, -1.653076171875, -1.573822021484375, -1.49456787109375, -1.415313720703125, -1.3360595703125, -1.256805419921875, -1.17755126953125, -1.098297119140625, -1.01904296875, -0.939788818359375, -0.86053466796875, -0.781280517578125, -0.7020263671875, -0.622772216796875, -0.54351806640625, -0.464263916015625, -0.385009765625, -0.305755615234375, -0.22650146484375, -0.147247314453125, -0.0679931640625, 0.011260986328125, 0.09051513671875, 0.169769287109375, 0.2490234375, 0.328277587890625, 0.40753173828125, 0.486785888671875, 0.5660400390625, 0.645294189453125, 0.72454833984375, 0.803802490234375, 0.883056640625, 0.962310791015625, 1.04156494140625, 1.120819091796875, 1.2000732421875, 1.279327392578125, 1.35858154296875, 1.437835693359375, 1.51708984375, 1.596343994140625, 1.67559814453125, 1.754852294921875, 1.8341064453125, 1.913360595703125, 1.99261474609375, 2.071868896484375, 2.151123046875, 2.230377197265625, 2.30963134765625, 2.388885498046875, 2.4681396484375, 2.547393798828125, 2.62664794921875, 2.705902099609375, 2.78515625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 9.0, 14.0, 15.0, 27.0, 24.0, 48.0, 52.0, 76.0, 101.0, 180.0, 260.0, 425.0, 656.0, 1118.0, 1917.0, 3616.0, 7989.0, 20100.0, 76017.0, 3478085.0, 520266.0, 52710.0, 16393.0, 6611.0, 3228.0, 1662.0, 963.0, 585.0, 382.0, 224.0, 173.0, 100.0, 80.0, 48.0, 28.0, 27.0, 12.0, 21.0, 11.0, 6.0, 6.0, 7.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.203125, -8.9315185546875, -8.659912109375, -8.3883056640625, -8.11669921875, -7.8450927734375, -7.573486328125, -7.3018798828125, -7.0302734375, -6.7586669921875, -6.487060546875, -6.2154541015625, -5.94384765625, -5.6722412109375, -5.400634765625, -5.1290283203125, -4.857421875, -4.5858154296875, -4.314208984375, -4.0426025390625, -3.77099609375, -3.4993896484375, -3.227783203125, -2.9561767578125, -2.6845703125, -2.4129638671875, -2.141357421875, -1.8697509765625, -1.59814453125, -1.3265380859375, -1.054931640625, -0.7833251953125, -0.51171875, -0.2401123046875, 0.031494140625, 0.3031005859375, 0.57470703125, 0.8463134765625, 1.117919921875, 1.3895263671875, 1.6611328125, 1.9327392578125, 2.204345703125, 2.4759521484375, 2.74755859375, 3.0191650390625, 3.290771484375, 3.5623779296875, 3.833984375, 4.1055908203125, 4.377197265625, 4.6488037109375, 4.92041015625, 5.1920166015625, 5.463623046875, 5.7352294921875, 6.0068359375, 6.2784423828125, 6.550048828125, 6.8216552734375, 7.09326171875, 7.3648681640625, 7.636474609375, 7.9080810546875, 8.1796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 3.0, 9.0, 9.0, 12.0, 23.0, 31.0, 61.0, 115.0, 318.0, 2834.0, 352.0, 111.0, 57.0, 40.0, 23.0, 18.0, 14.0, 9.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.03515625, -2.954254150390625, -2.87335205078125, -2.792449951171875, -2.7115478515625, -2.630645751953125, -2.54974365234375, -2.468841552734375, -2.387939453125, -2.307037353515625, -2.22613525390625, -2.145233154296875, -2.0643310546875, -1.983428955078125, -1.90252685546875, -1.821624755859375, -1.74072265625, -1.659820556640625, -1.57891845703125, -1.498016357421875, -1.4171142578125, -1.336212158203125, -1.25531005859375, -1.174407958984375, -1.093505859375, -1.012603759765625, -0.93170166015625, -0.850799560546875, -0.7698974609375, -0.688995361328125, -0.60809326171875, -0.527191162109375, -0.4462890625, -0.365386962890625, -0.28448486328125, -0.203582763671875, -0.1226806640625, -0.041778564453125, 0.03912353515625, 0.120025634765625, 0.200927734375, 0.281829833984375, 0.36273193359375, 0.443634033203125, 0.5245361328125, 0.605438232421875, 0.68634033203125, 0.767242431640625, 0.84814453125, 0.929046630859375, 1.00994873046875, 1.090850830078125, 1.1717529296875, 1.252655029296875, 1.33355712890625, 1.414459228515625, 1.495361328125, 1.576263427734375, 1.65716552734375, 1.738067626953125, 1.8189697265625, 1.899871826171875, 1.98077392578125, 2.061676025390625, 2.142578125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 11.0, 25.0, 28.0, 57.0, 81.0, 106.0, 122.0, 131.0, 131.0, 106.0, 75.0, 54.0, 31.0, 19.0, 7.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.85519027709961, -17.428876876831055, -17.0025634765625, -16.576250076293945, -16.14993667602539, -15.72362232208252, -15.297307968139648, -14.870994567871094, -14.444681167602539, -14.018367767333984, -13.59205436706543, -13.165740013122559, -12.739426612854004, -12.31311321258545, -11.886798858642578, -11.460485458374023, -11.034172058105469, -10.607858657836914, -10.18154525756836, -9.755230903625488, -9.328917503356934, -8.902604103088379, -8.476289749145508, -8.049976348876953, -7.623662948608398, -7.197349548339844, -6.771035671234131, -6.344721794128418, -5.918408393859863, -5.492094993591309, -5.065781116485596, -4.639467239379883, -4.213152885437012, -3.786839246749878, -3.360525608062744, -2.9342119693756104, -2.5078983306884766, -2.0815846920013428, -1.655271053314209, -1.2289574146270752, -0.8026437759399414, -0.3763301372528076, 0.04998350143432617, 0.47629714012145996, 0.9026107788085938, 1.3289244174957275, 1.7552380561828613, 2.181551694869995, 2.607865333557129, 3.0341789722442627, 3.4604926109313965, 3.8868062496185303, 4.313119888305664, 4.739433288574219, 5.165747165679932, 5.5920610427856445, 6.018374443054199, 6.444687843322754, 6.871001720428467, 7.29731559753418, 7.723628997802734, 8.149942398071289, 8.576255798339844, 9.002570152282715, 9.42888355255127]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 14.0, 10.0, 10.0, 14.0, 11.0, 19.0, 22.0, 26.0, 31.0, 32.0, 44.0, 42.0, 38.0, 40.0, 43.0, 47.0, 39.0, 35.0, 35.0, 41.0, 46.0, 49.0, 32.0, 27.0, 37.0, 36.0, 32.0, 16.0, 25.0, 14.0, 16.0, 17.0, 16.0, 7.0, 5.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.916535377502441, -5.7146100997924805, -5.5126848220825195, -5.310759544372559, -5.108834743499756, -4.906909465789795, -4.704984188079834, -4.503058910369873, -4.30113410949707, -4.099208831787109, -3.8972837924957275, -3.6953585147857666, -3.4934334754943848, -3.291508197784424, -3.089582920074463, -2.887657642364502, -2.685732364654541, -2.48380708694458, -2.2818820476531982, -2.0799567699432373, -1.878031611442566, -1.6761064529418945, -1.4741811752319336, -1.2722560167312622, -1.0703308582305908, -0.8684056997299194, -0.6664804816246033, -0.4645552635192871, -0.2626301050186157, -0.060704946517944336, 0.1412203311920166, 0.343145489692688, 0.5450706481933594, 0.7469958066940308, 0.9489210247993469, 1.150846242904663, 1.3527714014053345, 1.5546965599060059, 1.7566218376159668, 1.9585469961166382, 2.1604721546173096, 2.3623974323272705, 2.5643224716186523, 2.7662477493286133, 2.968173027038574, 3.170098066329956, 3.372023344039917, 3.573948383331299, 3.7758736610412598, 3.9777989387512207, 4.179724216461182, 4.381649017333984, 4.583574295043945, 4.785499572753906, 4.987424850463867, 5.189350128173828, 5.391275405883789, 5.59320068359375, 5.795125961303711, 5.997051239013672, 6.198976039886475, 6.4009013175964355, 6.6028265953063965, 6.804751873016357, 7.00667667388916]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 8.0, 7.0, 18.0, 11.0, 20.0, 48.0, 42.0, 94.0, 135.0, 223.0, 340.0, 586.0, 1020.0, 1757.0, 3126.0, 6227.0, 12284.0, 25388.0, 53946.0, 112405.0, 201253.0, 248953.0, 187019.0, 100528.0, 47491.0, 22291.0, 10929.0, 5579.0, 2902.0, 1598.0, 932.0, 550.0, 306.0, 191.0, 114.0, 83.0, 50.0, 24.0, 21.0, 15.0, 14.0, 12.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41796875, -3.30560302734375, -3.1932373046875, -3.08087158203125, -2.968505859375, -2.85614013671875, -2.7437744140625, -2.63140869140625, -2.51904296875, -2.40667724609375, -2.2943115234375, -2.18194580078125, -2.069580078125, -1.95721435546875, -1.8448486328125, -1.73248291015625, -1.6201171875, -1.50775146484375, -1.3953857421875, -1.28302001953125, -1.170654296875, -1.05828857421875, -0.9459228515625, -0.83355712890625, -0.72119140625, -0.60882568359375, -0.4964599609375, -0.38409423828125, -0.271728515625, -0.15936279296875, -0.0469970703125, 0.06536865234375, 0.177734375, 0.29010009765625, 0.4024658203125, 0.51483154296875, 0.627197265625, 0.73956298828125, 0.8519287109375, 0.96429443359375, 1.07666015625, 1.18902587890625, 1.3013916015625, 1.41375732421875, 1.526123046875, 1.63848876953125, 1.7508544921875, 1.86322021484375, 1.9755859375, 2.08795166015625, 2.2003173828125, 2.31268310546875, 2.425048828125, 2.53741455078125, 2.6497802734375, 2.76214599609375, 2.87451171875, 2.98687744140625, 3.0992431640625, 3.21160888671875, 3.323974609375, 3.43634033203125, 3.5487060546875, 3.66107177734375, 3.7734375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 3.0, 2.0, 4.0, 2.0, 7.0, 8.0, 18.0, 22.0, 27.0, 34.0, 49.0, 41.0, 51.0, 71.0, 68.0, 75.0, 74.0, 71.0, 58.0, 63.0, 59.0, 38.0, 47.0, 28.0, 21.0, 14.0, 9.0, 10.0, 7.0, 6.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.58441162109375, -2.4989013671875, -2.41339111328125, -2.327880859375, -2.24237060546875, -2.1568603515625, -2.07135009765625, -1.98583984375, -1.90032958984375, -1.8148193359375, -1.72930908203125, -1.643798828125, -1.55828857421875, -1.4727783203125, -1.38726806640625, -1.3017578125, -1.21624755859375, -1.1307373046875, -1.04522705078125, -0.959716796875, -0.87420654296875, -0.7886962890625, -0.70318603515625, -0.61767578125, -0.53216552734375, -0.4466552734375, -0.36114501953125, -0.275634765625, -0.19012451171875, -0.1046142578125, -0.01910400390625, 0.06640625, 0.15191650390625, 0.2374267578125, 0.32293701171875, 0.408447265625, 0.49395751953125, 0.5794677734375, 0.66497802734375, 0.75048828125, 0.83599853515625, 0.9215087890625, 1.00701904296875, 1.092529296875, 1.17803955078125, 1.2635498046875, 1.34906005859375, 1.4345703125, 1.52008056640625, 1.6055908203125, 1.69110107421875, 1.776611328125, 1.86212158203125, 1.9476318359375, 2.03314208984375, 2.11865234375, 2.20416259765625, 2.2896728515625, 2.37518310546875, 2.460693359375, 2.54620361328125, 2.6317138671875, 2.71722412109375, 2.802734375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 9.0, 11.0, 6.0, 14.0, 34.0, 34.0, 51.0, 71.0, 85.0, 146.0, 182.0, 297.0, 436.0, 748.0, 1338.0, 2833.0, 10381.0, 117443.0, 778323.0, 119328.0, 10391.0, 2843.0, 1337.0, 779.0, 462.0, 314.0, 184.0, 135.0, 89.0, 62.0, 49.0, 29.0, 25.0, 19.0, 14.0, 16.0, 5.0, 4.0, 8.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-15.125, -14.698974609375, -14.27294921875, -13.846923828125, -13.4208984375, -12.994873046875, -12.56884765625, -12.142822265625, -11.716796875, -11.290771484375, -10.86474609375, -10.438720703125, -10.0126953125, -9.586669921875, -9.16064453125, -8.734619140625, -8.30859375, -7.882568359375, -7.45654296875, -7.030517578125, -6.6044921875, -6.178466796875, -5.75244140625, -5.326416015625, -4.900390625, -4.474365234375, -4.04833984375, -3.622314453125, -3.1962890625, -2.770263671875, -2.34423828125, -1.918212890625, -1.4921875, -1.066162109375, -0.64013671875, -0.214111328125, 0.2119140625, 0.637939453125, 1.06396484375, 1.489990234375, 1.916015625, 2.342041015625, 2.76806640625, 3.194091796875, 3.6201171875, 4.046142578125, 4.47216796875, 4.898193359375, 5.32421875, 5.750244140625, 6.17626953125, 6.602294921875, 7.0283203125, 7.454345703125, 7.88037109375, 8.306396484375, 8.732421875, 9.158447265625, 9.58447265625, 10.010498046875, 10.4365234375, 10.862548828125, 11.28857421875, 11.714599609375, 12.140625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 9.0, 7.0, 10.0, 8.0, 9.0, 18.0, 16.0, 22.0, 30.0, 19.0, 40.0, 36.0, 48.0, 40.0, 60.0, 45.0, 57.0, 53.0, 56.0, 43.0, 48.0, 41.0, 45.0, 31.0, 26.0, 28.0, 30.0, 15.0, 20.0, 16.0, 14.0, 17.0, 9.0, 8.0, 8.0, 5.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9765625, -10.6181640625, -10.259765625, -9.9013671875, -9.54296875, -9.1845703125, -8.826171875, -8.4677734375, -8.109375, -7.7509765625, -7.392578125, -7.0341796875, -6.67578125, -6.3173828125, -5.958984375, -5.6005859375, -5.2421875, -4.8837890625, -4.525390625, -4.1669921875, -3.80859375, -3.4501953125, -3.091796875, -2.7333984375, -2.375, -2.0166015625, -1.658203125, -1.2998046875, -0.94140625, -0.5830078125, -0.224609375, 0.1337890625, 0.4921875, 0.8505859375, 1.208984375, 1.5673828125, 1.92578125, 2.2841796875, 2.642578125, 3.0009765625, 3.359375, 3.7177734375, 4.076171875, 4.4345703125, 4.79296875, 5.1513671875, 5.509765625, 5.8681640625, 6.2265625, 6.5849609375, 6.943359375, 7.3017578125, 7.66015625, 8.0185546875, 8.376953125, 8.7353515625, 9.09375, 9.4521484375, 9.810546875, 10.1689453125, 10.52734375, 10.8857421875, 11.244140625, 11.6025390625, 11.9609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 7.0, 0.0, 1.0, 5.0, 8.0, 6.0, 18.0, 28.0, 45.0, 41.0, 95.0, 121.0, 214.0, 372.0, 753.0, 1912.0, 7389.0, 70797.0, 778170.0, 171245.0, 12623.0, 2681.0, 970.0, 410.0, 226.0, 139.0, 80.0, 68.0, 33.0, 27.0, 29.0, 9.0, 10.0, 5.0, 9.0, 6.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.26171875, -6.98919677734375, -6.7166748046875, -6.44415283203125, -6.171630859375, -5.89910888671875, -5.6265869140625, -5.35406494140625, -5.08154296875, -4.80902099609375, -4.5364990234375, -4.26397705078125, -3.991455078125, -3.71893310546875, -3.4464111328125, -3.17388916015625, -2.9013671875, -2.62884521484375, -2.3563232421875, -2.08380126953125, -1.811279296875, -1.53875732421875, -1.2662353515625, -0.99371337890625, -0.72119140625, -0.44866943359375, -0.1761474609375, 0.09637451171875, 0.368896484375, 0.64141845703125, 0.9139404296875, 1.18646240234375, 1.458984375, 1.73150634765625, 2.0040283203125, 2.27655029296875, 2.549072265625, 2.82159423828125, 3.0941162109375, 3.36663818359375, 3.63916015625, 3.91168212890625, 4.1842041015625, 4.45672607421875, 4.729248046875, 5.00177001953125, 5.2742919921875, 5.54681396484375, 5.8193359375, 6.09185791015625, 6.3643798828125, 6.63690185546875, 6.909423828125, 7.18194580078125, 7.4544677734375, 7.72698974609375, 7.99951171875, 8.27203369140625, 8.5445556640625, 8.81707763671875, 9.089599609375, 9.36212158203125, 9.6346435546875, 9.90716552734375, 10.1796875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 9.0, 7.0, 8.0, 10.0, 23.0, 26.0, 29.0, 60.0, 51.0, 86.0, 86.0, 96.0, 112.0, 105.0, 58.0, 52.0, 48.0, 41.0, 25.0, 14.0, 17.0, 8.0, 8.0, 6.0, 3.0, 5.0, 2.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.001537322998046875, -0.0015014037489891052, -0.0014654844999313354, -0.0014295652508735657, -0.001393646001815796, -0.0013577267527580261, -0.0013218075037002563, -0.0012858882546424866, -0.0012499690055847168, -0.001214049756526947, -0.0011781305074691772, -0.0011422112584114075, -0.0011062920093536377, -0.001070372760295868, -0.0010344535112380981, -0.0009985342621803284, -0.0009626150131225586, -0.0009266957640647888, -0.000890776515007019, -0.0008548572659492493, -0.0008189380168914795, -0.0007830187678337097, -0.0007470995187759399, -0.0007111802697181702, -0.0006752610206604004, -0.0006393417716026306, -0.0006034225225448608, -0.0005675032734870911, -0.0005315840244293213, -0.0004956647753715515, -0.00045974552631378174, -0.00042382627725601196, -0.0003879070281982422, -0.0003519877791404724, -0.00031606853008270264, -0.00028014928102493286, -0.0002442300319671631, -0.0002083107829093933, -0.00017239153385162354, -0.00013647228479385376, -0.00010055303573608398, -6.463378667831421e-05, -2.8714537620544434e-05, 7.204711437225342e-06, 4.312396049499512e-05, 7.904320955276489e-05, 0.00011496245861053467, 0.00015088170766830444, 0.00018680095672607422, 0.000222720205783844, 0.00025863945484161377, 0.00029455870389938354, 0.0003304779529571533, 0.0003663972020149231, 0.00040231645107269287, 0.00043823570013046265, 0.0004741549491882324, 0.0005100741982460022, 0.000545993447303772, 0.0005819126963615417, 0.0006178319454193115, 0.0006537511944770813, 0.0006896704435348511, 0.0007255896925926208, 0.0007615089416503906]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 9.0, 12.0, 15.0, 26.0, 39.0, 76.0, 114.0, 158.0, 361.0, 845.0, 2097.0, 7888.0, 78536.0, 834244.0, 110433.0, 9567.0, 2384.0, 853.0, 419.0, 207.0, 102.0, 65.0, 26.0, 28.0, 14.0, 8.0, 6.0, 3.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.7935791015625, -8.485595703125, -8.1776123046875, -7.86962890625, -7.5616455078125, -7.253662109375, -6.9456787109375, -6.6376953125, -6.3297119140625, -6.021728515625, -5.7137451171875, -5.40576171875, -5.0977783203125, -4.789794921875, -4.4818115234375, -4.173828125, -3.8658447265625, -3.557861328125, -3.2498779296875, -2.94189453125, -2.6339111328125, -2.325927734375, -2.0179443359375, -1.7099609375, -1.4019775390625, -1.093994140625, -0.7860107421875, -0.47802734375, -0.1700439453125, 0.137939453125, 0.4459228515625, 0.75390625, 1.0618896484375, 1.369873046875, 1.6778564453125, 1.98583984375, 2.2938232421875, 2.601806640625, 2.9097900390625, 3.2177734375, 3.5257568359375, 3.833740234375, 4.1417236328125, 4.44970703125, 4.7576904296875, 5.065673828125, 5.3736572265625, 5.681640625, 5.9896240234375, 6.297607421875, 6.6055908203125, 6.91357421875, 7.2215576171875, 7.529541015625, 7.8375244140625, 8.1455078125, 8.4534912109375, 8.761474609375, 9.0694580078125, 9.37744140625, 9.6854248046875, 9.993408203125, 10.3013916015625, 10.609375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 3.0, 13.0, 16.0, 18.0, 17.0, 33.0, 48.0, 73.0, 94.0, 112.0, 104.0, 94.0, 90.0, 77.0, 58.0, 43.0, 28.0, 18.0, 22.0, 9.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.375, -6.1798095703125, -5.984619140625, -5.7894287109375, -5.59423828125, -5.3990478515625, -5.203857421875, -5.0086669921875, -4.8134765625, -4.6182861328125, -4.423095703125, -4.2279052734375, -4.03271484375, -3.8375244140625, -3.642333984375, -3.4471435546875, -3.251953125, -3.0567626953125, -2.861572265625, -2.6663818359375, -2.47119140625, -2.2760009765625, -2.080810546875, -1.8856201171875, -1.6904296875, -1.4952392578125, -1.300048828125, -1.1048583984375, -0.90966796875, -0.7144775390625, -0.519287109375, -0.3240966796875, -0.12890625, 0.0662841796875, 0.261474609375, 0.4566650390625, 0.65185546875, 0.8470458984375, 1.042236328125, 1.2374267578125, 1.4326171875, 1.6278076171875, 1.822998046875, 2.0181884765625, 2.21337890625, 2.4085693359375, 2.603759765625, 2.7989501953125, 2.994140625, 3.1893310546875, 3.384521484375, 3.5797119140625, 3.77490234375, 3.9700927734375, 4.165283203125, 4.3604736328125, 4.5556640625, 4.7508544921875, 4.946044921875, 5.1412353515625, 5.33642578125, 5.5316162109375, 5.726806640625, 5.9219970703125, 6.1171875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 13.0, 38.0, 85.0, 161.0, 213.0, 209.0, 132.0, 73.0, 40.0, 11.0, 13.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.553955078125, -132.73532104492188, -128.9166717529297, -125.09803771972656, -121.2793960571289, -117.46075439453125, -113.6421127319336, -109.82347106933594, -106.00483703613281, -102.18619537353516, -98.3675537109375, -94.54891967773438, -90.73027801513672, -86.91163635253906, -83.0929946899414, -79.27435302734375, -75.4557113647461, -71.63706970214844, -67.81842803955078, -63.99979019165039, -60.18115234375, -56.362510681152344, -52.54386901855469, -48.72522735595703, -44.90658950805664, -41.087947845458984, -37.269309997558594, -33.45066833496094, -29.632028579711914, -25.81338882446289, -21.994747161865234, -18.17610740661621, -14.357467651367188, -10.538827896118164, -6.720187187194824, -2.9015464782714844, 0.9170932769775391, 4.7357330322265625, 8.554374694824219, 12.373014450073242, 16.191654205322266, 20.01029396057129, 23.828933715820312, 27.64757537841797, 31.466215133666992, 35.284854888916016, 39.10349655151367, 42.92213439941406, 46.74077606201172, 50.559417724609375, 54.378055572509766, 58.19669723510742, 62.01533508300781, 65.83397674560547, 69.65261840820312, 73.47126007080078, 77.28990173339844, 81.1085433959961, 84.92718505859375, 88.74581909179688, 92.56446075439453, 96.38310241699219, 100.20174407958984, 104.0203857421875, 107.83901977539062]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 8.0, 1.0, 5.0, 15.0, 11.0, 14.0, 17.0, 14.0, 20.0, 27.0, 38.0, 29.0, 31.0, 39.0, 53.0, 41.0, 46.0, 63.0, 43.0, 51.0, 51.0, 45.0, 38.0, 37.0, 44.0, 37.0, 35.0, 26.0, 21.0, 20.0, 24.0, 12.0, 6.0, 14.0, 5.0, 9.0, 3.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.134376525878906, -52.55606460571289, -50.977752685546875, -49.399444580078125, -47.82113265991211, -46.242820739746094, -44.664512634277344, -43.08620071411133, -41.50788879394531, -39.9295768737793, -38.35126495361328, -36.77295684814453, -35.194644927978516, -33.6163330078125, -32.03802490234375, -30.459712982177734, -28.88140106201172, -27.303089141845703, -25.72477912902832, -24.146469116210938, -22.568157196044922, -20.989845275878906, -19.411535263061523, -17.83322525024414, -16.254913330078125, -14.676602363586426, -13.098291397094727, -11.519980430603027, -9.941669464111328, -8.363358497619629, -6.78504753112793, -5.2067365646362305, -3.6284255981445312, -2.050114631652832, -0.4718036651611328, 1.1065073013305664, 2.6848182678222656, 4.263129234313965, 5.841440200805664, 7.419751167297363, 8.998062133789062, 10.576373100280762, 12.154684066772461, 13.73299503326416, 15.31130599975586, 16.889617919921875, 18.467927932739258, 20.04623794555664, 21.624549865722656, 23.202861785888672, 24.781171798706055, 26.359481811523438, 27.937793731689453, 29.51610565185547, 31.09441566467285, 32.672725677490234, 34.25103759765625, 35.829349517822266, 37.40766143798828, 38.98596954345703, 40.56428146362305, 42.14259338378906, 43.72090148925781, 45.29921340942383, 46.877525329589844]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 3.0, 3.0, 5.0, 9.0, 5.0, 16.0, 15.0, 31.0, 32.0, 60.0, 96.0, 129.0, 209.0, 324.0, 555.0, 949.0, 1803.0, 4078.0, 11813.0, 64788.0, 4014581.0, 73251.0, 12857.0, 4303.0, 1906.0, 926.0, 574.0, 336.0, 218.0, 134.0, 90.0, 54.0, 50.0, 23.0, 15.0, 13.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3984375, -12.0494384765625, -11.700439453125, -11.3514404296875, -11.00244140625, -10.6534423828125, -10.304443359375, -9.9554443359375, -9.6064453125, -9.2574462890625, -8.908447265625, -8.5594482421875, -8.21044921875, -7.8614501953125, -7.512451171875, -7.1634521484375, -6.814453125, -6.4654541015625, -6.116455078125, -5.7674560546875, -5.41845703125, -5.0694580078125, -4.720458984375, -4.3714599609375, -4.0224609375, -3.6734619140625, -3.324462890625, -2.9754638671875, -2.62646484375, -2.2774658203125, -1.928466796875, -1.5794677734375, -1.23046875, -0.8814697265625, -0.532470703125, -0.1834716796875, 0.16552734375, 0.5145263671875, 0.863525390625, 1.2125244140625, 1.5615234375, 1.9105224609375, 2.259521484375, 2.6085205078125, 2.95751953125, 3.3065185546875, 3.655517578125, 4.0045166015625, 4.353515625, 4.7025146484375, 5.051513671875, 5.4005126953125, 5.74951171875, 6.0985107421875, 6.447509765625, 6.7965087890625, 7.1455078125, 7.4945068359375, 7.843505859375, 8.1925048828125, 8.54150390625, 8.8905029296875, 9.239501953125, 9.5885009765625, 9.9375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 2.0, 3.0, 4.0, 9.0, 11.0, 15.0, 13.0, 27.0, 36.0, 37.0, 52.0, 48.0, 60.0, 76.0, 89.0, 67.0, 82.0, 64.0, 64.0, 60.0, 31.0, 31.0, 21.0, 17.0, 17.0, 10.0, 11.0, 8.0, 9.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09375, -3.00048828125, -2.9072265625, -2.81396484375, -2.720703125, -2.62744140625, -2.5341796875, -2.44091796875, -2.34765625, -2.25439453125, -2.1611328125, -2.06787109375, -1.974609375, -1.88134765625, -1.7880859375, -1.69482421875, -1.6015625, -1.50830078125, -1.4150390625, -1.32177734375, -1.228515625, -1.13525390625, -1.0419921875, -0.94873046875, -0.85546875, -0.76220703125, -0.6689453125, -0.57568359375, -0.482421875, -0.38916015625, -0.2958984375, -0.20263671875, -0.109375, -0.01611328125, 0.0771484375, 0.17041015625, 0.263671875, 0.35693359375, 0.4501953125, 0.54345703125, 0.63671875, 0.72998046875, 0.8232421875, 0.91650390625, 1.009765625, 1.10302734375, 1.1962890625, 1.28955078125, 1.3828125, 1.47607421875, 1.5693359375, 1.66259765625, 1.755859375, 1.84912109375, 1.9423828125, 2.03564453125, 2.12890625, 2.22216796875, 2.3154296875, 2.40869140625, 2.501953125, 2.59521484375, 2.6884765625, 2.78173828125, 2.875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 6.0, 8.0, 7.0, 11.0, 12.0, 15.0, 26.0, 26.0, 22.0, 52.0, 69.0, 78.0, 93.0, 119.0, 189.0, 347.0, 599.0, 1436.0, 3980.0, 15728.0, 2913287.0, 1235230.0, 15970.0, 3842.0, 1366.0, 645.0, 351.0, 183.0, 156.0, 122.0, 74.0, 52.0, 40.0, 36.0, 30.0, 21.0, 16.0, 15.0, 7.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.453125, -23.73388671875, -23.0146484375, -22.29541015625, -21.576171875, -20.85693359375, -20.1376953125, -19.41845703125, -18.69921875, -17.97998046875, -17.2607421875, -16.54150390625, -15.822265625, -15.10302734375, -14.3837890625, -13.66455078125, -12.9453125, -12.22607421875, -11.5068359375, -10.78759765625, -10.068359375, -9.34912109375, -8.6298828125, -7.91064453125, -7.19140625, -6.47216796875, -5.7529296875, -5.03369140625, -4.314453125, -3.59521484375, -2.8759765625, -2.15673828125, -1.4375, -0.71826171875, 0.0009765625, 0.72021484375, 1.439453125, 2.15869140625, 2.8779296875, 3.59716796875, 4.31640625, 5.03564453125, 5.7548828125, 6.47412109375, 7.193359375, 7.91259765625, 8.6318359375, 9.35107421875, 10.0703125, 10.78955078125, 11.5087890625, 12.22802734375, 12.947265625, 13.66650390625, 14.3857421875, 15.10498046875, 15.82421875, 16.54345703125, 17.2626953125, 17.98193359375, 18.701171875, 19.42041015625, 20.1396484375, 20.85888671875, 21.578125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 9.0, 12.0, 22.0, 50.0, 217.0, 3520.0, 152.0, 40.0, 29.0, 11.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.109375, -6.91400146484375, -6.7186279296875, -6.52325439453125, -6.327880859375, -6.13250732421875, -5.9371337890625, -5.74176025390625, -5.54638671875, -5.35101318359375, -5.1556396484375, -4.96026611328125, -4.764892578125, -4.56951904296875, -4.3741455078125, -4.17877197265625, -3.9833984375, -3.78802490234375, -3.5926513671875, -3.39727783203125, -3.201904296875, -3.00653076171875, -2.8111572265625, -2.61578369140625, -2.42041015625, -2.22503662109375, -2.0296630859375, -1.83428955078125, -1.638916015625, -1.44354248046875, -1.2481689453125, -1.05279541015625, -0.857421875, -0.66204833984375, -0.4666748046875, -0.27130126953125, -0.075927734375, 0.11944580078125, 0.3148193359375, 0.51019287109375, 0.70556640625, 0.90093994140625, 1.0963134765625, 1.29168701171875, 1.487060546875, 1.68243408203125, 1.8778076171875, 2.07318115234375, 2.2685546875, 2.46392822265625, 2.6593017578125, 2.85467529296875, 3.050048828125, 3.24542236328125, 3.4407958984375, 3.63616943359375, 3.83154296875, 4.02691650390625, 4.2222900390625, 4.41766357421875, 4.613037109375, 4.80841064453125, 5.0037841796875, 5.19915771484375, 5.39453125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 10.0, 5.0, 6.0, 21.0, 22.0, 59.0, 54.0, 91.0, 98.0, 124.0, 127.0, 134.0, 72.0, 55.0, 35.0, 26.0, 22.0, 12.0, 9.0, 3.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.344937324523926, -14.837417602539062, -14.329898834228516, -13.822379112243652, -13.314859390258789, -12.807340621948242, -12.299820899963379, -11.792301177978516, -11.284782409667969, -10.777262687683105, -10.269743919372559, -9.762224197387695, -9.254704475402832, -8.747184753417969, -8.239665985107422, -7.732146263122559, -7.224626541137695, -6.71710729598999, -6.209587574005127, -5.702068328857422, -5.194548606872559, -4.6870293617248535, -4.179510116577148, -3.6719906330108643, -3.16447114944458, -2.656951665878296, -2.1494321823120117, -1.6419129371643066, -1.1343934535980225, -0.6268739700317383, -0.1193547248840332, 0.388164758682251, 0.8956851959228516, 1.4032046794891357, 1.9107240438461304, 2.418243408203125, 2.925762891769409, 3.4332823753356934, 3.9408016204833984, 4.448321342468262, 4.955840587615967, 5.463359832763672, 5.970879554748535, 6.47839879989624, 6.985918045043945, 7.493437767028809, 8.000957489013672, 8.508476257324219, 9.015995979309082, 9.523515701293945, 10.031034469604492, 10.538554191589355, 11.046073913574219, 11.553592681884766, 12.061112403869629, 12.568632125854492, 13.076150894165039, 13.583670616149902, 14.09118938446045, 14.598709106445312, 15.106228828430176, 15.613748550415039, 16.121267318725586, 16.628786087036133, 17.136306762695312]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 6.0, 4.0, 7.0, 10.0, 19.0, 13.0, 10.0, 16.0, 23.0, 22.0, 21.0, 31.0, 21.0, 37.0, 25.0, 40.0, 36.0, 44.0, 54.0, 43.0, 36.0, 46.0, 38.0, 37.0, 40.0, 28.0, 28.0, 31.0, 36.0, 39.0, 22.0, 20.0, 23.0, 14.0, 15.0, 9.0, 14.0, 8.0, 8.0, 5.0, 5.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.398200988769531, -7.152790069580078, -6.907378673553467, -6.661967754364014, -6.416556358337402, -6.171145439147949, -5.925734519958496, -5.680323123931885, -5.434911727905273, -5.18950080871582, -4.944089412689209, -4.698678493499756, -4.4532670974731445, -4.207856178283691, -3.962445020675659, -3.717033863067627, -3.471622943878174, -3.2262117862701416, -2.9808006286621094, -2.7353897094726562, -2.489978313446045, -2.244567394256592, -1.9991562366485596, -1.7537450790405273, -1.5083339214324951, -1.262922763824463, -1.0175116062164307, -0.772100567817688, -0.5266894102096558, -0.28127825260162354, -0.03586721420288086, 0.20954394340515137, 0.4549551010131836, 0.7003662586212158, 0.9457773566246033, 1.1911884546279907, 1.436599612236023, 1.6820107698440552, 1.9274218082427979, 2.17283296585083, 2.4182441234588623, 2.6636552810668945, 2.9090664386749268, 3.154477596282959, 3.399888515472412, 3.6452999114990234, 3.8907108306884766, 4.13612174987793, 4.381533145904541, 4.626944065093994, 4.8723554611206055, 5.117766380310059, 5.36317777633667, 5.608588695526123, 5.854000091552734, 6.0994110107421875, 6.344821929931641, 6.590232849121094, 6.835644245147705, 7.081055164337158, 7.3264665603637695, 7.571877479553223, 7.817288398742676, 8.062700271606445, 8.308111190795898]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 15.0, 13.0, 28.0, 19.0, 49.0, 66.0, 123.0, 261.0, 458.0, 1126.0, 3018.0, 9975.0, 40248.0, 197362.0, 561491.0, 182624.0, 37393.0, 9307.0, 2853.0, 1064.0, 488.0, 236.0, 129.0, 54.0, 49.0, 28.0, 24.0, 15.0, 7.0, 9.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.359375, -10.08294677734375, -9.8065185546875, -9.53009033203125, -9.253662109375, -8.97723388671875, -8.7008056640625, -8.42437744140625, -8.14794921875, -7.87152099609375, -7.5950927734375, -7.31866455078125, -7.042236328125, -6.76580810546875, -6.4893798828125, -6.21295166015625, -5.9365234375, -5.66009521484375, -5.3836669921875, -5.10723876953125, -4.830810546875, -4.55438232421875, -4.2779541015625, -4.00152587890625, -3.72509765625, -3.44866943359375, -3.1722412109375, -2.89581298828125, -2.619384765625, -2.34295654296875, -2.0665283203125, -1.79010009765625, -1.513671875, -1.23724365234375, -0.9608154296875, -0.68438720703125, -0.407958984375, -0.13153076171875, 0.1448974609375, 0.42132568359375, 0.69775390625, 0.97418212890625, 1.2506103515625, 1.52703857421875, 1.803466796875, 2.07989501953125, 2.3563232421875, 2.63275146484375, 2.9091796875, 3.18560791015625, 3.4620361328125, 3.73846435546875, 4.014892578125, 4.29132080078125, 4.5677490234375, 4.84417724609375, 5.12060546875, 5.39703369140625, 5.6734619140625, 5.94989013671875, 6.226318359375, 6.50274658203125, 6.7791748046875, 7.05560302734375, 7.33203125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 10.0, 4.0, 5.0, 6.0, 15.0, 18.0, 20.0, 33.0, 38.0, 38.0, 41.0, 61.0, 45.0, 55.0, 66.0, 65.0, 64.0, 62.0, 54.0, 52.0, 44.0, 38.0, 24.0, 26.0, 22.0, 11.0, 11.0, 20.0, 13.0, 6.0, 6.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-3.451171875, -3.356689453125, -3.26220703125, -3.167724609375, -3.0732421875, -2.978759765625, -2.88427734375, -2.789794921875, -2.6953125, -2.600830078125, -2.50634765625, -2.411865234375, -2.3173828125, -2.222900390625, -2.12841796875, -2.033935546875, -1.939453125, -1.844970703125, -1.75048828125, -1.656005859375, -1.5615234375, -1.467041015625, -1.37255859375, -1.278076171875, -1.18359375, -1.089111328125, -0.99462890625, -0.900146484375, -0.8056640625, -0.711181640625, -0.61669921875, -0.522216796875, -0.427734375, -0.333251953125, -0.23876953125, -0.144287109375, -0.0498046875, 0.044677734375, 0.13916015625, 0.233642578125, 0.328125, 0.422607421875, 0.51708984375, 0.611572265625, 0.7060546875, 0.800537109375, 0.89501953125, 0.989501953125, 1.083984375, 1.178466796875, 1.27294921875, 1.367431640625, 1.4619140625, 1.556396484375, 1.65087890625, 1.745361328125, 1.83984375, 1.934326171875, 2.02880859375, 2.123291015625, 2.2177734375, 2.312255859375, 2.40673828125, 2.501220703125, 2.595703125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 9.0, 13.0, 12.0, 27.0, 37.0, 65.0, 113.0, 153.0, 275.0, 496.0, 891.0, 1753.0, 6186.0, 102639.0, 885297.0, 43032.0, 4205.0, 1519.0, 741.0, 417.0, 250.0, 133.0, 89.0, 60.0, 50.0, 31.0, 16.0, 17.0, 10.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0390625, -14.4222412109375, -13.805419921875, -13.1885986328125, -12.57177734375, -11.9549560546875, -11.338134765625, -10.7213134765625, -10.1044921875, -9.4876708984375, -8.870849609375, -8.2540283203125, -7.63720703125, -7.0203857421875, -6.403564453125, -5.7867431640625, -5.169921875, -4.5531005859375, -3.936279296875, -3.3194580078125, -2.70263671875, -2.0858154296875, -1.468994140625, -0.8521728515625, -0.2353515625, 0.3814697265625, 0.998291015625, 1.6151123046875, 2.23193359375, 2.8487548828125, 3.465576171875, 4.0823974609375, 4.69921875, 5.3160400390625, 5.932861328125, 6.5496826171875, 7.16650390625, 7.7833251953125, 8.400146484375, 9.0169677734375, 9.6337890625, 10.2506103515625, 10.867431640625, 11.4842529296875, 12.10107421875, 12.7178955078125, 13.334716796875, 13.9515380859375, 14.568359375, 15.1851806640625, 15.802001953125, 16.4188232421875, 17.03564453125, 17.6524658203125, 18.269287109375, 18.8861083984375, 19.5029296875, 20.1197509765625, 20.736572265625, 21.3533935546875, 21.97021484375, 22.5870361328125, 23.203857421875, 23.8206787109375, 24.4375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 2.0, 3.0, 19.0, 19.0, 20.0, 12.0, 29.0, 44.0, 56.0, 62.0, 72.0, 72.0, 75.0, 94.0, 64.0, 70.0, 55.0, 59.0, 38.0, 24.0, 29.0, 22.0, 16.0, 13.0, 11.0, 11.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.046875, -25.34716796875, -24.6474609375, -23.94775390625, -23.248046875, -22.54833984375, -21.8486328125, -21.14892578125, -20.44921875, -19.74951171875, -19.0498046875, -18.35009765625, -17.650390625, -16.95068359375, -16.2509765625, -15.55126953125, -14.8515625, -14.15185546875, -13.4521484375, -12.75244140625, -12.052734375, -11.35302734375, -10.6533203125, -9.95361328125, -9.25390625, -8.55419921875, -7.8544921875, -7.15478515625, -6.455078125, -5.75537109375, -5.0556640625, -4.35595703125, -3.65625, -2.95654296875, -2.2568359375, -1.55712890625, -0.857421875, -0.15771484375, 0.5419921875, 1.24169921875, 1.94140625, 2.64111328125, 3.3408203125, 4.04052734375, 4.740234375, 5.43994140625, 6.1396484375, 6.83935546875, 7.5390625, 8.23876953125, 8.9384765625, 9.63818359375, 10.337890625, 11.03759765625, 11.7373046875, 12.43701171875, 13.13671875, 13.83642578125, 14.5361328125, 15.23583984375, 15.935546875, 16.63525390625, 17.3349609375, 18.03466796875, 18.734375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 5.0, 8.0, 9.0, 8.0, 15.0, 24.0, 25.0, 30.0, 50.0, 75.0, 128.0, 181.0, 351.0, 641.0, 1521.0, 6263.0, 64304.0, 851653.0, 111233.0, 8376.0, 1879.0, 747.0, 368.0, 220.0, 135.0, 81.0, 50.0, 46.0, 25.0, 23.0, 17.0, 12.0, 11.0, 9.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-10.2421875, -9.9278564453125, -9.613525390625, -9.2991943359375, -8.98486328125, -8.6705322265625, -8.356201171875, -8.0418701171875, -7.7275390625, -7.4132080078125, -7.098876953125, -6.7845458984375, -6.47021484375, -6.1558837890625, -5.841552734375, -5.5272216796875, -5.212890625, -4.8985595703125, -4.584228515625, -4.2698974609375, -3.95556640625, -3.6412353515625, -3.326904296875, -3.0125732421875, -2.6982421875, -2.3839111328125, -2.069580078125, -1.7552490234375, -1.44091796875, -1.1265869140625, -0.812255859375, -0.4979248046875, -0.18359375, 0.1307373046875, 0.445068359375, 0.7593994140625, 1.07373046875, 1.3880615234375, 1.702392578125, 2.0167236328125, 2.3310546875, 2.6453857421875, 2.959716796875, 3.2740478515625, 3.58837890625, 3.9027099609375, 4.217041015625, 4.5313720703125, 4.845703125, 5.1600341796875, 5.474365234375, 5.7886962890625, 6.10302734375, 6.4173583984375, 6.731689453125, 7.0460205078125, 7.3603515625, 7.6746826171875, 7.989013671875, 8.3033447265625, 8.61767578125, 8.9320068359375, 9.246337890625, 9.5606689453125, 9.875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 5.0, 14.0, 11.0, 16.0, 13.0, 27.0, 24.0, 39.0, 46.0, 69.0, 80.0, 109.0, 104.0, 91.0, 82.0, 52.0, 45.0, 36.0, 31.0, 18.0, 18.0, 13.0, 14.0, 9.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009794235229492188, -0.0009481757879257202, -0.0009169280529022217, -0.0008856803178787231, -0.0008544325828552246, -0.0008231848478317261, -0.0007919371128082275, -0.000760689377784729, -0.0007294416427612305, -0.0006981939077377319, -0.0006669461727142334, -0.0006356984376907349, -0.0006044507026672363, -0.0005732029676437378, -0.0005419552326202393, -0.0005107074975967407, -0.0004794597625732422, -0.00044821202754974365, -0.0004169642925262451, -0.0003857165575027466, -0.00035446882247924805, -0.0003232210874557495, -0.000291973352432251, -0.00026072561740875244, -0.0002294778823852539, -0.00019823014736175537, -0.00016698241233825684, -0.0001357346773147583, -0.00010448694229125977, -7.323920726776123e-05, -4.1991472244262695e-05, -1.074373722076416e-05, 2.0503997802734375e-05, 5.175173282623291e-05, 8.299946784973145e-05, 0.00011424720287322998, 0.00014549493789672852, 0.00017674267292022705, 0.00020799040794372559, 0.00023923814296722412, 0.00027048587799072266, 0.0003017336130142212, 0.0003329813480377197, 0.00036422908306121826, 0.0003954768180847168, 0.00042672455310821533, 0.00045797228813171387, 0.0004892200231552124, 0.0005204677581787109, 0.0005517154932022095, 0.000582963228225708, 0.0006142109632492065, 0.0006454586982727051, 0.0006767064332962036, 0.0007079541683197021, 0.0007392019033432007, 0.0007704496383666992, 0.0008016973733901978, 0.0008329451084136963, 0.0008641928434371948, 0.0008954405784606934, 0.0009266883134841919, 0.0009579360485076904, 0.000989183783531189, 0.0010204315185546875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 11.0, 7.0, 16.0, 24.0, 36.0, 61.0, 98.0, 161.0, 296.0, 543.0, 1206.0, 3723.0, 23745.0, 621392.0, 375325.0, 16672.0, 2947.0, 1099.0, 515.0, 253.0, 157.0, 83.0, 53.0, 37.0, 24.0, 13.0, 15.0, 6.0, 4.0, 5.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8828125, -9.5411376953125, -9.199462890625, -8.8577880859375, -8.51611328125, -8.1744384765625, -7.832763671875, -7.4910888671875, -7.1494140625, -6.8077392578125, -6.466064453125, -6.1243896484375, -5.78271484375, -5.4410400390625, -5.099365234375, -4.7576904296875, -4.416015625, -4.0743408203125, -3.732666015625, -3.3909912109375, -3.04931640625, -2.7076416015625, -2.365966796875, -2.0242919921875, -1.6826171875, -1.3409423828125, -0.999267578125, -0.6575927734375, -0.31591796875, 0.0257568359375, 0.367431640625, 0.7091064453125, 1.05078125, 1.3924560546875, 1.734130859375, 2.0758056640625, 2.41748046875, 2.7591552734375, 3.100830078125, 3.4425048828125, 3.7841796875, 4.1258544921875, 4.467529296875, 4.8092041015625, 5.15087890625, 5.4925537109375, 5.834228515625, 6.1759033203125, 6.517578125, 6.8592529296875, 7.200927734375, 7.5426025390625, 7.88427734375, 8.2259521484375, 8.567626953125, 8.9093017578125, 9.2509765625, 9.5926513671875, 9.934326171875, 10.2760009765625, 10.61767578125, 10.9593505859375, 11.301025390625, 11.6427001953125, 11.984375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 9.0, 4.0, 9.0, 11.0, 13.0, 13.0, 17.0, 34.0, 53.0, 35.0, 61.0, 74.0, 88.0, 103.0, 85.0, 112.0, 70.0, 55.0, 47.0, 37.0, 16.0, 15.0, 11.0, 6.0, 9.0, 4.0, 2.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.93359375, -5.70318603515625, -5.4727783203125, -5.24237060546875, -5.011962890625, -4.78155517578125, -4.5511474609375, -4.32073974609375, -4.09033203125, -3.85992431640625, -3.6295166015625, -3.39910888671875, -3.168701171875, -2.93829345703125, -2.7078857421875, -2.47747802734375, -2.2470703125, -2.01666259765625, -1.7862548828125, -1.55584716796875, -1.325439453125, -1.09503173828125, -0.8646240234375, -0.63421630859375, -0.40380859375, -0.17340087890625, 0.0570068359375, 0.28741455078125, 0.517822265625, 0.74822998046875, 0.9786376953125, 1.20904541015625, 1.439453125, 1.66986083984375, 1.9002685546875, 2.13067626953125, 2.361083984375, 2.59149169921875, 2.8218994140625, 3.05230712890625, 3.28271484375, 3.51312255859375, 3.7435302734375, 3.97393798828125, 4.204345703125, 4.43475341796875, 4.6651611328125, 4.89556884765625, 5.1259765625, 5.35638427734375, 5.5867919921875, 5.81719970703125, 6.047607421875, 6.27801513671875, 6.5084228515625, 6.73883056640625, 6.96923828125, 7.19964599609375, 7.4300537109375, 7.66046142578125, 7.890869140625, 8.12127685546875, 8.3516845703125, 8.58209228515625, 8.8125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 23.0, 125.0, 422.0, 320.0, 89.0, 13.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-394.9014892578125, -385.2113037109375, -375.5211181640625, -365.8309326171875, -356.1407470703125, -346.4505615234375, -336.7603759765625, -327.0701904296875, -317.3800048828125, -307.6898193359375, -297.9996337890625, -288.3094482421875, -278.6192626953125, -268.9290771484375, -259.2388916015625, -249.5487060546875, -239.8585205078125, -230.1683349609375, -220.4781494140625, -210.7879638671875, -201.0977783203125, -191.4075927734375, -181.7174072265625, -172.0272216796875, -162.3370361328125, -152.6468505859375, -142.9566650390625, -133.2664794921875, -123.5762939453125, -113.8861083984375, -104.1959228515625, -94.5057373046875, -84.81552124023438, -75.12533569335938, -65.43515014648438, -55.744964599609375, -46.054779052734375, -36.364593505859375, -26.674407958984375, -16.984222412109375, -7.294036865234375, 2.396148681640625, 12.086334228515625, 21.776519775390625, 31.466705322265625, 41.156890869140625, 50.847076416015625, 60.537261962890625, 70.22744750976562, 79.91763305664062, 89.60781860351562, 99.29800415039062, 108.98818969726562, 118.67837524414062, 128.36856079101562, 138.05874633789062, 147.74893188476562, 157.43911743164062, 167.12930297851562, 176.81948852539062, 186.50967407226562, 196.19985961914062, 205.89004516601562, 215.58023071289062, 225.27041625976562]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 0.0, 3.0, 5.0, 7.0, 7.0, 8.0, 12.0, 10.0, 17.0, 20.0, 28.0, 30.0, 36.0, 32.0, 37.0, 39.0, 44.0, 51.0, 45.0, 50.0, 52.0, 50.0, 53.0, 46.0, 43.0, 27.0, 35.0, 33.0, 26.0, 27.0, 27.0, 22.0, 20.0, 9.0, 13.0, 7.0, 6.0, 9.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-66.11119842529297, -64.19395446777344, -62.27671813964844, -60.35947799682617, -58.442237854003906, -56.524993896484375, -54.60775375366211, -52.690513610839844, -50.77327346801758, -48.85603332519531, -46.93879318237305, -45.02155303955078, -43.10430908203125, -41.18707275390625, -39.26982879638672, -37.35258865356445, -35.43534851074219, -33.51810836791992, -31.600868225097656, -29.683626174926758, -27.766386032104492, -25.849145889282227, -23.931903839111328, -22.014663696289062, -20.097423553466797, -18.18018341064453, -16.262943267822266, -14.345701217651367, -12.428461074829102, -10.511220932006836, -8.593979835510254, -6.676738739013672, -4.759502410888672, -2.842261791229248, -0.9250211715698242, 0.9922194480895996, 2.9094600677490234, 4.826700210571289, 6.743941307067871, 8.661182403564453, 10.578422546386719, 12.495662689208984, 14.412903785705566, 16.33014488220215, 18.247385025024414, 20.16462516784668, 22.081867218017578, 23.999107360839844, 25.91634750366211, 27.833587646484375, 29.75082778930664, 31.66806983947754, 33.58531188964844, 35.50254821777344, 37.41979217529297, 39.337032318115234, 41.2542724609375, 43.171512603759766, 45.08875274658203, 47.0059928894043, 48.92323303222656, 50.840476989746094, 52.75771713256836, 54.674957275390625, 56.59219741821289]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 7.0, 6.0, 12.0, 10.0, 22.0, 22.0, 43.0, 51.0, 81.0, 116.0, 164.0, 305.0, 487.0, 928.0, 1851.0, 3648.0, 9054.0, 29654.0, 220110.0, 3810137.0, 87375.0, 17990.0, 6049.0, 2790.0, 1451.0, 744.0, 431.0, 250.0, 166.0, 118.0, 48.0, 51.0, 25.0, 24.0, 19.0, 18.0, 12.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.9765625, -8.7149658203125, -8.453369140625, -8.1917724609375, -7.93017578125, -7.6685791015625, -7.406982421875, -7.1453857421875, -6.8837890625, -6.6221923828125, -6.360595703125, -6.0989990234375, -5.83740234375, -5.5758056640625, -5.314208984375, -5.0526123046875, -4.791015625, -4.5294189453125, -4.267822265625, -4.0062255859375, -3.74462890625, -3.4830322265625, -3.221435546875, -2.9598388671875, -2.6982421875, -2.4366455078125, -2.175048828125, -1.9134521484375, -1.65185546875, -1.3902587890625, -1.128662109375, -0.8670654296875, -0.60546875, -0.3438720703125, -0.082275390625, 0.1793212890625, 0.44091796875, 0.7025146484375, 0.964111328125, 1.2257080078125, 1.4873046875, 1.7489013671875, 2.010498046875, 2.2720947265625, 2.53369140625, 2.7952880859375, 3.056884765625, 3.3184814453125, 3.580078125, 3.8416748046875, 4.103271484375, 4.3648681640625, 4.62646484375, 4.8880615234375, 5.149658203125, 5.4112548828125, 5.6728515625, 5.9344482421875, 6.196044921875, 6.4576416015625, 6.71923828125, 6.9808349609375, 7.242431640625, 7.5040283203125, 7.765625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 7.0, 4.0, 5.0, 14.0, 14.0, 31.0, 39.0, 41.0, 75.0, 63.0, 87.0, 81.0, 110.0, 89.0, 76.0, 56.0, 49.0, 49.0, 27.0, 19.0, 13.0, 13.0, 11.0, 4.0, 4.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1328125, -3.99652099609375, -3.8602294921875, -3.72393798828125, -3.587646484375, -3.45135498046875, -3.3150634765625, -3.17877197265625, -3.04248046875, -2.90618896484375, -2.7698974609375, -2.63360595703125, -2.497314453125, -2.36102294921875, -2.2247314453125, -2.08843994140625, -1.9521484375, -1.81585693359375, -1.6795654296875, -1.54327392578125, -1.406982421875, -1.27069091796875, -1.1343994140625, -0.99810791015625, -0.86181640625, -0.72552490234375, -0.5892333984375, -0.45294189453125, -0.316650390625, -0.18035888671875, -0.0440673828125, 0.09222412109375, 0.228515625, 0.36480712890625, 0.5010986328125, 0.63739013671875, 0.773681640625, 0.90997314453125, 1.0462646484375, 1.18255615234375, 1.31884765625, 1.45513916015625, 1.5914306640625, 1.72772216796875, 1.864013671875, 2.00030517578125, 2.1365966796875, 2.27288818359375, 2.4091796875, 2.54547119140625, 2.6817626953125, 2.81805419921875, 2.954345703125, 3.09063720703125, 3.2269287109375, 3.36322021484375, 3.49951171875, 3.63580322265625, 3.7720947265625, 3.90838623046875, 4.044677734375, 4.18096923828125, 4.3172607421875, 4.45355224609375, 4.58984375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 11.0, 8.0, 11.0, 20.0, 37.0, 55.0, 73.0, 150.0, 232.0, 485.0, 1029.0, 2623.0, 7747.0, 35247.0, 3442556.0, 666099.0, 27240.0, 6567.0, 2253.0, 850.0, 426.0, 196.0, 112.0, 75.0, 53.0, 35.0, 28.0, 15.0, 15.0, 7.0, 6.0, 4.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.890625, -14.4091796875, -13.927734375, -13.4462890625, -12.96484375, -12.4833984375, -12.001953125, -11.5205078125, -11.0390625, -10.5576171875, -10.076171875, -9.5947265625, -9.11328125, -8.6318359375, -8.150390625, -7.6689453125, -7.1875, -6.7060546875, -6.224609375, -5.7431640625, -5.26171875, -4.7802734375, -4.298828125, -3.8173828125, -3.3359375, -2.8544921875, -2.373046875, -1.8916015625, -1.41015625, -0.9287109375, -0.447265625, 0.0341796875, 0.515625, 0.9970703125, 1.478515625, 1.9599609375, 2.44140625, 2.9228515625, 3.404296875, 3.8857421875, 4.3671875, 4.8486328125, 5.330078125, 5.8115234375, 6.29296875, 6.7744140625, 7.255859375, 7.7373046875, 8.21875, 8.7001953125, 9.181640625, 9.6630859375, 10.14453125, 10.6259765625, 11.107421875, 11.5888671875, 12.0703125, 12.5517578125, 13.033203125, 13.5146484375, 13.99609375, 14.4775390625, 14.958984375, 15.4404296875, 15.921875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 12.0, 14.0, 13.0, 16.0, 57.0, 108.0, 359.0, 2770.0, 434.0, 121.0, 67.0, 26.0, 14.0, 17.0, 7.0, 8.0, 10.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7578125, -4.56414794921875, -4.3704833984375, -4.17681884765625, -3.983154296875, -3.78948974609375, -3.5958251953125, -3.40216064453125, -3.20849609375, -3.01483154296875, -2.8211669921875, -2.62750244140625, -2.433837890625, -2.24017333984375, -2.0465087890625, -1.85284423828125, -1.6591796875, -1.46551513671875, -1.2718505859375, -1.07818603515625, -0.884521484375, -0.69085693359375, -0.4971923828125, -0.30352783203125, -0.10986328125, 0.08380126953125, 0.2774658203125, 0.47113037109375, 0.664794921875, 0.85845947265625, 1.0521240234375, 1.24578857421875, 1.439453125, 1.63311767578125, 1.8267822265625, 2.02044677734375, 2.214111328125, 2.40777587890625, 2.6014404296875, 2.79510498046875, 2.98876953125, 3.18243408203125, 3.3760986328125, 3.56976318359375, 3.763427734375, 3.95709228515625, 4.1507568359375, 4.34442138671875, 4.5380859375, 4.73175048828125, 4.9254150390625, 5.11907958984375, 5.312744140625, 5.50640869140625, 5.7000732421875, 5.89373779296875, 6.08740234375, 6.28106689453125, 6.4747314453125, 6.66839599609375, 6.862060546875, 7.05572509765625, 7.2493896484375, 7.44305419921875, 7.63671875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 15.0, 28.0, 63.0, 108.0, 182.0, 205.0, 171.0, 137.0, 52.0, 17.0, 10.0, 9.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.58665466308594, -46.381343841552734, -45.17603302001953, -43.97071838378906, -42.76540756225586, -41.560096740722656, -40.35478591918945, -39.14947509765625, -37.94416046142578, -36.73884963989258, -35.533538818359375, -34.328224182128906, -33.1229133605957, -31.9176025390625, -30.712291717529297, -29.506980895996094, -28.30167007446289, -27.096359252929688, -25.89104652404785, -24.68573570251465, -23.480422973632812, -22.27511215209961, -21.069801330566406, -19.864490509033203, -18.659177780151367, -17.453866958618164, -16.248554229736328, -15.043243408203125, -13.837931632995605, -12.632619857788086, -11.427309036254883, -10.221997261047363, -9.016681671142578, -7.811369895935059, -6.606058597564697, -5.400747299194336, -4.195435523986816, -2.990123748779297, -1.7848124504089355, -0.5795011520385742, 0.6258106231689453, 1.8311221599578857, 3.036433696746826, 4.2417449951171875, 5.447056770324707, 6.652368545532227, 7.857679843902588, 9.06299114227295, 10.268302917480469, 11.473614692687988, 12.678926467895508, 13.884237289428711, 15.08954906463623, 16.29486083984375, 17.500171661376953, 18.705482482910156, 19.910795211791992, 21.116106033325195, 22.32141876220703, 23.526729583740234, 24.732040405273438, 25.937353134155273, 27.142663955688477, 28.347976684570312, 29.553287506103516]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 0.0, 4.0, 6.0, 5.0, 6.0, 9.0, 11.0, 18.0, 8.0, 15.0, 20.0, 18.0, 30.0, 23.0, 28.0, 32.0, 38.0, 51.0, 50.0, 38.0, 35.0, 41.0, 43.0, 46.0, 37.0, 39.0, 28.0, 30.0, 42.0, 35.0, 27.0, 24.0, 26.0, 24.0, 12.0, 21.0, 16.0, 11.0, 12.0, 7.0, 8.0, 7.0, 4.0, 6.0, 4.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.290494918823242, -12.892053604125977, -12.493612289428711, -12.095170974731445, -11.696728706359863, -11.298287391662598, -10.899846076965332, -10.501404762268066, -10.1029634475708, -9.704522132873535, -9.30608081817627, -8.907638549804688, -8.509197235107422, -8.110755920410156, -7.712314605712891, -7.313873291015625, -6.915431499481201, -6.5169901847839355, -6.118548393249512, -5.720107078552246, -5.3216657638549805, -4.923224449157715, -4.524782657623291, -4.126341342926025, -3.7278997898101807, -3.329458236694336, -2.9310169219970703, -2.5325753688812256, -2.134133815765381, -1.7356925010681152, -1.3372509479522705, -0.9388096332550049, -0.5403680801391602, -0.1419266164302826, 0.25651484727859497, 0.6549563407897949, 1.05339777469635, 1.4518392086029053, 1.85028076171875, 2.2487220764160156, 2.6471636295318604, 3.045605182647705, 3.4440464973449707, 3.8424880504608154, 4.24092960357666, 4.639370918273926, 5.037812232971191, 5.436253547668457, 5.834695339202881, 6.2331366539001465, 6.63157844543457, 7.030019760131836, 7.428461074829102, 7.826902389526367, 8.225343704223633, 8.623785018920898, 9.02222728729248, 9.420668601989746, 9.819109916687012, 10.217552185058594, 10.61599349975586, 11.014434814453125, 11.41287612915039, 11.811317443847656, 12.209758758544922]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 5.0, 12.0, 6.0, 9.0, 13.0, 19.0, 36.0, 55.0, 80.0, 118.0, 226.0, 339.0, 616.0, 1155.0, 2384.0, 5117.0, 11803.0, 31157.0, 87034.0, 279180.0, 416521.0, 135270.0, 46907.0, 17098.0, 6983.0, 3046.0, 1462.0, 793.0, 411.0, 225.0, 163.0, 96.0, 63.0, 50.0, 33.0, 24.0, 18.0, 7.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-8.7578125, -8.515869140625, -8.27392578125, -8.031982421875, -7.7900390625, -7.548095703125, -7.30615234375, -7.064208984375, -6.822265625, -6.580322265625, -6.33837890625, -6.096435546875, -5.8544921875, -5.612548828125, -5.37060546875, -5.128662109375, -4.88671875, -4.644775390625, -4.40283203125, -4.160888671875, -3.9189453125, -3.677001953125, -3.43505859375, -3.193115234375, -2.951171875, -2.709228515625, -2.46728515625, -2.225341796875, -1.9833984375, -1.741455078125, -1.49951171875, -1.257568359375, -1.015625, -0.773681640625, -0.53173828125, -0.289794921875, -0.0478515625, 0.194091796875, 0.43603515625, 0.677978515625, 0.919921875, 1.161865234375, 1.40380859375, 1.645751953125, 1.8876953125, 2.129638671875, 2.37158203125, 2.613525390625, 2.85546875, 3.097412109375, 3.33935546875, 3.581298828125, 3.8232421875, 4.065185546875, 4.30712890625, 4.549072265625, 4.791015625, 5.032958984375, 5.27490234375, 5.516845703125, 5.7587890625, 6.000732421875, 6.24267578125, 6.484619140625, 6.7265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 7.0, 6.0, 13.0, 10.0, 11.0, 26.0, 32.0, 33.0, 37.0, 42.0, 47.0, 76.0, 68.0, 69.0, 76.0, 69.0, 51.0, 59.0, 49.0, 51.0, 26.0, 20.0, 21.0, 21.0, 20.0, 15.0, 18.0, 8.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.60546875, -3.490447998046875, -3.37542724609375, -3.260406494140625, -3.1453857421875, -3.030364990234375, -2.91534423828125, -2.800323486328125, -2.685302734375, -2.570281982421875, -2.45526123046875, -2.340240478515625, -2.2252197265625, -2.110198974609375, -1.99517822265625, -1.880157470703125, -1.76513671875, -1.650115966796875, -1.53509521484375, -1.420074462890625, -1.3050537109375, -1.190032958984375, -1.07501220703125, -0.959991455078125, -0.844970703125, -0.729949951171875, -0.61492919921875, -0.499908447265625, -0.3848876953125, -0.269866943359375, -0.15484619140625, -0.039825439453125, 0.0751953125, 0.190216064453125, 0.30523681640625, 0.420257568359375, 0.5352783203125, 0.650299072265625, 0.76531982421875, 0.880340576171875, 0.995361328125, 1.110382080078125, 1.22540283203125, 1.340423583984375, 1.4554443359375, 1.570465087890625, 1.68548583984375, 1.800506591796875, 1.91552734375, 2.030548095703125, 2.14556884765625, 2.260589599609375, 2.3756103515625, 2.490631103515625, 2.60565185546875, 2.720672607421875, 2.835693359375, 2.950714111328125, 3.06573486328125, 3.180755615234375, 3.2957763671875, 3.410797119140625, 3.52581787109375, 3.640838623046875, 3.755859375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 13.0, 2.0, 6.0, 7.0, 21.0, 24.0, 27.0, 38.0, 62.0, 95.0, 122.0, 200.0, 296.0, 467.0, 725.0, 1284.0, 2616.0, 7554.0, 43369.0, 559285.0, 387537.0, 32776.0, 6478.0, 2313.0, 1244.0, 714.0, 378.0, 269.0, 189.0, 138.0, 97.0, 65.0, 32.0, 37.0, 17.0, 13.0, 13.0, 10.0, 7.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.96875, -15.48388671875, -14.9990234375, -14.51416015625, -14.029296875, -13.54443359375, -13.0595703125, -12.57470703125, -12.08984375, -11.60498046875, -11.1201171875, -10.63525390625, -10.150390625, -9.66552734375, -9.1806640625, -8.69580078125, -8.2109375, -7.72607421875, -7.2412109375, -6.75634765625, -6.271484375, -5.78662109375, -5.3017578125, -4.81689453125, -4.33203125, -3.84716796875, -3.3623046875, -2.87744140625, -2.392578125, -1.90771484375, -1.4228515625, -0.93798828125, -0.453125, 0.03173828125, 0.5166015625, 1.00146484375, 1.486328125, 1.97119140625, 2.4560546875, 2.94091796875, 3.42578125, 3.91064453125, 4.3955078125, 4.88037109375, 5.365234375, 5.85009765625, 6.3349609375, 6.81982421875, 7.3046875, 7.78955078125, 8.2744140625, 8.75927734375, 9.244140625, 9.72900390625, 10.2138671875, 10.69873046875, 11.18359375, 11.66845703125, 12.1533203125, 12.63818359375, 13.123046875, 13.60791015625, 14.0927734375, 14.57763671875, 15.0625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 5.0, 8.0, 8.0, 12.0, 4.0, 7.0, 8.0, 15.0, 12.0, 22.0, 30.0, 31.0, 38.0, 35.0, 63.0, 50.0, 47.0, 58.0, 53.0, 62.0, 55.0, 53.0, 49.0, 48.0, 39.0, 31.0, 32.0, 22.0, 21.0, 16.0, 8.0, 11.0, 10.0, 9.0, 10.0, 8.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2578125, -11.7777099609375, -11.297607421875, -10.8175048828125, -10.33740234375, -9.8572998046875, -9.377197265625, -8.8970947265625, -8.4169921875, -7.9368896484375, -7.456787109375, -6.9766845703125, -6.49658203125, -6.0164794921875, -5.536376953125, -5.0562744140625, -4.576171875, -4.0960693359375, -3.615966796875, -3.1358642578125, -2.65576171875, -2.1756591796875, -1.695556640625, -1.2154541015625, -0.7353515625, -0.2552490234375, 0.224853515625, 0.7049560546875, 1.18505859375, 1.6651611328125, 2.145263671875, 2.6253662109375, 3.10546875, 3.5855712890625, 4.065673828125, 4.5457763671875, 5.02587890625, 5.5059814453125, 5.986083984375, 6.4661865234375, 6.9462890625, 7.4263916015625, 7.906494140625, 8.3865966796875, 8.86669921875, 9.3468017578125, 9.826904296875, 10.3070068359375, 10.787109375, 11.2672119140625, 11.747314453125, 12.2274169921875, 12.70751953125, 13.1876220703125, 13.667724609375, 14.1478271484375, 14.6279296875, 15.1080322265625, 15.588134765625, 16.0682373046875, 16.54833984375, 17.0284423828125, 17.508544921875, 17.9886474609375, 18.46875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 6.0, 8.0, 8.0, 17.0, 19.0, 17.0, 35.0, 39.0, 65.0, 114.0, 158.0, 303.0, 533.0, 1000.0, 2311.0, 6031.0, 22245.0, 142474.0, 706855.0, 134484.0, 21430.0, 5807.0, 2233.0, 1009.0, 522.0, 304.0, 189.0, 103.0, 69.0, 58.0, 31.0, 15.0, 17.0, 14.0, 6.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.953125, -6.76763916015625, -6.5821533203125, -6.39666748046875, -6.211181640625, -6.02569580078125, -5.8402099609375, -5.65472412109375, -5.46923828125, -5.28375244140625, -5.0982666015625, -4.91278076171875, -4.727294921875, -4.54180908203125, -4.3563232421875, -4.17083740234375, -3.9853515625, -3.79986572265625, -3.6143798828125, -3.42889404296875, -3.243408203125, -3.05792236328125, -2.8724365234375, -2.68695068359375, -2.50146484375, -2.31597900390625, -2.1304931640625, -1.94500732421875, -1.759521484375, -1.57403564453125, -1.3885498046875, -1.20306396484375, -1.017578125, -0.83209228515625, -0.6466064453125, -0.46112060546875, -0.275634765625, -0.09014892578125, 0.0953369140625, 0.28082275390625, 0.46630859375, 0.65179443359375, 0.8372802734375, 1.02276611328125, 1.208251953125, 1.39373779296875, 1.5792236328125, 1.76470947265625, 1.9501953125, 2.13568115234375, 2.3211669921875, 2.50665283203125, 2.692138671875, 2.87762451171875, 3.0631103515625, 3.24859619140625, 3.43408203125, 3.61956787109375, 3.8050537109375, 3.99053955078125, 4.176025390625, 4.36151123046875, 4.5469970703125, 4.73248291015625, 4.91796875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 7.0, 6.0, 6.0, 15.0, 22.0, 25.0, 24.0, 46.0, 51.0, 77.0, 93.0, 138.0, 135.0, 85.0, 60.0, 35.0, 37.0, 25.0, 31.0, 21.0, 11.0, 10.0, 10.0, 9.0, 5.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011386871337890625, -0.0010962188243865967, -0.0010537505149841309, -0.001011282205581665, -0.0009688138961791992, -0.0009263455867767334, -0.0008838772773742676, -0.0008414089679718018, -0.0007989406585693359, -0.0007564723491668701, -0.0007140040397644043, -0.0006715357303619385, -0.0006290674209594727, -0.0005865991115570068, -0.000544130802154541, -0.0005016624927520752, -0.0004591941833496094, -0.00041672587394714355, -0.00037425756454467773, -0.0003317892551422119, -0.0002893209457397461, -0.0002468526363372803, -0.00020438432693481445, -0.00016191601753234863, -0.00011944770812988281, -7.697939872741699e-05, -3.451108932495117e-05, 7.957220077514648e-06, 5.042552947998047e-05, 9.289383888244629e-05, 0.0001353621482849121, 0.00017783045768737793, 0.00022029876708984375, 0.00026276707649230957, 0.0003052353858947754, 0.0003477036952972412, 0.00039017200469970703, 0.00043264031410217285, 0.00047510862350463867, 0.0005175769329071045, 0.0005600452423095703, 0.0006025135517120361, 0.000644981861114502, 0.0006874501705169678, 0.0007299184799194336, 0.0007723867893218994, 0.0008148550987243652, 0.0008573234081268311, 0.0008997917175292969, 0.0009422600269317627, 0.0009847283363342285, 0.0010271966457366943, 0.0010696649551391602, 0.001112133264541626, 0.0011546015739440918, 0.0011970698833465576, 0.0012395381927490234, 0.0012820065021514893, 0.001324474811553955, 0.001366943120956421, 0.0014094114303588867, 0.0014518797397613525, 0.0014943480491638184, 0.0015368163585662842, 0.00157928466796875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 6.0, 5.0, 10.0, 16.0, 16.0, 11.0, 25.0, 33.0, 52.0, 70.0, 96.0, 136.0, 238.0, 417.0, 790.0, 1716.0, 4684.0, 19878.0, 180178.0, 731265.0, 90080.0, 12419.0, 3392.0, 1373.0, 660.0, 365.0, 202.0, 132.0, 80.0, 60.0, 42.0, 31.0, 15.0, 11.0, 11.0, 3.0, 6.0, 4.0, 1.0, 6.0, 2.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.328125, -6.1263427734375, -5.924560546875, -5.7227783203125, -5.52099609375, -5.3192138671875, -5.117431640625, -4.9156494140625, -4.7138671875, -4.5120849609375, -4.310302734375, -4.1085205078125, -3.90673828125, -3.7049560546875, -3.503173828125, -3.3013916015625, -3.099609375, -2.8978271484375, -2.696044921875, -2.4942626953125, -2.29248046875, -2.0906982421875, -1.888916015625, -1.6871337890625, -1.4853515625, -1.2835693359375, -1.081787109375, -0.8800048828125, -0.67822265625, -0.4764404296875, -0.274658203125, -0.0728759765625, 0.12890625, 0.3306884765625, 0.532470703125, 0.7342529296875, 0.93603515625, 1.1378173828125, 1.339599609375, 1.5413818359375, 1.7431640625, 1.9449462890625, 2.146728515625, 2.3485107421875, 2.55029296875, 2.7520751953125, 2.953857421875, 3.1556396484375, 3.357421875, 3.5592041015625, 3.760986328125, 3.9627685546875, 4.16455078125, 4.3663330078125, 4.568115234375, 4.7698974609375, 4.9716796875, 5.1734619140625, 5.375244140625, 5.5770263671875, 5.77880859375, 5.9805908203125, 6.182373046875, 6.3841552734375, 6.5859375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 5.0, 7.0, 6.0, 10.0, 14.0, 25.0, 30.0, 27.0, 46.0, 46.0, 70.0, 89.0, 105.0, 100.0, 69.0, 88.0, 57.0, 61.0, 29.0, 24.0, 21.0, 21.0, 13.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.30078125, -5.135986328125, -4.97119140625, -4.806396484375, -4.6416015625, -4.476806640625, -4.31201171875, -4.147216796875, -3.982421875, -3.817626953125, -3.65283203125, -3.488037109375, -3.3232421875, -3.158447265625, -2.99365234375, -2.828857421875, -2.6640625, -2.499267578125, -2.33447265625, -2.169677734375, -2.0048828125, -1.840087890625, -1.67529296875, -1.510498046875, -1.345703125, -1.180908203125, -1.01611328125, -0.851318359375, -0.6865234375, -0.521728515625, -0.35693359375, -0.192138671875, -0.02734375, 0.137451171875, 0.30224609375, 0.467041015625, 0.6318359375, 0.796630859375, 0.96142578125, 1.126220703125, 1.291015625, 1.455810546875, 1.62060546875, 1.785400390625, 1.9501953125, 2.114990234375, 2.27978515625, 2.444580078125, 2.609375, 2.774169921875, 2.93896484375, 3.103759765625, 3.2685546875, 3.433349609375, 3.59814453125, 3.762939453125, 3.927734375, 4.092529296875, 4.25732421875, 4.422119140625, 4.5869140625, 4.751708984375, 4.91650390625, 5.081298828125, 5.24609375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 8.0, 19.0, 25.0, 67.0, 140.0, 206.0, 209.0, 162.0, 88.0, 32.0, 19.0, 11.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-166.58319091796875, -161.975830078125, -157.36846923828125, -152.7611083984375, -148.15374755859375, -143.54638671875, -138.93902587890625, -134.3316650390625, -129.72430419921875, -125.116943359375, -120.50958251953125, -115.9022216796875, -111.29486083984375, -106.6875, -102.08013916015625, -97.4727783203125, -92.86540985107422, -88.25804901123047, -83.65068817138672, -79.04332733154297, -74.43596649169922, -69.82860565185547, -65.22123718261719, -60.6138801574707, -56.00651931762695, -51.3991584777832, -46.79179763793945, -42.18443298339844, -37.57707214355469, -32.96971130371094, -28.362350463867188, -23.754989624023438, -19.147628784179688, -14.540267944335938, -9.932906150817871, -5.325544357299805, -0.7181835174560547, 3.8891773223876953, 8.496540069580078, 13.103900909423828, 17.711261749267578, 22.318622589111328, 26.925983428955078, 31.53334617614746, 36.140708923339844, 40.748069763183594, 45.355430603027344, 49.962791442871094, 54.570152282714844, 59.177513122558594, 63.784873962402344, 68.3922348022461, 72.99959564208984, 77.6069564819336, 82.21432495117188, 86.82168579101562, 91.42904663085938, 96.03640747070312, 100.64376831054688, 105.25112915039062, 109.85848999023438, 114.46585083007812, 119.07321166992188, 123.68057250976562, 128.28793334960938]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 8.0, 6.0, 10.0, 8.0, 4.0, 10.0, 19.0, 22.0, 27.0, 19.0, 36.0, 48.0, 34.0, 36.0, 47.0, 54.0, 66.0, 57.0, 53.0, 53.0, 53.0, 58.0, 59.0, 40.0, 40.0, 24.0, 31.0, 16.0, 17.0, 15.0, 6.0, 12.0, 7.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.17760467529297, -63.88184356689453, -61.58608627319336, -59.29032897949219, -56.99456787109375, -54.69880676269531, -52.40304946899414, -50.10729217529297, -47.81153106689453, -45.515769958496094, -43.22001266479492, -40.92425537109375, -38.62849426269531, -36.332733154296875, -34.0369758605957, -31.7412166595459, -29.445457458496094, -27.14969825744629, -24.853939056396484, -22.55817985534668, -20.262420654296875, -17.96666145324707, -15.670902252197266, -13.375143051147461, -11.079383850097656, -8.783624649047852, -6.487865447998047, -4.192106246948242, -1.8963470458984375, 0.3994121551513672, 2.695171356201172, 4.990930557250977, 7.28668212890625, 9.582441329956055, 11.87820053100586, 14.173959732055664, 16.46971893310547, 18.765478134155273, 21.061237335205078, 23.356996536254883, 25.652755737304688, 27.948514938354492, 30.244274139404297, 32.54003143310547, 34.835792541503906, 37.131553649902344, 39.427310943603516, 41.72306823730469, 44.018829345703125, 46.31459045410156, 48.610347747802734, 50.906105041503906, 53.201866149902344, 55.49762725830078, 57.79338455200195, 60.089141845703125, 62.38490295410156, 64.6806640625, 66.97642517089844, 69.27217864990234, 71.56793975830078, 73.86370086669922, 76.15945434570312, 78.45521545410156, 80.7509765625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 15.0, 11.0, 19.0, 17.0, 40.0, 41.0, 100.0, 137.0, 233.0, 370.0, 578.0, 1021.0, 1803.0, 3394.0, 6821.0, 15568.0, 40497.0, 142870.0, 1014561.0, 2532749.0, 320827.0, 68684.0, 23411.0, 9726.0, 4601.0, 2473.0, 1428.0, 806.0, 525.0, 300.0, 200.0, 145.0, 89.0, 69.0, 44.0, 29.0, 20.0, 11.0, 7.0, 9.0, 9.0, 5.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.59765625, -4.44561767578125, -4.2935791015625, -4.14154052734375, -3.989501953125, -3.83746337890625, -3.6854248046875, -3.53338623046875, -3.38134765625, -3.22930908203125, -3.0772705078125, -2.92523193359375, -2.773193359375, -2.62115478515625, -2.4691162109375, -2.31707763671875, -2.1650390625, -2.01300048828125, -1.8609619140625, -1.70892333984375, -1.556884765625, -1.40484619140625, -1.2528076171875, -1.10076904296875, -0.94873046875, -0.79669189453125, -0.6446533203125, -0.49261474609375, -0.340576171875, -0.18853759765625, -0.0364990234375, 0.11553955078125, 0.267578125, 0.41961669921875, 0.5716552734375, 0.72369384765625, 0.875732421875, 1.02777099609375, 1.1798095703125, 1.33184814453125, 1.48388671875, 1.63592529296875, 1.7879638671875, 1.94000244140625, 2.092041015625, 2.24407958984375, 2.3961181640625, 2.54815673828125, 2.7001953125, 2.85223388671875, 3.0042724609375, 3.15631103515625, 3.308349609375, 3.46038818359375, 3.6124267578125, 3.76446533203125, 3.91650390625, 4.06854248046875, 4.2205810546875, 4.37261962890625, 4.524658203125, 4.67669677734375, 4.8287353515625, 4.98077392578125, 5.1328125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 13.0, 11.0, 16.0, 20.0, 26.0, 35.0, 44.0, 45.0, 74.0, 65.0, 83.0, 64.0, 74.0, 75.0, 63.0, 58.0, 39.0, 40.0, 41.0, 23.0, 17.0, 21.0, 17.0, 9.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.353515625, -3.238555908203125, -3.12359619140625, -3.008636474609375, -2.8936767578125, -2.778717041015625, -2.66375732421875, -2.548797607421875, -2.433837890625, -2.318878173828125, -2.20391845703125, -2.088958740234375, -1.9739990234375, -1.859039306640625, -1.74407958984375, -1.629119873046875, -1.51416015625, -1.399200439453125, -1.28424072265625, -1.169281005859375, -1.0543212890625, -0.939361572265625, -0.82440185546875, -0.709442138671875, -0.594482421875, -0.479522705078125, -0.36456298828125, -0.249603271484375, -0.1346435546875, -0.019683837890625, 0.09527587890625, 0.210235595703125, 0.3251953125, 0.440155029296875, 0.55511474609375, 0.670074462890625, 0.7850341796875, 0.899993896484375, 1.01495361328125, 1.129913330078125, 1.244873046875, 1.359832763671875, 1.47479248046875, 1.589752197265625, 1.7047119140625, 1.819671630859375, 1.93463134765625, 2.049591064453125, 2.16455078125, 2.279510498046875, 2.39447021484375, 2.509429931640625, 2.6243896484375, 2.739349365234375, 2.85430908203125, 2.969268798828125, 3.084228515625, 3.199188232421875, 3.31414794921875, 3.429107666015625, 3.5440673828125, 3.659027099609375, 3.77398681640625, 3.888946533203125, 4.00390625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 6.0, 6.0, 9.0, 18.0, 15.0, 24.0, 33.0, 53.0, 70.0, 158.0, 283.0, 625.0, 1543.0, 4603.0, 16928.0, 83867.0, 1279015.0, 2650528.0, 124742.0, 22541.0, 5834.0, 1844.0, 728.0, 350.0, 182.0, 88.0, 69.0, 37.0, 29.0, 17.0, 15.0, 7.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.703125, -10.3892822265625, -10.075439453125, -9.7615966796875, -9.44775390625, -9.1339111328125, -8.820068359375, -8.5062255859375, -8.1923828125, -7.8785400390625, -7.564697265625, -7.2508544921875, -6.93701171875, -6.6231689453125, -6.309326171875, -5.9954833984375, -5.681640625, -5.3677978515625, -5.053955078125, -4.7401123046875, -4.42626953125, -4.1124267578125, -3.798583984375, -3.4847412109375, -3.1708984375, -2.8570556640625, -2.543212890625, -2.2293701171875, -1.91552734375, -1.6016845703125, -1.287841796875, -0.9739990234375, -0.66015625, -0.3463134765625, -0.032470703125, 0.2813720703125, 0.59521484375, 0.9090576171875, 1.222900390625, 1.5367431640625, 1.8505859375, 2.1644287109375, 2.478271484375, 2.7921142578125, 3.10595703125, 3.4197998046875, 3.733642578125, 4.0474853515625, 4.361328125, 4.6751708984375, 4.989013671875, 5.3028564453125, 5.61669921875, 5.9305419921875, 6.244384765625, 6.5582275390625, 6.8720703125, 7.1859130859375, 7.499755859375, 7.8135986328125, 8.12744140625, 8.4412841796875, 8.755126953125, 9.0689697265625, 9.3828125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 3.0, 4.0, 1.0, 8.0, 8.0, 7.0, 8.0, 12.0, 18.0, 23.0, 26.0, 44.0, 58.0, 97.0, 123.0, 197.0, 333.0, 558.0, 822.0, 655.0, 388.0, 222.0, 154.0, 93.0, 48.0, 42.0, 29.0, 29.0, 13.0, 11.0, 14.0, 10.0, 9.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8203125, -6.5438232421875, -6.267333984375, -5.9908447265625, -5.71435546875, -5.4378662109375, -5.161376953125, -4.8848876953125, -4.6083984375, -4.3319091796875, -4.055419921875, -3.7789306640625, -3.50244140625, -3.2259521484375, -2.949462890625, -2.6729736328125, -2.396484375, -2.1199951171875, -1.843505859375, -1.5670166015625, -1.29052734375, -1.0140380859375, -0.737548828125, -0.4610595703125, -0.1845703125, 0.0919189453125, 0.368408203125, 0.6448974609375, 0.92138671875, 1.1978759765625, 1.474365234375, 1.7508544921875, 2.02734375, 2.3038330078125, 2.580322265625, 2.8568115234375, 3.13330078125, 3.4097900390625, 3.686279296875, 3.9627685546875, 4.2392578125, 4.5157470703125, 4.792236328125, 5.0687255859375, 5.34521484375, 5.6217041015625, 5.898193359375, 6.1746826171875, 6.451171875, 6.7276611328125, 7.004150390625, 7.2806396484375, 7.55712890625, 7.8336181640625, 8.110107421875, 8.3865966796875, 8.6630859375, 8.9395751953125, 9.216064453125, 9.4925537109375, 9.76904296875, 10.0455322265625, 10.322021484375, 10.5985107421875, 10.875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 10.0, 26.0, 88.0, 166.0, 268.0, 258.0, 107.0, 44.0, 10.0, 3.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-238.91790771484375, -234.23193359375, -229.54595947265625, -224.8599853515625, -220.1740264892578, -215.48805236816406, -210.8020782470703, -206.11610412597656, -201.4301300048828, -196.74415588378906, -192.0581817626953, -187.37222290039062, -182.68624877929688, -178.00027465820312, -173.31430053710938, -168.62832641601562, -163.94235229492188, -159.25637817382812, -154.57040405273438, -149.88442993164062, -145.19847106933594, -140.5124969482422, -135.82652282714844, -131.1405487060547, -126.45458984375, -121.76861572265625, -117.08264923095703, -112.39667510986328, -107.71070098876953, -103.02473449707031, -98.33876037597656, -93.65278625488281, -88.96681213378906, -84.28083801269531, -79.5948715209961, -74.90889739990234, -70.2229232788086, -65.53695678710938, -60.850982666015625, -56.165008544921875, -51.479034423828125, -46.79306411743164, -42.10708999633789, -37.421119689941406, -32.735145568847656, -28.049175262451172, -23.363204956054688, -18.677230834960938, -13.991260528564453, -9.305288314819336, -4.619317054748535, 0.06665420532226562, 4.752626419067383, 9.4385986328125, 14.124568939208984, 18.810543060302734, 23.49651336669922, 28.182485580444336, 32.86845779418945, 37.55442810058594, 42.24040222167969, 46.92637252807617, 51.612342834472656, 56.298316955566406, 60.98428726196289]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 7.0, 10.0, 5.0, 12.0, 16.0, 22.0, 11.0, 20.0, 34.0, 28.0, 41.0, 38.0, 39.0, 43.0, 39.0, 35.0, 39.0, 67.0, 45.0, 47.0, 47.0, 43.0, 50.0, 39.0, 39.0, 33.0, 23.0, 27.0, 16.0, 17.0, 5.0, 16.0, 9.0, 6.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.99607849121094, -39.68263244628906, -38.36919021606445, -37.05574417114258, -35.74230194091797, -34.428855895996094, -33.115413665771484, -31.80196762084961, -30.488523483276367, -29.175079345703125, -27.861635208129883, -26.54819107055664, -25.234745025634766, -23.921302795410156, -22.60785675048828, -21.29441261291504, -19.980968475341797, -18.667524337768555, -17.354080200195312, -16.04063606262207, -14.727190971374512, -13.41374683380127, -12.100301742553711, -10.786857604980469, -9.473413467407227, -8.159969329833984, -6.846524715423584, -5.533080101013184, -4.219635963439941, -2.906191825866699, -1.5927472114562988, -0.27930259704589844, 1.0341453552246094, 2.3475897312164307, 3.661034107208252, 4.974478721618652, 6.2879228591918945, 7.601366996765137, 8.914812088012695, 10.228256225585938, 11.54170036315918, 12.855144500732422, 14.168588638305664, 15.482033729553223, 16.79547882080078, 18.10892105102539, 19.422367095947266, 20.735811233520508, 22.04925537109375, 23.362699508666992, 24.676143646240234, 25.989587783813477, 27.30303192138672, 28.616477966308594, 29.929922103881836, 31.243366241455078, 32.55680847167969, 33.87025451660156, 35.18369674682617, 36.49714279174805, 37.810585021972656, 39.12403106689453, 40.43747329711914, 41.750919342041016, 43.06436538696289]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 9.0, 4.0, 11.0, 18.0, 24.0, 35.0, 34.0, 61.0, 84.0, 141.0, 189.0, 323.0, 508.0, 747.0, 1262.0, 2179.0, 3946.0, 7322.0, 14547.0, 30403.0, 69455.0, 206792.0, 440774.0, 158834.0, 57220.0, 25799.0, 12659.0, 6562.0, 3587.0, 1938.0, 1158.0, 691.0, 419.0, 271.0, 160.0, 123.0, 76.0, 56.0, 33.0, 30.0, 28.0, 12.0, 12.0, 4.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.6640625, -5.47137451171875, -5.2786865234375, -5.08599853515625, -4.893310546875, -4.70062255859375, -4.5079345703125, -4.31524658203125, -4.12255859375, -3.92987060546875, -3.7371826171875, -3.54449462890625, -3.351806640625, -3.15911865234375, -2.9664306640625, -2.77374267578125, -2.5810546875, -2.38836669921875, -2.1956787109375, -2.00299072265625, -1.810302734375, -1.61761474609375, -1.4249267578125, -1.23223876953125, -1.03955078125, -0.84686279296875, -0.6541748046875, -0.46148681640625, -0.268798828125, -0.07611083984375, 0.1165771484375, 0.30926513671875, 0.501953125, 0.69464111328125, 0.8873291015625, 1.08001708984375, 1.272705078125, 1.46539306640625, 1.6580810546875, 1.85076904296875, 2.04345703125, 2.23614501953125, 2.4288330078125, 2.62152099609375, 2.814208984375, 3.00689697265625, 3.1995849609375, 3.39227294921875, 3.5849609375, 3.77764892578125, 3.9703369140625, 4.16302490234375, 4.355712890625, 4.54840087890625, 4.7410888671875, 4.93377685546875, 5.12646484375, 5.31915283203125, 5.5118408203125, 5.70452880859375, 5.897216796875, 6.08990478515625, 6.2825927734375, 6.47528076171875, 6.66796875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 6.0, 9.0, 6.0, 12.0, 20.0, 25.0, 34.0, 31.0, 36.0, 46.0, 45.0, 67.0, 85.0, 71.0, 65.0, 65.0, 58.0, 60.0, 45.0, 55.0, 23.0, 31.0, 23.0, 29.0, 17.0, 7.0, 8.0, 8.0, 10.0, 6.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.1640625, -5.042388916015625, -4.92071533203125, -4.799041748046875, -4.6773681640625, -4.555694580078125, -4.43402099609375, -4.312347412109375, -4.190673828125, -4.069000244140625, -3.94732666015625, -3.825653076171875, -3.7039794921875, -3.582305908203125, -3.46063232421875, -3.338958740234375, -3.21728515625, -3.095611572265625, -2.97393798828125, -2.852264404296875, -2.7305908203125, -2.608917236328125, -2.48724365234375, -2.365570068359375, -2.243896484375, -2.122222900390625, -2.00054931640625, -1.878875732421875, -1.7572021484375, -1.635528564453125, -1.51385498046875, -1.392181396484375, -1.2705078125, -1.148834228515625, -1.02716064453125, -0.905487060546875, -0.7838134765625, -0.662139892578125, -0.54046630859375, -0.418792724609375, -0.297119140625, -0.175445556640625, -0.05377197265625, 0.067901611328125, 0.1895751953125, 0.311248779296875, 0.43292236328125, 0.554595947265625, 0.67626953125, 0.797943115234375, 0.91961669921875, 1.041290283203125, 1.1629638671875, 1.284637451171875, 1.40631103515625, 1.527984619140625, 1.649658203125, 1.771331787109375, 1.89300537109375, 2.014678955078125, 2.1363525390625, 2.258026123046875, 2.37969970703125, 2.501373291015625, 2.623046875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 6.0, 3.0, 7.0, 22.0, 29.0, 31.0, 53.0, 88.0, 124.0, 193.0, 304.0, 595.0, 1169.0, 3149.0, 12230.0, 153407.0, 830670.0, 36945.0, 5568.0, 1856.0, 892.0, 450.0, 291.0, 165.0, 108.0, 73.0, 46.0, 23.0, 14.0, 10.0, 6.0, 10.0, 3.0, 5.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.234375, -16.552001953125, -15.86962890625, -15.187255859375, -14.5048828125, -13.822509765625, -13.14013671875, -12.457763671875, -11.775390625, -11.093017578125, -10.41064453125, -9.728271484375, -9.0458984375, -8.363525390625, -7.68115234375, -6.998779296875, -6.31640625, -5.634033203125, -4.95166015625, -4.269287109375, -3.5869140625, -2.904541015625, -2.22216796875, -1.539794921875, -0.857421875, -0.175048828125, 0.50732421875, 1.189697265625, 1.8720703125, 2.554443359375, 3.23681640625, 3.919189453125, 4.6015625, 5.283935546875, 5.96630859375, 6.648681640625, 7.3310546875, 8.013427734375, 8.69580078125, 9.378173828125, 10.060546875, 10.742919921875, 11.42529296875, 12.107666015625, 12.7900390625, 13.472412109375, 14.15478515625, 14.837158203125, 15.51953125, 16.201904296875, 16.88427734375, 17.566650390625, 18.2490234375, 18.931396484375, 19.61376953125, 20.296142578125, 20.978515625, 21.660888671875, 22.34326171875, 23.025634765625, 23.7080078125, 24.390380859375, 25.07275390625, 25.755126953125, 26.4375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 2.0, 5.0, 1.0, 4.0, 5.0, 9.0, 6.0, 7.0, 15.0, 8.0, 11.0, 22.0, 15.0, 19.0, 33.0, 36.0, 38.0, 46.0, 54.0, 61.0, 70.0, 51.0, 51.0, 43.0, 58.0, 47.0, 38.0, 40.0, 29.0, 32.0, 32.0, 25.0, 23.0, 15.0, 9.0, 9.0, 8.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.625, -14.103271484375, -13.58154296875, -13.059814453125, -12.5380859375, -12.016357421875, -11.49462890625, -10.972900390625, -10.451171875, -9.929443359375, -9.40771484375, -8.885986328125, -8.3642578125, -7.842529296875, -7.32080078125, -6.799072265625, -6.27734375, -5.755615234375, -5.23388671875, -4.712158203125, -4.1904296875, -3.668701171875, -3.14697265625, -2.625244140625, -2.103515625, -1.581787109375, -1.06005859375, -0.538330078125, -0.0166015625, 0.505126953125, 1.02685546875, 1.548583984375, 2.0703125, 2.592041015625, 3.11376953125, 3.635498046875, 4.1572265625, 4.678955078125, 5.20068359375, 5.722412109375, 6.244140625, 6.765869140625, 7.28759765625, 7.809326171875, 8.3310546875, 8.852783203125, 9.37451171875, 9.896240234375, 10.41796875, 10.939697265625, 11.46142578125, 11.983154296875, 12.5048828125, 13.026611328125, 13.54833984375, 14.070068359375, 14.591796875, 15.113525390625, 15.63525390625, 16.156982421875, 16.6787109375, 17.200439453125, 17.72216796875, 18.243896484375, 18.765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 3.0, 7.0, 9.0, 15.0, 13.0, 32.0, 59.0, 101.0, 154.0, 268.0, 539.0, 1223.0, 3461.0, 13038.0, 75868.0, 786116.0, 139882.0, 19943.0, 4711.0, 1590.0, 715.0, 339.0, 166.0, 117.0, 70.0, 31.0, 28.0, 19.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.39715576171875, -8.1614990234375, -7.92584228515625, -7.690185546875, -7.45452880859375, -7.2188720703125, -6.98321533203125, -6.74755859375, -6.51190185546875, -6.2762451171875, -6.04058837890625, -5.804931640625, -5.56927490234375, -5.3336181640625, -5.09796142578125, -4.8623046875, -4.62664794921875, -4.3909912109375, -4.15533447265625, -3.919677734375, -3.68402099609375, -3.4483642578125, -3.21270751953125, -2.97705078125, -2.74139404296875, -2.5057373046875, -2.27008056640625, -2.034423828125, -1.79876708984375, -1.5631103515625, -1.32745361328125, -1.091796875, -0.85614013671875, -0.6204833984375, -0.38482666015625, -0.149169921875, 0.08648681640625, 0.3221435546875, 0.55780029296875, 0.79345703125, 1.02911376953125, 1.2647705078125, 1.50042724609375, 1.736083984375, 1.97174072265625, 2.2073974609375, 2.44305419921875, 2.6787109375, 2.91436767578125, 3.1500244140625, 3.38568115234375, 3.621337890625, 3.85699462890625, 4.0926513671875, 4.32830810546875, 4.56396484375, 4.79962158203125, 5.0352783203125, 5.27093505859375, 5.506591796875, 5.74224853515625, 5.9779052734375, 6.21356201171875, 6.44921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 8.0, 8.0, 9.0, 14.0, 21.0, 18.0, 24.0, 21.0, 43.0, 68.0, 113.0, 184.0, 162.0, 113.0, 56.0, 29.0, 30.0, 16.0, 17.0, 9.0, 5.0, 6.0, 8.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00133514404296875, -0.0012814998626708984, -0.0012278556823730469, -0.0011742115020751953, -0.0011205673217773438, -0.0010669231414794922, -0.0010132789611816406, -0.0009596347808837891, -0.0009059906005859375, -0.0008523464202880859, -0.0007987022399902344, -0.0007450580596923828, -0.0006914138793945312, -0.0006377696990966797, -0.0005841255187988281, -0.0005304813385009766, -0.000476837158203125, -0.00042319297790527344, -0.0003695487976074219, -0.0003159046173095703, -0.00026226043701171875, -0.0002086162567138672, -0.00015497207641601562, -0.00010132789611816406, -4.76837158203125e-05, 5.9604644775390625e-06, 5.9604644775390625e-05, 0.00011324882507324219, 0.00016689300537109375, 0.0002205371856689453, 0.0002741813659667969, 0.00032782554626464844, 0.0003814697265625, 0.00043511390686035156, 0.0004887580871582031, 0.0005424022674560547, 0.0005960464477539062, 0.0006496906280517578, 0.0007033348083496094, 0.0007569789886474609, 0.0008106231689453125, 0.0008642673492431641, 0.0009179115295410156, 0.0009715557098388672, 0.0010251998901367188, 0.0010788440704345703, 0.0011324882507324219, 0.0011861324310302734, 0.001239776611328125, 0.0012934207916259766, 0.0013470649719238281, 0.0014007091522216797, 0.0014543533325195312, 0.0015079975128173828, 0.0015616416931152344, 0.001615285873413086, 0.0016689300537109375, 0.001722574234008789, 0.0017762184143066406, 0.0018298625946044922, 0.0018835067749023438, 0.0019371509552001953, 0.001990795135498047, 0.0020444393157958984, 0.00209808349609375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 8.0, 10.0, 4.0, 3.0, 11.0, 31.0, 25.0, 41.0, 78.0, 131.0, 229.0, 341.0, 652.0, 1462.0, 3481.0, 12283.0, 78984.0, 779538.0, 145048.0, 18099.0, 4632.0, 1660.0, 793.0, 408.0, 257.0, 136.0, 88.0, 48.0, 25.0, 16.0, 11.0, 11.0, 8.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.28167724609375, -8.0555419921875, -7.82940673828125, -7.603271484375, -7.37713623046875, -7.1510009765625, -6.92486572265625, -6.69873046875, -6.47259521484375, -6.2464599609375, -6.02032470703125, -5.794189453125, -5.56805419921875, -5.3419189453125, -5.11578369140625, -4.8896484375, -4.66351318359375, -4.4373779296875, -4.21124267578125, -3.985107421875, -3.75897216796875, -3.5328369140625, -3.30670166015625, -3.08056640625, -2.85443115234375, -2.6282958984375, -2.40216064453125, -2.176025390625, -1.94989013671875, -1.7237548828125, -1.49761962890625, -1.271484375, -1.04534912109375, -0.8192138671875, -0.59307861328125, -0.366943359375, -0.14080810546875, 0.0853271484375, 0.31146240234375, 0.53759765625, 0.76373291015625, 0.9898681640625, 1.21600341796875, 1.442138671875, 1.66827392578125, 1.8944091796875, 2.12054443359375, 2.3466796875, 2.57281494140625, 2.7989501953125, 3.02508544921875, 3.251220703125, 3.47735595703125, 3.7034912109375, 3.92962646484375, 4.15576171875, 4.38189697265625, 4.6080322265625, 4.83416748046875, 5.060302734375, 5.28643798828125, 5.5125732421875, 5.73870849609375, 5.96484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 4.0, 2.0, 12.0, 9.0, 14.0, 23.0, 22.0, 20.0, 52.0, 63.0, 78.0, 111.0, 133.0, 143.0, 86.0, 54.0, 52.0, 31.0, 26.0, 19.0, 12.0, 6.0, 8.0, 7.0, 5.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.04296875, -6.81390380859375, -6.5848388671875, -6.35577392578125, -6.126708984375, -5.89764404296875, -5.6685791015625, -5.43951416015625, -5.21044921875, -4.98138427734375, -4.7523193359375, -4.52325439453125, -4.294189453125, -4.06512451171875, -3.8360595703125, -3.60699462890625, -3.3779296875, -3.14886474609375, -2.9197998046875, -2.69073486328125, -2.461669921875, -2.23260498046875, -2.0035400390625, -1.77447509765625, -1.54541015625, -1.31634521484375, -1.0872802734375, -0.85821533203125, -0.629150390625, -0.40008544921875, -0.1710205078125, 0.05804443359375, 0.287109375, 0.51617431640625, 0.7452392578125, 0.97430419921875, 1.203369140625, 1.43243408203125, 1.6614990234375, 1.89056396484375, 2.11962890625, 2.34869384765625, 2.5777587890625, 2.80682373046875, 3.035888671875, 3.26495361328125, 3.4940185546875, 3.72308349609375, 3.9521484375, 4.18121337890625, 4.4102783203125, 4.63934326171875, 4.868408203125, 5.09747314453125, 5.3265380859375, 5.55560302734375, 5.78466796875, 6.01373291015625, 6.2427978515625, 6.47186279296875, 6.700927734375, 6.92999267578125, 7.1590576171875, 7.38812255859375, 7.6171875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 1.0, 3.0, 7.0, 6.0, 17.0, 28.0, 69.0, 111.0, 160.0, 216.0, 149.0, 100.0, 57.0, 32.0, 15.0, 10.0, 4.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.56110382080078, -113.08155822753906, -109.60201263427734, -106.12246704101562, -102.6429214477539, -99.16337585449219, -95.68383026123047, -92.20428466796875, -88.72473907470703, -85.24519348144531, -81.7656478881836, -78.28610229492188, -74.80655670166016, -71.32701110839844, -67.84746551513672, -64.367919921875, -60.88837432861328, -57.40882873535156, -53.929283142089844, -50.449737548828125, -46.970191955566406, -43.49064636230469, -40.01110076904297, -36.53155517578125, -33.05200958251953, -29.572463989257812, -26.092918395996094, -22.613372802734375, -19.133827209472656, -15.654281616210938, -12.174736022949219, -8.6951904296875, -5.21563720703125, -1.7360916137695312, 1.7434539794921875, 5.222999572753906, 8.702545166015625, 12.182090759277344, 15.661636352539062, 19.14118194580078, 22.6207275390625, 26.10027313232422, 29.579818725585938, 33.059364318847656, 36.538909912109375, 40.018455505371094, 43.49800109863281, 46.97754669189453, 50.45709228515625, 53.93663787841797, 57.41618347167969, 60.895729064941406, 64.37527465820312, 67.85482025146484, 71.33436584472656, 74.81391143798828, 78.29345703125, 81.77300262451172, 85.25254821777344, 88.73209381103516, 92.21163940429688, 95.6911849975586, 99.17073059082031, 102.65027618408203, 106.12982177734375]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 10.0, 14.0, 21.0, 17.0, 21.0, 35.0, 45.0, 52.0, 55.0, 63.0, 64.0, 78.0, 77.0, 79.0, 80.0, 51.0, 53.0, 44.0, 35.0, 21.0, 20.0, 19.0, 12.0, 10.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-107.40464782714844, -104.58346557617188, -101.76227569580078, -98.94109344482422, -96.11991119384766, -93.2987289428711, -90.4775390625, -87.65635681152344, -84.83517456054688, -82.01399230957031, -79.19280242919922, -76.37162017822266, -73.5504379272461, -70.72925567626953, -67.90806579589844, -65.08688354492188, -62.26569747924805, -59.44451141357422, -56.623329162597656, -53.80214309692383, -50.980960845947266, -48.15977478027344, -45.338592529296875, -42.51740646362305, -39.69622039794922, -36.87503433227539, -34.05385208129883, -31.232666015625, -28.411483764648438, -25.59029769897461, -22.769113540649414, -19.94792938232422, -17.126747131347656, -14.305562973022461, -11.484378814697266, -8.663193702697754, -5.842009544372559, -3.0208253860473633, -0.19964027404785156, 2.6215438842773438, 5.442728042602539, 8.263912200927734, 11.08509635925293, 13.906281471252441, 16.727466583251953, 19.548648834228516, 22.369834899902344, 25.19101905822754, 28.012203216552734, 30.83338737487793, 33.654571533203125, 36.47575759887695, 39.296939849853516, 42.118125915527344, 44.939308166503906, 47.760494232177734, 50.58168029785156, 53.40286636352539, 56.22404861450195, 59.04523468017578, 61.866416931152344, 64.6875991821289, 67.5087890625, 70.32997131347656, 73.15115356445312]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 10.0, 19.0, 22.0, 38.0, 67.0, 120.0, 254.0, 1306.0, 16268.0, 3419928.0, 745766.0, 8889.0, 1039.0, 249.0, 111.0, 64.0, 36.0, 23.0, 15.0, 12.0, 8.0, 5.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.578125, -23.9620361328125, -23.345947265625, -22.7298583984375, -22.11376953125, -21.4976806640625, -20.881591796875, -20.2655029296875, -19.6494140625, -19.0333251953125, -18.417236328125, -17.8011474609375, -17.18505859375, -16.5689697265625, -15.952880859375, -15.3367919921875, -14.720703125, -14.1046142578125, -13.488525390625, -12.8724365234375, -12.25634765625, -11.6402587890625, -11.024169921875, -10.4080810546875, -9.7919921875, -9.1759033203125, -8.559814453125, -7.9437255859375, -7.32763671875, -6.7115478515625, -6.095458984375, -5.4793701171875, -4.86328125, -4.2471923828125, -3.631103515625, -3.0150146484375, -2.39892578125, -1.7828369140625, -1.166748046875, -0.5506591796875, 0.0654296875, 0.6815185546875, 1.297607421875, 1.9136962890625, 2.52978515625, 3.1458740234375, 3.761962890625, 4.3780517578125, 4.994140625, 5.6102294921875, 6.226318359375, 6.8424072265625, 7.45849609375, 8.0745849609375, 8.690673828125, 9.3067626953125, 9.9228515625, 10.5389404296875, 11.155029296875, 11.7711181640625, 12.38720703125, 13.0032958984375, 13.619384765625, 14.2354736328125, 14.8515625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 9.0, 11.0, 31.0, 46.0, 75.0, 111.0, 132.0, 150.0, 139.0, 100.0, 74.0, 50.0, 35.0, 23.0, 12.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.92578125, -6.68426513671875, -6.4427490234375, -6.20123291015625, -5.959716796875, -5.71820068359375, -5.4766845703125, -5.23516845703125, -4.99365234375, -4.75213623046875, -4.5106201171875, -4.26910400390625, -4.027587890625, -3.78607177734375, -3.5445556640625, -3.30303955078125, -3.0615234375, -2.82000732421875, -2.5784912109375, -2.33697509765625, -2.095458984375, -1.85394287109375, -1.6124267578125, -1.37091064453125, -1.12939453125, -0.88787841796875, -0.6463623046875, -0.40484619140625, -0.163330078125, 0.07818603515625, 0.3197021484375, 0.56121826171875, 0.802734375, 1.04425048828125, 1.2857666015625, 1.52728271484375, 1.768798828125, 2.01031494140625, 2.2518310546875, 2.49334716796875, 2.73486328125, 2.97637939453125, 3.2178955078125, 3.45941162109375, 3.700927734375, 3.94244384765625, 4.1839599609375, 4.42547607421875, 4.6669921875, 4.90850830078125, 5.1500244140625, 5.39154052734375, 5.633056640625, 5.87457275390625, 6.1160888671875, 6.35760498046875, 6.59912109375, 6.84063720703125, 7.0821533203125, 7.32366943359375, 7.565185546875, 7.80670166015625, 8.0482177734375, 8.28973388671875, 8.53125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 5.0, 7.0, 6.0, 21.0, 25.0, 34.0, 59.0, 70.0, 112.0, 234.0, 361.0, 726.0, 1558.0, 3720.0, 10011.0, 31362.0, 135191.0, 1393581.0, 2357073.0, 197824.0, 41593.0, 12295.0, 4354.0, 1812.0, 875.0, 476.0, 281.0, 187.0, 106.0, 99.0, 56.0, 41.0, 32.0, 20.0, 15.0, 16.0, 10.0, 12.0, 6.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.88671875, -7.64105224609375, -7.3953857421875, -7.14971923828125, -6.904052734375, -6.65838623046875, -6.4127197265625, -6.16705322265625, -5.92138671875, -5.67572021484375, -5.4300537109375, -5.18438720703125, -4.938720703125, -4.69305419921875, -4.4473876953125, -4.20172119140625, -3.9560546875, -3.71038818359375, -3.4647216796875, -3.21905517578125, -2.973388671875, -2.72772216796875, -2.4820556640625, -2.23638916015625, -1.99072265625, -1.74505615234375, -1.4993896484375, -1.25372314453125, -1.008056640625, -0.76239013671875, -0.5167236328125, -0.27105712890625, -0.025390625, 0.22027587890625, 0.4659423828125, 0.71160888671875, 0.957275390625, 1.20294189453125, 1.4486083984375, 1.69427490234375, 1.93994140625, 2.18560791015625, 2.4312744140625, 2.67694091796875, 2.922607421875, 3.16827392578125, 3.4139404296875, 3.65960693359375, 3.9052734375, 4.15093994140625, 4.3966064453125, 4.64227294921875, 4.887939453125, 5.13360595703125, 5.3792724609375, 5.62493896484375, 5.87060546875, 6.11627197265625, 6.3619384765625, 6.60760498046875, 6.853271484375, 7.09893798828125, 7.3446044921875, 7.59027099609375, 7.8359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 5.0, 11.0, 9.0, 20.0, 27.0, 29.0, 52.0, 62.0, 119.0, 184.0, 376.0, 695.0, 938.0, 655.0, 343.0, 203.0, 115.0, 65.0, 48.0, 40.0, 26.0, 12.0, 12.0, 7.0, 4.0, 8.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0078125, -7.68017578125, -7.3525390625, -7.02490234375, -6.697265625, -6.36962890625, -6.0419921875, -5.71435546875, -5.38671875, -5.05908203125, -4.7314453125, -4.40380859375, -4.076171875, -3.74853515625, -3.4208984375, -3.09326171875, -2.765625, -2.43798828125, -2.1103515625, -1.78271484375, -1.455078125, -1.12744140625, -0.7998046875, -0.47216796875, -0.14453125, 0.18310546875, 0.5107421875, 0.83837890625, 1.166015625, 1.49365234375, 1.8212890625, 2.14892578125, 2.4765625, 2.80419921875, 3.1318359375, 3.45947265625, 3.787109375, 4.11474609375, 4.4423828125, 4.77001953125, 5.09765625, 5.42529296875, 5.7529296875, 6.08056640625, 6.408203125, 6.73583984375, 7.0634765625, 7.39111328125, 7.71875, 8.04638671875, 8.3740234375, 8.70166015625, 9.029296875, 9.35693359375, 9.6845703125, 10.01220703125, 10.33984375, 10.66748046875, 10.9951171875, 11.32275390625, 11.650390625, 11.97802734375, 12.3056640625, 12.63330078125, 12.9609375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 8.0, 11.0, 14.0, 26.0, 52.0, 94.0, 149.0, 215.0, 181.0, 107.0, 62.0, 36.0, 23.0, 13.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.49851989746094, -102.6020278930664, -99.7055435180664, -96.80905151367188, -93.91255950927734, -91.01607513427734, -88.11958312988281, -85.22309875488281, -82.32660675048828, -79.43011474609375, -76.53363037109375, -73.63713836669922, -70.74064636230469, -67.84416198730469, -64.94766998291016, -62.05118179321289, -59.15468978881836, -56.258201599121094, -53.36170959472656, -50.4652214050293, -47.56873321533203, -44.6722412109375, -41.775753021240234, -38.87926483154297, -35.98277282714844, -33.08628463745117, -30.189794540405273, -27.293304443359375, -24.39681625366211, -21.50032615661621, -18.603836059570312, -15.707347869873047, -12.810859680175781, -9.9143705368042, -7.017880916595459, -4.121391296386719, -1.2249021530151367, 1.6715869903564453, 4.568077087402344, 7.464565277099609, 10.361055374145508, 13.25754451751709, 16.154033660888672, 19.05052375793457, 21.94701385498047, 24.843502044677734, 27.739992141723633, 30.6364803314209, 33.5329704284668, 36.42945861816406, 39.325950622558594, 42.22243881225586, 45.118927001953125, 48.015419006347656, 50.91190719604492, 53.80839538574219, 56.70488739013672, 59.601375579833984, 62.497867584228516, 65.39435577392578, 68.29084777832031, 71.18733215332031, 74.08382415771484, 76.98031616210938, 79.87680053710938]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 4.0, 11.0, 15.0, 22.0, 27.0, 24.0, 33.0, 39.0, 36.0, 41.0, 51.0, 64.0, 55.0, 82.0, 58.0, 61.0, 54.0, 44.0, 46.0, 42.0, 31.0, 32.0, 31.0, 19.0, 13.0, 13.0, 7.0, 15.0, 3.0, 7.0, 6.0, 8.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.96294021606445, -45.446712493896484, -43.930484771728516, -42.41425323486328, -40.89802551269531, -39.381797790527344, -37.865570068359375, -36.349342346191406, -34.83311462402344, -33.31688690185547, -31.800657272338867, -30.2844295501709, -28.768199920654297, -27.251972198486328, -25.73574447631836, -24.21951675415039, -22.703285217285156, -21.187057495117188, -19.670827865600586, -18.154600143432617, -16.638370513916016, -15.122142791748047, -13.605915069580078, -12.089686393737793, -10.573457717895508, -9.057229042053223, -7.541000843048096, -6.024772644042969, -4.508543968200684, -2.9923152923583984, -1.4760875701904297, 0.04014110565185547, 1.5563735961914062, 3.0726020336151123, 4.588830471038818, 6.105058670043945, 7.6212873458862305, 9.137516021728516, 10.653743743896484, 12.16997241973877, 13.686201095581055, 15.20242977142334, 16.718658447265625, 18.234886169433594, 19.751113891601562, 21.267343521118164, 22.783571243286133, 24.299800872802734, 25.816028594970703, 27.332256317138672, 28.848485946655273, 30.364713668823242, 31.880943298339844, 33.39717102050781, 34.91339874267578, 36.42962646484375, 37.94585418701172, 39.46208190917969, 40.978309631347656, 42.494537353515625, 44.01076889038086, 45.52699661254883, 47.0432243347168, 48.559452056884766, 50.07568359375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 12.0, 15.0, 22.0, 29.0, 50.0, 54.0, 74.0, 92.0, 192.0, 301.0, 397.0, 766.0, 1211.0, 2000.0, 3605.0, 6317.0, 11795.0, 23286.0, 51008.0, 143367.0, 429101.0, 236609.0, 72914.0, 30909.0, 15395.0, 8222.0, 4512.0, 2495.0, 1466.0, 863.0, 503.0, 317.0, 214.0, 146.0, 92.0, 56.0, 40.0, 27.0, 21.0, 20.0, 14.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46484375, -5.29241943359375, -5.1199951171875, -4.94757080078125, -4.775146484375, -4.60272216796875, -4.4302978515625, -4.25787353515625, -4.08544921875, -3.91302490234375, -3.7406005859375, -3.56817626953125, -3.395751953125, -3.22332763671875, -3.0509033203125, -2.87847900390625, -2.7060546875, -2.53363037109375, -2.3612060546875, -2.18878173828125, -2.016357421875, -1.84393310546875, -1.6715087890625, -1.49908447265625, -1.32666015625, -1.15423583984375, -0.9818115234375, -0.80938720703125, -0.636962890625, -0.46453857421875, -0.2921142578125, -0.11968994140625, 0.052734375, 0.22515869140625, 0.3975830078125, 0.57000732421875, 0.742431640625, 0.91485595703125, 1.0872802734375, 1.25970458984375, 1.43212890625, 1.60455322265625, 1.7769775390625, 1.94940185546875, 2.121826171875, 2.29425048828125, 2.4666748046875, 2.63909912109375, 2.8115234375, 2.98394775390625, 3.1563720703125, 3.32879638671875, 3.501220703125, 3.67364501953125, 3.8460693359375, 4.01849365234375, 4.19091796875, 4.36334228515625, 4.5357666015625, 4.70819091796875, 4.880615234375, 5.05303955078125, 5.2254638671875, 5.39788818359375, 5.5703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 11.0, 10.0, 7.0, 15.0, 17.0, 20.0, 27.0, 38.0, 41.0, 43.0, 56.0, 57.0, 45.0, 73.0, 60.0, 70.0, 57.0, 62.0, 51.0, 39.0, 46.0, 40.0, 27.0, 21.0, 17.0, 12.0, 6.0, 5.0, 9.0, 4.0, 4.0, 2.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.7265625, -3.612457275390625, -3.49835205078125, -3.384246826171875, -3.2701416015625, -3.156036376953125, -3.04193115234375, -2.927825927734375, -2.813720703125, -2.699615478515625, -2.58551025390625, -2.471405029296875, -2.3572998046875, -2.243194580078125, -2.12908935546875, -2.014984130859375, -1.90087890625, -1.786773681640625, -1.67266845703125, -1.558563232421875, -1.4444580078125, -1.330352783203125, -1.21624755859375, -1.102142333984375, -0.988037109375, -0.873931884765625, -0.75982666015625, -0.645721435546875, -0.5316162109375, -0.417510986328125, -0.30340576171875, -0.189300537109375, -0.0751953125, 0.038909912109375, 0.15301513671875, 0.267120361328125, 0.3812255859375, 0.495330810546875, 0.60943603515625, 0.723541259765625, 0.837646484375, 0.951751708984375, 1.06585693359375, 1.179962158203125, 1.2940673828125, 1.408172607421875, 1.52227783203125, 1.636383056640625, 1.75048828125, 1.864593505859375, 1.97869873046875, 2.092803955078125, 2.2069091796875, 2.321014404296875, 2.43511962890625, 2.549224853515625, 2.663330078125, 2.777435302734375, 2.89154052734375, 3.005645751953125, 3.1197509765625, 3.233856201171875, 3.34796142578125, 3.462066650390625, 3.576171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 1.0, 7.0, 8.0, 4.0, 11.0, 8.0, 16.0, 18.0, 19.0, 38.0, 58.0, 59.0, 86.0, 127.0, 181.0, 262.0, 395.0, 625.0, 1022.0, 1902.0, 3986.0, 10052.0, 29525.0, 125981.0, 685211.0, 137968.0, 31361.0, 10570.0, 4219.0, 1943.0, 999.0, 575.0, 358.0, 274.0, 181.0, 145.0, 103.0, 62.0, 47.0, 35.0, 32.0, 25.0, 12.0, 8.0, 10.0, 9.0, 5.0, 2.0, 4.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-10.0546875, -9.7547607421875, -9.454833984375, -9.1549072265625, -8.85498046875, -8.5550537109375, -8.255126953125, -7.9552001953125, -7.6552734375, -7.3553466796875, -7.055419921875, -6.7554931640625, -6.45556640625, -6.1556396484375, -5.855712890625, -5.5557861328125, -5.255859375, -4.9559326171875, -4.656005859375, -4.3560791015625, -4.05615234375, -3.7562255859375, -3.456298828125, -3.1563720703125, -2.8564453125, -2.5565185546875, -2.256591796875, -1.9566650390625, -1.65673828125, -1.3568115234375, -1.056884765625, -0.7569580078125, -0.45703125, -0.1571044921875, 0.142822265625, 0.4427490234375, 0.74267578125, 1.0426025390625, 1.342529296875, 1.6424560546875, 1.9423828125, 2.2423095703125, 2.542236328125, 2.8421630859375, 3.14208984375, 3.4420166015625, 3.741943359375, 4.0418701171875, 4.341796875, 4.6417236328125, 4.941650390625, 5.2415771484375, 5.54150390625, 5.8414306640625, 6.141357421875, 6.4412841796875, 6.7412109375, 7.0411376953125, 7.341064453125, 7.6409912109375, 7.94091796875, 8.2408447265625, 8.540771484375, 8.8406982421875, 9.140625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 9.0, 7.0, 11.0, 9.0, 14.0, 18.0, 13.0, 20.0, 31.0, 23.0, 44.0, 56.0, 53.0, 63.0, 50.0, 60.0, 55.0, 56.0, 61.0, 51.0, 52.0, 45.0, 43.0, 30.0, 25.0, 16.0, 25.0, 13.0, 11.0, 8.0, 4.0, 8.0, 5.0, 3.0, 4.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.359375, -14.88623046875, -14.4130859375, -13.93994140625, -13.466796875, -12.99365234375, -12.5205078125, -12.04736328125, -11.57421875, -11.10107421875, -10.6279296875, -10.15478515625, -9.681640625, -9.20849609375, -8.7353515625, -8.26220703125, -7.7890625, -7.31591796875, -6.8427734375, -6.36962890625, -5.896484375, -5.42333984375, -4.9501953125, -4.47705078125, -4.00390625, -3.53076171875, -3.0576171875, -2.58447265625, -2.111328125, -1.63818359375, -1.1650390625, -0.69189453125, -0.21875, 0.25439453125, 0.7275390625, 1.20068359375, 1.673828125, 2.14697265625, 2.6201171875, 3.09326171875, 3.56640625, 4.03955078125, 4.5126953125, 4.98583984375, 5.458984375, 5.93212890625, 6.4052734375, 6.87841796875, 7.3515625, 7.82470703125, 8.2978515625, 8.77099609375, 9.244140625, 9.71728515625, 10.1904296875, 10.66357421875, 11.13671875, 11.60986328125, 12.0830078125, 12.55615234375, 13.029296875, 13.50244140625, 13.9755859375, 14.44873046875, 14.921875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 9.0, 12.0, 18.0, 23.0, 63.0, 70.0, 129.0, 259.0, 617.0, 1919.0, 8619.0, 65841.0, 770359.0, 178251.0, 17389.0, 3274.0, 927.0, 363.0, 176.0, 86.0, 54.0, 29.0, 18.0, 11.0, 8.0, 9.0, 3.0, 5.0, 3.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.625, -8.38336181640625, -8.1417236328125, -7.90008544921875, -7.658447265625, -7.41680908203125, -7.1751708984375, -6.93353271484375, -6.69189453125, -6.45025634765625, -6.2086181640625, -5.96697998046875, -5.725341796875, -5.48370361328125, -5.2420654296875, -5.00042724609375, -4.7587890625, -4.51715087890625, -4.2755126953125, -4.03387451171875, -3.792236328125, -3.55059814453125, -3.3089599609375, -3.06732177734375, -2.82568359375, -2.58404541015625, -2.3424072265625, -2.10076904296875, -1.859130859375, -1.61749267578125, -1.3758544921875, -1.13421630859375, -0.892578125, -0.65093994140625, -0.4093017578125, -0.16766357421875, 0.073974609375, 0.31561279296875, 0.5572509765625, 0.79888916015625, 1.04052734375, 1.28216552734375, 1.5238037109375, 1.76544189453125, 2.007080078125, 2.24871826171875, 2.4903564453125, 2.73199462890625, 2.9736328125, 3.21527099609375, 3.4569091796875, 3.69854736328125, 3.940185546875, 4.18182373046875, 4.4234619140625, 4.66510009765625, 4.90673828125, 5.14837646484375, 5.3900146484375, 5.63165283203125, 5.873291015625, 6.11492919921875, 6.3565673828125, 6.59820556640625, 6.83984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 3.0, 4.0, 3.0, 9.0, 10.0, 16.0, 14.0, 21.0, 29.0, 45.0, 38.0, 58.0, 116.0, 137.0, 124.0, 79.0, 83.0, 48.0, 41.0, 22.0, 18.0, 11.0, 17.0, 13.0, 13.0, 10.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009179115295410156, -0.0008812174201011658, -0.0008445233106613159, -0.0008078292012214661, -0.0007711350917816162, -0.0007344409823417664, -0.0006977468729019165, -0.0006610527634620667, -0.0006243586540222168, -0.0005876645445823669, -0.0005509704351425171, -0.0005142763257026672, -0.0004775822162628174, -0.00044088810682296753, -0.0004041939973831177, -0.0003674998879432678, -0.00033080577850341797, -0.0002941116690635681, -0.00025741755962371826, -0.0002207234501838684, -0.00018402934074401855, -0.0001473352313041687, -0.00011064112186431885, -7.3947012424469e-05, -3.725290298461914e-05, -5.587935447692871e-07, 3.6135315895080566e-05, 7.282942533493042e-05, 0.00010952353477478027, 0.00014621764421463013, 0.00018291175365447998, 0.00021960586309432983, 0.0002562999725341797, 0.00029299408197402954, 0.0003296881914138794, 0.00036638230085372925, 0.0004030764102935791, 0.00043977051973342896, 0.0004764646291732788, 0.0005131587386131287, 0.0005498528480529785, 0.0005865469574928284, 0.0006232410669326782, 0.0006599351763725281, 0.0006966292858123779, 0.0007333233952522278, 0.0007700175046920776, 0.0008067116141319275, 0.0008434057235717773, 0.0008800998330116272, 0.000916793942451477, 0.0009534880518913269, 0.0009901821613311768, 0.0010268762707710266, 0.0010635703802108765, 0.0011002644896507263, 0.0011369585990905762, 0.001173652708530426, 0.0012103468179702759, 0.0012470409274101257, 0.0012837350368499756, 0.0013204291462898254, 0.0013571232557296753, 0.0013938173651695251, 0.001430511474609375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 7.0, 8.0, 16.0, 28.0, 36.0, 60.0, 75.0, 168.0, 249.0, 516.0, 1073.0, 2295.0, 6268.0, 24388.0, 147819.0, 694593.0, 137326.0, 23417.0, 5919.0, 2159.0, 961.0, 508.0, 272.0, 163.0, 78.0, 55.0, 27.0, 21.0, 12.0, 10.0, 5.0, 7.0, 5.0, 1.0, 0.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.53515625, -5.36474609375, -5.1943359375, -5.02392578125, -4.853515625, -4.68310546875, -4.5126953125, -4.34228515625, -4.171875, -4.00146484375, -3.8310546875, -3.66064453125, -3.490234375, -3.31982421875, -3.1494140625, -2.97900390625, -2.80859375, -2.63818359375, -2.4677734375, -2.29736328125, -2.126953125, -1.95654296875, -1.7861328125, -1.61572265625, -1.4453125, -1.27490234375, -1.1044921875, -0.93408203125, -0.763671875, -0.59326171875, -0.4228515625, -0.25244140625, -0.08203125, 0.08837890625, 0.2587890625, 0.42919921875, 0.599609375, 0.77001953125, 0.9404296875, 1.11083984375, 1.28125, 1.45166015625, 1.6220703125, 1.79248046875, 1.962890625, 2.13330078125, 2.3037109375, 2.47412109375, 2.64453125, 2.81494140625, 2.9853515625, 3.15576171875, 3.326171875, 3.49658203125, 3.6669921875, 3.83740234375, 4.0078125, 4.17822265625, 4.3486328125, 4.51904296875, 4.689453125, 4.85986328125, 5.0302734375, 5.20068359375, 5.37109375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 6.0, 8.0, 7.0, 8.0, 15.0, 9.0, 14.0, 14.0, 14.0, 22.0, 36.0, 37.0, 43.0, 44.0, 54.0, 69.0, 65.0, 72.0, 62.0, 59.0, 51.0, 39.0, 43.0, 35.0, 29.0, 23.0, 22.0, 17.0, 26.0, 14.0, 14.0, 11.0, 8.0, 4.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.544921875, -3.43609619140625, -3.3272705078125, -3.21844482421875, -3.109619140625, -3.00079345703125, -2.8919677734375, -2.78314208984375, -2.67431640625, -2.56549072265625, -2.4566650390625, -2.34783935546875, -2.239013671875, -2.13018798828125, -2.0213623046875, -1.91253662109375, -1.8037109375, -1.69488525390625, -1.5860595703125, -1.47723388671875, -1.368408203125, -1.25958251953125, -1.1507568359375, -1.04193115234375, -0.93310546875, -0.82427978515625, -0.7154541015625, -0.60662841796875, -0.497802734375, -0.38897705078125, -0.2801513671875, -0.17132568359375, -0.0625, 0.04632568359375, 0.1551513671875, 0.26397705078125, 0.372802734375, 0.48162841796875, 0.5904541015625, 0.69927978515625, 0.80810546875, 0.91693115234375, 1.0257568359375, 1.13458251953125, 1.243408203125, 1.35223388671875, 1.4610595703125, 1.56988525390625, 1.6787109375, 1.78753662109375, 1.8963623046875, 2.00518798828125, 2.114013671875, 2.22283935546875, 2.3316650390625, 2.44049072265625, 2.54931640625, 2.65814208984375, 2.7669677734375, 2.87579345703125, 2.984619140625, 3.09344482421875, 3.2022705078125, 3.31109619140625, 3.419921875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 15.0, 22.0, 129.0, 360.0, 276.0, 132.0, 34.0, 8.0, 9.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.42617797851562, -149.64454650878906, -143.8629150390625, -138.081298828125, -132.29966735839844, -126.51803588867188, -120.73641204833984, -114.95478820800781, -109.17315673828125, -103.39152526855469, -97.60990142822266, -91.82827758789062, -86.04664611816406, -80.2650146484375, -74.48339080810547, -68.70176696777344, -62.920135498046875, -57.13850784301758, -51.35688018798828, -45.575252532958984, -39.79362487792969, -34.01199722290039, -28.230369567871094, -22.448741912841797, -16.6671142578125, -10.885486602783203, -5.103858947753906, 0.6777687072753906, 6.4593963623046875, 12.241024017333984, 18.02265167236328, 23.804279327392578, 29.585906982421875, 35.36753463745117, 41.14916229248047, 46.930789947509766, 52.71241760253906, 58.49404525756836, 64.27567291259766, 70.05729675292969, 75.83892822265625, 81.62055969238281, 87.40218353271484, 93.18380737304688, 98.96543884277344, 104.7470703125, 110.52869415283203, 116.31031799316406, 122.09194946289062, 127.87358093261719, 133.65521240234375, 139.43682861328125, 145.2184600830078, 151.00009155273438, 156.78170776367188, 162.56333923339844, 168.344970703125, 174.12660217285156, 179.90823364257812, 185.68984985351562, 191.4714813232422, 197.25311279296875, 203.03472900390625, 208.8163604736328, 214.59799194335938]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 3.0, 3.0, 8.0, 9.0, 7.0, 7.0, 10.0, 17.0, 24.0, 21.0, 29.0, 17.0, 36.0, 21.0, 40.0, 27.0, 39.0, 52.0, 40.0, 60.0, 50.0, 58.0, 46.0, 40.0, 34.0, 30.0, 37.0, 31.0, 29.0, 31.0, 18.0, 16.0, 14.0, 17.0, 16.0, 11.0, 14.0, 4.0, 7.0, 4.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.482295989990234, -46.944129943847656, -45.405967712402344, -43.867801666259766, -42.32963562011719, -40.791473388671875, -39.2533073425293, -37.71514129638672, -36.176979064941406, -34.63881301879883, -33.100650787353516, -31.562484741210938, -30.02431869506836, -28.486154556274414, -26.94799041748047, -25.40982437133789, -23.871658325195312, -22.333494186401367, -20.79532814025879, -19.257164001464844, -17.718997955322266, -16.18083381652832, -14.642669677734375, -13.104504585266113, -11.566339492797852, -10.02817440032959, -8.490009307861328, -6.951845169067383, -5.413680076599121, -3.8755149841308594, -2.337350845336914, -0.7991857528686523, 0.738983154296875, 2.2771480083465576, 3.8153128623962402, 5.353477478027344, 6.8916425704956055, 8.429807662963867, 9.967971801757812, 11.506136894226074, 13.044301986694336, 14.582467079162598, 16.12063217163086, 17.658796310424805, 19.19696044921875, 20.735126495361328, 22.273290634155273, 23.81145477294922, 25.349620819091797, 26.887784957885742, 28.42595100402832, 29.964115142822266, 31.502281188964844, 33.040443420410156, 34.578609466552734, 36.11677551269531, 37.654937744140625, 39.1931037902832, 40.731266021728516, 42.269432067871094, 43.80759811401367, 45.34576416015625, 46.88392639160156, 48.42209243774414, 49.96025848388672]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 7.0, 13.0, 31.0, 33.0, 63.0, 83.0, 138.0, 232.0, 397.0, 800.0, 1600.0, 3232.0, 7596.0, 19439.0, 55377.0, 199856.0, 1139673.0, 2178739.0, 436455.0, 97482.0, 31472.0, 11875.0, 4875.0, 2333.0, 1106.0, 543.0, 356.0, 193.0, 117.0, 63.0, 35.0, 24.0, 10.0, 9.0, 8.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 3.0], "bins": [-5.49609375, -5.35601806640625, -5.2159423828125, -5.07586669921875, -4.935791015625, -4.79571533203125, -4.6556396484375, -4.51556396484375, -4.37548828125, -4.23541259765625, -4.0953369140625, -3.95526123046875, -3.815185546875, -3.67510986328125, -3.5350341796875, -3.39495849609375, -3.2548828125, -3.11480712890625, -2.9747314453125, -2.83465576171875, -2.694580078125, -2.55450439453125, -2.4144287109375, -2.27435302734375, -2.13427734375, -1.99420166015625, -1.8541259765625, -1.71405029296875, -1.573974609375, -1.43389892578125, -1.2938232421875, -1.15374755859375, -1.013671875, -0.87359619140625, -0.7335205078125, -0.59344482421875, -0.453369140625, -0.31329345703125, -0.1732177734375, -0.03314208984375, 0.10693359375, 0.24700927734375, 0.3870849609375, 0.52716064453125, 0.667236328125, 0.80731201171875, 0.9473876953125, 1.08746337890625, 1.2275390625, 1.36761474609375, 1.5076904296875, 1.64776611328125, 1.787841796875, 1.92791748046875, 2.0679931640625, 2.20806884765625, 2.34814453125, 2.48822021484375, 2.6282958984375, 2.76837158203125, 2.908447265625, 3.04852294921875, 3.1885986328125, 3.32867431640625, 3.46875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 6.0, 5.0, 5.0, 10.0, 10.0, 26.0, 35.0, 48.0, 62.0, 68.0, 68.0, 99.0, 84.0, 102.0, 98.0, 82.0, 61.0, 47.0, 28.0, 30.0, 13.0, 7.0, 8.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.5546875, -6.400665283203125, -6.24664306640625, -6.092620849609375, -5.9385986328125, -5.784576416015625, -5.63055419921875, -5.476531982421875, -5.322509765625, -5.168487548828125, -5.01446533203125, -4.860443115234375, -4.7064208984375, -4.552398681640625, -4.39837646484375, -4.244354248046875, -4.09033203125, -3.936309814453125, -3.78228759765625, -3.628265380859375, -3.4742431640625, -3.320220947265625, -3.16619873046875, -3.012176513671875, -2.858154296875, -2.704132080078125, -2.55010986328125, -2.396087646484375, -2.2420654296875, -2.088043212890625, -1.93402099609375, -1.779998779296875, -1.6259765625, -1.471954345703125, -1.31793212890625, -1.163909912109375, -1.0098876953125, -0.855865478515625, -0.70184326171875, -0.547821044921875, -0.393798828125, -0.239776611328125, -0.08575439453125, 0.068267822265625, 0.2222900390625, 0.376312255859375, 0.53033447265625, 0.684356689453125, 0.83837890625, 0.992401123046875, 1.14642333984375, 1.300445556640625, 1.4544677734375, 1.608489990234375, 1.76251220703125, 1.916534423828125, 2.070556640625, 2.224578857421875, 2.37860107421875, 2.532623291015625, 2.6866455078125, 2.840667724609375, 2.99468994140625, 3.148712158203125, 3.302734375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 9.0, 10.0, 8.0, 28.0, 29.0, 67.0, 120.0, 155.0, 340.0, 725.0, 1736.0, 5293.0, 19523.0, 98856.0, 1250291.0, 2607816.0, 171692.0, 27136.0, 6632.0, 1940.0, 812.0, 385.0, 235.0, 137.0, 95.0, 74.0, 50.0, 26.0, 18.0, 16.0, 8.0, 9.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.21875, -10.8994140625, -10.580078125, -10.2607421875, -9.94140625, -9.6220703125, -9.302734375, -8.9833984375, -8.6640625, -8.3447265625, -8.025390625, -7.7060546875, -7.38671875, -7.0673828125, -6.748046875, -6.4287109375, -6.109375, -5.7900390625, -5.470703125, -5.1513671875, -4.83203125, -4.5126953125, -4.193359375, -3.8740234375, -3.5546875, -3.2353515625, -2.916015625, -2.5966796875, -2.27734375, -1.9580078125, -1.638671875, -1.3193359375, -1.0, -0.6806640625, -0.361328125, -0.0419921875, 0.27734375, 0.5966796875, 0.916015625, 1.2353515625, 1.5546875, 1.8740234375, 2.193359375, 2.5126953125, 2.83203125, 3.1513671875, 3.470703125, 3.7900390625, 4.109375, 4.4287109375, 4.748046875, 5.0673828125, 5.38671875, 5.7060546875, 6.025390625, 6.3447265625, 6.6640625, 6.9833984375, 7.302734375, 7.6220703125, 7.94140625, 8.2607421875, 8.580078125, 8.8994140625, 9.21875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 6.0, 11.0, 13.0, 18.0, 12.0, 26.0, 41.0, 66.0, 86.0, 147.0, 257.0, 471.0, 742.0, 841.0, 508.0, 313.0, 174.0, 129.0, 62.0, 46.0, 38.0, 24.0, 15.0, 10.0, 12.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3515625, -6.9669189453125, -6.582275390625, -6.1976318359375, -5.81298828125, -5.4283447265625, -5.043701171875, -4.6590576171875, -4.2744140625, -3.8897705078125, -3.505126953125, -3.1204833984375, -2.73583984375, -2.3511962890625, -1.966552734375, -1.5819091796875, -1.197265625, -0.8126220703125, -0.427978515625, -0.0433349609375, 0.34130859375, 0.7259521484375, 1.110595703125, 1.4952392578125, 1.8798828125, 2.2645263671875, 2.649169921875, 3.0338134765625, 3.41845703125, 3.8031005859375, 4.187744140625, 4.5723876953125, 4.95703125, 5.3416748046875, 5.726318359375, 6.1109619140625, 6.49560546875, 6.8802490234375, 7.264892578125, 7.6495361328125, 8.0341796875, 8.4188232421875, 8.803466796875, 9.1881103515625, 9.57275390625, 9.9573974609375, 10.342041015625, 10.7266845703125, 11.111328125, 11.4959716796875, 11.880615234375, 12.2652587890625, 12.64990234375, 13.0345458984375, 13.419189453125, 13.8038330078125, 14.1884765625, 14.5731201171875, 14.957763671875, 15.3424072265625, 15.72705078125, 16.1116943359375, 16.496337890625, 16.8809814453125, 17.265625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 14.0, 14.0, 21.0, 37.0, 86.0, 123.0, 163.0, 167.0, 144.0, 94.0, 48.0, 25.0, 14.0, 10.0, 7.0, 8.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.48467254638672, -92.41374206542969, -89.34281158447266, -86.27188110351562, -83.2009506225586, -80.13002014160156, -77.05909729003906, -73.9881591796875, -70.917236328125, -67.84630584716797, -64.77537536621094, -61.704444885253906, -58.633514404296875, -55.562583923339844, -52.49165725708008, -49.42072677612305, -46.34979248046875, -43.27886199951172, -40.20793151855469, -37.137001037597656, -34.066070556640625, -30.995141983032227, -27.924213409423828, -24.853282928466797, -21.782352447509766, -18.711421966552734, -15.64049243927002, -12.569562911987305, -9.498632431030273, -6.427701950073242, -3.3567733764648438, -0.2858428955078125, 2.78509521484375, 5.856025218963623, 8.926955223083496, 11.997884750366211, 15.068815231323242, 18.139745712280273, 21.210674285888672, 24.281604766845703, 27.352535247802734, 30.423465728759766, 33.4943962097168, 36.56532287597656, 39.636253356933594, 42.707183837890625, 45.778114318847656, 48.84904479980469, 51.91997528076172, 54.99090576171875, 58.06183624267578, 61.13276672363281, 64.20369720458984, 67.27462768554688, 70.34555053710938, 73.41648864746094, 76.48741149902344, 79.55834197998047, 82.6292724609375, 85.70020294189453, 88.77113342285156, 91.8420639038086, 94.91299438476562, 97.98391723632812, 101.05485534667969]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 3.0, 3.0, 6.0, 12.0, 9.0, 19.0, 18.0, 21.0, 23.0, 25.0, 26.0, 25.0, 47.0, 41.0, 53.0, 53.0, 47.0, 55.0, 53.0, 55.0, 48.0, 55.0, 37.0, 40.0, 32.0, 28.0, 29.0, 25.0, 23.0, 29.0, 17.0, 8.0, 10.0, 8.0, 6.0, 8.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-61.604740142822266, -59.988685607910156, -58.37263107299805, -56.75657653808594, -55.14052200317383, -53.52446746826172, -51.90841293334961, -50.2923583984375, -48.67630386352539, -47.06024932861328, -45.44419479370117, -43.82814025878906, -42.21208572387695, -40.596031188964844, -38.979976654052734, -37.363922119140625, -35.747867584228516, -34.131813049316406, -32.5157585144043, -30.899703979492188, -29.283649444580078, -27.66759490966797, -26.05154037475586, -24.43548583984375, -22.81943130493164, -21.20337677001953, -19.587322235107422, -17.971267700195312, -16.355213165283203, -14.739158630371094, -13.123104095458984, -11.507049560546875, -9.8909912109375, -8.27493667602539, -6.658882141113281, -5.042827606201172, -3.4267730712890625, -1.8107185363769531, -0.19466400146484375, 1.4213905334472656, 3.037445068359375, 4.653499603271484, 6.269554138183594, 7.885608673095703, 9.501663208007812, 11.117717742919922, 12.733772277832031, 14.34982681274414, 15.96588134765625, 17.58193588256836, 19.19799041748047, 20.814044952392578, 22.430099487304688, 24.046154022216797, 25.662208557128906, 27.278263092041016, 28.894317626953125, 30.510372161865234, 32.126426696777344, 33.74248123168945, 35.35853576660156, 36.97459030151367, 38.59064483642578, 40.20669937133789, 41.82275390625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 10.0, 9.0, 7.0, 13.0, 18.0, 30.0, 39.0, 57.0, 87.0, 128.0, 255.0, 393.0, 577.0, 1059.0, 1772.0, 3083.0, 5754.0, 10644.0, 20149.0, 40724.0, 85457.0, 205810.0, 360223.0, 166570.0, 72528.0, 34774.0, 17716.0, 9161.0, 4841.0, 2702.0, 1528.0, 919.0, 573.0, 350.0, 213.0, 126.0, 90.0, 53.0, 40.0, 24.0, 15.0, 12.0, 11.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.83984375, -5.6595458984375, -5.479248046875, -5.2989501953125, -5.11865234375, -4.9383544921875, -4.758056640625, -4.5777587890625, -4.3974609375, -4.2171630859375, -4.036865234375, -3.8565673828125, -3.67626953125, -3.4959716796875, -3.315673828125, -3.1353759765625, -2.955078125, -2.7747802734375, -2.594482421875, -2.4141845703125, -2.23388671875, -2.0535888671875, -1.873291015625, -1.6929931640625, -1.5126953125, -1.3323974609375, -1.152099609375, -0.9718017578125, -0.79150390625, -0.6112060546875, -0.430908203125, -0.2506103515625, -0.0703125, 0.1099853515625, 0.290283203125, 0.4705810546875, 0.65087890625, 0.8311767578125, 1.011474609375, 1.1917724609375, 1.3720703125, 1.5523681640625, 1.732666015625, 1.9129638671875, 2.09326171875, 2.2735595703125, 2.453857421875, 2.6341552734375, 2.814453125, 2.9947509765625, 3.175048828125, 3.3553466796875, 3.53564453125, 3.7159423828125, 3.896240234375, 4.0765380859375, 4.2568359375, 4.4371337890625, 4.617431640625, 4.7977294921875, 4.97802734375, 5.1583251953125, 5.338623046875, 5.5189208984375, 5.69921875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 9.0, 8.0, 7.0, 15.0, 19.0, 21.0, 22.0, 17.0, 29.0, 24.0, 22.0, 33.0, 30.0, 31.0, 38.0, 32.0, 39.0, 38.0, 48.0, 39.0, 50.0, 54.0, 48.0, 36.0, 33.0, 30.0, 22.0, 30.0, 28.0, 19.0, 18.0, 19.0, 14.0, 11.0, 12.0, 8.0, 6.0, 10.0, 4.0, 7.0, 5.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.275390625, -2.198944091796875, -2.12249755859375, -2.046051025390625, -1.9696044921875, -1.893157958984375, -1.81671142578125, -1.740264892578125, -1.663818359375, -1.587371826171875, -1.51092529296875, -1.434478759765625, -1.3580322265625, -1.281585693359375, -1.20513916015625, -1.128692626953125, -1.05224609375, -0.975799560546875, -0.89935302734375, -0.822906494140625, -0.7464599609375, -0.670013427734375, -0.59356689453125, -0.517120361328125, -0.440673828125, -0.364227294921875, -0.28778076171875, -0.211334228515625, -0.1348876953125, -0.058441162109375, 0.01800537109375, 0.094451904296875, 0.1708984375, 0.247344970703125, 0.32379150390625, 0.400238037109375, 0.4766845703125, 0.553131103515625, 0.62957763671875, 0.706024169921875, 0.782470703125, 0.858917236328125, 0.93536376953125, 1.011810302734375, 1.0882568359375, 1.164703369140625, 1.24114990234375, 1.317596435546875, 1.39404296875, 1.470489501953125, 1.54693603515625, 1.623382568359375, 1.6998291015625, 1.776275634765625, 1.85272216796875, 1.929168701171875, 2.005615234375, 2.082061767578125, 2.15850830078125, 2.234954833984375, 2.3114013671875, 2.387847900390625, 2.46429443359375, 2.540740966796875, 2.6171875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 17.0, 17.0, 22.0, 45.0, 52.0, 88.0, 121.0, 185.0, 307.0, 521.0, 913.0, 1729.0, 4190.0, 14563.0, 109632.0, 821606.0, 75529.0, 11768.0, 3629.0, 1571.0, 791.0, 440.0, 283.0, 169.0, 129.0, 69.0, 52.0, 30.0, 27.0, 14.0, 14.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.921875, -18.27880859375, -17.6357421875, -16.99267578125, -16.349609375, -15.70654296875, -15.0634765625, -14.42041015625, -13.77734375, -13.13427734375, -12.4912109375, -11.84814453125, -11.205078125, -10.56201171875, -9.9189453125, -9.27587890625, -8.6328125, -7.98974609375, -7.3466796875, -6.70361328125, -6.060546875, -5.41748046875, -4.7744140625, -4.13134765625, -3.48828125, -2.84521484375, -2.2021484375, -1.55908203125, -0.916015625, -0.27294921875, 0.3701171875, 1.01318359375, 1.65625, 2.29931640625, 2.9423828125, 3.58544921875, 4.228515625, 4.87158203125, 5.5146484375, 6.15771484375, 6.80078125, 7.44384765625, 8.0869140625, 8.72998046875, 9.373046875, 10.01611328125, 10.6591796875, 11.30224609375, 11.9453125, 12.58837890625, 13.2314453125, 13.87451171875, 14.517578125, 15.16064453125, 15.8037109375, 16.44677734375, 17.08984375, 17.73291015625, 18.3759765625, 19.01904296875, 19.662109375, 20.30517578125, 20.9482421875, 21.59130859375, 22.234375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 5.0, 3.0, 6.0, 3.0, 5.0, 7.0, 7.0, 13.0, 10.0, 12.0, 16.0, 29.0, 31.0, 21.0, 42.0, 35.0, 41.0, 44.0, 42.0, 50.0, 46.0, 57.0, 53.0, 43.0, 42.0, 49.0, 30.0, 47.0, 29.0, 27.0, 33.0, 23.0, 19.0, 14.0, 8.0, 11.0, 14.0, 9.0, 7.0, 3.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.921875, -16.4744873046875, -16.027099609375, -15.5797119140625, -15.13232421875, -14.6849365234375, -14.237548828125, -13.7901611328125, -13.3427734375, -12.8953857421875, -12.447998046875, -12.0006103515625, -11.55322265625, -11.1058349609375, -10.658447265625, -10.2110595703125, -9.763671875, -9.3162841796875, -8.868896484375, -8.4215087890625, -7.97412109375, -7.5267333984375, -7.079345703125, -6.6319580078125, -6.1845703125, -5.7371826171875, -5.289794921875, -4.8424072265625, -4.39501953125, -3.9476318359375, -3.500244140625, -3.0528564453125, -2.60546875, -2.1580810546875, -1.710693359375, -1.2633056640625, -0.81591796875, -0.3685302734375, 0.078857421875, 0.5262451171875, 0.9736328125, 1.4210205078125, 1.868408203125, 2.3157958984375, 2.76318359375, 3.2105712890625, 3.657958984375, 4.1053466796875, 4.552734375, 5.0001220703125, 5.447509765625, 5.8948974609375, 6.34228515625, 6.7896728515625, 7.237060546875, 7.6844482421875, 8.1318359375, 8.5792236328125, 9.026611328125, 9.4739990234375, 9.92138671875, 10.3687744140625, 10.816162109375, 11.2635498046875, 11.7109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 2.0, 4.0, 8.0, 7.0, 12.0, 23.0, 12.0, 29.0, 45.0, 53.0, 79.0, 102.0, 157.0, 256.0, 379.0, 685.0, 1179.0, 2434.0, 5530.0, 13839.0, 41135.0, 141697.0, 622834.0, 149353.0, 43004.0, 14438.0, 5672.0, 2566.0, 1206.0, 676.0, 356.0, 242.0, 157.0, 109.0, 55.0, 48.0, 36.0, 24.0, 37.0, 15.0, 13.0, 19.0, 7.0, 5.0, 9.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.53125, -4.39190673828125, -4.2525634765625, -4.11322021484375, -3.973876953125, -3.83453369140625, -3.6951904296875, -3.55584716796875, -3.41650390625, -3.27716064453125, -3.1378173828125, -2.99847412109375, -2.859130859375, -2.71978759765625, -2.5804443359375, -2.44110107421875, -2.3017578125, -2.16241455078125, -2.0230712890625, -1.88372802734375, -1.744384765625, -1.60504150390625, -1.4656982421875, -1.32635498046875, -1.18701171875, -1.04766845703125, -0.9083251953125, -0.76898193359375, -0.629638671875, -0.49029541015625, -0.3509521484375, -0.21160888671875, -0.072265625, 0.06707763671875, 0.2064208984375, 0.34576416015625, 0.485107421875, 0.62445068359375, 0.7637939453125, 0.90313720703125, 1.04248046875, 1.18182373046875, 1.3211669921875, 1.46051025390625, 1.599853515625, 1.73919677734375, 1.8785400390625, 2.01788330078125, 2.1572265625, 2.29656982421875, 2.4359130859375, 2.57525634765625, 2.714599609375, 2.85394287109375, 2.9932861328125, 3.13262939453125, 3.27197265625, 3.41131591796875, 3.5506591796875, 3.69000244140625, 3.829345703125, 3.96868896484375, 4.1080322265625, 4.24737548828125, 4.38671875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 2.0, 8.0, 11.0, 11.0, 17.0, 11.0, 21.0, 25.0, 27.0, 37.0, 39.0, 55.0, 98.0, 160.0, 122.0, 81.0, 58.0, 42.0, 34.0, 28.0, 24.0, 14.0, 16.0, 13.0, 11.0, 4.0, 9.0, 2.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0017604827880859375, -0.0017082691192626953, -0.0016560554504394531, -0.001603841781616211, -0.0015516281127929688, -0.0014994144439697266, -0.0014472007751464844, -0.0013949871063232422, -0.0013427734375, -0.0012905597686767578, -0.0012383460998535156, -0.0011861324310302734, -0.0011339187622070312, -0.001081705093383789, -0.0010294914245605469, -0.0009772777557373047, -0.0009250640869140625, -0.0008728504180908203, -0.0008206367492675781, -0.0007684230804443359, -0.0007162094116210938, -0.0006639957427978516, -0.0006117820739746094, -0.0005595684051513672, -0.000507354736328125, -0.0004551410675048828, -0.0004029273986816406, -0.00035071372985839844, -0.00029850006103515625, -0.00024628639221191406, -0.00019407272338867188, -0.0001418590545654297, -8.96453857421875e-05, -3.743171691894531e-05, 1.4781951904296875e-05, 6.699562072753906e-05, 0.00011920928955078125, 0.00017142295837402344, 0.00022363662719726562, 0.0002758502960205078, 0.00032806396484375, 0.0003802776336669922, 0.0004324913024902344, 0.00048470497131347656, 0.0005369186401367188, 0.0005891323089599609, 0.0006413459777832031, 0.0006935596466064453, 0.0007457733154296875, 0.0007979869842529297, 0.0008502006530761719, 0.0009024143218994141, 0.0009546279907226562, 0.0010068416595458984, 0.0010590553283691406, 0.0011112689971923828, 0.001163482666015625, 0.0012156963348388672, 0.0012679100036621094, 0.0013201236724853516, 0.0013723373413085938, 0.001424551010131836, 0.0014767646789550781, 0.0015289783477783203, 0.0015811920166015625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 8.0, 5.0, 7.0, 8.0, 13.0, 16.0, 25.0, 32.0, 57.0, 97.0, 139.0, 192.0, 266.0, 398.0, 689.0, 1211.0, 2140.0, 4334.0, 10462.0, 34242.0, 154136.0, 655312.0, 134999.0, 30880.0, 9837.0, 4025.0, 1995.0, 1109.0, 685.0, 433.0, 253.0, 169.0, 113.0, 74.0, 62.0, 45.0, 20.0, 23.0, 17.0, 8.0, 11.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0], "bins": [-5.265625, -5.11712646484375, -4.9686279296875, -4.82012939453125, -4.671630859375, -4.52313232421875, -4.3746337890625, -4.22613525390625, -4.07763671875, -3.92913818359375, -3.7806396484375, -3.63214111328125, -3.483642578125, -3.33514404296875, -3.1866455078125, -3.03814697265625, -2.8896484375, -2.74114990234375, -2.5926513671875, -2.44415283203125, -2.295654296875, -2.14715576171875, -1.9986572265625, -1.85015869140625, -1.70166015625, -1.55316162109375, -1.4046630859375, -1.25616455078125, -1.107666015625, -0.95916748046875, -0.8106689453125, -0.66217041015625, -0.513671875, -0.36517333984375, -0.2166748046875, -0.06817626953125, 0.080322265625, 0.22882080078125, 0.3773193359375, 0.52581787109375, 0.67431640625, 0.82281494140625, 0.9713134765625, 1.11981201171875, 1.268310546875, 1.41680908203125, 1.5653076171875, 1.71380615234375, 1.8623046875, 2.01080322265625, 2.1593017578125, 2.30780029296875, 2.456298828125, 2.60479736328125, 2.7532958984375, 2.90179443359375, 3.05029296875, 3.19879150390625, 3.3472900390625, 3.49578857421875, 3.644287109375, 3.79278564453125, 3.9412841796875, 4.08978271484375, 4.23828125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 2.0, 3.0, 6.0, 5.0, 10.0, 8.0, 9.0, 19.0, 17.0, 16.0, 21.0, 30.0, 37.0, 35.0, 46.0, 51.0, 84.0, 97.0, 72.0, 83.0, 54.0, 47.0, 38.0, 29.0, 39.0, 32.0, 24.0, 16.0, 12.0, 12.0, 5.0, 9.0, 9.0, 5.0, 9.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.734375, -4.59063720703125, -4.4468994140625, -4.30316162109375, -4.159423828125, -4.01568603515625, -3.8719482421875, -3.72821044921875, -3.58447265625, -3.44073486328125, -3.2969970703125, -3.15325927734375, -3.009521484375, -2.86578369140625, -2.7220458984375, -2.57830810546875, -2.4345703125, -2.29083251953125, -2.1470947265625, -2.00335693359375, -1.859619140625, -1.71588134765625, -1.5721435546875, -1.42840576171875, -1.28466796875, -1.14093017578125, -0.9971923828125, -0.85345458984375, -0.709716796875, -0.56597900390625, -0.4222412109375, -0.27850341796875, -0.134765625, 0.00897216796875, 0.1527099609375, 0.29644775390625, 0.440185546875, 0.58392333984375, 0.7276611328125, 0.87139892578125, 1.01513671875, 1.15887451171875, 1.3026123046875, 1.44635009765625, 1.590087890625, 1.73382568359375, 1.8775634765625, 2.02130126953125, 2.1650390625, 2.30877685546875, 2.4525146484375, 2.59625244140625, 2.739990234375, 2.88372802734375, 3.0274658203125, 3.17120361328125, 3.31494140625, 3.45867919921875, 3.6024169921875, 3.74615478515625, 3.889892578125, 4.03363037109375, 4.1773681640625, 4.32110595703125, 4.46484375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 5.0, 9.0, 21.0, 30.0, 64.0, 172.0, 272.0, 186.0, 108.0, 58.0, 28.0, 23.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.49140930175781, -71.92589569091797, -67.36038208007812, -62.79486846923828, -58.22935485839844, -53.663841247558594, -49.09832763671875, -44.532814025878906, -39.96730041503906, -35.40178680419922, -30.836273193359375, -26.27075958251953, -21.705245971679688, -17.139732360839844, -12.57421875, -8.008705139160156, -3.4431915283203125, 1.1223220825195312, 5.687835693359375, 10.253349304199219, 14.818862915039062, 19.384376525878906, 23.94989013671875, 28.515403747558594, 33.08091735839844, 37.64643096923828, 42.211944580078125, 46.77745819091797, 51.34297180175781, 55.908485412597656, 60.4739990234375, 65.03951263427734, 69.60504150390625, 74.1705551147461, 78.73606872558594, 83.30158233642578, 87.86709594726562, 92.43260955810547, 96.99812316894531, 101.56363677978516, 106.129150390625, 110.69466400146484, 115.26017761230469, 119.82569122314453, 124.39120483398438, 128.95672607421875, 133.52223205566406, 138.08773803710938, 142.65325927734375, 147.21878051757812, 151.78428649902344, 156.34979248046875, 160.91531372070312, 165.4808349609375, 170.0463409423828, 174.61184692382812, 179.1773681640625, 183.74288940429688, 188.3083953857422, 192.8739013671875, 197.43942260742188, 202.00494384765625, 206.57044982910156, 211.13595581054688, 215.70147705078125]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 10.0, 9.0, 5.0, 13.0, 8.0, 10.0, 17.0, 14.0, 11.0, 24.0, 23.0, 33.0, 23.0, 36.0, 33.0, 43.0, 50.0, 63.0, 77.0, 59.0, 64.0, 46.0, 35.0, 48.0, 34.0, 24.0, 25.0, 22.0, 15.0, 27.0, 19.0, 12.0, 11.0, 16.0, 5.0, 10.0, 4.0, 5.0, 9.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-50.63334274291992, -48.9393310546875, -47.24531555175781, -45.55130386352539, -43.85729217529297, -42.16327667236328, -40.46926498413086, -38.77525329589844, -37.08123779296875, -35.38722610473633, -33.69321060180664, -31.99919891357422, -30.305187225341797, -28.611173629760742, -26.917160034179688, -25.223148345947266, -23.529136657714844, -21.83512306213379, -20.141111373901367, -18.447097778320312, -16.75308609008789, -15.059072494506836, -13.365058898925781, -11.671046257019043, -9.977033615112305, -8.283020973205566, -6.58900785446167, -4.894994735717773, -3.200982093811035, -1.5069694519042969, 0.1870441436767578, 1.881056785583496, 3.5750656127929688, 5.269078254699707, 6.9630913734436035, 8.6571044921875, 10.351117134094238, 12.045129776000977, 13.739143371582031, 15.43315601348877, 17.127168655395508, 18.821182250976562, 20.515193939208984, 22.20920753479004, 23.903221130371094, 25.597232818603516, 27.29124641418457, 28.985260009765625, 30.679271697998047, 32.37328338623047, 34.067298889160156, 35.76131057739258, 37.455322265625, 39.14933776855469, 40.84334945678711, 42.53736114501953, 44.23137664794922, 45.92538833618164, 47.61940383911133, 49.31341552734375, 51.00742721557617, 52.701438903808594, 54.39545440673828, 56.0894660949707, 57.783477783203125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 7.0, 9.0, 19.0, 30.0, 43.0, 69.0, 105.0, 220.0, 357.0, 716.0, 1337.0, 3217.0, 7675.0, 21416.0, 71376.0, 369002.0, 2476290.0, 1040822.0, 142397.0, 36681.0, 12805.0, 4935.0, 2200.0, 1098.0, 562.0, 337.0, 189.0, 135.0, 69.0, 62.0, 39.0, 19.0, 15.0, 7.0, 8.0, 4.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.75, -5.57958984375, -5.4091796875, -5.23876953125, -5.068359375, -4.89794921875, -4.7275390625, -4.55712890625, -4.38671875, -4.21630859375, -4.0458984375, -3.87548828125, -3.705078125, -3.53466796875, -3.3642578125, -3.19384765625, -3.0234375, -2.85302734375, -2.6826171875, -2.51220703125, -2.341796875, -2.17138671875, -2.0009765625, -1.83056640625, -1.66015625, -1.48974609375, -1.3193359375, -1.14892578125, -0.978515625, -0.80810546875, -0.6376953125, -0.46728515625, -0.296875, -0.12646484375, 0.0439453125, 0.21435546875, 0.384765625, 0.55517578125, 0.7255859375, 0.89599609375, 1.06640625, 1.23681640625, 1.4072265625, 1.57763671875, 1.748046875, 1.91845703125, 2.0888671875, 2.25927734375, 2.4296875, 2.60009765625, 2.7705078125, 2.94091796875, 3.111328125, 3.28173828125, 3.4521484375, 3.62255859375, 3.79296875, 3.96337890625, 4.1337890625, 4.30419921875, 4.474609375, 4.64501953125, 4.8154296875, 4.98583984375, 5.15625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 5.0, 8.0, 9.0, 5.0, 11.0, 14.0, 14.0, 26.0, 25.0, 30.0, 36.0, 37.0, 32.0, 42.0, 27.0, 42.0, 62.0, 50.0, 50.0, 41.0, 53.0, 43.0, 40.0, 38.0, 31.0, 35.0, 23.0, 26.0, 26.0, 17.0, 20.0, 14.0, 17.0, 10.0, 7.0, 9.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.759765625, -2.67413330078125, -2.5885009765625, -2.50286865234375, -2.417236328125, -2.33160400390625, -2.2459716796875, -2.16033935546875, -2.07470703125, -1.98907470703125, -1.9034423828125, -1.81781005859375, -1.732177734375, -1.64654541015625, -1.5609130859375, -1.47528076171875, -1.3896484375, -1.30401611328125, -1.2183837890625, -1.13275146484375, -1.047119140625, -0.96148681640625, -0.8758544921875, -0.79022216796875, -0.70458984375, -0.61895751953125, -0.5333251953125, -0.44769287109375, -0.362060546875, -0.27642822265625, -0.1907958984375, -0.10516357421875, -0.01953125, 0.06610107421875, 0.1517333984375, 0.23736572265625, 0.322998046875, 0.40863037109375, 0.4942626953125, 0.57989501953125, 0.66552734375, 0.75115966796875, 0.8367919921875, 0.92242431640625, 1.008056640625, 1.09368896484375, 1.1793212890625, 1.26495361328125, 1.3505859375, 1.43621826171875, 1.5218505859375, 1.60748291015625, 1.693115234375, 1.77874755859375, 1.8643798828125, 1.95001220703125, 2.03564453125, 2.12127685546875, 2.2069091796875, 2.29254150390625, 2.378173828125, 2.46380615234375, 2.5494384765625, 2.63507080078125, 2.720703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 3.0, 10.0, 8.0, 19.0, 27.0, 48.0, 93.0, 164.0, 274.0, 597.0, 1285.0, 3180.0, 8552.0, 29676.0, 158003.0, 2413090.0, 1441867.0, 106035.0, 20795.0, 6189.0, 2306.0, 983.0, 477.0, 244.0, 155.0, 79.0, 40.0, 29.0, 19.0, 11.0, 10.0, 7.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.3203125, -10.9864501953125, -10.652587890625, -10.3187255859375, -9.98486328125, -9.6510009765625, -9.317138671875, -8.9832763671875, -8.6494140625, -8.3155517578125, -7.981689453125, -7.6478271484375, -7.31396484375, -6.9801025390625, -6.646240234375, -6.3123779296875, -5.978515625, -5.6446533203125, -5.310791015625, -4.9769287109375, -4.64306640625, -4.3092041015625, -3.975341796875, -3.6414794921875, -3.3076171875, -2.9737548828125, -2.639892578125, -2.3060302734375, -1.97216796875, -1.6383056640625, -1.304443359375, -0.9705810546875, -0.63671875, -0.3028564453125, 0.031005859375, 0.3648681640625, 0.69873046875, 1.0325927734375, 1.366455078125, 1.7003173828125, 2.0341796875, 2.3680419921875, 2.701904296875, 3.0357666015625, 3.36962890625, 3.7034912109375, 4.037353515625, 4.3712158203125, 4.705078125, 5.0389404296875, 5.372802734375, 5.7066650390625, 6.04052734375, 6.3743896484375, 6.708251953125, 7.0421142578125, 7.3759765625, 7.7098388671875, 8.043701171875, 8.3775634765625, 8.71142578125, 9.0452880859375, 9.379150390625, 9.7130126953125, 10.046875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 10.0, 16.0, 13.0, 23.0, 18.0, 20.0, 41.0, 67.0, 90.0, 125.0, 190.0, 331.0, 511.0, 752.0, 645.0, 407.0, 263.0, 178.0, 104.0, 76.0, 45.0, 43.0, 24.0, 12.0, 12.0, 13.0, 10.0, 2.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2890625, -9.954833984375, -9.62060546875, -9.286376953125, -8.9521484375, -8.617919921875, -8.28369140625, -7.949462890625, -7.615234375, -7.281005859375, -6.94677734375, -6.612548828125, -6.2783203125, -5.944091796875, -5.60986328125, -5.275634765625, -4.94140625, -4.607177734375, -4.27294921875, -3.938720703125, -3.6044921875, -3.270263671875, -2.93603515625, -2.601806640625, -2.267578125, -1.933349609375, -1.59912109375, -1.264892578125, -0.9306640625, -0.596435546875, -0.26220703125, 0.072021484375, 0.40625, 0.740478515625, 1.07470703125, 1.408935546875, 1.7431640625, 2.077392578125, 2.41162109375, 2.745849609375, 3.080078125, 3.414306640625, 3.74853515625, 4.082763671875, 4.4169921875, 4.751220703125, 5.08544921875, 5.419677734375, 5.75390625, 6.088134765625, 6.42236328125, 6.756591796875, 7.0908203125, 7.425048828125, 7.75927734375, 8.093505859375, 8.427734375, 8.761962890625, 9.09619140625, 9.430419921875, 9.7646484375, 10.098876953125, 10.43310546875, 10.767333984375, 11.1015625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 6.0, 14.0, 27.0, 63.0, 132.0, 213.0, 211.0, 178.0, 87.0, 31.0, 14.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.84857177734375, -143.39707946777344, -138.94558715820312, -134.4940948486328, -130.0426025390625, -125.59110260009766, -121.13961029052734, -116.68811798095703, -112.23661804199219, -107.78512573242188, -103.33363342285156, -98.88214111328125, -94.4306411743164, -89.9791488647461, -85.52765655517578, -81.07616424560547, -76.62467193603516, -72.17317962646484, -67.72168731689453, -63.27019119262695, -58.818695068359375, -54.36720275878906, -49.91571044921875, -45.46421813964844, -41.01272201538086, -36.56122970581055, -32.10973358154297, -27.658241271972656, -23.20674705505371, -18.755252838134766, -14.303760528564453, -9.852266311645508, -5.4007720947265625, -0.9492783546447754, 3.5022153854370117, 7.953708648681641, 12.405202865600586, 16.85669708251953, 21.308189392089844, 25.75968360900879, 30.211177825927734, 34.66267013549805, 39.114166259765625, 43.56565856933594, 48.01715087890625, 52.46864700317383, 56.92013931274414, 61.37163543701172, 65.82312774658203, 70.27462005615234, 74.72611236572266, 79.1776123046875, 83.62910461425781, 88.08059692382812, 92.53208923339844, 96.98358154296875, 101.43507385253906, 105.88656616210938, 110.33805847167969, 114.78955078125, 119.24105072021484, 123.69254302978516, 128.14404296875, 132.5955352783203, 137.04702758789062]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 8.0, 9.0, 7.0, 9.0, 6.0, 10.0, 15.0, 15.0, 18.0, 29.0, 29.0, 30.0, 24.0, 35.0, 42.0, 37.0, 42.0, 48.0, 43.0, 47.0, 49.0, 48.0, 35.0, 34.0, 34.0, 36.0, 36.0, 39.0, 30.0, 19.0, 32.0, 19.0, 15.0, 12.0, 11.0, 10.0, 7.0, 4.0, 2.0, 8.0, 8.0, 3.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.10148620605469, -41.596649169921875, -40.09181213378906, -38.58697509765625, -37.08213806152344, -35.577301025390625, -34.07246398925781, -32.567626953125, -31.062788009643555, -29.557950973510742, -28.05311393737793, -26.548274993896484, -25.043437957763672, -23.53860092163086, -22.033763885498047, -20.528926849365234, -19.024089813232422, -17.51925277709961, -16.014415740966797, -14.509577751159668, -13.004740715026855, -11.499903678894043, -9.995065689086914, -8.490228652954102, -6.985391616821289, -5.480554580688477, -3.975717067718506, -2.470879554748535, -0.9660425186157227, 0.5387945175170898, 2.0436325073242188, 3.5484695434570312, 5.053310394287109, 6.558147430419922, 8.062984466552734, 9.567822456359863, 11.072659492492676, 12.577496528625488, 14.082334518432617, 15.58717155456543, 17.092008590698242, 18.596845626831055, 20.101682662963867, 21.606521606445312, 23.111358642578125, 24.616195678710938, 26.12103271484375, 27.625869750976562, 29.130706787109375, 30.635543823242188, 32.140380859375, 33.64521789550781, 35.150054931640625, 36.65489196777344, 38.15972900390625, 39.66456604003906, 41.169403076171875, 42.67424011230469, 44.1790771484375, 45.68391418457031, 47.188751220703125, 48.69358825683594, 50.19842529296875, 51.70326232910156, 53.20810317993164]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 12.0, 17.0, 26.0, 38.0, 51.0, 104.0, 149.0, 261.0, 418.0, 709.0, 1166.0, 2071.0, 3628.0, 7087.0, 14947.0, 35775.0, 106539.0, 374379.0, 343102.0, 95926.0, 33168.0, 14097.0, 6655.0, 3523.0, 1923.0, 1091.0, 618.0, 369.0, 255.0, 166.0, 108.0, 61.0, 38.0, 34.0, 14.0, 10.0, 9.0, 4.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.23828125, -7.01177978515625, -6.7852783203125, -6.55877685546875, -6.332275390625, -6.10577392578125, -5.8792724609375, -5.65277099609375, -5.42626953125, -5.19976806640625, -4.9732666015625, -4.74676513671875, -4.520263671875, -4.29376220703125, -4.0672607421875, -3.84075927734375, -3.6142578125, -3.38775634765625, -3.1612548828125, -2.93475341796875, -2.708251953125, -2.48175048828125, -2.2552490234375, -2.02874755859375, -1.80224609375, -1.57574462890625, -1.3492431640625, -1.12274169921875, -0.896240234375, -0.66973876953125, -0.4432373046875, -0.21673583984375, 0.009765625, 0.23626708984375, 0.4627685546875, 0.68927001953125, 0.915771484375, 1.14227294921875, 1.3687744140625, 1.59527587890625, 1.82177734375, 2.04827880859375, 2.2747802734375, 2.50128173828125, 2.727783203125, 2.95428466796875, 3.1807861328125, 3.40728759765625, 3.6337890625, 3.86029052734375, 4.0867919921875, 4.31329345703125, 4.539794921875, 4.76629638671875, 4.9927978515625, 5.21929931640625, 5.44580078125, 5.67230224609375, 5.8988037109375, 6.12530517578125, 6.351806640625, 6.57830810546875, 6.8048095703125, 7.03131103515625, 7.2578125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 9.0, 5.0, 6.0, 15.0, 17.0, 27.0, 19.0, 35.0, 32.0, 35.0, 40.0, 32.0, 56.0, 50.0, 54.0, 54.0, 58.0, 54.0, 52.0, 41.0, 45.0, 36.0, 35.0, 39.0, 31.0, 21.0, 22.0, 22.0, 8.0, 7.0, 10.0, 16.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.923828125, -3.811309814453125, -3.69879150390625, -3.586273193359375, -3.4737548828125, -3.361236572265625, -3.24871826171875, -3.136199951171875, -3.023681640625, -2.911163330078125, -2.79864501953125, -2.686126708984375, -2.5736083984375, -2.461090087890625, -2.34857177734375, -2.236053466796875, -2.12353515625, -2.011016845703125, -1.89849853515625, -1.785980224609375, -1.6734619140625, -1.560943603515625, -1.44842529296875, -1.335906982421875, -1.223388671875, -1.110870361328125, -0.99835205078125, -0.885833740234375, -0.7733154296875, -0.660797119140625, -0.54827880859375, -0.435760498046875, -0.3232421875, -0.210723876953125, -0.09820556640625, 0.014312744140625, 0.1268310546875, 0.239349365234375, 0.35186767578125, 0.464385986328125, 0.576904296875, 0.689422607421875, 0.80194091796875, 0.914459228515625, 1.0269775390625, 1.139495849609375, 1.25201416015625, 1.364532470703125, 1.47705078125, 1.589569091796875, 1.70208740234375, 1.814605712890625, 1.9271240234375, 2.039642333984375, 2.15216064453125, 2.264678955078125, 2.377197265625, 2.489715576171875, 2.60223388671875, 2.714752197265625, 2.8272705078125, 2.939788818359375, 3.05230712890625, 3.164825439453125, 3.27734375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 4.0, 5.0, 7.0, 5.0, 13.0, 13.0, 37.0, 33.0, 58.0, 103.0, 135.0, 197.0, 382.0, 649.0, 1342.0, 3339.0, 11679.0, 78409.0, 823076.0, 107573.0, 14512.0, 3770.0, 1483.0, 707.0, 400.0, 223.0, 133.0, 87.0, 61.0, 46.0, 27.0, 10.0, 14.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.03125, -17.4775390625, -16.923828125, -16.3701171875, -15.81640625, -15.2626953125, -14.708984375, -14.1552734375, -13.6015625, -13.0478515625, -12.494140625, -11.9404296875, -11.38671875, -10.8330078125, -10.279296875, -9.7255859375, -9.171875, -8.6181640625, -8.064453125, -7.5107421875, -6.95703125, -6.4033203125, -5.849609375, -5.2958984375, -4.7421875, -4.1884765625, -3.634765625, -3.0810546875, -2.52734375, -1.9736328125, -1.419921875, -0.8662109375, -0.3125, 0.2412109375, 0.794921875, 1.3486328125, 1.90234375, 2.4560546875, 3.009765625, 3.5634765625, 4.1171875, 4.6708984375, 5.224609375, 5.7783203125, 6.33203125, 6.8857421875, 7.439453125, 7.9931640625, 8.546875, 9.1005859375, 9.654296875, 10.2080078125, 10.76171875, 11.3154296875, 11.869140625, 12.4228515625, 12.9765625, 13.5302734375, 14.083984375, 14.6376953125, 15.19140625, 15.7451171875, 16.298828125, 16.8525390625, 17.40625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 9.0, 5.0, 8.0, 10.0, 17.0, 10.0, 14.0, 19.0, 20.0, 32.0, 36.0, 45.0, 46.0, 41.0, 56.0, 49.0, 61.0, 63.0, 61.0, 72.0, 48.0, 47.0, 50.0, 28.0, 22.0, 23.0, 23.0, 16.0, 22.0, 20.0, 7.0, 3.0, 6.0, 2.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.703125, -17.183349609375, -16.66357421875, -16.143798828125, -15.6240234375, -15.104248046875, -14.58447265625, -14.064697265625, -13.544921875, -13.025146484375, -12.50537109375, -11.985595703125, -11.4658203125, -10.946044921875, -10.42626953125, -9.906494140625, -9.38671875, -8.866943359375, -8.34716796875, -7.827392578125, -7.3076171875, -6.787841796875, -6.26806640625, -5.748291015625, -5.228515625, -4.708740234375, -4.18896484375, -3.669189453125, -3.1494140625, -2.629638671875, -2.10986328125, -1.590087890625, -1.0703125, -0.550537109375, -0.03076171875, 0.489013671875, 1.0087890625, 1.528564453125, 2.04833984375, 2.568115234375, 3.087890625, 3.607666015625, 4.12744140625, 4.647216796875, 5.1669921875, 5.686767578125, 6.20654296875, 6.726318359375, 7.24609375, 7.765869140625, 8.28564453125, 8.805419921875, 9.3251953125, 9.844970703125, 10.36474609375, 10.884521484375, 11.404296875, 11.924072265625, 12.44384765625, 12.963623046875, 13.4833984375, 14.003173828125, 14.52294921875, 15.042724609375, 15.5625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 5.0, 6.0, 6.0, 15.0, 35.0, 44.0, 80.0, 145.0, 329.0, 687.0, 1906.0, 6599.0, 32004.0, 265368.0, 673862.0, 53154.0, 9968.0, 2633.0, 898.0, 387.0, 182.0, 92.0, 63.0, 29.0, 17.0, 14.0, 11.0, 4.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6640625, -6.43536376953125, -6.2066650390625, -5.97796630859375, -5.749267578125, -5.52056884765625, -5.2918701171875, -5.06317138671875, -4.83447265625, -4.60577392578125, -4.3770751953125, -4.14837646484375, -3.919677734375, -3.69097900390625, -3.4622802734375, -3.23358154296875, -3.0048828125, -2.77618408203125, -2.5474853515625, -2.31878662109375, -2.090087890625, -1.86138916015625, -1.6326904296875, -1.40399169921875, -1.17529296875, -0.94659423828125, -0.7178955078125, -0.48919677734375, -0.260498046875, -0.03179931640625, 0.1968994140625, 0.42559814453125, 0.654296875, 0.88299560546875, 1.1116943359375, 1.34039306640625, 1.569091796875, 1.79779052734375, 2.0264892578125, 2.25518798828125, 2.48388671875, 2.71258544921875, 2.9412841796875, 3.16998291015625, 3.398681640625, 3.62738037109375, 3.8560791015625, 4.08477783203125, 4.3134765625, 4.54217529296875, 4.7708740234375, 4.99957275390625, 5.228271484375, 5.45697021484375, 5.6856689453125, 5.91436767578125, 6.14306640625, 6.37176513671875, 6.6004638671875, 6.82916259765625, 7.057861328125, 7.28656005859375, 7.5152587890625, 7.74395751953125, 7.97265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 0.0, 4.0, 3.0, 8.0, 11.0, 10.0, 11.0, 18.0, 14.0, 23.0, 20.0, 16.0, 42.0, 69.0, 93.0, 144.0, 144.0, 105.0, 52.0, 36.0, 36.0, 29.0, 20.0, 11.0, 13.0, 11.0, 14.0, 5.0, 10.0, 6.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0013866424560546875, -0.001338958740234375, -0.0012912750244140625, -0.00124359130859375, -0.0011959075927734375, -0.001148223876953125, -0.0011005401611328125, -0.0010528564453125, -0.0010051727294921875, -0.000957489013671875, -0.0009098052978515625, -0.00086212158203125, -0.0008144378662109375, -0.000766754150390625, -0.0007190704345703125, -0.00067138671875, -0.0006237030029296875, -0.000576019287109375, -0.0005283355712890625, -0.00048065185546875, -0.0004329681396484375, -0.000385284423828125, -0.0003376007080078125, -0.0002899169921875, -0.0002422332763671875, -0.000194549560546875, -0.0001468658447265625, -9.918212890625e-05, -5.14984130859375e-05, -3.814697265625e-06, 4.38690185546875e-05, 9.1552734375e-05, 0.0001392364501953125, 0.000186920166015625, 0.0002346038818359375, 0.00028228759765625, 0.0003299713134765625, 0.000377655029296875, 0.0004253387451171875, 0.0004730224609375, 0.0005207061767578125, 0.000568389892578125, 0.0006160736083984375, 0.00066375732421875, 0.0007114410400390625, 0.000759124755859375, 0.0008068084716796875, 0.0008544921875, 0.0009021759033203125, 0.000949859619140625, 0.0009975433349609375, 0.00104522705078125, 0.0010929107666015625, 0.001140594482421875, 0.0011882781982421875, 0.0012359619140625, 0.0012836456298828125, 0.001331329345703125, 0.0013790130615234375, 0.00142669677734375, 0.0014743804931640625, 0.001522064208984375, 0.0015697479248046875, 0.001617431640625, 0.0016651153564453125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 5.0, 10.0, 13.0, 21.0, 14.0, 34.0, 55.0, 74.0, 122.0, 188.0, 332.0, 657.0, 1210.0, 2667.0, 7302.0, 25960.0, 127535.0, 707237.0, 135275.0, 27043.0, 7380.0, 2627.0, 1222.0, 597.0, 359.0, 201.0, 134.0, 97.0, 49.0, 35.0, 29.0, 17.0, 23.0, 10.0, 6.0, 5.0, 2.0, 1.0, 6.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-6.03515625, -5.869873046875, -5.70458984375, -5.539306640625, -5.3740234375, -5.208740234375, -5.04345703125, -4.878173828125, -4.712890625, -4.547607421875, -4.38232421875, -4.217041015625, -4.0517578125, -3.886474609375, -3.72119140625, -3.555908203125, -3.390625, -3.225341796875, -3.06005859375, -2.894775390625, -2.7294921875, -2.564208984375, -2.39892578125, -2.233642578125, -2.068359375, -1.903076171875, -1.73779296875, -1.572509765625, -1.4072265625, -1.241943359375, -1.07666015625, -0.911376953125, -0.74609375, -0.580810546875, -0.41552734375, -0.250244140625, -0.0849609375, 0.080322265625, 0.24560546875, 0.410888671875, 0.576171875, 0.741455078125, 0.90673828125, 1.072021484375, 1.2373046875, 1.402587890625, 1.56787109375, 1.733154296875, 1.8984375, 2.063720703125, 2.22900390625, 2.394287109375, 2.5595703125, 2.724853515625, 2.89013671875, 3.055419921875, 3.220703125, 3.385986328125, 3.55126953125, 3.716552734375, 3.8818359375, 4.047119140625, 4.21240234375, 4.377685546875, 4.54296875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 9.0, 5.0, 11.0, 14.0, 10.0, 16.0, 15.0, 25.0, 26.0, 39.0, 52.0, 55.0, 80.0, 116.0, 112.0, 95.0, 70.0, 58.0, 33.0, 29.0, 16.0, 16.0, 14.0, 15.0, 10.0, 11.0, 9.0, 3.0, 6.0, 3.0, 6.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.10546875, -4.95098876953125, -4.7965087890625, -4.64202880859375, -4.487548828125, -4.33306884765625, -4.1785888671875, -4.02410888671875, -3.86962890625, -3.71514892578125, -3.5606689453125, -3.40618896484375, -3.251708984375, -3.09722900390625, -2.9427490234375, -2.78826904296875, -2.6337890625, -2.47930908203125, -2.3248291015625, -2.17034912109375, -2.015869140625, -1.86138916015625, -1.7069091796875, -1.55242919921875, -1.39794921875, -1.24346923828125, -1.0889892578125, -0.93450927734375, -0.780029296875, -0.62554931640625, -0.4710693359375, -0.31658935546875, -0.162109375, -0.00762939453125, 0.1468505859375, 0.30133056640625, 0.455810546875, 0.61029052734375, 0.7647705078125, 0.91925048828125, 1.07373046875, 1.22821044921875, 1.3826904296875, 1.53717041015625, 1.691650390625, 1.84613037109375, 2.0006103515625, 2.15509033203125, 2.3095703125, 2.46405029296875, 2.6185302734375, 2.77301025390625, 2.927490234375, 3.08197021484375, 3.2364501953125, 3.39093017578125, 3.54541015625, 3.69989013671875, 3.8543701171875, 4.00885009765625, 4.163330078125, 4.31781005859375, 4.4722900390625, 4.62677001953125, 4.78125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 12.0, 29.0, 66.0, 188.0, 424.0, 189.0, 61.0, 16.0, 7.0, 9.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.97183227539062, -186.45510864257812, -179.93836975097656, -173.42164611816406, -166.90492248535156, -160.38818359375, -153.8714599609375, -147.354736328125, -140.8380126953125, -134.3212890625, -127.80455780029297, -121.28782653808594, -114.77110290527344, -108.2543716430664, -101.73764038085938, -95.22091674804688, -88.70418548583984, -82.18745422363281, -75.67073059082031, -69.15399932861328, -62.63727569580078, -56.12054443359375, -49.603816986083984, -43.08708953857422, -36.57036209106445, -30.053634643554688, -23.536907196044922, -17.020177841186523, -10.503450393676758, -3.9867210388183594, 2.5300064086914062, 9.046733856201172, 15.563461303710938, 22.080188751220703, 28.59691619873047, 35.1136474609375, 41.63037109375, 48.14710235595703, 54.6638298034668, 61.18055725097656, 67.69728088378906, 74.2140121459961, 80.7307357788086, 87.24746704101562, 93.76419067382812, 100.28092193603516, 106.79765319824219, 113.31437683105469, 119.83110809326172, 126.34783935546875, 132.86456298828125, 139.38128662109375, 145.8980255126953, 152.4147491455078, 158.9314727783203, 165.44821166992188, 171.96493530273438, 178.48165893554688, 184.99839782714844, 191.51512145996094, 198.03184509277344, 204.548583984375, 211.0653076171875, 217.58203125, 224.0987548828125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 6.0, 6.0, 3.0, 10.0, 12.0, 10.0, 13.0, 16.0, 13.0, 19.0, 18.0, 28.0, 23.0, 20.0, 28.0, 28.0, 32.0, 42.0, 48.0, 58.0, 76.0, 70.0, 49.0, 53.0, 41.0, 30.0, 36.0, 30.0, 19.0, 28.0, 26.0, 14.0, 17.0, 7.0, 10.0, 10.0, 11.0, 10.0, 5.0, 4.0, 8.0, 2.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-57.12102508544922, -55.33594512939453, -53.550865173339844, -51.765785217285156, -49.98070526123047, -48.19562530517578, -46.410545349121094, -44.625465393066406, -42.84038543701172, -41.05530548095703, -39.270225524902344, -37.485145568847656, -35.70006561279297, -33.91498565673828, -32.129905700683594, -30.344825744628906, -28.55974578857422, -26.77466583251953, -24.989585876464844, -23.204505920410156, -21.41942596435547, -19.63434600830078, -17.849266052246094, -16.064186096191406, -14.279106140136719, -12.494026184082031, -10.708946228027344, -8.923866271972656, -7.138786315917969, -5.353706359863281, -3.5686264038085938, -1.7835464477539062, 0.001529693603515625, 1.7866096496582031, 3.5716896057128906, 5.356769561767578, 7.141849517822266, 8.926929473876953, 10.71200942993164, 12.497089385986328, 14.282169342041016, 16.067249298095703, 17.85232925415039, 19.637409210205078, 21.422489166259766, 23.207569122314453, 24.99264907836914, 26.777729034423828, 28.562808990478516, 30.347888946533203, 32.13296890258789, 33.91804885864258, 35.703128814697266, 37.48820877075195, 39.27328872680664, 41.05836868286133, 42.843448638916016, 44.6285285949707, 46.41360855102539, 48.19868850708008, 49.983768463134766, 51.76884841918945, 53.55392837524414, 55.33900833129883, 57.124088287353516]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 3.0, 7.0, 13.0, 12.0, 15.0, 25.0, 29.0, 56.0, 81.0, 95.0, 200.0, 250.0, 430.0, 801.0, 1328.0, 2383.0, 4641.0, 9477.0, 21713.0, 60369.0, 238944.0, 1413162.0, 1967285.0, 341679.0, 78932.0, 27868.0, 11644.0, 5664.0, 2844.0, 1670.0, 922.0, 566.0, 399.0, 241.0, 166.0, 117.0, 75.0, 51.0, 35.0, 28.0, 14.0, 18.0, 14.0, 8.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.5703125, -4.43231201171875, -4.2943115234375, -4.15631103515625, -4.018310546875, -3.88031005859375, -3.7423095703125, -3.60430908203125, -3.46630859375, -3.32830810546875, -3.1903076171875, -3.05230712890625, -2.914306640625, -2.77630615234375, -2.6383056640625, -2.50030517578125, -2.3623046875, -2.22430419921875, -2.0863037109375, -1.94830322265625, -1.810302734375, -1.67230224609375, -1.5343017578125, -1.39630126953125, -1.25830078125, -1.12030029296875, -0.9822998046875, -0.84429931640625, -0.706298828125, -0.56829833984375, -0.4302978515625, -0.29229736328125, -0.154296875, -0.01629638671875, 0.1217041015625, 0.25970458984375, 0.397705078125, 0.53570556640625, 0.6737060546875, 0.81170654296875, 0.94970703125, 1.08770751953125, 1.2257080078125, 1.36370849609375, 1.501708984375, 1.63970947265625, 1.7777099609375, 1.91571044921875, 2.0537109375, 2.19171142578125, 2.3297119140625, 2.46771240234375, 2.605712890625, 2.74371337890625, 2.8817138671875, 3.01971435546875, 3.15771484375, 3.29571533203125, 3.4337158203125, 3.57171630859375, 3.709716796875, 3.84771728515625, 3.9857177734375, 4.12371826171875, 4.26171875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 10.0, 14.0, 12.0, 10.0, 13.0, 17.0, 22.0, 21.0, 29.0, 33.0, 45.0, 59.0, 38.0, 44.0, 55.0, 58.0, 53.0, 53.0, 59.0, 42.0, 56.0, 37.0, 36.0, 33.0, 25.0, 30.0, 25.0, 16.0, 13.0, 7.0, 12.0, 4.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.923828125, -3.80865478515625, -3.6934814453125, -3.57830810546875, -3.463134765625, -3.34796142578125, -3.2327880859375, -3.11761474609375, -3.00244140625, -2.88726806640625, -2.7720947265625, -2.65692138671875, -2.541748046875, -2.42657470703125, -2.3114013671875, -2.19622802734375, -2.0810546875, -1.96588134765625, -1.8507080078125, -1.73553466796875, -1.620361328125, -1.50518798828125, -1.3900146484375, -1.27484130859375, -1.15966796875, -1.04449462890625, -0.9293212890625, -0.81414794921875, -0.698974609375, -0.58380126953125, -0.4686279296875, -0.35345458984375, -0.23828125, -0.12310791015625, -0.0079345703125, 0.10723876953125, 0.222412109375, 0.33758544921875, 0.4527587890625, 0.56793212890625, 0.68310546875, 0.79827880859375, 0.9134521484375, 1.02862548828125, 1.143798828125, 1.25897216796875, 1.3741455078125, 1.48931884765625, 1.6044921875, 1.71966552734375, 1.8348388671875, 1.95001220703125, 2.065185546875, 2.18035888671875, 2.2955322265625, 2.41070556640625, 2.52587890625, 2.64105224609375, 2.7562255859375, 2.87139892578125, 2.986572265625, 3.10174560546875, 3.2169189453125, 3.33209228515625, 3.447265625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 7.0, 6.0, 7.0, 14.0, 19.0, 33.0, 56.0, 112.0, 169.0, 395.0, 891.0, 2311.0, 6726.0, 28825.0, 261980.0, 3578268.0, 272285.0, 30150.0, 7320.0, 2588.0, 1081.0, 469.0, 228.0, 135.0, 63.0, 58.0, 26.0, 14.0, 12.0, 10.0, 5.0, 6.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-15.3828125, -14.97265625, -14.5625, -14.15234375, -13.7421875, -13.33203125, -12.921875, -12.51171875, -12.1015625, -11.69140625, -11.28125, -10.87109375, -10.4609375, -10.05078125, -9.640625, -9.23046875, -8.8203125, -8.41015625, -8.0, -7.58984375, -7.1796875, -6.76953125, -6.359375, -5.94921875, -5.5390625, -5.12890625, -4.71875, -4.30859375, -3.8984375, -3.48828125, -3.078125, -2.66796875, -2.2578125, -1.84765625, -1.4375, -1.02734375, -0.6171875, -0.20703125, 0.203125, 0.61328125, 1.0234375, 1.43359375, 1.84375, 2.25390625, 2.6640625, 3.07421875, 3.484375, 3.89453125, 4.3046875, 4.71484375, 5.125, 5.53515625, 5.9453125, 6.35546875, 6.765625, 7.17578125, 7.5859375, 7.99609375, 8.40625, 8.81640625, 9.2265625, 9.63671875, 10.046875, 10.45703125, 10.8671875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 5.0, 4.0, 7.0, 7.0, 9.0, 26.0, 25.0, 42.0, 41.0, 52.0, 98.0, 154.0, 250.0, 440.0, 743.0, 741.0, 547.0, 315.0, 172.0, 124.0, 70.0, 52.0, 47.0, 17.0, 16.0, 14.0, 9.0, 9.0, 8.0, 8.0, 6.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0859375, -7.764404296875, -7.44287109375, -7.121337890625, -6.7998046875, -6.478271484375, -6.15673828125, -5.835205078125, -5.513671875, -5.192138671875, -4.87060546875, -4.549072265625, -4.2275390625, -3.906005859375, -3.58447265625, -3.262939453125, -2.94140625, -2.619873046875, -2.29833984375, -1.976806640625, -1.6552734375, -1.333740234375, -1.01220703125, -0.690673828125, -0.369140625, -0.047607421875, 0.27392578125, 0.595458984375, 0.9169921875, 1.238525390625, 1.56005859375, 1.881591796875, 2.203125, 2.524658203125, 2.84619140625, 3.167724609375, 3.4892578125, 3.810791015625, 4.13232421875, 4.453857421875, 4.775390625, 5.096923828125, 5.41845703125, 5.739990234375, 6.0615234375, 6.383056640625, 6.70458984375, 7.026123046875, 7.34765625, 7.669189453125, 7.99072265625, 8.312255859375, 8.6337890625, 8.955322265625, 9.27685546875, 9.598388671875, 9.919921875, 10.241455078125, 10.56298828125, 10.884521484375, 11.2060546875, 11.527587890625, 11.84912109375, 12.170654296875, 12.4921875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 16.0, 63.0, 216.0, 346.0, 233.0, 81.0, 18.0, 8.0, 2.0, 10.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-249.49484252929688, -243.35812377929688, -237.22140502929688, -231.08468627929688, -224.94796752929688, -218.81124877929688, -212.67453002929688, -206.53781127929688, -200.40109252929688, -194.26437377929688, -188.12765502929688, -181.99093627929688, -175.85421752929688, -169.71749877929688, -163.58078002929688, -157.44406127929688, -151.30734252929688, -145.17062377929688, -139.03390502929688, -132.89718627929688, -126.76046752929688, -120.62374877929688, -114.48703002929688, -108.35031127929688, -102.21359252929688, -96.07687377929688, -89.94015502929688, -83.80343627929688, -77.66671752929688, -71.52999877929688, -65.39328002929688, -59.256561279296875, -53.11985778808594, -46.98313903808594, -40.84642028808594, -34.70970153808594, -28.572982788085938, -22.436264038085938, -16.299545288085938, -10.162826538085938, -4.0261077880859375, 2.1106109619140625, 8.247329711914062, 14.384048461914062, 20.520767211914062, 26.657485961914062, 32.79420471191406, 38.93092346191406, 45.06764221191406, 51.20436096191406, 57.34107971191406, 63.47779846191406, 69.61451721191406, 75.75123596191406, 81.88795471191406, 88.02467346191406, 94.16139221191406, 100.29811096191406, 106.43482971191406, 112.57154846191406, 118.70826721191406, 124.84498596191406, 130.98170471191406, 137.11842346191406, 143.25514221191406]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 10.0, 8.0, 12.0, 15.0, 19.0, 21.0, 33.0, 28.0, 31.0, 51.0, 36.0, 47.0, 52.0, 62.0, 62.0, 48.0, 61.0, 39.0, 46.0, 38.0, 39.0, 45.0, 35.0, 27.0, 23.0, 25.0, 14.0, 13.0, 11.0, 17.0, 8.0, 3.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.34728240966797, -55.741737365722656, -54.136192321777344, -52.53064727783203, -50.92509841918945, -49.31955337524414, -47.71400833129883, -46.108463287353516, -44.5029182434082, -42.89737319946289, -41.29182815551758, -39.686279296875, -38.08073425292969, -36.475189208984375, -34.86964416503906, -33.26409912109375, -31.658552169799805, -30.053007125854492, -28.447460174560547, -26.841915130615234, -25.236370086669922, -23.63082504272461, -22.025278091430664, -20.41973304748535, -18.814186096191406, -17.208641052246094, -15.603095054626465, -13.997549057006836, -12.392004013061523, -10.786458015441895, -9.180912017822266, -7.575366973876953, -5.969821929931641, -4.36427640914917, -2.75873064994812, -1.1531848907470703, 0.4523606300354004, 2.057906150817871, 3.6634521484375, 5.2689971923828125, 6.874543190002441, 8.48008918762207, 10.085634231567383, 11.691180229187012, 13.29672622680664, 14.902271270751953, 16.507816314697266, 18.113361358642578, 19.718908309936523, 21.324453353881836, 22.93000030517578, 24.535545349121094, 26.141090393066406, 27.74663543701172, 29.352182388305664, 30.957727432250977, 32.56327438354492, 34.168819427490234, 35.77436447143555, 37.379913330078125, 38.98545837402344, 40.59100341796875, 42.19654846191406, 43.802093505859375, 45.40763854980469]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 14.0, 14.0, 19.0, 23.0, 33.0, 51.0, 88.0, 114.0, 152.0, 235.0, 312.0, 475.0, 704.0, 1168.0, 1880.0, 3143.0, 5724.0, 11140.0, 24657.0, 61590.0, 166112.0, 334782.0, 258996.0, 102880.0, 38842.0, 16563.0, 7913.0, 4229.0, 2430.0, 1525.0, 910.0, 622.0, 390.0, 242.0, 169.0, 115.0, 80.0, 62.0, 38.0, 30.0, 18.0, 17.0, 8.0, 12.0, 16.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-4.55859375, -4.41943359375, -4.2802734375, -4.14111328125, -4.001953125, -3.86279296875, -3.7236328125, -3.58447265625, -3.4453125, -3.30615234375, -3.1669921875, -3.02783203125, -2.888671875, -2.74951171875, -2.6103515625, -2.47119140625, -2.33203125, -2.19287109375, -2.0537109375, -1.91455078125, -1.775390625, -1.63623046875, -1.4970703125, -1.35791015625, -1.21875, -1.07958984375, -0.9404296875, -0.80126953125, -0.662109375, -0.52294921875, -0.3837890625, -0.24462890625, -0.10546875, 0.03369140625, 0.1728515625, 0.31201171875, 0.451171875, 0.59033203125, 0.7294921875, 0.86865234375, 1.0078125, 1.14697265625, 1.2861328125, 1.42529296875, 1.564453125, 1.70361328125, 1.8427734375, 1.98193359375, 2.12109375, 2.26025390625, 2.3994140625, 2.53857421875, 2.677734375, 2.81689453125, 2.9560546875, 3.09521484375, 3.234375, 3.37353515625, 3.5126953125, 3.65185546875, 3.791015625, 3.93017578125, 4.0693359375, 4.20849609375, 4.34765625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 6.0, 10.0, 11.0, 12.0, 16.0, 20.0, 32.0, 24.0, 21.0, 32.0, 36.0, 44.0, 42.0, 47.0, 45.0, 44.0, 51.0, 47.0, 49.0, 52.0, 49.0, 39.0, 34.0, 51.0, 28.0, 20.0, 26.0, 27.0, 20.0, 12.0, 6.0, 9.0, 10.0, 3.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.1328125, -4.0169677734375, -3.901123046875, -3.7852783203125, -3.66943359375, -3.5535888671875, -3.437744140625, -3.3218994140625, -3.2060546875, -3.0902099609375, -2.974365234375, -2.8585205078125, -2.74267578125, -2.6268310546875, -2.510986328125, -2.3951416015625, -2.279296875, -2.1634521484375, -2.047607421875, -1.9317626953125, -1.81591796875, -1.7000732421875, -1.584228515625, -1.4683837890625, -1.3525390625, -1.2366943359375, -1.120849609375, -1.0050048828125, -0.88916015625, -0.7733154296875, -0.657470703125, -0.5416259765625, -0.42578125, -0.3099365234375, -0.194091796875, -0.0782470703125, 0.03759765625, 0.1534423828125, 0.269287109375, 0.3851318359375, 0.5009765625, 0.6168212890625, 0.732666015625, 0.8485107421875, 0.96435546875, 1.0802001953125, 1.196044921875, 1.3118896484375, 1.427734375, 1.5435791015625, 1.659423828125, 1.7752685546875, 1.89111328125, 2.0069580078125, 2.122802734375, 2.2386474609375, 2.3544921875, 2.4703369140625, 2.586181640625, 2.7020263671875, 2.81787109375, 2.9337158203125, 3.049560546875, 3.1654052734375, 3.28125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 6.0, 4.0, 4.0, 5.0, 11.0, 18.0, 10.0, 22.0, 33.0, 42.0, 68.0, 121.0, 160.0, 276.0, 551.0, 1065.0, 2426.0, 6259.0, 22841.0, 138529.0, 693272.0, 147669.0, 23700.0, 6503.0, 2450.0, 1102.0, 560.0, 317.0, 176.0, 114.0, 79.0, 43.0, 32.0, 17.0, 19.0, 13.0, 11.0, 7.0, 10.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.6484375, -9.368896484375, -9.08935546875, -8.809814453125, -8.5302734375, -8.250732421875, -7.97119140625, -7.691650390625, -7.412109375, -7.132568359375, -6.85302734375, -6.573486328125, -6.2939453125, -6.014404296875, -5.73486328125, -5.455322265625, -5.17578125, -4.896240234375, -4.61669921875, -4.337158203125, -4.0576171875, -3.778076171875, -3.49853515625, -3.218994140625, -2.939453125, -2.659912109375, -2.38037109375, -2.100830078125, -1.8212890625, -1.541748046875, -1.26220703125, -0.982666015625, -0.703125, -0.423583984375, -0.14404296875, 0.135498046875, 0.4150390625, 0.694580078125, 0.97412109375, 1.253662109375, 1.533203125, 1.812744140625, 2.09228515625, 2.371826171875, 2.6513671875, 2.930908203125, 3.21044921875, 3.489990234375, 3.76953125, 4.049072265625, 4.32861328125, 4.608154296875, 4.8876953125, 5.167236328125, 5.44677734375, 5.726318359375, 6.005859375, 6.285400390625, 6.56494140625, 6.844482421875, 7.1240234375, 7.403564453125, 7.68310546875, 7.962646484375, 8.2421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 7.0, 11.0, 20.0, 17.0, 21.0, 24.0, 23.0, 34.0, 41.0, 49.0, 67.0, 49.0, 63.0, 52.0, 65.0, 46.0, 48.0, 37.0, 43.0, 53.0, 29.0, 29.0, 24.0, 31.0, 15.0, 19.0, 18.0, 13.0, 5.0, 8.0, 5.0, 5.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-17.109375, -16.64111328125, -16.1728515625, -15.70458984375, -15.236328125, -14.76806640625, -14.2998046875, -13.83154296875, -13.36328125, -12.89501953125, -12.4267578125, -11.95849609375, -11.490234375, -11.02197265625, -10.5537109375, -10.08544921875, -9.6171875, -9.14892578125, -8.6806640625, -8.21240234375, -7.744140625, -7.27587890625, -6.8076171875, -6.33935546875, -5.87109375, -5.40283203125, -4.9345703125, -4.46630859375, -3.998046875, -3.52978515625, -3.0615234375, -2.59326171875, -2.125, -1.65673828125, -1.1884765625, -0.72021484375, -0.251953125, 0.21630859375, 0.6845703125, 1.15283203125, 1.62109375, 2.08935546875, 2.5576171875, 3.02587890625, 3.494140625, 3.96240234375, 4.4306640625, 4.89892578125, 5.3671875, 5.83544921875, 6.3037109375, 6.77197265625, 7.240234375, 7.70849609375, 8.1767578125, 8.64501953125, 9.11328125, 9.58154296875, 10.0498046875, 10.51806640625, 10.986328125, 11.45458984375, 11.9228515625, 12.39111328125, 12.859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 1.0, 8.0, 7.0, 18.0, 15.0, 34.0, 60.0, 85.0, 189.0, 404.0, 1185.0, 3987.0, 15547.0, 92723.0, 732307.0, 169103.0, 24699.0, 5428.0, 1652.0, 598.0, 222.0, 120.0, 64.0, 41.0, 19.0, 13.0, 9.0, 8.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.43359375, -6.27130126953125, -6.1090087890625, -5.94671630859375, -5.784423828125, -5.62213134765625, -5.4598388671875, -5.29754638671875, -5.13525390625, -4.97296142578125, -4.8106689453125, -4.64837646484375, -4.486083984375, -4.32379150390625, -4.1614990234375, -3.99920654296875, -3.8369140625, -3.67462158203125, -3.5123291015625, -3.35003662109375, -3.187744140625, -3.02545166015625, -2.8631591796875, -2.70086669921875, -2.53857421875, -2.37628173828125, -2.2139892578125, -2.05169677734375, -1.889404296875, -1.72711181640625, -1.5648193359375, -1.40252685546875, -1.240234375, -1.07794189453125, -0.9156494140625, -0.75335693359375, -0.591064453125, -0.42877197265625, -0.2664794921875, -0.10418701171875, 0.05810546875, 0.22039794921875, 0.3826904296875, 0.54498291015625, 0.707275390625, 0.86956787109375, 1.0318603515625, 1.19415283203125, 1.3564453125, 1.51873779296875, 1.6810302734375, 1.84332275390625, 2.005615234375, 2.16790771484375, 2.3302001953125, 2.49249267578125, 2.65478515625, 2.81707763671875, 2.9793701171875, 3.14166259765625, 3.303955078125, 3.46624755859375, 3.6285400390625, 3.79083251953125, 3.953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 5.0, 3.0, 2.0, 4.0, 6.0, 6.0, 23.0, 13.0, 25.0, 36.0, 55.0, 71.0, 82.0, 110.0, 125.0, 113.0, 74.0, 69.0, 51.0, 38.0, 17.0, 10.0, 17.0, 13.0, 9.0, 7.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0013704299926757812, -0.0013345703482627869, -0.0012987107038497925, -0.001262851059436798, -0.0012269914150238037, -0.0011911317706108093, -0.001155272126197815, -0.0011194124817848206, -0.0010835528373718262, -0.0010476931929588318, -0.0010118335485458374, -0.000975973904132843, -0.0009401142597198486, -0.0009042546153068542, -0.0008683949708938599, -0.0008325353264808655, -0.0007966756820678711, -0.0007608160376548767, -0.0007249563932418823, -0.0006890967488288879, -0.0006532371044158936, -0.0006173774600028992, -0.0005815178155899048, -0.0005456581711769104, -0.000509798526763916, -0.00047393888235092163, -0.00043807923793792725, -0.00040221959352493286, -0.0003663599491119385, -0.0003305003046989441, -0.0002946406602859497, -0.0002587810158729553, -0.00022292137145996094, -0.00018706172704696655, -0.00015120208263397217, -0.00011534243822097778, -7.94827938079834e-05, -4.3623149394989014e-05, -7.763504981994629e-06, 2.8096139430999756e-05, 6.395578384399414e-05, 9.981542825698853e-05, 0.0001356750726699829, 0.0001715347170829773, 0.00020739436149597168, 0.00024325400590896606, 0.00027911365032196045, 0.00031497329473495483, 0.0003508329391479492, 0.0003866925835609436, 0.000422552227973938, 0.0004584118723869324, 0.0004942715167999268, 0.0005301311612129211, 0.0005659908056259155, 0.0006018504500389099, 0.0006377100944519043, 0.0006735697388648987, 0.0007094293832778931, 0.0007452890276908875, 0.0007811486721038818, 0.0008170083165168762, 0.0008528679609298706, 0.000888727605342865, 0.0009245872497558594]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 5.0, 11.0, 19.0, 35.0, 44.0, 98.0, 160.0, 261.0, 517.0, 1134.0, 2454.0, 6505.0, 21341.0, 88802.0, 577319.0, 270807.0, 56216.0, 14353.0, 4812.0, 1808.0, 832.0, 436.0, 224.0, 135.0, 69.0, 49.0, 27.0, 23.0, 16.0, 9.0, 11.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.33984375, -4.218780517578125, -4.09771728515625, -3.976654052734375, -3.8555908203125, -3.734527587890625, -3.61346435546875, -3.492401123046875, -3.371337890625, -3.250274658203125, -3.12921142578125, -3.008148193359375, -2.8870849609375, -2.766021728515625, -2.64495849609375, -2.523895263671875, -2.40283203125, -2.281768798828125, -2.16070556640625, -2.039642333984375, -1.9185791015625, -1.797515869140625, -1.67645263671875, -1.555389404296875, -1.434326171875, -1.313262939453125, -1.19219970703125, -1.071136474609375, -0.9500732421875, -0.829010009765625, -0.70794677734375, -0.586883544921875, -0.4658203125, -0.344757080078125, -0.22369384765625, -0.102630615234375, 0.0184326171875, 0.139495849609375, 0.26055908203125, 0.381622314453125, 0.502685546875, 0.623748779296875, 0.74481201171875, 0.865875244140625, 0.9869384765625, 1.108001708984375, 1.22906494140625, 1.350128173828125, 1.47119140625, 1.592254638671875, 1.71331787109375, 1.834381103515625, 1.9554443359375, 2.076507568359375, 2.19757080078125, 2.318634033203125, 2.439697265625, 2.560760498046875, 2.68182373046875, 2.802886962890625, 2.9239501953125, 3.045013427734375, 3.16607666015625, 3.287139892578125, 3.408203125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 8.0, 6.0, 15.0, 21.0, 25.0, 39.0, 51.0, 85.0, 100.0, 101.0, 108.0, 96.0, 82.0, 83.0, 47.0, 38.0, 27.0, 16.0, 12.0, 10.0, 6.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.109375, -4.96136474609375, -4.8133544921875, -4.66534423828125, -4.517333984375, -4.36932373046875, -4.2213134765625, -4.07330322265625, -3.92529296875, -3.77728271484375, -3.6292724609375, -3.48126220703125, -3.333251953125, -3.18524169921875, -3.0372314453125, -2.88922119140625, -2.7412109375, -2.59320068359375, -2.4451904296875, -2.29718017578125, -2.149169921875, -2.00115966796875, -1.8531494140625, -1.70513916015625, -1.55712890625, -1.40911865234375, -1.2611083984375, -1.11309814453125, -0.965087890625, -0.81707763671875, -0.6690673828125, -0.52105712890625, -0.373046875, -0.22503662109375, -0.0770263671875, 0.07098388671875, 0.218994140625, 0.36700439453125, 0.5150146484375, 0.66302490234375, 0.81103515625, 0.95904541015625, 1.1070556640625, 1.25506591796875, 1.403076171875, 1.55108642578125, 1.6990966796875, 1.84710693359375, 1.9951171875, 2.14312744140625, 2.2911376953125, 2.43914794921875, 2.587158203125, 2.73516845703125, 2.8831787109375, 3.03118896484375, 3.17919921875, 3.32720947265625, 3.4752197265625, 3.62322998046875, 3.771240234375, 3.91925048828125, 4.0672607421875, 4.21527099609375, 4.36328125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 11.0, 9.0, 14.0, 10.0, 24.0, 38.0, 71.0, 110.0, 177.0, 208.0, 121.0, 82.0, 43.0, 24.0, 20.0, 10.0, 8.0, 8.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-74.55690002441406, -72.44540405273438, -70.33390808105469, -68.222412109375, -66.11092376708984, -63.999427795410156, -61.88793182373047, -59.77643585205078, -57.664939880371094, -55.553443908691406, -53.441951751708984, -51.3304557800293, -49.21895980834961, -47.10746765136719, -44.9959716796875, -42.88447570800781, -40.77298355102539, -38.6614875793457, -36.54999542236328, -34.438499450683594, -32.327003479003906, -30.21550941467285, -28.104015350341797, -25.99251937866211, -23.881025314331055, -21.76953125, -19.658035278320312, -17.546541213989258, -15.435046195983887, -13.323551177978516, -11.212057113647461, -9.10056209564209, -6.989070892333984, -4.877575874328613, -2.7660813331604004, -0.6545867919921875, 1.4569082260131836, 3.5684032440185547, 5.679897308349609, 7.7913923263549805, 9.902887344360352, 12.014382362365723, 14.125877380371094, 16.23737144470215, 18.348865509033203, 20.46036148071289, 22.571855545043945, 24.683349609375, 26.794845581054688, 28.906339645385742, 31.01783561706543, 33.129329681396484, 35.24082565307617, 37.352317810058594, 39.46381378173828, 41.57530975341797, 43.686805725097656, 45.798301696777344, 47.909793853759766, 50.02128982543945, 52.13278579711914, 54.24427795410156, 56.35577392578125, 58.46726989746094, 60.57876205444336]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 6.0, 7.0, 7.0, 7.0, 13.0, 23.0, 18.0, 15.0, 25.0, 26.0, 31.0, 24.0, 33.0, 37.0, 56.0, 56.0, 72.0, 79.0, 69.0, 56.0, 50.0, 41.0, 30.0, 32.0, 31.0, 22.0, 17.0, 20.0, 13.0, 17.0, 10.0, 8.0, 10.0, 12.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.08452224731445, -49.30108642578125, -47.51764678955078, -45.73421096801758, -43.95077133178711, -42.167335510253906, -40.38389587402344, -38.600460052490234, -36.81702423095703, -35.03358840942383, -33.25014877319336, -31.466712951660156, -29.683273315429688, -27.899837493896484, -26.11639976501465, -24.332962036132812, -22.549522399902344, -20.766084671020508, -18.982646942138672, -17.19921112060547, -15.415772438049316, -13.63233470916748, -11.848897933959961, -10.065460205078125, -8.282022476196289, -6.498584747314453, -4.715147495269775, -2.9317102432250977, -1.1482725143432617, 0.6351652145385742, 2.4186019897460938, 4.20203971862793, 5.9854736328125, 7.768911361694336, 9.552349090576172, 11.335785865783691, 13.119223594665527, 14.902661323547363, 16.686098098754883, 18.46953582763672, 20.252973556518555, 22.03641128540039, 23.819849014282227, 25.603286743164062, 27.386722564697266, 29.170162200927734, 30.953598022460938, 32.737037658691406, 34.52047348022461, 36.30390930175781, 38.08734893798828, 39.870784759521484, 41.65422439575195, 43.437660217285156, 45.221099853515625, 47.00453567504883, 48.78797149658203, 50.571407318115234, 52.3548469543457, 54.138282775878906, 55.921722412109375, 57.70515823364258, 59.48859405517578, 61.27203369140625, 63.05547332763672]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 11.0, 7.0, 9.0, 13.0, 23.0, 33.0, 53.0, 119.0, 160.0, 283.0, 436.0, 805.0, 1475.0, 2803.0, 5720.0, 13293.0, 39378.0, 166501.0, 1129510.0, 2350532.0, 378638.0, 68483.0, 19872.0, 8005.0, 3601.0, 1868.0, 1048.0, 598.0, 331.0, 247.0, 132.0, 80.0, 66.0, 44.0, 34.0, 16.0, 14.0, 17.0, 9.0, 11.0, 7.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.90234375, -4.74530029296875, -4.5882568359375, -4.43121337890625, -4.274169921875, -4.11712646484375, -3.9600830078125, -3.80303955078125, -3.64599609375, -3.48895263671875, -3.3319091796875, -3.17486572265625, -3.017822265625, -2.86077880859375, -2.7037353515625, -2.54669189453125, -2.3896484375, -2.23260498046875, -2.0755615234375, -1.91851806640625, -1.761474609375, -1.60443115234375, -1.4473876953125, -1.29034423828125, -1.13330078125, -0.97625732421875, -0.8192138671875, -0.66217041015625, -0.505126953125, -0.34808349609375, -0.1910400390625, -0.03399658203125, 0.123046875, 0.28009033203125, 0.4371337890625, 0.59417724609375, 0.751220703125, 0.90826416015625, 1.0653076171875, 1.22235107421875, 1.37939453125, 1.53643798828125, 1.6934814453125, 1.85052490234375, 2.007568359375, 2.16461181640625, 2.3216552734375, 2.47869873046875, 2.6357421875, 2.79278564453125, 2.9498291015625, 3.10687255859375, 3.263916015625, 3.42095947265625, 3.5780029296875, 3.73504638671875, 3.89208984375, 4.04913330078125, 4.2061767578125, 4.36322021484375, 4.520263671875, 4.67730712890625, 4.8343505859375, 4.99139404296875, 5.1484375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 2.0, 5.0, 6.0, 7.0, 8.0, 9.0, 17.0, 16.0, 14.0, 18.0, 26.0, 24.0, 32.0, 25.0, 47.0, 36.0, 47.0, 40.0, 55.0, 44.0, 43.0, 48.0, 46.0, 35.0, 48.0, 40.0, 35.0, 29.0, 28.0, 27.0, 28.0, 21.0, 20.0, 9.0, 13.0, 7.0, 12.0, 8.0, 8.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.373046875, -3.267425537109375, -3.16180419921875, -3.056182861328125, -2.9505615234375, -2.844940185546875, -2.73931884765625, -2.633697509765625, -2.528076171875, -2.422454833984375, -2.31683349609375, -2.211212158203125, -2.1055908203125, -1.999969482421875, -1.89434814453125, -1.788726806640625, -1.68310546875, -1.577484130859375, -1.47186279296875, -1.366241455078125, -1.2606201171875, -1.154998779296875, -1.04937744140625, -0.943756103515625, -0.838134765625, -0.732513427734375, -0.62689208984375, -0.521270751953125, -0.4156494140625, -0.310028076171875, -0.20440673828125, -0.098785400390625, 0.0068359375, 0.112457275390625, 0.21807861328125, 0.323699951171875, 0.4293212890625, 0.534942626953125, 0.64056396484375, 0.746185302734375, 0.851806640625, 0.957427978515625, 1.06304931640625, 1.168670654296875, 1.2742919921875, 1.379913330078125, 1.48553466796875, 1.591156005859375, 1.69677734375, 1.802398681640625, 1.90802001953125, 2.013641357421875, 2.1192626953125, 2.224884033203125, 2.33050537109375, 2.436126708984375, 2.541748046875, 2.647369384765625, 2.75299072265625, 2.858612060546875, 2.9642333984375, 3.069854736328125, 3.17547607421875, 3.281097412109375, 3.38671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 3.0, 4.0, 13.0, 7.0, 11.0, 21.0, 36.0, 38.0, 66.0, 102.0, 147.0, 238.0, 439.0, 957.0, 2290.0, 6565.0, 23066.0, 145903.0, 3215582.0, 727118.0, 53050.0, 11853.0, 3793.0, 1369.0, 652.0, 350.0, 217.0, 119.0, 70.0, 66.0, 40.0, 26.0, 17.0, 15.0, 11.0, 11.0, 4.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.137451171875, -8.78271484375, -8.427978515625, -8.0732421875, -7.718505859375, -7.36376953125, -7.009033203125, -6.654296875, -6.299560546875, -5.94482421875, -5.590087890625, -5.2353515625, -4.880615234375, -4.52587890625, -4.171142578125, -3.81640625, -3.461669921875, -3.10693359375, -2.752197265625, -2.3974609375, -2.042724609375, -1.68798828125, -1.333251953125, -0.978515625, -0.623779296875, -0.26904296875, 0.085693359375, 0.4404296875, 0.795166015625, 1.14990234375, 1.504638671875, 1.859375, 2.214111328125, 2.56884765625, 2.923583984375, 3.2783203125, 3.633056640625, 3.98779296875, 4.342529296875, 4.697265625, 5.052001953125, 5.40673828125, 5.761474609375, 6.1162109375, 6.470947265625, 6.82568359375, 7.180419921875, 7.53515625, 7.889892578125, 8.24462890625, 8.599365234375, 8.9541015625, 9.308837890625, 9.66357421875, 10.018310546875, 10.373046875, 10.727783203125, 11.08251953125, 11.437255859375, 11.7919921875, 12.146728515625, 12.50146484375, 12.856201171875, 13.2109375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 6.0, 4.0, 5.0, 7.0, 12.0, 13.0, 16.0, 20.0, 26.0, 45.0, 66.0, 111.0, 218.0, 396.0, 774.0, 993.0, 596.0, 305.0, 181.0, 99.0, 61.0, 32.0, 19.0, 23.0, 11.0, 12.0, 6.0, 3.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9921875, -8.62109375, -8.25, -7.87890625, -7.5078125, -7.13671875, -6.765625, -6.39453125, -6.0234375, -5.65234375, -5.28125, -4.91015625, -4.5390625, -4.16796875, -3.796875, -3.42578125, -3.0546875, -2.68359375, -2.3125, -1.94140625, -1.5703125, -1.19921875, -0.828125, -0.45703125, -0.0859375, 0.28515625, 0.65625, 1.02734375, 1.3984375, 1.76953125, 2.140625, 2.51171875, 2.8828125, 3.25390625, 3.625, 3.99609375, 4.3671875, 4.73828125, 5.109375, 5.48046875, 5.8515625, 6.22265625, 6.59375, 6.96484375, 7.3359375, 7.70703125, 8.078125, 8.44921875, 8.8203125, 9.19140625, 9.5625, 9.93359375, 10.3046875, 10.67578125, 11.046875, 11.41796875, 11.7890625, 12.16015625, 12.53125, 12.90234375, 13.2734375, 13.64453125, 14.015625, 14.38671875, 14.7578125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 22.0, 40.0, 64.0, 159.0, 220.0, 229.0, 125.0, 69.0, 28.0, 15.0, 9.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.77438354492188, -60.941139221191406, -57.10789489746094, -53.2746467590332, -49.441402435302734, -45.608158111572266, -41.77490997314453, -37.94166564941406, -34.108421325683594, -30.275177001953125, -26.441930770874023, -22.608684539794922, -18.775440216064453, -14.942195892333984, -11.108949661254883, -7.275703430175781, -3.4424591064453125, 0.39078617095947266, 4.224031448364258, 8.057276725769043, 11.890522003173828, 15.723766326904297, 19.5570125579834, 23.3902587890625, 27.22350311279297, 31.056747436523438, 34.889991760253906, 38.72323989868164, 42.55648422241211, 46.38972854614258, 50.22297668457031, 54.05622100830078, 57.88946533203125, 61.72270965576172, 65.55595397949219, 69.38919830322266, 73.22244262695312, 77.05569458007812, 80.8889389038086, 84.72218322753906, 88.55542755126953, 92.388671875, 96.22191619873047, 100.05516052246094, 103.88841247558594, 107.72164916992188, 111.55490112304688, 115.38814544677734, 119.22138977050781, 123.05463409423828, 126.88787841796875, 130.72113037109375, 134.5543670654297, 138.3876190185547, 142.22085571289062, 146.05410766601562, 149.88735961914062, 153.72061157226562, 157.55384826660156, 161.38710021972656, 165.2203369140625, 169.0535888671875, 172.88682556152344, 176.72007751464844, 180.55331420898438]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 5.0, 3.0, 3.0, 12.0, 8.0, 13.0, 9.0, 22.0, 17.0, 19.0, 31.0, 38.0, 40.0, 39.0, 60.0, 51.0, 63.0, 53.0, 47.0, 45.0, 48.0, 51.0, 42.0, 47.0, 39.0, 37.0, 28.0, 23.0, 20.0, 15.0, 17.0, 9.0, 12.0, 8.0, 5.0, 5.0, 8.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.58546447753906, -46.099002838134766, -44.61254119873047, -43.12607955932617, -41.639617919921875, -40.15315246582031, -38.66669464111328, -37.18022918701172, -35.69376754760742, -34.207305908203125, -32.72084426879883, -31.23438262939453, -29.7479190826416, -28.261457443237305, -26.774995803833008, -25.288532257080078, -23.802072525024414, -22.315610885620117, -20.82914924621582, -19.34268569946289, -17.856224060058594, -16.369762420654297, -14.88330078125, -13.396838188171387, -11.91037654876709, -10.423914909362793, -8.93745231628418, -7.450990676879883, -5.964528560638428, -4.478066444396973, -2.991604804992676, -1.5051422119140625, -0.018680572509765625, 1.4677814245224, 2.9542434215545654, 4.440705299377441, 5.9271674156188965, 7.413629531860352, 8.900091171264648, 10.386553764343262, 11.873015403747559, 13.359477043151855, 14.845939636230469, 16.332401275634766, 17.818862915039062, 19.30532455444336, 20.791786193847656, 22.278249740600586, 23.764711380004883, 25.25117301940918, 26.737634658813477, 28.224098205566406, 29.710559844970703, 31.197021484375, 32.6834831237793, 34.169944763183594, 35.65640640258789, 37.14286804199219, 38.629329681396484, 40.11579132080078, 41.60225296020508, 43.088714599609375, 44.57518005371094, 46.061641693115234, 47.54810333251953]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 7.0, 6.0, 8.0, 10.0, 23.0, 27.0, 32.0, 51.0, 90.0, 108.0, 206.0, 308.0, 564.0, 989.0, 1824.0, 4082.0, 9730.0, 27538.0, 98788.0, 402162.0, 370864.0, 88969.0, 25266.0, 9024.0, 3768.0, 1808.0, 962.0, 543.0, 270.0, 185.0, 120.0, 73.0, 51.0, 24.0, 17.0, 20.0, 11.0, 9.0, 6.0, 5.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.58984375, -6.3836669921875, -6.177490234375, -5.9713134765625, -5.76513671875, -5.5589599609375, -5.352783203125, -5.1466064453125, -4.9404296875, -4.7342529296875, -4.528076171875, -4.3218994140625, -4.11572265625, -3.9095458984375, -3.703369140625, -3.4971923828125, -3.291015625, -3.0848388671875, -2.878662109375, -2.6724853515625, -2.46630859375, -2.2601318359375, -2.053955078125, -1.8477783203125, -1.6416015625, -1.4354248046875, -1.229248046875, -1.0230712890625, -0.81689453125, -0.6107177734375, -0.404541015625, -0.1983642578125, 0.0078125, 0.2139892578125, 0.420166015625, 0.6263427734375, 0.83251953125, 1.0386962890625, 1.244873046875, 1.4510498046875, 1.6572265625, 1.8634033203125, 2.069580078125, 2.2757568359375, 2.48193359375, 2.6881103515625, 2.894287109375, 3.1004638671875, 3.306640625, 3.5128173828125, 3.718994140625, 3.9251708984375, 4.13134765625, 4.3375244140625, 4.543701171875, 4.7498779296875, 4.9560546875, 5.1622314453125, 5.368408203125, 5.5745849609375, 5.78076171875, 5.9869384765625, 6.193115234375, 6.3992919921875, 6.60546875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 3.0, 7.0, 7.0, 8.0, 10.0, 5.0, 11.0, 20.0, 20.0, 14.0, 36.0, 29.0, 22.0, 38.0, 44.0, 23.0, 40.0, 42.0, 60.0, 47.0, 50.0, 45.0, 50.0, 39.0, 33.0, 34.0, 32.0, 40.0, 24.0, 18.0, 14.0, 24.0, 12.0, 18.0, 14.0, 13.0, 7.0, 8.0, 10.0, 4.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.53515625, -3.428253173828125, -3.32135009765625, -3.214447021484375, -3.1075439453125, -3.000640869140625, -2.89373779296875, -2.786834716796875, -2.679931640625, -2.573028564453125, -2.46612548828125, -2.359222412109375, -2.2523193359375, -2.145416259765625, -2.03851318359375, -1.931610107421875, -1.82470703125, -1.717803955078125, -1.61090087890625, -1.503997802734375, -1.3970947265625, -1.290191650390625, -1.18328857421875, -1.076385498046875, -0.969482421875, -0.862579345703125, -0.75567626953125, -0.648773193359375, -0.5418701171875, -0.434967041015625, -0.32806396484375, -0.221160888671875, -0.1142578125, -0.007354736328125, 0.09954833984375, 0.206451416015625, 0.3133544921875, 0.420257568359375, 0.52716064453125, 0.634063720703125, 0.740966796875, 0.847869873046875, 0.95477294921875, 1.061676025390625, 1.1685791015625, 1.275482177734375, 1.38238525390625, 1.489288330078125, 1.59619140625, 1.703094482421875, 1.80999755859375, 1.916900634765625, 2.0238037109375, 2.130706787109375, 2.23760986328125, 2.344512939453125, 2.451416015625, 2.558319091796875, 2.66522216796875, 2.772125244140625, 2.8790283203125, 2.985931396484375, 3.09283447265625, 3.199737548828125, 3.306640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 5.0, 9.0, 6.0, 15.0, 26.0, 38.0, 45.0, 49.0, 85.0, 135.0, 197.0, 386.0, 690.0, 1474.0, 4179.0, 14415.0, 82113.0, 714782.0, 191818.0, 27403.0, 6460.0, 2111.0, 883.0, 474.0, 266.0, 154.0, 119.0, 56.0, 45.0, 30.0, 21.0, 12.0, 15.0, 10.0, 5.0, 9.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.890625, -10.5938720703125, -10.297119140625, -10.0003662109375, -9.70361328125, -9.4068603515625, -9.110107421875, -8.8133544921875, -8.5166015625, -8.2198486328125, -7.923095703125, -7.6263427734375, -7.32958984375, -7.0328369140625, -6.736083984375, -6.4393310546875, -6.142578125, -5.8458251953125, -5.549072265625, -5.2523193359375, -4.95556640625, -4.6588134765625, -4.362060546875, -4.0653076171875, -3.7685546875, -3.4718017578125, -3.175048828125, -2.8782958984375, -2.58154296875, -2.2847900390625, -1.988037109375, -1.6912841796875, -1.39453125, -1.0977783203125, -0.801025390625, -0.5042724609375, -0.20751953125, 0.0892333984375, 0.385986328125, 0.6827392578125, 0.9794921875, 1.2762451171875, 1.572998046875, 1.8697509765625, 2.16650390625, 2.4632568359375, 2.760009765625, 3.0567626953125, 3.353515625, 3.6502685546875, 3.947021484375, 4.2437744140625, 4.54052734375, 4.8372802734375, 5.134033203125, 5.4307861328125, 5.7275390625, 6.0242919921875, 6.321044921875, 6.6177978515625, 6.91455078125, 7.2113037109375, 7.508056640625, 7.8048095703125, 8.1015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 0.0, 5.0, 7.0, 4.0, 6.0, 6.0, 12.0, 8.0, 14.0, 16.0, 16.0, 23.0, 20.0, 25.0, 42.0, 41.0, 49.0, 47.0, 49.0, 51.0, 59.0, 47.0, 55.0, 55.0, 45.0, 33.0, 37.0, 26.0, 32.0, 24.0, 26.0, 26.0, 21.0, 12.0, 9.0, 10.0, 9.0, 9.0, 4.0, 8.0, 6.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-15.8515625, -15.38720703125, -14.9228515625, -14.45849609375, -13.994140625, -13.52978515625, -13.0654296875, -12.60107421875, -12.13671875, -11.67236328125, -11.2080078125, -10.74365234375, -10.279296875, -9.81494140625, -9.3505859375, -8.88623046875, -8.421875, -7.95751953125, -7.4931640625, -7.02880859375, -6.564453125, -6.10009765625, -5.6357421875, -5.17138671875, -4.70703125, -4.24267578125, -3.7783203125, -3.31396484375, -2.849609375, -2.38525390625, -1.9208984375, -1.45654296875, -0.9921875, -0.52783203125, -0.0634765625, 0.40087890625, 0.865234375, 1.32958984375, 1.7939453125, 2.25830078125, 2.72265625, 3.18701171875, 3.6513671875, 4.11572265625, 4.580078125, 5.04443359375, 5.5087890625, 5.97314453125, 6.4375, 6.90185546875, 7.3662109375, 7.83056640625, 8.294921875, 8.75927734375, 9.2236328125, 9.68798828125, 10.15234375, 10.61669921875, 11.0810546875, 11.54541015625, 12.009765625, 12.47412109375, 12.9384765625, 13.40283203125, 13.8671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 14.0, 21.0, 19.0, 40.0, 55.0, 131.0, 205.0, 487.0, 1110.0, 3253.0, 10816.0, 49752.0, 674370.0, 263053.0, 33161.0, 7865.0, 2445.0, 962.0, 388.0, 179.0, 111.0, 51.0, 27.0, 17.0, 8.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.94921875, -4.7987060546875, -4.648193359375, -4.4976806640625, -4.34716796875, -4.1966552734375, -4.046142578125, -3.8956298828125, -3.7451171875, -3.5946044921875, -3.444091796875, -3.2935791015625, -3.14306640625, -2.9925537109375, -2.842041015625, -2.6915283203125, -2.541015625, -2.3905029296875, -2.239990234375, -2.0894775390625, -1.93896484375, -1.7884521484375, -1.637939453125, -1.4874267578125, -1.3369140625, -1.1864013671875, -1.035888671875, -0.8853759765625, -0.73486328125, -0.5843505859375, -0.433837890625, -0.2833251953125, -0.1328125, 0.0177001953125, 0.168212890625, 0.3187255859375, 0.46923828125, 0.6197509765625, 0.770263671875, 0.9207763671875, 1.0712890625, 1.2218017578125, 1.372314453125, 1.5228271484375, 1.67333984375, 1.8238525390625, 1.974365234375, 2.1248779296875, 2.275390625, 2.4259033203125, 2.576416015625, 2.7269287109375, 2.87744140625, 3.0279541015625, 3.178466796875, 3.3289794921875, 3.4794921875, 3.6300048828125, 3.780517578125, 3.9310302734375, 4.08154296875, 4.2320556640625, 4.382568359375, 4.5330810546875, 4.68359375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 5.0, 2.0, 3.0, 1.0, 6.0, 7.0, 10.0, 13.0, 12.0, 11.0, 26.0, 25.0, 35.0, 45.0, 69.0, 85.0, 128.0, 137.0, 101.0, 79.0, 58.0, 34.0, 28.0, 23.0, 17.0, 10.0, 5.0, 3.0, 4.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0010929107666015625, -0.0010617747902870178, -0.0010306388139724731, -0.0009995028376579285, -0.0009683668613433838, -0.0009372308850288391, -0.0009060949087142944, -0.0008749589323997498, -0.0008438229560852051, -0.0008126869797706604, -0.0007815510034561157, -0.000750415027141571, -0.0007192790508270264, -0.0006881430745124817, -0.000657007098197937, -0.0006258711218833923, -0.0005947351455688477, -0.000563599169254303, -0.0005324631929397583, -0.0005013272166252136, -0.00047019124031066895, -0.00043905526399612427, -0.0004079192876815796, -0.0003767833113670349, -0.00034564733505249023, -0.00031451135873794556, -0.0002833753824234009, -0.0002522394061088562, -0.00022110342979431152, -0.00018996745347976685, -0.00015883147716522217, -0.0001276955008506775, -9.655952453613281e-05, -6.542354822158813e-05, -3.428757190704346e-05, -3.1515955924987793e-06, 2.79843807220459e-05, 5.9120357036590576e-05, 9.025633335113525e-05, 0.00012139230966567993, 0.0001525282859802246, 0.0001836642622947693, 0.00021480023860931396, 0.00024593621492385864, 0.0002770721912384033, 0.000308208167552948, 0.0003393441438674927, 0.00037048012018203735, 0.00040161609649658203, 0.0004327520728111267, 0.0004638880491256714, 0.0004950240254402161, 0.0005261600017547607, 0.0005572959780693054, 0.0005884319543838501, 0.0006195679306983948, 0.0006507039070129395, 0.0006818398833274841, 0.0007129758596420288, 0.0007441118359565735, 0.0007752478122711182, 0.0008063837885856628, 0.0008375197649002075, 0.0008686557412147522, 0.0008997917175292969]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 10.0, 14.0, 23.0, 49.0, 64.0, 133.0, 310.0, 666.0, 1843.0, 6830.0, 35708.0, 586385.0, 373844.0, 33148.0, 6477.0, 1799.0, 681.0, 268.0, 143.0, 71.0, 42.0, 16.0, 12.0, 7.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.990234375, -3.816619873046875, -3.64300537109375, -3.469390869140625, -3.2957763671875, -3.122161865234375, -2.94854736328125, -2.774932861328125, -2.601318359375, -2.427703857421875, -2.25408935546875, -2.080474853515625, -1.9068603515625, -1.733245849609375, -1.55963134765625, -1.386016845703125, -1.21240234375, -1.038787841796875, -0.86517333984375, -0.691558837890625, -0.5179443359375, -0.344329833984375, -0.17071533203125, 0.002899169921875, 0.176513671875, 0.350128173828125, 0.52374267578125, 0.697357177734375, 0.8709716796875, 1.044586181640625, 1.21820068359375, 1.391815185546875, 1.5654296875, 1.739044189453125, 1.91265869140625, 2.086273193359375, 2.2598876953125, 2.433502197265625, 2.60711669921875, 2.780731201171875, 2.954345703125, 3.127960205078125, 3.30157470703125, 3.475189208984375, 3.6488037109375, 3.822418212890625, 3.99603271484375, 4.169647216796875, 4.34326171875, 4.516876220703125, 4.69049072265625, 4.864105224609375, 5.0377197265625, 5.211334228515625, 5.38494873046875, 5.558563232421875, 5.732177734375, 5.905792236328125, 6.07940673828125, 6.253021240234375, 6.4266357421875, 6.600250244140625, 6.77386474609375, 6.947479248046875, 7.12109375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 4.0, 6.0, 10.0, 6.0, 7.0, 13.0, 11.0, 18.0, 19.0, 35.0, 31.0, 62.0, 64.0, 94.0, 76.0, 93.0, 92.0, 67.0, 61.0, 40.0, 33.0, 32.0, 26.0, 13.0, 13.0, 13.0, 11.0, 13.0, 5.0, 4.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.068359375, -2.967742919921875, -2.86712646484375, -2.766510009765625, -2.6658935546875, -2.565277099609375, -2.46466064453125, -2.364044189453125, -2.263427734375, -2.162811279296875, -2.06219482421875, -1.961578369140625, -1.8609619140625, -1.760345458984375, -1.65972900390625, -1.559112548828125, -1.45849609375, -1.357879638671875, -1.25726318359375, -1.156646728515625, -1.0560302734375, -0.955413818359375, -0.85479736328125, -0.754180908203125, -0.653564453125, -0.552947998046875, -0.45233154296875, -0.351715087890625, -0.2510986328125, -0.150482177734375, -0.04986572265625, 0.050750732421875, 0.1513671875, 0.251983642578125, 0.35260009765625, 0.453216552734375, 0.5538330078125, 0.654449462890625, 0.75506591796875, 0.855682373046875, 0.956298828125, 1.056915283203125, 1.15753173828125, 1.258148193359375, 1.3587646484375, 1.459381103515625, 1.55999755859375, 1.660614013671875, 1.76123046875, 1.861846923828125, 1.96246337890625, 2.063079833984375, 2.1636962890625, 2.264312744140625, 2.36492919921875, 2.465545654296875, 2.566162109375, 2.666778564453125, 2.76739501953125, 2.868011474609375, 2.9686279296875, 3.069244384765625, 3.16986083984375, 3.270477294921875, 3.37109375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 6.0, 16.0, 32.0, 81.0, 137.0, 270.0, 208.0, 120.0, 53.0, 29.0, 14.0, 6.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.4241943359375, -65.56255340576172, -62.7009162902832, -59.83927536010742, -56.977638244628906, -54.115997314453125, -51.254356384277344, -48.39271545410156, -45.53107833862305, -42.669437408447266, -39.80780029296875, -36.94615936279297, -34.08451843261719, -31.222881317138672, -28.36124038696289, -25.499601364135742, -22.637962341308594, -19.776323318481445, -16.914684295654297, -14.053043365478516, -11.191404342651367, -8.329765319824219, -5.4681243896484375, -2.606485366821289, 0.2551536560058594, 3.116793155670166, 5.978432655334473, 8.840072631835938, 11.701711654663086, 14.563350677490234, 17.424991607666016, 20.286630630493164, 23.148277282714844, 26.009916305541992, 28.87155532836914, 31.733196258544922, 34.59483337402344, 37.45647430419922, 40.318115234375, 43.17975616455078, 46.0413932800293, 48.90303421020508, 51.764671325683594, 54.626312255859375, 57.487953186035156, 60.34959030151367, 63.21123123168945, 66.07286834716797, 68.93450927734375, 71.79615020751953, 74.65779113769531, 77.51942443847656, 80.38106536865234, 83.24270629882812, 86.1043472290039, 88.96598815917969, 91.82762145996094, 94.68926239013672, 97.5509033203125, 100.41253662109375, 103.27417755126953, 106.13581848144531, 108.9974594116211, 111.85910034179688, 114.72074127197266]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 6.0, 4.0, 3.0, 3.0, 5.0, 11.0, 19.0, 16.0, 22.0, 15.0, 30.0, 19.0, 29.0, 31.0, 35.0, 53.0, 62.0, 55.0, 100.0, 94.0, 70.0, 50.0, 43.0, 36.0, 22.0, 25.0, 18.0, 16.0, 20.0, 13.0, 18.0, 10.0, 9.0, 8.0, 13.0, 6.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.38625717163086, -56.482337951660156, -54.57841873168945, -52.67449951171875, -50.77057647705078, -48.866661071777344, -46.962738037109375, -45.05881881713867, -43.15489959716797, -41.250980377197266, -39.34706115722656, -37.44314193725586, -35.539222717285156, -33.63529968261719, -31.731380462646484, -29.82746124267578, -27.923542022705078, -26.019622802734375, -24.115703582763672, -22.211782455444336, -20.307863235473633, -18.40394401550293, -16.500022888183594, -14.59610366821289, -12.692184448242188, -10.788265228271484, -8.884345054626465, -6.9804253578186035, -5.076505661010742, -3.172586441040039, -1.2686662673950195, 0.63525390625, 2.5391769409179688, 4.44309663772583, 6.347016334533691, 8.250936508178711, 10.154855728149414, 12.058774948120117, 13.962695121765137, 15.866615295410156, 17.77053451538086, 19.674453735351562, 21.578372955322266, 23.4822940826416, 25.386213302612305, 27.290132522583008, 29.194053649902344, 31.097972869873047, 33.00189208984375, 34.90581130981445, 36.809730529785156, 38.71364974975586, 40.61756896972656, 42.52149200439453, 44.425411224365234, 46.32933044433594, 48.23324966430664, 50.137168884277344, 52.04108810424805, 53.94500732421875, 55.84893035888672, 57.752845764160156, 59.656768798828125, 61.56068801879883, 63.46460723876953]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 11.0, 17.0, 29.0, 30.0, 52.0, 71.0, 102.0, 148.0, 218.0, 373.0, 658.0, 1150.0, 2198.0, 4564.0, 10797.0, 32824.0, 140888.0, 967898.0, 2508791.0, 420708.0, 69131.0, 18907.0, 7270.0, 3260.0, 1595.0, 943.0, 574.0, 338.0, 243.0, 143.0, 116.0, 62.0, 46.0, 31.0, 23.0, 14.0, 12.0, 8.0, 3.0, 11.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.546875, -5.36376953125, -5.1806640625, -4.99755859375, -4.814453125, -4.63134765625, -4.4482421875, -4.26513671875, -4.08203125, -3.89892578125, -3.7158203125, -3.53271484375, -3.349609375, -3.16650390625, -2.9833984375, -2.80029296875, -2.6171875, -2.43408203125, -2.2509765625, -2.06787109375, -1.884765625, -1.70166015625, -1.5185546875, -1.33544921875, -1.15234375, -0.96923828125, -0.7861328125, -0.60302734375, -0.419921875, -0.23681640625, -0.0537109375, 0.12939453125, 0.3125, 0.49560546875, 0.6787109375, 0.86181640625, 1.044921875, 1.22802734375, 1.4111328125, 1.59423828125, 1.77734375, 1.96044921875, 2.1435546875, 2.32666015625, 2.509765625, 2.69287109375, 2.8759765625, 3.05908203125, 3.2421875, 3.42529296875, 3.6083984375, 3.79150390625, 3.974609375, 4.15771484375, 4.3408203125, 4.52392578125, 4.70703125, 4.89013671875, 5.0732421875, 5.25634765625, 5.439453125, 5.62255859375, 5.8056640625, 5.98876953125, 6.171875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 3.0, 6.0, 6.0, 10.0, 12.0, 12.0, 18.0, 15.0, 14.0, 22.0, 27.0, 35.0, 30.0, 30.0, 37.0, 42.0, 39.0, 48.0, 37.0, 44.0, 54.0, 47.0, 36.0, 46.0, 40.0, 40.0, 35.0, 30.0, 36.0, 24.0, 20.0, 13.0, 11.0, 13.0, 8.0, 12.0, 8.0, 9.0, 10.0, 7.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0], "bins": [-3.263671875, -3.16253662109375, -3.0614013671875, -2.96026611328125, -2.859130859375, -2.75799560546875, -2.6568603515625, -2.55572509765625, -2.45458984375, -2.35345458984375, -2.2523193359375, -2.15118408203125, -2.050048828125, -1.94891357421875, -1.8477783203125, -1.74664306640625, -1.6455078125, -1.54437255859375, -1.4432373046875, -1.34210205078125, -1.240966796875, -1.13983154296875, -1.0386962890625, -0.93756103515625, -0.83642578125, -0.73529052734375, -0.6341552734375, -0.53302001953125, -0.431884765625, -0.33074951171875, -0.2296142578125, -0.12847900390625, -0.02734375, 0.07379150390625, 0.1749267578125, 0.27606201171875, 0.377197265625, 0.47833251953125, 0.5794677734375, 0.68060302734375, 0.78173828125, 0.88287353515625, 0.9840087890625, 1.08514404296875, 1.186279296875, 1.28741455078125, 1.3885498046875, 1.48968505859375, 1.5908203125, 1.69195556640625, 1.7930908203125, 1.89422607421875, 1.995361328125, 2.09649658203125, 2.1976318359375, 2.29876708984375, 2.39990234375, 2.50103759765625, 2.6021728515625, 2.70330810546875, 2.804443359375, 2.90557861328125, 3.0067138671875, 3.10784912109375, 3.208984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 6.0, 9.0, 13.0, 19.0, 32.0, 60.0, 113.0, 206.0, 412.0, 936.0, 2745.0, 11631.0, 112355.0, 3621534.0, 413348.0, 23768.0, 4517.0, 1395.0, 541.0, 274.0, 141.0, 81.0, 55.0, 27.0, 14.0, 10.0, 12.0, 7.0, 2.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0234375, -10.5579833984375, -10.092529296875, -9.6270751953125, -9.16162109375, -8.6961669921875, -8.230712890625, -7.7652587890625, -7.2998046875, -6.8343505859375, -6.368896484375, -5.9034423828125, -5.43798828125, -4.9725341796875, -4.507080078125, -4.0416259765625, -3.576171875, -3.1107177734375, -2.645263671875, -2.1798095703125, -1.71435546875, -1.2489013671875, -0.783447265625, -0.3179931640625, 0.1474609375, 0.6129150390625, 1.078369140625, 1.5438232421875, 2.00927734375, 2.4747314453125, 2.940185546875, 3.4056396484375, 3.87109375, 4.3365478515625, 4.802001953125, 5.2674560546875, 5.73291015625, 6.1983642578125, 6.663818359375, 7.1292724609375, 7.5947265625, 8.0601806640625, 8.525634765625, 8.9910888671875, 9.45654296875, 9.9219970703125, 10.387451171875, 10.8529052734375, 11.318359375, 11.7838134765625, 12.249267578125, 12.7147216796875, 13.18017578125, 13.6456298828125, 14.111083984375, 14.5765380859375, 15.0419921875, 15.5074462890625, 15.972900390625, 16.4383544921875, 16.90380859375, 17.3692626953125, 17.834716796875, 18.3001708984375, 18.765625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 3.0, 5.0, 6.0, 10.0, 12.0, 17.0, 31.0, 45.0, 66.0, 94.0, 196.0, 324.0, 705.0, 993.0, 713.0, 360.0, 190.0, 101.0, 59.0, 48.0, 27.0, 19.0, 16.0, 10.0, 11.0, 7.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.078125, -9.68359375, -9.2890625, -8.89453125, -8.5, -8.10546875, -7.7109375, -7.31640625, -6.921875, -6.52734375, -6.1328125, -5.73828125, -5.34375, -4.94921875, -4.5546875, -4.16015625, -3.765625, -3.37109375, -2.9765625, -2.58203125, -2.1875, -1.79296875, -1.3984375, -1.00390625, -0.609375, -0.21484375, 0.1796875, 0.57421875, 0.96875, 1.36328125, 1.7578125, 2.15234375, 2.546875, 2.94140625, 3.3359375, 3.73046875, 4.125, 4.51953125, 4.9140625, 5.30859375, 5.703125, 6.09765625, 6.4921875, 6.88671875, 7.28125, 7.67578125, 8.0703125, 8.46484375, 8.859375, 9.25390625, 9.6484375, 10.04296875, 10.4375, 10.83203125, 11.2265625, 11.62109375, 12.015625, 12.41015625, 12.8046875, 13.19921875, 13.59375, 13.98828125, 14.3828125, 14.77734375, 15.171875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 5.0, 6.0, 13.0, 22.0, 43.0, 78.0, 116.0, 180.0, 177.0, 152.0, 76.0, 51.0, 29.0, 23.0, 6.0, 7.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-106.87898254394531, -104.06421661376953, -101.24945068359375, -98.43468475341797, -95.61991882324219, -92.80516052246094, -89.99039459228516, -87.17562866210938, -84.3608627319336, -81.54609680175781, -78.73133087158203, -75.91656494140625, -73.101806640625, -70.28704071044922, -67.47227478027344, -64.65750885009766, -61.842742919921875, -59.027976989746094, -56.21321105957031, -53.3984489440918, -50.583683013916016, -47.768917083740234, -44.95415496826172, -42.13938903808594, -39.324623107910156, -36.509857177734375, -33.695091247558594, -30.880329132080078, -28.065563201904297, -25.250797271728516, -22.436033248901367, -19.62126922607422, -16.80651092529297, -13.991745948791504, -11.176980972290039, -8.362215995788574, -5.547451019287109, -2.7326860427856445, 0.08207893371582031, 2.8968429565429688, 5.71160888671875, 8.526373863220215, 11.34113883972168, 14.155903816223145, 16.97066879272461, 19.78543472290039, 22.60019874572754, 25.414962768554688, 28.22972869873047, 31.04449462890625, 33.85926055908203, 36.67402267456055, 39.48878860473633, 42.30355453491211, 45.118316650390625, 47.933082580566406, 50.74784851074219, 53.56261444091797, 56.37738037109375, 59.192142486572266, 62.00690841674805, 64.82167053222656, 67.63643646240234, 70.45120239257812, 73.2659683227539]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 1.0, 4.0, 5.0, 8.0, 11.0, 13.0, 9.0, 18.0, 14.0, 16.0, 27.0, 29.0, 24.0, 28.0, 33.0, 34.0, 32.0, 35.0, 32.0, 42.0, 58.0, 54.0, 60.0, 52.0, 33.0, 38.0, 45.0, 34.0, 32.0, 22.0, 16.0, 22.0, 23.0, 12.0, 17.0, 13.0, 7.0, 12.0, 4.0, 7.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-42.382041931152344, -41.16856002807617, -39.955078125, -38.74159622192383, -37.528114318847656, -36.31463623046875, -35.10115432739258, -33.887672424316406, -32.674190521240234, -31.460708618164062, -30.24722671508789, -29.03374671936035, -27.82026481628418, -26.606782913208008, -25.39330291748047, -24.179821014404297, -22.966339111328125, -21.752857208251953, -20.53937530517578, -19.325895309448242, -18.11241340637207, -16.8989315032959, -15.685450553894043, -14.471969604492188, -13.258487701416016, -12.045005798339844, -10.831524848937988, -9.618043899536133, -8.404561996459961, -7.191080570220947, -5.977599143981934, -4.764118194580078, -3.550640106201172, -2.337158679962158, -1.1236772537231445, 0.08980417251586914, 1.3032855987548828, 2.5167670249938965, 3.73024845123291, 4.943729400634766, 6.1572113037109375, 7.370692729949951, 8.584174156188965, 9.79765510559082, 11.011137008666992, 12.224618911743164, 13.43809986114502, 14.651580810546875, 15.865062713623047, 17.07854461669922, 18.29202651977539, 19.50550651550293, 20.7189884185791, 21.932470321655273, 23.145950317382812, 24.359432220458984, 25.572914123535156, 26.786396026611328, 27.9998779296875, 29.21335792541504, 30.42683982849121, 31.640321731567383, 32.85380172729492, 34.067283630371094, 35.280765533447266]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 12.0, 17.0, 22.0, 38.0, 38.0, 48.0, 103.0, 152.0, 238.0, 372.0, 625.0, 1070.0, 1847.0, 3447.0, 6789.0, 13722.0, 30293.0, 74188.0, 207510.0, 392489.0, 190725.0, 69483.0, 28417.0, 13014.0, 6335.0, 3184.0, 1770.0, 963.0, 591.0, 372.0, 241.0, 155.0, 88.0, 57.0, 35.0, 27.0, 23.0, 17.0, 8.0, 15.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.6015625, -4.45050048828125, -4.2994384765625, -4.14837646484375, -3.997314453125, -3.84625244140625, -3.6951904296875, -3.54412841796875, -3.39306640625, -3.24200439453125, -3.0909423828125, -2.93988037109375, -2.788818359375, -2.63775634765625, -2.4866943359375, -2.33563232421875, -2.1845703125, -2.03350830078125, -1.8824462890625, -1.73138427734375, -1.580322265625, -1.42926025390625, -1.2781982421875, -1.12713623046875, -0.97607421875, -0.82501220703125, -0.6739501953125, -0.52288818359375, -0.371826171875, -0.22076416015625, -0.0697021484375, 0.08135986328125, 0.232421875, 0.38348388671875, 0.5345458984375, 0.68560791015625, 0.836669921875, 0.98773193359375, 1.1387939453125, 1.28985595703125, 1.44091796875, 1.59197998046875, 1.7430419921875, 1.89410400390625, 2.045166015625, 2.19622802734375, 2.3472900390625, 2.49835205078125, 2.6494140625, 2.80047607421875, 2.9515380859375, 3.10260009765625, 3.253662109375, 3.40472412109375, 3.5557861328125, 3.70684814453125, 3.85791015625, 4.00897216796875, 4.1600341796875, 4.31109619140625, 4.462158203125, 4.61322021484375, 4.7642822265625, 4.91534423828125, 5.06640625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 6.0, 11.0, 13.0, 16.0, 17.0, 26.0, 21.0, 26.0, 41.0, 32.0, 41.0, 54.0, 59.0, 62.0, 59.0, 57.0, 66.0, 60.0, 42.0, 37.0, 43.0, 29.0, 29.0, 25.0, 23.0, 24.0, 18.0, 21.0, 7.0, 12.0, 11.0, 2.0, 3.0, 8.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01953125, -3.87286376953125, -3.7261962890625, -3.57952880859375, -3.432861328125, -3.28619384765625, -3.1395263671875, -2.99285888671875, -2.84619140625, -2.69952392578125, -2.5528564453125, -2.40618896484375, -2.259521484375, -2.11285400390625, -1.9661865234375, -1.81951904296875, -1.6728515625, -1.52618408203125, -1.3795166015625, -1.23284912109375, -1.086181640625, -0.93951416015625, -0.7928466796875, -0.64617919921875, -0.49951171875, -0.35284423828125, -0.2061767578125, -0.05950927734375, 0.087158203125, 0.23382568359375, 0.3804931640625, 0.52716064453125, 0.673828125, 0.82049560546875, 0.9671630859375, 1.11383056640625, 1.260498046875, 1.40716552734375, 1.5538330078125, 1.70050048828125, 1.84716796875, 1.99383544921875, 2.1405029296875, 2.28717041015625, 2.433837890625, 2.58050537109375, 2.7271728515625, 2.87384033203125, 3.0205078125, 3.16717529296875, 3.3138427734375, 3.46051025390625, 3.607177734375, 3.75384521484375, 3.9005126953125, 4.04718017578125, 4.19384765625, 4.34051513671875, 4.4871826171875, 4.63385009765625, 4.780517578125, 4.92718505859375, 5.0738525390625, 5.22052001953125, 5.3671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 9.0, 12.0, 6.0, 21.0, 14.0, 35.0, 53.0, 74.0, 138.0, 183.0, 321.0, 695.0, 1610.0, 4811.0, 20986.0, 195718.0, 760233.0, 50436.0, 8539.0, 2554.0, 989.0, 459.0, 235.0, 147.0, 86.0, 72.0, 41.0, 25.0, 18.0, 10.0, 5.0, 5.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.25, -12.873779296875, -12.49755859375, -12.121337890625, -11.7451171875, -11.368896484375, -10.99267578125, -10.616455078125, -10.240234375, -9.864013671875, -9.48779296875, -9.111572265625, -8.7353515625, -8.359130859375, -7.98291015625, -7.606689453125, -7.23046875, -6.854248046875, -6.47802734375, -6.101806640625, -5.7255859375, -5.349365234375, -4.97314453125, -4.596923828125, -4.220703125, -3.844482421875, -3.46826171875, -3.092041015625, -2.7158203125, -2.339599609375, -1.96337890625, -1.587158203125, -1.2109375, -0.834716796875, -0.45849609375, -0.082275390625, 0.2939453125, 0.670166015625, 1.04638671875, 1.422607421875, 1.798828125, 2.175048828125, 2.55126953125, 2.927490234375, 3.3037109375, 3.679931640625, 4.05615234375, 4.432373046875, 4.80859375, 5.184814453125, 5.56103515625, 5.937255859375, 6.3134765625, 6.689697265625, 7.06591796875, 7.442138671875, 7.818359375, 8.194580078125, 8.57080078125, 8.947021484375, 9.3232421875, 9.699462890625, 10.07568359375, 10.451904296875, 10.828125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 7.0, 4.0, 11.0, 22.0, 10.0, 17.0, 28.0, 32.0, 25.0, 41.0, 42.0, 67.0, 57.0, 68.0, 62.0, 61.0, 76.0, 67.0, 58.0, 51.0, 41.0, 32.0, 32.0, 21.0, 16.0, 10.0, 8.0, 11.0, 9.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.421875, -16.82080078125, -16.2197265625, -15.61865234375, -15.017578125, -14.41650390625, -13.8154296875, -13.21435546875, -12.61328125, -12.01220703125, -11.4111328125, -10.81005859375, -10.208984375, -9.60791015625, -9.0068359375, -8.40576171875, -7.8046875, -7.20361328125, -6.6025390625, -6.00146484375, -5.400390625, -4.79931640625, -4.1982421875, -3.59716796875, -2.99609375, -2.39501953125, -1.7939453125, -1.19287109375, -0.591796875, 0.00927734375, 0.6103515625, 1.21142578125, 1.8125, 2.41357421875, 3.0146484375, 3.61572265625, 4.216796875, 4.81787109375, 5.4189453125, 6.02001953125, 6.62109375, 7.22216796875, 7.8232421875, 8.42431640625, 9.025390625, 9.62646484375, 10.2275390625, 10.82861328125, 11.4296875, 12.03076171875, 12.6318359375, 13.23291015625, 13.833984375, 14.43505859375, 15.0361328125, 15.63720703125, 16.23828125, 16.83935546875, 17.4404296875, 18.04150390625, 18.642578125, 19.24365234375, 19.8447265625, 20.44580078125, 21.046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 5.0, 5.0, 9.0, 7.0, 13.0, 20.0, 20.0, 22.0, 28.0, 46.0, 60.0, 85.0, 133.0, 215.0, 368.0, 566.0, 995.0, 2016.0, 4027.0, 9144.0, 24071.0, 78239.0, 624950.0, 219634.0, 52600.0, 17257.0, 6960.0, 3177.0, 1614.0, 883.0, 489.0, 292.0, 189.0, 132.0, 88.0, 60.0, 34.0, 22.0, 13.0, 20.0, 14.0, 12.0, 4.0, 8.0, 2.0, 2.0, 4.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.369140625, -2.29913330078125, -2.2291259765625, -2.15911865234375, -2.089111328125, -2.01910400390625, -1.9490966796875, -1.87908935546875, -1.80908203125, -1.73907470703125, -1.6690673828125, -1.59906005859375, -1.529052734375, -1.45904541015625, -1.3890380859375, -1.31903076171875, -1.2490234375, -1.17901611328125, -1.1090087890625, -1.03900146484375, -0.968994140625, -0.89898681640625, -0.8289794921875, -0.75897216796875, -0.68896484375, -0.61895751953125, -0.5489501953125, -0.47894287109375, -0.408935546875, -0.33892822265625, -0.2689208984375, -0.19891357421875, -0.12890625, -0.05889892578125, 0.0111083984375, 0.08111572265625, 0.151123046875, 0.22113037109375, 0.2911376953125, 0.36114501953125, 0.43115234375, 0.50115966796875, 0.5711669921875, 0.64117431640625, 0.711181640625, 0.78118896484375, 0.8511962890625, 0.92120361328125, 0.9912109375, 1.06121826171875, 1.1312255859375, 1.20123291015625, 1.271240234375, 1.34124755859375, 1.4112548828125, 1.48126220703125, 1.55126953125, 1.62127685546875, 1.6912841796875, 1.76129150390625, 1.831298828125, 1.90130615234375, 1.9713134765625, 2.04132080078125, 2.111328125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 1.0, 6.0, 3.0, 10.0, 7.0, 19.0, 22.0, 36.0, 38.0, 66.0, 93.0, 204.0, 162.0, 106.0, 68.0, 49.0, 29.0, 17.0, 15.0, 7.0, 11.0, 5.0, 8.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001312255859375, -0.0012736916542053223, -0.0012351274490356445, -0.0011965632438659668, -0.001157999038696289, -0.0011194348335266113, -0.0010808706283569336, -0.0010423064231872559, -0.0010037422180175781, -0.0009651780128479004, -0.0009266138076782227, -0.0008880496025085449, -0.0008494853973388672, -0.0008109211921691895, -0.0007723569869995117, -0.000733792781829834, -0.0006952285766601562, -0.0006566643714904785, -0.0006181001663208008, -0.000579535961151123, -0.0005409717559814453, -0.0005024075508117676, -0.00046384334564208984, -0.0004252791404724121, -0.0003867149353027344, -0.00034815073013305664, -0.0003095865249633789, -0.00027102231979370117, -0.00023245811462402344, -0.0001938939094543457, -0.00015532970428466797, -0.00011676549911499023, -7.82012939453125e-05, -3.9637088775634766e-05, -1.0728836059570312e-06, 3.74913215637207e-05, 7.605552673339844e-05, 0.00011461973190307617, 0.0001531839370727539, 0.00019174814224243164, 0.00023031234741210938, 0.0002688765525817871, 0.00030744075775146484, 0.0003460049629211426, 0.0003845691680908203, 0.00042313337326049805, 0.0004616975784301758, 0.0005002617835998535, 0.0005388259887695312, 0.000577390193939209, 0.0006159543991088867, 0.0006545186042785645, 0.0006930828094482422, 0.0007316470146179199, 0.0007702112197875977, 0.0008087754249572754, 0.0008473396301269531, 0.0008859038352966309, 0.0009244680404663086, 0.0009630322456359863, 0.001001596450805664, 0.0010401606559753418, 0.0010787248611450195, 0.0011172890663146973, 0.001155853271484375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 9.0, 8.0, 16.0, 9.0, 41.0, 59.0, 66.0, 120.0, 190.0, 290.0, 583.0, 1253.0, 2930.0, 8358.0, 28629.0, 126912.0, 724390.0, 114983.0, 26244.0, 7973.0, 2864.0, 1230.0, 626.0, 293.0, 184.0, 111.0, 63.0, 36.0, 28.0, 16.0, 13.0, 8.0, 8.0, 5.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.471099853515625, -2.37774658203125, -2.284393310546875, -2.1910400390625, -2.097686767578125, -2.00433349609375, -1.910980224609375, -1.817626953125, -1.724273681640625, -1.63092041015625, -1.537567138671875, -1.4442138671875, -1.350860595703125, -1.25750732421875, -1.164154052734375, -1.07080078125, -0.977447509765625, -0.88409423828125, -0.790740966796875, -0.6973876953125, -0.604034423828125, -0.51068115234375, -0.417327880859375, -0.323974609375, -0.230621337890625, -0.13726806640625, -0.043914794921875, 0.0494384765625, 0.142791748046875, 0.23614501953125, 0.329498291015625, 0.4228515625, 0.516204833984375, 0.60955810546875, 0.702911376953125, 0.7962646484375, 0.889617919921875, 0.98297119140625, 1.076324462890625, 1.169677734375, 1.263031005859375, 1.35638427734375, 1.449737548828125, 1.5430908203125, 1.636444091796875, 1.72979736328125, 1.823150634765625, 1.91650390625, 2.009857177734375, 2.10321044921875, 2.196563720703125, 2.2899169921875, 2.383270263671875, 2.47662353515625, 2.569976806640625, 2.663330078125, 2.756683349609375, 2.85003662109375, 2.943389892578125, 3.0367431640625, 3.130096435546875, 3.22344970703125, 3.316802978515625, 3.41015625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 3.0, 10.0, 9.0, 7.0, 7.0, 10.0, 13.0, 14.0, 17.0, 26.0, 34.0, 55.0, 59.0, 80.0, 103.0, 91.0, 106.0, 71.0, 48.0, 46.0, 39.0, 28.0, 26.0, 19.0, 14.0, 8.0, 11.0, 8.0, 8.0, 3.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.818359375, -2.733917236328125, -2.64947509765625, -2.565032958984375, -2.4805908203125, -2.396148681640625, -2.31170654296875, -2.227264404296875, -2.142822265625, -2.058380126953125, -1.97393798828125, -1.889495849609375, -1.8050537109375, -1.720611572265625, -1.63616943359375, -1.551727294921875, -1.46728515625, -1.382843017578125, -1.29840087890625, -1.213958740234375, -1.1295166015625, -1.045074462890625, -0.96063232421875, -0.876190185546875, -0.791748046875, -0.707305908203125, -0.62286376953125, -0.538421630859375, -0.4539794921875, -0.369537353515625, -0.28509521484375, -0.200653076171875, -0.1162109375, -0.031768798828125, 0.05267333984375, 0.137115478515625, 0.2215576171875, 0.305999755859375, 0.39044189453125, 0.474884033203125, 0.559326171875, 0.643768310546875, 0.72821044921875, 0.812652587890625, 0.8970947265625, 0.981536865234375, 1.06597900390625, 1.150421142578125, 1.23486328125, 1.319305419921875, 1.40374755859375, 1.488189697265625, 1.5726318359375, 1.657073974609375, 1.74151611328125, 1.825958251953125, 1.910400390625, 1.994842529296875, 2.07928466796875, 2.163726806640625, 2.2481689453125, 2.332611083984375, 2.41705322265625, 2.501495361328125, 2.5859375]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 10.0, 12.0, 35.0, 75.0, 168.0, 402.0, 166.0, 65.0, 29.0, 16.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-141.18927001953125, -137.6227569580078, -134.05624389648438, -130.48973083496094, -126.9232177734375, -123.35670471191406, -119.79019165039062, -116.22367858886719, -112.65716552734375, -109.09065246582031, -105.52413940429688, -101.95762634277344, -98.39111328125, -94.82460021972656, -91.25808715820312, -87.69157409667969, -84.12506103515625, -80.55854797363281, -76.99203491210938, -73.42552185058594, -69.8590087890625, -66.29249572753906, -62.725982666015625, -59.15946960449219, -55.59296417236328, -52.026451110839844, -48.459938049316406, -44.89342498779297, -41.32691192626953, -37.760398864746094, -34.193885803222656, -30.62737464904785, -27.06085968017578, -23.494346618652344, -19.927833557128906, -16.36132049560547, -12.794808387756348, -9.228296279907227, -5.661783218383789, -2.0952701568603516, 1.471242904663086, 5.037755966186523, 8.604269027709961, 12.170781135559082, 15.73729419708252, 19.30380630493164, 22.870319366455078, 26.436832427978516, 30.003345489501953, 33.56985855102539, 37.13637161254883, 40.702884674072266, 44.2693977355957, 47.835906982421875, 51.40242004394531, 54.96893310546875, 58.53544616699219, 62.101959228515625, 65.66847229003906, 69.2349853515625, 72.80149841308594, 76.36801147460938, 79.93452453613281, 83.50103759765625, 87.06755065917969]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 2.0, 7.0, 5.0, 6.0, 14.0, 7.0, 7.0, 17.0, 10.0, 16.0, 19.0, 17.0, 22.0, 28.0, 29.0, 40.0, 44.0, 69.0, 132.0, 104.0, 64.0, 43.0, 26.0, 37.0, 28.0, 37.0, 20.0, 23.0, 16.0, 19.0, 19.0, 13.0, 11.0, 9.0, 4.0, 9.0, 4.0, 7.0, 1.0, 5.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.071258544921875, -55.161033630371094, -53.25080871582031, -51.34058380126953, -49.43035888671875, -47.52013397216797, -45.60990524291992, -43.69968032836914, -41.78945541381836, -39.87923049926758, -37.9690055847168, -36.058780670166016, -34.14855194091797, -32.23832702636719, -30.328102111816406, -28.417877197265625, -26.507652282714844, -24.597427368164062, -22.68720245361328, -20.776975631713867, -18.866750717163086, -16.956525802612305, -15.046299934387207, -13.13607406616211, -11.225849151611328, -9.315624237060547, -7.405398368835449, -5.49517297744751, -3.5849475860595703, -1.674722671508789, 0.2355031967163086, 2.1457290649414062, 4.0559539794921875, 5.966179370880127, 7.876404762268066, 9.786630630493164, 11.696855545043945, 13.607080459594727, 15.517306327819824, 17.427532196044922, 19.337757110595703, 21.247982025146484, 23.158206939697266, 25.06843376159668, 26.97865867614746, 28.888883590698242, 30.799110412597656, 32.70933532714844, 34.61956024169922, 36.52978515625, 38.44001007080078, 40.35023498535156, 42.260459899902344, 44.170684814453125, 46.08091354370117, 47.99113845825195, 49.901363372802734, 51.811588287353516, 53.7218132019043, 55.63203811645508, 57.542266845703125, 59.452491760253906, 61.36271667480469, 63.27294158935547, 65.18316650390625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 18.0, 25.0, 19.0, 33.0, 64.0, 110.0, 149.0, 268.0, 485.0, 782.0, 1401.0, 2676.0, 5907.0, 13818.0, 39538.0, 156550.0, 815488.0, 2210508.0, 748045.0, 137986.0, 35983.0, 12688.0, 5569.0, 2633.0, 1377.0, 802.0, 496.0, 305.0, 182.0, 110.0, 86.0, 47.0, 39.0, 33.0, 12.0, 18.0, 16.0, 8.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6484375, -6.397216796875, -6.14599609375, -5.894775390625, -5.6435546875, -5.392333984375, -5.14111328125, -4.889892578125, -4.638671875, -4.387451171875, -4.13623046875, -3.885009765625, -3.6337890625, -3.382568359375, -3.13134765625, -2.880126953125, -2.62890625, -2.377685546875, -2.12646484375, -1.875244140625, -1.6240234375, -1.372802734375, -1.12158203125, -0.870361328125, -0.619140625, -0.367919921875, -0.11669921875, 0.134521484375, 0.3857421875, 0.636962890625, 0.88818359375, 1.139404296875, 1.390625, 1.641845703125, 1.89306640625, 2.144287109375, 2.3955078125, 2.646728515625, 2.89794921875, 3.149169921875, 3.400390625, 3.651611328125, 3.90283203125, 4.154052734375, 4.4052734375, 4.656494140625, 4.90771484375, 5.158935546875, 5.41015625, 5.661376953125, 5.91259765625, 6.163818359375, 6.4150390625, 6.666259765625, 6.91748046875, 7.168701171875, 7.419921875, 7.671142578125, 7.92236328125, 8.173583984375, 8.4248046875, 8.676025390625, 8.92724609375, 9.178466796875, 9.4296875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 7.0, 6.0, 5.0, 7.0, 13.0, 9.0, 16.0, 12.0, 15.0, 17.0, 27.0, 33.0, 24.0, 30.0, 45.0, 34.0, 36.0, 48.0, 41.0, 44.0, 47.0, 37.0, 39.0, 47.0, 36.0, 55.0, 41.0, 47.0, 29.0, 15.0, 19.0, 20.0, 20.0, 15.0, 7.0, 14.0, 6.0, 4.0, 5.0, 4.0, 5.0, 9.0, 8.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-3.646484375, -3.538848876953125, -3.43121337890625, -3.323577880859375, -3.2159423828125, -3.108306884765625, -3.00067138671875, -2.893035888671875, -2.785400390625, -2.677764892578125, -2.57012939453125, -2.462493896484375, -2.3548583984375, -2.247222900390625, -2.13958740234375, -2.031951904296875, -1.92431640625, -1.816680908203125, -1.70904541015625, -1.601409912109375, -1.4937744140625, -1.386138916015625, -1.27850341796875, -1.170867919921875, -1.063232421875, -0.955596923828125, -0.84796142578125, -0.740325927734375, -0.6326904296875, -0.525054931640625, -0.41741943359375, -0.309783935546875, -0.2021484375, -0.094512939453125, 0.01312255859375, 0.120758056640625, 0.2283935546875, 0.336029052734375, 0.44366455078125, 0.551300048828125, 0.658935546875, 0.766571044921875, 0.87420654296875, 0.981842041015625, 1.0894775390625, 1.197113037109375, 1.30474853515625, 1.412384033203125, 1.52001953125, 1.627655029296875, 1.73529052734375, 1.842926025390625, 1.9505615234375, 2.058197021484375, 2.16583251953125, 2.273468017578125, 2.381103515625, 2.488739013671875, 2.59637451171875, 2.704010009765625, 2.8116455078125, 2.919281005859375, 3.02691650390625, 3.134552001953125, 3.2421875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 9.0, 15.0, 16.0, 17.0, 30.0, 37.0, 66.0, 122.0, 172.0, 250.0, 480.0, 892.0, 2089.0, 6820.0, 40368.0, 2448093.0, 1647224.0, 36946.0, 6471.0, 2057.0, 889.0, 448.0, 287.0, 132.0, 100.0, 76.0, 48.0, 28.0, 26.0, 17.0, 10.0, 13.0, 8.0, 4.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.6875, -25.92431640625, -25.1611328125, -24.39794921875, -23.634765625, -22.87158203125, -22.1083984375, -21.34521484375, -20.58203125, -19.81884765625, -19.0556640625, -18.29248046875, -17.529296875, -16.76611328125, -16.0029296875, -15.23974609375, -14.4765625, -13.71337890625, -12.9501953125, -12.18701171875, -11.423828125, -10.66064453125, -9.8974609375, -9.13427734375, -8.37109375, -7.60791015625, -6.8447265625, -6.08154296875, -5.318359375, -4.55517578125, -3.7919921875, -3.02880859375, -2.265625, -1.50244140625, -0.7392578125, 0.02392578125, 0.787109375, 1.55029296875, 2.3134765625, 3.07666015625, 3.83984375, 4.60302734375, 5.3662109375, 6.12939453125, 6.892578125, 7.65576171875, 8.4189453125, 9.18212890625, 9.9453125, 10.70849609375, 11.4716796875, 12.23486328125, 12.998046875, 13.76123046875, 14.5244140625, 15.28759765625, 16.05078125, 16.81396484375, 17.5771484375, 18.34033203125, 19.103515625, 19.86669921875, 20.6298828125, 21.39306640625, 22.15625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 2.0, 5.0, 8.0, 17.0, 16.0, 21.0, 36.0, 30.0, 50.0, 75.0, 107.0, 139.0, 186.0, 259.0, 347.0, 416.0, 543.0, 466.0, 339.0, 248.0, 185.0, 139.0, 104.0, 72.0, 66.0, 44.0, 41.0, 29.0, 16.0, 22.0, 8.0, 9.0, 9.0, 2.0, 5.0, 2.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.234375, -13.8194580078125, -13.404541015625, -12.9896240234375, -12.57470703125, -12.1597900390625, -11.744873046875, -11.3299560546875, -10.9150390625, -10.5001220703125, -10.085205078125, -9.6702880859375, -9.25537109375, -8.8404541015625, -8.425537109375, -8.0106201171875, -7.595703125, -7.1807861328125, -6.765869140625, -6.3509521484375, -5.93603515625, -5.5211181640625, -5.106201171875, -4.6912841796875, -4.2763671875, -3.8614501953125, -3.446533203125, -3.0316162109375, -2.61669921875, -2.2017822265625, -1.786865234375, -1.3719482421875, -0.95703125, -0.5421142578125, -0.127197265625, 0.2877197265625, 0.70263671875, 1.1175537109375, 1.532470703125, 1.9473876953125, 2.3623046875, 2.7772216796875, 3.192138671875, 3.6070556640625, 4.02197265625, 4.4368896484375, 4.851806640625, 5.2667236328125, 5.681640625, 6.0965576171875, 6.511474609375, 6.9263916015625, 7.34130859375, 7.7562255859375, 8.171142578125, 8.5860595703125, 9.0009765625, 9.4158935546875, 9.830810546875, 10.2457275390625, 10.66064453125, 11.0755615234375, 11.490478515625, 11.9053955078125, 12.3203125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 8.0, 9.0, 15.0, 28.0, 52.0, 93.0, 167.0, 199.0, 152.0, 105.0, 64.0, 28.0, 23.0, 20.0, 5.0, 4.0, 6.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-206.316650390625, -200.34393310546875, -194.37123107910156, -188.39852905273438, -182.42581176757812, -176.45309448242188, -170.4803924560547, -164.5076904296875, -158.53497314453125, -152.562255859375, -146.5895538330078, -140.61685180664062, -134.64413452148438, -128.67141723632812, -122.69871520996094, -116.72600555419922, -110.7532958984375, -104.78058624267578, -98.80787658691406, -92.83516693115234, -86.86245727539062, -80.8897476196289, -74.91703796386719, -68.94432830810547, -62.97161865234375, -56.99890899658203, -51.02619934082031, -45.053489685058594, -39.080780029296875, -33.108070373535156, -27.135360717773438, -21.16265106201172, -15.189956665039062, -9.217247009277344, -3.244537353515625, 2.7281723022460938, 8.700881958007812, 14.673591613769531, 20.64630126953125, 26.61901092529297, 32.59172058105469, 38.564430236816406, 44.537139892578125, 50.509849548339844, 56.48255920410156, 62.45526885986328, 68.427978515625, 74.40068817138672, 80.37339782714844, 86.34610748291016, 92.31881713867188, 98.2915267944336, 104.26423645019531, 110.23694610595703, 116.20965576171875, 122.18236541748047, 128.1550750732422, 134.12777709960938, 140.10049438476562, 146.07321166992188, 152.04591369628906, 158.01861572265625, 163.9913330078125, 169.96405029296875, 175.93675231933594]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 9.0, 4.0, 3.0, 5.0, 5.0, 5.0, 9.0, 8.0, 14.0, 18.0, 20.0, 12.0, 15.0, 15.0, 21.0, 28.0, 19.0, 25.0, 30.0, 41.0, 34.0, 30.0, 46.0, 41.0, 40.0, 40.0, 40.0, 48.0, 43.0, 35.0, 38.0, 26.0, 27.0, 28.0, 27.0, 26.0, 17.0, 18.0, 9.0, 20.0, 5.0, 10.0, 5.0, 12.0, 10.0, 5.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-64.35797882080078, -62.348270416259766, -60.33856201171875, -58.328857421875, -56.319149017333984, -54.30944061279297, -52.29973602294922, -50.2900276184082, -48.28031921386719, -46.27061080932617, -44.260902404785156, -42.251197814941406, -40.24148941040039, -38.231781005859375, -36.222076416015625, -34.21236801147461, -32.202659606933594, -30.192951202392578, -28.183244705200195, -26.173538208007812, -24.163829803466797, -22.15412139892578, -20.1444149017334, -18.134708404541016, -16.125, -14.1152925491333, -12.105585098266602, -10.095877647399902, -8.086170196533203, -6.076462745666504, -4.066755294799805, -2.0570478439331055, -0.04734039306640625, 1.962367057800293, 3.972074508666992, 5.981781959533691, 7.991489410400391, 10.00119686126709, 12.010904312133789, 14.020611763000488, 16.030319213867188, 18.040027618408203, 20.049734115600586, 22.05944061279297, 24.069149017333984, 26.078857421875, 28.088563919067383, 30.098270416259766, 32.10797882080078, 34.1176872253418, 36.12739562988281, 38.13710021972656, 40.14680862426758, 42.156517028808594, 44.166221618652344, 46.17593002319336, 48.185638427734375, 50.19534683227539, 52.205055236816406, 54.214759826660156, 56.22446823120117, 58.23417663574219, 60.24388122558594, 62.25358963012695, 64.26329803466797]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 8.0, 6.0, 10.0, 12.0, 14.0, 17.0, 38.0, 41.0, 65.0, 112.0, 177.0, 321.0, 537.0, 890.0, 1736.0, 3850.0, 9379.0, 26839.0, 95551.0, 531062.0, 285152.0, 61350.0, 18374.0, 6895.0, 2899.0, 1385.0, 740.0, 411.0, 246.0, 154.0, 83.0, 62.0, 52.0, 26.0, 23.0, 21.0, 8.0, 6.0, 3.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.2578125, -9.0064697265625, -8.755126953125, -8.5037841796875, -8.25244140625, -8.0010986328125, -7.749755859375, -7.4984130859375, -7.2470703125, -6.9957275390625, -6.744384765625, -6.4930419921875, -6.24169921875, -5.9903564453125, -5.739013671875, -5.4876708984375, -5.236328125, -4.9849853515625, -4.733642578125, -4.4822998046875, -4.23095703125, -3.9796142578125, -3.728271484375, -3.4769287109375, -3.2255859375, -2.9742431640625, -2.722900390625, -2.4715576171875, -2.22021484375, -1.9688720703125, -1.717529296875, -1.4661865234375, -1.21484375, -0.9635009765625, -0.712158203125, -0.4608154296875, -0.20947265625, 0.0418701171875, 0.293212890625, 0.5445556640625, 0.7958984375, 1.0472412109375, 1.298583984375, 1.5499267578125, 1.80126953125, 2.0526123046875, 2.303955078125, 2.5552978515625, 2.806640625, 3.0579833984375, 3.309326171875, 3.5606689453125, 3.81201171875, 4.0633544921875, 4.314697265625, 4.5660400390625, 4.8173828125, 5.0687255859375, 5.320068359375, 5.5714111328125, 5.82275390625, 6.0740966796875, 6.325439453125, 6.5767822265625, 6.828125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 5.0, 12.0, 9.0, 7.0, 7.0, 9.0, 13.0, 27.0, 27.0, 31.0, 33.0, 44.0, 42.0, 39.0, 37.0, 51.0, 50.0, 39.0, 44.0, 47.0, 51.0, 37.0, 50.0, 42.0, 38.0, 31.0, 30.0, 27.0, 27.0, 19.0, 19.0, 5.0, 11.0, 11.0, 5.0, 1.0, 4.0, 9.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.09375, -5.9205322265625, -5.747314453125, -5.5740966796875, -5.40087890625, -5.2276611328125, -5.054443359375, -4.8812255859375, -4.7080078125, -4.5347900390625, -4.361572265625, -4.1883544921875, -4.01513671875, -3.8419189453125, -3.668701171875, -3.4954833984375, -3.322265625, -3.1490478515625, -2.975830078125, -2.8026123046875, -2.62939453125, -2.4561767578125, -2.282958984375, -2.1097412109375, -1.9365234375, -1.7633056640625, -1.590087890625, -1.4168701171875, -1.24365234375, -1.0704345703125, -0.897216796875, -0.7239990234375, -0.55078125, -0.3775634765625, -0.204345703125, -0.0311279296875, 0.14208984375, 0.3153076171875, 0.488525390625, 0.6617431640625, 0.8349609375, 1.0081787109375, 1.181396484375, 1.3546142578125, 1.52783203125, 1.7010498046875, 1.874267578125, 2.0474853515625, 2.220703125, 2.3939208984375, 2.567138671875, 2.7403564453125, 2.91357421875, 3.0867919921875, 3.260009765625, 3.4332275390625, 3.6064453125, 3.7796630859375, 3.952880859375, 4.1260986328125, 4.29931640625, 4.4725341796875, 4.645751953125, 4.8189697265625, 4.9921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 9.0, 6.0, 5.0, 7.0, 7.0, 18.0, 17.0, 21.0, 25.0, 48.0, 59.0, 84.0, 144.0, 207.0, 372.0, 698.0, 1637.0, 4725.0, 19012.0, 136925.0, 831930.0, 39712.0, 8088.0, 2461.0, 1019.0, 503.0, 275.0, 160.0, 116.0, 68.0, 49.0, 24.0, 32.0, 27.0, 15.0, 8.0, 18.0, 6.0, 4.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3359375, -8.992919921875, -8.64990234375, -8.306884765625, -7.9638671875, -7.620849609375, -7.27783203125, -6.934814453125, -6.591796875, -6.248779296875, -5.90576171875, -5.562744140625, -5.2197265625, -4.876708984375, -4.53369140625, -4.190673828125, -3.84765625, -3.504638671875, -3.16162109375, -2.818603515625, -2.4755859375, -2.132568359375, -1.78955078125, -1.446533203125, -1.103515625, -0.760498046875, -0.41748046875, -0.074462890625, 0.2685546875, 0.611572265625, 0.95458984375, 1.297607421875, 1.640625, 1.983642578125, 2.32666015625, 2.669677734375, 3.0126953125, 3.355712890625, 3.69873046875, 4.041748046875, 4.384765625, 4.727783203125, 5.07080078125, 5.413818359375, 5.7568359375, 6.099853515625, 6.44287109375, 6.785888671875, 7.12890625, 7.471923828125, 7.81494140625, 8.157958984375, 8.5009765625, 8.843994140625, 9.18701171875, 9.530029296875, 9.873046875, 10.216064453125, 10.55908203125, 10.902099609375, 11.2451171875, 11.588134765625, 11.93115234375, 12.274169921875, 12.6171875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 7.0, 6.0, 7.0, 18.0, 9.0, 9.0, 16.0, 20.0, 16.0, 17.0, 24.0, 22.0, 33.0, 38.0, 47.0, 37.0, 47.0, 70.0, 75.0, 72.0, 54.0, 55.0, 47.0, 24.0, 40.0, 33.0, 16.0, 21.0, 13.0, 16.0, 14.0, 10.0, 7.0, 10.0, 9.0, 9.0, 4.0, 3.0, 1.0, 3.0, 7.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0], "bins": [-20.84375, -20.240966796875, -19.63818359375, -19.035400390625, -18.4326171875, -17.829833984375, -17.22705078125, -16.624267578125, -16.021484375, -15.418701171875, -14.81591796875, -14.213134765625, -13.6103515625, -13.007568359375, -12.40478515625, -11.802001953125, -11.19921875, -10.596435546875, -9.99365234375, -9.390869140625, -8.7880859375, -8.185302734375, -7.58251953125, -6.979736328125, -6.376953125, -5.774169921875, -5.17138671875, -4.568603515625, -3.9658203125, -3.363037109375, -2.76025390625, -2.157470703125, -1.5546875, -0.951904296875, -0.34912109375, 0.253662109375, 0.8564453125, 1.459228515625, 2.06201171875, 2.664794921875, 3.267578125, 3.870361328125, 4.47314453125, 5.075927734375, 5.6787109375, 6.281494140625, 6.88427734375, 7.487060546875, 8.08984375, 8.692626953125, 9.29541015625, 9.898193359375, 10.5009765625, 11.103759765625, 11.70654296875, 12.309326171875, 12.912109375, 13.514892578125, 14.11767578125, 14.720458984375, 15.3232421875, 15.926025390625, 16.52880859375, 17.131591796875, 17.734375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 6.0, 12.0, 14.0, 23.0, 15.0, 26.0, 40.0, 56.0, 100.0, 134.0, 241.0, 420.0, 801.0, 1518.0, 3453.0, 9192.0, 30164.0, 159066.0, 766170.0, 53130.0, 14557.0, 5052.0, 2043.0, 991.0, 541.0, 280.0, 179.0, 119.0, 56.0, 42.0, 26.0, 28.0, 15.0, 5.0, 14.0, 9.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7900390625, -1.7344512939453125, -1.678863525390625, -1.6232757568359375, -1.56768798828125, -1.5121002197265625, -1.456512451171875, -1.4009246826171875, -1.3453369140625, -1.2897491455078125, -1.234161376953125, -1.1785736083984375, -1.12298583984375, -1.0673980712890625, -1.011810302734375, -0.9562225341796875, -0.900634765625, -0.8450469970703125, -0.789459228515625, -0.7338714599609375, -0.67828369140625, -0.6226959228515625, -0.567108154296875, -0.5115203857421875, -0.4559326171875, -0.4003448486328125, -0.344757080078125, -0.2891693115234375, -0.23358154296875, -0.1779937744140625, -0.122406005859375, -0.0668182373046875, -0.01123046875, 0.0443572998046875, 0.099945068359375, 0.1555328369140625, 0.21112060546875, 0.2667083740234375, 0.322296142578125, 0.3778839111328125, 0.4334716796875, 0.4890594482421875, 0.544647216796875, 0.6002349853515625, 0.65582275390625, 0.7114105224609375, 0.766998291015625, 0.8225860595703125, 0.878173828125, 0.9337615966796875, 0.989349365234375, 1.0449371337890625, 1.10052490234375, 1.1561126708984375, 1.211700439453125, 1.2672882080078125, 1.3228759765625, 1.3784637451171875, 1.434051513671875, 1.4896392822265625, 1.54522705078125, 1.6008148193359375, 1.656402587890625, 1.7119903564453125, 1.767578125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 6.0, 5.0, 6.0, 19.0, 8.0, 16.0, 16.0, 19.0, 22.0, 36.0, 49.0, 50.0, 65.0, 118.0, 113.0, 121.0, 92.0, 59.0, 40.0, 32.0, 22.0, 19.0, 15.0, 11.0, 7.0, 5.0, 7.0, 7.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006542205810546875, -0.0006352514028549194, -0.0006162822246551514, -0.0005973130464553833, -0.0005783438682556152, -0.0005593746900558472, -0.0005404055118560791, -0.000521436333656311, -0.000502467155456543, -0.0004834979772567749, -0.00046452879905700684, -0.00044555962085723877, -0.0004265904426574707, -0.00040762126445770264, -0.00038865208625793457, -0.0003696829080581665, -0.00035071372985839844, -0.00033174455165863037, -0.0003127753734588623, -0.00029380619525909424, -0.00027483701705932617, -0.0002558678388595581, -0.00023689866065979004, -0.00021792948246002197, -0.0001989603042602539, -0.00017999112606048584, -0.00016102194786071777, -0.0001420527696609497, -0.00012308359146118164, -0.00010411441326141357, -8.514523506164551e-05, -6.617605686187744e-05, -4.7206878662109375e-05, -2.823770046234131e-05, -9.268522262573242e-06, 9.700655937194824e-06, 2.866983413696289e-05, 4.763901233673096e-05, 6.660819053649902e-05, 8.557736873626709e-05, 0.00010454654693603516, 0.00012351572513580322, 0.0001424849033355713, 0.00016145408153533936, 0.00018042325973510742, 0.0001993924379348755, 0.00021836161613464355, 0.00023733079433441162, 0.0002562999725341797, 0.00027526915073394775, 0.0002942383289337158, 0.0003132075071334839, 0.00033217668533325195, 0.00035114586353302, 0.0003701150417327881, 0.00038908421993255615, 0.0004080533981323242, 0.0004270225763320923, 0.00044599175453186035, 0.0004649609327316284, 0.0004839301109313965, 0.0005028992891311646, 0.0005218684673309326, 0.0005408376455307007, 0.0005598068237304688]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 6.0, 10.0, 16.0, 24.0, 28.0, 48.0, 70.0, 128.0, 186.0, 307.0, 525.0, 1089.0, 2576.0, 8177.0, 44736.0, 893874.0, 79146.0, 11454.0, 3232.0, 1280.0, 693.0, 343.0, 213.0, 141.0, 76.0, 66.0, 37.0, 16.0, 23.0, 11.0, 8.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21484375, -3.09844970703125, -2.9820556640625, -2.86566162109375, -2.749267578125, -2.63287353515625, -2.5164794921875, -2.40008544921875, -2.28369140625, -2.16729736328125, -2.0509033203125, -1.93450927734375, -1.818115234375, -1.70172119140625, -1.5853271484375, -1.46893310546875, -1.3525390625, -1.23614501953125, -1.1197509765625, -1.00335693359375, -0.886962890625, -0.77056884765625, -0.6541748046875, -0.53778076171875, -0.42138671875, -0.30499267578125, -0.1885986328125, -0.07220458984375, 0.044189453125, 0.16058349609375, 0.2769775390625, 0.39337158203125, 0.509765625, 0.62615966796875, 0.7425537109375, 0.85894775390625, 0.975341796875, 1.09173583984375, 1.2081298828125, 1.32452392578125, 1.44091796875, 1.55731201171875, 1.6737060546875, 1.79010009765625, 1.906494140625, 2.02288818359375, 2.1392822265625, 2.25567626953125, 2.3720703125, 2.48846435546875, 2.6048583984375, 2.72125244140625, 2.837646484375, 2.95404052734375, 3.0704345703125, 3.18682861328125, 3.30322265625, 3.41961669921875, 3.5360107421875, 3.65240478515625, 3.768798828125, 3.88519287109375, 4.0015869140625, 4.11798095703125, 4.234375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 9.0, 8.0, 10.0, 9.0, 19.0, 21.0, 19.0, 24.0, 28.0, 57.0, 59.0, 52.0, 72.0, 76.0, 76.0, 67.0, 75.0, 56.0, 46.0, 34.0, 32.0, 24.0, 14.0, 11.0, 12.0, 8.0, 8.0, 5.0, 5.0, 8.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.568359375, -1.5146331787109375, -1.460906982421875, -1.4071807861328125, -1.35345458984375, -1.2997283935546875, -1.246002197265625, -1.1922760009765625, -1.1385498046875, -1.0848236083984375, -1.031097412109375, -0.9773712158203125, -0.92364501953125, -0.8699188232421875, -0.816192626953125, -0.7624664306640625, -0.708740234375, -0.6550140380859375, -0.601287841796875, -0.5475616455078125, -0.49383544921875, -0.4401092529296875, -0.386383056640625, -0.3326568603515625, -0.2789306640625, -0.2252044677734375, -0.171478271484375, -0.1177520751953125, -0.06402587890625, -0.0102996826171875, 0.043426513671875, 0.0971527099609375, 0.15087890625, 0.2046051025390625, 0.258331298828125, 0.3120574951171875, 0.36578369140625, 0.4195098876953125, 0.473236083984375, 0.5269622802734375, 0.5806884765625, 0.6344146728515625, 0.688140869140625, 0.7418670654296875, 0.79559326171875, 0.8493194580078125, 0.903045654296875, 0.9567718505859375, 1.010498046875, 1.0642242431640625, 1.117950439453125, 1.1716766357421875, 1.22540283203125, 1.2791290283203125, 1.332855224609375, 1.3865814208984375, 1.4403076171875, 1.4940338134765625, 1.547760009765625, 1.6014862060546875, 1.65521240234375, 1.7089385986328125, 1.762664794921875, 1.8163909912109375, 1.8701171875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 14.0, 25.0, 31.0, 48.0, 92.0, 348.0, 208.0, 81.0, 36.0, 28.0, 23.0, 14.0, 16.0, 8.0, 9.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.67078399658203, -41.213218688964844, -38.75564956665039, -36.2980842590332, -33.84051513671875, -31.382949829101562, -28.925384521484375, -26.467817306518555, -24.010250091552734, -21.552682876586914, -19.095115661621094, -16.637550354003906, -14.179983139038086, -11.722415924072266, -9.264849662780762, -6.807283401489258, -4.3497161865234375, -1.8921494483947754, 0.5654172897338867, 3.022984027862549, 5.480550765991211, 7.938117980957031, 10.395684242248535, 12.853250503540039, 15.31081771850586, 17.76838493347168, 20.2259521484375, 22.683517456054688, 25.141084671020508, 27.598651885986328, 30.056217193603516, 32.51378631591797, 34.97135925292969, 37.428924560546875, 39.88649368286133, 42.344058990478516, 44.80162811279297, 47.259193420410156, 49.716758728027344, 52.17432403564453, 54.631893157958984, 57.08945846557617, 59.547027587890625, 62.00459289550781, 64.462158203125, 66.91972351074219, 69.3772964477539, 71.8348617553711, 74.29242706298828, 76.74999237060547, 79.20755767822266, 81.66513061523438, 84.12269592285156, 86.58026123046875, 89.03782653808594, 91.49539184570312, 93.95295715332031, 96.4105224609375, 98.86808776855469, 101.3256607055664, 103.7832260131836, 106.24079132080078, 108.69835662841797, 111.15592193603516, 113.61349487304688]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 5.0, 12.0, 8.0, 14.0, 21.0, 17.0, 26.0, 23.0, 26.0, 27.0, 39.0, 68.0, 159.0, 149.0, 129.0, 64.0, 37.0, 23.0, 21.0, 16.0, 16.0, 11.0, 9.0, 16.0, 11.0, 5.0, 5.0, 6.0, 3.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.879539489746094, -57.83122634887695, -55.78291320800781, -53.73460388183594, -51.6862907409668, -49.637977600097656, -47.58966827392578, -45.54135513305664, -43.4930419921875, -41.44472885131836, -39.39641571044922, -37.348106384277344, -35.2997932434082, -33.25148010253906, -31.203168869018555, -29.154857635498047, -27.106544494628906, -25.058231353759766, -23.009920120239258, -20.96160888671875, -18.91329574584961, -16.86498260498047, -14.816671371459961, -12.768359184265137, -10.720046997070312, -8.671734809875488, -6.623422622680664, -4.57511043548584, -2.5267982482910156, -0.4784860610961914, 1.5698261260986328, 3.618138313293457, 5.66644287109375, 7.714755058288574, 9.763067245483398, 11.811379432678223, 13.859691619873047, 15.908003807067871, 17.956315994262695, 20.004627227783203, 22.052940368652344, 24.101253509521484, 26.149564743041992, 28.1978759765625, 30.24618911743164, 32.29450225830078, 34.342811584472656, 36.3911247253418, 38.43943786621094, 40.48775100708008, 42.53606414794922, 44.584373474121094, 46.632686614990234, 48.680999755859375, 50.72930908203125, 52.77762222290039, 54.82593536376953, 56.87424850463867, 58.92256164550781, 60.97087097167969, 63.01918411254883, 65.06749725341797, 67.11580657958984, 69.16412353515625, 71.21243286132812]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 8.0, 11.0, 16.0, 16.0, 9.0, 15.0, 31.0, 28.0, 28.0, 31.0, 25.0, 33.0, 45.0, 111.0, 152.0, 97.0, 56.0, 37.0, 27.0, 28.0, 25.0, 25.0, 19.0, 13.0, 14.0, 19.0, 12.0, 7.0, 9.0, 8.0, 8.0, 6.0, 7.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.08203125, -4.91546630859375, -4.7489013671875, -4.58233642578125, -4.415771484375, -4.24920654296875, -4.0826416015625, -3.91607666015625, -3.74951171875, -3.58294677734375, -3.4163818359375, -3.24981689453125, -3.083251953125, -2.91668701171875, -2.7501220703125, -2.58355712890625, -2.4169921875, -2.25042724609375, -2.0838623046875, -1.91729736328125, -1.750732421875, -1.58416748046875, -1.4176025390625, -1.25103759765625, -1.08447265625, -0.91790771484375, -0.7513427734375, -0.58477783203125, -0.418212890625, -0.25164794921875, -0.0850830078125, 0.08148193359375, 0.248046875, 0.41461181640625, 0.5811767578125, 0.74774169921875, 0.914306640625, 1.08087158203125, 1.2474365234375, 1.41400146484375, 1.58056640625, 1.74713134765625, 1.9136962890625, 2.08026123046875, 2.246826171875, 2.41339111328125, 2.5799560546875, 2.74652099609375, 2.9130859375, 3.07965087890625, 3.2462158203125, 3.41278076171875, 3.579345703125, 3.74591064453125, 3.9124755859375, 4.07904052734375, 4.24560546875, 4.41217041015625, 4.5787353515625, 4.74530029296875, 4.911865234375, 5.07843017578125, 5.2449951171875, 5.41156005859375, 5.578125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 7.0, 10.0, 12.0, 18.0, 20.0, 38.0, 49.0, 50.0, 130.0, 326.0, 1050.0, 5099.0, 276722.0, 8096722.0, 6156.0, 1365.0, 383.0, 160.0, 86.0, 65.0, 24.0, 21.0, 20.0, 8.0, 17.0, 12.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0], "bins": [-50.51854705810547, -48.71722412109375, -46.91590118408203, -45.11457824707031, -43.313255310058594, -41.511932373046875, -39.710609436035156, -37.90928649902344, -36.10796356201172, -34.306640625, -32.50531768798828, -30.703994750976562, -28.902671813964844, -27.101348876953125, -25.300025939941406, -23.498703002929688, -21.6973819732666, -19.896059036254883, -18.094736099243164, -16.293413162231445, -14.492090225219727, -12.690768241882324, -10.889445304870605, -9.088122367858887, -7.286799430847168, -5.485476493835449, -3.6841537952423096, -1.88283109664917, -0.08150815963745117, 1.7198143005371094, 3.521137237548828, 5.322460174560547, 7.123783111572266, 8.925106048583984, 10.726428985595703, 12.527751922607422, 14.32907485961914, 16.13039779663086, 17.931720733642578, 19.733043670654297, 21.534366607666016, 23.335689544677734, 25.137012481689453, 26.938335418701172, 28.73965835571289, 30.54098129272461, 32.34230422973633, 34.14362716674805, 35.9449462890625, 37.74626922607422, 39.54759216308594, 41.348915100097656, 43.150238037109375, 44.951560974121094, 46.75288391113281, 48.55420684814453, 50.35552978515625, 52.15685272216797, 53.95817565917969, 55.759498596191406, 57.560821533203125, 59.362144470214844, 61.16346740722656, 62.96479034423828, 64.76611328125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 1.0, 4.0, 1.0, 6.0, 4.0, 1.0, 5.0, 2.0, 3.0, 7.0, 5.0, 2.0, 6.0, 6.0, 4.0, 3.0, 6.0, 3.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-94.94087982177734, -92.66596221923828, -90.39105224609375, -88.11613464355469, -85.84122467041016, -83.5663070678711, -81.29139709472656, -79.0164794921875, -76.74156188964844, -74.46664428710938, -72.19173431396484, -69.91681671142578, -67.64190673828125, -65.36698913574219, -63.09207534790039, -60.817161560058594, -58.54225158691406, -56.267337799072266, -53.99242401123047, -51.71751022338867, -49.442596435546875, -47.16767883300781, -44.892765045166016, -42.61785125732422, -40.34293746948242, -38.068023681640625, -35.79310989379883, -33.51819610595703, -31.2432804107666, -28.968366622924805, -26.693450927734375, -24.418537139892578, -22.14361572265625, -19.868701934814453, -17.593788146972656, -15.318872451782227, -13.04395866394043, -10.769044876098633, -8.49413013458252, -6.219215393066406, -3.9443016052246094, -1.6693873405456543, 0.6055269241333008, 2.880441188812256, 5.155355453491211, 7.430269241333008, 9.705183982849121, 11.980098724365234, 14.255012512207031, 16.529926300048828, 18.804840087890625, 21.079755783081055, 23.35466957092285, 25.62958335876465, 27.904499053955078, 30.179412841796875, 32.45432662963867, 34.72924041748047, 37.004154205322266, 39.27906799316406, 41.553985595703125, 43.828895568847656, 46.10381317138672, 48.378726959228516, 50.65364074707031]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 9.0, 9.0, 5.0, 11.0, 11.0, 14.0, 6.0, 13.0, 17.0, 26.0, 25.0, 34.0, 43.0, 26.0, 36.0, 49.0, 47.0, 44.0, 56.0, 53.0, 62.0, 47.0, 43.0, 42.0, 36.0, 41.0, 35.0, 37.0, 28.0, 22.0, 21.0, 14.0, 10.0, 7.0, 6.0, 5.0, 4.0, 10.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7578125, -3.640594482421875, -3.52337646484375, -3.406158447265625, -3.2889404296875, -3.171722412109375, -3.05450439453125, -2.937286376953125, -2.820068359375, -2.702850341796875, -2.58563232421875, -2.468414306640625, -2.3511962890625, -2.233978271484375, -2.11676025390625, -1.999542236328125, -1.88232421875, -1.765106201171875, -1.64788818359375, -1.530670166015625, -1.4134521484375, -1.296234130859375, -1.17901611328125, -1.061798095703125, -0.944580078125, -0.827362060546875, -0.71014404296875, -0.592926025390625, -0.4757080078125, -0.358489990234375, -0.24127197265625, -0.124053955078125, -0.0068359375, 0.110382080078125, 0.22760009765625, 0.344818115234375, 0.4620361328125, 0.579254150390625, 0.69647216796875, 0.813690185546875, 0.930908203125, 1.048126220703125, 1.16534423828125, 1.282562255859375, 1.3997802734375, 1.516998291015625, 1.63421630859375, 1.751434326171875, 1.86865234375, 1.985870361328125, 2.10308837890625, 2.220306396484375, 2.3375244140625, 2.454742431640625, 2.57196044921875, 2.689178466796875, 2.806396484375, 2.923614501953125, 3.04083251953125, 3.158050537109375, 3.2752685546875, 3.392486572265625, 3.50970458984375, 3.626922607421875, 3.744140625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 6.0, 11.0, 8.0, 28.0, 33.0, 93.0, 171.0, 509.0, 1611.0, 9838.0, 111627.0, 349239.0, 44687.0, 4826.0, 982.0, 296.0, 133.0, 83.0, 40.0, 16.0, 12.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.3125, -72.5556640625, -69.798828125, -67.0419921875, -64.28515625, -61.5283203125, -58.771484375, -56.0146484375, -53.2578125, -50.5009765625, -47.744140625, -44.9873046875, -42.23046875, -39.4736328125, -36.716796875, -33.9599609375, -31.203125, -28.4462890625, -25.689453125, -22.9326171875, -20.17578125, -17.4189453125, -14.662109375, -11.9052734375, -9.1484375, -6.3916015625, -3.634765625, -0.8779296875, 1.87890625, 4.6357421875, 7.392578125, 10.1494140625, 12.90625, 15.6630859375, 18.419921875, 21.1767578125, 23.93359375, 26.6904296875, 29.447265625, 32.2041015625, 34.9609375, 37.7177734375, 40.474609375, 43.2314453125, 45.98828125, 48.7451171875, 51.501953125, 54.2587890625, 57.015625, 59.7724609375, 62.529296875, 65.2861328125, 68.04296875, 70.7998046875, 73.556640625, 76.3134765625, 79.0703125, 81.8271484375, 84.583984375, 87.3408203125, 90.09765625, 92.8544921875, 95.611328125, 98.3681640625, 101.125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 16.0, 14.0, 13.0, 14.0, 19.0, 29.0, 32.0, 39.0, 50.0, 41.0, 43.0, 57.0, 73.0, 57.0, 62.0, 61.0, 46.0, 48.0, 35.0, 40.0, 22.0, 31.0, 19.0, 19.0, 16.0, 19.0, 6.0, 11.0, 7.0, 5.0, 7.0, 5.0, 4.0, 7.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9375, -4.7747802734375, -4.612060546875, -4.4493408203125, -4.28662109375, -4.1239013671875, -3.961181640625, -3.7984619140625, -3.6357421875, -3.4730224609375, -3.310302734375, -3.1475830078125, -2.98486328125, -2.8221435546875, -2.659423828125, -2.4967041015625, -2.333984375, -2.1712646484375, -2.008544921875, -1.8458251953125, -1.68310546875, -1.5203857421875, -1.357666015625, -1.1949462890625, -1.0322265625, -0.8695068359375, -0.706787109375, -0.5440673828125, -0.38134765625, -0.2186279296875, -0.055908203125, 0.1068115234375, 0.26953125, 0.4322509765625, 0.594970703125, 0.7576904296875, 0.92041015625, 1.0831298828125, 1.245849609375, 1.4085693359375, 1.5712890625, 1.7340087890625, 1.896728515625, 2.0594482421875, 2.22216796875, 2.3848876953125, 2.547607421875, 2.7103271484375, 2.873046875, 3.0357666015625, 3.198486328125, 3.3612060546875, 3.52392578125, 3.6866455078125, 3.849365234375, 4.0120849609375, 4.1748046875, 4.3375244140625, 4.500244140625, 4.6629638671875, 4.82568359375, 4.9884033203125, 5.151123046875, 5.3138427734375, 5.4765625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 7.0, 6.0, 14.0, 31.0, 52.0, 86.0, 132.0, 69.0, 31.0, 11.0, 7.0, 5.0, 5.0, 7.0, 1.0, 3.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-57.08107376098633, -55.44074630737305, -53.800418853759766, -52.16009521484375, -50.51976776123047, -48.87944030761719, -47.239112854003906, -45.598785400390625, -43.958457946777344, -42.31813049316406, -40.67780303955078, -39.0374755859375, -37.397151947021484, -35.7568244934082, -34.11649703979492, -32.47616958618164, -30.835845947265625, -29.195518493652344, -27.555192947387695, -25.914865493774414, -24.274539947509766, -22.634212493896484, -20.993885040283203, -19.353557586669922, -17.713232040405273, -16.072904586791992, -14.432579040527344, -12.792251586914062, -11.151925086975098, -9.511598587036133, -7.871271133422852, -6.230944633483887, -4.590614318847656, -2.9502875804901123, -1.3099608421325684, 0.3303661346435547, 1.9706926345825195, 3.6110191345214844, 5.251346588134766, 6.8916730880737305, 8.531999588012695, 10.17232608795166, 11.812652587890625, 13.452980041503906, 15.093306541442871, 16.733633041381836, 18.373960494995117, 20.014286041259766, 21.654613494873047, 23.294940948486328, 24.935266494750977, 26.575593948364258, 28.215919494628906, 29.856246948242188, 31.49657440185547, 33.13690185546875, 34.77722930908203, 36.41755676269531, 38.057884216308594, 39.698211669921875, 41.33853530883789, 42.97886276245117, 44.61919021606445, 46.259517669677734, 47.89984130859375]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 7.0, 1.0, 3.0, 2.0, 1.0, 6.0, 5.0, 3.0, 4.0, 7.0, 2.0, 6.0, 15.0, 23.0, 31.0, 57.0, 86.0, 72.0, 57.0, 38.0, 18.0, 8.0, 8.0, 8.0, 4.0, 3.0, 4.0, 0.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-32.847557067871094, -31.865861892700195, -30.884166717529297, -29.9024715423584, -28.9207763671875, -27.93907928466797, -26.95738410949707, -25.975688934326172, -24.993993759155273, -24.012298583984375, -23.030603408813477, -22.048908233642578, -21.067211151123047, -20.08551788330078, -19.10382080078125, -18.12212562561035, -17.140430450439453, -16.158735275268555, -15.177040100097656, -14.195343971252441, -13.213648796081543, -12.231953620910645, -11.25025749206543, -10.268562316894531, -9.286867141723633, -8.305171966552734, -7.323476314544678, -6.341780662536621, -5.360085487365723, -4.378390312194824, -3.3966946601867676, -2.414999008178711, -1.4333057403564453, -0.4516103267669678, 0.5300850868225098, 1.5117805004119873, 2.493475914001465, 3.4751710891723633, 4.45686674118042, 5.438562393188477, 6.420257568359375, 7.401952743530273, 8.383647918701172, 9.365344047546387, 10.347039222717285, 11.328734397888184, 12.310430526733398, 13.292125701904297, 14.273820877075195, 15.255516052246094, 16.237211227416992, 17.21890640258789, 18.200603485107422, 19.182296752929688, 20.16399383544922, 21.145689010620117, 22.127384185791016, 23.109079360961914, 24.090774536132812, 25.07246971130371, 26.05416488647461, 27.03586196899414, 28.01755714416504, 28.999252319335938, 29.980947494506836]}, "eval/loss": 2.5400922298431396, "eval/wer": 1.315569218564062, "eval/runtime": 1264.1279, "eval/samples_per_second": 2.09, "eval/steps_per_second": 0.262} \ No newline at end of file +{"train/loss": 0.4394, "train/learning_rate": 6.143111638954869e-05, "train/epoch": 8.41, "train/global_step": 7500, "_runtime": 48387, "_timestamp": 1647642265, "_step": 7502, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 9.0, 30.0, 62.0, 130.0, 237.0, 283.0, 169.0, 61.0, 19.0, 10.0, 4.0], "bins": [-159.2660369873047, -156.52210998535156, -153.77818298339844, -151.03427124023438, -148.29034423828125, -145.54641723632812, -142.802490234375, -140.05856323242188, -137.31463623046875, -134.57070922851562, -131.8267822265625, -129.08285522460938, -126.33893585205078, -123.59501647949219, -120.85108947753906, -118.10716247558594, -115.36325073242188, -112.61932373046875, -109.87540435791016, -107.13147735595703, -104.3875503540039, -101.64363098144531, -98.89970397949219, -96.15577697753906, -93.41184997558594, -90.66792297363281, -87.92400360107422, -85.1800765991211, -82.43614959716797, -79.69223022460938, -76.94830322265625, -74.20437622070312, -71.46045684814453, -68.7165298461914, -65.97261047363281, -63.22868347167969, -60.48476028442383, -57.74083709716797, -54.996910095214844, -52.252986907958984, -49.50905990600586, -46.76513671875, -44.021209716796875, -41.277286529541016, -38.533363342285156, -35.78943634033203, -33.04551315307617, -30.301589965820312, -27.55766487121582, -24.813739776611328, -22.06981658935547, -19.325891494750977, -16.581966400146484, -13.838043212890625, -11.094118118286133, -8.350194931030273, -5.606269836425781, -2.8623454570770264, -0.11842107772827148, 2.6255035400390625, 5.369427680969238, 8.113351821899414, 10.857276916503906, 13.601200103759766, 16.345125198364258]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 9.0, 5.0, 12.0, 9.0, 9.0, 19.0, 19.0, 21.0, 13.0, 16.0, 25.0, 26.0, 28.0, 26.0, 29.0, 24.0, 45.0, 44.0, 28.0, 41.0, 43.0, 43.0, 50.0, 41.0, 41.0, 39.0, 37.0, 35.0, 35.0, 21.0, 25.0, 9.0, 16.0, 19.0, 8.0, 20.0, 12.0, 14.0, 5.0, 7.0, 6.0, 8.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 6.0], "bins": [-21.268795013427734, -20.66993522644043, -20.071075439453125, -19.47221565246582, -18.873355865478516, -18.274494171142578, -17.675636291503906, -17.07677459716797, -16.477914810180664, -15.87905502319336, -15.280195236206055, -14.68133544921875, -14.082474708557129, -13.483614921569824, -12.88475513458252, -12.285894393920898, -11.68703556060791, -11.088175773620605, -10.4893159866333, -9.89045524597168, -9.291595458984375, -8.69273567199707, -8.093875885009766, -7.495015621185303, -6.896155834197998, -6.297296047210693, -5.6984357833862305, -5.099575996398926, -4.500716209411621, -3.901855945587158, -3.3029961585998535, -2.7041358947753906, -2.105276107788086, -1.5064160823822021, -0.9075561761856079, -0.30869626998901367, 0.2901637554168701, 0.8890237808227539, 1.4878835678100586, 2.0867438316345215, 2.685603618621826, 3.28446364402771, 3.8833236694335938, 4.482183456420898, 5.081043243408203, 5.679903507232666, 6.278763294219971, 6.877623558044434, 7.476483345031738, 8.075343132019043, 8.674202919006348, 9.273063659667969, 9.871923446655273, 10.470783233642578, 11.069643020629883, 11.668502807617188, 12.267362594604492, 12.866222381591797, 13.465082168579102, 14.063941955566406, 14.662802696228027, 15.261662483215332, 15.860522270202637, 16.459383010864258, 17.058242797851562]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 2.0, 9.0, 9.0, 11.0, 22.0, 22.0, 25.0, 42.0, 30.0, 36.0, 44.0, 43.0, 41.0, 46.0, 66.0, 67.0, 53.0, 50.0, 68.0, 54.0, 41.0, 35.0, 42.0, 35.0, 25.0, 20.0, 17.0, 11.0, 16.0, 11.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.537109375, -2.459320068359375, -2.38153076171875, -2.303741455078125, -2.2259521484375, -2.148162841796875, -2.07037353515625, -1.992584228515625, -1.914794921875, -1.837005615234375, -1.75921630859375, -1.681427001953125, -1.6036376953125, -1.525848388671875, -1.44805908203125, -1.370269775390625, -1.29248046875, -1.214691162109375, -1.13690185546875, -1.059112548828125, -0.9813232421875, -0.903533935546875, -0.82574462890625, -0.747955322265625, -0.670166015625, -0.592376708984375, -0.51458740234375, -0.436798095703125, -0.3590087890625, -0.281219482421875, -0.20343017578125, -0.125640869140625, -0.0478515625, 0.029937744140625, 0.10772705078125, 0.185516357421875, 0.2633056640625, 0.341094970703125, 0.41888427734375, 0.496673583984375, 0.574462890625, 0.652252197265625, 0.73004150390625, 0.807830810546875, 0.8856201171875, 0.963409423828125, 1.04119873046875, 1.118988037109375, 1.19677734375, 1.274566650390625, 1.35235595703125, 1.430145263671875, 1.5079345703125, 1.585723876953125, 1.66351318359375, 1.741302490234375, 1.819091796875, 1.896881103515625, 1.97467041015625, 2.052459716796875, 2.1302490234375, 2.208038330078125, 2.28582763671875, 2.363616943359375, 2.44140625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 13.0, 6.0, 14.0, 22.0, 29.0, 71.0, 94.0, 132.0, 248.0, 448.0, 916.0, 2069.0, 6347.0, 39892.0, 729846.0, 3273839.0, 121758.0, 13017.0, 3073.0, 1131.0, 576.0, 311.0, 171.0, 84.0, 56.0, 45.0, 25.0, 17.0, 16.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.317626953125, -16.74462890625, -16.171630859375, -15.5986328125, -15.025634765625, -14.45263671875, -13.879638671875, -13.306640625, -12.733642578125, -12.16064453125, -11.587646484375, -11.0146484375, -10.441650390625, -9.86865234375, -9.295654296875, -8.72265625, -8.149658203125, -7.57666015625, -7.003662109375, -6.4306640625, -5.857666015625, -5.28466796875, -4.711669921875, -4.138671875, -3.565673828125, -2.99267578125, -2.419677734375, -1.8466796875, -1.273681640625, -0.70068359375, -0.127685546875, 0.4453125, 1.018310546875, 1.59130859375, 2.164306640625, 2.7373046875, 3.310302734375, 3.88330078125, 4.456298828125, 5.029296875, 5.602294921875, 6.17529296875, 6.748291015625, 7.3212890625, 7.894287109375, 8.46728515625, 9.040283203125, 9.61328125, 10.186279296875, 10.75927734375, 11.332275390625, 11.9052734375, 12.478271484375, 13.05126953125, 13.624267578125, 14.197265625, 14.770263671875, 15.34326171875, 15.916259765625, 16.4892578125, 17.062255859375, 17.63525390625, 18.208251953125, 18.78125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 7.0, 14.0, 19.0, 30.0, 34.0, 50.0, 68.0, 106.0, 122.0, 181.0, 224.0, 298.0, 356.0, 444.0, 448.0, 428.0, 307.0, 260.0, 187.0, 132.0, 98.0, 77.0, 56.0, 38.0, 24.0, 19.0, 9.0, 10.0, 9.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.12109375, -6.89910888671875, -6.6771240234375, -6.45513916015625, -6.233154296875, -6.01116943359375, -5.7891845703125, -5.56719970703125, -5.34521484375, -5.12322998046875, -4.9012451171875, -4.67926025390625, -4.457275390625, -4.23529052734375, -4.0133056640625, -3.79132080078125, -3.5693359375, -3.34735107421875, -3.1253662109375, -2.90338134765625, -2.681396484375, -2.45941162109375, -2.2374267578125, -2.01544189453125, -1.79345703125, -1.57147216796875, -1.3494873046875, -1.12750244140625, -0.905517578125, -0.68353271484375, -0.4615478515625, -0.23956298828125, -0.017578125, 0.20440673828125, 0.4263916015625, 0.64837646484375, 0.870361328125, 1.09234619140625, 1.3143310546875, 1.53631591796875, 1.75830078125, 1.98028564453125, 2.2022705078125, 2.42425537109375, 2.646240234375, 2.86822509765625, 3.0902099609375, 3.31219482421875, 3.5341796875, 3.75616455078125, 3.9781494140625, 4.20013427734375, 4.422119140625, 4.64410400390625, 4.8660888671875, 5.08807373046875, 5.31005859375, 5.53204345703125, 5.7540283203125, 5.97601318359375, 6.197998046875, 6.41998291015625, 6.6419677734375, 6.86395263671875, 7.0859375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 8.0, 8.0, 11.0, 7.0, 19.0, 17.0, 35.0, 55.0, 94.0, 170.0, 227.0, 432.0, 704.0, 1347.0, 3575.0, 15693.0, 109393.0, 1107807.0, 2621403.0, 287602.0, 34857.0, 6536.0, 2017.0, 929.0, 504.0, 329.0, 179.0, 104.0, 80.0, 37.0, 36.0, 16.0, 19.0, 15.0, 10.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.796875, -25.103759765625, -24.41064453125, -23.717529296875, -23.0244140625, -22.331298828125, -21.63818359375, -20.945068359375, -20.251953125, -19.558837890625, -18.86572265625, -18.172607421875, -17.4794921875, -16.786376953125, -16.09326171875, -15.400146484375, -14.70703125, -14.013916015625, -13.32080078125, -12.627685546875, -11.9345703125, -11.241455078125, -10.54833984375, -9.855224609375, -9.162109375, -8.468994140625, -7.77587890625, -7.082763671875, -6.3896484375, -5.696533203125, -5.00341796875, -4.310302734375, -3.6171875, -2.924072265625, -2.23095703125, -1.537841796875, -0.8447265625, -0.151611328125, 0.54150390625, 1.234619140625, 1.927734375, 2.620849609375, 3.31396484375, 4.007080078125, 4.7001953125, 5.393310546875, 6.08642578125, 6.779541015625, 7.47265625, 8.165771484375, 8.85888671875, 9.552001953125, 10.2451171875, 10.938232421875, 11.63134765625, 12.324462890625, 13.017578125, 13.710693359375, 14.40380859375, 15.096923828125, 15.7900390625, 16.483154296875, 17.17626953125, 17.869384765625, 18.5625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 19.0, 45.0, 95.0, 159.0, 208.0, 196.0, 137.0, 85.0, 40.0, 16.0, 8.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.099878311157227, -25.938156127929688, -23.77643394470215, -21.61471176147461, -19.45298957824707, -17.29126739501953, -15.129545211791992, -12.967823028564453, -10.806100845336914, -8.644378662109375, -6.482656478881836, -4.320934295654297, -2.159212112426758, 0.00251007080078125, 2.1642322540283203, 4.325954437255859, 6.487676620483398, 8.649398803710938, 10.811120986938477, 12.972843170166016, 15.134565353393555, 17.296287536621094, 19.458009719848633, 21.619731903076172, 23.78145408630371, 25.94317626953125, 28.10489845275879, 30.266620635986328, 32.4283447265625, 34.590065002441406, 36.75178527832031, 38.913509368896484, 41.075233459472656, 43.23695373535156, 45.398677825927734, 47.560401916503906, 49.72212219238281, 51.88384246826172, 54.04556655883789, 56.20729064941406, 58.36901092529297, 60.530731201171875, 62.69245529174805, 64.85417938232422, 67.01589965820312, 69.17761993408203, 71.33934020996094, 73.50106811523438, 75.66278839111328, 77.82450866699219, 79.98623657226562, 82.14795684814453, 84.30967712402344, 86.47139739990234, 88.63311767578125, 90.79484558105469, 92.9565658569336, 95.1182861328125, 97.28001403808594, 99.44173431396484, 101.60345458984375, 103.76517486572266, 105.92689514160156, 108.088623046875, 110.2503433227539]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 4.0, 11.0, 10.0, 13.0, 19.0, 12.0, 20.0, 21.0, 20.0, 23.0, 28.0, 28.0, 28.0, 37.0, 40.0, 43.0, 36.0, 45.0, 40.0, 39.0, 54.0, 51.0, 35.0, 30.0, 35.0, 33.0, 28.0, 21.0, 34.0, 22.0, 22.0, 21.0, 18.0, 7.0, 14.0, 9.0, 8.0, 7.0, 6.0, 7.0, 4.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.09615707397461, -22.380571365356445, -21.664987564086914, -20.94940185546875, -20.233816146850586, -19.518230438232422, -18.80264663696289, -18.087060928344727, -17.371475219726562, -16.6558895111084, -15.94030475616455, -15.224720001220703, -14.509134292602539, -13.793549537658691, -13.077964782714844, -12.36237907409668, -11.646795272827148, -10.9312105178833, -10.215624809265137, -9.500040054321289, -8.784454345703125, -8.068869590759277, -7.35328483581543, -6.637699604034424, -5.922114372253418, -5.206529140472412, -4.490943908691406, -3.7753591537475586, -3.0597739219665527, -2.344188690185547, -1.6286039352416992, -0.9130187034606934, -0.1974334716796875, 0.5181516408920288, 1.2337367534637451, 1.9493217468261719, 2.6649069786071777, 3.3804922103881836, 4.096076965332031, 4.811662197113037, 5.527247428894043, 6.242832660675049, 6.958417892456055, 7.674002647399902, 8.38958740234375, 9.105173110961914, 9.820757865905762, 10.53634262084961, 11.251928329467773, 11.967513084411621, 12.683098793029785, 13.398683547973633, 14.114269256591797, 14.829854011535645, 15.545438766479492, 16.261024475097656, 16.976608276367188, 17.69219398498535, 18.407777786254883, 19.123363494873047, 19.83894920349121, 20.554534912109375, 21.270118713378906, 21.98570442199707, 22.701290130615234]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 8.0, 7.0, 6.0, 11.0, 10.0, 16.0, 12.0, 21.0, 17.0, 27.0, 17.0, 28.0, 15.0, 26.0, 44.0, 48.0, 45.0, 49.0, 56.0, 41.0, 51.0, 43.0, 54.0, 46.0, 47.0, 48.0, 37.0, 16.0, 29.0, 17.0, 23.0, 24.0, 9.0, 20.0, 12.0, 6.0, 10.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.41015625, -2.3409423828125, -2.271728515625, -2.2025146484375, -2.13330078125, -2.0640869140625, -1.994873046875, -1.9256591796875, -1.8564453125, -1.7872314453125, -1.718017578125, -1.6488037109375, -1.57958984375, -1.5103759765625, -1.441162109375, -1.3719482421875, -1.302734375, -1.2335205078125, -1.164306640625, -1.0950927734375, -1.02587890625, -0.9566650390625, -0.887451171875, -0.8182373046875, -0.7490234375, -0.6798095703125, -0.610595703125, -0.5413818359375, -0.47216796875, -0.4029541015625, -0.333740234375, -0.2645263671875, -0.1953125, -0.1260986328125, -0.056884765625, 0.0123291015625, 0.08154296875, 0.1507568359375, 0.219970703125, 0.2891845703125, 0.3583984375, 0.4276123046875, 0.496826171875, 0.5660400390625, 0.63525390625, 0.7044677734375, 0.773681640625, 0.8428955078125, 0.912109375, 0.9813232421875, 1.050537109375, 1.1197509765625, 1.18896484375, 1.2581787109375, 1.327392578125, 1.3966064453125, 1.4658203125, 1.5350341796875, 1.604248046875, 1.6734619140625, 1.74267578125, 1.8118896484375, 1.881103515625, 1.9503173828125, 2.01953125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 3.0, 4.0, 6.0, 5.0, 9.0, 13.0, 23.0, 31.0, 40.0, 62.0, 125.0, 202.0, 333.0, 693.0, 1225.0, 2501.0, 4903.0, 8973.0, 16482.0, 29204.0, 48860.0, 76072.0, 107604.0, 136735.0, 153051.0, 140655.0, 113494.0, 81805.0, 53140.0, 32358.0, 18692.0, 10210.0, 5259.0, 2683.0, 1389.0, 738.0, 390.0, 219.0, 135.0, 81.0, 51.0, 26.0, 26.0, 13.0, 11.0, 9.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.923828125, -1.8682098388671875, -1.812591552734375, -1.7569732666015625, -1.70135498046875, -1.6457366943359375, -1.590118408203125, -1.5345001220703125, -1.4788818359375, -1.4232635498046875, -1.367645263671875, -1.3120269775390625, -1.25640869140625, -1.2007904052734375, -1.145172119140625, -1.0895538330078125, -1.033935546875, -0.9783172607421875, -0.922698974609375, -0.8670806884765625, -0.81146240234375, -0.7558441162109375, -0.700225830078125, -0.6446075439453125, -0.5889892578125, -0.5333709716796875, -0.477752685546875, -0.4221343994140625, -0.36651611328125, -0.3108978271484375, -0.255279541015625, -0.1996612548828125, -0.14404296875, -0.0884246826171875, -0.032806396484375, 0.0228118896484375, 0.07843017578125, 0.1340484619140625, 0.189666748046875, 0.2452850341796875, 0.3009033203125, 0.3565216064453125, 0.412139892578125, 0.4677581787109375, 0.52337646484375, 0.5789947509765625, 0.634613037109375, 0.6902313232421875, 0.745849609375, 0.8014678955078125, 0.857086181640625, 0.9127044677734375, 0.96832275390625, 1.0239410400390625, 1.079559326171875, 1.1351776123046875, 1.1907958984375, 1.2464141845703125, 1.302032470703125, 1.3576507568359375, 1.41326904296875, 1.4688873291015625, 1.524505615234375, 1.5801239013671875, 1.6357421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 2.0, 7.0, 9.0, 8.0, 8.0, 12.0, 15.0, 14.0, 19.0, 25.0, 20.0, 21.0, 31.0, 21.0, 23.0, 35.0, 26.0, 36.0, 39.0, 40.0, 46.0, 33.0, 1063.0, 50.0, 31.0, 43.0, 44.0, 44.0, 33.0, 24.0, 26.0, 24.0, 21.0, 28.0, 16.0, 13.0, 14.0, 15.0, 6.0, 7.0, 3.0, 8.0, 6.0, 5.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.732421875, -1.675811767578125, -1.61920166015625, -1.562591552734375, -1.5059814453125, -1.449371337890625, -1.39276123046875, -1.336151123046875, -1.279541015625, -1.222930908203125, -1.16632080078125, -1.109710693359375, -1.0531005859375, -0.996490478515625, -0.93988037109375, -0.883270263671875, -0.82666015625, -0.770050048828125, -0.71343994140625, -0.656829833984375, -0.6002197265625, -0.543609619140625, -0.48699951171875, -0.430389404296875, -0.373779296875, -0.317169189453125, -0.26055908203125, -0.203948974609375, -0.1473388671875, -0.090728759765625, -0.03411865234375, 0.022491455078125, 0.0791015625, 0.135711669921875, 0.19232177734375, 0.248931884765625, 0.3055419921875, 0.362152099609375, 0.41876220703125, 0.475372314453125, 0.531982421875, 0.588592529296875, 0.64520263671875, 0.701812744140625, 0.7584228515625, 0.815032958984375, 0.87164306640625, 0.928253173828125, 0.98486328125, 1.041473388671875, 1.09808349609375, 1.154693603515625, 1.2113037109375, 1.267913818359375, 1.32452392578125, 1.381134033203125, 1.437744140625, 1.494354248046875, 1.55096435546875, 1.607574462890625, 1.6641845703125, 1.720794677734375, 1.77740478515625, 1.834014892578125, 1.890625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 6.0, 6.0, 8.0, 11.0, 17.0, 28.0, 25.0, 49.0, 87.0, 99.0, 151.0, 191.0, 286.0, 389.0, 557.0, 811.0, 1056.0, 1452.0, 2023.0, 2828.0, 3741.0, 5196.0, 7243.0, 10113.0, 14931.0, 23531.0, 46780.0, 253263.0, 1512488.0, 110122.0, 34351.0, 19818.0, 12886.0, 9095.0, 6554.0, 4637.0, 3454.0, 2504.0, 1788.0, 1298.0, 896.0, 646.0, 504.0, 365.0, 274.0, 165.0, 114.0, 84.0, 80.0, 45.0, 25.0, 23.0, 18.0, 9.0, 5.0, 8.0, 7.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.9130859375, -1.85198974609375, -1.7908935546875, -1.72979736328125, -1.668701171875, -1.60760498046875, -1.5465087890625, -1.48541259765625, -1.42431640625, -1.36322021484375, -1.3021240234375, -1.24102783203125, -1.179931640625, -1.11883544921875, -1.0577392578125, -0.99664306640625, -0.935546875, -0.87445068359375, -0.8133544921875, -0.75225830078125, -0.691162109375, -0.63006591796875, -0.5689697265625, -0.50787353515625, -0.44677734375, -0.38568115234375, -0.3245849609375, -0.26348876953125, -0.202392578125, -0.14129638671875, -0.0802001953125, -0.01910400390625, 0.0419921875, 0.10308837890625, 0.1641845703125, 0.22528076171875, 0.286376953125, 0.34747314453125, 0.4085693359375, 0.46966552734375, 0.53076171875, 0.59185791015625, 0.6529541015625, 0.71405029296875, 0.775146484375, 0.83624267578125, 0.8973388671875, 0.95843505859375, 1.01953125, 1.08062744140625, 1.1417236328125, 1.20281982421875, 1.263916015625, 1.32501220703125, 1.3861083984375, 1.44720458984375, 1.50830078125, 1.56939697265625, 1.6304931640625, 1.69158935546875, 1.752685546875, 1.81378173828125, 1.8748779296875, 1.93597412109375, 1.9970703125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 5.0, 12.0, 11.0, 18.0, 15.0, 17.0, 28.0, 26.0, 27.0, 28.0, 31.0, 38.0, 37.0, 40.0, 34.0, 33.0, 40.0, 47.0, 40.0, 44.0, 39.0, 34.0, 34.0, 39.0, 44.0, 32.0, 32.0, 31.0, 27.0, 21.0, 16.0, 21.0, 18.0, 7.0, 13.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37451171875, -0.3619346618652344, -0.34935760498046875, -0.3367805480957031, -0.3242034912109375, -0.3116264343261719, -0.29904937744140625, -0.2864723205566406, -0.273895263671875, -0.2613182067871094, -0.24874114990234375, -0.23616409301757812, -0.2235870361328125, -0.21100997924804688, -0.19843292236328125, -0.18585586547851562, -0.17327880859375, -0.16070175170898438, -0.14812469482421875, -0.13554763793945312, -0.1229705810546875, -0.11039352416992188, -0.09781646728515625, -0.08523941040039062, -0.072662353515625, -0.060085296630859375, -0.04750823974609375, -0.034931182861328125, -0.0223541259765625, -0.009777069091796875, 0.00279998779296875, 0.015377044677734375, 0.0279541015625, 0.040531158447265625, 0.05310821533203125, 0.06568527221679688, 0.0782623291015625, 0.09083938598632812, 0.10341644287109375, 0.11599349975585938, 0.128570556640625, 0.14114761352539062, 0.15372467041015625, 0.16630172729492188, 0.1788787841796875, 0.19145584106445312, 0.20403289794921875, 0.21660995483398438, 0.22918701171875, 0.24176406860351562, 0.25434112548828125, 0.2669181823730469, 0.2794952392578125, 0.2920722961425781, 0.30464935302734375, 0.3172264099121094, 0.329803466796875, 0.3423805236816406, 0.35495758056640625, 0.3675346374511719, 0.3801116943359375, 0.3926887512207031, 0.40526580810546875, 0.4178428649902344, 0.430419921875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 14.0, 8.0, 15.0, 12.0, 30.0, 34.0, 47.0, 47.0, 70.0, 75.0, 93.0, 102.0, 123.0, 177.0, 229.0, 234.0, 360.0, 511.0, 4894.0, 778812.0, 258842.0, 1708.0, 471.0, 325.0, 245.0, 210.0, 158.0, 130.0, 116.0, 92.0, 78.0, 69.0, 53.0, 35.0, 31.0, 31.0, 25.0, 11.0, 5.0, 6.0, 4.0, 4.0, 6.0, 6.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.8671875, -5.67071533203125, -5.4742431640625, -5.27777099609375, -5.081298828125, -4.88482666015625, -4.6883544921875, -4.49188232421875, -4.29541015625, -4.09893798828125, -3.9024658203125, -3.70599365234375, -3.509521484375, -3.31304931640625, -3.1165771484375, -2.92010498046875, -2.7236328125, -2.52716064453125, -2.3306884765625, -2.13421630859375, -1.937744140625, -1.74127197265625, -1.5447998046875, -1.34832763671875, -1.15185546875, -0.95538330078125, -0.7589111328125, -0.56243896484375, -0.365966796875, -0.16949462890625, 0.0269775390625, 0.22344970703125, 0.419921875, 0.61639404296875, 0.8128662109375, 1.00933837890625, 1.205810546875, 1.40228271484375, 1.5987548828125, 1.79522705078125, 1.99169921875, 2.18817138671875, 2.3846435546875, 2.58111572265625, 2.777587890625, 2.97406005859375, 3.1705322265625, 3.36700439453125, 3.5634765625, 3.75994873046875, 3.9564208984375, 4.15289306640625, 4.349365234375, 4.54583740234375, 4.7423095703125, 4.93878173828125, 5.13525390625, 5.33172607421875, 5.5281982421875, 5.72467041015625, 5.921142578125, 6.11761474609375, 6.3140869140625, 6.51055908203125, 6.70703125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 22.0, 45.0, 115.0, 290.0, 330.0, 133.0, 45.0, 13.0, 7.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.287353038787842, -7.007768630981445, -6.728184700012207, -6.4486002922058105, -6.169015884399414, -5.889431476593018, -5.609847068786621, -5.330263137817383, -5.050678730010986, -4.77109432220459, -4.491510391235352, -4.211925983428955, -3.9323415756225586, -3.652757167816162, -3.3731729984283447, -3.0935888290405273, -2.814004421234131, -2.5344200134277344, -2.254835844039917, -1.97525155544281, -1.6956672668457031, -1.4160829782485962, -1.1364986896514893, -0.8569144010543823, -0.5773301124572754, -0.29774582386016846, -0.018161535263061523, 0.2614227533340454, 0.5410070419311523, 0.8205913305282593, 1.1001756191253662, 1.3797599077224731, 1.6593437194824219, 1.9389280080795288, 2.2185122966766357, 2.498096466064453, 2.7776808738708496, 3.057265281677246, 3.3368494510650635, 3.616433620452881, 3.8960180282592773, 4.175602436065674, 4.45518684387207, 4.734770774841309, 5.014355182647705, 5.293939590454102, 5.57352352142334, 5.853107929229736, 6.132692337036133, 6.412276744842529, 6.691861152648926, 6.971445083618164, 7.2510294914245605, 7.530613899230957, 7.810197830200195, 8.08978271484375, 8.369366645812988, 8.648950576782227, 8.928535461425781, 9.20811939239502, 9.487703323364258, 9.767288208007812, 10.04687213897705, 10.326457023620605, 10.606040954589844]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 5.0, 8.0, 13.0, 20.0, 13.0, 26.0, 18.0, 24.0, 25.0, 30.0, 36.0, 43.0, 46.0, 51.0, 49.0, 49.0, 47.0, 53.0, 43.0, 50.0, 49.0, 36.0, 49.0, 28.0, 31.0, 35.0, 19.0, 22.0, 16.0, 11.0, 10.0, 10.0, 6.0, 5.0, 6.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.750164985656738, -4.592185020446777, -4.434205055236816, -4.276225566864014, -4.118245601654053, -3.960265636444092, -3.802285671234131, -3.64430570602417, -3.486325979232788, -3.328346014022827, -3.1703662872314453, -3.0123863220214844, -2.8544063568115234, -2.6964266300201416, -2.5384466648101807, -2.380466938018799, -2.222486972808838, -2.064507007598877, -1.9065272808074951, -1.7485473155975342, -1.5905674695968628, -1.4325876235961914, -1.2746076583862305, -1.116627812385559, -0.9586479663848877, -0.8006681203842163, -0.6426882147789001, -0.48470833897590637, -0.3267284631729126, -0.1687486171722412, -0.010768711566925049, 0.1472111940383911, 0.3051910400390625, 0.4631709158420563, 0.62115079164505, 0.7791306972503662, 0.9371105432510376, 1.095090389251709, 1.25307035446167, 1.4110502004623413, 1.5690300464630127, 1.727009892463684, 1.8849897384643555, 2.0429697036743164, 2.2009496688842773, 2.358929395675659, 2.51690936088562, 2.674889087677002, 2.832869052886963, 2.990849018096924, 3.1488287448883057, 3.3068087100982666, 3.4647884368896484, 3.6227684020996094, 3.7807483673095703, 3.9387283325195312, 4.096708297729492, 4.254688262939453, 4.412668228149414, 4.570647716522217, 4.728627681732178, 4.886607646942139, 5.0445876121521, 5.2025675773620605, 5.360547065734863]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 5.0, 2.0, 7.0, 9.0, 9.0, 15.0, 17.0, 28.0, 20.0, 30.0, 17.0, 41.0, 35.0, 43.0, 36.0, 58.0, 50.0, 66.0, 54.0, 53.0, 41.0, 58.0, 48.0, 39.0, 32.0, 33.0, 31.0, 36.0, 14.0, 18.0, 10.0, 17.0, 8.0, 5.0, 8.0, 6.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-3.1171875, -3.041351318359375, -2.96551513671875, -2.889678955078125, -2.8138427734375, -2.738006591796875, -2.66217041015625, -2.586334228515625, -2.510498046875, -2.434661865234375, -2.35882568359375, -2.282989501953125, -2.2071533203125, -2.131317138671875, -2.05548095703125, -1.979644775390625, -1.90380859375, -1.827972412109375, -1.75213623046875, -1.676300048828125, -1.6004638671875, -1.524627685546875, -1.44879150390625, -1.372955322265625, -1.297119140625, -1.221282958984375, -1.14544677734375, -1.069610595703125, -0.9937744140625, -0.917938232421875, -0.84210205078125, -0.766265869140625, -0.6904296875, -0.614593505859375, -0.53875732421875, -0.462921142578125, -0.3870849609375, -0.311248779296875, -0.23541259765625, -0.159576416015625, -0.083740234375, -0.007904052734375, 0.06793212890625, 0.143768310546875, 0.2196044921875, 0.295440673828125, 0.37127685546875, 0.447113037109375, 0.52294921875, 0.598785400390625, 0.67462158203125, 0.750457763671875, 0.8262939453125, 0.902130126953125, 0.97796630859375, 1.053802490234375, 1.129638671875, 1.205474853515625, 1.28131103515625, 1.357147216796875, 1.4329833984375, 1.508819580078125, 1.58465576171875, 1.660491943359375, 1.736328125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 11.0, 17.0, 23.0, 24.0, 40.0, 52.0, 85.0, 148.0, 214.0, 330.0, 612.0, 1070.0, 1700.0, 3215.0, 5730.0, 11034.0, 22281.0, 47528.0, 107310.0, 226693.0, 294146.0, 175877.0, 78744.0, 35120.0, 17074.0, 8821.0, 4548.0, 2464.0, 1467.0, 825.0, 486.0, 302.0, 201.0, 119.0, 87.0, 50.0, 27.0, 24.0, 16.0, 7.0, 11.0, 12.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.48046875, -5.32073974609375, -5.1610107421875, -5.00128173828125, -4.841552734375, -4.68182373046875, -4.5220947265625, -4.36236572265625, -4.20263671875, -4.04290771484375, -3.8831787109375, -3.72344970703125, -3.563720703125, -3.40399169921875, -3.2442626953125, -3.08453369140625, -2.9248046875, -2.76507568359375, -2.6053466796875, -2.44561767578125, -2.285888671875, -2.12615966796875, -1.9664306640625, -1.80670166015625, -1.64697265625, -1.48724365234375, -1.3275146484375, -1.16778564453125, -1.008056640625, -0.84832763671875, -0.6885986328125, -0.52886962890625, -0.369140625, -0.20941162109375, -0.0496826171875, 0.11004638671875, 0.269775390625, 0.42950439453125, 0.5892333984375, 0.74896240234375, 0.90869140625, 1.06842041015625, 1.2281494140625, 1.38787841796875, 1.547607421875, 1.70733642578125, 1.8670654296875, 2.02679443359375, 2.1865234375, 2.34625244140625, 2.5059814453125, 2.66571044921875, 2.825439453125, 2.98516845703125, 3.1448974609375, 3.30462646484375, 3.46435546875, 3.62408447265625, 3.7838134765625, 3.94354248046875, 4.103271484375, 4.26300048828125, 4.4227294921875, 4.58245849609375, 4.7421875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 0.0, 3.0, 7.0, 7.0, 10.0, 8.0, 16.0, 16.0, 21.0, 12.0, 22.0, 31.0, 29.0, 35.0, 27.0, 35.0, 54.0, 77.0, 127.0, 165.0, 226.0, 1280.0, 229.0, 125.0, 85.0, 66.0, 62.0, 41.0, 35.0, 36.0, 27.0, 23.0, 12.0, 11.0, 20.0, 12.0, 17.0, 8.0, 11.0, 4.0, 5.0, 4.0, 0.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4453125, -6.2178955078125, -5.990478515625, -5.7630615234375, -5.53564453125, -5.3082275390625, -5.080810546875, -4.8533935546875, -4.6259765625, -4.3985595703125, -4.171142578125, -3.9437255859375, -3.71630859375, -3.4888916015625, -3.261474609375, -3.0340576171875, -2.806640625, -2.5792236328125, -2.351806640625, -2.1243896484375, -1.89697265625, -1.6695556640625, -1.442138671875, -1.2147216796875, -0.9873046875, -0.7598876953125, -0.532470703125, -0.3050537109375, -0.07763671875, 0.1497802734375, 0.377197265625, 0.6046142578125, 0.83203125, 1.0594482421875, 1.286865234375, 1.5142822265625, 1.74169921875, 1.9691162109375, 2.196533203125, 2.4239501953125, 2.6513671875, 2.8787841796875, 3.106201171875, 3.3336181640625, 3.56103515625, 3.7884521484375, 4.015869140625, 4.2432861328125, 4.470703125, 4.6981201171875, 4.925537109375, 5.1529541015625, 5.38037109375, 5.6077880859375, 5.835205078125, 6.0626220703125, 6.2900390625, 6.5174560546875, 6.744873046875, 6.9722900390625, 7.19970703125, 7.4271240234375, 7.654541015625, 7.8819580078125, 8.109375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 0.0, 8.0, 7.0, 5.0, 11.0, 7.0, 15.0, 16.0, 18.0, 17.0, 33.0, 23.0, 47.0, 52.0, 80.0, 163.0, 380.0, 2094.0, 92574.0, 2953498.0, 93582.0, 2115.0, 422.0, 176.0, 94.0, 52.0, 34.0, 28.0, 29.0, 22.0, 15.0, 18.0, 14.0, 7.0, 11.0, 9.0, 6.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-33.125, -32.217529296875, -31.31005859375, -30.402587890625, -29.4951171875, -28.587646484375, -27.68017578125, -26.772705078125, -25.865234375, -24.957763671875, -24.05029296875, -23.142822265625, -22.2353515625, -21.327880859375, -20.42041015625, -19.512939453125, -18.60546875, -17.697998046875, -16.79052734375, -15.883056640625, -14.9755859375, -14.068115234375, -13.16064453125, -12.253173828125, -11.345703125, -10.438232421875, -9.53076171875, -8.623291015625, -7.7158203125, -6.808349609375, -5.90087890625, -4.993408203125, -4.0859375, -3.178466796875, -2.27099609375, -1.363525390625, -0.4560546875, 0.451416015625, 1.35888671875, 2.266357421875, 3.173828125, 4.081298828125, 4.98876953125, 5.896240234375, 6.8037109375, 7.711181640625, 8.61865234375, 9.526123046875, 10.43359375, 11.341064453125, 12.24853515625, 13.156005859375, 14.0634765625, 14.970947265625, 15.87841796875, 16.785888671875, 17.693359375, 18.600830078125, 19.50830078125, 20.415771484375, 21.3232421875, 22.230712890625, 23.13818359375, 24.045654296875, 24.953125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 9.0, 20.0, 43.0, 71.0, 147.0, 178.0, 198.0, 153.0, 92.0, 55.0, 26.0, 10.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.873958587646484, -33.981712341308594, -33.08946990966797, -32.19722366333008, -31.304977416992188, -30.41273307800293, -29.520488739013672, -28.62824249267578, -27.73599624633789, -26.843751907348633, -25.951505661010742, -25.059261322021484, -24.167015075683594, -23.274770736694336, -22.382526397705078, -21.490280151367188, -20.59803581237793, -19.705791473388672, -18.81354522705078, -17.921300888061523, -17.029054641723633, -16.136810302734375, -15.2445650100708, -14.352319717407227, -13.460074424743652, -12.567829132080078, -11.675583839416504, -10.78333854675293, -9.891094207763672, -8.998847961425781, -8.106603622436523, -7.214358329772949, -6.322111129760742, -5.429865837097168, -4.537620544433594, -3.6453757286071777, -2.7531304359436035, -1.8608851432800293, -0.9686403274536133, -0.07639503479003906, 0.8158502578735352, 1.7080954313278198, 2.6003406047821045, 3.4925856590270996, 4.384830951690674, 5.277076244354248, 6.169321060180664, 7.061566352844238, 7.9538116455078125, 8.846056938171387, 9.738302230834961, 10.630546569824219, 11.52279281616211, 12.415037155151367, 13.307282447814941, 14.199527740478516, 15.09177303314209, 15.984018325805664, 16.876262664794922, 17.768508911132812, 18.66075325012207, 19.55299949645996, 20.44524383544922, 21.33749008178711, 22.229734420776367]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 1.0, 4.0, 1.0, 7.0, 5.0, 7.0, 9.0, 15.0, 11.0, 16.0, 9.0, 14.0, 21.0, 27.0, 16.0, 28.0, 25.0, 34.0, 36.0, 34.0, 46.0, 41.0, 49.0, 26.0, 53.0, 46.0, 34.0, 31.0, 40.0, 25.0, 44.0, 34.0, 27.0, 28.0, 22.0, 21.0, 24.0, 16.0, 13.0, 14.0, 11.0, 17.0, 6.0, 4.0, 5.0, 1.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0], "bins": [-25.479583740234375, -24.716249465942383, -23.952913284301758, -23.189579010009766, -22.42624282836914, -21.66290855407715, -20.899574279785156, -20.13623809814453, -19.37290382385254, -18.609569549560547, -17.846233367919922, -17.08289909362793, -16.319564819335938, -15.556228637695312, -14.79289436340332, -14.029559135437012, -13.266223907470703, -12.502888679504395, -11.739553451538086, -10.976219177246094, -10.212883949279785, -9.449548721313477, -8.686214447021484, -7.922879219055176, -7.159543991088867, -6.396208763122559, -5.632874011993408, -4.869539260864258, -4.106204032897949, -3.3428690433502197, -2.5795340538024902, -1.8161993026733398, -1.0528621673583984, -0.28952717781066895, 0.47380781173706055, 1.23714280128479, 2.0004777908325195, 2.763812780380249, 3.5271477699279785, 4.290482521057129, 5.0538177490234375, 5.817152976989746, 6.5804877281188965, 7.343822479248047, 8.107157707214355, 8.870492935180664, 9.633827209472656, 10.397162437438965, 11.160497665405273, 11.923832893371582, 12.68716812133789, 13.450502395629883, 14.213837623596191, 14.9771728515625, 15.740507125854492, 16.503841400146484, 17.26717758178711, 18.0305118560791, 18.793848037719727, 19.55718231201172, 20.320518493652344, 21.083852767944336, 21.847187042236328, 22.610523223876953, 23.373857498168945]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 4.0, 8.0, 10.0, 12.0, 16.0, 18.0, 13.0, 16.0, 21.0, 27.0, 31.0, 39.0, 31.0, 36.0, 34.0, 38.0, 52.0, 53.0, 53.0, 46.0, 49.0, 36.0, 47.0, 43.0, 49.0, 23.0, 38.0, 16.0, 25.0, 27.0, 25.0, 17.0, 10.0, 9.0, 7.0, 5.0, 11.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.8984375, -2.8212890625, -2.744140625, -2.6669921875, -2.58984375, -2.5126953125, -2.435546875, -2.3583984375, -2.28125, -2.2041015625, -2.126953125, -2.0498046875, -1.97265625, -1.8955078125, -1.818359375, -1.7412109375, -1.6640625, -1.5869140625, -1.509765625, -1.4326171875, -1.35546875, -1.2783203125, -1.201171875, -1.1240234375, -1.046875, -0.9697265625, -0.892578125, -0.8154296875, -0.73828125, -0.6611328125, -0.583984375, -0.5068359375, -0.4296875, -0.3525390625, -0.275390625, -0.1982421875, -0.12109375, -0.0439453125, 0.033203125, 0.1103515625, 0.1875, 0.2646484375, 0.341796875, 0.4189453125, 0.49609375, 0.5732421875, 0.650390625, 0.7275390625, 0.8046875, 0.8818359375, 0.958984375, 1.0361328125, 1.11328125, 1.1904296875, 1.267578125, 1.3447265625, 1.421875, 1.4990234375, 1.576171875, 1.6533203125, 1.73046875, 1.8076171875, 1.884765625, 1.9619140625, 2.0390625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 17.0, 24.0, 44.0, 72.0, 104.0, 178.0, 297.0, 710.0, 1438.0, 3876.0, 11968.0, 43233.0, 185163.0, 1166158.0, 2270370.0, 395606.0, 82327.0, 21801.0, 6493.0, 2381.0, 973.0, 465.0, 242.0, 124.0, 77.0, 53.0, 34.0, 18.0, 11.0, 3.0, 9.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8671875, -5.625, -5.3828125, -5.140625, -4.8984375, -4.65625, -4.4140625, -4.171875, -3.9296875, -3.6875, -3.4453125, -3.203125, -2.9609375, -2.71875, -2.4765625, -2.234375, -1.9921875, -1.75, -1.5078125, -1.265625, -1.0234375, -0.78125, -0.5390625, -0.296875, -0.0546875, 0.1875, 0.4296875, 0.671875, 0.9140625, 1.15625, 1.3984375, 1.640625, 1.8828125, 2.125, 2.3671875, 2.609375, 2.8515625, 3.09375, 3.3359375, 3.578125, 3.8203125, 4.0625, 4.3046875, 4.546875, 4.7890625, 5.03125, 5.2734375, 5.515625, 5.7578125, 6.0, 6.2421875, 6.484375, 6.7265625, 6.96875, 7.2109375, 7.453125, 7.6953125, 7.9375, 8.1796875, 8.421875, 8.6640625, 8.90625, 9.1484375, 9.390625, 9.6328125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 0.0, 8.0, 12.0, 8.0, 21.0, 27.0, 35.0, 58.0, 77.0, 114.0, 161.0, 233.0, 281.0, 392.0, 466.0, 489.0, 411.0, 362.0, 255.0, 219.0, 151.0, 99.0, 54.0, 49.0, 23.0, 28.0, 18.0, 13.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.328125, -7.049560546875, -6.77099609375, -6.492431640625, -6.2138671875, -5.935302734375, -5.65673828125, -5.378173828125, -5.099609375, -4.821044921875, -4.54248046875, -4.263916015625, -3.9853515625, -3.706787109375, -3.42822265625, -3.149658203125, -2.87109375, -2.592529296875, -2.31396484375, -2.035400390625, -1.7568359375, -1.478271484375, -1.19970703125, -0.921142578125, -0.642578125, -0.364013671875, -0.08544921875, 0.193115234375, 0.4716796875, 0.750244140625, 1.02880859375, 1.307373046875, 1.5859375, 1.864501953125, 2.14306640625, 2.421630859375, 2.7001953125, 2.978759765625, 3.25732421875, 3.535888671875, 3.814453125, 4.093017578125, 4.37158203125, 4.650146484375, 4.9287109375, 5.207275390625, 5.48583984375, 5.764404296875, 6.04296875, 6.321533203125, 6.60009765625, 6.878662109375, 7.1572265625, 7.435791015625, 7.71435546875, 7.992919921875, 8.271484375, 8.550048828125, 8.82861328125, 9.107177734375, 9.3857421875, 9.664306640625, 9.94287109375, 10.221435546875, 10.5]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 6.0, 18.0, 15.0, 30.0, 40.0, 51.0, 58.0, 65.0, 105.0, 188.0, 282.0, 430.0, 731.0, 1635.0, 4535.0, 14736.0, 57614.0, 246010.0, 1137044.0, 2044405.0, 527026.0, 117048.0, 28898.0, 8048.0, 2651.0, 1070.0, 537.0, 301.0, 210.0, 144.0, 95.0, 60.0, 64.0, 37.0, 26.0, 17.0, 12.0, 11.0, 10.0, 3.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.34375, -10.96875, -10.59375, -10.21875, -9.84375, -9.46875, -9.09375, -8.71875, -8.34375, -7.96875, -7.59375, -7.21875, -6.84375, -6.46875, -6.09375, -5.71875, -5.34375, -4.96875, -4.59375, -4.21875, -3.84375, -3.46875, -3.09375, -2.71875, -2.34375, -1.96875, -1.59375, -1.21875, -0.84375, -0.46875, -0.09375, 0.28125, 0.65625, 1.03125, 1.40625, 1.78125, 2.15625, 2.53125, 2.90625, 3.28125, 3.65625, 4.03125, 4.40625, 4.78125, 5.15625, 5.53125, 5.90625, 6.28125, 6.65625, 7.03125, 7.40625, 7.78125, 8.15625, 8.53125, 8.90625, 9.28125, 9.65625, 10.03125, 10.40625, 10.78125, 11.15625, 11.53125, 11.90625, 12.28125, 12.65625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 12.0, 27.0, 64.0, 147.0, 183.0, 233.0, 166.0, 100.0, 50.0, 23.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.343994140625, -117.0604248046875, -114.77685546875, -112.4932861328125, -110.209716796875, -107.9261474609375, -105.642578125, -103.3590087890625, -101.075439453125, -98.7918701171875, -96.50830078125, -94.2247314453125, -91.941162109375, -89.6575927734375, -87.3740234375, -85.0904541015625, -82.806884765625, -80.5233154296875, -78.23974609375, -75.9561767578125, -73.672607421875, -71.3890380859375, -69.10546875, -66.8218994140625, -64.53832244873047, -62.25475311279297, -59.97118377685547, -57.68761444091797, -55.40404510498047, -53.12047576904297, -50.83690643310547, -48.55333709716797, -46.26976013183594, -43.98619079589844, -41.70262145996094, -39.41905212402344, -37.13548278808594, -34.85191345214844, -32.56834411621094, -30.284772872924805, -28.001205444335938, -25.717636108398438, -23.434066772460938, -21.150497436523438, -18.866928100585938, -16.583358764648438, -14.299787521362305, -12.016218185424805, -9.732648849487305, -7.449079513549805, -5.1655097007751465, -2.8819398880004883, -0.5983705520629883, 1.6851987838745117, 3.968769073486328, 6.252338409423828, 8.535907745361328, 10.819477081298828, 13.103046417236328, 15.386616706848145, 17.670185089111328, 19.953754425048828, 22.23732566833496, 24.52089500427246, 26.80446434020996]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 12.0, 6.0, 10.0, 7.0, 14.0, 13.0, 17.0, 15.0, 17.0, 21.0, 26.0, 34.0, 37.0, 36.0, 32.0, 34.0, 34.0, 37.0, 33.0, 36.0, 49.0, 46.0, 44.0, 42.0, 44.0, 41.0, 34.0, 30.0, 31.0, 29.0, 29.0, 21.0, 21.0, 15.0, 12.0, 10.0, 11.0, 12.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.115182876586914, -22.29827308654785, -21.48136329650879, -20.664453506469727, -19.847545623779297, -19.030635833740234, -18.213726043701172, -17.39681625366211, -16.579906463623047, -15.762996673583984, -14.946086883544922, -14.129178047180176, -13.312268257141113, -12.49535846710205, -11.678449630737305, -10.861539840698242, -10.04463005065918, -9.227720260620117, -8.410810470581055, -7.593901634216309, -6.776991844177246, -5.960082054138184, -5.143172740936279, -4.326263427734375, -3.5093536376953125, -2.692444086074829, -1.8755345344543457, -1.0586249828338623, -0.2417154312133789, 0.5751943588256836, 1.392103672027588, 2.209012985229492, 3.0259246826171875, 3.842834234237671, 4.659743785858154, 5.476653099060059, 6.293562889099121, 7.110472679138184, 7.927381992340088, 8.744291305541992, 9.561201095581055, 10.378110885620117, 11.19502067565918, 12.011929512023926, 12.828839302062988, 13.64574909210205, 14.462657928466797, 15.27956771850586, 16.096477508544922, 16.913387298583984, 17.730297088623047, 18.54720687866211, 19.364116668701172, 20.181026458740234, 20.997934341430664, 21.814844131469727, 22.63175392150879, 23.44866371154785, 24.265573501586914, 25.082483291625977, 25.899391174316406, 26.71630096435547, 27.53321075439453, 28.350120544433594, 29.167030334472656]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 1.0, 2.0, 0.0, 4.0, 6.0, 10.0, 15.0, 12.0, 13.0, 15.0, 19.0, 27.0, 22.0, 28.0, 26.0, 30.0, 44.0, 29.0, 34.0, 45.0, 50.0, 43.0, 38.0, 46.0, 52.0, 35.0, 47.0, 43.0, 41.0, 33.0, 25.0, 33.0, 28.0, 18.0, 22.0, 23.0, 11.0, 10.0, 7.0, 7.0, 9.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.771484375, -2.69549560546875, -2.6195068359375, -2.54351806640625, -2.467529296875, -2.39154052734375, -2.3155517578125, -2.23956298828125, -2.16357421875, -2.08758544921875, -2.0115966796875, -1.93560791015625, -1.859619140625, -1.78363037109375, -1.7076416015625, -1.63165283203125, -1.5556640625, -1.47967529296875, -1.4036865234375, -1.32769775390625, -1.251708984375, -1.17572021484375, -1.0997314453125, -1.02374267578125, -0.94775390625, -0.87176513671875, -0.7957763671875, -0.71978759765625, -0.643798828125, -0.56781005859375, -0.4918212890625, -0.41583251953125, -0.33984375, -0.26385498046875, -0.1878662109375, -0.11187744140625, -0.035888671875, 0.04010009765625, 0.1160888671875, 0.19207763671875, 0.26806640625, 0.34405517578125, 0.4200439453125, 0.49603271484375, 0.572021484375, 0.64801025390625, 0.7239990234375, 0.79998779296875, 0.8759765625, 0.95196533203125, 1.0279541015625, 1.10394287109375, 1.179931640625, 1.25592041015625, 1.3319091796875, 1.40789794921875, 1.48388671875, 1.55987548828125, 1.6358642578125, 1.71185302734375, 1.787841796875, 1.86383056640625, 1.9398193359375, 2.01580810546875, 2.091796875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 7.0, 13.0, 29.0, 44.0, 65.0, 108.0, 177.0, 307.0, 480.0, 791.0, 1216.0, 1901.0, 3078.0, 4923.0, 7602.0, 11311.0, 16897.0, 24147.0, 34021.0, 45815.0, 59372.0, 72684.0, 85590.0, 94728.0, 99781.0, 95976.0, 87327.0, 75338.0, 61773.0, 48188.0, 35922.0, 26196.0, 17942.0, 12322.0, 8093.0, 5368.0, 3348.0, 2093.0, 1342.0, 863.0, 505.0, 338.0, 197.0, 134.0, 78.0, 41.0, 26.0, 17.0, 10.0, 10.0, 4.0, 7.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3271484375, -1.2851409912109375, -1.243133544921875, -1.2011260986328125, -1.15911865234375, -1.1171112060546875, -1.075103759765625, -1.0330963134765625, -0.9910888671875, -0.9490814208984375, -0.907073974609375, -0.8650665283203125, -0.82305908203125, -0.7810516357421875, -0.739044189453125, -0.6970367431640625, -0.655029296875, -0.6130218505859375, -0.571014404296875, -0.5290069580078125, -0.48699951171875, -0.4449920654296875, -0.402984619140625, -0.3609771728515625, -0.3189697265625, -0.2769622802734375, -0.234954833984375, -0.1929473876953125, -0.15093994140625, -0.1089324951171875, -0.066925048828125, -0.0249176025390625, 0.01708984375, 0.0590972900390625, 0.101104736328125, 0.1431121826171875, 0.18511962890625, 0.2271270751953125, 0.269134521484375, 0.3111419677734375, 0.3531494140625, 0.3951568603515625, 0.437164306640625, 0.4791717529296875, 0.52117919921875, 0.5631866455078125, 0.605194091796875, 0.6472015380859375, 0.689208984375, 0.7312164306640625, 0.773223876953125, 0.8152313232421875, 0.85723876953125, 0.8992462158203125, 0.941253662109375, 0.9832611083984375, 1.0252685546875, 1.0672760009765625, 1.109283447265625, 1.1512908935546875, 1.19329833984375, 1.2353057861328125, 1.277313232421875, 1.3193206787109375, 1.361328125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 5.0, 9.0, 9.0, 7.0, 18.0, 14.0, 13.0, 28.0, 16.0, 27.0, 23.0, 30.0, 33.0, 41.0, 35.0, 28.0, 49.0, 35.0, 45.0, 1069.0, 44.0, 30.0, 43.0, 46.0, 34.0, 33.0, 24.0, 23.0, 34.0, 25.0, 27.0, 17.0, 24.0, 16.0, 10.0, 10.0, 8.0, 8.0, 17.0, 1.0, 3.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.353515625, -2.281768798828125, -2.21002197265625, -2.138275146484375, -2.0665283203125, -1.994781494140625, -1.92303466796875, -1.851287841796875, -1.779541015625, -1.707794189453125, -1.63604736328125, -1.564300537109375, -1.4925537109375, -1.420806884765625, -1.34906005859375, -1.277313232421875, -1.20556640625, -1.133819580078125, -1.06207275390625, -0.990325927734375, -0.9185791015625, -0.846832275390625, -0.77508544921875, -0.703338623046875, -0.631591796875, -0.559844970703125, -0.48809814453125, -0.416351318359375, -0.3446044921875, -0.272857666015625, -0.20111083984375, -0.129364013671875, -0.0576171875, 0.014129638671875, 0.08587646484375, 0.157623291015625, 0.2293701171875, 0.301116943359375, 0.37286376953125, 0.444610595703125, 0.516357421875, 0.588104248046875, 0.65985107421875, 0.731597900390625, 0.8033447265625, 0.875091552734375, 0.94683837890625, 1.018585205078125, 1.09033203125, 1.162078857421875, 1.23382568359375, 1.305572509765625, 1.3773193359375, 1.449066162109375, 1.52081298828125, 1.592559814453125, 1.664306640625, 1.736053466796875, 1.80780029296875, 1.879547119140625, 1.9512939453125, 2.023040771484375, 2.09478759765625, 2.166534423828125, 2.23828125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 9.0, 13.0, 19.0, 28.0, 46.0, 75.0, 97.0, 134.0, 207.0, 308.0, 397.0, 617.0, 885.0, 1239.0, 1831.0, 2610.0, 3748.0, 5286.0, 7611.0, 10978.0, 16200.0, 27761.0, 73549.0, 1439503.0, 385340.0, 48963.0, 23281.0, 14379.0, 9662.0, 6751.0, 4795.0, 3344.0, 2303.0, 1582.0, 1145.0, 737.0, 530.0, 348.0, 260.0, 173.0, 140.0, 78.0, 56.0, 27.0, 23.0, 25.0, 12.0, 7.0, 6.0, 8.0, 2.0, 1.0, 0.0, 4.0], "bins": [-2.580078125, -2.50384521484375, -2.4276123046875, -2.35137939453125, -2.275146484375, -2.19891357421875, -2.1226806640625, -2.04644775390625, -1.97021484375, -1.89398193359375, -1.8177490234375, -1.74151611328125, -1.665283203125, -1.58905029296875, -1.5128173828125, -1.43658447265625, -1.3603515625, -1.28411865234375, -1.2078857421875, -1.13165283203125, -1.055419921875, -0.97918701171875, -0.9029541015625, -0.82672119140625, -0.75048828125, -0.67425537109375, -0.5980224609375, -0.52178955078125, -0.445556640625, -0.36932373046875, -0.2930908203125, -0.21685791015625, -0.140625, -0.06439208984375, 0.0118408203125, 0.08807373046875, 0.164306640625, 0.24053955078125, 0.3167724609375, 0.39300537109375, 0.46923828125, 0.54547119140625, 0.6217041015625, 0.69793701171875, 0.774169921875, 0.85040283203125, 0.9266357421875, 1.00286865234375, 1.0791015625, 1.15533447265625, 1.2315673828125, 1.30780029296875, 1.384033203125, 1.46026611328125, 1.5364990234375, 1.61273193359375, 1.68896484375, 1.76519775390625, 1.8414306640625, 1.91766357421875, 1.993896484375, 2.07012939453125, 2.1463623046875, 2.22259521484375, 2.298828125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 1.0, 8.0, 8.0, 15.0, 18.0, 18.0, 25.0, 18.0, 30.0, 32.0, 44.0, 27.0, 46.0, 34.0, 31.0, 40.0, 18.0, 36.0, 39.0, 48.0, 37.0, 34.0, 29.0, 35.0, 38.0, 31.0, 39.0, 31.0, 27.0, 24.0, 19.0, 32.0, 23.0, 18.0, 18.0, 13.0, 9.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.422119140625, -0.408660888671875, -0.39520263671875, -0.381744384765625, -0.3682861328125, -0.354827880859375, -0.34136962890625, -0.327911376953125, -0.314453125, -0.300994873046875, -0.28753662109375, -0.274078369140625, -0.2606201171875, -0.247161865234375, -0.23370361328125, -0.220245361328125, -0.206787109375, -0.193328857421875, -0.17987060546875, -0.166412353515625, -0.1529541015625, -0.139495849609375, -0.12603759765625, -0.112579345703125, -0.09912109375, -0.085662841796875, -0.07220458984375, -0.058746337890625, -0.0452880859375, -0.031829833984375, -0.01837158203125, -0.004913330078125, 0.008544921875, 0.022003173828125, 0.03546142578125, 0.048919677734375, 0.0623779296875, 0.075836181640625, 0.08929443359375, 0.102752685546875, 0.1162109375, 0.129669189453125, 0.14312744140625, 0.156585693359375, 0.1700439453125, 0.183502197265625, 0.19696044921875, 0.210418701171875, 0.223876953125, 0.237335205078125, 0.25079345703125, 0.264251708984375, 0.2777099609375, 0.291168212890625, 0.30462646484375, 0.318084716796875, 0.33154296875, 0.345001220703125, 0.35845947265625, 0.371917724609375, 0.3853759765625, 0.398834228515625, 0.41229248046875, 0.425750732421875, 0.439208984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 4.0, 9.0, 16.0, 23.0, 19.0, 39.0, 56.0, 56.0, 82.0, 75.0, 71.0, 103.0, 110.0, 133.0, 133.0, 168.0, 195.0, 259.0, 439.0, 1702.0, 520168.0, 521051.0, 1667.0, 438.0, 265.0, 172.0, 169.0, 145.0, 119.0, 114.0, 90.0, 64.0, 76.0, 77.0, 68.0, 51.0, 48.0, 30.0, 16.0, 10.0, 11.0, 5.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.94921875, -6.7320556640625, -6.514892578125, -6.2977294921875, -6.08056640625, -5.8634033203125, -5.646240234375, -5.4290771484375, -5.2119140625, -4.9947509765625, -4.777587890625, -4.5604248046875, -4.34326171875, -4.1260986328125, -3.908935546875, -3.6917724609375, -3.474609375, -3.2574462890625, -3.040283203125, -2.8231201171875, -2.60595703125, -2.3887939453125, -2.171630859375, -1.9544677734375, -1.7373046875, -1.5201416015625, -1.302978515625, -1.0858154296875, -0.86865234375, -0.6514892578125, -0.434326171875, -0.2171630859375, 0.0, 0.2171630859375, 0.434326171875, 0.6514892578125, 0.86865234375, 1.0858154296875, 1.302978515625, 1.5201416015625, 1.7373046875, 1.9544677734375, 2.171630859375, 2.3887939453125, 2.60595703125, 2.8231201171875, 3.040283203125, 3.2574462890625, 3.474609375, 3.6917724609375, 3.908935546875, 4.1260986328125, 4.34326171875, 4.5604248046875, 4.777587890625, 4.9947509765625, 5.2119140625, 5.4290771484375, 5.646240234375, 5.8634033203125, 6.08056640625, 6.2977294921875, 6.514892578125, 6.7320556640625, 6.94921875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 18.0, 250.0, 658.0, 82.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.786502838134766, -32.02855682373047, -31.270614624023438, -30.512670516967773, -29.75472640991211, -28.996780395507812, -28.23883628845215, -27.480892181396484, -26.72294807434082, -25.965003967285156, -25.207059860229492, -24.449115753173828, -23.69116973876953, -22.933225631713867, -22.175281524658203, -21.41733741760254, -20.659393310546875, -19.90144920349121, -19.143505096435547, -18.385560989379883, -17.62761688232422, -16.869670867919922, -16.111726760864258, -15.353782653808594, -14.59583854675293, -13.837894439697266, -13.079950332641602, -12.322005271911621, -11.564061164855957, -10.806117057800293, -10.048171997070312, -9.290227890014648, -8.532281875610352, -7.7743377685546875, -7.016393184661865, -6.258448600769043, -5.500504493713379, -4.742560386657715, -3.9846158027648926, -3.2266712188720703, -2.4687271118164062, -1.710782766342163, -0.9528384208679199, -0.19489407539367676, 0.5630502700805664, 1.3209946155548096, 2.0789389610290527, 2.836883544921875, 3.594827651977539, 4.352771759033203, 5.110716342926025, 5.868660926818848, 6.626605033874512, 7.384549140930176, 8.142494201660156, 8.90043830871582, 9.658382415771484, 10.416326522827148, 11.174270629882812, 11.932215690612793, 12.690159797668457, 13.448103904724121, 14.206048965454102, 14.963993072509766, 15.72193717956543]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 12.0, 5.0, 16.0, 9.0, 17.0, 30.0, 23.0, 39.0, 39.0, 37.0, 43.0, 35.0, 43.0, 56.0, 67.0, 52.0, 51.0, 57.0, 53.0, 43.0, 43.0, 49.0, 35.0, 17.0, 33.0, 18.0, 20.0, 19.0, 12.0, 4.0, 6.0, 12.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.323416709899902, -6.117707252502441, -5.9119977951049805, -5.706288814544678, -5.500579357147217, -5.294869899749756, -5.089160442352295, -4.883451461791992, -4.677742004394531, -4.47203254699707, -4.266323089599609, -4.060614109039307, -3.8549046516418457, -3.6491951942443848, -3.443485736846924, -3.237776517868042, -3.032067060470581, -2.82635760307312, -2.6206483840942383, -2.4149389266967773, -2.2092297077178955, -2.0035202503204346, -1.7978109121322632, -1.5921015739440918, -1.3863922357559204, -1.180682897567749, -0.9749735593795776, -0.7692641615867615, -0.5635548233985901, -0.3578454256057739, -0.15213608741760254, 0.05357325077056885, 0.25928258895874023, 0.4649919271469116, 0.670701265335083, 0.8764106631278992, 1.0821199417114258, 1.2878293991088867, 1.493538737297058, 1.6992480754852295, 1.9049574136734009, 2.1106667518615723, 2.316376209259033, 2.522085428237915, 2.727794885635376, 2.933504104614258, 3.1392135620117188, 3.3449230194091797, 3.5506322383880615, 3.7563416957855225, 3.9620509147644043, 4.167760372161865, 4.373469829559326, 4.579178810119629, 4.78488826751709, 4.990597724914551, 5.196307182312012, 5.402016639709473, 5.607726097106934, 5.813435077667236, 6.019144535064697, 6.224853992462158, 6.430563449859619, 6.636272430419922, 6.841981887817383]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 3.0, 11.0, 11.0, 10.0, 16.0, 13.0, 21.0, 20.0, 27.0, 27.0, 37.0, 38.0, 34.0, 42.0, 48.0, 35.0, 47.0, 54.0, 53.0, 48.0, 50.0, 52.0, 40.0, 38.0, 29.0, 35.0, 31.0, 27.0, 25.0, 17.0, 14.0, 12.0, 11.0, 10.0, 4.0, 4.0, 1.0, 8.0, 1.0], "bins": [-3.654296875, -3.5688323974609375, -3.483367919921875, -3.3979034423828125, -3.31243896484375, -3.2269744873046875, -3.141510009765625, -3.0560455322265625, -2.9705810546875, -2.8851165771484375, -2.799652099609375, -2.7141876220703125, -2.62872314453125, -2.5432586669921875, -2.457794189453125, -2.3723297119140625, -2.286865234375, -2.2014007568359375, -2.115936279296875, -2.0304718017578125, -1.94500732421875, -1.8595428466796875, -1.774078369140625, -1.6886138916015625, -1.6031494140625, -1.5176849365234375, -1.432220458984375, -1.3467559814453125, -1.26129150390625, -1.1758270263671875, -1.090362548828125, -1.0048980712890625, -0.91943359375, -0.8339691162109375, -0.748504638671875, -0.6630401611328125, -0.57757568359375, -0.4921112060546875, -0.406646728515625, -0.3211822509765625, -0.2357177734375, -0.1502532958984375, -0.064788818359375, 0.0206756591796875, 0.10614013671875, 0.1916046142578125, 0.277069091796875, 0.3625335693359375, 0.447998046875, 0.5334625244140625, 0.618927001953125, 0.7043914794921875, 0.78985595703125, 0.8753204345703125, 0.960784912109375, 1.0462493896484375, 1.1317138671875, 1.2171783447265625, 1.302642822265625, 1.3881072998046875, 1.47357177734375, 1.5590362548828125, 1.644500732421875, 1.7299652099609375, 1.8154296875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 6.0, 4.0, 11.0, 13.0, 18.0, 27.0, 44.0, 54.0, 86.0, 145.0, 235.0, 390.0, 721.0, 1245.0, 2286.0, 4268.0, 8487.0, 17004.0, 34764.0, 71947.0, 138385.0, 220914.0, 231271.0, 154480.0, 81875.0, 39952.0, 19495.0, 9676.0, 4847.0, 2560.0, 1382.0, 781.0, 439.0, 270.0, 156.0, 102.0, 68.0, 63.0, 28.0, 23.0, 17.0, 5.0, 6.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-2.81640625, -2.740478515625, -2.66455078125, -2.588623046875, -2.5126953125, -2.436767578125, -2.36083984375, -2.284912109375, -2.208984375, -2.133056640625, -2.05712890625, -1.981201171875, -1.9052734375, -1.829345703125, -1.75341796875, -1.677490234375, -1.6015625, -1.525634765625, -1.44970703125, -1.373779296875, -1.2978515625, -1.221923828125, -1.14599609375, -1.070068359375, -0.994140625, -0.918212890625, -0.84228515625, -0.766357421875, -0.6904296875, -0.614501953125, -0.53857421875, -0.462646484375, -0.38671875, -0.310791015625, -0.23486328125, -0.158935546875, -0.0830078125, -0.007080078125, 0.06884765625, 0.144775390625, 0.220703125, 0.296630859375, 0.37255859375, 0.448486328125, 0.5244140625, 0.600341796875, 0.67626953125, 0.752197265625, 0.828125, 0.904052734375, 0.97998046875, 1.055908203125, 1.1318359375, 1.207763671875, 1.28369140625, 1.359619140625, 1.435546875, 1.511474609375, 1.58740234375, 1.663330078125, 1.7392578125, 1.815185546875, 1.89111328125, 1.967041015625, 2.04296875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 12.0, 11.0, 18.0, 19.0, 16.0, 24.0, 28.0, 33.0, 43.0, 30.0, 44.0, 46.0, 62.0, 80.0, 137.0, 269.0, 1396.0, 233.0, 123.0, 64.0, 58.0, 46.0, 33.0, 34.0, 26.0, 26.0, 23.0, 18.0, 22.0, 18.0, 13.0, 7.0, 8.0, 7.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8125, -9.498779296875, -9.18505859375, -8.871337890625, -8.5576171875, -8.243896484375, -7.93017578125, -7.616455078125, -7.302734375, -6.989013671875, -6.67529296875, -6.361572265625, -6.0478515625, -5.734130859375, -5.42041015625, -5.106689453125, -4.79296875, -4.479248046875, -4.16552734375, -3.851806640625, -3.5380859375, -3.224365234375, -2.91064453125, -2.596923828125, -2.283203125, -1.969482421875, -1.65576171875, -1.342041015625, -1.0283203125, -0.714599609375, -0.40087890625, -0.087158203125, 0.2265625, 0.540283203125, 0.85400390625, 1.167724609375, 1.4814453125, 1.795166015625, 2.10888671875, 2.422607421875, 2.736328125, 3.050048828125, 3.36376953125, 3.677490234375, 3.9912109375, 4.304931640625, 4.61865234375, 4.932373046875, 5.24609375, 5.559814453125, 5.87353515625, 6.187255859375, 6.5009765625, 6.814697265625, 7.12841796875, 7.442138671875, 7.755859375, 8.069580078125, 8.38330078125, 8.697021484375, 9.0107421875, 9.324462890625, 9.63818359375, 9.951904296875, 10.265625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 13.0, 5.0, 17.0, 21.0, 18.0, 26.0, 22.0, 29.0, 40.0, 62.0, 86.0, 152.0, 360.0, 1038.0, 4216.0, 43378.0, 1516471.0, 1528993.0, 44428.0, 4218.0, 1118.0, 405.0, 192.0, 96.0, 68.0, 33.0, 41.0, 25.0, 32.0, 16.0, 18.0, 19.0, 9.0, 8.0, 4.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.59375, -13.1552734375, -12.716796875, -12.2783203125, -11.83984375, -11.4013671875, -10.962890625, -10.5244140625, -10.0859375, -9.6474609375, -9.208984375, -8.7705078125, -8.33203125, -7.8935546875, -7.455078125, -7.0166015625, -6.578125, -6.1396484375, -5.701171875, -5.2626953125, -4.82421875, -4.3857421875, -3.947265625, -3.5087890625, -3.0703125, -2.6318359375, -2.193359375, -1.7548828125, -1.31640625, -0.8779296875, -0.439453125, -0.0009765625, 0.4375, 0.8759765625, 1.314453125, 1.7529296875, 2.19140625, 2.6298828125, 3.068359375, 3.5068359375, 3.9453125, 4.3837890625, 4.822265625, 5.2607421875, 5.69921875, 6.1376953125, 6.576171875, 7.0146484375, 7.453125, 7.8916015625, 8.330078125, 8.7685546875, 9.20703125, 9.6455078125, 10.083984375, 10.5224609375, 10.9609375, 11.3994140625, 11.837890625, 12.2763671875, 12.71484375, 13.1533203125, 13.591796875, 14.0302734375, 14.46875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 39.0, 390.0, 501.0, 85.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.521692276000977, -12.990403175354004, -10.459114074707031, -7.927824974060059, -5.396535873413086, -2.8652467727661133, -0.3339576721191406, 2.1973323822021484, 4.728620529174805, 7.259909629821777, 9.79119873046875, 12.322487831115723, 14.853776931762695, 17.385066986083984, 19.91635513305664, 22.44764518737793, 24.978933334350586, 27.510223388671875, 30.04151153564453, 32.57279968261719, 35.104087829589844, 37.635379791259766, 40.16666793823242, 42.697959899902344, 45.229248046875, 47.760536193847656, 50.29182434082031, 52.823116302490234, 55.35440444946289, 57.88569259643555, 60.41698455810547, 62.948272705078125, 65.47955322265625, 68.0108413696289, 70.54212951660156, 73.07341766357422, 75.60470581054688, 78.13600158691406, 80.66728973388672, 83.19857788085938, 85.72986602783203, 88.26115417480469, 90.79244232177734, 93.32373046875, 95.85502624511719, 98.38631439208984, 100.9176025390625, 103.44889068603516, 105.98017883300781, 108.51146697998047, 111.04275512695312, 113.57404327392578, 116.10533142089844, 118.63662719726562, 121.16791534423828, 123.69920349121094, 126.2304916381836, 128.76177978515625, 131.29307556152344, 133.82435607910156, 136.35565185546875, 138.88693237304688, 141.41822814941406, 143.94952392578125, 146.48080444335938]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 4.0, 6.0, 6.0, 4.0, 12.0, 5.0, 17.0, 6.0, 18.0, 20.0, 17.0, 28.0, 24.0, 32.0, 33.0, 35.0, 39.0, 33.0, 34.0, 45.0, 35.0, 38.0, 35.0, 45.0, 40.0, 46.0, 31.0, 34.0, 40.0, 30.0, 30.0, 27.0, 22.0, 19.0, 12.0, 13.0, 15.0, 17.0, 11.0, 3.0, 9.0, 8.0, 10.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-27.57522201538086, -26.682418823242188, -25.789615631103516, -24.896812438964844, -24.004009246826172, -23.1112060546875, -22.21840476989746, -21.32560157775879, -20.432798385620117, -19.539995193481445, -18.647192001342773, -17.7543888092041, -16.861587524414062, -15.968783378601074, -15.075981140136719, -14.183177947998047, -13.290374755859375, -12.397571563720703, -11.504768371582031, -10.611966133117676, -9.719162940979004, -8.826359748840332, -7.933557033538818, -7.040754318237305, -6.147951126098633, -5.255147933959961, -4.362345218658447, -3.4695422649383545, -2.5767393112182617, -1.6839361190795898, -0.7911334037780762, 0.1016693115234375, 0.9944744110107422, 1.887277364730835, 2.7800803184509277, 3.6728832721710205, 4.565686225891113, 5.458489418029785, 6.351292133331299, 7.2440948486328125, 8.136898040771484, 9.029701232910156, 9.922504425048828, 10.815306663513184, 11.708109855651855, 12.600913047790527, 13.493715286254883, 14.386518478393555, 15.279321670532227, 16.1721248626709, 17.06492805480957, 17.957731246948242, 18.85053253173828, 19.743335723876953, 20.636138916015625, 21.528942108154297, 22.42174530029297, 23.31454849243164, 24.207351684570312, 25.100154876708984, 25.992958068847656, 26.885761260986328, 27.778562545776367, 28.67136573791504, 29.56416893005371]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 6.0, 12.0, 7.0, 16.0, 20.0, 16.0, 22.0, 25.0, 34.0, 27.0, 34.0, 31.0, 22.0, 38.0, 46.0, 49.0, 49.0, 49.0, 59.0, 49.0, 44.0, 50.0, 41.0, 43.0, 42.0, 24.0, 26.0, 40.0, 17.0, 16.0, 11.0, 11.0, 12.0, 6.0, 4.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.564453125, -3.473968505859375, -3.38348388671875, -3.292999267578125, -3.2025146484375, -3.112030029296875, -3.02154541015625, -2.931060791015625, -2.840576171875, -2.750091552734375, -2.65960693359375, -2.569122314453125, -2.4786376953125, -2.388153076171875, -2.29766845703125, -2.207183837890625, -2.11669921875, -2.026214599609375, -1.93572998046875, -1.845245361328125, -1.7547607421875, -1.664276123046875, -1.57379150390625, -1.483306884765625, -1.392822265625, -1.302337646484375, -1.21185302734375, -1.121368408203125, -1.0308837890625, -0.940399169921875, -0.84991455078125, -0.759429931640625, -0.6689453125, -0.578460693359375, -0.48797607421875, -0.397491455078125, -0.3070068359375, -0.216522216796875, -0.12603759765625, -0.035552978515625, 0.054931640625, 0.145416259765625, 0.23590087890625, 0.326385498046875, 0.4168701171875, 0.507354736328125, 0.59783935546875, 0.688323974609375, 0.77880859375, 0.869293212890625, 0.95977783203125, 1.050262451171875, 1.1407470703125, 1.231231689453125, 1.32171630859375, 1.412200927734375, 1.502685546875, 1.593170166015625, 1.68365478515625, 1.774139404296875, 1.8646240234375, 1.955108642578125, 2.04559326171875, 2.136077880859375, 2.2265625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 9.0, 6.0, 13.0, 20.0, 25.0, 24.0, 33.0, 33.0, 57.0, 58.0, 62.0, 68.0, 149.0, 357.0, 916.0, 3537.0, 16842.0, 107299.0, 1188559.0, 2587210.0, 245998.0, 33852.0, 6480.0, 1533.0, 460.0, 199.0, 109.0, 73.0, 58.0, 44.0, 58.0, 39.0, 25.0, 25.0, 15.0, 11.0, 8.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.171875, -11.8446044921875, -11.517333984375, -11.1900634765625, -10.86279296875, -10.5355224609375, -10.208251953125, -9.8809814453125, -9.5537109375, -9.2264404296875, -8.899169921875, -8.5718994140625, -8.24462890625, -7.9173583984375, -7.590087890625, -7.2628173828125, -6.935546875, -6.6082763671875, -6.281005859375, -5.9537353515625, -5.62646484375, -5.2991943359375, -4.971923828125, -4.6446533203125, -4.3173828125, -3.9901123046875, -3.662841796875, -3.3355712890625, -3.00830078125, -2.6810302734375, -2.353759765625, -2.0264892578125, -1.69921875, -1.3719482421875, -1.044677734375, -0.7174072265625, -0.39013671875, -0.0628662109375, 0.264404296875, 0.5916748046875, 0.9189453125, 1.2462158203125, 1.573486328125, 1.9007568359375, 2.22802734375, 2.5552978515625, 2.882568359375, 3.2098388671875, 3.537109375, 3.8643798828125, 4.191650390625, 4.5189208984375, 4.84619140625, 5.1734619140625, 5.500732421875, 5.8280029296875, 6.1552734375, 6.4825439453125, 6.809814453125, 7.1370849609375, 7.46435546875, 7.7916259765625, 8.118896484375, 8.4461669921875, 8.7734375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 7.0, 4.0, 8.0, 8.0, 33.0, 38.0, 48.0, 40.0, 78.0, 118.0, 173.0, 228.0, 305.0, 432.0, 452.0, 469.0, 418.0, 373.0, 239.0, 178.0, 134.0, 98.0, 58.0, 42.0, 30.0, 14.0, 13.0, 17.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.4571533203125, -5.187744140625, -4.9183349609375, -4.64892578125, -4.3795166015625, -4.110107421875, -3.8406982421875, -3.5712890625, -3.3018798828125, -3.032470703125, -2.7630615234375, -2.49365234375, -2.2242431640625, -1.954833984375, -1.6854248046875, -1.416015625, -1.1466064453125, -0.877197265625, -0.6077880859375, -0.33837890625, -0.0689697265625, 0.200439453125, 0.4698486328125, 0.7392578125, 1.0086669921875, 1.278076171875, 1.5474853515625, 1.81689453125, 2.0863037109375, 2.355712890625, 2.6251220703125, 2.89453125, 3.1639404296875, 3.433349609375, 3.7027587890625, 3.97216796875, 4.2415771484375, 4.510986328125, 4.7803955078125, 5.0498046875, 5.3192138671875, 5.588623046875, 5.8580322265625, 6.12744140625, 6.3968505859375, 6.666259765625, 6.9356689453125, 7.205078125, 7.4744873046875, 7.743896484375, 8.0133056640625, 8.28271484375, 8.5521240234375, 8.821533203125, 9.0909423828125, 9.3603515625, 9.6297607421875, 9.899169921875, 10.1685791015625, 10.43798828125, 10.7073974609375, 10.976806640625, 11.2462158203125, 11.515625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 8.0, 13.0, 21.0, 17.0, 26.0, 27.0, 46.0, 54.0, 80.0, 109.0, 185.0, 415.0, 1009.0, 3084.0, 12582.0, 69500.0, 495109.0, 2626910.0, 847252.0, 112049.0, 18978.0, 4332.0, 1314.0, 494.0, 209.0, 121.0, 94.0, 60.0, 40.0, 37.0, 27.0, 14.0, 19.0, 17.0, 6.0, 2.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8984375, -12.3951416015625, -11.891845703125, -11.3885498046875, -10.88525390625, -10.3819580078125, -9.878662109375, -9.3753662109375, -8.8720703125, -8.3687744140625, -7.865478515625, -7.3621826171875, -6.85888671875, -6.3555908203125, -5.852294921875, -5.3489990234375, -4.845703125, -4.3424072265625, -3.839111328125, -3.3358154296875, -2.83251953125, -2.3292236328125, -1.825927734375, -1.3226318359375, -0.8193359375, -0.3160400390625, 0.187255859375, 0.6905517578125, 1.19384765625, 1.6971435546875, 2.200439453125, 2.7037353515625, 3.20703125, 3.7103271484375, 4.213623046875, 4.7169189453125, 5.22021484375, 5.7235107421875, 6.226806640625, 6.7301025390625, 7.2333984375, 7.7366943359375, 8.239990234375, 8.7432861328125, 9.24658203125, 9.7498779296875, 10.253173828125, 10.7564697265625, 11.259765625, 11.7630615234375, 12.266357421875, 12.7696533203125, 13.27294921875, 13.7762451171875, 14.279541015625, 14.7828369140625, 15.2861328125, 15.7894287109375, 16.292724609375, 16.7960205078125, 17.29931640625, 17.8026123046875, 18.305908203125, 18.8092041015625, 19.3125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 10.0, 20.0, 35.0, 59.0, 87.0, 117.0, 141.0, 158.0, 100.0, 119.0, 49.0, 56.0, 26.0, 16.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.87264060974121, -17.228172302246094, -15.583703994750977, -13.939234733581543, -12.294766426086426, -10.650298118591309, -9.005828857421875, -7.361360549926758, -5.716892242431641, -4.072423934936523, -2.427955150604248, -0.7834863662719727, 0.8609819412231445, 2.5054502487182617, 4.149919509887695, 5.7943878173828125, 7.43885612487793, 9.083324432373047, 10.727792739868164, 12.372262001037598, 14.016730308532715, 15.661198616027832, 17.305667877197266, 18.950136184692383, 20.5946044921875, 22.239072799682617, 23.883541107177734, 25.528011322021484, 27.17247772216797, 28.81694793701172, 30.461416244506836, 32.10588455200195, 33.75035095214844, 35.39482116699219, 37.03928756713867, 38.68375778198242, 40.328224182128906, 41.972694396972656, 43.617164611816406, 45.26163101196289, 46.906097412109375, 48.550567626953125, 50.19503402709961, 51.83950424194336, 53.483970642089844, 55.128440856933594, 56.772911071777344, 58.41737747192383, 60.06184768676758, 61.70631790161133, 63.35078430175781, 64.99525451660156, 66.63972473144531, 68.28418731689453, 69.92865753173828, 71.57312774658203, 73.21759796142578, 74.86206817626953, 76.50653839111328, 78.1510009765625, 79.79547119140625, 81.43994140625, 83.08441162109375, 84.7288818359375, 86.37334442138672]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 9.0, 6.0, 8.0, 4.0, 10.0, 16.0, 16.0, 20.0, 17.0, 21.0, 21.0, 18.0, 37.0, 30.0, 27.0, 45.0, 30.0, 38.0, 46.0, 34.0, 49.0, 35.0, 27.0, 41.0, 50.0, 34.0, 36.0, 29.0, 35.0, 27.0, 30.0, 24.0, 25.0, 14.0, 11.0, 15.0, 11.0, 11.0, 8.0, 8.0, 5.0, 6.0, 1.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-27.618024826049805, -26.826065063476562, -26.034103393554688, -25.242143630981445, -24.45018196105957, -23.658222198486328, -22.866260528564453, -22.07430076599121, -21.28234100341797, -20.490381240844727, -19.69841957092285, -18.90645980834961, -18.114498138427734, -17.322538375854492, -16.53057861328125, -15.738616943359375, -14.9466552734375, -14.154694557189941, -13.362733840942383, -12.57077407836914, -11.778812408447266, -10.986852645874023, -10.194891929626465, -9.402931213378906, -8.610970497131348, -7.819009780883789, -7.0270490646362305, -6.23508882522583, -5.4431281089782715, -4.651167392730713, -3.8592071533203125, -3.067246437072754, -2.2752838134765625, -1.4833232164382935, -0.6913626194000244, 0.10059785842895508, 0.8925585746765137, 1.6845192909240723, 2.4764795303344727, 3.2684402465820312, 4.06040096282959, 4.852361679077148, 5.644322395324707, 6.436282634735107, 7.228243350982666, 8.020204544067383, 8.812164306640625, 9.604125022888184, 10.396085739135742, 11.1880464553833, 11.98000717163086, 12.771966934204102, 13.563928604125977, 14.355888366699219, 15.147849082946777, 15.939809799194336, 16.731769561767578, 17.52372932434082, 18.315690994262695, 19.107650756835938, 19.899612426757812, 20.691572189331055, 21.483531951904297, 22.275493621826172, 23.067455291748047]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 9.0, 6.0, 9.0, 7.0, 11.0, 14.0, 17.0, 23.0, 18.0, 21.0, 26.0, 20.0, 29.0, 25.0, 31.0, 37.0, 35.0, 42.0, 46.0, 47.0, 36.0, 44.0, 32.0, 30.0, 36.0, 50.0, 30.0, 33.0, 35.0, 27.0, 25.0, 27.0, 18.0, 13.0, 24.0, 16.0, 16.0, 7.0, 6.0, 6.0, 5.0, 8.0, 1.0, 3.0, 2.0, 0.0, 3.0], "bins": [-2.98828125, -2.90899658203125, -2.8297119140625, -2.75042724609375, -2.671142578125, -2.59185791015625, -2.5125732421875, -2.43328857421875, -2.35400390625, -2.27471923828125, -2.1954345703125, -2.11614990234375, -2.036865234375, -1.95758056640625, -1.8782958984375, -1.79901123046875, -1.7197265625, -1.64044189453125, -1.5611572265625, -1.48187255859375, -1.402587890625, -1.32330322265625, -1.2440185546875, -1.16473388671875, -1.08544921875, -1.00616455078125, -0.9268798828125, -0.84759521484375, -0.768310546875, -0.68902587890625, -0.6097412109375, -0.53045654296875, -0.451171875, -0.37188720703125, -0.2926025390625, -0.21331787109375, -0.134033203125, -0.05474853515625, 0.0245361328125, 0.10382080078125, 0.18310546875, 0.26239013671875, 0.3416748046875, 0.42095947265625, 0.500244140625, 0.57952880859375, 0.6588134765625, 0.73809814453125, 0.8173828125, 0.89666748046875, 0.9759521484375, 1.05523681640625, 1.134521484375, 1.21380615234375, 1.2930908203125, 1.37237548828125, 1.45166015625, 1.53094482421875, 1.6102294921875, 1.68951416015625, 1.768798828125, 1.84808349609375, 1.9273681640625, 2.00665283203125, 2.0859375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 6.0, 8.0, 12.0, 15.0, 22.0, 43.0, 59.0, 94.0, 193.0, 337.0, 558.0, 954.0, 1670.0, 2769.0, 4694.0, 7822.0, 12533.0, 19906.0, 30441.0, 44290.0, 60945.0, 78173.0, 95059.0, 107485.0, 113864.0, 107198.0, 94964.0, 78613.0, 59953.0, 43898.0, 30356.0, 19903.0, 12549.0, 7901.0, 4695.0, 2758.0, 1621.0, 935.0, 540.0, 323.0, 163.0, 93.0, 51.0, 37.0, 25.0, 17.0, 7.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5107421875, -1.4595184326171875, -1.408294677734375, -1.3570709228515625, -1.30584716796875, -1.2546234130859375, -1.203399658203125, -1.1521759033203125, -1.1009521484375, -1.0497283935546875, -0.998504638671875, -0.9472808837890625, -0.89605712890625, -0.8448333740234375, -0.793609619140625, -0.7423858642578125, -0.691162109375, -0.6399383544921875, -0.588714599609375, -0.5374908447265625, -0.48626708984375, -0.4350433349609375, -0.383819580078125, -0.3325958251953125, -0.2813720703125, -0.2301483154296875, -0.178924560546875, -0.1277008056640625, -0.07647705078125, -0.0252532958984375, 0.025970458984375, 0.0771942138671875, 0.12841796875, 0.1796417236328125, 0.230865478515625, 0.2820892333984375, 0.33331298828125, 0.3845367431640625, 0.435760498046875, 0.4869842529296875, 0.5382080078125, 0.5894317626953125, 0.640655517578125, 0.6918792724609375, 0.74310302734375, 0.7943267822265625, 0.845550537109375, 0.8967742919921875, 0.947998046875, 0.9992218017578125, 1.050445556640625, 1.1016693115234375, 1.15289306640625, 1.2041168212890625, 1.255340576171875, 1.3065643310546875, 1.3577880859375, 1.4090118408203125, 1.460235595703125, 1.5114593505859375, 1.56268310546875, 1.6139068603515625, 1.665130615234375, 1.7163543701171875, 1.767578125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 2.0, 8.0, 6.0, 6.0, 8.0, 5.0, 11.0, 17.0, 14.0, 17.0, 18.0, 30.0, 13.0, 24.0, 34.0, 25.0, 35.0, 53.0, 32.0, 41.0, 30.0, 44.0, 37.0, 1059.0, 28.0, 30.0, 40.0, 30.0, 29.0, 42.0, 33.0, 32.0, 13.0, 28.0, 15.0, 16.0, 22.0, 14.0, 13.0, 15.0, 12.0, 9.0, 14.0, 4.0, 7.0, 3.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.36328125, -2.284820556640625, -2.20635986328125, -2.127899169921875, -2.0494384765625, -1.970977783203125, -1.89251708984375, -1.814056396484375, -1.735595703125, -1.657135009765625, -1.57867431640625, -1.500213623046875, -1.4217529296875, -1.343292236328125, -1.26483154296875, -1.186370849609375, -1.10791015625, -1.029449462890625, -0.95098876953125, -0.872528076171875, -0.7940673828125, -0.715606689453125, -0.63714599609375, -0.558685302734375, -0.480224609375, -0.401763916015625, -0.32330322265625, -0.244842529296875, -0.1663818359375, -0.087921142578125, -0.00946044921875, 0.069000244140625, 0.1474609375, 0.225921630859375, 0.30438232421875, 0.382843017578125, 0.4613037109375, 0.539764404296875, 0.61822509765625, 0.696685791015625, 0.775146484375, 0.853607177734375, 0.93206787109375, 1.010528564453125, 1.0889892578125, 1.167449951171875, 1.24591064453125, 1.324371337890625, 1.40283203125, 1.481292724609375, 1.55975341796875, 1.638214111328125, 1.7166748046875, 1.795135498046875, 1.87359619140625, 1.952056884765625, 2.030517578125, 2.108978271484375, 2.18743896484375, 2.265899658203125, 2.3443603515625, 2.422821044921875, 2.50128173828125, 2.579742431640625, 2.658203125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 11.0, 15.0, 28.0, 32.0, 73.0, 83.0, 114.0, 182.0, 289.0, 444.0, 624.0, 923.0, 1410.0, 2003.0, 2920.0, 4342.0, 6473.0, 9047.0, 14099.0, 22429.0, 46022.0, 289541.0, 1527880.0, 85728.0, 30012.0, 17373.0, 11172.0, 7561.0, 5302.0, 3566.0, 2392.0, 1669.0, 1075.0, 758.0, 484.0, 334.0, 251.0, 134.0, 114.0, 75.0, 38.0, 35.0, 25.0, 21.0, 13.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6015625, -2.515533447265625, -2.42950439453125, -2.343475341796875, -2.2574462890625, -2.171417236328125, -2.08538818359375, -1.999359130859375, -1.913330078125, -1.827301025390625, -1.74127197265625, -1.655242919921875, -1.5692138671875, -1.483184814453125, -1.39715576171875, -1.311126708984375, -1.22509765625, -1.139068603515625, -1.05303955078125, -0.967010498046875, -0.8809814453125, -0.794952392578125, -0.70892333984375, -0.622894287109375, -0.536865234375, -0.450836181640625, -0.36480712890625, -0.278778076171875, -0.1927490234375, -0.106719970703125, -0.02069091796875, 0.065338134765625, 0.1513671875, 0.237396240234375, 0.32342529296875, 0.409454345703125, 0.4954833984375, 0.581512451171875, 0.66754150390625, 0.753570556640625, 0.839599609375, 0.925628662109375, 1.01165771484375, 1.097686767578125, 1.1837158203125, 1.269744873046875, 1.35577392578125, 1.441802978515625, 1.52783203125, 1.613861083984375, 1.69989013671875, 1.785919189453125, 1.8719482421875, 1.957977294921875, 2.04400634765625, 2.130035400390625, 2.216064453125, 2.302093505859375, 2.38812255859375, 2.474151611328125, 2.5601806640625, 2.646209716796875, 2.73223876953125, 2.818267822265625, 2.904296875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 4.0, 4.0, 5.0, 13.0, 13.0, 13.0, 17.0, 20.0, 15.0, 23.0, 26.0, 21.0, 29.0, 30.0, 29.0, 40.0, 25.0, 36.0, 37.0, 35.0, 24.0, 24.0, 28.0, 38.0, 40.0, 43.0, 30.0, 32.0, 28.0, 23.0, 28.0, 30.0, 22.0, 29.0, 24.0, 18.0, 25.0, 14.0, 9.0, 12.0, 12.0, 6.0, 8.0, 6.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.350830078125, -0.340118408203125, -0.32940673828125, -0.318695068359375, -0.3079833984375, -0.297271728515625, -0.28656005859375, -0.275848388671875, -0.26513671875, -0.254425048828125, -0.24371337890625, -0.233001708984375, -0.2222900390625, -0.211578369140625, -0.20086669921875, -0.190155029296875, -0.179443359375, -0.168731689453125, -0.15802001953125, -0.147308349609375, -0.1365966796875, -0.125885009765625, -0.11517333984375, -0.104461669921875, -0.09375, -0.083038330078125, -0.07232666015625, -0.061614990234375, -0.0509033203125, -0.040191650390625, -0.02947998046875, -0.018768310546875, -0.008056640625, 0.002655029296875, 0.01336669921875, 0.024078369140625, 0.0347900390625, 0.045501708984375, 0.05621337890625, 0.066925048828125, 0.07763671875, 0.088348388671875, 0.09906005859375, 0.109771728515625, 0.1204833984375, 0.131195068359375, 0.14190673828125, 0.152618408203125, 0.163330078125, 0.174041748046875, 0.18475341796875, 0.195465087890625, 0.2061767578125, 0.216888427734375, 0.22760009765625, 0.238311767578125, 0.2490234375, 0.259735107421875, 0.27044677734375, 0.281158447265625, 0.2918701171875, 0.302581787109375, 0.31329345703125, 0.324005126953125, 0.334716796875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 0.0, 12.0, 1.0, 4.0, 12.0, 17.0, 22.0, 21.0, 26.0, 39.0, 63.0, 63.0, 80.0, 99.0, 92.0, 102.0, 137.0, 126.0, 183.0, 243.0, 314.0, 442.0, 1731.0, 77701.0, 920321.0, 43433.0, 1210.0, 426.0, 294.0, 218.0, 173.0, 176.0, 118.0, 115.0, 110.0, 77.0, 76.0, 61.0, 53.0, 41.0, 34.0, 22.0, 16.0, 12.0, 13.0, 10.0, 3.0, 3.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.453125, -5.2796630859375, -5.106201171875, -4.9327392578125, -4.75927734375, -4.5858154296875, -4.412353515625, -4.2388916015625, -4.0654296875, -3.8919677734375, -3.718505859375, -3.5450439453125, -3.37158203125, -3.1981201171875, -3.024658203125, -2.8511962890625, -2.677734375, -2.5042724609375, -2.330810546875, -2.1573486328125, -1.98388671875, -1.8104248046875, -1.636962890625, -1.4635009765625, -1.2900390625, -1.1165771484375, -0.943115234375, -0.7696533203125, -0.59619140625, -0.4227294921875, -0.249267578125, -0.0758056640625, 0.09765625, 0.2711181640625, 0.444580078125, 0.6180419921875, 0.79150390625, 0.9649658203125, 1.138427734375, 1.3118896484375, 1.4853515625, 1.6588134765625, 1.832275390625, 2.0057373046875, 2.17919921875, 2.3526611328125, 2.526123046875, 2.6995849609375, 2.873046875, 3.0465087890625, 3.219970703125, 3.3934326171875, 3.56689453125, 3.7403564453125, 3.913818359375, 4.0872802734375, 4.2607421875, 4.4342041015625, 4.607666015625, 4.7811279296875, 4.95458984375, 5.1280517578125, 5.301513671875, 5.4749755859375, 5.6484375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 10.0, 56.0, 618.0, 303.0, 25.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.485300064086914, -30.732196807861328, -29.979093551635742, -29.225990295410156, -28.47288703918457, -27.719783782958984, -26.9666805267334, -26.213577270507812, -25.460474014282227, -24.70737075805664, -23.954267501831055, -23.20116424560547, -22.448060989379883, -21.694957733154297, -20.94185447692871, -20.188751220703125, -19.43564796447754, -18.682544708251953, -17.929441452026367, -17.17633819580078, -16.423234939575195, -15.67013168334961, -14.917028427124023, -14.163925170898438, -13.410821914672852, -12.657718658447266, -11.90461540222168, -11.151512145996094, -10.398408889770508, -9.645305633544922, -8.892202377319336, -8.13909912109375, -7.385997772216797, -6.632894515991211, -5.879791259765625, -5.126688003540039, -4.373584747314453, -3.620481491088867, -2.8673782348632812, -2.1142749786376953, -1.3611717224121094, -0.6080684661865234, 0.1450347900390625, 0.8981380462646484, 1.6512413024902344, 2.4043445587158203, 3.1574478149414062, 3.910551071166992, 4.663654327392578, 5.416757583618164, 6.16986083984375, 6.922964096069336, 7.676067352294922, 8.429170608520508, 9.182273864746094, 9.93537712097168, 10.688480377197266, 11.441583633422852, 12.194686889648438, 12.947790145874023, 13.70089340209961, 14.453996658325195, 15.207099914550781, 15.960203170776367, 16.713306427001953]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 6.0, 11.0, 5.0, 10.0, 11.0, 14.0, 18.0, 22.0, 29.0, 28.0, 31.0, 45.0, 30.0, 36.0, 56.0, 37.0, 48.0, 53.0, 64.0, 47.0, 47.0, 31.0, 52.0, 36.0, 38.0, 34.0, 26.0, 30.0, 17.0, 22.0, 18.0, 20.0, 7.0, 9.0, 5.0, 5.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.901732921600342, -4.7468085289001465, -4.591884613037109, -4.436960220336914, -4.282036304473877, -4.127111911773682, -3.9721877574920654, -3.817263603210449, -3.662339448928833, -3.507415294647217, -3.3524911403656006, -3.1975669860839844, -3.042642593383789, -2.887718677520752, -2.7327942848205566, -2.5778701305389404, -2.422945976257324, -2.268021821975708, -2.113097667694092, -1.958173394203186, -1.8032492399215698, -1.6483250856399536, -1.4934008121490479, -1.3384766578674316, -1.1835525035858154, -1.0286283493041992, -0.8737041354179382, -0.7187799215316772, -0.563855767250061, -0.4089316129684448, -0.25400739908218384, -0.09908318519592285, 0.05584144592285156, 0.21076563000679016, 0.36568981409072876, 0.5206140279769897, 0.675538182258606, 0.8304623365402222, 0.9853865504264832, 1.1403107643127441, 1.2952349185943604, 1.4501590728759766, 1.6050832271575928, 1.7600075006484985, 1.9149316549301147, 2.0698556900024414, 2.2247800827026367, 2.379704236984253, 2.534628391265869, 2.6895525455474854, 2.8444766998291016, 2.9994008541107178, 3.154325008392334, 3.3092494010925293, 3.4641735553741455, 3.6190977096557617, 3.774021863937378, 3.928946018218994, 4.0838704109191895, 4.238794326782227, 4.393718719482422, 4.548642635345459, 4.703567028045654, 4.858490943908691, 5.013415336608887]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 5.0, 8.0, 5.0, 14.0, 14.0, 12.0, 20.0, 22.0, 22.0, 16.0, 20.0, 29.0, 37.0, 26.0, 33.0, 31.0, 31.0, 32.0, 36.0, 37.0, 57.0, 41.0, 36.0, 52.0, 33.0, 41.0, 36.0, 36.0, 26.0, 24.0, 17.0, 21.0, 22.0, 32.0, 14.0, 14.0, 10.0, 10.0, 7.0, 8.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.029296875, -2.9493408203125, -2.869384765625, -2.7894287109375, -2.70947265625, -2.6295166015625, -2.549560546875, -2.4696044921875, -2.3896484375, -2.3096923828125, -2.229736328125, -2.1497802734375, -2.06982421875, -1.9898681640625, -1.909912109375, -1.8299560546875, -1.75, -1.6700439453125, -1.590087890625, -1.5101318359375, -1.43017578125, -1.3502197265625, -1.270263671875, -1.1903076171875, -1.1103515625, -1.0303955078125, -0.950439453125, -0.8704833984375, -0.79052734375, -0.7105712890625, -0.630615234375, -0.5506591796875, -0.470703125, -0.3907470703125, -0.310791015625, -0.2308349609375, -0.15087890625, -0.0709228515625, 0.009033203125, 0.0889892578125, 0.1689453125, 0.2489013671875, 0.328857421875, 0.4088134765625, 0.48876953125, 0.5687255859375, 0.648681640625, 0.7286376953125, 0.80859375, 0.8885498046875, 0.968505859375, 1.0484619140625, 1.12841796875, 1.2083740234375, 1.288330078125, 1.3682861328125, 1.4482421875, 1.5281982421875, 1.608154296875, 1.6881103515625, 1.76806640625, 1.8480224609375, 1.927978515625, 2.0079345703125, 2.087890625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 7.0, 13.0, 24.0, 22.0, 60.0, 63.0, 113.0, 173.0, 247.0, 372.0, 594.0, 856.0, 1292.0, 1694.0, 2471.0, 3660.0, 4980.0, 7698.0, 12770.0, 28679.0, 93510.0, 344410.0, 370386.0, 104361.0, 31339.0, 13507.0, 7919.0, 5322.0, 3737.0, 2580.0, 1837.0, 1262.0, 895.0, 547.0, 395.0, 258.0, 163.0, 118.0, 75.0, 53.0, 39.0, 21.0, 14.0, 7.0, 2.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.12109375, -3.97918701171875, -3.8372802734375, -3.69537353515625, -3.553466796875, -3.41156005859375, -3.2696533203125, -3.12774658203125, -2.98583984375, -2.84393310546875, -2.7020263671875, -2.56011962890625, -2.418212890625, -2.27630615234375, -2.1343994140625, -1.99249267578125, -1.8505859375, -1.70867919921875, -1.5667724609375, -1.42486572265625, -1.282958984375, -1.14105224609375, -0.9991455078125, -0.85723876953125, -0.71533203125, -0.57342529296875, -0.4315185546875, -0.28961181640625, -0.147705078125, -0.00579833984375, 0.1361083984375, 0.27801513671875, 0.419921875, 0.56182861328125, 0.7037353515625, 0.84564208984375, 0.987548828125, 1.12945556640625, 1.2713623046875, 1.41326904296875, 1.55517578125, 1.69708251953125, 1.8389892578125, 1.98089599609375, 2.122802734375, 2.26470947265625, 2.4066162109375, 2.54852294921875, 2.6904296875, 2.83233642578125, 2.9742431640625, 3.11614990234375, 3.258056640625, 3.39996337890625, 3.5418701171875, 3.68377685546875, 3.82568359375, 3.96759033203125, 4.1094970703125, 4.25140380859375, 4.393310546875, 4.53521728515625, 4.6771240234375, 4.81903076171875, 4.9609375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 11.0, 6.0, 7.0, 7.0, 7.0, 10.0, 23.0, 15.0, 23.0, 29.0, 17.0, 29.0, 24.0, 34.0, 30.0, 40.0, 57.0, 48.0, 73.0, 146.0, 298.0, 1370.0, 188.0, 86.0, 69.0, 58.0, 44.0, 29.0, 46.0, 33.0, 29.0, 25.0, 18.0, 15.0, 18.0, 14.0, 12.0, 10.0, 5.0, 5.0, 13.0, 5.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.90625, -8.6207275390625, -8.335205078125, -8.0496826171875, -7.76416015625, -7.4786376953125, -7.193115234375, -6.9075927734375, -6.6220703125, -6.3365478515625, -6.051025390625, -5.7655029296875, -5.47998046875, -5.1944580078125, -4.908935546875, -4.6234130859375, -4.337890625, -4.0523681640625, -3.766845703125, -3.4813232421875, -3.19580078125, -2.9102783203125, -2.624755859375, -2.3392333984375, -2.0537109375, -1.7681884765625, -1.482666015625, -1.1971435546875, -0.91162109375, -0.6260986328125, -0.340576171875, -0.0550537109375, 0.23046875, 0.5159912109375, 0.801513671875, 1.0870361328125, 1.37255859375, 1.6580810546875, 1.943603515625, 2.2291259765625, 2.5146484375, 2.8001708984375, 3.085693359375, 3.3712158203125, 3.65673828125, 3.9422607421875, 4.227783203125, 4.5133056640625, 4.798828125, 5.0843505859375, 5.369873046875, 5.6553955078125, 5.94091796875, 6.2264404296875, 6.511962890625, 6.7974853515625, 7.0830078125, 7.3685302734375, 7.654052734375, 7.9395751953125, 8.22509765625, 8.5106201171875, 8.796142578125, 9.0816650390625, 9.3671875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 8.0, 13.0, 11.0, 15.0, 20.0, 24.0, 34.0, 33.0, 49.0, 61.0, 93.0, 130.0, 258.0, 526.0, 1167.0, 2740.0, 7136.0, 22146.0, 104543.0, 2040854.0, 879731.0, 61136.0, 15586.0, 5187.0, 2062.0, 962.0, 413.0, 209.0, 129.0, 86.0, 62.0, 53.0, 40.0, 37.0, 21.0, 20.0, 25.0, 10.0, 10.0, 13.0, 5.0, 7.0, 5.0, 2.0, 4.0, 9.0, 4.0, 1.0], "bins": [-13.6171875, -13.2374267578125, -12.857666015625, -12.4779052734375, -12.09814453125, -11.7183837890625, -11.338623046875, -10.9588623046875, -10.5791015625, -10.1993408203125, -9.819580078125, -9.4398193359375, -9.06005859375, -8.6802978515625, -8.300537109375, -7.9207763671875, -7.541015625, -7.1612548828125, -6.781494140625, -6.4017333984375, -6.02197265625, -5.6422119140625, -5.262451171875, -4.8826904296875, -4.5029296875, -4.1231689453125, -3.743408203125, -3.3636474609375, -2.98388671875, -2.6041259765625, -2.224365234375, -1.8446044921875, -1.46484375, -1.0850830078125, -0.705322265625, -0.3255615234375, 0.05419921875, 0.4339599609375, 0.813720703125, 1.1934814453125, 1.5732421875, 1.9530029296875, 2.332763671875, 2.7125244140625, 3.09228515625, 3.4720458984375, 3.851806640625, 4.2315673828125, 4.611328125, 4.9910888671875, 5.370849609375, 5.7506103515625, 6.13037109375, 6.5101318359375, 6.889892578125, 7.2696533203125, 7.6494140625, 8.0291748046875, 8.408935546875, 8.7886962890625, 9.16845703125, 9.5482177734375, 9.927978515625, 10.3077392578125, 10.6875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 12.0, 116.0, 489.0, 356.0, 38.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-191.65777587890625, -187.9557342529297, -184.2537078857422, -180.55166625976562, -176.84963989257812, -173.14759826660156, -169.44557189941406, -165.7435302734375, -162.04150390625, -158.33946228027344, -154.63743591308594, -150.93539428710938, -147.23336791992188, -143.5313262939453, -139.8292999267578, -136.12725830078125, -132.4252166748047, -128.72317504882812, -125.02114868164062, -121.3191146850586, -117.61708068847656, -113.9150390625, -110.2130126953125, -106.51097106933594, -102.80894470214844, -99.1069107055664, -95.40487670898438, -91.70284271240234, -88.00080871582031, -84.29876708984375, -80.59674072265625, -76.89469909667969, -73.19267272949219, -69.49063873291016, -65.78860473632812, -62.086570739746094, -58.3845329284668, -54.682498931884766, -50.980464935302734, -47.27842712402344, -43.576393127441406, -39.874359130859375, -36.172325134277344, -32.47029113769531, -28.768253326416016, -25.066219329833984, -21.364185333251953, -17.66214942932129, -13.960113525390625, -10.258078575134277, -6.556044101715088, -2.8540096282958984, 0.8480253219604492, 4.550060272216797, 8.252094268798828, 11.954130172729492, 15.656164169311523, 19.358198165893555, 23.06023406982422, 26.76226806640625, 30.46430206298828, 34.16633605957031, 37.868370056152344, 41.57040786743164, 45.27244186401367]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 10.0, 7.0, 6.0, 17.0, 15.0, 22.0, 18.0, 21.0, 30.0, 16.0, 38.0, 34.0, 29.0, 27.0, 39.0, 35.0, 47.0, 42.0, 44.0, 36.0, 44.0, 51.0, 44.0, 39.0, 25.0, 33.0, 37.0, 24.0, 22.0, 23.0, 13.0, 15.0, 12.0, 18.0, 14.0, 11.0, 9.0, 6.0, 3.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.288494110107422, -28.27434539794922, -27.260196685791016, -26.24604606628418, -25.231897354125977, -24.217748641967773, -23.203598022460938, -22.189449310302734, -21.17530059814453, -20.161151885986328, -19.147003173828125, -18.13285255432129, -17.118703842163086, -16.104555130004883, -15.090405464172363, -14.076255798339844, -13.06210708618164, -12.047958374023438, -11.033808708190918, -10.019659042358398, -9.005510330200195, -7.991361141204834, -6.977211952209473, -5.963062763214111, -4.94891357421875, -3.9347643852233887, -2.9206151962280273, -1.906466007232666, -0.8923168182373047, 0.12183237075805664, 1.135981559753418, 2.1501307487487793, 3.164276123046875, 4.178425312042236, 5.192574501037598, 6.206723690032959, 7.22087287902832, 8.235021591186523, 9.249171257019043, 10.263320922851562, 11.277469635009766, 12.291618347167969, 13.305768013000488, 14.319917678833008, 15.334066390991211, 16.348215103149414, 17.36236572265625, 18.376514434814453, 19.390663146972656, 20.40481185913086, 21.418960571289062, 22.4331111907959, 23.4472599029541, 24.461408615112305, 25.47555923461914, 26.489707946777344, 27.503856658935547, 28.51800537109375, 29.532154083251953, 30.54630470275879, 31.560453414916992, 32.57460403442383, 33.58875274658203, 34.602901458740234, 35.61705017089844]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 5.0, 9.0, 9.0, 8.0, 9.0, 20.0, 15.0, 15.0, 17.0, 19.0, 27.0, 25.0, 24.0, 31.0, 25.0, 24.0, 35.0, 37.0, 38.0, 41.0, 40.0, 38.0, 48.0, 42.0, 29.0, 39.0, 42.0, 30.0, 29.0, 36.0, 23.0, 30.0, 18.0, 17.0, 19.0, 10.0, 21.0, 10.0, 11.0, 7.0, 8.0, 9.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0], "bins": [-3.169921875, -3.084808349609375, -2.99969482421875, -2.914581298828125, -2.8294677734375, -2.744354248046875, -2.65924072265625, -2.574127197265625, -2.489013671875, -2.403900146484375, -2.31878662109375, -2.233673095703125, -2.1485595703125, -2.063446044921875, -1.97833251953125, -1.893218994140625, -1.80810546875, -1.722991943359375, -1.63787841796875, -1.552764892578125, -1.4676513671875, -1.382537841796875, -1.29742431640625, -1.212310791015625, -1.127197265625, -1.042083740234375, -0.95697021484375, -0.871856689453125, -0.7867431640625, -0.701629638671875, -0.61651611328125, -0.531402587890625, -0.4462890625, -0.361175537109375, -0.27606201171875, -0.190948486328125, -0.1058349609375, -0.020721435546875, 0.06439208984375, 0.149505615234375, 0.234619140625, 0.319732666015625, 0.40484619140625, 0.489959716796875, 0.5750732421875, 0.660186767578125, 0.74530029296875, 0.830413818359375, 0.91552734375, 1.000640869140625, 1.08575439453125, 1.170867919921875, 1.2559814453125, 1.341094970703125, 1.42620849609375, 1.511322021484375, 1.596435546875, 1.681549072265625, 1.76666259765625, 1.851776123046875, 1.9368896484375, 2.022003173828125, 2.10711669921875, 2.192230224609375, 2.27734375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 6.0, 12.0, 8.0, 9.0, 20.0, 24.0, 24.0, 27.0, 35.0, 41.0, 56.0, 70.0, 105.0, 188.0, 462.0, 1246.0, 4779.0, 22258.0, 142515.0, 1696959.0, 2108563.0, 181723.0, 27135.0, 5475.0, 1416.0, 471.0, 193.0, 111.0, 80.0, 58.0, 40.0, 29.0, 25.0, 25.0, 18.0, 18.0, 11.0, 10.0, 7.0, 3.0, 6.0, 9.0, 2.0, 2.0, 1.0, 5.0, 0.0, 1.0], "bins": [-11.84375, -11.5152587890625, -11.186767578125, -10.8582763671875, -10.52978515625, -10.2012939453125, -9.872802734375, -9.5443115234375, -9.2158203125, -8.8873291015625, -8.558837890625, -8.2303466796875, -7.90185546875, -7.5733642578125, -7.244873046875, -6.9163818359375, -6.587890625, -6.2593994140625, -5.930908203125, -5.6024169921875, -5.27392578125, -4.9454345703125, -4.616943359375, -4.2884521484375, -3.9599609375, -3.6314697265625, -3.302978515625, -2.9744873046875, -2.64599609375, -2.3175048828125, -1.989013671875, -1.6605224609375, -1.33203125, -1.0035400390625, -0.675048828125, -0.3465576171875, -0.01806640625, 0.3104248046875, 0.638916015625, 0.9674072265625, 1.2958984375, 1.6243896484375, 1.952880859375, 2.2813720703125, 2.60986328125, 2.9383544921875, 3.266845703125, 3.5953369140625, 3.923828125, 4.2523193359375, 4.580810546875, 4.9093017578125, 5.23779296875, 5.5662841796875, 5.894775390625, 6.2232666015625, 6.5517578125, 6.8802490234375, 7.208740234375, 7.5372314453125, 7.86572265625, 8.1942138671875, 8.522705078125, 8.8511962890625, 9.1796875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 9.0, 8.0, 10.0, 24.0, 22.0, 25.0, 39.0, 74.0, 105.0, 117.0, 164.0, 214.0, 286.0, 382.0, 444.0, 445.0, 396.0, 350.0, 261.0, 165.0, 134.0, 109.0, 86.0, 66.0, 32.0, 22.0, 25.0, 12.0, 11.0, 7.0, 11.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.82421875, -6.57366943359375, -6.3231201171875, -6.07257080078125, -5.822021484375, -5.57147216796875, -5.3209228515625, -5.07037353515625, -4.81982421875, -4.56927490234375, -4.3187255859375, -4.06817626953125, -3.817626953125, -3.56707763671875, -3.3165283203125, -3.06597900390625, -2.8154296875, -2.56488037109375, -2.3143310546875, -2.06378173828125, -1.813232421875, -1.56268310546875, -1.3121337890625, -1.06158447265625, -0.81103515625, -0.56048583984375, -0.3099365234375, -0.05938720703125, 0.191162109375, 0.44171142578125, 0.6922607421875, 0.94281005859375, 1.193359375, 1.44390869140625, 1.6944580078125, 1.94500732421875, 2.195556640625, 2.44610595703125, 2.6966552734375, 2.94720458984375, 3.19775390625, 3.44830322265625, 3.6988525390625, 3.94940185546875, 4.199951171875, 4.45050048828125, 4.7010498046875, 4.95159912109375, 5.2021484375, 5.45269775390625, 5.7032470703125, 5.95379638671875, 6.204345703125, 6.45489501953125, 6.7054443359375, 6.95599365234375, 7.20654296875, 7.45709228515625, 7.7076416015625, 7.95819091796875, 8.208740234375, 8.45928955078125, 8.7098388671875, 8.96038818359375, 9.2109375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 12.0, 9.0, 5.0, 14.0, 19.0, 22.0, 44.0, 48.0, 78.0, 78.0, 119.0, 201.0, 340.0, 664.0, 1462.0, 4036.0, 13909.0, 54897.0, 274530.0, 1597485.0, 1834573.0, 324473.0, 63904.0, 15456.0, 4552.0, 1610.0, 719.0, 356.0, 199.0, 114.0, 91.0, 61.0, 47.0, 35.0, 30.0, 22.0, 13.0, 16.0, 12.0, 3.0, 9.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-13.9609375, -13.5509033203125, -13.140869140625, -12.7308349609375, -12.32080078125, -11.9107666015625, -11.500732421875, -11.0906982421875, -10.6806640625, -10.2706298828125, -9.860595703125, -9.4505615234375, -9.04052734375, -8.6304931640625, -8.220458984375, -7.8104248046875, -7.400390625, -6.9903564453125, -6.580322265625, -6.1702880859375, -5.76025390625, -5.3502197265625, -4.940185546875, -4.5301513671875, -4.1201171875, -3.7100830078125, -3.300048828125, -2.8900146484375, -2.47998046875, -2.0699462890625, -1.659912109375, -1.2498779296875, -0.83984375, -0.4298095703125, -0.019775390625, 0.3902587890625, 0.80029296875, 1.2103271484375, 1.620361328125, 2.0303955078125, 2.4404296875, 2.8504638671875, 3.260498046875, 3.6705322265625, 4.08056640625, 4.4906005859375, 4.900634765625, 5.3106689453125, 5.720703125, 6.1307373046875, 6.540771484375, 6.9508056640625, 7.36083984375, 7.7708740234375, 8.180908203125, 8.5909423828125, 9.0009765625, 9.4110107421875, 9.821044921875, 10.2310791015625, 10.64111328125, 11.0511474609375, 11.461181640625, 11.8712158203125, 12.28125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 25.0, 53.0, 130.0, 192.0, 231.0, 180.0, 118.0, 64.0, 12.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.33665466308594, -118.47526550292969, -115.61387634277344, -112.75248718261719, -109.89109802246094, -107.02971649169922, -104.16832733154297, -101.30693817138672, -98.44554901123047, -95.58415985107422, -92.72277069091797, -89.86138153076172, -87.0, -84.13861083984375, -81.2772216796875, -78.41583251953125, -75.554443359375, -72.69305419921875, -69.8316650390625, -66.97027587890625, -64.10888671875, -61.247501373291016, -58.38611602783203, -55.52472686767578, -52.66333770751953, -49.80194854736328, -46.94055938720703, -44.07917404174805, -41.2177848815918, -38.35639572143555, -35.49501037597656, -32.63362121582031, -29.772235870361328, -26.910846710205078, -24.04945945739746, -21.188072204589844, -18.326683044433594, -15.46529483795166, -12.603906631469727, -9.74251937866211, -6.881130218505859, -4.019742012023926, -1.1583538055419922, 1.7030344009399414, 4.564422607421875, 7.425810813903809, 10.287199020385742, 13.14858627319336, 16.00997543334961, 18.87136459350586, 21.732751846313477, 24.594139099121094, 27.455528259277344, 30.316917419433594, 33.178306579589844, 36.03969192504883, 38.90108108520508, 41.76247024536133, 44.62385559082031, 47.48524475097656, 50.34663391113281, 53.20802307128906, 56.06941223144531, 58.9307975769043, 61.79218673706055]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 3.0, 6.0, 9.0, 5.0, 10.0, 10.0, 8.0, 15.0, 13.0, 21.0, 16.0, 18.0, 25.0, 35.0, 24.0, 31.0, 29.0, 30.0, 44.0, 40.0, 48.0, 38.0, 34.0, 41.0, 36.0, 29.0, 42.0, 26.0, 26.0, 35.0, 29.0, 29.0, 20.0, 15.0, 21.0, 23.0, 21.0, 14.0, 15.0, 15.0, 10.0, 4.0, 4.0, 9.0, 3.0, 6.0, 8.0, 0.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-22.52098846435547, -21.789676666259766, -21.058364868164062, -20.327054977416992, -19.59574317932129, -18.864431381225586, -18.133121490478516, -17.401809692382812, -16.67049789428711, -15.939186096191406, -15.20787525177002, -14.476564407348633, -13.74525260925293, -13.013940811157227, -12.28262996673584, -11.551319122314453, -10.82000732421875, -10.088695526123047, -9.35738468170166, -8.626073837280273, -7.89476203918457, -7.163450717926025, -6.4321393966674805, -5.7008280754089355, -4.969516754150391, -4.238205432891846, -3.506894111633301, -2.775582790374756, -2.044271469116211, -1.312960147857666, -0.5816488265991211, 0.14966249465942383, 0.8809738159179688, 1.6122851371765137, 2.3435964584350586, 3.0749077796936035, 3.8062191009521484, 4.537530422210693, 5.268841743469238, 6.000153064727783, 6.731464385986328, 7.462775707244873, 8.194087028503418, 8.925397872924805, 9.656709671020508, 10.388021469116211, 11.119332313537598, 11.850643157958984, 12.581954956054688, 13.31326675415039, 14.044577598571777, 14.775888442993164, 15.507200241088867, 16.23851203918457, 16.96982192993164, 17.701133728027344, 18.432445526123047, 19.16375732421875, 19.895069122314453, 20.626379013061523, 21.357690811157227, 22.08900260925293, 22.8203125, 23.551624298095703, 24.282936096191406]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 10.0, 8.0, 11.0, 11.0, 20.0, 15.0, 15.0, 22.0, 18.0, 30.0, 32.0, 30.0, 34.0, 42.0, 33.0, 41.0, 44.0, 50.0, 50.0, 30.0, 37.0, 39.0, 39.0, 28.0, 32.0, 28.0, 35.0, 32.0, 32.0, 28.0, 22.0, 18.0, 17.0, 22.0, 11.0, 11.0, 9.0, 5.0, 2.0, 7.0, 1.0, 0.0, 1.0], "bins": [-3.712890625, -3.61956787109375, -3.5262451171875, -3.43292236328125, -3.339599609375, -3.24627685546875, -3.1529541015625, -3.05963134765625, -2.96630859375, -2.87298583984375, -2.7796630859375, -2.68634033203125, -2.593017578125, -2.49969482421875, -2.4063720703125, -2.31304931640625, -2.2197265625, -2.12640380859375, -2.0330810546875, -1.93975830078125, -1.846435546875, -1.75311279296875, -1.6597900390625, -1.56646728515625, -1.47314453125, -1.37982177734375, -1.2864990234375, -1.19317626953125, -1.099853515625, -1.00653076171875, -0.9132080078125, -0.81988525390625, -0.7265625, -0.63323974609375, -0.5399169921875, -0.44659423828125, -0.353271484375, -0.25994873046875, -0.1666259765625, -0.07330322265625, 0.02001953125, 0.11334228515625, 0.2066650390625, 0.29998779296875, 0.393310546875, 0.48663330078125, 0.5799560546875, 0.67327880859375, 0.7666015625, 0.85992431640625, 0.9532470703125, 1.04656982421875, 1.139892578125, 1.23321533203125, 1.3265380859375, 1.41986083984375, 1.51318359375, 1.60650634765625, 1.6998291015625, 1.79315185546875, 1.886474609375, 1.97979736328125, 2.0731201171875, 2.16644287109375, 2.259765625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 12.0, 14.0, 19.0, 52.0, 93.0, 130.0, 205.0, 374.0, 619.0, 1077.0, 1757.0, 2824.0, 4622.0, 7390.0, 11330.0, 17209.0, 25325.0, 35929.0, 49203.0, 63735.0, 78964.0, 93910.0, 104508.0, 107333.0, 99276.0, 86256.0, 70242.0, 55780.0, 42155.0, 29833.0, 20845.0, 13759.0, 9138.0, 5650.0, 3530.0, 2241.0, 1269.0, 766.0, 466.0, 314.0, 167.0, 88.0, 62.0, 39.0, 15.0, 11.0, 6.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6103515625, -1.5570831298828125, -1.503814697265625, -1.4505462646484375, -1.39727783203125, -1.3440093994140625, -1.290740966796875, -1.2374725341796875, -1.1842041015625, -1.1309356689453125, -1.077667236328125, -1.0243988037109375, -0.97113037109375, -0.9178619384765625, -0.864593505859375, -0.8113250732421875, -0.758056640625, -0.7047882080078125, -0.651519775390625, -0.5982513427734375, -0.54498291015625, -0.4917144775390625, -0.438446044921875, -0.3851776123046875, -0.3319091796875, -0.2786407470703125, -0.225372314453125, -0.1721038818359375, -0.11883544921875, -0.0655670166015625, -0.012298583984375, 0.0409698486328125, 0.09423828125, 0.1475067138671875, 0.200775146484375, 0.2540435791015625, 0.30731201171875, 0.3605804443359375, 0.413848876953125, 0.4671173095703125, 0.5203857421875, 0.5736541748046875, 0.626922607421875, 0.6801910400390625, 0.73345947265625, 0.7867279052734375, 0.839996337890625, 0.8932647705078125, 0.946533203125, 0.9998016357421875, 1.053070068359375, 1.1063385009765625, 1.15960693359375, 1.2128753662109375, 1.266143798828125, 1.3194122314453125, 1.3726806640625, 1.4259490966796875, 1.479217529296875, 1.5324859619140625, 1.58575439453125, 1.6390228271484375, 1.692291259765625, 1.7455596923828125, 1.798828125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 1.0, 7.0, 5.0, 1.0, 2.0, 8.0, 6.0, 10.0, 8.0, 12.0, 12.0, 15.0, 18.0, 16.0, 26.0, 32.0, 30.0, 31.0, 35.0, 32.0, 35.0, 27.0, 45.0, 40.0, 1070.0, 28.0, 40.0, 32.0, 36.0, 37.0, 30.0, 43.0, 38.0, 27.0, 29.0, 19.0, 20.0, 18.0, 23.0, 13.0, 8.0, 13.0, 9.0, 7.0, 11.0, 9.0, 5.0, 3.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.240234375, -3.144500732421875, -3.04876708984375, -2.953033447265625, -2.8572998046875, -2.761566162109375, -2.66583251953125, -2.570098876953125, -2.474365234375, -2.378631591796875, -2.28289794921875, -2.187164306640625, -2.0914306640625, -1.995697021484375, -1.89996337890625, -1.804229736328125, -1.70849609375, -1.612762451171875, -1.51702880859375, -1.421295166015625, -1.3255615234375, -1.229827880859375, -1.13409423828125, -1.038360595703125, -0.942626953125, -0.846893310546875, -0.75115966796875, -0.655426025390625, -0.5596923828125, -0.463958740234375, -0.36822509765625, -0.272491455078125, -0.1767578125, -0.081024169921875, 0.01470947265625, 0.110443115234375, 0.2061767578125, 0.301910400390625, 0.39764404296875, 0.493377685546875, 0.589111328125, 0.684844970703125, 0.78057861328125, 0.876312255859375, 0.9720458984375, 1.067779541015625, 1.16351318359375, 1.259246826171875, 1.35498046875, 1.450714111328125, 1.54644775390625, 1.642181396484375, 1.7379150390625, 1.833648681640625, 1.92938232421875, 2.025115966796875, 2.120849609375, 2.216583251953125, 2.31231689453125, 2.408050537109375, 2.5037841796875, 2.599517822265625, 2.69525146484375, 2.790985107421875, 2.88671875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 9.0, 14.0, 23.0, 40.0, 56.0, 73.0, 125.0, 194.0, 264.0, 396.0, 595.0, 908.0, 1285.0, 1964.0, 3012.0, 4226.0, 6268.0, 9386.0, 14083.0, 23134.0, 49780.0, 413683.0, 1420424.0, 71875.0, 27308.0, 15944.0, 10450.0, 6959.0, 4748.0, 3267.0, 2285.0, 1482.0, 964.0, 649.0, 463.0, 259.0, 189.0, 109.0, 85.0, 46.0, 41.0, 31.0, 15.0, 9.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-3.53515625, -3.431610107421875, -3.32806396484375, -3.224517822265625, -3.1209716796875, -3.017425537109375, -2.91387939453125, -2.810333251953125, -2.706787109375, -2.603240966796875, -2.49969482421875, -2.396148681640625, -2.2926025390625, -2.189056396484375, -2.08551025390625, -1.981964111328125, -1.87841796875, -1.774871826171875, -1.67132568359375, -1.567779541015625, -1.4642333984375, -1.360687255859375, -1.25714111328125, -1.153594970703125, -1.050048828125, -0.946502685546875, -0.84295654296875, -0.739410400390625, -0.6358642578125, -0.532318115234375, -0.42877197265625, -0.325225830078125, -0.2216796875, -0.118133544921875, -0.01458740234375, 0.088958740234375, 0.1925048828125, 0.296051025390625, 0.39959716796875, 0.503143310546875, 0.606689453125, 0.710235595703125, 0.81378173828125, 0.917327880859375, 1.0208740234375, 1.124420166015625, 1.22796630859375, 1.331512451171875, 1.43505859375, 1.538604736328125, 1.64215087890625, 1.745697021484375, 1.8492431640625, 1.952789306640625, 2.05633544921875, 2.159881591796875, 2.263427734375, 2.366973876953125, 2.47052001953125, 2.574066162109375, 2.6776123046875, 2.781158447265625, 2.88470458984375, 2.988250732421875, 3.091796875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 5.0, 5.0, 7.0, 10.0, 19.0, 11.0, 8.0, 10.0, 16.0, 22.0, 17.0, 23.0, 23.0, 30.0, 33.0, 35.0, 33.0, 35.0, 39.0, 35.0, 25.0, 26.0, 32.0, 24.0, 43.0, 35.0, 48.0, 38.0, 35.0, 33.0, 31.0, 38.0, 20.0, 24.0, 20.0, 20.0, 21.0, 14.0, 11.0, 11.0, 6.0, 6.0, 6.0, 4.0, 4.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.32275390625, -0.3132591247558594, -0.30376434326171875, -0.2942695617675781, -0.2847747802734375, -0.2752799987792969, -0.26578521728515625, -0.2562904357910156, -0.246795654296875, -0.23730087280273438, -0.22780609130859375, -0.21831130981445312, -0.2088165283203125, -0.19932174682617188, -0.18982696533203125, -0.18033218383789062, -0.17083740234375, -0.16134262084960938, -0.15184783935546875, -0.14235305786132812, -0.1328582763671875, -0.12336349487304688, -0.11386871337890625, -0.10437393188476562, -0.094879150390625, -0.08538436889648438, -0.07588958740234375, -0.06639480590820312, -0.0569000244140625, -0.047405242919921875, -0.03791046142578125, -0.028415679931640625, -0.0189208984375, -0.009426116943359375, 6.866455078125e-05, 0.009563446044921875, 0.0190582275390625, 0.028553009033203125, 0.03804779052734375, 0.047542572021484375, 0.057037353515625, 0.06653213500976562, 0.07602691650390625, 0.08552169799804688, 0.0950164794921875, 0.10451126098632812, 0.11400604248046875, 0.12350082397460938, 0.13299560546875, 0.14249038696289062, 0.15198516845703125, 0.16147994995117188, 0.1709747314453125, 0.18046951293945312, 0.18996429443359375, 0.19945907592773438, 0.208953857421875, 0.21844863891601562, 0.22794342041015625, 0.23743820190429688, 0.2469329833984375, 0.2564277648925781, 0.26592254638671875, 0.2754173278808594, 0.284912109375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 10.0, 10.0, 14.0, 20.0, 25.0, 27.0, 38.0, 33.0, 66.0, 60.0, 78.0, 80.0, 102.0, 126.0, 132.0, 191.0, 213.0, 265.0, 375.0, 881.0, 7708.0, 198554.0, 785921.0, 48577.0, 2786.0, 597.0, 325.0, 246.0, 197.0, 165.0, 134.0, 121.0, 80.0, 76.0, 51.0, 53.0, 37.0, 36.0, 25.0, 28.0, 19.0, 29.0, 10.0, 6.0, 9.0, 5.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.33984375, -4.19659423828125, -4.0533447265625, -3.91009521484375, -3.766845703125, -3.62359619140625, -3.4803466796875, -3.33709716796875, -3.19384765625, -3.05059814453125, -2.9073486328125, -2.76409912109375, -2.620849609375, -2.47760009765625, -2.3343505859375, -2.19110107421875, -2.0478515625, -1.90460205078125, -1.7613525390625, -1.61810302734375, -1.474853515625, -1.33160400390625, -1.1883544921875, -1.04510498046875, -0.90185546875, -0.75860595703125, -0.6153564453125, -0.47210693359375, -0.328857421875, -0.18560791015625, -0.0423583984375, 0.10089111328125, 0.244140625, 0.38739013671875, 0.5306396484375, 0.67388916015625, 0.817138671875, 0.96038818359375, 1.1036376953125, 1.24688720703125, 1.39013671875, 1.53338623046875, 1.6766357421875, 1.81988525390625, 1.963134765625, 2.10638427734375, 2.2496337890625, 2.39288330078125, 2.5361328125, 2.67938232421875, 2.8226318359375, 2.96588134765625, 3.109130859375, 3.25238037109375, 3.3956298828125, 3.53887939453125, 3.68212890625, 3.82537841796875, 3.9686279296875, 4.11187744140625, 4.255126953125, 4.39837646484375, 4.5416259765625, 4.68487548828125, 4.828125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 12.0, 62.0, 538.0, 349.0, 44.0, 9.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.57135581970215, -26.92828941345215, -26.28522300720215, -25.64215660095215, -24.99909019470215, -24.35602378845215, -23.71295738220215, -23.06989097595215, -22.42682456970215, -21.78375816345215, -21.14069175720215, -20.49762535095215, -19.85455894470215, -19.21149253845215, -18.56842613220215, -17.92535972595215, -17.28229522705078, -16.63922882080078, -15.996162414550781, -15.353096008300781, -14.710029602050781, -14.066963195800781, -13.423896789550781, -12.780830383300781, -12.137763977050781, -11.494697570800781, -10.851631164550781, -10.208564758300781, -9.565498352050781, -8.922431945800781, -8.279365539550781, -7.6362996101379395, -6.993231773376465, -6.350165367126465, -5.707098960876465, -5.064032554626465, -4.420966148376465, -3.777899980545044, -3.134833812713623, -2.491767406463623, -1.848701000213623, -1.205634593963623, -0.5625683069229126, 0.08049798011779785, 0.7235643863677979, 1.3666307926177979, 2.0096969604492188, 2.6527633666992188, 3.2958297729492188, 3.9388961791992188, 4.581962585449219, 5.225028991699219, 5.868095397949219, 6.511161804199219, 7.1542277336120605, 7.7972941398620605, 8.440361022949219, 9.083427429199219, 9.726493835449219, 10.369560241699219, 11.012626647949219, 11.655693054199219, 12.298759460449219, 12.941825866699219, 13.584891319274902]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 4.0, 9.0, 10.0, 13.0, 25.0, 27.0, 32.0, 32.0, 36.0, 40.0, 57.0, 51.0, 56.0, 66.0, 73.0, 53.0, 50.0, 47.0, 54.0, 52.0, 42.0, 33.0, 28.0, 27.0, 20.0, 20.0, 11.0, 9.0, 7.0, 8.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1971001625061035, -4.062735080718994, -3.9283699989318848, -3.7940049171447754, -3.659639835357666, -3.5252747535705566, -3.3909096717834473, -3.256544589996338, -3.1221795082092285, -2.987814426422119, -2.8534493446350098, -2.7190842628479004, -2.584719181060791, -2.4503540992736816, -2.3159890174865723, -2.181623935699463, -2.0472590923309326, -1.9128940105438232, -1.7785289287567139, -1.6441638469696045, -1.5097987651824951, -1.3754336833953857, -1.241068720817566, -1.1067036390304565, -0.9723385572433472, -0.8379734754562378, -0.7036083936691284, -0.5692433714866638, -0.43487828969955444, -0.30051320791244507, -0.16614818572998047, -0.031783103942871094, 0.10258197784423828, 0.23694704473018646, 0.37131211161613464, 0.5056771636009216, 0.640042245388031, 0.7744073271751404, 0.908772349357605, 1.0431374311447144, 1.1775025129318237, 1.311867594718933, 1.4462326765060425, 1.5805976390838623, 1.7149627208709717, 1.849327802658081, 1.9836928844451904, 2.1180579662323, 2.252423048019409, 2.3867881298065186, 2.521153211593628, 2.6555182933807373, 2.7898833751678467, 2.924248456954956, 3.0586133003234863, 3.1929783821105957, 3.327343463897705, 3.4617085456848145, 3.596073627471924, 3.730438709259033, 3.8648037910461426, 3.999168872833252, 4.133533954620361, 4.267899036407471, 4.40226411819458]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 1.0, 6.0, 7.0, 8.0, 10.0, 8.0, 12.0, 12.0, 13.0, 18.0, 26.0, 15.0, 17.0, 23.0, 39.0, 26.0, 37.0, 40.0, 32.0, 35.0, 37.0, 44.0, 42.0, 39.0, 35.0, 32.0, 30.0, 34.0, 35.0, 33.0, 24.0, 33.0, 26.0, 30.0, 26.0, 17.0, 21.0, 18.0, 15.0, 9.0, 9.0, 10.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 2.0], "bins": [-3.224609375, -3.13665771484375, -3.0487060546875, -2.96075439453125, -2.872802734375, -2.78485107421875, -2.6968994140625, -2.60894775390625, -2.52099609375, -2.43304443359375, -2.3450927734375, -2.25714111328125, -2.169189453125, -2.08123779296875, -1.9932861328125, -1.90533447265625, -1.8173828125, -1.72943115234375, -1.6414794921875, -1.55352783203125, -1.465576171875, -1.37762451171875, -1.2896728515625, -1.20172119140625, -1.11376953125, -1.02581787109375, -0.9378662109375, -0.84991455078125, -0.761962890625, -0.67401123046875, -0.5860595703125, -0.49810791015625, -0.41015625, -0.32220458984375, -0.2342529296875, -0.14630126953125, -0.058349609375, 0.02960205078125, 0.1175537109375, 0.20550537109375, 0.29345703125, 0.38140869140625, 0.4693603515625, 0.55731201171875, 0.645263671875, 0.73321533203125, 0.8211669921875, 0.90911865234375, 0.9970703125, 1.08502197265625, 1.1729736328125, 1.26092529296875, 1.348876953125, 1.43682861328125, 1.5247802734375, 1.61273193359375, 1.70068359375, 1.78863525390625, 1.8765869140625, 1.96453857421875, 2.052490234375, 2.14044189453125, 2.2283935546875, 2.31634521484375, 2.404296875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 8.0, 14.0, 16.0, 17.0, 24.0, 42.0, 62.0, 101.0, 124.0, 185.0, 309.0, 449.0, 669.0, 1136.0, 1786.0, 2961.0, 4883.0, 8341.0, 15524.0, 31809.0, 77469.0, 202949.0, 339724.0, 209948.0, 80297.0, 32407.0, 15677.0, 8618.0, 4973.0, 3037.0, 1757.0, 1144.0, 756.0, 454.0, 294.0, 184.0, 133.0, 83.0, 60.0, 41.0, 28.0, 24.0, 6.0, 9.0, 9.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6484375, -2.5587158203125, -2.468994140625, -2.3792724609375, -2.28955078125, -2.1998291015625, -2.110107421875, -2.0203857421875, -1.9306640625, -1.8409423828125, -1.751220703125, -1.6614990234375, -1.57177734375, -1.4820556640625, -1.392333984375, -1.3026123046875, -1.212890625, -1.1231689453125, -1.033447265625, -0.9437255859375, -0.85400390625, -0.7642822265625, -0.674560546875, -0.5848388671875, -0.4951171875, -0.4053955078125, -0.315673828125, -0.2259521484375, -0.13623046875, -0.0465087890625, 0.043212890625, 0.1329345703125, 0.22265625, 0.3123779296875, 0.402099609375, 0.4918212890625, 0.58154296875, 0.6712646484375, 0.760986328125, 0.8507080078125, 0.9404296875, 1.0301513671875, 1.119873046875, 1.2095947265625, 1.29931640625, 1.3890380859375, 1.478759765625, 1.5684814453125, 1.658203125, 1.7479248046875, 1.837646484375, 1.9273681640625, 2.01708984375, 2.1068115234375, 2.196533203125, 2.2862548828125, 2.3759765625, 2.4656982421875, 2.555419921875, 2.6451416015625, 2.73486328125, 2.8245849609375, 2.914306640625, 3.0040283203125, 3.09375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 4.0, 9.0, 5.0, 5.0, 10.0, 13.0, 16.0, 16.0, 16.0, 19.0, 17.0, 27.0, 27.0, 32.0, 26.0, 31.0, 39.0, 41.0, 48.0, 60.0, 92.0, 263.0, 1451.0, 238.0, 91.0, 64.0, 53.0, 42.0, 30.0, 24.0, 25.0, 25.0, 33.0, 27.0, 16.0, 17.0, 21.0, 18.0, 10.0, 8.0, 6.0, 5.0, 5.0, 5.0, 7.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.5465087890625, -9.233642578125, -8.9207763671875, -8.60791015625, -8.2950439453125, -7.982177734375, -7.6693115234375, -7.3564453125, -7.0435791015625, -6.730712890625, -6.4178466796875, -6.10498046875, -5.7921142578125, -5.479248046875, -5.1663818359375, -4.853515625, -4.5406494140625, -4.227783203125, -3.9149169921875, -3.60205078125, -3.2891845703125, -2.976318359375, -2.6634521484375, -2.3505859375, -2.0377197265625, -1.724853515625, -1.4119873046875, -1.09912109375, -0.7862548828125, -0.473388671875, -0.1605224609375, 0.15234375, 0.4652099609375, 0.778076171875, 1.0909423828125, 1.40380859375, 1.7166748046875, 2.029541015625, 2.3424072265625, 2.6552734375, 2.9681396484375, 3.281005859375, 3.5938720703125, 3.90673828125, 4.2196044921875, 4.532470703125, 4.8453369140625, 5.158203125, 5.4710693359375, 5.783935546875, 6.0968017578125, 6.40966796875, 6.7225341796875, 7.035400390625, 7.3482666015625, 7.6611328125, 7.9739990234375, 8.286865234375, 8.5997314453125, 8.91259765625, 9.2254638671875, 9.538330078125, 9.8511962890625, 10.1640625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 12.0, 5.0, 5.0, 13.0, 12.0, 12.0, 9.0, 23.0, 37.0, 38.0, 54.0, 80.0, 99.0, 169.0, 260.0, 518.0, 1089.0, 3301.0, 14732.0, 142707.0, 2582926.0, 366842.0, 24902.0, 4770.0, 1504.0, 605.0, 335.0, 176.0, 119.0, 89.0, 48.0, 43.0, 40.0, 25.0, 16.0, 16.0, 18.0, 11.0, 8.0, 8.0, 8.0, 3.0, 6.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.984375, -10.63720703125, -10.2900390625, -9.94287109375, -9.595703125, -9.24853515625, -8.9013671875, -8.55419921875, -8.20703125, -7.85986328125, -7.5126953125, -7.16552734375, -6.818359375, -6.47119140625, -6.1240234375, -5.77685546875, -5.4296875, -5.08251953125, -4.7353515625, -4.38818359375, -4.041015625, -3.69384765625, -3.3466796875, -2.99951171875, -2.65234375, -2.30517578125, -1.9580078125, -1.61083984375, -1.263671875, -0.91650390625, -0.5693359375, -0.22216796875, 0.125, 0.47216796875, 0.8193359375, 1.16650390625, 1.513671875, 1.86083984375, 2.2080078125, 2.55517578125, 2.90234375, 3.24951171875, 3.5966796875, 3.94384765625, 4.291015625, 4.63818359375, 4.9853515625, 5.33251953125, 5.6796875, 6.02685546875, 6.3740234375, 6.72119140625, 7.068359375, 7.41552734375, 7.7626953125, 8.10986328125, 8.45703125, 8.80419921875, 9.1513671875, 9.49853515625, 9.845703125, 10.19287109375, 10.5400390625, 10.88720703125, 11.234375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 652.0, 360.0], "bins": [-455.39630126953125, -448.15338134765625, -440.9104309082031, -433.6675109863281, -426.424560546875, -419.181640625, -411.938720703125, -404.6957702636719, -397.4528503417969, -390.2099304199219, -382.96697998046875, -375.72406005859375, -368.48114013671875, -361.2381896972656, -353.9952697753906, -346.7523193359375, -339.5093994140625, -332.2664794921875, -325.0235290527344, -317.7806091308594, -310.53765869140625, -303.29473876953125, -296.05181884765625, -288.8088684082031, -281.5659484863281, -274.3230285644531, -267.080078125, -259.837158203125, -252.59422302246094, -245.35128784179688, -238.10836791992188, -230.8654327392578, -223.62249755859375, -216.3795623779297, -209.13662719726562, -201.89370727539062, -194.65077209472656, -187.4078369140625, -180.1649169921875, -172.92198181152344, -165.67904663085938, -158.4361114501953, -151.19317626953125, -143.95025634765625, -136.7073211669922, -129.46438598632812, -122.2214584350586, -114.97853088378906, -107.73558807373047, -100.49266052246094, -93.24972534179688, -86.00679016113281, -78.76386260986328, -71.52093505859375, -64.27799987792969, -57.03506851196289, -49.792137145996094, -42.5492057800293, -35.3062744140625, -28.063343048095703, -20.820411682128906, -13.57748031616211, -6.3345489501953125, 0.9083824157714844, 8.151312828063965]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 5.0, 10.0, 6.0, 8.0, 9.0, 19.0, 19.0, 15.0, 27.0, 23.0, 25.0, 40.0, 27.0, 24.0, 33.0, 27.0, 40.0, 41.0, 40.0, 54.0, 45.0, 33.0, 38.0, 37.0, 39.0, 35.0, 26.0, 29.0, 30.0, 21.0, 23.0, 21.0, 22.0, 19.0, 12.0, 9.0, 15.0, 11.0, 9.0, 7.0, 3.0, 4.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-35.55496597290039, -34.497459411621094, -33.4399528503418, -32.3824462890625, -31.324939727783203, -30.267433166503906, -29.209928512573242, -28.152421951293945, -27.09491539001465, -26.03740882873535, -24.979902267456055, -23.922395706176758, -22.864891052246094, -21.807384490966797, -20.7498779296875, -19.692371368408203, -18.634864807128906, -17.57735824584961, -16.519851684570312, -15.462346076965332, -14.404839515686035, -13.347332954406738, -12.289827346801758, -11.232320785522461, -10.174814224243164, -9.117307662963867, -8.05980110168457, -7.00229549407959, -5.944788932800293, -4.887282371520996, -3.8297762870788574, -2.7722702026367188, -1.7147636413574219, -0.6572573184967041, 0.40024900436401367, 1.4577553272247314, 2.515261650085449, 3.572768211364746, 4.630274295806885, 5.687780380249023, 6.74528694152832, 7.802793502807617, 8.860300064086914, 9.917805671691895, 10.975312232971191, 12.032818794250488, 13.090324401855469, 14.147830963134766, 15.205337524414062, 16.26284408569336, 17.320350646972656, 18.377857208251953, 19.43536376953125, 20.492870330810547, 21.55037498474121, 22.607881546020508, 23.665388107299805, 24.7228946685791, 25.7804012298584, 26.837907791137695, 27.89541244506836, 28.952919006347656, 30.010425567626953, 31.06793212890625, 32.12543869018555]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 5.0, 5.0, 5.0, 9.0, 11.0, 17.0, 9.0, 16.0, 16.0, 25.0, 17.0, 26.0, 23.0, 33.0, 33.0, 29.0, 20.0, 34.0, 33.0, 41.0, 43.0, 35.0, 34.0, 38.0, 26.0, 30.0, 30.0, 35.0, 36.0, 30.0, 26.0, 31.0, 24.0, 24.0, 24.0, 16.0, 22.0, 17.0, 8.0, 10.0, 5.0, 14.0, 9.0, 10.0, 4.0, 4.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0], "bins": [-2.875, -2.791229248046875, -2.70745849609375, -2.623687744140625, -2.5399169921875, -2.456146240234375, -2.37237548828125, -2.288604736328125, -2.204833984375, -2.121063232421875, -2.03729248046875, -1.953521728515625, -1.8697509765625, -1.785980224609375, -1.70220947265625, -1.618438720703125, -1.53466796875, -1.450897216796875, -1.36712646484375, -1.283355712890625, -1.1995849609375, -1.115814208984375, -1.03204345703125, -0.948272705078125, -0.864501953125, -0.780731201171875, -0.69696044921875, -0.613189697265625, -0.5294189453125, -0.445648193359375, -0.36187744140625, -0.278106689453125, -0.1943359375, -0.110565185546875, -0.02679443359375, 0.056976318359375, 0.1407470703125, 0.224517822265625, 0.30828857421875, 0.392059326171875, 0.475830078125, 0.559600830078125, 0.64337158203125, 0.727142333984375, 0.8109130859375, 0.894683837890625, 0.97845458984375, 1.062225341796875, 1.14599609375, 1.229766845703125, 1.31353759765625, 1.397308349609375, 1.4810791015625, 1.564849853515625, 1.64862060546875, 1.732391357421875, 1.816162109375, 1.899932861328125, 1.98370361328125, 2.067474365234375, 2.1512451171875, 2.235015869140625, 2.31878662109375, 2.402557373046875, 2.486328125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 3.0, 14.0, 14.0, 19.0, 30.0, 38.0, 45.0, 50.0, 75.0, 122.0, 198.0, 334.0, 608.0, 1085.0, 2029.0, 4258.0, 8942.0, 21204.0, 55525.0, 167298.0, 664345.0, 1862377.0, 1026242.0, 250484.0, 77536.0, 28564.0, 11911.0, 5208.0, 2527.0, 1349.0, 714.0, 426.0, 240.0, 134.0, 95.0, 70.0, 47.0, 30.0, 16.0, 16.0, 11.0, 9.0, 6.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 3.0], "bins": [-6.1328125, -5.9608154296875, -5.788818359375, -5.6168212890625, -5.44482421875, -5.2728271484375, -5.100830078125, -4.9288330078125, -4.7568359375, -4.5848388671875, -4.412841796875, -4.2408447265625, -4.06884765625, -3.8968505859375, -3.724853515625, -3.5528564453125, -3.380859375, -3.2088623046875, -3.036865234375, -2.8648681640625, -2.69287109375, -2.5208740234375, -2.348876953125, -2.1768798828125, -2.0048828125, -1.8328857421875, -1.660888671875, -1.4888916015625, -1.31689453125, -1.1448974609375, -0.972900390625, -0.8009033203125, -0.62890625, -0.4569091796875, -0.284912109375, -0.1129150390625, 0.05908203125, 0.2310791015625, 0.403076171875, 0.5750732421875, 0.7470703125, 0.9190673828125, 1.091064453125, 1.2630615234375, 1.43505859375, 1.6070556640625, 1.779052734375, 1.9510498046875, 2.123046875, 2.2950439453125, 2.467041015625, 2.6390380859375, 2.81103515625, 2.9830322265625, 3.155029296875, 3.3270263671875, 3.4990234375, 3.6710205078125, 3.843017578125, 4.0150146484375, 4.18701171875, 4.3590087890625, 4.531005859375, 4.7030029296875, 4.875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 5.0, 3.0, 8.0, 9.0, 11.0, 22.0, 18.0, 38.0, 61.0, 81.0, 114.0, 138.0, 258.0, 320.0, 463.0, 540.0, 513.0, 402.0, 304.0, 237.0, 165.0, 117.0, 86.0, 57.0, 38.0, 22.0, 19.0, 14.0, 7.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.5859375, -10.282958984375, -9.97998046875, -9.677001953125, -9.3740234375, -9.071044921875, -8.76806640625, -8.465087890625, -8.162109375, -7.859130859375, -7.55615234375, -7.253173828125, -6.9501953125, -6.647216796875, -6.34423828125, -6.041259765625, -5.73828125, -5.435302734375, -5.13232421875, -4.829345703125, -4.5263671875, -4.223388671875, -3.92041015625, -3.617431640625, -3.314453125, -3.011474609375, -2.70849609375, -2.405517578125, -2.1025390625, -1.799560546875, -1.49658203125, -1.193603515625, -0.890625, -0.587646484375, -0.28466796875, 0.018310546875, 0.3212890625, 0.624267578125, 0.92724609375, 1.230224609375, 1.533203125, 1.836181640625, 2.13916015625, 2.442138671875, 2.7451171875, 3.048095703125, 3.35107421875, 3.654052734375, 3.95703125, 4.260009765625, 4.56298828125, 4.865966796875, 5.1689453125, 5.471923828125, 5.77490234375, 6.077880859375, 6.380859375, 6.683837890625, 6.98681640625, 7.289794921875, 7.5927734375, 7.895751953125, 8.19873046875, 8.501708984375, 8.8046875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 11.0, 10.0, 21.0, 32.0, 68.0, 85.0, 205.0, 376.0, 784.0, 2031.0, 6535.0, 25190.0, 125539.0, 806761.0, 2522467.0, 581533.0, 94619.0, 19688.0, 5168.0, 1749.0, 730.0, 298.0, 173.0, 102.0, 48.0, 32.0, 15.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4765625, -11.0421142578125, -10.607666015625, -10.1732177734375, -9.73876953125, -9.3043212890625, -8.869873046875, -8.4354248046875, -8.0009765625, -7.5665283203125, -7.132080078125, -6.6976318359375, -6.26318359375, -5.8287353515625, -5.394287109375, -4.9598388671875, -4.525390625, -4.0909423828125, -3.656494140625, -3.2220458984375, -2.78759765625, -2.3531494140625, -1.918701171875, -1.4842529296875, -1.0498046875, -0.6153564453125, -0.180908203125, 0.2535400390625, 0.68798828125, 1.1224365234375, 1.556884765625, 1.9913330078125, 2.42578125, 2.8602294921875, 3.294677734375, 3.7291259765625, 4.16357421875, 4.5980224609375, 5.032470703125, 5.4669189453125, 5.9013671875, 6.3358154296875, 6.770263671875, 7.2047119140625, 7.63916015625, 8.0736083984375, 8.508056640625, 8.9425048828125, 9.376953125, 9.8114013671875, 10.245849609375, 10.6802978515625, 11.11474609375, 11.5491943359375, 11.983642578125, 12.4180908203125, 12.8525390625, 13.2869873046875, 13.721435546875, 14.1558837890625, 14.59033203125, 15.0247802734375, 15.459228515625, 15.8936767578125, 16.328125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 10.0, 26.0, 26.0, 53.0, 98.0, 117.0, 124.0, 141.0, 124.0, 112.0, 75.0, 45.0, 29.0, 14.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.03145217895508, -30.18287467956543, -28.33429718017578, -26.4857177734375, -24.637142181396484, -22.788562774658203, -20.939985275268555, -19.091407775878906, -17.242830276489258, -15.39425277709961, -13.545675277709961, -11.697096824645996, -9.848519325256348, -7.999941825866699, -6.151363372802734, -4.302785873413086, -2.4542083740234375, -0.60563063621521, 1.2429471015930176, 3.091525077819824, 4.940102577209473, 6.788680076599121, 8.637258529663086, 10.485836029052734, 12.334413528442383, 14.182991027832031, 16.03156852722168, 17.880146026611328, 19.72872543334961, 21.577301025390625, 23.425880432128906, 25.274457931518555, 27.123031616210938, 28.971609115600586, 30.820186614990234, 32.668766021728516, 34.51734161376953, 36.36592102050781, 38.214500427246094, 40.06307601928711, 41.911651611328125, 43.760231018066406, 45.60880661010742, 47.4573860168457, 49.30596160888672, 51.154541015625, 53.00312042236328, 54.8516960144043, 56.70027542114258, 58.54885482788086, 60.397430419921875, 62.246009826660156, 64.09458923339844, 65.94316101074219, 67.79174041748047, 69.64031982421875, 71.48889923095703, 73.33747863769531, 75.1860580444336, 77.03462982177734, 78.88320922851562, 80.7317886352539, 82.58036804199219, 84.42893981933594, 86.27751922607422]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 7.0, 11.0, 6.0, 9.0, 12.0, 10.0, 16.0, 17.0, 17.0, 35.0, 28.0, 33.0, 37.0, 37.0, 38.0, 46.0, 38.0, 41.0, 40.0, 46.0, 45.0, 43.0, 43.0, 31.0, 28.0, 28.0, 24.0, 29.0, 34.0, 23.0, 16.0, 31.0, 15.0, 16.0, 12.0, 10.0, 7.0, 6.0, 4.0, 5.0, 0.0, 3.0, 4.0, 6.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.277666091918945, -25.463714599609375, -24.649763107299805, -23.8358097076416, -23.02185821533203, -22.20790672302246, -21.39395523071289, -20.580001831054688, -19.766050338745117, -18.952098846435547, -18.138147354125977, -17.324193954467773, -16.510242462158203, -15.696290969848633, -14.882339477539062, -14.068387031555176, -13.254435539245605, -12.440484046936035, -11.626531600952148, -10.812580108642578, -9.998627662658691, -9.184676170349121, -8.370723724365234, -7.556772232055664, -6.7428202629089355, -5.928868293762207, -5.1149163246154785, -4.30096435546875, -3.4870126247406006, -2.673060894012451, -1.8591089248657227, -1.0451569557189941, -0.23120498657226562, 0.5827469229698181, 1.3966988325119019, 2.210650682449341, 3.0246026515960693, 3.8385543823242188, 4.652506351470947, 5.466458320617676, 6.280410289764404, 7.094362258911133, 7.908314228057861, 8.72226619720459, 9.53621768951416, 10.350170135498047, 11.164121627807617, 11.978073120117188, 12.792025566101074, 13.605977058410645, 14.419929504394531, 15.233880996704102, 16.047832489013672, 16.861785888671875, 17.675737380981445, 18.489688873291016, 19.303640365600586, 20.117591857910156, 20.931543350219727, 21.74549674987793, 22.5594482421875, 23.37339973449707, 24.18735122680664, 25.001304626464844, 25.815256118774414]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 8.0, 3.0, 10.0, 15.0, 17.0, 14.0, 18.0, 17.0, 22.0, 20.0, 16.0, 30.0, 29.0, 22.0, 34.0, 34.0, 38.0, 30.0, 26.0, 32.0, 42.0, 31.0, 28.0, 28.0, 39.0, 35.0, 37.0, 31.0, 35.0, 37.0, 27.0, 24.0, 21.0, 21.0, 20.0, 13.0, 18.0, 15.0, 10.0, 8.0, 10.0, 9.0, 4.0, 5.0, 2.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.94140625, -2.8555908203125, -2.769775390625, -2.6839599609375, -2.59814453125, -2.5123291015625, -2.426513671875, -2.3406982421875, -2.2548828125, -2.1690673828125, -2.083251953125, -1.9974365234375, -1.91162109375, -1.8258056640625, -1.739990234375, -1.6541748046875, -1.568359375, -1.4825439453125, -1.396728515625, -1.3109130859375, -1.22509765625, -1.1392822265625, -1.053466796875, -0.9676513671875, -0.8818359375, -0.7960205078125, -0.710205078125, -0.6243896484375, -0.53857421875, -0.4527587890625, -0.366943359375, -0.2811279296875, -0.1953125, -0.1094970703125, -0.023681640625, 0.0621337890625, 0.14794921875, 0.2337646484375, 0.319580078125, 0.4053955078125, 0.4912109375, 0.5770263671875, 0.662841796875, 0.7486572265625, 0.83447265625, 0.9202880859375, 1.006103515625, 1.0919189453125, 1.177734375, 1.2635498046875, 1.349365234375, 1.4351806640625, 1.52099609375, 1.6068115234375, 1.692626953125, 1.7784423828125, 1.8642578125, 1.9500732421875, 2.035888671875, 2.1217041015625, 2.20751953125, 2.2933349609375, 2.379150390625, 2.4649658203125, 2.55078125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 5.0, 5.0, 12.0, 20.0, 25.0, 31.0, 77.0, 122.0, 189.0, 298.0, 473.0, 781.0, 1214.0, 1882.0, 2987.0, 4841.0, 7252.0, 11048.0, 16098.0, 23302.0, 32207.0, 42938.0, 55318.0, 68507.0, 81049.0, 90226.0, 96021.0, 94669.0, 88237.0, 78034.0, 65477.0, 51955.0, 40071.0, 29672.0, 20975.0, 14612.0, 9882.0, 6336.0, 4417.0, 2758.0, 1670.0, 1091.0, 670.0, 421.0, 271.0, 164.0, 95.0, 52.0, 35.0, 28.0, 19.0, 7.0, 7.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.51171875, -1.4611053466796875, -1.410491943359375, -1.3598785400390625, -1.30926513671875, -1.2586517333984375, -1.208038330078125, -1.1574249267578125, -1.1068115234375, -1.0561981201171875, -1.005584716796875, -0.9549713134765625, -0.90435791015625, -0.8537445068359375, -0.803131103515625, -0.7525177001953125, -0.701904296875, -0.6512908935546875, -0.600677490234375, -0.5500640869140625, -0.49945068359375, -0.4488372802734375, -0.398223876953125, -0.3476104736328125, -0.2969970703125, -0.2463836669921875, -0.195770263671875, -0.1451568603515625, -0.09454345703125, -0.0439300537109375, 0.006683349609375, 0.0572967529296875, 0.10791015625, 0.1585235595703125, 0.209136962890625, 0.2597503662109375, 0.31036376953125, 0.3609771728515625, 0.411590576171875, 0.4622039794921875, 0.5128173828125, 0.5634307861328125, 0.614044189453125, 0.6646575927734375, 0.71527099609375, 0.7658843994140625, 0.816497802734375, 0.8671112060546875, 0.917724609375, 0.9683380126953125, 1.018951416015625, 1.0695648193359375, 1.12017822265625, 1.1707916259765625, 1.221405029296875, 1.2720184326171875, 1.3226318359375, 1.3732452392578125, 1.423858642578125, 1.4744720458984375, 1.52508544921875, 1.5756988525390625, 1.626312255859375, 1.6769256591796875, 1.7275390625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 4.0, 9.0, 6.0, 9.0, 11.0, 11.0, 14.0, 17.0, 18.0, 26.0, 19.0, 26.0, 25.0, 33.0, 31.0, 27.0, 35.0, 45.0, 27.0, 46.0, 1069.0, 40.0, 41.0, 39.0, 40.0, 34.0, 31.0, 31.0, 46.0, 30.0, 31.0, 31.0, 14.0, 21.0, 17.0, 8.0, 13.0, 7.0, 8.0, 8.0, 3.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.185546875, -3.085784912109375, -2.98602294921875, -2.886260986328125, -2.7864990234375, -2.686737060546875, -2.58697509765625, -2.487213134765625, -2.387451171875, -2.287689208984375, -2.18792724609375, -2.088165283203125, -1.9884033203125, -1.888641357421875, -1.78887939453125, -1.689117431640625, -1.58935546875, -1.489593505859375, -1.38983154296875, -1.290069580078125, -1.1903076171875, -1.090545654296875, -0.99078369140625, -0.891021728515625, -0.791259765625, -0.691497802734375, -0.59173583984375, -0.491973876953125, -0.3922119140625, -0.292449951171875, -0.19268798828125, -0.092926025390625, 0.0068359375, 0.106597900390625, 0.20635986328125, 0.306121826171875, 0.4058837890625, 0.505645751953125, 0.60540771484375, 0.705169677734375, 0.804931640625, 0.904693603515625, 1.00445556640625, 1.104217529296875, 1.2039794921875, 1.303741455078125, 1.40350341796875, 1.503265380859375, 1.60302734375, 1.702789306640625, 1.80255126953125, 1.902313232421875, 2.0020751953125, 2.101837158203125, 2.20159912109375, 2.301361083984375, 2.401123046875, 2.500885009765625, 2.60064697265625, 2.700408935546875, 2.8001708984375, 2.899932861328125, 2.99969482421875, 3.099456787109375, 3.19921875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 12.0, 15.0, 23.0, 24.0, 47.0, 63.0, 99.0, 129.0, 191.0, 337.0, 455.0, 704.0, 1043.0, 1538.0, 2382.0, 3441.0, 5013.0, 7488.0, 10914.0, 16913.0, 29025.0, 75840.0, 1441764.0, 381657.0, 49877.0, 23769.0, 14542.0, 9892.0, 6322.0, 4290.0, 3057.0, 2032.0, 1417.0, 906.0, 616.0, 435.0, 299.0, 185.0, 122.0, 90.0, 56.0, 40.0, 23.0, 15.0, 12.0, 8.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.205078125, -3.10113525390625, -2.9971923828125, -2.89324951171875, -2.789306640625, -2.68536376953125, -2.5814208984375, -2.47747802734375, -2.37353515625, -2.26959228515625, -2.1656494140625, -2.06170654296875, -1.957763671875, -1.85382080078125, -1.7498779296875, -1.64593505859375, -1.5419921875, -1.43804931640625, -1.3341064453125, -1.23016357421875, -1.126220703125, -1.02227783203125, -0.9183349609375, -0.81439208984375, -0.71044921875, -0.60650634765625, -0.5025634765625, -0.39862060546875, -0.294677734375, -0.19073486328125, -0.0867919921875, 0.01715087890625, 0.12109375, 0.22503662109375, 0.3289794921875, 0.43292236328125, 0.536865234375, 0.64080810546875, 0.7447509765625, 0.84869384765625, 0.95263671875, 1.05657958984375, 1.1605224609375, 1.26446533203125, 1.368408203125, 1.47235107421875, 1.5762939453125, 1.68023681640625, 1.7841796875, 1.88812255859375, 1.9920654296875, 2.09600830078125, 2.199951171875, 2.30389404296875, 2.4078369140625, 2.51177978515625, 2.61572265625, 2.71966552734375, 2.8236083984375, 2.92755126953125, 3.031494140625, 3.13543701171875, 3.2393798828125, 3.34332275390625, 3.447265625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 6.0, 6.0, 7.0, 9.0, 15.0, 9.0, 22.0, 23.0, 22.0, 21.0, 31.0, 31.0, 46.0, 50.0, 44.0, 41.0, 27.0, 35.0, 36.0, 36.0, 33.0, 37.0, 39.0, 33.0, 32.0, 42.0, 34.0, 39.0, 28.0, 33.0, 25.0, 14.0, 21.0, 11.0, 13.0, 14.0, 7.0, 8.0, 4.0, 4.0, 7.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.411865234375, -0.4000968933105469, -0.38832855224609375, -0.3765602111816406, -0.3647918701171875, -0.3530235290527344, -0.34125518798828125, -0.3294868469238281, -0.317718505859375, -0.3059501647949219, -0.29418182373046875, -0.2824134826660156, -0.2706451416015625, -0.2588768005371094, -0.24710845947265625, -0.23534011840820312, -0.22357177734375, -0.21180343627929688, -0.20003509521484375, -0.18826675415039062, -0.1764984130859375, -0.16473007202148438, -0.15296173095703125, -0.14119338989257812, -0.129425048828125, -0.11765670776367188, -0.10588836669921875, -0.09412002563476562, -0.0823516845703125, -0.07058334350585938, -0.05881500244140625, -0.047046661376953125, -0.0352783203125, -0.023509979248046875, -0.01174163818359375, 2.6702880859375e-05, 0.0117950439453125, 0.023563385009765625, 0.03533172607421875, 0.047100067138671875, 0.058868408203125, 0.07063674926757812, 0.08240509033203125, 0.09417343139648438, 0.1059417724609375, 0.11771011352539062, 0.12947845458984375, 0.14124679565429688, 0.15301513671875, 0.16478347778320312, 0.17655181884765625, 0.18832015991210938, 0.2000885009765625, 0.21185684204101562, 0.22362518310546875, 0.23539352416992188, 0.247161865234375, 0.2589302062988281, 0.27069854736328125, 0.2824668884277344, 0.2942352294921875, 0.3060035705566406, 0.31777191162109375, 0.3295402526855469, 0.34130859375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 11.0, 9.0, 11.0, 11.0, 18.0, 25.0, 25.0, 33.0, 50.0, 66.0, 92.0, 110.0, 132.0, 185.0, 221.0, 348.0, 406.0, 735.0, 5397.0, 329871.0, 696495.0, 11535.0, 974.0, 406.0, 289.0, 279.0, 181.0, 125.0, 113.0, 93.0, 66.0, 57.0, 45.0, 36.0, 26.0, 18.0, 19.0, 8.0, 10.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.69921875, -5.50994873046875, -5.3206787109375, -5.13140869140625, -4.942138671875, -4.75286865234375, -4.5635986328125, -4.37432861328125, -4.18505859375, -3.99578857421875, -3.8065185546875, -3.61724853515625, -3.427978515625, -3.23870849609375, -3.0494384765625, -2.86016845703125, -2.6708984375, -2.48162841796875, -2.2923583984375, -2.10308837890625, -1.913818359375, -1.72454833984375, -1.5352783203125, -1.34600830078125, -1.15673828125, -0.96746826171875, -0.7781982421875, -0.58892822265625, -0.399658203125, -0.21038818359375, -0.0211181640625, 0.16815185546875, 0.357421875, 0.54669189453125, 0.7359619140625, 0.92523193359375, 1.114501953125, 1.30377197265625, 1.4930419921875, 1.68231201171875, 1.87158203125, 2.06085205078125, 2.2501220703125, 2.43939208984375, 2.628662109375, 2.81793212890625, 3.0072021484375, 3.19647216796875, 3.3857421875, 3.57501220703125, 3.7642822265625, 3.95355224609375, 4.142822265625, 4.33209228515625, 4.5213623046875, 4.71063232421875, 4.89990234375, 5.08917236328125, 5.2784423828125, 5.46771240234375, 5.656982421875, 5.84625244140625, 6.0355224609375, 6.22479248046875, 6.4140625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 14.0, 93.0, 699.0, 178.0, 27.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.35578155517578, -32.60832977294922, -31.86087989807129, -31.113428115844727, -30.365978240966797, -29.618526458740234, -28.871074676513672, -28.12362289428711, -27.37617301940918, -26.628721237182617, -25.881271362304688, -25.133819580078125, -24.386367797851562, -23.638917922973633, -22.89146614074707, -22.14401626586914, -21.396564483642578, -20.649112701416016, -19.901662826538086, -19.154211044311523, -18.406761169433594, -17.65930938720703, -16.91185760498047, -16.164405822753906, -15.416955947875977, -14.66950511932373, -13.922054290771484, -13.174602508544922, -12.427151679992676, -11.67970085144043, -10.932249069213867, -10.184798240661621, -9.437347412109375, -8.689896583557129, -7.942445278167725, -7.19499397277832, -6.447543144226074, -5.700092315673828, -4.952641010284424, -4.2051897048950195, -3.4577388763427734, -2.7102878093719482, -1.962836742401123, -1.2153856754302979, -0.46793460845947266, 0.27951645851135254, 1.0269675254821777, 1.774418830871582, 2.521869659423828, 3.2693207263946533, 4.0167717933654785, 4.764223098754883, 5.511673927307129, 6.259124755859375, 7.006576061248779, 7.754027366638184, 8.50147819519043, 9.248929023742676, 9.996379852294922, 10.743831634521484, 11.49128246307373, 12.238733291625977, 12.986185073852539, 13.733635902404785, 14.481086730957031]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 11.0, 14.0, 12.0, 17.0, 24.0, 30.0, 25.0, 41.0, 38.0, 46.0, 57.0, 38.0, 57.0, 59.0, 46.0, 47.0, 61.0, 54.0, 57.0, 44.0, 50.0, 30.0, 25.0, 26.0, 28.0, 22.0, 9.0, 12.0, 5.0, 5.0, 11.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.096261978149414, -3.950772285461426, -3.8052823543548584, -3.65979266166687, -3.514302968978882, -3.3688130378723145, -3.223323345184326, -3.077833652496338, -2.9323439598083496, -2.7868542671203613, -2.641364336013794, -2.4958746433258057, -2.3503849506378174, -2.20489501953125, -2.0594053268432617, -1.9139156341552734, -1.768425703048706, -1.6229358911514282, -1.47744619846344, -1.331956386566162, -1.1864666938781738, -1.040976881980896, -0.8954870700836182, -0.7499973773956299, -0.604507565498352, -0.459017813205719, -0.31352803111076355, -0.1680382490158081, -0.02254849672317505, 0.12294125556945801, 0.26843106746673584, 0.4139207601547241, 0.559410572052002, 0.704900324344635, 0.8503900766372681, 0.9958798885345459, 1.1413695812225342, 1.286859393119812, 1.4323492050170898, 1.5778388977050781, 1.723328709602356, 1.8688185214996338, 2.014308214187622, 2.1597981452941895, 2.3052878379821777, 2.450777530670166, 2.5962672233581543, 2.7417569160461426, 2.88724684715271, 3.0327365398406982, 3.1782264709472656, 3.323716163635254, 3.469205856323242, 3.6146955490112305, 3.760185480117798, 3.905675172805786, 4.0511651039123535, 4.196654796600342, 4.34214448928833, 4.487634658813477, 4.633124351501465, 4.778614044189453, 4.924103736877441, 5.06959342956543, 5.215083122253418]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 2.0, 7.0, 10.0, 11.0, 6.0, 9.0, 8.0, 14.0, 14.0, 26.0, 28.0, 30.0, 26.0, 31.0, 28.0, 34.0, 34.0, 30.0, 30.0, 40.0, 42.0, 28.0, 34.0, 37.0, 50.0, 27.0, 37.0, 35.0, 31.0, 31.0, 29.0, 24.0, 18.0, 18.0, 18.0, 27.0, 22.0, 18.0, 11.0, 4.0, 11.0, 5.0, 4.0, 3.0, 4.0, 6.0, 0.0, 4.0, 3.0, 0.0, 1.0], "bins": [-3.208984375, -3.11663818359375, -3.0242919921875, -2.93194580078125, -2.839599609375, -2.74725341796875, -2.6549072265625, -2.56256103515625, -2.47021484375, -2.37786865234375, -2.2855224609375, -2.19317626953125, -2.100830078125, -2.00848388671875, -1.9161376953125, -1.82379150390625, -1.7314453125, -1.63909912109375, -1.5467529296875, -1.45440673828125, -1.362060546875, -1.26971435546875, -1.1773681640625, -1.08502197265625, -0.99267578125, -0.90032958984375, -0.8079833984375, -0.71563720703125, -0.623291015625, -0.53094482421875, -0.4385986328125, -0.34625244140625, -0.25390625, -0.16156005859375, -0.0692138671875, 0.02313232421875, 0.115478515625, 0.20782470703125, 0.3001708984375, 0.39251708984375, 0.48486328125, 0.57720947265625, 0.6695556640625, 0.76190185546875, 0.854248046875, 0.94659423828125, 1.0389404296875, 1.13128662109375, 1.2236328125, 1.31597900390625, 1.4083251953125, 1.50067138671875, 1.593017578125, 1.68536376953125, 1.7777099609375, 1.87005615234375, 1.96240234375, 2.05474853515625, 2.1470947265625, 2.23944091796875, 2.331787109375, 2.42413330078125, 2.5164794921875, 2.60882568359375, 2.701171875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 13.0, 14.0, 25.0, 28.0, 32.0, 44.0, 83.0, 116.0, 170.0, 300.0, 439.0, 741.0, 1211.0, 2025.0, 3441.0, 6361.0, 11613.0, 23341.0, 47761.0, 102667.0, 211102.0, 282079.0, 183911.0, 87238.0, 40136.0, 19826.0, 10452.0, 5511.0, 3215.0, 1820.0, 1069.0, 646.0, 372.0, 259.0, 170.0, 112.0, 60.0, 53.0, 31.0, 24.0, 9.0, 9.0, 10.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.236328125, -2.157562255859375, -2.07879638671875, -2.000030517578125, -1.9212646484375, -1.842498779296875, -1.76373291015625, -1.684967041015625, -1.606201171875, -1.527435302734375, -1.44866943359375, -1.369903564453125, -1.2911376953125, -1.212371826171875, -1.13360595703125, -1.054840087890625, -0.97607421875, -0.897308349609375, -0.81854248046875, -0.739776611328125, -0.6610107421875, -0.582244873046875, -0.50347900390625, -0.424713134765625, -0.345947265625, -0.267181396484375, -0.18841552734375, -0.109649658203125, -0.0308837890625, 0.047882080078125, 0.12664794921875, 0.205413818359375, 0.2841796875, 0.362945556640625, 0.44171142578125, 0.520477294921875, 0.5992431640625, 0.678009033203125, 0.75677490234375, 0.835540771484375, 0.914306640625, 0.993072509765625, 1.07183837890625, 1.150604248046875, 1.2293701171875, 1.308135986328125, 1.38690185546875, 1.465667724609375, 1.54443359375, 1.623199462890625, 1.70196533203125, 1.780731201171875, 1.8594970703125, 1.938262939453125, 2.01702880859375, 2.095794677734375, 2.174560546875, 2.253326416015625, 2.33209228515625, 2.410858154296875, 2.4896240234375, 2.568389892578125, 2.64715576171875, 2.725921630859375, 2.8046875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 0.0, 3.0, 1.0, 4.0, 3.0, 3.0, 12.0, 7.0, 6.0, 13.0, 10.0, 14.0, 18.0, 19.0, 22.0, 19.0, 27.0, 32.0, 32.0, 31.0, 37.0, 34.0, 51.0, 78.0, 112.0, 266.0, 1446.0, 207.0, 88.0, 62.0, 60.0, 37.0, 42.0, 29.0, 34.0, 17.0, 26.0, 23.0, 24.0, 13.0, 13.0, 15.0, 9.0, 12.0, 9.0, 9.0, 5.0, 7.0, 7.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.1015625, -11.74951171875, -11.3974609375, -11.04541015625, -10.693359375, -10.34130859375, -9.9892578125, -9.63720703125, -9.28515625, -8.93310546875, -8.5810546875, -8.22900390625, -7.876953125, -7.52490234375, -7.1728515625, -6.82080078125, -6.46875, -6.11669921875, -5.7646484375, -5.41259765625, -5.060546875, -4.70849609375, -4.3564453125, -4.00439453125, -3.65234375, -3.30029296875, -2.9482421875, -2.59619140625, -2.244140625, -1.89208984375, -1.5400390625, -1.18798828125, -0.8359375, -0.48388671875, -0.1318359375, 0.22021484375, 0.572265625, 0.92431640625, 1.2763671875, 1.62841796875, 1.98046875, 2.33251953125, 2.6845703125, 3.03662109375, 3.388671875, 3.74072265625, 4.0927734375, 4.44482421875, 4.796875, 5.14892578125, 5.5009765625, 5.85302734375, 6.205078125, 6.55712890625, 6.9091796875, 7.26123046875, 7.61328125, 7.96533203125, 8.3173828125, 8.66943359375, 9.021484375, 9.37353515625, 9.7255859375, 10.07763671875, 10.4296875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 8.0, 12.0, 13.0, 16.0, 15.0, 24.0, 35.0, 40.0, 55.0, 72.0, 136.0, 224.0, 412.0, 931.0, 3021.0, 24686.0, 1447823.0, 1636151.0, 26872.0, 3130.0, 941.0, 404.0, 224.0, 142.0, 83.0, 49.0, 49.0, 27.0, 24.0, 16.0, 17.0, 9.0, 13.0, 3.0, 2.0, 7.0, 4.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.203125, -16.665771484375, -16.12841796875, -15.591064453125, -15.0537109375, -14.516357421875, -13.97900390625, -13.441650390625, -12.904296875, -12.366943359375, -11.82958984375, -11.292236328125, -10.7548828125, -10.217529296875, -9.68017578125, -9.142822265625, -8.60546875, -8.068115234375, -7.53076171875, -6.993408203125, -6.4560546875, -5.918701171875, -5.38134765625, -4.843994140625, -4.306640625, -3.769287109375, -3.23193359375, -2.694580078125, -2.1572265625, -1.619873046875, -1.08251953125, -0.545166015625, -0.0078125, 0.529541015625, 1.06689453125, 1.604248046875, 2.1416015625, 2.678955078125, 3.21630859375, 3.753662109375, 4.291015625, 4.828369140625, 5.36572265625, 5.903076171875, 6.4404296875, 6.977783203125, 7.51513671875, 8.052490234375, 8.58984375, 9.127197265625, 9.66455078125, 10.201904296875, 10.7392578125, 11.276611328125, 11.81396484375, 12.351318359375, 12.888671875, 13.426025390625, 13.96337890625, 14.500732421875, 15.0380859375, 15.575439453125, 16.11279296875, 16.650146484375, 17.1875]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 826.0, 190.0], "bins": [-658.9078979492188, -648.4130249023438, -637.9181518554688, -627.4232788085938, -616.9284057617188, -606.4335327148438, -595.9386596679688, -585.4437866210938, -574.9489135742188, -564.4540405273438, -553.9591674804688, -543.4642944335938, -532.9694213867188, -522.4745483398438, -511.97967529296875, -501.48480224609375, -490.98992919921875, -480.49505615234375, -470.00018310546875, -459.50531005859375, -449.01043701171875, -438.51556396484375, -428.02069091796875, -417.52581787109375, -407.0309753417969, -396.5361022949219, -386.0412292480469, -375.5463562011719, -365.0514831542969, -354.5566101074219, -344.0617370605469, -333.5668640136719, -323.0719909667969, -312.5771179199219, -302.0822448730469, -291.5873718261719, -281.0924987792969, -270.5976257324219, -260.1027526855469, -249.60787963867188, -239.11300659179688, -228.61813354492188, -218.12326049804688, -207.62838745117188, -197.13351440429688, -186.63864135742188, -176.14376831054688, -165.64889526367188, -155.15402221679688, -144.65914916992188, -134.16427612304688, -123.66940307617188, -113.17453002929688, -102.67965698242188, -92.1847915649414, -81.6899185180664, -71.19505310058594, -60.70018005371094, -50.20530700683594, -39.7104377746582, -29.215564727783203, -18.720691680908203, -8.225822448730469, 2.2690505981445312, 12.763923645019531]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 7.0, 2.0, 7.0, 7.0, 13.0, 12.0, 12.0, 17.0, 19.0, 18.0, 30.0, 28.0, 34.0, 48.0, 25.0, 49.0, 46.0, 37.0, 40.0, 43.0, 34.0, 51.0, 35.0, 45.0, 42.0, 41.0, 34.0, 33.0, 33.0, 24.0, 28.0, 21.0, 20.0, 13.0, 15.0, 9.0, 9.0, 3.0, 3.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-40.138648986816406, -38.85628128051758, -37.57391357421875, -36.29154586791992, -35.009178161621094, -33.726810455322266, -32.44444274902344, -31.16207504272461, -29.87970733642578, -28.597339630126953, -27.314971923828125, -26.032604217529297, -24.75023651123047, -23.46786880493164, -22.185501098632812, -20.903133392333984, -19.620765686035156, -18.338397979736328, -17.0560302734375, -15.773662567138672, -14.491294860839844, -13.208927154541016, -11.926559448242188, -10.64419174194336, -9.361824035644531, -8.079456329345703, -6.797088623046875, -5.514720916748047, -4.232353210449219, -2.9499855041503906, -1.6676177978515625, -0.3852500915527344, 0.8971214294433594, 2.1794891357421875, 3.4618568420410156, 4.744224548339844, 6.026592254638672, 7.3089599609375, 8.591327667236328, 9.873695373535156, 11.156063079833984, 12.438430786132812, 13.72079849243164, 15.003166198730469, 16.285533905029297, 17.567901611328125, 18.850269317626953, 20.13263702392578, 21.41500473022461, 22.697372436523438, 23.979740142822266, 25.262107849121094, 26.544475555419922, 27.82684326171875, 29.109210968017578, 30.391578674316406, 31.673946380615234, 32.95631408691406, 34.23868179321289, 35.52104949951172, 36.80341720581055, 38.085784912109375, 39.3681526184082, 40.65052032470703, 41.93288803100586]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 7.0, 8.0, 13.0, 7.0, 10.0, 9.0, 11.0, 9.0, 26.0, 21.0, 37.0, 28.0, 25.0, 23.0, 35.0, 29.0, 26.0, 36.0, 33.0, 37.0, 42.0, 39.0, 36.0, 26.0, 33.0, 27.0, 33.0, 32.0, 34.0, 28.0, 30.0, 25.0, 23.0, 17.0, 10.0, 32.0, 18.0, 9.0, 13.0, 11.0, 15.0, 5.0, 3.0, 6.0, 7.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.115234375, -3.023101806640625, -2.93096923828125, -2.838836669921875, -2.7467041015625, -2.654571533203125, -2.56243896484375, -2.470306396484375, -2.378173828125, -2.286041259765625, -2.19390869140625, -2.101776123046875, -2.0096435546875, -1.917510986328125, -1.82537841796875, -1.733245849609375, -1.64111328125, -1.548980712890625, -1.45684814453125, -1.364715576171875, -1.2725830078125, -1.180450439453125, -1.08831787109375, -0.996185302734375, -0.904052734375, -0.811920166015625, -0.71978759765625, -0.627655029296875, -0.5355224609375, -0.443389892578125, -0.35125732421875, -0.259124755859375, -0.1669921875, -0.074859619140625, 0.01727294921875, 0.109405517578125, 0.2015380859375, 0.293670654296875, 0.38580322265625, 0.477935791015625, 0.570068359375, 0.662200927734375, 0.75433349609375, 0.846466064453125, 0.9385986328125, 1.030731201171875, 1.12286376953125, 1.214996337890625, 1.30712890625, 1.399261474609375, 1.49139404296875, 1.583526611328125, 1.6756591796875, 1.767791748046875, 1.85992431640625, 1.952056884765625, 2.044189453125, 2.136322021484375, 2.22845458984375, 2.320587158203125, 2.4127197265625, 2.504852294921875, 2.59698486328125, 2.689117431640625, 2.78125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 7.0, 9.0, 7.0, 12.0, 10.0, 18.0, 13.0, 21.0, 35.0, 39.0, 79.0, 131.0, 290.0, 566.0, 1229.0, 3205.0, 8296.0, 24726.0, 85565.0, 394270.0, 1863379.0, 1451625.0, 267499.0, 63122.0, 19157.0, 6612.0, 2445.0, 943.0, 447.0, 216.0, 85.0, 65.0, 37.0, 19.0, 19.0, 11.0, 15.0, 18.0, 13.0, 7.0, 4.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.10546875, -6.88262939453125, -6.6597900390625, -6.43695068359375, -6.214111328125, -5.99127197265625, -5.7684326171875, -5.54559326171875, -5.32275390625, -5.09991455078125, -4.8770751953125, -4.65423583984375, -4.431396484375, -4.20855712890625, -3.9857177734375, -3.76287841796875, -3.5400390625, -3.31719970703125, -3.0943603515625, -2.87152099609375, -2.648681640625, -2.42584228515625, -2.2030029296875, -1.98016357421875, -1.75732421875, -1.53448486328125, -1.3116455078125, -1.08880615234375, -0.865966796875, -0.64312744140625, -0.4202880859375, -0.19744873046875, 0.025390625, 0.24822998046875, 0.4710693359375, 0.69390869140625, 0.916748046875, 1.13958740234375, 1.3624267578125, 1.58526611328125, 1.80810546875, 2.03094482421875, 2.2537841796875, 2.47662353515625, 2.699462890625, 2.92230224609375, 3.1451416015625, 3.36798095703125, 3.5908203125, 3.81365966796875, 4.0364990234375, 4.25933837890625, 4.482177734375, 4.70501708984375, 4.9278564453125, 5.15069580078125, 5.37353515625, 5.59637451171875, 5.8192138671875, 6.04205322265625, 6.264892578125, 6.48773193359375, 6.7105712890625, 6.93341064453125, 7.15625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 12.0, 1.0, 7.0, 21.0, 22.0, 27.0, 30.0, 52.0, 79.0, 114.0, 143.0, 193.0, 261.0, 326.0, 429.0, 442.0, 439.0, 385.0, 283.0, 234.0, 162.0, 123.0, 84.0, 58.0, 37.0, 28.0, 24.0, 14.0, 16.0, 12.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.1875, -9.9173583984375, -9.647216796875, -9.3770751953125, -9.10693359375, -8.8367919921875, -8.566650390625, -8.2965087890625, -8.0263671875, -7.7562255859375, -7.486083984375, -7.2159423828125, -6.94580078125, -6.6756591796875, -6.405517578125, -6.1353759765625, -5.865234375, -5.5950927734375, -5.324951171875, -5.0548095703125, -4.78466796875, -4.5145263671875, -4.244384765625, -3.9742431640625, -3.7041015625, -3.4339599609375, -3.163818359375, -2.8936767578125, -2.62353515625, -2.3533935546875, -2.083251953125, -1.8131103515625, -1.54296875, -1.2728271484375, -1.002685546875, -0.7325439453125, -0.46240234375, -0.1922607421875, 0.077880859375, 0.3480224609375, 0.6181640625, 0.8883056640625, 1.158447265625, 1.4285888671875, 1.69873046875, 1.9688720703125, 2.239013671875, 2.5091552734375, 2.779296875, 3.0494384765625, 3.319580078125, 3.5897216796875, 3.85986328125, 4.1300048828125, 4.400146484375, 4.6702880859375, 4.9404296875, 5.2105712890625, 5.480712890625, 5.7508544921875, 6.02099609375, 6.2911376953125, 6.561279296875, 6.8314208984375, 7.1015625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 1.0, 11.0, 11.0, 22.0, 25.0, 33.0, 46.0, 73.0, 97.0, 134.0, 194.0, 392.0, 696.0, 1462.0, 3156.0, 7934.0, 21807.0, 65868.0, 219245.0, 812579.0, 1927027.0, 812157.0, 219587.0, 66129.0, 21387.0, 7992.0, 3111.0, 1377.0, 722.0, 369.0, 210.0, 118.0, 96.0, 65.0, 36.0, 36.0, 15.0, 19.0, 13.0, 9.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.7734375, -9.481689453125, -9.18994140625, -8.898193359375, -8.6064453125, -8.314697265625, -8.02294921875, -7.731201171875, -7.439453125, -7.147705078125, -6.85595703125, -6.564208984375, -6.2724609375, -5.980712890625, -5.68896484375, -5.397216796875, -5.10546875, -4.813720703125, -4.52197265625, -4.230224609375, -3.9384765625, -3.646728515625, -3.35498046875, -3.063232421875, -2.771484375, -2.479736328125, -2.18798828125, -1.896240234375, -1.6044921875, -1.312744140625, -1.02099609375, -0.729248046875, -0.4375, -0.145751953125, 0.14599609375, 0.437744140625, 0.7294921875, 1.021240234375, 1.31298828125, 1.604736328125, 1.896484375, 2.188232421875, 2.47998046875, 2.771728515625, 3.0634765625, 3.355224609375, 3.64697265625, 3.938720703125, 4.23046875, 4.522216796875, 4.81396484375, 5.105712890625, 5.3974609375, 5.689208984375, 5.98095703125, 6.272705078125, 6.564453125, 6.856201171875, 7.14794921875, 7.439697265625, 7.7314453125, 8.023193359375, 8.31494140625, 8.606689453125, 8.8984375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 14.0, 33.0, 64.0, 146.0, 197.0, 224.0, 180.0, 87.0, 46.0, 16.0, 8.0, 4.0, 1.0], "bins": [-166.586669921875, -163.6273651123047, -160.66806030273438, -157.70875549316406, -154.74945068359375, -151.7901611328125, -148.8308563232422, -145.87155151367188, -142.91224670410156, -139.95294189453125, -136.99363708496094, -134.03433227539062, -131.07504272460938, -128.11573791503906, -125.15643310546875, -122.19712829589844, -119.23782348632812, -116.27851867675781, -113.3192138671875, -110.35991668701172, -107.4006118774414, -104.4413070678711, -101.48200988769531, -98.522705078125, -95.56340026855469, -92.60409545898438, -89.64479064941406, -86.68549346923828, -83.72618865966797, -80.76688385009766, -77.80758666992188, -74.84828186035156, -71.88897705078125, -68.92967224121094, -65.97036743164062, -63.011070251464844, -60.05176544189453, -57.09246063232422, -54.13315963745117, -51.173858642578125, -48.21455383300781, -45.2552490234375, -42.29594802856445, -39.336647033691406, -36.377342224121094, -33.41803741455078, -30.458736419677734, -27.499433517456055, -24.540128707885742, -21.580825805664062, -18.621522903442383, -15.662220001220703, -12.702917098999023, -9.743614196777344, -6.784311294555664, -3.8250083923339844, -0.8657054901123047, 2.093597412109375, 5.052900314331055, 8.012203216552734, 10.971506118774414, 13.930809020996094, 16.890111923217773, 19.849414825439453, 22.808717727661133]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 2.0, 4.0, 7.0, 11.0, 19.0, 18.0, 19.0, 17.0, 17.0, 20.0, 20.0, 30.0, 28.0, 23.0, 32.0, 34.0, 32.0, 41.0, 31.0, 45.0, 36.0, 26.0, 39.0, 39.0, 42.0, 32.0, 32.0, 20.0, 36.0, 29.0, 34.0, 20.0, 17.0, 25.0, 18.0, 18.0, 16.0, 13.0, 11.0, 10.0, 13.0, 7.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-25.950992584228516, -25.153017044067383, -24.355043411254883, -23.55706787109375, -22.759092330932617, -21.961118698120117, -21.163143157958984, -20.365169525146484, -19.56719398498535, -18.76921844482422, -17.97124481201172, -17.173269271850586, -16.375293731689453, -15.577320098876953, -14.77934455871582, -13.981369972229004, -13.183394432067871, -12.385419845581055, -11.587444305419922, -10.789469718933105, -9.991495132446289, -9.193519592285156, -8.39554500579834, -7.597570419311523, -6.799595355987549, -6.001620292663574, -5.203645706176758, -4.405670642852783, -3.6076958179473877, -2.809720993041992, -2.0117459297180176, -1.2137713432312012, -0.41579627990722656, 0.3821786046028137, 1.180153489112854, 1.978128433227539, 2.7761032581329346, 3.57407808303833, 4.372053146362305, 5.170027732849121, 5.968002796173096, 6.76597785949707, 7.563952445983887, 8.361927032470703, 9.159902572631836, 9.957877159118652, 10.755851745605469, 11.553827285766602, 12.351801872253418, 13.149776458740234, 13.947751998901367, 14.745726585388184, 15.543701171875, 16.341676712036133, 17.139652252197266, 17.937625885009766, 18.7356014251709, 19.53357696533203, 20.33155059814453, 21.129526138305664, 21.927501678466797, 22.725475311279297, 23.52345085144043, 24.321426391601562, 25.119400024414062]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 6.0, 9.0, 6.0, 8.0, 11.0, 7.0, 17.0, 14.0, 19.0, 15.0, 26.0, 18.0, 27.0, 33.0, 29.0, 34.0, 33.0, 28.0, 45.0, 29.0, 38.0, 30.0, 38.0, 35.0, 32.0, 39.0, 39.0, 40.0, 30.0, 30.0, 21.0, 29.0, 19.0, 21.0, 20.0, 14.0, 17.0, 24.0, 10.0, 13.0, 11.0, 9.0, 7.0, 8.0, 5.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0], "bins": [-3.384765625, -3.28607177734375, -3.1873779296875, -3.08868408203125, -2.989990234375, -2.89129638671875, -2.7926025390625, -2.69390869140625, -2.59521484375, -2.49652099609375, -2.3978271484375, -2.29913330078125, -2.200439453125, -2.10174560546875, -2.0030517578125, -1.90435791015625, -1.8056640625, -1.70697021484375, -1.6082763671875, -1.50958251953125, -1.410888671875, -1.31219482421875, -1.2135009765625, -1.11480712890625, -1.01611328125, -0.91741943359375, -0.8187255859375, -0.72003173828125, -0.621337890625, -0.52264404296875, -0.4239501953125, -0.32525634765625, -0.2265625, -0.12786865234375, -0.0291748046875, 0.06951904296875, 0.168212890625, 0.26690673828125, 0.3656005859375, 0.46429443359375, 0.56298828125, 0.66168212890625, 0.7603759765625, 0.85906982421875, 0.957763671875, 1.05645751953125, 1.1551513671875, 1.25384521484375, 1.3525390625, 1.45123291015625, 1.5499267578125, 1.64862060546875, 1.747314453125, 1.84600830078125, 1.9447021484375, 2.04339599609375, 2.14208984375, 2.24078369140625, 2.3394775390625, 2.43817138671875, 2.536865234375, 2.63555908203125, 2.7342529296875, 2.83294677734375, 2.931640625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 8.0, 12.0, 20.0, 20.0, 29.0, 73.0, 124.0, 213.0, 329.0, 605.0, 962.0, 1591.0, 2663.0, 4500.0, 6874.0, 10735.0, 16372.0, 23960.0, 34846.0, 47187.0, 61951.0, 76277.0, 89685.0, 99208.0, 102034.0, 98073.0, 88167.0, 75139.0, 60559.0, 45799.0, 33537.0, 23505.0, 15881.0, 10464.0, 6573.0, 4230.0, 2480.0, 1605.0, 959.0, 534.0, 317.0, 171.0, 111.0, 68.0, 61.0, 20.0, 18.0, 5.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.9111328125, -1.85400390625, -1.796875, -1.73974609375, -1.6826171875, -1.62548828125, -1.568359375, -1.51123046875, -1.4541015625, -1.39697265625, -1.33984375, -1.28271484375, -1.2255859375, -1.16845703125, -1.111328125, -1.05419921875, -0.9970703125, -0.93994140625, -0.8828125, -0.82568359375, -0.7685546875, -0.71142578125, -0.654296875, -0.59716796875, -0.5400390625, -0.48291015625, -0.42578125, -0.36865234375, -0.3115234375, -0.25439453125, -0.197265625, -0.14013671875, -0.0830078125, -0.02587890625, 0.03125, 0.08837890625, 0.1455078125, 0.20263671875, 0.259765625, 0.31689453125, 0.3740234375, 0.43115234375, 0.48828125, 0.54541015625, 0.6025390625, 0.65966796875, 0.716796875, 0.77392578125, 0.8310546875, 0.88818359375, 0.9453125, 1.00244140625, 1.0595703125, 1.11669921875, 1.173828125, 1.23095703125, 1.2880859375, 1.34521484375, 1.40234375, 1.45947265625, 1.5166015625, 1.57373046875, 1.630859375, 1.68798828125, 1.7451171875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 1.0, 4.0, 0.0, 2.0, 10.0, 8.0, 8.0, 10.0, 15.0, 12.0, 11.0, 22.0, 21.0, 22.0, 28.0, 21.0, 24.0, 25.0, 29.0, 42.0, 30.0, 35.0, 35.0, 33.0, 47.0, 1060.0, 37.0, 40.0, 41.0, 33.0, 26.0, 26.0, 27.0, 33.0, 24.0, 27.0, 25.0, 16.0, 16.0, 13.0, 17.0, 9.0, 8.0, 7.0, 11.0, 6.0, 5.0, 3.0, 4.0, 5.0, 3.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.318359375, -3.21197509765625, -3.1055908203125, -2.99920654296875, -2.892822265625, -2.78643798828125, -2.6800537109375, -2.57366943359375, -2.46728515625, -2.36090087890625, -2.2545166015625, -2.14813232421875, -2.041748046875, -1.93536376953125, -1.8289794921875, -1.72259521484375, -1.6162109375, -1.50982666015625, -1.4034423828125, -1.29705810546875, -1.190673828125, -1.08428955078125, -0.9779052734375, -0.87152099609375, -0.76513671875, -0.65875244140625, -0.5523681640625, -0.44598388671875, -0.339599609375, -0.23321533203125, -0.1268310546875, -0.02044677734375, 0.0859375, 0.19232177734375, 0.2987060546875, 0.40509033203125, 0.511474609375, 0.61785888671875, 0.7242431640625, 0.83062744140625, 0.93701171875, 1.04339599609375, 1.1497802734375, 1.25616455078125, 1.362548828125, 1.46893310546875, 1.5753173828125, 1.68170166015625, 1.7880859375, 1.89447021484375, 2.0008544921875, 2.10723876953125, 2.213623046875, 2.32000732421875, 2.4263916015625, 2.53277587890625, 2.63916015625, 2.74554443359375, 2.8519287109375, 2.95831298828125, 3.064697265625, 3.17108154296875, 3.2774658203125, 3.38385009765625, 3.490234375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 16.0, 13.0, 29.0, 26.0, 56.0, 69.0, 104.0, 141.0, 236.0, 312.0, 462.0, 743.0, 1008.0, 1576.0, 2212.0, 3254.0, 4865.0, 7004.0, 10415.0, 15758.0, 26883.0, 69885.0, 1423346.0, 413670.0, 48905.0, 22776.0, 14042.0, 9239.0, 6224.0, 4429.0, 3059.0, 2085.0, 1371.0, 937.0, 611.0, 453.0, 271.0, 215.0, 156.0, 93.0, 55.0, 40.0, 27.0, 25.0, 16.0, 4.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.46484375, -3.352569580078125, -3.24029541015625, -3.128021240234375, -3.0157470703125, -2.903472900390625, -2.79119873046875, -2.678924560546875, -2.566650390625, -2.454376220703125, -2.34210205078125, -2.229827880859375, -2.1175537109375, -2.005279541015625, -1.89300537109375, -1.780731201171875, -1.66845703125, -1.556182861328125, -1.44390869140625, -1.331634521484375, -1.2193603515625, -1.107086181640625, -0.99481201171875, -0.882537841796875, -0.770263671875, -0.657989501953125, -0.54571533203125, -0.433441162109375, -0.3211669921875, -0.208892822265625, -0.09661865234375, 0.015655517578125, 0.1279296875, 0.240203857421875, 0.35247802734375, 0.464752197265625, 0.5770263671875, 0.689300537109375, 0.80157470703125, 0.913848876953125, 1.026123046875, 1.138397216796875, 1.25067138671875, 1.362945556640625, 1.4752197265625, 1.587493896484375, 1.69976806640625, 1.812042236328125, 1.92431640625, 2.036590576171875, 2.14886474609375, 2.261138916015625, 2.3734130859375, 2.485687255859375, 2.59796142578125, 2.710235595703125, 2.822509765625, 2.934783935546875, 3.04705810546875, 3.159332275390625, 3.2716064453125, 3.383880615234375, 3.49615478515625, 3.608428955078125, 3.720703125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 13.0, 16.0, 14.0, 29.0, 23.0, 32.0, 38.0, 34.0, 40.0, 50.0, 49.0, 48.0, 55.0, 44.0, 42.0, 41.0, 59.0, 45.0, 53.0, 43.0, 34.0, 44.0, 21.0, 25.0, 17.0, 19.0, 16.0, 15.0, 8.0, 6.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.314208984375, -0.30356597900390625, -0.2929229736328125, -0.28227996826171875, -0.271636962890625, -0.26099395751953125, -0.2503509521484375, -0.23970794677734375, -0.22906494140625, -0.21842193603515625, -0.2077789306640625, -0.19713592529296875, -0.186492919921875, -0.17584991455078125, -0.1652069091796875, -0.15456390380859375, -0.1439208984375, -0.13327789306640625, -0.1226348876953125, -0.11199188232421875, -0.101348876953125, -0.09070587158203125, -0.0800628662109375, -0.06941986083984375, -0.05877685546875, -0.04813385009765625, -0.0374908447265625, -0.02684783935546875, -0.016204833984375, -0.00556182861328125, 0.0050811767578125, 0.01572418212890625, 0.0263671875, 0.03701019287109375, 0.0476531982421875, 0.05829620361328125, 0.068939208984375, 0.07958221435546875, 0.0902252197265625, 0.10086822509765625, 0.11151123046875, 0.12215423583984375, 0.1327972412109375, 0.14344024658203125, 0.154083251953125, 0.16472625732421875, 0.1753692626953125, 0.18601226806640625, 0.1966552734375, 0.20729827880859375, 0.2179412841796875, 0.22858428955078125, 0.239227294921875, 0.24987030029296875, 0.2605133056640625, 0.27115631103515625, 0.28179931640625, 0.29244232177734375, 0.3030853271484375, 0.31372833251953125, 0.324371337890625, 0.33501434326171875, 0.3456573486328125, 0.35630035400390625, 0.366943359375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 7.0, 7.0, 9.0, 14.0, 16.0, 17.0, 28.0, 26.0, 46.0, 38.0, 89.0, 111.0, 160.0, 196.0, 301.0, 370.0, 698.0, 4755.0, 230957.0, 788768.0, 18988.0, 1200.0, 477.0, 321.0, 261.0, 189.0, 145.0, 97.0, 80.0, 56.0, 38.0, 32.0, 18.0, 16.0, 8.0, 5.0, 4.0, 1.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.52734375, -5.370361328125, -5.21337890625, -5.056396484375, -4.8994140625, -4.742431640625, -4.58544921875, -4.428466796875, -4.271484375, -4.114501953125, -3.95751953125, -3.800537109375, -3.6435546875, -3.486572265625, -3.32958984375, -3.172607421875, -3.015625, -2.858642578125, -2.70166015625, -2.544677734375, -2.3876953125, -2.230712890625, -2.07373046875, -1.916748046875, -1.759765625, -1.602783203125, -1.44580078125, -1.288818359375, -1.1318359375, -0.974853515625, -0.81787109375, -0.660888671875, -0.50390625, -0.346923828125, -0.18994140625, -0.032958984375, 0.1240234375, 0.281005859375, 0.43798828125, 0.594970703125, 0.751953125, 0.908935546875, 1.06591796875, 1.222900390625, 1.3798828125, 1.536865234375, 1.69384765625, 1.850830078125, 2.0078125, 2.164794921875, 2.32177734375, 2.478759765625, 2.6357421875, 2.792724609375, 2.94970703125, 3.106689453125, 3.263671875, 3.420654296875, 3.57763671875, 3.734619140625, 3.8916015625, 4.048583984375, 4.20556640625, 4.362548828125, 4.51953125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 31.0, 248.0, 589.0, 118.0, 18.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.230270385742188, -20.74041175842285, -20.250551223754883, -19.760692596435547, -19.27083396911621, -18.780973434448242, -18.291114807128906, -17.80125617980957, -17.3113956451416, -16.821537017822266, -16.331676483154297, -15.841817855834961, -15.351958274841309, -14.862098693847656, -14.37224006652832, -13.882380485534668, -13.392521858215332, -12.90266227722168, -12.412803649902344, -11.922944068908691, -11.433084487915039, -10.943225860595703, -10.45336627960205, -9.963506698608398, -9.473648071289062, -8.98378849029541, -8.493929862976074, -8.004070281982422, -7.5142107009887695, -7.024351596832275, -6.534492492675781, -6.044632911682129, -5.55477237701416, -5.064913272857666, -4.575053691864014, -4.0851945877075195, -3.5953352451324463, -3.105475902557373, -2.615616798400879, -2.1257574558258057, -1.6358981132507324, -1.1460387706756592, -0.6561795473098755, -0.1663203239440918, 0.32353901863098145, 0.8133983612060547, 1.3032574653625488, 1.793116807937622, 2.2829761505126953, 2.7728354930877686, 3.262694835662842, 3.752553939819336, 4.242413520812988, 4.732272624969482, 5.222131729125977, 5.711991310119629, 6.201850414276123, 6.691709518432617, 7.1815690994262695, 7.671428203582764, 8.161287307739258, 8.65114688873291, 9.141006469726562, 9.630865097045898, 10.12072467803955]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 8.0, 14.0, 10.0, 13.0, 19.0, 28.0, 25.0, 19.0, 33.0, 37.0, 46.0, 42.0, 46.0, 49.0, 69.0, 42.0, 49.0, 45.0, 40.0, 51.0, 33.0, 48.0, 45.0, 25.0, 23.0, 26.0, 24.0, 17.0, 15.0, 11.0, 7.0, 12.0, 5.0, 5.0, 0.0, 8.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.898587942123413, -2.806439161300659, -2.7142903804779053, -2.6221415996551514, -2.5299928188323975, -2.4378440380096436, -2.3456954956054688, -2.253546714782715, -2.161397933959961, -2.069249153137207, -1.9771003723144531, -1.8849515914916992, -1.7928028106689453, -1.7006540298461914, -1.608505368232727, -1.5163565874099731, -1.4242076873779297, -1.3320589065551758, -1.2399101257324219, -1.147761344909668, -1.055612564086914, -0.9634638428688049, -0.8713151216506958, -0.7791663408279419, -0.687017560005188, -0.5948687791824341, -0.5027199983596802, -0.41057127714157104, -0.31842249631881714, -0.22627371549606323, -0.1341249942779541, -0.041976213455200195, 0.05017280578613281, 0.14232157170772552, 0.23447033762931824, 0.32661908864974976, 0.41876786947250366, 0.5109166502952576, 0.6030653715133667, 0.6952141523361206, 0.7873629331588745, 0.8795117139816284, 0.9716604948043823, 1.0638091564178467, 1.1559579372406006, 1.2481067180633545, 1.3402554988861084, 1.4324042797088623, 1.5245530605316162, 1.6167018413543701, 1.708850622177124, 1.800999402999878, 1.8931481838226318, 1.9852969646453857, 2.0774455070495605, 2.1695942878723145, 2.2617430686950684, 2.3538918495178223, 2.446040630340576, 2.53818941116333, 2.630338191986084, 2.722486972808838, 2.814635753631592, 2.9067845344543457, 2.9989333152770996]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 7.0, 11.0, 13.0, 19.0, 15.0, 20.0, 9.0, 18.0, 20.0, 24.0, 31.0, 39.0, 26.0, 27.0, 36.0, 37.0, 34.0, 36.0, 42.0, 37.0, 38.0, 41.0, 32.0, 41.0, 36.0, 33.0, 19.0, 29.0, 28.0, 28.0, 23.0, 19.0, 20.0, 12.0, 11.0, 16.0, 12.0, 9.0, 15.0, 8.0, 5.0, 5.0, 7.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3515625, -3.248504638671875, -3.14544677734375, -3.042388916015625, -2.9393310546875, -2.836273193359375, -2.73321533203125, -2.630157470703125, -2.527099609375, -2.424041748046875, -2.32098388671875, -2.217926025390625, -2.1148681640625, -2.011810302734375, -1.90875244140625, -1.805694580078125, -1.70263671875, -1.599578857421875, -1.49652099609375, -1.393463134765625, -1.2904052734375, -1.187347412109375, -1.08428955078125, -0.981231689453125, -0.878173828125, -0.775115966796875, -0.67205810546875, -0.569000244140625, -0.4659423828125, -0.362884521484375, -0.25982666015625, -0.156768798828125, -0.0537109375, 0.049346923828125, 0.15240478515625, 0.255462646484375, 0.3585205078125, 0.461578369140625, 0.56463623046875, 0.667694091796875, 0.770751953125, 0.873809814453125, 0.97686767578125, 1.079925537109375, 1.1829833984375, 1.286041259765625, 1.38909912109375, 1.492156982421875, 1.59521484375, 1.698272705078125, 1.80133056640625, 1.904388427734375, 2.0074462890625, 2.110504150390625, 2.21356201171875, 2.316619873046875, 2.419677734375, 2.522735595703125, 2.62579345703125, 2.728851318359375, 2.8319091796875, 2.934967041015625, 3.03802490234375, 3.141082763671875, 3.244140625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 7.0, 15.0, 15.0, 24.0, 41.0, 38.0, 64.0, 85.0, 119.0, 207.0, 306.0, 419.0, 650.0, 986.0, 1397.0, 2104.0, 3239.0, 5056.0, 8608.0, 14433.0, 25537.0, 46037.0, 85497.0, 169714.0, 319750.0, 169635.0, 85187.0, 46069.0, 25548.0, 14413.0, 8473.0, 5179.0, 3277.0, 2099.0, 1415.0, 916.0, 679.0, 452.0, 283.0, 188.0, 131.0, 89.0, 44.0, 47.0, 34.0, 15.0, 9.0, 6.0, 8.0, 6.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.8984375, -2.80340576171875, -2.7083740234375, -2.61334228515625, -2.518310546875, -2.42327880859375, -2.3282470703125, -2.23321533203125, -2.13818359375, -2.04315185546875, -1.9481201171875, -1.85308837890625, -1.758056640625, -1.66302490234375, -1.5679931640625, -1.47296142578125, -1.3779296875, -1.28289794921875, -1.1878662109375, -1.09283447265625, -0.997802734375, -0.90277099609375, -0.8077392578125, -0.71270751953125, -0.61767578125, -0.52264404296875, -0.4276123046875, -0.33258056640625, -0.237548828125, -0.14251708984375, -0.0474853515625, 0.04754638671875, 0.142578125, 0.23760986328125, 0.3326416015625, 0.42767333984375, 0.522705078125, 0.61773681640625, 0.7127685546875, 0.80780029296875, 0.90283203125, 0.99786376953125, 1.0928955078125, 1.18792724609375, 1.282958984375, 1.37799072265625, 1.4730224609375, 1.56805419921875, 1.6630859375, 1.75811767578125, 1.8531494140625, 1.94818115234375, 2.043212890625, 2.13824462890625, 2.2332763671875, 2.32830810546875, 2.42333984375, 2.51837158203125, 2.6134033203125, 2.70843505859375, 2.803466796875, 2.89849853515625, 2.9935302734375, 3.08856201171875, 3.18359375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 3.0, 3.0, 5.0, 9.0, 11.0, 10.0, 19.0, 13.0, 21.0, 24.0, 22.0, 22.0, 25.0, 25.0, 44.0, 42.0, 39.0, 40.0, 66.0, 101.0, 203.0, 1449.0, 268.0, 119.0, 54.0, 46.0, 49.0, 35.0, 37.0, 39.0, 25.0, 31.0, 24.0, 17.0, 11.0, 14.0, 13.0, 12.0, 7.0, 6.0, 7.0, 6.0, 5.0, 7.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 4.0], "bins": [-13.2421875, -12.83740234375, -12.4326171875, -12.02783203125, -11.623046875, -11.21826171875, -10.8134765625, -10.40869140625, -10.00390625, -9.59912109375, -9.1943359375, -8.78955078125, -8.384765625, -7.97998046875, -7.5751953125, -7.17041015625, -6.765625, -6.36083984375, -5.9560546875, -5.55126953125, -5.146484375, -4.74169921875, -4.3369140625, -3.93212890625, -3.52734375, -3.12255859375, -2.7177734375, -2.31298828125, -1.908203125, -1.50341796875, -1.0986328125, -0.69384765625, -0.2890625, 0.11572265625, 0.5205078125, 0.92529296875, 1.330078125, 1.73486328125, 2.1396484375, 2.54443359375, 2.94921875, 3.35400390625, 3.7587890625, 4.16357421875, 4.568359375, 4.97314453125, 5.3779296875, 5.78271484375, 6.1875, 6.59228515625, 6.9970703125, 7.40185546875, 7.806640625, 8.21142578125, 8.6162109375, 9.02099609375, 9.42578125, 9.83056640625, 10.2353515625, 10.64013671875, 11.044921875, 11.44970703125, 11.8544921875, 12.25927734375, 12.6640625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 11.0, 11.0, 8.0, 17.0, 29.0, 22.0, 39.0, 50.0, 88.0, 113.0, 191.0, 273.0, 509.0, 1462.0, 8187.0, 230454.0, 2843269.0, 54994.0, 3806.0, 932.0, 452.0, 255.0, 145.0, 104.0, 74.0, 48.0, 38.0, 29.0, 26.0, 12.0, 9.0, 9.0, 5.0, 9.0, 7.0, 3.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.796875, -26.038330078125, -25.27978515625, -24.521240234375, -23.7626953125, -23.004150390625, -22.24560546875, -21.487060546875, -20.728515625, -19.969970703125, -19.21142578125, -18.452880859375, -17.6943359375, -16.935791015625, -16.17724609375, -15.418701171875, -14.66015625, -13.901611328125, -13.14306640625, -12.384521484375, -11.6259765625, -10.867431640625, -10.10888671875, -9.350341796875, -8.591796875, -7.833251953125, -7.07470703125, -6.316162109375, -5.5576171875, -4.799072265625, -4.04052734375, -3.281982421875, -2.5234375, -1.764892578125, -1.00634765625, -0.247802734375, 0.5107421875, 1.269287109375, 2.02783203125, 2.786376953125, 3.544921875, 4.303466796875, 5.06201171875, 5.820556640625, 6.5791015625, 7.337646484375, 8.09619140625, 8.854736328125, 9.61328125, 10.371826171875, 11.13037109375, 11.888916015625, 12.6474609375, 13.406005859375, 14.16455078125, 14.923095703125, 15.681640625, 16.440185546875, 17.19873046875, 17.957275390625, 18.7158203125, 19.474365234375, 20.23291015625, 20.991455078125, 21.75]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 16.0, 957.0, 46.0], "bins": [-669.2406616210938, -658.5440063476562, -647.8473510742188, -637.1506958007812, -626.4541015625, -615.7574462890625, -605.060791015625, -594.3641357421875, -583.66748046875, -572.9708251953125, -562.274169921875, -551.5775146484375, -540.880859375, -530.1842651367188, -519.4876098632812, -508.79095458984375, -498.09429931640625, -487.39764404296875, -476.70098876953125, -466.0043640136719, -455.3077087402344, -444.6110534667969, -433.9144287109375, -423.2177734375, -412.5211181640625, -401.824462890625, -391.1278076171875, -380.4311828613281, -369.7345275878906, -359.0378723144531, -348.34124755859375, -337.64459228515625, -326.94793701171875, -316.25128173828125, -305.55462646484375, -294.8580017089844, -284.1613464355469, -273.4646911621094, -262.76806640625, -252.0714111328125, -241.374755859375, -230.6781005859375, -219.98146057128906, -209.28482055664062, -198.58816528320312, -187.89151000976562, -177.1948699951172, -166.49822998046875, -155.80157470703125, -145.10491943359375, -134.4082794189453, -123.71163177490234, -113.01498413085938, -102.3183364868164, -91.62168884277344, -80.92504119873047, -70.22840118408203, -59.53175354003906, -48.835105895996094, -38.138458251953125, -27.441810607910156, -16.745162963867188, -6.048515319824219, 4.64813232421875, 15.344782829284668]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 11.0, 7.0, 8.0, 4.0, 6.0, 14.0, 15.0, 14.0, 17.0, 24.0, 16.0, 22.0, 23.0, 30.0, 31.0, 38.0, 48.0, 46.0, 46.0, 41.0, 43.0, 45.0, 39.0, 48.0, 49.0, 40.0, 37.0, 34.0, 31.0, 33.0, 30.0, 22.0, 24.0, 14.0, 11.0, 9.0, 11.0, 9.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-45.36420440673828, -43.96215057373047, -42.560096740722656, -41.158042907714844, -39.75598907470703, -38.35393524169922, -36.951881408691406, -35.54983139038086, -34.14777755737305, -32.745723724365234, -31.343669891357422, -29.94161605834961, -28.53956413269043, -27.137510299682617, -25.735456466674805, -24.333404541015625, -22.93134880065918, -21.529294967651367, -20.127241134643555, -18.725189208984375, -17.323135375976562, -15.92108154296875, -14.519027709960938, -13.116974830627441, -11.714920997619629, -10.312867164611816, -8.91081428527832, -7.508760452270508, -6.1067070960998535, -4.704653739929199, -3.3025999069213867, -1.9005470275878906, -0.4984931945800781, 0.9035602807998657, 2.3056137561798096, 3.707667350769043, 5.109720706939697, 6.511774063110352, 7.913827896118164, 9.31588077545166, 10.717934608459473, 12.119988441467285, 13.522041320800781, 14.924095153808594, 16.326148986816406, 17.72820281982422, 19.13025665283203, 20.53230857849121, 21.934362411499023, 23.336416244506836, 24.73847007751465, 26.140522003173828, 27.54257583618164, 28.944629669189453, 30.346683502197266, 31.748737335205078, 33.15079116821289, 34.5528450012207, 35.954898834228516, 37.35695266723633, 38.75900650024414, 40.16105651855469, 41.5631103515625, 42.96516418457031, 44.367218017578125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 5.0, 3.0, 5.0, 8.0, 8.0, 6.0, 12.0, 6.0, 16.0, 18.0, 24.0, 25.0, 27.0, 23.0, 27.0, 22.0, 27.0, 29.0, 49.0, 47.0, 25.0, 40.0, 39.0, 46.0, 37.0, 33.0, 39.0, 29.0, 31.0, 38.0, 27.0, 20.0, 23.0, 19.0, 25.0, 13.0, 29.0, 16.0, 12.0, 14.0, 13.0, 7.0, 7.0, 6.0, 3.0, 6.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.44921875, -3.34283447265625, -3.2364501953125, -3.13006591796875, -3.023681640625, -2.91729736328125, -2.8109130859375, -2.70452880859375, -2.59814453125, -2.49176025390625, -2.3853759765625, -2.27899169921875, -2.172607421875, -2.06622314453125, -1.9598388671875, -1.85345458984375, -1.7470703125, -1.64068603515625, -1.5343017578125, -1.42791748046875, -1.321533203125, -1.21514892578125, -1.1087646484375, -1.00238037109375, -0.89599609375, -0.78961181640625, -0.6832275390625, -0.57684326171875, -0.470458984375, -0.36407470703125, -0.2576904296875, -0.15130615234375, -0.044921875, 0.06146240234375, 0.1678466796875, 0.27423095703125, 0.380615234375, 0.48699951171875, 0.5933837890625, 0.69976806640625, 0.80615234375, 0.91253662109375, 1.0189208984375, 1.12530517578125, 1.231689453125, 1.33807373046875, 1.4444580078125, 1.55084228515625, 1.6572265625, 1.76361083984375, 1.8699951171875, 1.97637939453125, 2.082763671875, 2.18914794921875, 2.2955322265625, 2.40191650390625, 2.50830078125, 2.61468505859375, 2.7210693359375, 2.82745361328125, 2.933837890625, 3.04022216796875, 3.1466064453125, 3.25299072265625, 3.359375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 5.0, 11.0, 12.0, 16.0, 32.0, 53.0, 65.0, 104.0, 177.0, 283.0, 426.0, 711.0, 1261.0, 2167.0, 3812.0, 7225.0, 14149.0, 28658.0, 62692.0, 152263.0, 417988.0, 1026675.0, 1335476.0, 703336.0, 253989.0, 97082.0, 42654.0, 20346.0, 10114.0, 5443.0, 2855.0, 1626.0, 971.0, 602.0, 334.0, 235.0, 147.0, 96.0, 75.0, 31.0, 27.0, 11.0, 17.0, 10.0, 6.0, 1.0, 4.0, 6.0, 1.0, 1.0, 3.0], "bins": [-4.75390625, -4.61907958984375, -4.4842529296875, -4.34942626953125, -4.214599609375, -4.07977294921875, -3.9449462890625, -3.81011962890625, -3.67529296875, -3.54046630859375, -3.4056396484375, -3.27081298828125, -3.135986328125, -3.00115966796875, -2.8663330078125, -2.73150634765625, -2.5966796875, -2.46185302734375, -2.3270263671875, -2.19219970703125, -2.057373046875, -1.92254638671875, -1.7877197265625, -1.65289306640625, -1.51806640625, -1.38323974609375, -1.2484130859375, -1.11358642578125, -0.978759765625, -0.84393310546875, -0.7091064453125, -0.57427978515625, -0.439453125, -0.30462646484375, -0.1697998046875, -0.03497314453125, 0.099853515625, 0.23468017578125, 0.3695068359375, 0.50433349609375, 0.63916015625, 0.77398681640625, 0.9088134765625, 1.04364013671875, 1.178466796875, 1.31329345703125, 1.4481201171875, 1.58294677734375, 1.7177734375, 1.85260009765625, 1.9874267578125, 2.12225341796875, 2.257080078125, 2.39190673828125, 2.5267333984375, 2.66156005859375, 2.79638671875, 2.93121337890625, 3.0660400390625, 3.20086669921875, 3.335693359375, 3.47052001953125, 3.6053466796875, 3.74017333984375, 3.875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 10.0, 19.0, 22.0, 15.0, 36.0, 29.0, 52.0, 69.0, 90.0, 133.0, 192.0, 234.0, 320.0, 379.0, 459.0, 436.0, 391.0, 330.0, 239.0, 161.0, 115.0, 93.0, 63.0, 37.0, 35.0, 25.0, 24.0, 15.0, 6.0, 6.0, 6.0, 7.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0], "bins": [-10.4140625, -10.1396484375, -9.865234375, -9.5908203125, -9.31640625, -9.0419921875, -8.767578125, -8.4931640625, -8.21875, -7.9443359375, -7.669921875, -7.3955078125, -7.12109375, -6.8466796875, -6.572265625, -6.2978515625, -6.0234375, -5.7490234375, -5.474609375, -5.2001953125, -4.92578125, -4.6513671875, -4.376953125, -4.1025390625, -3.828125, -3.5537109375, -3.279296875, -3.0048828125, -2.73046875, -2.4560546875, -2.181640625, -1.9072265625, -1.6328125, -1.3583984375, -1.083984375, -0.8095703125, -0.53515625, -0.2607421875, 0.013671875, 0.2880859375, 0.5625, 0.8369140625, 1.111328125, 1.3857421875, 1.66015625, 1.9345703125, 2.208984375, 2.4833984375, 2.7578125, 3.0322265625, 3.306640625, 3.5810546875, 3.85546875, 4.1298828125, 4.404296875, 4.6787109375, 4.953125, 5.2275390625, 5.501953125, 5.7763671875, 6.05078125, 6.3251953125, 6.599609375, 6.8740234375, 7.1484375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 15.0, 15.0, 24.0, 38.0, 58.0, 118.0, 195.0, 376.0, 825.0, 1987.0, 5273.0, 16667.0, 62353.0, 269637.0, 1316463.0, 1937105.0, 447327.0, 98591.0, 25069.0, 7501.0, 2524.0, 1045.0, 480.0, 257.0, 139.0, 69.0, 48.0, 31.0, 14.0, 19.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.796875, -12.4429931640625, -12.089111328125, -11.7352294921875, -11.38134765625, -11.0274658203125, -10.673583984375, -10.3197021484375, -9.9658203125, -9.6119384765625, -9.258056640625, -8.9041748046875, -8.55029296875, -8.1964111328125, -7.842529296875, -7.4886474609375, -7.134765625, -6.7808837890625, -6.427001953125, -6.0731201171875, -5.71923828125, -5.3653564453125, -5.011474609375, -4.6575927734375, -4.3037109375, -3.9498291015625, -3.595947265625, -3.2420654296875, -2.88818359375, -2.5343017578125, -2.180419921875, -1.8265380859375, -1.47265625, -1.1187744140625, -0.764892578125, -0.4110107421875, -0.05712890625, 0.2967529296875, 0.650634765625, 1.0045166015625, 1.3583984375, 1.7122802734375, 2.066162109375, 2.4200439453125, 2.77392578125, 3.1278076171875, 3.481689453125, 3.8355712890625, 4.189453125, 4.5433349609375, 4.897216796875, 5.2510986328125, 5.60498046875, 5.9588623046875, 6.312744140625, 6.6666259765625, 7.0205078125, 7.3743896484375, 7.728271484375, 8.0821533203125, 8.43603515625, 8.7899169921875, 9.143798828125, 9.4976806640625, 9.8515625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 12.0, 22.0, 54.0, 106.0, 143.0, 175.0, 191.0, 136.0, 89.0, 51.0, 18.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.42951965332031, -95.8375244140625, -93.24552917480469, -90.65353393554688, -88.06153106689453, -85.46953582763672, -82.8775405883789, -80.2855453491211, -77.69355010986328, -75.10155487060547, -72.50955963134766, -69.91755676269531, -67.3255615234375, -64.73356628417969, -62.141571044921875, -59.54957580566406, -56.957576751708984, -54.36558151245117, -51.773582458496094, -49.18158721923828, -46.58959197998047, -43.997596740722656, -41.40559768676758, -38.813602447509766, -36.22160339355469, -33.629608154296875, -31.03761100769043, -28.445613861083984, -25.853618621826172, -23.261621475219727, -20.66962432861328, -18.07762908935547, -15.485633850097656, -12.893637657165527, -10.301641464233398, -7.709644317626953, -5.117648124694824, -2.5256519317626953, 0.06634521484375, 2.6583404541015625, 5.250337600708008, 7.842333793640137, 10.434329986572266, 13.026327133178711, 15.61832332611084, 18.21031951904297, 20.802316665649414, 23.394311904907227, 25.986309051513672, 28.578306198120117, 31.17030143737793, 33.762298583984375, 36.35429382324219, 38.9462890625, 41.53828811645508, 44.13028335571289, 46.72228240966797, 49.31427764892578, 51.90627670288086, 54.49827194213867, 57.090267181396484, 59.68226623535156, 62.274261474609375, 64.86625671386719, 67.458251953125]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 6.0, 5.0, 6.0, 9.0, 13.0, 9.0, 8.0, 10.0, 14.0, 16.0, 16.0, 20.0, 26.0, 26.0, 27.0, 40.0, 34.0, 20.0, 28.0, 37.0, 34.0, 35.0, 36.0, 35.0, 28.0, 34.0, 33.0, 29.0, 25.0, 22.0, 27.0, 24.0, 30.0, 33.0, 21.0, 14.0, 20.0, 8.0, 26.0, 13.0, 16.0, 20.0, 7.0, 7.0, 7.0, 9.0, 3.0, 6.0, 9.0, 6.0, 4.0, 6.0, 2.0, 0.0, 1.0, 3.0], "bins": [-23.531768798828125, -22.810823440551758, -22.08987808227539, -21.36893081665039, -20.647985458374023, -19.927040100097656, -19.206092834472656, -18.48514747619629, -17.764202117919922, -17.043256759643555, -16.322311401367188, -15.601364135742188, -14.88041877746582, -14.159473419189453, -13.43852710723877, -12.717580795288086, -11.996635437011719, -11.275690078735352, -10.554743766784668, -9.833797454833984, -9.112852096557617, -8.39190673828125, -7.670960426330566, -6.950014591217041, -6.229068756103516, -5.50812292098999, -4.787177085876465, -4.0662312507629395, -3.345285415649414, -2.6243395805358887, -1.9033937454223633, -1.182447910308838, -0.4615020751953125, 0.2594437599182129, 0.9803895950317383, 1.7013354301452637, 2.422281265258789, 3.1432271003723145, 3.86417293548584, 4.585118770599365, 5.306064605712891, 6.027010440826416, 6.747956275939941, 7.468902111053467, 8.189847946166992, 8.91079330444336, 9.631739616394043, 10.352685928344727, 11.073631286621094, 11.794576644897461, 12.515522956848145, 13.236469268798828, 13.957414627075195, 14.678359985351562, 15.399306297302246, 16.12025260925293, 16.841197967529297, 17.562143325805664, 18.28308868408203, 19.00403594970703, 19.7249813079834, 20.445926666259766, 21.166873931884766, 21.887819290161133, 22.6087646484375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 2.0, 7.0, 11.0, 14.0, 6.0, 7.0, 15.0, 15.0, 15.0, 20.0, 19.0, 33.0, 27.0, 31.0, 25.0, 33.0, 24.0, 36.0, 27.0, 45.0, 50.0, 27.0, 44.0, 40.0, 26.0, 34.0, 24.0, 19.0, 27.0, 27.0, 32.0, 26.0, 24.0, 23.0, 23.0, 13.0, 21.0, 15.0, 19.0, 11.0, 8.0, 6.0, 4.0, 6.0, 9.0, 9.0, 10.0, 0.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.037109375, -2.93719482421875, -2.8372802734375, -2.73736572265625, -2.637451171875, -2.53753662109375, -2.4376220703125, -2.33770751953125, -2.23779296875, -2.13787841796875, -2.0379638671875, -1.93804931640625, -1.838134765625, -1.73822021484375, -1.6383056640625, -1.53839111328125, -1.4384765625, -1.33856201171875, -1.2386474609375, -1.13873291015625, -1.038818359375, -0.93890380859375, -0.8389892578125, -0.73907470703125, -0.63916015625, -0.53924560546875, -0.4393310546875, -0.33941650390625, -0.239501953125, -0.13958740234375, -0.0396728515625, 0.06024169921875, 0.16015625, 0.26007080078125, 0.3599853515625, 0.45989990234375, 0.559814453125, 0.65972900390625, 0.7596435546875, 0.85955810546875, 0.95947265625, 1.05938720703125, 1.1593017578125, 1.25921630859375, 1.359130859375, 1.45904541015625, 1.5589599609375, 1.65887451171875, 1.7587890625, 1.85870361328125, 1.9586181640625, 2.05853271484375, 2.158447265625, 2.25836181640625, 2.3582763671875, 2.45819091796875, 2.55810546875, 2.65802001953125, 2.7579345703125, 2.85784912109375, 2.957763671875, 3.05767822265625, 3.1575927734375, 3.25750732421875, 3.357421875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 10.0, 4.0, 18.0, 33.0, 57.0, 89.0, 161.0, 273.0, 450.0, 681.0, 1188.0, 1974.0, 3321.0, 5306.0, 8492.0, 12804.0, 19767.0, 29199.0, 41366.0, 55201.0, 71825.0, 87519.0, 98711.0, 106017.0, 104298.0, 95100.0, 81561.0, 65796.0, 50006.0, 36227.0, 25306.0, 16842.0, 10876.0, 7006.0, 4256.0, 2698.0, 1667.0, 940.0, 582.0, 368.0, 216.0, 132.0, 75.0, 58.0, 28.0, 21.0, 13.0, 7.0, 7.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.064453125, -2.0051422119140625, -1.945831298828125, -1.8865203857421875, -1.82720947265625, -1.7678985595703125, -1.708587646484375, -1.6492767333984375, -1.5899658203125, -1.5306549072265625, -1.471343994140625, -1.4120330810546875, -1.35272216796875, -1.2934112548828125, -1.234100341796875, -1.1747894287109375, -1.115478515625, -1.0561676025390625, -0.996856689453125, -0.9375457763671875, -0.87823486328125, -0.8189239501953125, -0.759613037109375, -0.7003021240234375, -0.6409912109375, -0.5816802978515625, -0.522369384765625, -0.4630584716796875, -0.40374755859375, -0.3444366455078125, -0.285125732421875, -0.2258148193359375, -0.16650390625, -0.1071929931640625, -0.047882080078125, 0.0114288330078125, 0.07073974609375, 0.1300506591796875, 0.189361572265625, 0.2486724853515625, 0.3079833984375, 0.3672943115234375, 0.426605224609375, 0.4859161376953125, 0.54522705078125, 0.6045379638671875, 0.663848876953125, 0.7231597900390625, 0.782470703125, 0.8417816162109375, 0.901092529296875, 0.9604034423828125, 1.01971435546875, 1.0790252685546875, 1.138336181640625, 1.1976470947265625, 1.2569580078125, 1.3162689208984375, 1.375579833984375, 1.4348907470703125, 1.49420166015625, 1.5535125732421875, 1.612823486328125, 1.6721343994140625, 1.7314453125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 5.0, 5.0, 6.0, 13.0, 8.0, 13.0, 24.0, 20.0, 22.0, 25.0, 26.0, 27.0, 36.0, 27.0, 32.0, 39.0, 40.0, 32.0, 31.0, 38.0, 1061.0, 25.0, 42.0, 31.0, 28.0, 35.0, 41.0, 32.0, 29.0, 31.0, 38.0, 23.0, 20.0, 16.0, 22.0, 20.0, 16.0, 11.0, 10.0, 8.0, 8.0, 7.0, 5.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.09375, -3.97528076171875, -3.8568115234375, -3.73834228515625, -3.619873046875, -3.50140380859375, -3.3829345703125, -3.26446533203125, -3.14599609375, -3.02752685546875, -2.9090576171875, -2.79058837890625, -2.672119140625, -2.55364990234375, -2.4351806640625, -2.31671142578125, -2.1982421875, -2.07977294921875, -1.9613037109375, -1.84283447265625, -1.724365234375, -1.60589599609375, -1.4874267578125, -1.36895751953125, -1.25048828125, -1.13201904296875, -1.0135498046875, -0.89508056640625, -0.776611328125, -0.65814208984375, -0.5396728515625, -0.42120361328125, -0.302734375, -0.18426513671875, -0.0657958984375, 0.05267333984375, 0.171142578125, 0.28961181640625, 0.4080810546875, 0.52655029296875, 0.64501953125, 0.76348876953125, 0.8819580078125, 1.00042724609375, 1.118896484375, 1.23736572265625, 1.3558349609375, 1.47430419921875, 1.5927734375, 1.71124267578125, 1.8297119140625, 1.94818115234375, 2.066650390625, 2.18511962890625, 2.3035888671875, 2.42205810546875, 2.54052734375, 2.65899658203125, 2.7774658203125, 2.89593505859375, 3.014404296875, 3.13287353515625, 3.2513427734375, 3.36981201171875, 3.48828125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 6.0, 9.0, 9.0, 18.0, 10.0, 32.0, 33.0, 57.0, 68.0, 112.0, 136.0, 212.0, 279.0, 424.0, 628.0, 950.0, 1282.0, 1849.0, 2663.0, 3828.0, 5364.0, 7487.0, 10923.0, 15527.0, 25408.0, 65596.0, 1220931.0, 604617.0, 54883.0, 23720.0, 14828.0, 10240.0, 7413.0, 5211.0, 3716.0, 2548.0, 1826.0, 1312.0, 900.0, 649.0, 427.0, 278.0, 199.0, 148.0, 112.0, 87.0, 58.0, 38.0, 27.0, 19.0, 15.0, 9.0, 3.0, 8.0, 3.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.0078125, -2.90386962890625, -2.7999267578125, -2.69598388671875, -2.592041015625, -2.48809814453125, -2.3841552734375, -2.28021240234375, -2.17626953125, -2.07232666015625, -1.9683837890625, -1.86444091796875, -1.760498046875, -1.65655517578125, -1.5526123046875, -1.44866943359375, -1.3447265625, -1.24078369140625, -1.1368408203125, -1.03289794921875, -0.928955078125, -0.82501220703125, -0.7210693359375, -0.61712646484375, -0.51318359375, -0.40924072265625, -0.3052978515625, -0.20135498046875, -0.097412109375, 0.00653076171875, 0.1104736328125, 0.21441650390625, 0.318359375, 0.42230224609375, 0.5262451171875, 0.63018798828125, 0.734130859375, 0.83807373046875, 0.9420166015625, 1.04595947265625, 1.14990234375, 1.25384521484375, 1.3577880859375, 1.46173095703125, 1.565673828125, 1.66961669921875, 1.7735595703125, 1.87750244140625, 1.9814453125, 2.08538818359375, 2.1893310546875, 2.29327392578125, 2.397216796875, 2.50115966796875, 2.6051025390625, 2.70904541015625, 2.81298828125, 2.91693115234375, 3.0208740234375, 3.12481689453125, 3.228759765625, 3.33270263671875, 3.4366455078125, 3.54058837890625, 3.64453125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 7.0, 5.0, 10.0, 11.0, 4.0, 10.0, 14.0, 13.0, 8.0, 24.0, 27.0, 14.0, 24.0, 28.0, 31.0, 31.0, 43.0, 33.0, 50.0, 37.0, 43.0, 32.0, 36.0, 34.0, 48.0, 42.0, 36.0, 34.0, 36.0, 31.0, 27.0, 34.0, 22.0, 22.0, 12.0, 9.0, 16.0, 20.0, 6.0, 5.0, 8.0, 8.0, 8.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.288818359375, -0.28014373779296875, -0.2714691162109375, -0.26279449462890625, -0.254119873046875, -0.24544525146484375, -0.2367706298828125, -0.22809600830078125, -0.21942138671875, -0.21074676513671875, -0.2020721435546875, -0.19339752197265625, -0.184722900390625, -0.17604827880859375, -0.1673736572265625, -0.15869903564453125, -0.1500244140625, -0.14134979248046875, -0.1326751708984375, -0.12400054931640625, -0.115325927734375, -0.10665130615234375, -0.0979766845703125, -0.08930206298828125, -0.08062744140625, -0.07195281982421875, -0.0632781982421875, -0.05460357666015625, -0.045928955078125, -0.03725433349609375, -0.0285797119140625, -0.01990509033203125, -0.01123046875, -0.00255584716796875, 0.0061187744140625, 0.01479339599609375, 0.023468017578125, 0.03214263916015625, 0.0408172607421875, 0.04949188232421875, 0.05816650390625, 0.06684112548828125, 0.0755157470703125, 0.08419036865234375, 0.092864990234375, 0.10153961181640625, 0.1102142333984375, 0.11888885498046875, 0.1275634765625, 0.13623809814453125, 0.1449127197265625, 0.15358734130859375, 0.162261962890625, 0.17093658447265625, 0.1796112060546875, 0.18828582763671875, 0.19696044921875, 0.20563507080078125, 0.2143096923828125, 0.22298431396484375, 0.231658935546875, 0.24033355712890625, 0.2490081787109375, 0.25768280029296875, 0.266357421875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 6.0, 6.0, 7.0, 14.0, 14.0, 16.0, 17.0, 20.0, 37.0, 65.0, 72.0, 88.0, 158.0, 206.0, 288.0, 428.0, 768.0, 4398.0, 193242.0, 825183.0, 20377.0, 1387.0, 550.0, 317.0, 238.0, 162.0, 127.0, 81.0, 58.0, 46.0, 41.0, 23.0, 23.0, 18.0, 18.0, 2.0, 6.0, 9.0, 8.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3984375, -4.24798583984375, -4.0975341796875, -3.94708251953125, -3.796630859375, -3.64617919921875, -3.4957275390625, -3.34527587890625, -3.19482421875, -3.04437255859375, -2.8939208984375, -2.74346923828125, -2.593017578125, -2.44256591796875, -2.2921142578125, -2.14166259765625, -1.9912109375, -1.84075927734375, -1.6903076171875, -1.53985595703125, -1.389404296875, -1.23895263671875, -1.0885009765625, -0.93804931640625, -0.78759765625, -0.63714599609375, -0.4866943359375, -0.33624267578125, -0.185791015625, -0.03533935546875, 0.1151123046875, 0.26556396484375, 0.416015625, 0.56646728515625, 0.7169189453125, 0.86737060546875, 1.017822265625, 1.16827392578125, 1.3187255859375, 1.46917724609375, 1.61962890625, 1.77008056640625, 1.9205322265625, 2.07098388671875, 2.221435546875, 2.37188720703125, 2.5223388671875, 2.67279052734375, 2.8232421875, 2.97369384765625, 3.1241455078125, 3.27459716796875, 3.425048828125, 3.57550048828125, 3.7259521484375, 3.87640380859375, 4.02685546875, 4.17730712890625, 4.3277587890625, 4.47821044921875, 4.628662109375, 4.77911376953125, 4.9295654296875, 5.08001708984375, 5.23046875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 18.0, 96.0, 483.0, 323.0, 68.0, 17.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.607211112976074, -15.243490219116211, -14.879769325256348, -14.516048431396484, -14.152327537536621, -13.788606643676758, -13.424886703491211, -13.061164855957031, -12.697444915771484, -12.333724021911621, -11.970003128051758, -11.606282234191895, -11.242561340332031, -10.878840446472168, -10.515119552612305, -10.151399612426758, -9.787677764892578, -9.423956871032715, -9.060235977172852, -8.696515083312988, -8.332794189453125, -7.969073295593262, -7.605352878570557, -7.241631984710693, -6.87791109085083, -6.514190196990967, -6.1504693031311035, -5.786748886108398, -5.423027992248535, -5.059307098388672, -4.695586204528809, -4.331865310668945, -3.968144416809082, -3.6044235229492188, -3.2407026290893555, -2.8769819736480713, -2.513261079788208, -2.1495401859283447, -1.7858195304870605, -1.4220986366271973, -1.058377742767334, -0.6946569085121155, -0.330936074256897, 0.03278470039367676, 0.39650559425354004, 0.7602264881134033, 1.1239471435546875, 1.4876680374145508, 1.851388931274414, 2.2151098251342773, 2.5788307189941406, 2.942551374435425, 3.306272268295288, 3.6699931621551514, 4.0337138175964355, 4.397434711456299, 4.761155605316162, 5.124876499176025, 5.488597393035889, 5.852317810058594, 6.216038703918457, 6.57975959777832, 6.943480491638184, 7.307201385498047, 7.67092227935791]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 7.0, 9.0, 10.0, 8.0, 14.0, 15.0, 24.0, 31.0, 26.0, 40.0, 42.0, 48.0, 45.0, 44.0, 54.0, 52.0, 45.0, 64.0, 58.0, 40.0, 40.0, 48.0, 35.0, 48.0, 25.0, 24.0, 21.0, 23.0, 11.0, 11.0, 5.0, 11.0, 6.0, 4.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.852900743484497, -2.7609975337982178, -2.6690945625305176, -2.5771913528442383, -2.485288143157959, -2.3933849334716797, -2.3014819622039795, -2.2095787525177, -2.11767578125, -2.0257725715637207, -1.933869481086731, -1.8419663906097412, -1.750063180923462, -1.6581600904464722, -1.5662569999694824, -1.4743537902832031, -1.3824505805969238, -1.290547490119934, -1.1986442804336548, -1.106741189956665, -1.0148379802703857, -0.922934889793396, -0.8310317993164062, -0.7391286492347717, -0.6472254991531372, -0.5553223490715027, -0.46341922879219055, -0.3715161085128784, -0.2796129584312439, -0.18770980834960938, -0.09580671787261963, -0.0039035677909851074, 0.08799934387207031, 0.17990247905254364, 0.27180561423301697, 0.3637087345123291, 0.4556118845939636, 0.5475150346755981, 0.6394181251525879, 0.7313212752342224, 0.8232244253158569, 0.9151275753974915, 1.007030725479126, 1.0989338159561157, 1.1908369064331055, 1.2827401161193848, 1.3746432065963745, 1.4665462970733643, 1.5584495067596436, 1.6503525972366333, 1.7422558069229126, 1.8341588973999023, 1.9260621070861816, 2.017965316772461, 2.109868288040161, 2.2017714977264404, 2.2936744689941406, 2.38557767868042, 2.47748064994812, 2.5693838596343994, 2.6612870693206787, 2.753190040588379, 2.845093250274658, 2.9369964599609375, 3.028899669647217]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 1.0, 9.0, 8.0, 5.0, 7.0, 8.0, 13.0, 19.0, 15.0, 25.0, 25.0, 24.0, 24.0, 24.0, 31.0, 36.0, 27.0, 31.0, 30.0, 36.0, 41.0, 17.0, 35.0, 42.0, 37.0, 23.0, 37.0, 34.0, 28.0, 38.0, 24.0, 25.0, 30.0, 32.0, 19.0, 17.0, 16.0, 10.0, 20.0, 15.0, 8.0, 13.0, 13.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.083984375, -2.981292724609375, -2.87860107421875, -2.775909423828125, -2.6732177734375, -2.570526123046875, -2.46783447265625, -2.365142822265625, -2.262451171875, -2.159759521484375, -2.05706787109375, -1.954376220703125, -1.8516845703125, -1.748992919921875, -1.64630126953125, -1.543609619140625, -1.44091796875, -1.338226318359375, -1.23553466796875, -1.132843017578125, -1.0301513671875, -0.927459716796875, -0.82476806640625, -0.722076416015625, -0.619384765625, -0.516693115234375, -0.41400146484375, -0.311309814453125, -0.2086181640625, -0.105926513671875, -0.00323486328125, 0.099456787109375, 0.2021484375, 0.304840087890625, 0.40753173828125, 0.510223388671875, 0.6129150390625, 0.715606689453125, 0.81829833984375, 0.920989990234375, 1.023681640625, 1.126373291015625, 1.22906494140625, 1.331756591796875, 1.4344482421875, 1.537139892578125, 1.63983154296875, 1.742523193359375, 1.84521484375, 1.947906494140625, 2.05059814453125, 2.153289794921875, 2.2559814453125, 2.358673095703125, 2.46136474609375, 2.564056396484375, 2.666748046875, 2.769439697265625, 2.87213134765625, 2.974822998046875, 3.0775146484375, 3.180206298828125, 3.28289794921875, 3.385589599609375, 3.48828125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 8.0, 10.0, 12.0, 13.0, 9.0, 10.0, 17.0, 27.0, 31.0, 39.0, 82.0, 148.0, 302.0, 704.0, 1537.0, 3569.0, 9358.0, 27882.0, 111263.0, 591633.0, 232955.0, 45698.0, 13856.0, 5219.0, 2233.0, 976.0, 389.0, 227.0, 106.0, 61.0, 30.0, 22.0, 15.0, 23.0, 14.0, 10.0, 11.0, 17.0, 8.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-9.5078125, -9.217041015625, -8.92626953125, -8.635498046875, -8.3447265625, -8.053955078125, -7.76318359375, -7.472412109375, -7.181640625, -6.890869140625, -6.60009765625, -6.309326171875, -6.0185546875, -5.727783203125, -5.43701171875, -5.146240234375, -4.85546875, -4.564697265625, -4.27392578125, -3.983154296875, -3.6923828125, -3.401611328125, -3.11083984375, -2.820068359375, -2.529296875, -2.238525390625, -1.94775390625, -1.656982421875, -1.3662109375, -1.075439453125, -0.78466796875, -0.493896484375, -0.203125, 0.087646484375, 0.37841796875, 0.669189453125, 0.9599609375, 1.250732421875, 1.54150390625, 1.832275390625, 2.123046875, 2.413818359375, 2.70458984375, 2.995361328125, 3.2861328125, 3.576904296875, 3.86767578125, 4.158447265625, 4.44921875, 4.739990234375, 5.03076171875, 5.321533203125, 5.6123046875, 5.903076171875, 6.19384765625, 6.484619140625, 6.775390625, 7.066162109375, 7.35693359375, 7.647705078125, 7.9384765625, 8.229248046875, 8.52001953125, 8.810791015625, 9.1015625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 5.0, 3.0, 4.0, 4.0, 5.0, 9.0, 10.0, 11.0, 15.0, 22.0, 25.0, 41.0, 22.0, 31.0, 43.0, 50.0, 46.0, 50.0, 60.0, 98.0, 181.0, 1405.0, 292.0, 139.0, 67.0, 67.0, 50.0, 45.0, 33.0, 29.0, 39.0, 25.0, 26.0, 21.0, 16.0, 17.0, 13.0, 2.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.9375, -13.484130859375, -13.03076171875, -12.577392578125, -12.1240234375, -11.670654296875, -11.21728515625, -10.763916015625, -10.310546875, -9.857177734375, -9.40380859375, -8.950439453125, -8.4970703125, -8.043701171875, -7.59033203125, -7.136962890625, -6.68359375, -6.230224609375, -5.77685546875, -5.323486328125, -4.8701171875, -4.416748046875, -3.96337890625, -3.510009765625, -3.056640625, -2.603271484375, -2.14990234375, -1.696533203125, -1.2431640625, -0.789794921875, -0.33642578125, 0.116943359375, 0.5703125, 1.023681640625, 1.47705078125, 1.930419921875, 2.3837890625, 2.837158203125, 3.29052734375, 3.743896484375, 4.197265625, 4.650634765625, 5.10400390625, 5.557373046875, 6.0107421875, 6.464111328125, 6.91748046875, 7.370849609375, 7.82421875, 8.277587890625, 8.73095703125, 9.184326171875, 9.6376953125, 10.091064453125, 10.54443359375, 10.997802734375, 11.451171875, 11.904541015625, 12.35791015625, 12.811279296875, 13.2646484375, 13.718017578125, 14.17138671875, 14.624755859375, 15.078125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 10.0, 5.0, 15.0, 16.0, 26.0, 36.0, 53.0, 61.0, 80.0, 120.0, 185.0, 269.0, 554.0, 1646.0, 15685.0, 1457638.0, 1649605.0, 16439.0, 1778.0, 548.0, 291.0, 188.0, 122.0, 108.0, 62.0, 44.0, 33.0, 14.0, 19.0, 13.0, 8.0, 8.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.875, -24.9169921875, -23.958984375, -23.0009765625, -22.04296875, -21.0849609375, -20.126953125, -19.1689453125, -18.2109375, -17.2529296875, -16.294921875, -15.3369140625, -14.37890625, -13.4208984375, -12.462890625, -11.5048828125, -10.546875, -9.5888671875, -8.630859375, -7.6728515625, -6.71484375, -5.7568359375, -4.798828125, -3.8408203125, -2.8828125, -1.9248046875, -0.966796875, -0.0087890625, 0.94921875, 1.9072265625, 2.865234375, 3.8232421875, 4.78125, 5.7392578125, 6.697265625, 7.6552734375, 8.61328125, 9.5712890625, 10.529296875, 11.4873046875, 12.4453125, 13.4033203125, 14.361328125, 15.3193359375, 16.27734375, 17.2353515625, 18.193359375, 19.1513671875, 20.109375, 21.0673828125, 22.025390625, 22.9833984375, 23.94140625, 24.8994140625, 25.857421875, 26.8154296875, 27.7734375, 28.7314453125, 29.689453125, 30.6474609375, 31.60546875, 32.5634765625, 33.521484375, 34.4794921875, 35.4375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 35.0, 912.0, 71.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-543.472900390625, -533.5097045898438, -523.5465087890625, -513.583251953125, -503.62005615234375, -493.6568603515625, -483.6936340332031, -473.73040771484375, -463.7672119140625, -453.80401611328125, -443.8407897949219, -433.8775634765625, -423.91436767578125, -413.951171875, -403.9879455566406, -394.02471923828125, -384.0615234375, -374.09832763671875, -364.1351013183594, -354.171875, -344.20867919921875, -334.2454833984375, -324.2822570800781, -314.31903076171875, -304.3558349609375, -294.39263916015625, -284.4294128417969, -274.4661865234375, -264.50299072265625, -254.53977966308594, -244.57656860351562, -234.6133575439453, -224.650146484375, -214.6869354248047, -204.72372436523438, -194.76051330566406, -184.79730224609375, -174.83409118652344, -164.87088012695312, -154.9076690673828, -144.9444580078125, -134.9812469482422, -125.01803588867188, -115.05482482910156, -105.09161376953125, -95.12840270996094, -85.16519165039062, -75.20198059082031, -65.23877716064453, -55.27556610107422, -45.312355041503906, -35.349143981933594, -25.38593292236328, -15.422721862792969, -5.459510803222656, 4.503700256347656, 14.466911315917969, 24.43012237548828, 34.393333435058594, 44.356544494628906, 54.31975555419922, 64.28296661376953, 74.24617767333984, 84.20938873291016, 94.17259979248047]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 5.0, 8.0, 13.0, 15.0, 16.0, 13.0, 26.0, 23.0, 26.0, 33.0, 29.0, 42.0, 37.0, 49.0, 46.0, 38.0, 51.0, 34.0, 43.0, 42.0, 41.0, 45.0, 36.0, 47.0, 34.0, 36.0, 24.0, 28.0, 29.0, 14.0, 14.0, 13.0, 13.0, 8.0, 7.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.55447006225586, -36.270118713378906, -34.98576736450195, -33.701416015625, -32.41706848144531, -31.132715225219727, -29.848365783691406, -28.564014434814453, -27.2796630859375, -25.995311737060547, -24.710960388183594, -23.426610946655273, -22.14225959777832, -20.857908248901367, -19.573558807373047, -18.289207458496094, -17.00485610961914, -15.720504760742188, -14.43615436553955, -13.151803970336914, -11.867452621459961, -10.583101272583008, -9.298750877380371, -8.014400482177734, -6.730049133300781, -5.445698261260986, -4.161347389221191, -2.8769965171813965, -1.5926456451416016, -0.30829477310180664, 0.9760560989379883, 2.260406494140625, 3.544757843017578, 4.829108715057373, 6.113459587097168, 7.397810459136963, 8.682161331176758, 9.966512680053711, 11.250863075256348, 12.535213470458984, 13.819564819335938, 15.10391616821289, 16.388267517089844, 17.672616958618164, 18.956968307495117, 20.24131965637207, 21.52566909790039, 22.810020446777344, 24.094371795654297, 25.37872314453125, 26.663074493408203, 27.947423934936523, 29.231775283813477, 30.51612663269043, 31.80047607421875, 33.0848274230957, 34.369178771972656, 35.65353012084961, 36.93788146972656, 38.222232818603516, 39.50658416748047, 40.790931701660156, 42.07528305053711, 43.35963439941406, 44.643985748291016]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 7.0, 4.0, 12.0, 4.0, 12.0, 12.0, 14.0, 16.0, 20.0, 21.0, 21.0, 29.0, 20.0, 25.0, 30.0, 34.0, 35.0, 31.0, 29.0, 44.0, 33.0, 36.0, 35.0, 29.0, 37.0, 27.0, 37.0, 29.0, 36.0, 35.0, 26.0, 24.0, 25.0, 16.0, 19.0, 15.0, 14.0, 19.0, 14.0, 10.0, 12.0, 8.0, 5.0, 9.0, 4.0, 9.0, 4.0, 6.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08984375, -2.981597900390625, -2.87335205078125, -2.765106201171875, -2.6568603515625, -2.548614501953125, -2.44036865234375, -2.332122802734375, -2.223876953125, -2.115631103515625, -2.00738525390625, -1.899139404296875, -1.7908935546875, -1.682647705078125, -1.57440185546875, -1.466156005859375, -1.35791015625, -1.249664306640625, -1.14141845703125, -1.033172607421875, -0.9249267578125, -0.816680908203125, -0.70843505859375, -0.600189208984375, -0.491943359375, -0.383697509765625, -0.27545166015625, -0.167205810546875, -0.0589599609375, 0.049285888671875, 0.15753173828125, 0.265777587890625, 0.3740234375, 0.482269287109375, 0.59051513671875, 0.698760986328125, 0.8070068359375, 0.915252685546875, 1.02349853515625, 1.131744384765625, 1.239990234375, 1.348236083984375, 1.45648193359375, 1.564727783203125, 1.6729736328125, 1.781219482421875, 1.88946533203125, 1.997711181640625, 2.10595703125, 2.214202880859375, 2.32244873046875, 2.430694580078125, 2.5389404296875, 2.647186279296875, 2.75543212890625, 2.863677978515625, 2.971923828125, 3.080169677734375, 3.18841552734375, 3.296661376953125, 3.4049072265625, 3.513153076171875, 3.62139892578125, 3.729644775390625, 3.837890625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 2.0, 5.0, 7.0, 10.0, 7.0, 7.0, 12.0, 14.0, 15.0, 14.0, 23.0, 35.0, 30.0, 44.0, 44.0, 64.0, 99.0, 164.0, 403.0, 1263.0, 5186.0, 28124.0, 226378.0, 2276618.0, 1505516.0, 126861.0, 17987.0, 3627.0, 924.0, 296.0, 128.0, 72.0, 52.0, 47.0, 42.0, 31.0, 21.0, 17.0, 11.0, 10.0, 20.0, 15.0, 10.0, 6.0, 5.0, 5.0, 8.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0, -9.6279296875, -9.255859375, -8.8837890625, -8.51171875, -8.1396484375, -7.767578125, -7.3955078125, -7.0234375, -6.6513671875, -6.279296875, -5.9072265625, -5.53515625, -5.1630859375, -4.791015625, -4.4189453125, -4.046875, -3.6748046875, -3.302734375, -2.9306640625, -2.55859375, -2.1865234375, -1.814453125, -1.4423828125, -1.0703125, -0.6982421875, -0.326171875, 0.0458984375, 0.41796875, 0.7900390625, 1.162109375, 1.5341796875, 1.90625, 2.2783203125, 2.650390625, 3.0224609375, 3.39453125, 3.7666015625, 4.138671875, 4.5107421875, 4.8828125, 5.2548828125, 5.626953125, 5.9990234375, 6.37109375, 6.7431640625, 7.115234375, 7.4873046875, 7.859375, 8.2314453125, 8.603515625, 8.9755859375, 9.34765625, 9.7197265625, 10.091796875, 10.4638671875, 10.8359375, 11.2080078125, 11.580078125, 11.9521484375, 12.32421875, 12.6962890625, 13.068359375, 13.4404296875, 13.8125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 9.0, 16.0, 22.0, 46.0, 50.0, 73.0, 101.0, 178.0, 250.0, 356.0, 574.0, 622.0, 569.0, 419.0, 299.0, 173.0, 120.0, 71.0, 42.0, 33.0, 15.0, 13.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-16.9375, -16.5396728515625, -16.141845703125, -15.7440185546875, -15.34619140625, -14.9483642578125, -14.550537109375, -14.1527099609375, -13.7548828125, -13.3570556640625, -12.959228515625, -12.5614013671875, -12.16357421875, -11.7657470703125, -11.367919921875, -10.9700927734375, -10.572265625, -10.1744384765625, -9.776611328125, -9.3787841796875, -8.98095703125, -8.5831298828125, -8.185302734375, -7.7874755859375, -7.3896484375, -6.9918212890625, -6.593994140625, -6.1961669921875, -5.79833984375, -5.4005126953125, -5.002685546875, -4.6048583984375, -4.20703125, -3.8092041015625, -3.411376953125, -3.0135498046875, -2.61572265625, -2.2178955078125, -1.820068359375, -1.4222412109375, -1.0244140625, -0.6265869140625, -0.228759765625, 0.1690673828125, 0.56689453125, 0.9647216796875, 1.362548828125, 1.7603759765625, 2.158203125, 2.5560302734375, 2.953857421875, 3.3516845703125, 3.74951171875, 4.1473388671875, 4.545166015625, 4.9429931640625, 5.3408203125, 5.7386474609375, 6.136474609375, 6.5343017578125, 6.93212890625, 7.3299560546875, 7.727783203125, 8.1256103515625, 8.5234375]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 6.0, 15.0, 25.0, 47.0, 60.0, 101.0, 175.0, 394.0, 914.0, 6000.0, 167332.0, 3691484.0, 316639.0, 9074.0, 1130.0, 365.0, 199.0, 118.0, 68.0, 37.0, 37.0, 33.0, 13.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.515625, -20.469970703125, -19.42431640625, -18.378662109375, -17.3330078125, -16.287353515625, -15.24169921875, -14.196044921875, -13.150390625, -12.104736328125, -11.05908203125, -10.013427734375, -8.9677734375, -7.922119140625, -6.87646484375, -5.830810546875, -4.78515625, -3.739501953125, -2.69384765625, -1.648193359375, -0.6025390625, 0.443115234375, 1.48876953125, 2.534423828125, 3.580078125, 4.625732421875, 5.67138671875, 6.717041015625, 7.7626953125, 8.808349609375, 9.85400390625, 10.899658203125, 11.9453125, 12.990966796875, 14.03662109375, 15.082275390625, 16.1279296875, 17.173583984375, 18.21923828125, 19.264892578125, 20.310546875, 21.356201171875, 22.40185546875, 23.447509765625, 24.4931640625, 25.538818359375, 26.58447265625, 27.630126953125, 28.67578125, 29.721435546875, 30.76708984375, 31.812744140625, 32.8583984375, 33.904052734375, 34.94970703125, 35.995361328125, 37.041015625, 38.086669921875, 39.13232421875, 40.177978515625, 41.2236328125, 42.269287109375, 43.31494140625, 44.360595703125, 45.40625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 13.0, 23.0, 65.0, 159.0, 215.0, 207.0, 153.0, 102.0, 53.0, 17.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.35076904296875, -82.95674896240234, -79.5627212524414, -76.168701171875, -72.77467346191406, -69.38065338134766, -65.98662567138672, -62.59260559082031, -59.198577880859375, -55.8045539855957, -52.41053009033203, -49.01650619506836, -45.62248229980469, -42.22846221923828, -38.834434509277344, -35.44041442871094, -32.046390533447266, -28.652366638183594, -25.258342742919922, -21.86431884765625, -18.470294952392578, -15.076272964477539, -11.682249069213867, -8.288225173950195, -4.894201278686523, -1.5001776218414307, 1.893846035003662, 5.287869453430176, 8.681893348693848, 12.075916290283203, 15.469940185546875, 18.863964080810547, 22.25798797607422, 25.65201187133789, 29.046035766601562, 32.440059661865234, 35.834083557128906, 39.22810363769531, 42.62213134765625, 46.016151428222656, 49.410179138183594, 52.804203033447266, 56.19822692871094, 59.59225082397461, 62.98627471923828, 66.38029479980469, 69.77432250976562, 73.16834259033203, 76.56236267089844, 79.95638275146484, 83.35041046142578, 86.74443054199219, 90.13845825195312, 93.53247833251953, 96.92650604248047, 100.32052612304688, 103.71455383300781, 107.10857391357422, 110.50260162353516, 113.89662170410156, 117.2906494140625, 120.6846694946289, 124.07869720458984, 127.47271728515625, 130.8667449951172]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 0.0, 2.0, 6.0, 9.0, 14.0, 12.0, 10.0, 16.0, 13.0, 20.0, 25.0, 25.0, 23.0, 26.0, 27.0, 29.0, 41.0, 58.0, 45.0, 47.0, 46.0, 37.0, 43.0, 32.0, 32.0, 28.0, 35.0, 25.0, 35.0, 31.0, 22.0, 26.0, 31.0, 17.0, 20.0, 19.0, 21.0, 9.0, 10.0, 8.0, 9.0, 7.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-27.449129104614258, -26.456722259521484, -25.464313507080078, -24.471906661987305, -23.47949981689453, -22.487092971801758, -21.494686126708984, -20.502277374267578, -19.509870529174805, -18.51746368408203, -17.525054931640625, -16.53264808654785, -15.540241241455078, -14.547834396362305, -13.555426597595215, -12.563018798828125, -11.570611953735352, -10.578205108642578, -9.585797309875488, -8.593389511108398, -7.600982666015625, -6.608575344085693, -5.616168022155762, -4.62376070022583, -3.6313533782958984, -2.638946056365967, -1.6465387344360352, -0.6541314125061035, 0.3382759094238281, 1.3306832313537598, 2.3230905532836914, 3.315497875213623, 4.307903289794922, 5.3003106117248535, 6.292717933654785, 7.285125255584717, 8.277532577514648, 9.269939422607422, 10.262347221374512, 11.254755020141602, 12.247161865234375, 13.239568710327148, 14.231976509094238, 15.224384307861328, 16.2167911529541, 17.209197998046875, 18.20160675048828, 19.194013595581055, 20.186420440673828, 21.1788272857666, 22.171234130859375, 23.16364288330078, 24.156049728393555, 25.148456573486328, 26.140865325927734, 27.133272171020508, 28.12567901611328, 29.118085861206055, 30.110492706298828, 31.102901458740234, 32.095306396484375, 33.08771514892578, 34.08012390136719, 35.07252883911133, 36.064937591552734]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 8.0, 5.0, 7.0, 5.0, 13.0, 15.0, 10.0, 11.0, 16.0, 22.0, 24.0, 21.0, 25.0, 18.0, 22.0, 38.0, 37.0, 27.0, 29.0, 41.0, 43.0, 48.0, 40.0, 38.0, 36.0, 44.0, 34.0, 29.0, 35.0, 25.0, 24.0, 27.0, 23.0, 21.0, 27.0, 14.0, 16.0, 14.0, 13.0, 6.0, 12.0, 9.0, 4.0, 8.0, 4.0, 5.0, 7.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.314453125, -3.198028564453125, -3.08160400390625, -2.965179443359375, -2.8487548828125, -2.732330322265625, -2.61590576171875, -2.499481201171875, -2.383056640625, -2.266632080078125, -2.15020751953125, -2.033782958984375, -1.9173583984375, -1.800933837890625, -1.68450927734375, -1.568084716796875, -1.45166015625, -1.335235595703125, -1.21881103515625, -1.102386474609375, -0.9859619140625, -0.869537353515625, -0.75311279296875, -0.636688232421875, -0.520263671875, -0.403839111328125, -0.28741455078125, -0.170989990234375, -0.0545654296875, 0.061859130859375, 0.17828369140625, 0.294708251953125, 0.4111328125, 0.527557373046875, 0.64398193359375, 0.760406494140625, 0.8768310546875, 0.993255615234375, 1.10968017578125, 1.226104736328125, 1.342529296875, 1.458953857421875, 1.57537841796875, 1.691802978515625, 1.8082275390625, 1.924652099609375, 2.04107666015625, 2.157501220703125, 2.27392578125, 2.390350341796875, 2.50677490234375, 2.623199462890625, 2.7396240234375, 2.856048583984375, 2.97247314453125, 3.088897705078125, 3.205322265625, 3.321746826171875, 3.43817138671875, 3.554595947265625, 3.6710205078125, 3.787445068359375, 3.90386962890625, 4.020294189453125, 4.13671875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 8.0, 12.0, 9.0, 13.0, 22.0, 36.0, 55.0, 93.0, 164.0, 295.0, 464.0, 830.0, 1467.0, 2564.0, 4369.0, 7256.0, 12095.0, 19414.0, 30281.0, 44986.0, 63048.0, 83171.0, 101660.0, 115194.0, 119212.0, 110949.0, 94764.0, 75051.0, 56093.0, 38948.0, 25571.0, 15893.0, 10034.0, 6065.0, 3585.0, 1957.0, 1184.0, 749.0, 395.0, 224.0, 146.0, 85.0, 48.0, 35.0, 34.0, 13.0, 10.0, 7.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.017578125, -1.94873046875, -1.8798828125, -1.81103515625, -1.7421875, -1.67333984375, -1.6044921875, -1.53564453125, -1.466796875, -1.39794921875, -1.3291015625, -1.26025390625, -1.19140625, -1.12255859375, -1.0537109375, -0.98486328125, -0.916015625, -0.84716796875, -0.7783203125, -0.70947265625, -0.640625, -0.57177734375, -0.5029296875, -0.43408203125, -0.365234375, -0.29638671875, -0.2275390625, -0.15869140625, -0.08984375, -0.02099609375, 0.0478515625, 0.11669921875, 0.185546875, 0.25439453125, 0.3232421875, 0.39208984375, 0.4609375, 0.52978515625, 0.5986328125, 0.66748046875, 0.736328125, 0.80517578125, 0.8740234375, 0.94287109375, 1.01171875, 1.08056640625, 1.1494140625, 1.21826171875, 1.287109375, 1.35595703125, 1.4248046875, 1.49365234375, 1.5625, 1.63134765625, 1.7001953125, 1.76904296875, 1.837890625, 1.90673828125, 1.9755859375, 2.04443359375, 2.11328125, 2.18212890625, 2.2509765625, 2.31982421875, 2.388671875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 7.0, 7.0, 10.0, 7.0, 10.0, 18.0, 21.0, 28.0, 25.0, 28.0, 44.0, 53.0, 36.0, 38.0, 44.0, 50.0, 37.0, 1069.0, 38.0, 47.0, 47.0, 35.0, 45.0, 38.0, 47.0, 25.0, 30.0, 26.0, 19.0, 19.0, 15.0, 9.0, 7.0, 13.0, 15.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.65338134765625, -4.4981689453125, -4.34295654296875, -4.187744140625, -4.03253173828125, -3.8773193359375, -3.72210693359375, -3.56689453125, -3.41168212890625, -3.2564697265625, -3.10125732421875, -2.946044921875, -2.79083251953125, -2.6356201171875, -2.48040771484375, -2.3251953125, -2.16998291015625, -2.0147705078125, -1.85955810546875, -1.704345703125, -1.54913330078125, -1.3939208984375, -1.23870849609375, -1.08349609375, -0.92828369140625, -0.7730712890625, -0.61785888671875, -0.462646484375, -0.30743408203125, -0.1522216796875, 0.00299072265625, 0.158203125, 0.31341552734375, 0.4686279296875, 0.62384033203125, 0.779052734375, 0.93426513671875, 1.0894775390625, 1.24468994140625, 1.39990234375, 1.55511474609375, 1.7103271484375, 1.86553955078125, 2.020751953125, 2.17596435546875, 2.3311767578125, 2.48638916015625, 2.6416015625, 2.79681396484375, 2.9520263671875, 3.10723876953125, 3.262451171875, 3.41766357421875, 3.5728759765625, 3.72808837890625, 3.88330078125, 4.03851318359375, 4.1937255859375, 4.34893798828125, 4.504150390625, 4.65936279296875, 4.8145751953125, 4.96978759765625, 5.125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 5.0, 8.0, 9.0, 11.0, 17.0, 22.0, 47.0, 60.0, 78.0, 132.0, 157.0, 249.0, 364.0, 567.0, 946.0, 1342.0, 2063.0, 3022.0, 4881.0, 7523.0, 11263.0, 17691.0, 31601.0, 137957.0, 1676450.0, 121033.0, 30611.0, 17119.0, 11029.0, 7098.0, 4753.0, 3069.0, 2012.0, 1327.0, 911.0, 578.0, 381.0, 258.0, 163.0, 108.0, 76.0, 36.0, 42.0, 23.0, 14.0, 8.0, 9.0, 5.0, 9.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69921875, -3.5645751953125, -3.429931640625, -3.2952880859375, -3.16064453125, -3.0260009765625, -2.891357421875, -2.7567138671875, -2.6220703125, -2.4874267578125, -2.352783203125, -2.2181396484375, -2.08349609375, -1.9488525390625, -1.814208984375, -1.6795654296875, -1.544921875, -1.4102783203125, -1.275634765625, -1.1409912109375, -1.00634765625, -0.8717041015625, -0.737060546875, -0.6024169921875, -0.4677734375, -0.3331298828125, -0.198486328125, -0.0638427734375, 0.07080078125, 0.2054443359375, 0.340087890625, 0.4747314453125, 0.609375, 0.7440185546875, 0.878662109375, 1.0133056640625, 1.14794921875, 1.2825927734375, 1.417236328125, 1.5518798828125, 1.6865234375, 1.8211669921875, 1.955810546875, 2.0904541015625, 2.22509765625, 2.3597412109375, 2.494384765625, 2.6290283203125, 2.763671875, 2.8983154296875, 3.032958984375, 3.1676025390625, 3.30224609375, 3.4368896484375, 3.571533203125, 3.7061767578125, 3.8408203125, 3.9754638671875, 4.110107421875, 4.2447509765625, 4.37939453125, 4.5140380859375, 4.648681640625, 4.7833251953125, 4.91796875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 4.0, 10.0, 9.0, 15.0, 14.0, 24.0, 28.0, 33.0, 45.0, 51.0, 66.0, 51.0, 58.0, 72.0, 66.0, 55.0, 61.0, 50.0, 56.0, 39.0, 43.0, 40.0, 26.0, 14.0, 13.0, 19.0, 4.0, 5.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.368896484375, -0.357696533203125, -0.34649658203125, -0.335296630859375, -0.3240966796875, -0.312896728515625, -0.30169677734375, -0.290496826171875, -0.279296875, -0.268096923828125, -0.25689697265625, -0.245697021484375, -0.2344970703125, -0.223297119140625, -0.21209716796875, -0.200897216796875, -0.189697265625, -0.178497314453125, -0.16729736328125, -0.156097412109375, -0.1448974609375, -0.133697509765625, -0.12249755859375, -0.111297607421875, -0.10009765625, -0.088897705078125, -0.07769775390625, -0.066497802734375, -0.0552978515625, -0.044097900390625, -0.03289794921875, -0.021697998046875, -0.010498046875, 0.000701904296875, 0.01190185546875, 0.023101806640625, 0.0343017578125, 0.045501708984375, 0.05670166015625, 0.067901611328125, 0.0791015625, 0.090301513671875, 0.10150146484375, 0.112701416015625, 0.1239013671875, 0.135101318359375, 0.14630126953125, 0.157501220703125, 0.168701171875, 0.179901123046875, 0.19110107421875, 0.202301025390625, 0.2135009765625, 0.224700927734375, 0.23590087890625, 0.247100830078125, 0.25830078125, 0.269500732421875, 0.28070068359375, 0.291900634765625, 0.3031005859375, 0.314300537109375, 0.32550048828125, 0.336700439453125, 0.347900390625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 9.0, 12.0, 14.0, 24.0, 33.0, 37.0, 68.0, 83.0, 159.0, 259.0, 501.0, 1426.0, 30351.0, 987502.0, 25472.0, 1355.0, 524.0, 262.0, 155.0, 104.0, 51.0, 44.0, 30.0, 16.0, 10.0, 10.0, 7.0, 7.0, 8.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.94140625, -5.752685546875, -5.56396484375, -5.375244140625, -5.1865234375, -4.997802734375, -4.80908203125, -4.620361328125, -4.431640625, -4.242919921875, -4.05419921875, -3.865478515625, -3.6767578125, -3.488037109375, -3.29931640625, -3.110595703125, -2.921875, -2.733154296875, -2.54443359375, -2.355712890625, -2.1669921875, -1.978271484375, -1.78955078125, -1.600830078125, -1.412109375, -1.223388671875, -1.03466796875, -0.845947265625, -0.6572265625, -0.468505859375, -0.27978515625, -0.091064453125, 0.09765625, 0.286376953125, 0.47509765625, 0.663818359375, 0.8525390625, 1.041259765625, 1.22998046875, 1.418701171875, 1.607421875, 1.796142578125, 1.98486328125, 2.173583984375, 2.3623046875, 2.551025390625, 2.73974609375, 2.928466796875, 3.1171875, 3.305908203125, 3.49462890625, 3.683349609375, 3.8720703125, 4.060791015625, 4.24951171875, 4.438232421875, 4.626953125, 4.815673828125, 5.00439453125, 5.193115234375, 5.3818359375, 5.570556640625, 5.75927734375, 5.947998046875, 6.13671875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 11.0, 89.0, 514.0, 348.0, 38.0, 9.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.612584114074707, -14.271566390991211, -13.930548667907715, -13.589530944824219, -13.248514175415039, -12.907496452331543, -12.566478729248047, -12.22546100616455, -11.884443283081055, -11.543425559997559, -11.202407836914062, -10.861391067504883, -10.520373344421387, -10.17935562133789, -9.838337898254395, -9.497320175170898, -9.156303405761719, -8.815285682678223, -8.474267959594727, -8.133251190185547, -7.792233467102051, -7.451215744018555, -7.110198020935059, -6.7691802978515625, -6.428163051605225, -6.0871453285217285, -5.746128082275391, -5.4051103591918945, -5.064092636108398, -4.7230753898620605, -4.3820576667785645, -4.041040420532227, -3.700021743774414, -3.359004259109497, -3.01798677444458, -2.676969051361084, -2.335951566696167, -1.99493408203125, -1.653916358947754, -1.312898874282837, -0.9718813896179199, -0.6308638453483582, -0.2898463010787964, 0.051171302795410156, 0.39218878746032715, 0.7332062721252441, 1.0742239952087402, 1.4152414798736572, 1.7562589645385742, 2.097276449203491, 2.438293933868408, 2.7793116569519043, 3.1203291416168213, 3.4613466262817383, 3.8023643493652344, 4.1433820724487305, 4.484399318695068, 4.8254170417785645, 5.166434288024902, 5.507452011108398, 5.8484697341918945, 6.189486980438232, 6.5305047035217285, 6.871521949768066, 7.2125396728515625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 8.0, 9.0, 5.0, 12.0, 20.0, 15.0, 36.0, 40.0, 37.0, 47.0, 61.0, 67.0, 59.0, 51.0, 64.0, 63.0, 56.0, 50.0, 52.0, 46.0, 42.0, 45.0, 23.0, 22.0, 17.0, 16.0, 11.0, 4.0, 9.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6023480892181396, -2.515796422958374, -2.4292449951171875, -2.342693328857422, -2.2561416625976562, -2.1695899963378906, -2.083038330078125, -1.9964869022369385, -1.9099352359771729, -1.8233835697174072, -1.7368320226669312, -1.650280475616455, -1.5637288093566895, -1.4771771430969238, -1.3906255960464478, -1.3040740489959717, -1.217522382736206, -1.1309707164764404, -1.0444191694259644, -0.9578675627708435, -0.8713159561157227, -0.7847643494606018, -0.698212742805481, -0.6116611361503601, -0.5251095294952393, -0.4385579228401184, -0.35200631618499756, -0.2654547095298767, -0.17890310287475586, -0.09235149621963501, -0.00579988956451416, 0.08075171709060669, 0.16730332374572754, 0.2538549304008484, 0.34040653705596924, 0.4269581437110901, 0.5135097503662109, 0.6000613570213318, 0.6866129636764526, 0.7731645703315735, 0.8597161769866943, 0.9462677836418152, 1.032819390296936, 1.119370937347412, 1.2059226036071777, 1.2924742698669434, 1.3790258169174194, 1.4655773639678955, 1.5521290302276611, 1.6386806964874268, 1.7252322435379028, 1.811783790588379, 1.8983354568481445, 1.9848871231079102, 2.071438789367676, 2.1579902172088623, 2.244541883468628, 2.3310935497283936, 2.41764497756958, 2.5041966438293457, 2.5907483100891113, 2.677299976348877, 2.7638516426086426, 2.850403070449829, 2.9369547367095947]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 11.0, 5.0, 6.0, 12.0, 6.0, 11.0, 16.0, 9.0, 16.0, 18.0, 17.0, 19.0, 31.0, 23.0, 34.0, 30.0, 32.0, 39.0, 37.0, 25.0, 25.0, 32.0, 37.0, 40.0, 40.0, 43.0, 31.0, 28.0, 32.0, 26.0, 23.0, 21.0, 24.0, 26.0, 17.0, 22.0, 20.0, 16.0, 17.0, 9.0, 18.0, 9.0, 8.0, 5.0, 5.0, 11.0, 3.0, 5.0, 3.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-3.556640625, -3.4449462890625, -3.333251953125, -3.2215576171875, -3.10986328125, -2.9981689453125, -2.886474609375, -2.7747802734375, -2.6630859375, -2.5513916015625, -2.439697265625, -2.3280029296875, -2.21630859375, -2.1046142578125, -1.992919921875, -1.8812255859375, -1.76953125, -1.6578369140625, -1.546142578125, -1.4344482421875, -1.32275390625, -1.2110595703125, -1.099365234375, -0.9876708984375, -0.8759765625, -0.7642822265625, -0.652587890625, -0.5408935546875, -0.42919921875, -0.3175048828125, -0.205810546875, -0.0941162109375, 0.017578125, 0.1292724609375, 0.240966796875, 0.3526611328125, 0.46435546875, 0.5760498046875, 0.687744140625, 0.7994384765625, 0.9111328125, 1.0228271484375, 1.134521484375, 1.2462158203125, 1.35791015625, 1.4696044921875, 1.581298828125, 1.6929931640625, 1.8046875, 1.9163818359375, 2.028076171875, 2.1397705078125, 2.25146484375, 2.3631591796875, 2.474853515625, 2.5865478515625, 2.6982421875, 2.8099365234375, 2.921630859375, 3.0333251953125, 3.14501953125, 3.2567138671875, 3.368408203125, 3.4801025390625, 3.591796875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 5.0, 3.0, 7.0, 11.0, 14.0, 22.0, 30.0, 51.0, 65.0, 100.0, 142.0, 176.0, 302.0, 477.0, 763.0, 1175.0, 1799.0, 3104.0, 5067.0, 8359.0, 13932.0, 24040.0, 40526.0, 71436.0, 131121.0, 230597.0, 223563.0, 126242.0, 68653.0, 39149.0, 22878.0, 13536.0, 8205.0, 5015.0, 2954.0, 1790.0, 1204.0, 675.0, 462.0, 298.0, 208.0, 119.0, 109.0, 51.0, 39.0, 26.0, 18.0, 13.0, 9.0, 7.0, 10.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.123046875, -3.018829345703125, -2.91461181640625, -2.810394287109375, -2.7061767578125, -2.601959228515625, -2.49774169921875, -2.393524169921875, -2.289306640625, -2.185089111328125, -2.08087158203125, -1.976654052734375, -1.8724365234375, -1.768218994140625, -1.66400146484375, -1.559783935546875, -1.45556640625, -1.351348876953125, -1.24713134765625, -1.142913818359375, -1.0386962890625, -0.934478759765625, -0.83026123046875, -0.726043701171875, -0.621826171875, -0.517608642578125, -0.41339111328125, -0.309173583984375, -0.2049560546875, -0.100738525390625, 0.00347900390625, 0.107696533203125, 0.2119140625, 0.316131591796875, 0.42034912109375, 0.524566650390625, 0.6287841796875, 0.733001708984375, 0.83721923828125, 0.941436767578125, 1.045654296875, 1.149871826171875, 1.25408935546875, 1.358306884765625, 1.4625244140625, 1.566741943359375, 1.67095947265625, 1.775177001953125, 1.87939453125, 1.983612060546875, 2.08782958984375, 2.192047119140625, 2.2962646484375, 2.400482177734375, 2.50469970703125, 2.608917236328125, 2.713134765625, 2.817352294921875, 2.92156982421875, 3.025787353515625, 3.1300048828125, 3.234222412109375, 3.33843994140625, 3.442657470703125, 3.546875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 7.0, 6.0, 12.0, 13.0, 9.0, 14.0, 14.0, 21.0, 28.0, 27.0, 35.0, 34.0, 36.0, 43.0, 61.0, 70.0, 125.0, 329.0, 1497.0, 196.0, 111.0, 70.0, 42.0, 37.0, 43.0, 35.0, 25.0, 21.0, 16.0, 10.0, 12.0, 14.0, 15.0, 8.0, 4.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.078125, -19.474853515625, -18.87158203125, -18.268310546875, -17.6650390625, -17.061767578125, -16.45849609375, -15.855224609375, -15.251953125, -14.648681640625, -14.04541015625, -13.442138671875, -12.8388671875, -12.235595703125, -11.63232421875, -11.029052734375, -10.42578125, -9.822509765625, -9.21923828125, -8.615966796875, -8.0126953125, -7.409423828125, -6.80615234375, -6.202880859375, -5.599609375, -4.996337890625, -4.39306640625, -3.789794921875, -3.1865234375, -2.583251953125, -1.97998046875, -1.376708984375, -0.7734375, -0.170166015625, 0.43310546875, 1.036376953125, 1.6396484375, 2.242919921875, 2.84619140625, 3.449462890625, 4.052734375, 4.656005859375, 5.25927734375, 5.862548828125, 6.4658203125, 7.069091796875, 7.67236328125, 8.275634765625, 8.87890625, 9.482177734375, 10.08544921875, 10.688720703125, 11.2919921875, 11.895263671875, 12.49853515625, 13.101806640625, 13.705078125, 14.308349609375, 14.91162109375, 15.514892578125, 16.1181640625, 16.721435546875, 17.32470703125, 17.927978515625, 18.53125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 9.0, 12.0, 12.0, 26.0, 55.0, 66.0, 146.0, 301.0, 767.0, 6505.0, 3095661.0, 40054.0, 1262.0, 385.0, 196.0, 84.0, 61.0, 42.0, 25.0, 12.0, 7.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-71.0, -69.0087890625, -67.017578125, -65.0263671875, -63.03515625, -61.0439453125, -59.052734375, -57.0615234375, -55.0703125, -53.0791015625, -51.087890625, -49.0966796875, -47.10546875, -45.1142578125, -43.123046875, -41.1318359375, -39.140625, -37.1494140625, -35.158203125, -33.1669921875, -31.17578125, -29.1845703125, -27.193359375, -25.2021484375, -23.2109375, -21.2197265625, -19.228515625, -17.2373046875, -15.24609375, -13.2548828125, -11.263671875, -9.2724609375, -7.28125, -5.2900390625, -3.298828125, -1.3076171875, 0.68359375, 2.6748046875, 4.666015625, 6.6572265625, 8.6484375, 10.6396484375, 12.630859375, 14.6220703125, 16.61328125, 18.6044921875, 20.595703125, 22.5869140625, 24.578125, 26.5693359375, 28.560546875, 30.5517578125, 32.54296875, 34.5341796875, 36.525390625, 38.5166015625, 40.5078125, 42.4990234375, 44.490234375, 46.4814453125, 48.47265625, 50.4638671875, 52.455078125, 54.4462890625, 56.4375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 1008.0, 4.0], "bins": [-1313.296630859375, -1292.2696533203125, -1271.2425537109375, -1250.215576171875, -1229.1884765625, -1208.1614990234375, -1187.134521484375, -1166.107421875, -1145.0804443359375, -1124.053466796875, -1103.0263671875, -1081.9993896484375, -1060.972412109375, -1039.9453125, -1018.9183349609375, -997.8912963867188, -976.8642578125, -955.8372192382812, -934.8101806640625, -913.783203125, -892.7561645507812, -871.7291259765625, -850.7021484375, -829.6751098632812, -808.6480712890625, -787.6210327148438, -766.593994140625, -745.5670166015625, -724.5399780273438, -703.512939453125, -682.4859619140625, -661.4589233398438, -640.4319458007812, -619.4049072265625, -598.3779296875, -577.3508911132812, -556.3238525390625, -535.2968139648438, -514.269775390625, -493.2427978515625, -472.2157287597656, -451.188720703125, -430.16168212890625, -409.1346435546875, -388.1076354980469, -367.08062744140625, -346.0535888671875, -325.02655029296875, -303.9995422363281, -282.9725341796875, -261.94549560546875, -240.91847229003906, -219.89144897460938, -198.8644256591797, -177.83740234375, -156.8103790283203, -135.78335571289062, -114.75633239746094, -93.72930908203125, -72.70228576660156, -51.675262451171875, -30.648239135742188, -9.6212158203125, 11.405807495117188, 32.43282699584961]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 3.0, 8.0, 5.0, 11.0, 8.0, 16.0, 10.0, 15.0, 22.0, 19.0, 25.0, 28.0, 24.0, 41.0, 38.0, 40.0, 38.0, 55.0, 37.0, 39.0, 32.0, 48.0, 48.0, 42.0, 40.0, 41.0, 30.0, 33.0, 25.0, 27.0, 19.0, 22.0, 16.0, 22.0, 14.0, 12.0, 11.0, 10.0, 7.0, 2.0, 4.0, 4.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.18935775756836, -47.5916633605957, -45.99396896362305, -44.39627456665039, -42.798580169677734, -41.20088577270508, -39.60319519042969, -38.00550079345703, -36.407806396484375, -34.81011199951172, -33.21241760253906, -31.614723205566406, -30.01702880859375, -28.419334411621094, -26.82164192199707, -25.223947525024414, -23.626251220703125, -22.02855682373047, -20.430862426757812, -18.833168029785156, -17.2354736328125, -15.63778018951416, -14.04008674621582, -12.442392349243164, -10.844697952270508, -9.247003555297852, -7.6493096351623535, -6.0516157150268555, -4.453921318054199, -2.856226921081543, -1.2585334777832031, 0.3391609191894531, 1.9368553161621094, 3.5345494747161865, 5.132243633270264, 6.729937553405762, 8.327631950378418, 9.925326347351074, 11.523019790649414, 13.12071418762207, 14.718408584594727, 16.316102981567383, 17.91379737854004, 19.511489868164062, 21.10918426513672, 22.706878662109375, 24.30457305908203, 25.902267456054688, 27.499961853027344, 29.09765625, 30.695350646972656, 32.29304504394531, 33.89073944091797, 35.488433837890625, 37.08612823486328, 38.68382263183594, 40.281517028808594, 41.87921142578125, 43.476905822753906, 45.07460021972656, 46.67229461669922, 48.269989013671875, 49.86768341064453, 51.46537780761719, 53.06306838989258]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 9.0, 10.0, 9.0, 12.0, 16.0, 13.0, 12.0, 18.0, 17.0, 21.0, 20.0, 28.0, 24.0, 29.0, 30.0, 40.0, 46.0, 43.0, 34.0, 26.0, 46.0, 40.0, 40.0, 39.0, 27.0, 35.0, 40.0, 34.0, 26.0, 29.0, 20.0, 23.0, 23.0, 21.0, 18.0, 17.0, 10.0, 10.0, 9.0, 10.0, 4.0, 5.0, 5.0, 3.0, 8.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8359375, -3.7078857421875, -3.579833984375, -3.4517822265625, -3.32373046875, -3.1956787109375, -3.067626953125, -2.9395751953125, -2.8115234375, -2.6834716796875, -2.555419921875, -2.4273681640625, -2.29931640625, -2.1712646484375, -2.043212890625, -1.9151611328125, -1.787109375, -1.6590576171875, -1.531005859375, -1.4029541015625, -1.27490234375, -1.1468505859375, -1.018798828125, -0.8907470703125, -0.7626953125, -0.6346435546875, -0.506591796875, -0.3785400390625, -0.25048828125, -0.1224365234375, 0.005615234375, 0.1336669921875, 0.26171875, 0.3897705078125, 0.517822265625, 0.6458740234375, 0.77392578125, 0.9019775390625, 1.030029296875, 1.1580810546875, 1.2861328125, 1.4141845703125, 1.542236328125, 1.6702880859375, 1.79833984375, 1.9263916015625, 2.054443359375, 2.1824951171875, 2.310546875, 2.4385986328125, 2.566650390625, 2.6947021484375, 2.82275390625, 2.9508056640625, 3.078857421875, 3.2069091796875, 3.3349609375, 3.4630126953125, 3.591064453125, 3.7191162109375, 3.84716796875, 3.9752197265625, 4.103271484375, 4.2313232421875, 4.359375]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 3.0, 2.0, 6.0, 6.0, 5.0, 13.0, 21.0, 31.0, 37.0, 61.0, 63.0, 114.0, 152.0, 262.0, 419.0, 693.0, 1247.0, 2120.0, 3769.0, 7206.0, 14275.0, 30022.0, 68594.0, 175983.0, 494456.0, 1128620.0, 1263504.0, 623344.0, 222860.0, 84299.0, 36091.0, 17181.0, 8421.0, 4534.0, 2415.0, 1372.0, 743.0, 491.0, 303.0, 188.0, 122.0, 57.0, 47.0, 43.0, 21.0, 17.0, 12.0, 10.0, 8.0, 2.0, 8.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0], "bins": [-4.87890625, -4.72698974609375, -4.5750732421875, -4.42315673828125, -4.271240234375, -4.11932373046875, -3.9674072265625, -3.81549072265625, -3.66357421875, -3.51165771484375, -3.3597412109375, -3.20782470703125, -3.055908203125, -2.90399169921875, -2.7520751953125, -2.60015869140625, -2.4482421875, -2.29632568359375, -2.1444091796875, -1.99249267578125, -1.840576171875, -1.68865966796875, -1.5367431640625, -1.38482666015625, -1.23291015625, -1.08099365234375, -0.9290771484375, -0.77716064453125, -0.625244140625, -0.47332763671875, -0.3214111328125, -0.16949462890625, -0.017578125, 0.13433837890625, 0.2862548828125, 0.43817138671875, 0.590087890625, 0.74200439453125, 0.8939208984375, 1.04583740234375, 1.19775390625, 1.34967041015625, 1.5015869140625, 1.65350341796875, 1.805419921875, 1.95733642578125, 2.1092529296875, 2.26116943359375, 2.4130859375, 2.56500244140625, 2.7169189453125, 2.86883544921875, 3.020751953125, 3.17266845703125, 3.3245849609375, 3.47650146484375, 3.62841796875, 3.78033447265625, 3.9322509765625, 4.08416748046875, 4.236083984375, 4.38800048828125, 4.5399169921875, 4.69183349609375, 4.84375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 14.0, 17.0, 11.0, 21.0, 24.0, 26.0, 40.0, 60.0, 65.0, 105.0, 112.0, 187.0, 185.0, 300.0, 426.0, 437.0, 395.0, 384.0, 276.0, 275.0, 183.0, 139.0, 102.0, 78.0, 55.0, 45.0, 26.0, 17.0, 15.0, 15.0, 11.0, 8.0, 7.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80859375, -7.53094482421875, -7.2532958984375, -6.97564697265625, -6.697998046875, -6.42034912109375, -6.1427001953125, -5.86505126953125, -5.58740234375, -5.30975341796875, -5.0321044921875, -4.75445556640625, -4.476806640625, -4.19915771484375, -3.9215087890625, -3.64385986328125, -3.3662109375, -3.08856201171875, -2.8109130859375, -2.53326416015625, -2.255615234375, -1.97796630859375, -1.7003173828125, -1.42266845703125, -1.14501953125, -0.86737060546875, -0.5897216796875, -0.31207275390625, -0.034423828125, 0.24322509765625, 0.5208740234375, 0.79852294921875, 1.076171875, 1.35382080078125, 1.6314697265625, 1.90911865234375, 2.186767578125, 2.46441650390625, 2.7420654296875, 3.01971435546875, 3.29736328125, 3.57501220703125, 3.8526611328125, 4.13031005859375, 4.407958984375, 4.68560791015625, 4.9632568359375, 5.24090576171875, 5.5185546875, 5.79620361328125, 6.0738525390625, 6.35150146484375, 6.629150390625, 6.90679931640625, 7.1844482421875, 7.46209716796875, 7.73974609375, 8.01739501953125, 8.2950439453125, 8.57269287109375, 8.850341796875, 9.12799072265625, 9.4056396484375, 9.68328857421875, 9.9609375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 9.0, 14.0, 14.0, 15.0, 28.0, 29.0, 45.0, 57.0, 97.0, 152.0, 226.0, 499.0, 1147.0, 3407.0, 12792.0, 59751.0, 364423.0, 2232407.0, 1290855.0, 184012.0, 32784.0, 7450.0, 2283.0, 805.0, 355.0, 217.0, 131.0, 62.0, 47.0, 45.0, 29.0, 25.0, 20.0, 10.0, 11.0, 8.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.6875, -15.2369384765625, -14.786376953125, -14.3358154296875, -13.88525390625, -13.4346923828125, -12.984130859375, -12.5335693359375, -12.0830078125, -11.6324462890625, -11.181884765625, -10.7313232421875, -10.28076171875, -9.8302001953125, -9.379638671875, -8.9290771484375, -8.478515625, -8.0279541015625, -7.577392578125, -7.1268310546875, -6.67626953125, -6.2257080078125, -5.775146484375, -5.3245849609375, -4.8740234375, -4.4234619140625, -3.972900390625, -3.5223388671875, -3.07177734375, -2.6212158203125, -2.170654296875, -1.7200927734375, -1.26953125, -0.8189697265625, -0.368408203125, 0.0821533203125, 0.53271484375, 0.9832763671875, 1.433837890625, 1.8843994140625, 2.3349609375, 2.7855224609375, 3.236083984375, 3.6866455078125, 4.13720703125, 4.5877685546875, 5.038330078125, 5.4888916015625, 5.939453125, 6.3900146484375, 6.840576171875, 7.2911376953125, 7.74169921875, 8.1922607421875, 8.642822265625, 9.0933837890625, 9.5439453125, 9.9945068359375, 10.445068359375, 10.8956298828125, 11.34619140625, 11.7967529296875, 12.247314453125, 12.6978759765625, 13.1484375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [6.0, 0.0, 6.0, 8.0, 17.0, 23.0, 41.0, 56.0, 96.0, 107.0, 121.0, 126.0, 114.0, 95.0, 82.0, 48.0, 33.0, 13.0, 16.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.874792098999023, -19.96541404724121, -18.05603790283203, -16.14665985107422, -14.237282752990723, -12.327905654907227, -10.418527603149414, -8.509150505065918, -6.599773406982422, -4.690396308898926, -2.7810187339782715, -0.8716411590576172, 1.037735939025879, 2.947113037109375, 4.8564910888671875, 6.765868186950684, 8.67524528503418, 10.584622383117676, 12.493999481201172, 14.403377532958984, 16.312755584716797, 18.222131729125977, 20.13150978088379, 22.04088592529297, 23.95026397705078, 25.859642028808594, 27.769018173217773, 29.678396224975586, 31.587772369384766, 33.49715042114258, 35.40652847290039, 37.3159065246582, 39.22528076171875, 41.13465881347656, 43.044036865234375, 44.95341491699219, 46.862789154052734, 48.77216720581055, 50.68154525756836, 52.59092330932617, 54.50029754638672, 56.40967559814453, 58.319053649902344, 60.228431701660156, 62.1378059387207, 64.04718017578125, 65.95655822753906, 67.86593627929688, 69.77531433105469, 71.6846923828125, 73.59407043457031, 75.50344848632812, 77.41282653808594, 79.32220458984375, 81.23158264160156, 83.14095306396484, 85.05033874511719, 86.959716796875, 88.86909484863281, 90.77847290039062, 92.68785095214844, 94.59722900390625, 96.50660705566406, 98.41597747802734, 100.32535552978516]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 5.0, 2.0, 4.0, 3.0, 6.0, 7.0, 8.0, 8.0, 12.0, 12.0, 14.0, 12.0, 21.0, 20.0, 25.0, 28.0, 33.0, 34.0, 36.0, 39.0, 39.0, 47.0, 50.0, 34.0, 38.0, 44.0, 37.0, 43.0, 46.0, 34.0, 36.0, 36.0, 26.0, 25.0, 22.0, 27.0, 16.0, 17.0, 10.0, 18.0, 13.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.081953048706055, -25.117475509643555, -24.152997970581055, -23.188518524169922, -22.224040985107422, -21.259563446044922, -20.295085906982422, -19.330608367919922, -18.366130828857422, -17.401653289794922, -16.437175750732422, -15.472697257995605, -14.508218765258789, -13.543741226196289, -12.579263687133789, -11.614786148071289, -10.650306701660156, -9.685829162597656, -8.72135066986084, -7.75687313079834, -6.792395114898682, -5.827917098999023, -4.863439559936523, -3.8989615440368652, -2.934483528137207, -1.9700056314468384, -1.0055277347564697, -0.041049957275390625, 0.9234280586242676, 1.8879060745239258, 2.852383613586426, 3.816861629486084, 4.781337738037109, 5.745815753936768, 6.710293769836426, 7.674771308898926, 8.639249801635742, 9.603727340698242, 10.568204879760742, 11.532682418823242, 12.497160911560059, 13.461638450622559, 14.426116943359375, 15.390594482421875, 16.355072021484375, 17.319549560546875, 18.284027099609375, 19.248506546020508, 20.212984085083008, 21.177461624145508, 22.141939163208008, 23.10641860961914, 24.07089614868164, 25.03537368774414, 25.99985122680664, 26.96432876586914, 27.92880630493164, 28.89328384399414, 29.85776138305664, 30.82223892211914, 31.786718368530273, 32.751197814941406, 33.715675354003906, 34.680152893066406, 35.644630432128906]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 9.0, 7.0, 8.0, 9.0, 13.0, 14.0, 12.0, 19.0, 32.0, 29.0, 26.0, 34.0, 39.0, 37.0, 33.0, 41.0, 47.0, 46.0, 57.0, 46.0, 35.0, 39.0, 44.0, 36.0, 35.0, 36.0, 39.0, 29.0, 23.0, 23.0, 22.0, 17.0, 12.0, 9.0, 12.0, 9.0, 6.0, 4.0, 3.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.03125, -4.88739013671875, -4.7435302734375, -4.59967041015625, -4.455810546875, -4.31195068359375, -4.1680908203125, -4.02423095703125, -3.88037109375, -3.73651123046875, -3.5926513671875, -3.44879150390625, -3.304931640625, -3.16107177734375, -3.0172119140625, -2.87335205078125, -2.7294921875, -2.58563232421875, -2.4417724609375, -2.29791259765625, -2.154052734375, -2.01019287109375, -1.8663330078125, -1.72247314453125, -1.57861328125, -1.43475341796875, -1.2908935546875, -1.14703369140625, -1.003173828125, -0.85931396484375, -0.7154541015625, -0.57159423828125, -0.427734375, -0.28387451171875, -0.1400146484375, 0.00384521484375, 0.147705078125, 0.29156494140625, 0.4354248046875, 0.57928466796875, 0.72314453125, 0.86700439453125, 1.0108642578125, 1.15472412109375, 1.298583984375, 1.44244384765625, 1.5863037109375, 1.73016357421875, 1.8740234375, 2.01788330078125, 2.1617431640625, 2.30560302734375, 2.449462890625, 2.59332275390625, 2.7371826171875, 2.88104248046875, 3.02490234375, 3.16876220703125, 3.3126220703125, 3.45648193359375, 3.600341796875, 3.74420166015625, 3.8880615234375, 4.03192138671875, 4.17578125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 6.0, 2.0, 4.0, 9.0, 6.0, 4.0, 8.0, 14.0, 13.0, 20.0, 36.0, 31.0, 54.0, 114.0, 184.0, 421.0, 657.0, 1365.0, 2661.0, 5274.0, 9754.0, 18148.0, 31410.0, 52175.0, 79177.0, 109616.0, 136248.0, 147425.0, 136405.0, 110794.0, 80947.0, 53381.0, 32257.0, 18601.0, 10207.0, 5474.0, 2669.0, 1408.0, 701.0, 338.0, 191.0, 114.0, 68.0, 41.0, 30.0, 26.0, 20.0, 23.0, 6.0, 8.0, 6.0, 1.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.544921875, -2.4615478515625, -2.378173828125, -2.2947998046875, -2.21142578125, -2.1280517578125, -2.044677734375, -1.9613037109375, -1.8779296875, -1.7945556640625, -1.711181640625, -1.6278076171875, -1.54443359375, -1.4610595703125, -1.377685546875, -1.2943115234375, -1.2109375, -1.1275634765625, -1.044189453125, -0.9608154296875, -0.87744140625, -0.7940673828125, -0.710693359375, -0.6273193359375, -0.5439453125, -0.4605712890625, -0.377197265625, -0.2938232421875, -0.21044921875, -0.1270751953125, -0.043701171875, 0.0396728515625, 0.123046875, 0.2064208984375, 0.289794921875, 0.3731689453125, 0.45654296875, 0.5399169921875, 0.623291015625, 0.7066650390625, 0.7900390625, 0.8734130859375, 0.956787109375, 1.0401611328125, 1.12353515625, 1.2069091796875, 1.290283203125, 1.3736572265625, 1.45703125, 1.5404052734375, 1.623779296875, 1.7071533203125, 1.79052734375, 1.8739013671875, 1.957275390625, 2.0406494140625, 2.1240234375, 2.2073974609375, 2.290771484375, 2.3741455078125, 2.45751953125, 2.5408935546875, 2.624267578125, 2.7076416015625, 2.791015625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 3.0, 2.0, 8.0, 10.0, 9.0, 7.0, 12.0, 15.0, 15.0, 22.0, 23.0, 17.0, 28.0, 23.0, 28.0, 30.0, 27.0, 38.0, 41.0, 41.0, 42.0, 40.0, 1062.0, 32.0, 32.0, 34.0, 49.0, 39.0, 48.0, 32.0, 27.0, 25.0, 21.0, 23.0, 20.0, 9.0, 19.0, 15.0, 13.0, 4.0, 10.0, 8.0, 6.0, 3.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0], "bins": [-4.94140625, -4.80206298828125, -4.6627197265625, -4.52337646484375, -4.384033203125, -4.24468994140625, -4.1053466796875, -3.96600341796875, -3.82666015625, -3.68731689453125, -3.5479736328125, -3.40863037109375, -3.269287109375, -3.12994384765625, -2.9906005859375, -2.85125732421875, -2.7119140625, -2.57257080078125, -2.4332275390625, -2.29388427734375, -2.154541015625, -2.01519775390625, -1.8758544921875, -1.73651123046875, -1.59716796875, -1.45782470703125, -1.3184814453125, -1.17913818359375, -1.039794921875, -0.90045166015625, -0.7611083984375, -0.62176513671875, -0.482421875, -0.34307861328125, -0.2037353515625, -0.06439208984375, 0.074951171875, 0.21429443359375, 0.3536376953125, 0.49298095703125, 0.63232421875, 0.77166748046875, 0.9110107421875, 1.05035400390625, 1.189697265625, 1.32904052734375, 1.4683837890625, 1.60772705078125, 1.7470703125, 1.88641357421875, 2.0257568359375, 2.16510009765625, 2.304443359375, 2.44378662109375, 2.5831298828125, 2.72247314453125, 2.86181640625, 3.00115966796875, 3.1405029296875, 3.27984619140625, 3.419189453125, 3.55853271484375, 3.6978759765625, 3.83721923828125, 3.9765625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 9.0, 21.0, 18.0, 32.0, 52.0, 88.0, 104.0, 174.0, 312.0, 423.0, 729.0, 1097.0, 1868.0, 2879.0, 4539.0, 7265.0, 11005.0, 17859.0, 34458.0, 206841.0, 1660050.0, 80629.0, 25890.0, 14983.0, 9516.0, 5941.0, 3844.0, 2373.0, 1482.0, 975.0, 595.0, 383.0, 255.0, 153.0, 95.0, 75.0, 42.0, 27.0, 22.0, 6.0, 11.0, 11.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53125, -4.38653564453125, -4.2418212890625, -4.09710693359375, -3.952392578125, -3.80767822265625, -3.6629638671875, -3.51824951171875, -3.37353515625, -3.22882080078125, -3.0841064453125, -2.93939208984375, -2.794677734375, -2.64996337890625, -2.5052490234375, -2.36053466796875, -2.2158203125, -2.07110595703125, -1.9263916015625, -1.78167724609375, -1.636962890625, -1.49224853515625, -1.3475341796875, -1.20281982421875, -1.05810546875, -0.91339111328125, -0.7686767578125, -0.62396240234375, -0.479248046875, -0.33453369140625, -0.1898193359375, -0.04510498046875, 0.099609375, 0.24432373046875, 0.3890380859375, 0.53375244140625, 0.678466796875, 0.82318115234375, 0.9678955078125, 1.11260986328125, 1.25732421875, 1.40203857421875, 1.5467529296875, 1.69146728515625, 1.836181640625, 1.98089599609375, 2.1256103515625, 2.27032470703125, 2.4150390625, 2.55975341796875, 2.7044677734375, 2.84918212890625, 2.993896484375, 3.13861083984375, 3.2833251953125, 3.42803955078125, 3.57275390625, 3.71746826171875, 3.8621826171875, 4.00689697265625, 4.151611328125, 4.29632568359375, 4.4410400390625, 4.58575439453125, 4.73046875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 6.0, 12.0, 14.0, 17.0, 24.0, 26.0, 29.0, 40.0, 45.0, 50.0, 66.0, 63.0, 78.0, 83.0, 73.0, 62.0, 62.0, 58.0, 34.0, 37.0, 26.0, 23.0, 12.0, 16.0, 11.0, 8.0, 8.0, 12.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.392578125, -0.38170623779296875, -0.3708343505859375, -0.35996246337890625, -0.349090576171875, -0.33821868896484375, -0.3273468017578125, -0.31647491455078125, -0.30560302734375, -0.29473114013671875, -0.2838592529296875, -0.27298736572265625, -0.262115478515625, -0.25124359130859375, -0.2403717041015625, -0.22949981689453125, -0.2186279296875, -0.20775604248046875, -0.1968841552734375, -0.18601226806640625, -0.175140380859375, -0.16426849365234375, -0.1533966064453125, -0.14252471923828125, -0.13165283203125, -0.12078094482421875, -0.1099090576171875, -0.09903717041015625, -0.088165283203125, -0.07729339599609375, -0.0664215087890625, -0.05554962158203125, -0.044677734375, -0.03380584716796875, -0.0229339599609375, -0.01206207275390625, -0.001190185546875, 0.00968170166015625, 0.0205535888671875, 0.03142547607421875, 0.04229736328125, 0.05316925048828125, 0.0640411376953125, 0.07491302490234375, 0.085784912109375, 0.09665679931640625, 0.1075286865234375, 0.11840057373046875, 0.1292724609375, 0.14014434814453125, 0.1510162353515625, 0.16188812255859375, 0.172760009765625, 0.18363189697265625, 0.1945037841796875, 0.20537567138671875, 0.21624755859375, 0.22711944580078125, 0.2379913330078125, 0.24886322021484375, 0.259735107421875, 0.27060699462890625, 0.2814788818359375, 0.29235076904296875, 0.30322265625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 14.0, 11.0, 12.0, 11.0, 14.0, 31.0, 37.0, 65.0, 95.0, 146.0, 257.0, 511.0, 1429.0, 80975.0, 952907.0, 10190.0, 867.0, 418.0, 192.0, 136.0, 67.0, 49.0, 28.0, 20.0, 19.0, 17.0, 11.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9375, -4.76312255859375, -4.5887451171875, -4.41436767578125, -4.239990234375, -4.06561279296875, -3.8912353515625, -3.71685791015625, -3.54248046875, -3.36810302734375, -3.1937255859375, -3.01934814453125, -2.844970703125, -2.67059326171875, -2.4962158203125, -2.32183837890625, -2.1474609375, -1.97308349609375, -1.7987060546875, -1.62432861328125, -1.449951171875, -1.27557373046875, -1.1011962890625, -0.92681884765625, -0.75244140625, -0.57806396484375, -0.4036865234375, -0.22930908203125, -0.054931640625, 0.11944580078125, 0.2938232421875, 0.46820068359375, 0.642578125, 0.81695556640625, 0.9913330078125, 1.16571044921875, 1.340087890625, 1.51446533203125, 1.6888427734375, 1.86322021484375, 2.03759765625, 2.21197509765625, 2.3863525390625, 2.56072998046875, 2.735107421875, 2.90948486328125, 3.0838623046875, 3.25823974609375, 3.4326171875, 3.60699462890625, 3.7813720703125, 3.95574951171875, 4.130126953125, 4.30450439453125, 4.4788818359375, 4.65325927734375, 4.82763671875, 5.00201416015625, 5.1763916015625, 5.35076904296875, 5.525146484375, 5.69952392578125, 5.8739013671875, 6.04827880859375, 6.22265625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 12.0, 39.0, 277.0, 505.0, 147.0, 24.0, 9.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.465948104858398, -10.212835311889648, -9.959723472595215, -9.706610679626465, -9.453498840332031, -9.200386047363281, -8.947274208068848, -8.694161415100098, -8.441049575805664, -8.187936782836914, -7.9348249435424805, -7.681712627410889, -7.428600311279297, -7.175487995147705, -6.922375679016113, -6.669262886047363, -6.4161505699157715, -6.16303825378418, -5.909925937652588, -5.656813621520996, -5.403701305389404, -5.1505889892578125, -4.8974761962890625, -4.644364356994629, -4.391251564025879, -4.138139247894287, -3.8850269317626953, -3.6319146156311035, -3.3788022994995117, -3.12568998336792, -2.872577428817749, -2.6194651126861572, -2.3663525581359863, -2.1132402420043945, -1.8601279258728027, -1.6070154905319214, -1.3539031744003296, -1.1007908582687378, -0.8476784229278564, -0.5945661067962646, -0.34145379066467285, -0.08834144473075867, 0.16477090120315552, 0.4178832769393921, 0.6709955930709839, 0.9241079092025757, 1.177220344543457, 1.4303326606750488, 1.6834449768066406, 1.9365572929382324, 2.189669609069824, 2.442781925201416, 2.695894241333008, 2.9490065574645996, 3.2021191120147705, 3.4552314281463623, 3.708343744277954, 3.961456060409546, 4.214568614959717, 4.467680931091309, 4.7207932472229, 4.973905563354492, 5.227017879486084, 5.480130195617676, 5.733242511749268]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 3.0, 5.0, 9.0, 16.0, 22.0, 29.0, 34.0, 37.0, 53.0, 50.0, 56.0, 56.0, 56.0, 74.0, 62.0, 58.0, 57.0, 49.0, 45.0, 48.0, 43.0, 31.0, 26.0, 16.0, 18.0, 12.0, 8.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0627939701080322, -1.990100622177124, -1.9174071550369263, -1.844713807106018, -1.7720203399658203, -1.699326992034912, -1.626633644104004, -1.5539402961730957, -1.481246829032898, -1.4085534811019897, -1.335860013961792, -1.2631666660308838, -1.1904733180999756, -1.1177798509597778, -1.0450865030288696, -0.9723930954933167, -0.8996996879577637, -0.8270062804222107, -0.7543128728866577, -0.6816195249557495, -0.6089261174201965, -0.5362327098846436, -0.46353933215141296, -0.3908459544181824, -0.3181525468826294, -0.2454591542482376, -0.17276576161384583, -0.10007236897945404, -0.027378976345062256, 0.04531443119049072, 0.11800780892372131, 0.1907011866569519, 0.2633943557739258, 0.33608776330947876, 0.40878114104270935, 0.48147451877593994, 0.5541679263114929, 0.6268613338470459, 0.6995546817779541, 0.7722480893135071, 0.8449414968490601, 0.917634904384613, 0.990328311920166, 1.0630216598510742, 1.1357150077819824, 1.2084084749221802, 1.2811018228530884, 1.3537952899932861, 1.4264886379241943, 1.4991819858551025, 1.5718754529953003, 1.6445688009262085, 1.7172622680664062, 1.7899556159973145, 1.8626489639282227, 1.9353423118591309, 2.008035659790039, 2.0807290077209473, 2.1534223556518555, 2.2261159420013428, 2.298809289932251, 2.371502637863159, 2.4441959857940674, 2.5168893337249756, 2.589582920074463]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 6.0, 9.0, 9.0, 6.0, 16.0, 9.0, 18.0, 14.0, 17.0, 20.0, 24.0, 25.0, 24.0, 24.0, 36.0, 36.0, 42.0, 33.0, 37.0, 39.0, 40.0, 48.0, 49.0, 34.0, 33.0, 26.0, 53.0, 26.0, 29.0, 32.0, 14.0, 18.0, 30.0, 20.0, 18.0, 10.0, 16.0, 15.0, 7.0, 10.0, 8.0, 4.0, 6.0, 2.0, 2.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.0078125, -3.88092041015625, -3.7540283203125, -3.62713623046875, -3.500244140625, -3.37335205078125, -3.2464599609375, -3.11956787109375, -2.99267578125, -2.86578369140625, -2.7388916015625, -2.61199951171875, -2.485107421875, -2.35821533203125, -2.2313232421875, -2.10443115234375, -1.9775390625, -1.85064697265625, -1.7237548828125, -1.59686279296875, -1.469970703125, -1.34307861328125, -1.2161865234375, -1.08929443359375, -0.96240234375, -0.83551025390625, -0.7086181640625, -0.58172607421875, -0.454833984375, -0.32794189453125, -0.2010498046875, -0.07415771484375, 0.052734375, 0.17962646484375, 0.3065185546875, 0.43341064453125, 0.560302734375, 0.68719482421875, 0.8140869140625, 0.94097900390625, 1.06787109375, 1.19476318359375, 1.3216552734375, 1.44854736328125, 1.575439453125, 1.70233154296875, 1.8292236328125, 1.95611572265625, 2.0830078125, 2.20989990234375, 2.3367919921875, 2.46368408203125, 2.590576171875, 2.71746826171875, 2.8443603515625, 2.97125244140625, 3.09814453125, 3.22503662109375, 3.3519287109375, 3.47882080078125, 3.605712890625, 3.73260498046875, 3.8594970703125, 3.98638916015625, 4.11328125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 1.0, 8.0, 10.0, 13.0, 20.0, 34.0, 49.0, 89.0, 133.0, 189.0, 341.0, 556.0, 996.0, 1631.0, 2692.0, 4940.0, 9192.0, 18146.0, 35639.0, 71252.0, 143352.0, 255923.0, 241316.0, 129333.0, 64469.0, 32598.0, 16434.0, 8319.0, 4578.0, 2554.0, 1476.0, 869.0, 545.0, 317.0, 194.0, 114.0, 86.0, 55.0, 37.0, 25.0, 13.0, 8.0, 8.0, 4.0, 0.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.494140625, -3.353973388671875, -3.21380615234375, -3.073638916015625, -2.9334716796875, -2.793304443359375, -2.65313720703125, -2.512969970703125, -2.372802734375, -2.232635498046875, -2.09246826171875, -1.952301025390625, -1.8121337890625, -1.671966552734375, -1.53179931640625, -1.391632080078125, -1.25146484375, -1.111297607421875, -0.97113037109375, -0.830963134765625, -0.6907958984375, -0.550628662109375, -0.41046142578125, -0.270294189453125, -0.130126953125, 0.010040283203125, 0.15020751953125, 0.290374755859375, 0.4305419921875, 0.570709228515625, 0.71087646484375, 0.851043701171875, 0.9912109375, 1.131378173828125, 1.27154541015625, 1.411712646484375, 1.5518798828125, 1.692047119140625, 1.83221435546875, 1.972381591796875, 2.112548828125, 2.252716064453125, 2.39288330078125, 2.533050537109375, 2.6732177734375, 2.813385009765625, 2.95355224609375, 3.093719482421875, 3.23388671875, 3.374053955078125, 3.51422119140625, 3.654388427734375, 3.7945556640625, 3.934722900390625, 4.07489013671875, 4.215057373046875, 4.355224609375, 4.495391845703125, 4.63555908203125, 4.775726318359375, 4.9158935546875, 5.056060791015625, 5.19622802734375, 5.336395263671875, 5.4765625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 7.0, 9.0, 7.0, 12.0, 16.0, 19.0, 22.0, 27.0, 32.0, 28.0, 34.0, 43.0, 52.0, 66.0, 95.0, 165.0, 1381.0, 375.0, 158.0, 89.0, 58.0, 48.0, 49.0, 50.0, 38.0, 32.0, 22.0, 16.0, 23.0, 10.0, 10.0, 17.0, 10.0, 4.0, 3.0, 0.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.15625, -18.55712890625, -17.9580078125, -17.35888671875, -16.759765625, -16.16064453125, -15.5615234375, -14.96240234375, -14.36328125, -13.76416015625, -13.1650390625, -12.56591796875, -11.966796875, -11.36767578125, -10.7685546875, -10.16943359375, -9.5703125, -8.97119140625, -8.3720703125, -7.77294921875, -7.173828125, -6.57470703125, -5.9755859375, -5.37646484375, -4.77734375, -4.17822265625, -3.5791015625, -2.97998046875, -2.380859375, -1.78173828125, -1.1826171875, -0.58349609375, 0.015625, 0.61474609375, 1.2138671875, 1.81298828125, 2.412109375, 3.01123046875, 3.6103515625, 4.20947265625, 4.80859375, 5.40771484375, 6.0068359375, 6.60595703125, 7.205078125, 7.80419921875, 8.4033203125, 9.00244140625, 9.6015625, 10.20068359375, 10.7998046875, 11.39892578125, 11.998046875, 12.59716796875, 13.1962890625, 13.79541015625, 14.39453125, 14.99365234375, 15.5927734375, 16.19189453125, 16.791015625, 17.39013671875, 17.9892578125, 18.58837890625, 19.1875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 13.0, 11.0, 14.0, 42.0, 44.0, 74.0, 120.0, 264.0, 547.0, 2238.0, 209559.0, 2924073.0, 7092.0, 811.0, 348.0, 161.0, 104.0, 64.0, 49.0, 25.0, 15.0, 11.0, 7.0, 7.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.09375, -56.23193359375, -54.3701171875, -52.50830078125, -50.646484375, -48.78466796875, -46.9228515625, -45.06103515625, -43.19921875, -41.33740234375, -39.4755859375, -37.61376953125, -35.751953125, -33.89013671875, -32.0283203125, -30.16650390625, -28.3046875, -26.44287109375, -24.5810546875, -22.71923828125, -20.857421875, -18.99560546875, -17.1337890625, -15.27197265625, -13.41015625, -11.54833984375, -9.6865234375, -7.82470703125, -5.962890625, -4.10107421875, -2.2392578125, -0.37744140625, 1.484375, 3.34619140625, 5.2080078125, 7.06982421875, 8.931640625, 10.79345703125, 12.6552734375, 14.51708984375, 16.37890625, 18.24072265625, 20.1025390625, 21.96435546875, 23.826171875, 25.68798828125, 27.5498046875, 29.41162109375, 31.2734375, 33.13525390625, 34.9970703125, 36.85888671875, 38.720703125, 40.58251953125, 42.4443359375, 44.30615234375, 46.16796875, 48.02978515625, 49.8916015625, 51.75341796875, 53.615234375, 55.47705078125, 57.3388671875, 59.20068359375, 61.0625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 110.0, 905.0], "bins": [-1176.0859375, -1157.48583984375, -1138.8858642578125, -1120.2857666015625, -1101.685791015625, -1083.085693359375, -1064.485595703125, -1045.8856201171875, -1027.2855224609375, -1008.6854858398438, -990.08544921875, -971.4853515625, -952.8853149414062, -934.2852783203125, -915.6851806640625, -897.0851440429688, -878.485107421875, -859.8850708007812, -841.2850341796875, -822.6849365234375, -804.0848999023438, -785.48486328125, -766.884765625, -748.2847290039062, -729.6846923828125, -711.0846557617188, -692.484619140625, -673.884521484375, -655.2844848632812, -636.6844482421875, -618.0843505859375, -599.4843139648438, -580.8843383789062, -562.2843017578125, -543.6842041015625, -525.0841674804688, -506.484130859375, -487.88409423828125, -469.2840270996094, -450.6839599609375, -432.08392333984375, -413.48388671875, -394.8838195800781, -376.28375244140625, -357.6837158203125, -339.08367919921875, -320.4836120605469, -301.883544921875, -283.28350830078125, -264.6834716796875, -246.08340454101562, -227.4833526611328, -208.88330078125, -190.2832489013672, -171.68319702148438, -153.08314514160156, -134.4830780029297, -115.88302612304688, -97.28297424316406, -78.68292236328125, -60.08287048339844, -41.482818603515625, -22.882766723632812, -4.28271484375, 14.317330360412598]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 11.0, 10.0, 7.0, 13.0, 13.0, 20.0, 12.0, 14.0, 23.0, 33.0, 24.0, 30.0, 24.0, 40.0, 33.0, 45.0, 46.0, 43.0, 35.0, 56.0, 54.0, 41.0, 22.0, 35.0, 26.0, 38.0, 34.0, 26.0, 16.0, 21.0, 20.0, 23.0, 21.0, 22.0, 11.0, 11.0, 12.0, 6.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.995201110839844, -41.622337341308594, -40.249473571777344, -38.876609802246094, -37.503746032714844, -36.130882263183594, -34.758018493652344, -33.385154724121094, -32.012290954589844, -30.639427185058594, -29.266563415527344, -27.893699645996094, -26.520835876464844, -25.147972106933594, -23.77510643005371, -22.40224266052246, -21.029376983642578, -19.656513214111328, -18.283649444580078, -16.910785675048828, -15.537920951843262, -14.165057182312012, -12.792192459106445, -11.419328689575195, -10.046464920043945, -8.673601150512695, -7.300736904144287, -5.927872657775879, -4.555008888244629, -3.182145118713379, -1.8092803955078125, -0.4364166259765625, 0.9364509582519531, 2.3093149662017822, 3.6821789741516113, 5.0550432205200195, 6.4279069900512695, 7.8007707595825195, 9.173635482788086, 10.546499252319336, 11.919363021850586, 13.292226791381836, 14.665090560913086, 16.03795623779297, 17.41082000732422, 18.78368377685547, 20.15654754638672, 21.52941131591797, 22.90227508544922, 24.27513885498047, 25.64800262451172, 27.02086639404297, 28.39373016357422, 29.76659393310547, 31.13945960998535, 32.51232147216797, 33.88518524169922, 35.25804901123047, 36.63091278076172, 38.00377655029297, 39.37664031982422, 40.74950408935547, 42.12236785888672, 43.49523162841797, 44.868099212646484]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 8.0, 5.0, 5.0, 8.0, 10.0, 14.0, 21.0, 27.0, 20.0, 26.0, 43.0, 33.0, 31.0, 49.0, 43.0, 41.0, 51.0, 57.0, 45.0, 36.0, 47.0, 47.0, 33.0, 39.0, 38.0, 32.0, 26.0, 28.0, 24.0, 20.0, 19.0, 11.0, 14.0, 12.0, 10.0, 5.0, 7.0, 1.0, 5.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.171875, -5.01171875, -4.8515625, -4.69140625, -4.53125, -4.37109375, -4.2109375, -4.05078125, -3.890625, -3.73046875, -3.5703125, -3.41015625, -3.25, -3.08984375, -2.9296875, -2.76953125, -2.609375, -2.44921875, -2.2890625, -2.12890625, -1.96875, -1.80859375, -1.6484375, -1.48828125, -1.328125, -1.16796875, -1.0078125, -0.84765625, -0.6875, -0.52734375, -0.3671875, -0.20703125, -0.046875, 0.11328125, 0.2734375, 0.43359375, 0.59375, 0.75390625, 0.9140625, 1.07421875, 1.234375, 1.39453125, 1.5546875, 1.71484375, 1.875, 2.03515625, 2.1953125, 2.35546875, 2.515625, 2.67578125, 2.8359375, 2.99609375, 3.15625, 3.31640625, 3.4765625, 3.63671875, 3.796875, 3.95703125, 4.1171875, 4.27734375, 4.4375, 4.59765625, 4.7578125, 4.91796875, 5.078125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 0.0, 8.0, 0.0, 16.0, 12.0, 14.0, 18.0, 26.0, 29.0, 27.0, 43.0, 65.0, 117.0, 188.0, 365.0, 780.0, 1921.0, 5557.0, 20214.0, 103557.0, 853792.0, 2529189.0, 576429.0, 78044.0, 16410.0, 4536.0, 1538.0, 585.0, 300.0, 134.0, 102.0, 64.0, 40.0, 38.0, 27.0, 19.0, 16.0, 11.0, 11.0, 4.0, 9.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.65625, -10.2939453125, -9.931640625, -9.5693359375, -9.20703125, -8.8447265625, -8.482421875, -8.1201171875, -7.7578125, -7.3955078125, -7.033203125, -6.6708984375, -6.30859375, -5.9462890625, -5.583984375, -5.2216796875, -4.859375, -4.4970703125, -4.134765625, -3.7724609375, -3.41015625, -3.0478515625, -2.685546875, -2.3232421875, -1.9609375, -1.5986328125, -1.236328125, -0.8740234375, -0.51171875, -0.1494140625, 0.212890625, 0.5751953125, 0.9375, 1.2998046875, 1.662109375, 2.0244140625, 2.38671875, 2.7490234375, 3.111328125, 3.4736328125, 3.8359375, 4.1982421875, 4.560546875, 4.9228515625, 5.28515625, 5.6474609375, 6.009765625, 6.3720703125, 6.734375, 7.0966796875, 7.458984375, 7.8212890625, 8.18359375, 8.5458984375, 8.908203125, 9.2705078125, 9.6328125, 9.9951171875, 10.357421875, 10.7197265625, 11.08203125, 11.4443359375, 11.806640625, 12.1689453125, 12.53125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 14.0, 6.0, 11.0, 22.0, 36.0, 42.0, 95.0, 141.0, 239.0, 364.0, 508.0, 690.0, 647.0, 437.0, 325.0, 205.0, 89.0, 72.0, 50.0, 32.0, 21.0, 17.0, 8.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-21.859375, -21.3927001953125, -20.926025390625, -20.4593505859375, -19.99267578125, -19.5260009765625, -19.059326171875, -18.5926513671875, -18.1259765625, -17.6593017578125, -17.192626953125, -16.7259521484375, -16.25927734375, -15.7926025390625, -15.325927734375, -14.8592529296875, -14.392578125, -13.9259033203125, -13.459228515625, -12.9925537109375, -12.52587890625, -12.0592041015625, -11.592529296875, -11.1258544921875, -10.6591796875, -10.1925048828125, -9.725830078125, -9.2591552734375, -8.79248046875, -8.3258056640625, -7.859130859375, -7.3924560546875, -6.92578125, -6.4591064453125, -5.992431640625, -5.5257568359375, -5.05908203125, -4.5924072265625, -4.125732421875, -3.6590576171875, -3.1923828125, -2.7257080078125, -2.259033203125, -1.7923583984375, -1.32568359375, -0.8590087890625, -0.392333984375, 0.0743408203125, 0.541015625, 1.0076904296875, 1.474365234375, 1.9410400390625, 2.40771484375, 2.8743896484375, 3.341064453125, 3.8077392578125, 4.2744140625, 4.7410888671875, 5.207763671875, 5.6744384765625, 6.14111328125, 6.6077880859375, 7.074462890625, 7.5411376953125, 8.0078125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 7.0, 15.0, 28.0, 42.0, 60.0, 127.0, 194.0, 331.0, 663.0, 1999.0, 18775.0, 980433.0, 3126745.0, 59518.0, 3578.0, 852.0, 399.0, 209.0, 117.0, 74.0, 46.0, 21.0, 18.0, 11.0, 6.0, 6.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.359375, -25.268798828125, -24.17822265625, -23.087646484375, -21.9970703125, -20.906494140625, -19.81591796875, -18.725341796875, -17.634765625, -16.544189453125, -15.45361328125, -14.363037109375, -13.2724609375, -12.181884765625, -11.09130859375, -10.000732421875, -8.91015625, -7.819580078125, -6.72900390625, -5.638427734375, -4.5478515625, -3.457275390625, -2.36669921875, -1.276123046875, -0.185546875, 0.905029296875, 1.99560546875, 3.086181640625, 4.1767578125, 5.267333984375, 6.35791015625, 7.448486328125, 8.5390625, 9.629638671875, 10.72021484375, 11.810791015625, 12.9013671875, 13.991943359375, 15.08251953125, 16.173095703125, 17.263671875, 18.354248046875, 19.44482421875, 20.535400390625, 21.6259765625, 22.716552734375, 23.80712890625, 24.897705078125, 25.98828125, 27.078857421875, 28.16943359375, 29.260009765625, 30.3505859375, 31.441162109375, 32.53173828125, 33.622314453125, 34.712890625, 35.803466796875, 36.89404296875, 37.984619140625, 39.0751953125, 40.165771484375, 41.25634765625, 42.346923828125, 43.4375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 23.0, 51.0, 82.0, 165.0, 214.0, 203.0, 130.0, 78.0, 29.0, 15.0, 6.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.54156494140625, -108.14229583740234, -104.7430191040039, -101.34375, -97.9444808959961, -94.54521179199219, -91.14593505859375, -87.74666595458984, -84.34739685058594, -80.94812774658203, -77.5488510131836, -74.14958190917969, -70.75031280517578, -67.35104370117188, -63.95176696777344, -60.55249786376953, -57.153221130371094, -53.75394821166992, -50.354679107666016, -46.955406188964844, -43.55613708496094, -40.156864166259766, -36.757591247558594, -33.35832214355469, -29.959049224853516, -26.559778213500977, -23.160507202148438, -19.761234283447266, -16.361963272094727, -12.962692260742188, -9.563419342041016, -6.164148330688477, -2.7648849487304688, 0.6343865394592285, 4.033658027648926, 7.432929992675781, 10.83220100402832, 14.23147201538086, 17.63074493408203, 21.03001594543457, 24.42928695678711, 27.82855796813965, 31.227828979492188, 34.62710189819336, 38.02637481689453, 41.42564392089844, 44.82491683959961, 48.22418975830078, 51.62345886230469, 55.02273178100586, 58.422000885009766, 61.82127380371094, 65.22054290771484, 68.61981201171875, 72.01908874511719, 75.4183578491211, 78.817626953125, 82.2168960571289, 85.61617279052734, 89.01544189453125, 92.41471099853516, 95.81398010253906, 99.2132568359375, 102.6125259399414, 106.01180267333984]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 7.0, 1.0, 5.0, 6.0, 8.0, 5.0, 14.0, 15.0, 15.0, 13.0, 22.0, 16.0, 22.0, 26.0, 30.0, 21.0, 30.0, 33.0, 44.0, 38.0, 40.0, 52.0, 52.0, 47.0, 44.0, 46.0, 28.0, 41.0, 41.0, 33.0, 22.0, 24.0, 26.0, 18.0, 11.0, 20.0, 19.0, 11.0, 14.0, 15.0, 4.0, 8.0, 5.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.28644943237305, -33.21458435058594, -32.14271545410156, -31.07084846496582, -29.998981475830078, -28.92711639404297, -27.855249404907227, -26.783382415771484, -25.711515426635742, -24.6396484375, -23.567781448364258, -22.495914459228516, -21.424049377441406, -20.35218048095703, -19.280315399169922, -18.20844841003418, -17.136581420898438, -16.064714431762695, -14.992847442626953, -13.920981407165527, -12.849114418029785, -11.777247428894043, -10.705381393432617, -9.633514404296875, -8.561647415161133, -7.489780426025391, -6.417913913726807, -5.346047401428223, -4.2741804122924805, -3.2023134231567383, -2.1304469108581543, -1.0585803985595703, 0.013286590576171875, 1.085153341293335, 2.157020092010498, 3.228886842727661, 4.300753593444824, 5.372620582580566, 6.44448709487915, 7.516353607177734, 8.588220596313477, 9.660087585449219, 10.731954574584961, 11.803820610046387, 12.875687599182129, 13.947554588317871, 15.019420623779297, 16.09128761291504, 17.16315460205078, 18.235021591186523, 19.306888580322266, 20.378755569458008, 21.45062255859375, 22.52248764038086, 23.5943546295166, 24.666221618652344, 25.738088607788086, 26.809955596923828, 27.88182258605957, 28.953689575195312, 30.025554656982422, 31.097423553466797, 32.169288635253906, 33.24115753173828, 34.31302261352539]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 2.0, 2.0, 7.0, 6.0, 6.0, 5.0, 8.0, 2.0, 14.0, 13.0, 14.0, 22.0, 18.0, 24.0, 28.0, 31.0, 21.0, 25.0, 28.0, 33.0, 38.0, 44.0, 45.0, 40.0, 39.0, 43.0, 43.0, 45.0, 35.0, 23.0, 39.0, 40.0, 32.0, 28.0, 23.0, 19.0, 12.0, 21.0, 21.0, 15.0, 7.0, 7.0, 14.0, 5.0, 4.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.783203125, -3.646759033203125, -3.51031494140625, -3.373870849609375, -3.2374267578125, -3.100982666015625, -2.96453857421875, -2.828094482421875, -2.691650390625, -2.555206298828125, -2.41876220703125, -2.282318115234375, -2.1458740234375, -2.009429931640625, -1.87298583984375, -1.736541748046875, -1.60009765625, -1.463653564453125, -1.32720947265625, -1.190765380859375, -1.0543212890625, -0.917877197265625, -0.78143310546875, -0.644989013671875, -0.508544921875, -0.372100830078125, -0.23565673828125, -0.099212646484375, 0.0372314453125, 0.173675537109375, 0.31011962890625, 0.446563720703125, 0.5830078125, 0.719451904296875, 0.85589599609375, 0.992340087890625, 1.1287841796875, 1.265228271484375, 1.40167236328125, 1.538116455078125, 1.674560546875, 1.811004638671875, 1.94744873046875, 2.083892822265625, 2.2203369140625, 2.356781005859375, 2.49322509765625, 2.629669189453125, 2.76611328125, 2.902557373046875, 3.03900146484375, 3.175445556640625, 3.3118896484375, 3.448333740234375, 3.58477783203125, 3.721221923828125, 3.857666015625, 3.994110107421875, 4.13055419921875, 4.266998291015625, 4.4034423828125, 4.539886474609375, 4.67633056640625, 4.812774658203125, 4.94921875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 6.0, 2.0, 8.0, 14.0, 13.0, 20.0, 24.0, 44.0, 44.0, 88.0, 163.0, 326.0, 615.0, 1307.0, 2775.0, 5815.0, 12159.0, 24187.0, 45101.0, 79297.0, 125205.0, 178592.0, 195367.0, 152046.0, 99849.0, 60311.0, 32331.0, 16819.0, 8300.0, 4012.0, 1873.0, 855.0, 411.0, 204.0, 107.0, 85.0, 52.0, 31.0, 20.0, 19.0, 13.0, 12.0, 10.0, 9.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.275390625, -3.176849365234375, -3.07830810546875, -2.979766845703125, -2.8812255859375, -2.782684326171875, -2.68414306640625, -2.585601806640625, -2.487060546875, -2.388519287109375, -2.28997802734375, -2.191436767578125, -2.0928955078125, -1.994354248046875, -1.89581298828125, -1.797271728515625, -1.69873046875, -1.600189208984375, -1.50164794921875, -1.403106689453125, -1.3045654296875, -1.206024169921875, -1.10748291015625, -1.008941650390625, -0.910400390625, -0.811859130859375, -0.71331787109375, -0.614776611328125, -0.5162353515625, -0.417694091796875, -0.31915283203125, -0.220611572265625, -0.1220703125, -0.023529052734375, 0.07501220703125, 0.173553466796875, 0.2720947265625, 0.370635986328125, 0.46917724609375, 0.567718505859375, 0.666259765625, 0.764801025390625, 0.86334228515625, 0.961883544921875, 1.0604248046875, 1.158966064453125, 1.25750732421875, 1.356048583984375, 1.45458984375, 1.553131103515625, 1.65167236328125, 1.750213623046875, 1.8487548828125, 1.947296142578125, 2.04583740234375, 2.144378662109375, 2.242919921875, 2.341461181640625, 2.44000244140625, 2.538543701171875, 2.6370849609375, 2.735626220703125, 2.83416748046875, 2.932708740234375, 3.03125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 6.0, 3.0, 15.0, 6.0, 8.0, 12.0, 10.0, 17.0, 20.0, 17.0, 18.0, 24.0, 30.0, 23.0, 46.0, 32.0, 32.0, 34.0, 38.0, 47.0, 45.0, 1067.0, 45.0, 33.0, 44.0, 31.0, 28.0, 32.0, 27.0, 31.0, 26.0, 23.0, 19.0, 22.0, 22.0, 17.0, 15.0, 7.0, 10.0, 3.0, 7.0, 5.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.1484375, -4.02783203125, -3.9072265625, -3.78662109375, -3.666015625, -3.54541015625, -3.4248046875, -3.30419921875, -3.18359375, -3.06298828125, -2.9423828125, -2.82177734375, -2.701171875, -2.58056640625, -2.4599609375, -2.33935546875, -2.21875, -2.09814453125, -1.9775390625, -1.85693359375, -1.736328125, -1.61572265625, -1.4951171875, -1.37451171875, -1.25390625, -1.13330078125, -1.0126953125, -0.89208984375, -0.771484375, -0.65087890625, -0.5302734375, -0.40966796875, -0.2890625, -0.16845703125, -0.0478515625, 0.07275390625, 0.193359375, 0.31396484375, 0.4345703125, 0.55517578125, 0.67578125, 0.79638671875, 0.9169921875, 1.03759765625, 1.158203125, 1.27880859375, 1.3994140625, 1.52001953125, 1.640625, 1.76123046875, 1.8818359375, 2.00244140625, 2.123046875, 2.24365234375, 2.3642578125, 2.48486328125, 2.60546875, 2.72607421875, 2.8466796875, 2.96728515625, 3.087890625, 3.20849609375, 3.3291015625, 3.44970703125, 3.5703125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 3.0, 9.0, 7.0, 20.0, 24.0, 36.0, 45.0, 81.0, 95.0, 118.0, 195.0, 272.0, 335.0, 511.0, 704.0, 1045.0, 1523.0, 2106.0, 2979.0, 4290.0, 5937.0, 8499.0, 12238.0, 19028.0, 38167.0, 228467.0, 1586491.0, 103137.0, 27892.0, 16164.0, 10995.0, 7451.0, 5404.0, 3759.0, 2666.0, 1898.0, 1268.0, 916.0, 698.0, 496.0, 351.0, 239.0, 183.0, 102.0, 66.0, 70.0, 40.0, 33.0, 16.0, 14.0, 15.0, 9.0, 10.0, 3.0, 4.0, 4.0, 5.0], "bins": [-3.458984375, -3.355194091796875, -3.25140380859375, -3.147613525390625, -3.0438232421875, -2.940032958984375, -2.83624267578125, -2.732452392578125, -2.628662109375, -2.524871826171875, -2.42108154296875, -2.317291259765625, -2.2135009765625, -2.109710693359375, -2.00592041015625, -1.902130126953125, -1.79833984375, -1.694549560546875, -1.59075927734375, -1.486968994140625, -1.3831787109375, -1.279388427734375, -1.17559814453125, -1.071807861328125, -0.968017578125, -0.864227294921875, -0.76043701171875, -0.656646728515625, -0.5528564453125, -0.449066162109375, -0.34527587890625, -0.241485595703125, -0.1376953125, -0.033905029296875, 0.06988525390625, 0.173675537109375, 0.2774658203125, 0.381256103515625, 0.48504638671875, 0.588836669921875, 0.692626953125, 0.796417236328125, 0.90020751953125, 1.003997802734375, 1.1077880859375, 1.211578369140625, 1.31536865234375, 1.419158935546875, 1.52294921875, 1.626739501953125, 1.73052978515625, 1.834320068359375, 1.9381103515625, 2.041900634765625, 2.14569091796875, 2.249481201171875, 2.353271484375, 2.457061767578125, 2.56085205078125, 2.664642333984375, 2.7684326171875, 2.872222900390625, 2.97601318359375, 3.079803466796875, 3.18359375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 2.0, 1.0, 7.0, 9.0, 7.0, 12.0, 20.0, 25.0, 24.0, 32.0, 31.0, 40.0, 41.0, 41.0, 53.0, 45.0, 51.0, 50.0, 54.0, 57.0, 47.0, 45.0, 39.0, 40.0, 38.0, 26.0, 30.0, 28.0, 28.0, 16.0, 15.0, 8.0, 12.0, 9.0, 4.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2357177734375, -0.22881317138671875, -0.2219085693359375, -0.21500396728515625, -0.208099365234375, -0.20119476318359375, -0.1942901611328125, -0.18738555908203125, -0.18048095703125, -0.17357635498046875, -0.1666717529296875, -0.15976715087890625, -0.152862548828125, -0.14595794677734375, -0.1390533447265625, -0.13214874267578125, -0.125244140625, -0.11833953857421875, -0.1114349365234375, -0.10453033447265625, -0.097625732421875, -0.09072113037109375, -0.0838165283203125, -0.07691192626953125, -0.07000732421875, -0.06310272216796875, -0.0561981201171875, -0.04929351806640625, -0.042388916015625, -0.03548431396484375, -0.0285797119140625, -0.02167510986328125, -0.0147705078125, -0.00786590576171875, -0.0009613037109375, 0.00594329833984375, 0.012847900390625, 0.01975250244140625, 0.0266571044921875, 0.03356170654296875, 0.04046630859375, 0.04737091064453125, 0.0542755126953125, 0.06118011474609375, 0.068084716796875, 0.07498931884765625, 0.0818939208984375, 0.08879852294921875, 0.095703125, 0.10260772705078125, 0.1095123291015625, 0.11641693115234375, 0.123321533203125, 0.13022613525390625, 0.1371307373046875, 0.14403533935546875, 0.15093994140625, 0.15784454345703125, 0.1647491455078125, 0.17165374755859375, 0.178558349609375, 0.18546295166015625, 0.1923675537109375, 0.19927215576171875, 0.2061767578125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 11.0, 10.0, 15.0, 22.0, 25.0, 35.0, 42.0, 53.0, 91.0, 134.0, 230.0, 368.0, 657.0, 2245.0, 104288.0, 919884.0, 17864.0, 1168.0, 534.0, 284.0, 186.0, 130.0, 60.0, 54.0, 42.0, 32.0, 22.0, 14.0, 13.0, 7.0, 4.0, 5.0, 3.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.352325439453125, -3.23394775390625, -3.115570068359375, -2.9971923828125, -2.878814697265625, -2.76043701171875, -2.642059326171875, -2.523681640625, -2.405303955078125, -2.28692626953125, -2.168548583984375, -2.0501708984375, -1.931793212890625, -1.81341552734375, -1.695037841796875, -1.57666015625, -1.458282470703125, -1.33990478515625, -1.221527099609375, -1.1031494140625, -0.984771728515625, -0.86639404296875, -0.748016357421875, -0.629638671875, -0.511260986328125, -0.39288330078125, -0.274505615234375, -0.1561279296875, -0.037750244140625, 0.08062744140625, 0.199005126953125, 0.3173828125, 0.435760498046875, 0.55413818359375, 0.672515869140625, 0.7908935546875, 0.909271240234375, 1.02764892578125, 1.146026611328125, 1.264404296875, 1.382781982421875, 1.50115966796875, 1.619537353515625, 1.7379150390625, 1.856292724609375, 1.97467041015625, 2.093048095703125, 2.21142578125, 2.329803466796875, 2.44818115234375, 2.566558837890625, 2.6849365234375, 2.803314208984375, 2.92169189453125, 3.040069580078125, 3.158447265625, 3.276824951171875, 3.39520263671875, 3.513580322265625, 3.6319580078125, 3.750335693359375, 3.86871337890625, 3.987091064453125, 4.10546875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 8.0, 26.0, 87.0, 235.0, 370.0, 200.0, 57.0, 17.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8957417011260986, -1.7803415060043335, -1.6649413108825684, -1.5495411157608032, -1.434140920639038, -1.318740725517273, -1.2033405303955078, -1.0879403352737427, -0.9725401401519775, -0.8571399450302124, -0.7417397499084473, -0.6263395547866821, -0.510939359664917, -0.39553916454315186, -0.2801389694213867, -0.16473877429962158, -0.049338579177856445, 0.06606161594390869, 0.18146181106567383, 0.29686200618743896, 0.4122622013092041, 0.5276623964309692, 0.6430625915527344, 0.7584627866744995, 0.8738629817962646, 0.9892631769180298, 1.104663372039795, 1.22006356716156, 1.3354637622833252, 1.4508639574050903, 1.5662641525268555, 1.6816643476486206, 1.7970647811889648, 1.91246497631073, 2.027865171432495, 2.1432652473449707, 2.2586655616760254, 2.37406587600708, 2.4894659519195557, 2.6048660278320312, 2.720266342163086, 2.8356666564941406, 2.951066732406616, 3.066466808319092, 3.1818671226501465, 3.297267436981201, 3.4126675128936768, 3.5280675888061523, 3.643467903137207, 3.7588682174682617, 3.8742682933807373, 3.989668369293213, 4.105068683624268, 4.220468997955322, 4.335868835449219, 4.451269149780273, 4.566669464111328, 4.682069778442383, 4.7974700927734375, 4.912869930267334, 5.028270244598389, 5.143670558929443, 5.25907039642334, 5.3744707107543945, 5.489871025085449]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 4.0, 4.0, 3.0, 16.0, 8.0, 20.0, 19.0, 30.0, 30.0, 39.0, 40.0, 40.0, 72.0, 49.0, 45.0, 47.0, 60.0, 55.0, 51.0, 46.0, 52.0, 40.0, 41.0, 44.0, 23.0, 27.0, 28.0, 16.0, 13.0, 15.0, 5.0, 7.0, 0.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2652013301849365, -1.2211066484451294, -1.1770119667053223, -1.1329174041748047, -1.0888227224349976, -1.0447280406951904, -1.0006334781646729, -0.9565387964248657, -0.9124441146850586, -0.8683494329452515, -0.8242548108100891, -0.7801601886749268, -0.7360655069351196, -0.6919708251953125, -0.6478762030601501, -0.6037815809249878, -0.5596868991851807, -0.5155922174453735, -0.4714975953102112, -0.42740294337272644, -0.3833082914352417, -0.33921363949775696, -0.2951189875602722, -0.2510243356227875, -0.20692968368530273, -0.162835031747818, -0.11874037981033325, -0.07464572787284851, -0.03055107593536377, 0.013543576002120972, 0.05763822793960571, 0.10173287987709045, 0.1458275318145752, 0.18992218375205994, 0.23401683568954468, 0.2781114876270294, 0.32220613956451416, 0.3663007915019989, 0.41039544343948364, 0.4544900953769684, 0.4985847473144531, 0.5426794290542603, 0.5867740511894226, 0.630868673324585, 0.6749633550643921, 0.7190580368041992, 0.7631526589393616, 0.8072472810745239, 0.851341962814331, 0.8954366445541382, 0.9395312666893005, 0.9836258888244629, 1.02772057056427, 1.0718152523040771, 1.1159098148345947, 1.1600044965744019, 1.204099178314209, 1.2481938600540161, 1.2922885417938232, 1.3363831043243408, 1.380477786064148, 1.424572467803955, 1.4686670303344727, 1.5127617120742798, 1.556856393814087]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 6.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 7.0, 11.0, 11.0, 15.0, 16.0, 14.0, 22.0, 23.0, 23.0, 26.0, 36.0, 40.0, 44.0, 44.0, 38.0, 40.0, 31.0, 53.0, 41.0, 44.0, 42.0, 39.0, 38.0, 34.0, 24.0, 33.0, 30.0, 23.0, 25.0, 19.0, 21.0, 13.0, 11.0, 7.0, 5.0, 11.0, 5.0, 3.0, 4.0, 4.0, 2.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.5390625, -4.39581298828125, -4.2525634765625, -4.10931396484375, -3.966064453125, -3.82281494140625, -3.6795654296875, -3.53631591796875, -3.39306640625, -3.24981689453125, -3.1065673828125, -2.96331787109375, -2.820068359375, -2.67681884765625, -2.5335693359375, -2.39031982421875, -2.2470703125, -2.10382080078125, -1.9605712890625, -1.81732177734375, -1.674072265625, -1.53082275390625, -1.3875732421875, -1.24432373046875, -1.10107421875, -0.95782470703125, -0.8145751953125, -0.67132568359375, -0.528076171875, -0.38482666015625, -0.2415771484375, -0.09832763671875, 0.044921875, 0.18817138671875, 0.3314208984375, 0.47467041015625, 0.617919921875, 0.76116943359375, 0.9044189453125, 1.04766845703125, 1.19091796875, 1.33416748046875, 1.4774169921875, 1.62066650390625, 1.763916015625, 1.90716552734375, 2.0504150390625, 2.19366455078125, 2.3369140625, 2.48016357421875, 2.6234130859375, 2.76666259765625, 2.909912109375, 3.05316162109375, 3.1964111328125, 3.33966064453125, 3.48291015625, 3.62615966796875, 3.7694091796875, 3.91265869140625, 4.055908203125, 4.19915771484375, 4.3424072265625, 4.48565673828125, 4.62890625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 8.0, 9.0, 13.0, 21.0, 32.0, 35.0, 72.0, 76.0, 131.0, 241.0, 366.0, 537.0, 842.0, 1514.0, 2680.0, 4557.0, 7962.0, 14270.0, 25416.0, 43956.0, 74553.0, 122276.0, 203584.0, 219381.0, 132561.0, 80887.0, 48103.0, 27991.0, 15552.0, 8655.0, 5084.0, 2864.0, 1689.0, 1007.0, 603.0, 376.0, 222.0, 131.0, 92.0, 68.0, 34.0, 32.0, 19.0, 17.0, 12.0, 5.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.837890625, -3.71826171875, -3.5986328125, -3.47900390625, -3.359375, -3.23974609375, -3.1201171875, -3.00048828125, -2.880859375, -2.76123046875, -2.6416015625, -2.52197265625, -2.40234375, -2.28271484375, -2.1630859375, -2.04345703125, -1.923828125, -1.80419921875, -1.6845703125, -1.56494140625, -1.4453125, -1.32568359375, -1.2060546875, -1.08642578125, -0.966796875, -0.84716796875, -0.7275390625, -0.60791015625, -0.48828125, -0.36865234375, -0.2490234375, -0.12939453125, -0.009765625, 0.10986328125, 0.2294921875, 0.34912109375, 0.46875, 0.58837890625, 0.7080078125, 0.82763671875, 0.947265625, 1.06689453125, 1.1865234375, 1.30615234375, 1.42578125, 1.54541015625, 1.6650390625, 1.78466796875, 1.904296875, 2.02392578125, 2.1435546875, 2.26318359375, 2.3828125, 2.50244140625, 2.6220703125, 2.74169921875, 2.861328125, 2.98095703125, 3.1005859375, 3.22021484375, 3.33984375, 3.45947265625, 3.5791015625, 3.69873046875, 3.818359375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 8.0, 5.0, 8.0, 5.0, 12.0, 22.0, 19.0, 32.0, 36.0, 25.0, 44.0, 40.0, 58.0, 53.0, 96.0, 133.0, 255.0, 1443.0, 195.0, 121.0, 72.0, 57.0, 55.0, 54.0, 38.0, 34.0, 27.0, 17.0, 20.0, 12.0, 15.0, 10.0, 7.0, 5.0, 4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7890625, -15.2110595703125, -14.633056640625, -14.0550537109375, -13.47705078125, -12.8990478515625, -12.321044921875, -11.7430419921875, -11.1650390625, -10.5870361328125, -10.009033203125, -9.4310302734375, -8.85302734375, -8.2750244140625, -7.697021484375, -7.1190185546875, -6.541015625, -5.9630126953125, -5.385009765625, -4.8070068359375, -4.22900390625, -3.6510009765625, -3.072998046875, -2.4949951171875, -1.9169921875, -1.3389892578125, -0.760986328125, -0.1829833984375, 0.39501953125, 0.9730224609375, 1.551025390625, 2.1290283203125, 2.70703125, 3.2850341796875, 3.863037109375, 4.4410400390625, 5.01904296875, 5.5970458984375, 6.175048828125, 6.7530517578125, 7.3310546875, 7.9090576171875, 8.487060546875, 9.0650634765625, 9.64306640625, 10.2210693359375, 10.799072265625, 11.3770751953125, 11.955078125, 12.5330810546875, 13.111083984375, 13.6890869140625, 14.26708984375, 14.8450927734375, 15.423095703125, 16.0010986328125, 16.5791015625, 17.1571044921875, 17.735107421875, 18.3131103515625, 18.89111328125, 19.4691162109375, 20.047119140625, 20.6251220703125, 21.203125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 8.0, 14.0, 24.0, 41.0, 106.0, 205.0, 679.0, 5440.0, 3126956.0, 10998.0, 765.0, 260.0, 113.0, 46.0, 29.0, 13.0, 9.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.0, -105.8466796875, -102.693359375, -99.5400390625, -96.38671875, -93.2333984375, -90.080078125, -86.9267578125, -83.7734375, -80.6201171875, -77.466796875, -74.3134765625, -71.16015625, -68.0068359375, -64.853515625, -61.7001953125, -58.546875, -55.3935546875, -52.240234375, -49.0869140625, -45.93359375, -42.7802734375, -39.626953125, -36.4736328125, -33.3203125, -30.1669921875, -27.013671875, -23.8603515625, -20.70703125, -17.5537109375, -14.400390625, -11.2470703125, -8.09375, -4.9404296875, -1.787109375, 1.3662109375, 4.51953125, 7.6728515625, 10.826171875, 13.9794921875, 17.1328125, 20.2861328125, 23.439453125, 26.5927734375, 29.74609375, 32.8994140625, 36.052734375, 39.2060546875, 42.359375, 45.5126953125, 48.666015625, 51.8193359375, 54.97265625, 58.1259765625, 61.279296875, 64.4326171875, 67.5859375, 70.7392578125, 73.892578125, 77.0458984375, 80.19921875, 83.3525390625, 86.505859375, 89.6591796875, 92.8125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 46.0, 972.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1358.526123046875, -1335.1968994140625, -1311.86767578125, -1288.538330078125, -1265.2091064453125, -1241.8798828125, -1218.5506591796875, -1195.2213134765625, -1171.89208984375, -1148.5628662109375, -1125.233642578125, -1101.904296875, -1078.5750732421875, -1055.245849609375, -1031.9166259765625, -1008.5873413085938, -985.258056640625, -961.9288330078125, -938.5995483398438, -915.2703247070312, -891.9410400390625, -868.61181640625, -845.2825317382812, -821.9533081054688, -798.6240844726562, -775.2948608398438, -751.965576171875, -728.6363525390625, -705.3070678710938, -681.9778442382812, -658.6485595703125, -635.3193359375, -611.9901123046875, -588.660888671875, -565.3316040039062, -542.0023803710938, -518.673095703125, -495.3438415527344, -472.01458740234375, -448.68536376953125, -425.3560791015625, -402.0268249511719, -378.69757080078125, -355.3683166503906, -332.0390625, -308.7098083496094, -285.38055419921875, -262.05133056640625, -238.7220458984375, -215.39279174804688, -192.06353759765625, -168.73428344726562, -145.405029296875, -122.0757827758789, -98.74653625488281, -75.41728210449219, -52.08802795410156, -28.75877571105957, -5.429523468017578, 17.89972686767578, 41.228981018066406, 64.55823516845703, 87.88748168945312, 111.21673583984375, 134.54598999023438]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 8.0, 8.0, 7.0, 16.0, 17.0, 27.0, 22.0, 16.0, 30.0, 27.0, 34.0, 28.0, 41.0, 44.0, 47.0, 44.0, 49.0, 27.0, 42.0, 55.0, 54.0, 42.0, 42.0, 41.0, 31.0, 23.0, 28.0, 21.0, 22.0, 20.0, 13.0, 21.0, 10.0, 10.0, 10.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.598960876464844, -46.9704475402832, -45.34193420410156, -43.713417053222656, -42.084903717041016, -40.456390380859375, -38.827877044677734, -37.199363708496094, -35.57084655761719, -33.94233322143555, -32.313819885253906, -30.685304641723633, -29.05678939819336, -27.42827606201172, -25.799762725830078, -24.171249389648438, -22.542736053466797, -20.914222717285156, -19.285707473754883, -17.657194137573242, -16.02867889404297, -14.400165557861328, -12.771652221679688, -11.14313793182373, -9.514623641967773, -7.886109352111816, -6.257595539093018, -4.629081726074219, -3.0005674362182617, -1.3720531463623047, 0.25646018981933594, 1.884974479675293, 3.5134925842285156, 5.142006874084473, 6.7705206871032715, 8.39903450012207, 10.027548789978027, 11.656063079833984, 13.284576416015625, 14.913090705871582, 16.54160499572754, 18.17011833190918, 19.798633575439453, 21.427146911621094, 23.055660247802734, 24.684175491333008, 26.31268882751465, 27.941204071044922, 29.569717407226562, 31.198230743408203, 32.826744079589844, 34.45526123046875, 36.08377456665039, 37.71228790283203, 39.34080123901367, 40.96931457519531, 42.59783172607422, 44.22634506225586, 45.8548583984375, 47.483375549316406, 49.11188888549805, 50.74040222167969, 52.36891555786133, 53.99742889404297, 55.62594223022461]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 6.0, 5.0, 8.0, 5.0, 7.0, 8.0, 15.0, 19.0, 20.0, 27.0, 25.0, 41.0, 47.0, 42.0, 46.0, 69.0, 67.0, 66.0, 49.0, 59.0, 48.0, 44.0, 36.0, 48.0, 26.0, 33.0, 33.0, 24.0, 25.0, 20.0, 4.0, 13.0, 5.0, 9.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.65625, -7.4493408203125, -7.242431640625, -7.0355224609375, -6.82861328125, -6.6217041015625, -6.414794921875, -6.2078857421875, -6.0009765625, -5.7940673828125, -5.587158203125, -5.3802490234375, -5.17333984375, -4.9664306640625, -4.759521484375, -4.5526123046875, -4.345703125, -4.1387939453125, -3.931884765625, -3.7249755859375, -3.51806640625, -3.3111572265625, -3.104248046875, -2.8973388671875, -2.6904296875, -2.4835205078125, -2.276611328125, -2.0697021484375, -1.86279296875, -1.6558837890625, -1.448974609375, -1.2420654296875, -1.03515625, -0.8282470703125, -0.621337890625, -0.4144287109375, -0.20751953125, -0.0006103515625, 0.206298828125, 0.4132080078125, 0.6201171875, 0.8270263671875, 1.033935546875, 1.2408447265625, 1.44775390625, 1.6546630859375, 1.861572265625, 2.0684814453125, 2.275390625, 2.4822998046875, 2.689208984375, 2.8961181640625, 3.10302734375, 3.3099365234375, 3.516845703125, 3.7237548828125, 3.9306640625, 4.1375732421875, 4.344482421875, 4.5513916015625, 4.75830078125, 4.9652099609375, 5.172119140625, 5.3790283203125, 5.5859375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 4.0, 6.0, 15.0, 17.0, 24.0, 20.0, 33.0, 50.0, 64.0, 83.0, 156.0, 263.0, 506.0, 1104.0, 2682.0, 7574.0, 25993.0, 122962.0, 817148.0, 2334909.0, 733318.0, 111286.0, 24370.0, 7105.0, 2343.0, 1009.0, 463.0, 225.0, 162.0, 102.0, 75.0, 46.0, 39.0, 32.0, 26.0, 15.0, 9.0, 9.0, 10.0, 4.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.8359375, -9.490478515625, -9.14501953125, -8.799560546875, -8.4541015625, -8.108642578125, -7.76318359375, -7.417724609375, -7.072265625, -6.726806640625, -6.38134765625, -6.035888671875, -5.6904296875, -5.344970703125, -4.99951171875, -4.654052734375, -4.30859375, -3.963134765625, -3.61767578125, -3.272216796875, -2.9267578125, -2.581298828125, -2.23583984375, -1.890380859375, -1.544921875, -1.199462890625, -0.85400390625, -0.508544921875, -0.1630859375, 0.182373046875, 0.52783203125, 0.873291015625, 1.21875, 1.564208984375, 1.90966796875, 2.255126953125, 2.6005859375, 2.946044921875, 3.29150390625, 3.636962890625, 3.982421875, 4.327880859375, 4.67333984375, 5.018798828125, 5.3642578125, 5.709716796875, 6.05517578125, 6.400634765625, 6.74609375, 7.091552734375, 7.43701171875, 7.782470703125, 8.1279296875, 8.473388671875, 8.81884765625, 9.164306640625, 9.509765625, 9.855224609375, 10.20068359375, 10.546142578125, 10.8916015625, 11.237060546875, 11.58251953125, 11.927978515625, 12.2734375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 11.0, 15.0, 12.0, 30.0, 44.0, 59.0, 93.0, 126.0, 203.0, 299.0, 440.0, 535.0, 604.0, 490.0, 348.0, 247.0, 163.0, 111.0, 87.0, 52.0, 39.0, 14.0, 19.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-17.75, -17.33056640625, -16.9111328125, -16.49169921875, -16.072265625, -15.65283203125, -15.2333984375, -14.81396484375, -14.39453125, -13.97509765625, -13.5556640625, -13.13623046875, -12.716796875, -12.29736328125, -11.8779296875, -11.45849609375, -11.0390625, -10.61962890625, -10.2001953125, -9.78076171875, -9.361328125, -8.94189453125, -8.5224609375, -8.10302734375, -7.68359375, -7.26416015625, -6.8447265625, -6.42529296875, -6.005859375, -5.58642578125, -5.1669921875, -4.74755859375, -4.328125, -3.90869140625, -3.4892578125, -3.06982421875, -2.650390625, -2.23095703125, -1.8115234375, -1.39208984375, -0.97265625, -0.55322265625, -0.1337890625, 0.28564453125, 0.705078125, 1.12451171875, 1.5439453125, 1.96337890625, 2.3828125, 2.80224609375, 3.2216796875, 3.64111328125, 4.060546875, 4.47998046875, 4.8994140625, 5.31884765625, 5.73828125, 6.15771484375, 6.5771484375, 6.99658203125, 7.416015625, 7.83544921875, 8.2548828125, 8.67431640625, 9.09375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 7.0, 5.0, 9.0, 18.0, 20.0, 35.0, 43.0, 92.0, 148.0, 240.0, 505.0, 1484.0, 12642.0, 779865.0, 3347412.0, 47480.0, 2872.0, 695.0, 296.0, 136.0, 90.0, 63.0, 41.0, 31.0, 15.0, 14.0, 11.0, 4.0, 1.0, 6.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.09375, -25.8154296875, -24.537109375, -23.2587890625, -21.98046875, -20.7021484375, -19.423828125, -18.1455078125, -16.8671875, -15.5888671875, -14.310546875, -13.0322265625, -11.75390625, -10.4755859375, -9.197265625, -7.9189453125, -6.640625, -5.3623046875, -4.083984375, -2.8056640625, -1.52734375, -0.2490234375, 1.029296875, 2.3076171875, 3.5859375, 4.8642578125, 6.142578125, 7.4208984375, 8.69921875, 9.9775390625, 11.255859375, 12.5341796875, 13.8125, 15.0908203125, 16.369140625, 17.6474609375, 18.92578125, 20.2041015625, 21.482421875, 22.7607421875, 24.0390625, 25.3173828125, 26.595703125, 27.8740234375, 29.15234375, 30.4306640625, 31.708984375, 32.9873046875, 34.265625, 35.5439453125, 36.822265625, 38.1005859375, 39.37890625, 40.6572265625, 41.935546875, 43.2138671875, 44.4921875, 45.7705078125, 47.048828125, 48.3271484375, 49.60546875, 50.8837890625, 52.162109375, 53.4404296875, 54.71875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 18.0, 368.0, 582.0, 45.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-364.5497741699219, -351.1344909667969, -337.71923828125, -324.303955078125, -310.8887023925781, -297.4734191894531, -284.05816650390625, -270.64288330078125, -257.22760009765625, -243.8123321533203, -230.39706420898438, -216.98178100585938, -203.56651306152344, -190.1512451171875, -176.73597717285156, -163.32070922851562, -149.9054412841797, -136.49017333984375, -123.07489776611328, -109.65962982177734, -96.24435424804688, -82.82908630371094, -69.413818359375, -55.99854278564453, -42.583274841308594, -29.16800308227539, -15.75273323059082, -2.33746337890625, 11.077808380126953, 24.493080139160156, 37.908348083496094, 51.32362365722656, 64.7388916015625, 78.15415954589844, 91.5694351196289, 104.98470306396484, 118.39997863769531, 131.81524658203125, 145.2305145263672, 158.64578247070312, 172.06106567382812, 185.47633361816406, 198.8916015625, 212.306884765625, 225.72215270996094, 239.13742065429688, 252.5526885986328, 265.96795654296875, 279.38323974609375, 292.79852294921875, 306.2137756347656, 319.6290588378906, 333.0443115234375, 346.4595947265625, 359.8748779296875, 373.2901306152344, 386.70538330078125, 400.12066650390625, 413.5359191894531, 426.9512023925781, 440.366455078125, 453.78173828125, 467.197021484375, 480.6122741699219, 494.0275573730469]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 7.0, 9.0, 6.0, 5.0, 9.0, 12.0, 17.0, 20.0, 34.0, 38.0, 35.0, 54.0, 53.0, 51.0, 60.0, 60.0, 66.0, 67.0, 51.0, 66.0, 49.0, 53.0, 36.0, 31.0, 34.0, 16.0, 15.0, 24.0, 14.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.56044387817383, -37.8614501953125, -36.16245651245117, -34.463462829589844, -32.76446533203125, -31.065473556518555, -29.366477966308594, -27.667484283447266, -25.968490600585938, -24.26949691772461, -22.57050323486328, -20.87150764465332, -19.172513961791992, -17.473520278930664, -15.77452564239502, -14.075531005859375, -12.376537322998047, -10.677543640136719, -8.978549003601074, -7.279554843902588, -5.580560684204102, -3.8815670013427734, -2.182572364807129, -0.4835777282714844, 1.2154159545898438, 2.91441011428833, 4.613404273986816, 6.312398433685303, 8.011392593383789, 9.710386276245117, 11.409380912780762, 13.108375549316406, 14.807373046875, 16.506366729736328, 18.205360412597656, 19.904356002807617, 21.603349685668945, 23.302343368530273, 25.001338958740234, 26.700332641601562, 28.39932632446289, 30.09832000732422, 31.797313690185547, 33.496307373046875, 35.19530487060547, 36.89429473876953, 38.593292236328125, 40.29228591918945, 41.99127960205078, 43.69027328491211, 45.38926696777344, 47.088260650634766, 48.787254333496094, 50.48625183105469, 52.185245513916016, 53.884239196777344, 55.58323287963867, 57.2822265625, 58.98122024536133, 60.680213928222656, 62.37921142578125, 64.07820129394531, 65.7771987915039, 67.4761962890625, 69.17518615722656]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 11.0, 5.0, 12.0, 9.0, 20.0, 21.0, 21.0, 18.0, 24.0, 29.0, 44.0, 50.0, 45.0, 49.0, 57.0, 46.0, 52.0, 51.0, 49.0, 45.0, 51.0, 43.0, 31.0, 44.0, 26.0, 26.0, 23.0, 26.0, 13.0, 13.0, 8.0, 15.0, 5.0, 6.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.859375, -4.671142578125, -4.48291015625, -4.294677734375, -4.1064453125, -3.918212890625, -3.72998046875, -3.541748046875, -3.353515625, -3.165283203125, -2.97705078125, -2.788818359375, -2.6005859375, -2.412353515625, -2.22412109375, -2.035888671875, -1.84765625, -1.659423828125, -1.47119140625, -1.282958984375, -1.0947265625, -0.906494140625, -0.71826171875, -0.530029296875, -0.341796875, -0.153564453125, 0.03466796875, 0.222900390625, 0.4111328125, 0.599365234375, 0.78759765625, 0.975830078125, 1.1640625, 1.352294921875, 1.54052734375, 1.728759765625, 1.9169921875, 2.105224609375, 2.29345703125, 2.481689453125, 2.669921875, 2.858154296875, 3.04638671875, 3.234619140625, 3.4228515625, 3.611083984375, 3.79931640625, 3.987548828125, 4.17578125, 4.364013671875, 4.55224609375, 4.740478515625, 4.9287109375, 5.116943359375, 5.30517578125, 5.493408203125, 5.681640625, 5.869873046875, 6.05810546875, 6.246337890625, 6.4345703125, 6.622802734375, 6.81103515625, 6.999267578125, 7.1875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 9.0, 9.0, 10.0, 22.0, 22.0, 36.0, 36.0, 57.0, 83.0, 184.0, 320.0, 614.0, 1164.0, 2377.0, 4906.0, 9919.0, 19768.0, 37973.0, 68911.0, 113614.0, 162127.0, 185676.0, 165412.0, 119886.0, 73142.0, 40247.0, 20704.0, 10668.0, 5217.0, 2590.0, 1307.0, 666.0, 319.0, 219.0, 108.0, 72.0, 38.0, 25.0, 26.0, 24.0, 11.0, 8.0, 5.0, 4.0, 4.0, 3.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.2734375, -3.166290283203125, -3.05914306640625, -2.951995849609375, -2.8448486328125, -2.737701416015625, -2.63055419921875, -2.523406982421875, -2.416259765625, -2.309112548828125, -2.20196533203125, -2.094818115234375, -1.9876708984375, -1.880523681640625, -1.77337646484375, -1.666229248046875, -1.55908203125, -1.451934814453125, -1.34478759765625, -1.237640380859375, -1.1304931640625, -1.023345947265625, -0.91619873046875, -0.809051513671875, -0.701904296875, -0.594757080078125, -0.48760986328125, -0.380462646484375, -0.2733154296875, -0.166168212890625, -0.05902099609375, 0.048126220703125, 0.1552734375, 0.262420654296875, 0.36956787109375, 0.476715087890625, 0.5838623046875, 0.691009521484375, 0.79815673828125, 0.905303955078125, 1.012451171875, 1.119598388671875, 1.22674560546875, 1.333892822265625, 1.4410400390625, 1.548187255859375, 1.65533447265625, 1.762481689453125, 1.86962890625, 1.976776123046875, 2.08392333984375, 2.191070556640625, 2.2982177734375, 2.405364990234375, 2.51251220703125, 2.619659423828125, 2.726806640625, 2.833953857421875, 2.94110107421875, 3.048248291015625, 3.1553955078125, 3.262542724609375, 3.36968994140625, 3.476837158203125, 3.583984375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 4.0, 5.0, 5.0, 8.0, 12.0, 13.0, 12.0, 13.0, 20.0, 16.0, 25.0, 20.0, 26.0, 25.0, 27.0, 35.0, 31.0, 31.0, 35.0, 41.0, 40.0, 36.0, 1058.0, 29.0, 34.0, 34.0, 32.0, 36.0, 35.0, 19.0, 35.0, 31.0, 22.0, 25.0, 23.0, 15.0, 24.0, 16.0, 11.0, 13.0, 10.0, 5.0, 10.0, 5.0, 7.0, 7.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-4.40625, -4.2587890625, -4.111328125, -3.9638671875, -3.81640625, -3.6689453125, -3.521484375, -3.3740234375, -3.2265625, -3.0791015625, -2.931640625, -2.7841796875, -2.63671875, -2.4892578125, -2.341796875, -2.1943359375, -2.046875, -1.8994140625, -1.751953125, -1.6044921875, -1.45703125, -1.3095703125, -1.162109375, -1.0146484375, -0.8671875, -0.7197265625, -0.572265625, -0.4248046875, -0.27734375, -0.1298828125, 0.017578125, 0.1650390625, 0.3125, 0.4599609375, 0.607421875, 0.7548828125, 0.90234375, 1.0498046875, 1.197265625, 1.3447265625, 1.4921875, 1.6396484375, 1.787109375, 1.9345703125, 2.08203125, 2.2294921875, 2.376953125, 2.5244140625, 2.671875, 2.8193359375, 2.966796875, 3.1142578125, 3.26171875, 3.4091796875, 3.556640625, 3.7041015625, 3.8515625, 3.9990234375, 4.146484375, 4.2939453125, 4.44140625, 4.5888671875, 4.736328125, 4.8837890625, 5.03125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 9.0, 5.0, 5.0, 12.0, 17.0, 18.0, 41.0, 50.0, 77.0, 119.0, 165.0, 251.0, 392.0, 568.0, 830.0, 1250.0, 1837.0, 2741.0, 3967.0, 5712.0, 8615.0, 12974.0, 20648.0, 42358.0, 300576.0, 1546105.0, 73511.0, 26784.0, 15794.0, 10162.0, 6888.0, 4743.0, 3245.0, 2172.0, 1435.0, 1006.0, 676.0, 466.0, 276.0, 206.0, 134.0, 101.0, 69.0, 38.0, 35.0, 17.0, 9.0, 11.0, 3.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-4.453125, -4.31488037109375, -4.1766357421875, -4.03839111328125, -3.900146484375, -3.76190185546875, -3.6236572265625, -3.48541259765625, -3.34716796875, -3.20892333984375, -3.0706787109375, -2.93243408203125, -2.794189453125, -2.65594482421875, -2.5177001953125, -2.37945556640625, -2.2412109375, -2.10296630859375, -1.9647216796875, -1.82647705078125, -1.688232421875, -1.54998779296875, -1.4117431640625, -1.27349853515625, -1.13525390625, -0.99700927734375, -0.8587646484375, -0.72052001953125, -0.582275390625, -0.44403076171875, -0.3057861328125, -0.16754150390625, -0.029296875, 0.10894775390625, 0.2471923828125, 0.38543701171875, 0.523681640625, 0.66192626953125, 0.8001708984375, 0.93841552734375, 1.07666015625, 1.21490478515625, 1.3531494140625, 1.49139404296875, 1.629638671875, 1.76788330078125, 1.9061279296875, 2.04437255859375, 2.1826171875, 2.32086181640625, 2.4591064453125, 2.59735107421875, 2.735595703125, 2.87384033203125, 3.0120849609375, 3.15032958984375, 3.28857421875, 3.42681884765625, 3.5650634765625, 3.70330810546875, 3.841552734375, 3.97979736328125, 4.1180419921875, 4.25628662109375, 4.39453125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 0.0, 5.0, 8.0, 4.0, 10.0, 16.0, 14.0, 17.0, 18.0, 25.0, 32.0, 36.0, 45.0, 49.0, 60.0, 50.0, 59.0, 68.0, 65.0, 53.0, 56.0, 41.0, 36.0, 31.0, 35.0, 25.0, 25.0, 14.0, 17.0, 15.0, 18.0, 8.0, 13.0, 6.0, 4.0, 5.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.356201171875, -0.34471893310546875, -0.3332366943359375, -0.32175445556640625, -0.310272216796875, -0.29878997802734375, -0.2873077392578125, -0.27582550048828125, -0.26434326171875, -0.25286102294921875, -0.2413787841796875, -0.22989654541015625, -0.218414306640625, -0.20693206787109375, -0.1954498291015625, -0.18396759033203125, -0.1724853515625, -0.16100311279296875, -0.1495208740234375, -0.13803863525390625, -0.126556396484375, -0.11507415771484375, -0.1035919189453125, -0.09210968017578125, -0.08062744140625, -0.06914520263671875, -0.0576629638671875, -0.04618072509765625, -0.034698486328125, -0.02321624755859375, -0.0117340087890625, -0.00025177001953125, 0.01123046875, 0.02271270751953125, 0.0341949462890625, 0.04567718505859375, 0.057159423828125, 0.06864166259765625, 0.0801239013671875, 0.09160614013671875, 0.10308837890625, 0.11457061767578125, 0.1260528564453125, 0.13753509521484375, 0.149017333984375, 0.16049957275390625, 0.1719818115234375, 0.18346405029296875, 0.1949462890625, 0.20642852783203125, 0.2179107666015625, 0.22939300537109375, 0.240875244140625, 0.25235748291015625, 0.2638397216796875, 0.27532196044921875, 0.28680419921875, 0.29828643798828125, 0.3097686767578125, 0.32125091552734375, 0.332733154296875, 0.34421539306640625, 0.3556976318359375, 0.36717987060546875, 0.378662109375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 6.0, 12.0, 13.0, 20.0, 15.0, 17.0, 24.0, 36.0, 48.0, 62.0, 106.0, 152.0, 306.0, 846.0, 5027.0, 497618.0, 537332.0, 5168.0, 833.0, 327.0, 187.0, 103.0, 71.0, 45.0, 44.0, 25.0, 22.0, 15.0, 15.0, 14.0, 9.0, 4.0, 4.0, 3.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.91015625, -6.7008056640625, -6.491455078125, -6.2821044921875, -6.07275390625, -5.8634033203125, -5.654052734375, -5.4447021484375, -5.2353515625, -5.0260009765625, -4.816650390625, -4.6072998046875, -4.39794921875, -4.1885986328125, -3.979248046875, -3.7698974609375, -3.560546875, -3.3511962890625, -3.141845703125, -2.9324951171875, -2.72314453125, -2.5137939453125, -2.304443359375, -2.0950927734375, -1.8857421875, -1.6763916015625, -1.467041015625, -1.2576904296875, -1.04833984375, -0.8389892578125, -0.629638671875, -0.4202880859375, -0.2109375, -0.0015869140625, 0.207763671875, 0.4171142578125, 0.62646484375, 0.8358154296875, 1.045166015625, 1.2545166015625, 1.4638671875, 1.6732177734375, 1.882568359375, 2.0919189453125, 2.30126953125, 2.5106201171875, 2.719970703125, 2.9293212890625, 3.138671875, 3.3480224609375, 3.557373046875, 3.7667236328125, 3.97607421875, 4.1854248046875, 4.394775390625, 4.6041259765625, 4.8134765625, 5.0228271484375, 5.232177734375, 5.4415283203125, 5.65087890625, 5.8602294921875, 6.069580078125, 6.2789306640625, 6.48828125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 5.0, 14.0, 33.0, 49.0, 134.0, 248.0, 228.0, 141.0, 80.0, 28.0, 15.0, 12.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.374390602111816, -5.257606506347656, -5.140822887420654, -5.024038791656494, -4.907254695892334, -4.790471076965332, -4.673686981201172, -4.556902885437012, -4.440118789672852, -4.323334693908691, -4.2065510749816895, -4.089766979217529, -3.972982883453369, -3.856199026107788, -3.739415168762207, -3.622631072998047, -3.505847454071045, -3.389063596725464, -3.2722795009613037, -3.1554956436157227, -3.0387115478515625, -2.9219276905059814, -2.8051438331604004, -2.6883597373962402, -2.571575880050659, -2.454792022705078, -2.338007926940918, -2.221224069595337, -2.104440212249756, -1.9876561164855957, -1.8708722591400146, -1.754088282585144, -1.6373045444488525, -1.520520567893982, -1.4037365913391113, -1.2869527339935303, -1.1701687574386597, -1.053384780883789, -0.9366008639335632, -0.8198169469833374, -0.7030329704284668, -0.5862489938735962, -0.46946507692337036, -0.35268113017082214, -0.23589718341827393, -0.11911320686340332, -0.0023292899131774902, 0.11445462703704834, 0.23123860359191895, 0.34802255034446716, 0.4648064970970154, 0.5815904140472412, 0.6983743906021118, 0.8151583671569824, 0.9319422841072083, 1.048726201057434, 1.1655101776123047, 1.2822941541671753, 1.399078130722046, 1.515861988067627, 1.6326459646224976, 1.7494299411773682, 1.8662137985229492, 1.9829977750778198, 2.0997817516326904]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 6.0, 8.0, 10.0, 18.0, 30.0, 40.0, 40.0, 48.0, 49.0, 66.0, 64.0, 71.0, 71.0, 67.0, 70.0, 66.0, 61.0, 49.0, 52.0, 26.0, 25.0, 17.0, 15.0, 12.0, 5.0, 5.0, 6.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1473071575164795, -3.059440851211548, -2.971574544906616, -2.8837082386016846, -2.795841693878174, -2.707975387573242, -2.6201090812683105, -2.532242774963379, -2.4443764686584473, -2.3565101623535156, -2.268643856048584, -2.1807775497436523, -2.0929112434387207, -2.00504469871521, -1.9171783924102783, -1.8293120861053467, -1.741445779800415, -1.6535794734954834, -1.5657131671905518, -1.4778467416763306, -1.389980435371399, -1.3021141290664673, -1.214247703552246, -1.1263813972473145, -1.0385150909423828, -0.9506487846374512, -0.8627824187278748, -0.7749160528182983, -0.6870497465133667, -0.5991834402084351, -0.5113170742988586, -0.4234507083892822, -0.3355841636657715, -0.24771782755851746, -0.15985149145126343, -0.0719851553440094, 0.01588118076324463, 0.10374751687049866, 0.19161385297775269, 0.2794802188873291, 0.36734652519226074, 0.45521286129951477, 0.5430791974067688, 0.6309455633163452, 0.7188118696212769, 0.8066781759262085, 0.8945445418357849, 0.9824109077453613, 1.070277214050293, 1.1581435203552246, 1.2460098266601562, 1.3338762521743774, 1.421742558479309, 1.5096088647842407, 1.597475290298462, 1.6853415966033936, 1.7732079029083252, 1.8610742092132568, 1.9489405155181885, 2.03680682182312, 2.124673366546631, 2.2125396728515625, 2.300405979156494, 2.388272285461426, 2.4761385917663574]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 3.0, 7.0, 6.0, 10.0, 8.0, 19.0, 9.0, 13.0, 18.0, 28.0, 22.0, 29.0, 29.0, 42.0, 37.0, 38.0, 43.0, 37.0, 48.0, 43.0, 43.0, 45.0, 53.0, 47.0, 39.0, 38.0, 32.0, 31.0, 26.0, 23.0, 19.0, 18.0, 16.0, 20.0, 14.0, 14.0, 9.0, 8.0, 5.0, 4.0, 1.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2265625, -5.06256103515625, -4.8985595703125, -4.73455810546875, -4.570556640625, -4.40655517578125, -4.2425537109375, -4.07855224609375, -3.91455078125, -3.75054931640625, -3.5865478515625, -3.42254638671875, -3.258544921875, -3.09454345703125, -2.9305419921875, -2.76654052734375, -2.6025390625, -2.43853759765625, -2.2745361328125, -2.11053466796875, -1.946533203125, -1.78253173828125, -1.6185302734375, -1.45452880859375, -1.29052734375, -1.12652587890625, -0.9625244140625, -0.79852294921875, -0.634521484375, -0.47052001953125, -0.3065185546875, -0.14251708984375, 0.021484375, 0.18548583984375, 0.3494873046875, 0.51348876953125, 0.677490234375, 0.84149169921875, 1.0054931640625, 1.16949462890625, 1.33349609375, 1.49749755859375, 1.6614990234375, 1.82550048828125, 1.989501953125, 2.15350341796875, 2.3175048828125, 2.48150634765625, 2.6455078125, 2.80950927734375, 2.9735107421875, 3.13751220703125, 3.301513671875, 3.46551513671875, 3.6295166015625, 3.79351806640625, 3.95751953125, 4.12152099609375, 4.2855224609375, 4.44952392578125, 4.613525390625, 4.77752685546875, 4.9415283203125, 5.10552978515625, 5.26953125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 3.0, 6.0, 5.0, 12.0, 18.0, 24.0, 42.0, 47.0, 67.0, 109.0, 181.0, 255.0, 431.0, 715.0, 1151.0, 1960.0, 3384.0, 6108.0, 10961.0, 20160.0, 38601.0, 75072.0, 151103.0, 308184.0, 209416.0, 106183.0, 53228.0, 27516.0, 14621.0, 7984.0, 4547.0, 2601.0, 1523.0, 877.0, 556.0, 300.0, 187.0, 133.0, 83.0, 58.0, 46.0, 32.0, 17.0, 15.0, 8.0, 10.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.875, -4.7164306640625, -4.557861328125, -4.3992919921875, -4.24072265625, -4.0821533203125, -3.923583984375, -3.7650146484375, -3.6064453125, -3.4478759765625, -3.289306640625, -3.1307373046875, -2.97216796875, -2.8135986328125, -2.655029296875, -2.4964599609375, -2.337890625, -2.1793212890625, -2.020751953125, -1.8621826171875, -1.70361328125, -1.5450439453125, -1.386474609375, -1.2279052734375, -1.0693359375, -0.9107666015625, -0.752197265625, -0.5936279296875, -0.43505859375, -0.2764892578125, -0.117919921875, 0.0406494140625, 0.19921875, 0.3577880859375, 0.516357421875, 0.6749267578125, 0.83349609375, 0.9920654296875, 1.150634765625, 1.3092041015625, 1.4677734375, 1.6263427734375, 1.784912109375, 1.9434814453125, 2.10205078125, 2.2606201171875, 2.419189453125, 2.5777587890625, 2.736328125, 2.8948974609375, 3.053466796875, 3.2120361328125, 3.37060546875, 3.5291748046875, 3.687744140625, 3.8463134765625, 4.0048828125, 4.1634521484375, 4.322021484375, 4.4805908203125, 4.63916015625, 4.7977294921875, 4.956298828125, 5.1148681640625, 5.2734375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 8.0, 15.0, 15.0, 15.0, 30.0, 38.0, 38.0, 60.0, 64.0, 76.0, 127.0, 293.0, 1567.0, 222.0, 133.0, 82.0, 48.0, 55.0, 39.0, 31.0, 19.0, 22.0, 12.0, 11.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.84375, -20.94677734375, -20.0498046875, -19.15283203125, -18.255859375, -17.35888671875, -16.4619140625, -15.56494140625, -14.66796875, -13.77099609375, -12.8740234375, -11.97705078125, -11.080078125, -10.18310546875, -9.2861328125, -8.38916015625, -7.4921875, -6.59521484375, -5.6982421875, -4.80126953125, -3.904296875, -3.00732421875, -2.1103515625, -1.21337890625, -0.31640625, 0.58056640625, 1.4775390625, 2.37451171875, 3.271484375, 4.16845703125, 5.0654296875, 5.96240234375, 6.859375, 7.75634765625, 8.6533203125, 9.55029296875, 10.447265625, 11.34423828125, 12.2412109375, 13.13818359375, 14.03515625, 14.93212890625, 15.8291015625, 16.72607421875, 17.623046875, 18.52001953125, 19.4169921875, 20.31396484375, 21.2109375, 22.10791015625, 23.0048828125, 23.90185546875, 24.798828125, 25.69580078125, 26.5927734375, 27.48974609375, 28.38671875, 29.28369140625, 30.1806640625, 31.07763671875, 31.974609375, 32.87158203125, 33.7685546875, 34.66552734375, 35.5625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 16.0, 16.0, 70.0, 219.0, 1293.0, 1798899.0, 1343478.0, 1321.0, 227.0, 73.0, 28.0, 11.0, 7.0, 4.0, 9.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.0, -168.19921875, -162.3984375, -156.59765625, -150.796875, -144.99609375, -139.1953125, -133.39453125, -127.59375, -121.79296875, -115.9921875, -110.19140625, -104.390625, -98.58984375, -92.7890625, -86.98828125, -81.1875, -75.38671875, -69.5859375, -63.78515625, -57.984375, -52.18359375, -46.3828125, -40.58203125, -34.78125, -28.98046875, -23.1796875, -17.37890625, -11.578125, -5.77734375, 0.0234375, 5.82421875, 11.625, 17.42578125, 23.2265625, 29.02734375, 34.828125, 40.62890625, 46.4296875, 52.23046875, 58.03125, 63.83203125, 69.6328125, 75.43359375, 81.234375, 87.03515625, 92.8359375, 98.63671875, 104.4375, 110.23828125, 116.0390625, 121.83984375, 127.640625, 133.44140625, 139.2421875, 145.04296875, 150.84375, 156.64453125, 162.4453125, 168.24609375, 174.046875, 179.84765625, 185.6484375, 191.44921875, 197.25]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1013.0, 3.0, 3.0], "bins": [-2173.353515625, -2138.10595703125, -2102.8583984375, -2067.61083984375, -2032.3634033203125, -1997.1158447265625, -1961.8682861328125, -1926.6207275390625, -1891.373291015625, -1856.125732421875, -1820.878173828125, -1785.6307373046875, -1750.3831787109375, -1715.1356201171875, -1679.8880615234375, -1644.6405029296875, -1609.3929443359375, -1574.1453857421875, -1538.8978271484375, -1503.650390625, -1468.40283203125, -1433.1552734375, -1397.90771484375, -1362.66015625, -1327.41259765625, -1292.1650390625, -1256.91748046875, -1221.6700439453125, -1186.4224853515625, -1151.1749267578125, -1115.9273681640625, -1080.6798095703125, -1045.432373046875, -1010.184814453125, -974.9373168945312, -939.6897583007812, -904.4422607421875, -869.1947021484375, -833.9471435546875, -798.6995849609375, -763.4520263671875, -728.2044677734375, -692.9569702148438, -657.7094116210938, -622.4619140625, -587.21435546875, -551.966796875, -516.71923828125, -481.47174072265625, -446.2242126464844, -410.9766845703125, -375.7291259765625, -340.4815979003906, -305.23406982421875, -269.98651123046875, -234.73898315429688, -199.49147033691406, -164.24392700195312, -128.99639892578125, -93.74886322021484, -58.50132751464844, -23.253799438476562, 11.993743896484375, 47.24128723144531, 82.48881530761719]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 12.0, 15.0, 22.0, 38.0, 48.0, 39.0, 60.0, 74.0, 69.0, 76.0, 80.0, 89.0, 88.0, 64.0, 55.0, 47.0, 40.0, 31.0, 23.0, 13.0, 12.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.29937744140625, -100.31397247314453, -97.32857513427734, -94.34317016601562, -91.35777282714844, -88.37236785888672, -85.386962890625, -82.40156555175781, -79.4161605834961, -76.43075561523438, -73.44535827636719, -70.45995330810547, -67.47454833984375, -64.48915100097656, -61.503746032714844, -58.51834487915039, -55.53294372558594, -52.547542572021484, -49.56214141845703, -46.57673645019531, -43.59133529663086, -40.605934143066406, -37.62052917480469, -34.635128021240234, -31.64972686767578, -28.664325714111328, -25.678922653198242, -22.693519592285156, -19.708118438720703, -16.72271728515625, -13.737314224243164, -10.751911163330078, -7.766510009765625, -4.7811079025268555, -1.795705795288086, 1.1896963119506836, 4.175098419189453, 7.160500526428223, 10.145902633666992, 13.131305694580078, 16.11670684814453, 19.102108001708984, 22.08751106262207, 25.072914123535156, 28.05831527709961, 31.043716430664062, 34.02912139892578, 37.014522552490234, 39.99992370605469, 42.98532485961914, 45.970726013183594, 48.95613098144531, 51.941532135009766, 54.92693328857422, 57.91233825683594, 60.89773941040039, 63.883140563964844, 66.86854553222656, 69.85394287109375, 72.83934783935547, 75.82475280761719, 78.81015014648438, 81.7955551147461, 84.78096008300781, 87.766357421875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 3.0, 3.0, 10.0, 3.0, 7.0, 9.0, 11.0, 15.0, 13.0, 19.0, 30.0, 25.0, 22.0, 19.0, 31.0, 28.0, 38.0, 40.0, 40.0, 49.0, 39.0, 42.0, 35.0, 44.0, 47.0, 37.0, 37.0, 32.0, 30.0, 33.0, 30.0, 19.0, 18.0, 23.0, 20.0, 19.0, 9.0, 10.0, 13.0, 15.0, 4.0, 3.0, 7.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.984375, -4.8236083984375, -4.662841796875, -4.5020751953125, -4.34130859375, -4.1805419921875, -4.019775390625, -3.8590087890625, -3.6982421875, -3.5374755859375, -3.376708984375, -3.2159423828125, -3.05517578125, -2.8944091796875, -2.733642578125, -2.5728759765625, -2.412109375, -2.2513427734375, -2.090576171875, -1.9298095703125, -1.76904296875, -1.6082763671875, -1.447509765625, -1.2867431640625, -1.1259765625, -0.9652099609375, -0.804443359375, -0.6436767578125, -0.48291015625, -0.3221435546875, -0.161376953125, -0.0006103515625, 0.16015625, 0.3209228515625, 0.481689453125, 0.6424560546875, 0.80322265625, 0.9639892578125, 1.124755859375, 1.2855224609375, 1.4462890625, 1.6070556640625, 1.767822265625, 1.9285888671875, 2.08935546875, 2.2501220703125, 2.410888671875, 2.5716552734375, 2.732421875, 2.8931884765625, 3.053955078125, 3.2147216796875, 3.37548828125, 3.5362548828125, 3.697021484375, 3.8577880859375, 4.0185546875, 4.1793212890625, 4.340087890625, 4.5008544921875, 4.66162109375, 4.8223876953125, 4.983154296875, 5.1439208984375, 5.3046875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 8.0, 8.0, 13.0, 17.0, 30.0, 43.0, 67.0, 93.0, 159.0, 231.0, 358.0, 618.0, 996.0, 1775.0, 3300.0, 6528.0, 15646.0, 43682.0, 153015.0, 634082.0, 1727925.0, 1172346.0, 305277.0, 80602.0, 26602.0, 10447.0, 4790.0, 2332.0, 1285.0, 748.0, 451.0, 272.0, 180.0, 116.0, 86.0, 50.0, 30.0, 20.0, 20.0, 11.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0], "bins": [-8.3671875, -8.1116943359375, -7.856201171875, -7.6007080078125, -7.34521484375, -7.0897216796875, -6.834228515625, -6.5787353515625, -6.3232421875, -6.0677490234375, -5.812255859375, -5.5567626953125, -5.30126953125, -5.0457763671875, -4.790283203125, -4.5347900390625, -4.279296875, -4.0238037109375, -3.768310546875, -3.5128173828125, -3.25732421875, -3.0018310546875, -2.746337890625, -2.4908447265625, -2.2353515625, -1.9798583984375, -1.724365234375, -1.4688720703125, -1.21337890625, -0.9578857421875, -0.702392578125, -0.4468994140625, -0.19140625, 0.0640869140625, 0.319580078125, 0.5750732421875, 0.83056640625, 1.0860595703125, 1.341552734375, 1.5970458984375, 1.8525390625, 2.1080322265625, 2.363525390625, 2.6190185546875, 2.87451171875, 3.1300048828125, 3.385498046875, 3.6409912109375, 3.896484375, 4.1519775390625, 4.407470703125, 4.6629638671875, 4.91845703125, 5.1739501953125, 5.429443359375, 5.6849365234375, 5.9404296875, 6.1959228515625, 6.451416015625, 6.7069091796875, 6.96240234375, 7.2178955078125, 7.473388671875, 7.7288818359375, 7.984375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 10.0, 7.0, 9.0, 15.0, 32.0, 50.0, 70.0, 177.0, 255.0, 492.0, 794.0, 883.0, 570.0, 328.0, 199.0, 82.0, 61.0, 22.0, 15.0, 5.0, 6.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.96875, -30.32568359375, -29.6826171875, -29.03955078125, -28.396484375, -27.75341796875, -27.1103515625, -26.46728515625, -25.82421875, -25.18115234375, -24.5380859375, -23.89501953125, -23.251953125, -22.60888671875, -21.9658203125, -21.32275390625, -20.6796875, -20.03662109375, -19.3935546875, -18.75048828125, -18.107421875, -17.46435546875, -16.8212890625, -16.17822265625, -15.53515625, -14.89208984375, -14.2490234375, -13.60595703125, -12.962890625, -12.31982421875, -11.6767578125, -11.03369140625, -10.390625, -9.74755859375, -9.1044921875, -8.46142578125, -7.818359375, -7.17529296875, -6.5322265625, -5.88916015625, -5.24609375, -4.60302734375, -3.9599609375, -3.31689453125, -2.673828125, -2.03076171875, -1.3876953125, -0.74462890625, -0.1015625, 0.54150390625, 1.1845703125, 1.82763671875, 2.470703125, 3.11376953125, 3.7568359375, 4.39990234375, 5.04296875, 5.68603515625, 6.3291015625, 6.97216796875, 7.615234375, 8.25830078125, 8.9013671875, 9.54443359375, 10.1875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 9.0, 15.0, 26.0, 44.0, 76.0, 153.0, 299.0, 660.0, 2927.0, 285374.0, 3884123.0, 18498.0, 1178.0, 430.0, 215.0, 115.0, 55.0, 40.0, 22.0, 17.0, 5.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.015625, -29.109130859375, -27.20263671875, -25.296142578125, -23.3896484375, -21.483154296875, -19.57666015625, -17.670166015625, -15.763671875, -13.857177734375, -11.95068359375, -10.044189453125, -8.1376953125, -6.231201171875, -4.32470703125, -2.418212890625, -0.51171875, 1.394775390625, 3.30126953125, 5.207763671875, 7.1142578125, 9.020751953125, 10.92724609375, 12.833740234375, 14.740234375, 16.646728515625, 18.55322265625, 20.459716796875, 22.3662109375, 24.272705078125, 26.17919921875, 28.085693359375, 29.9921875, 31.898681640625, 33.80517578125, 35.711669921875, 37.6181640625, 39.524658203125, 41.43115234375, 43.337646484375, 45.244140625, 47.150634765625, 49.05712890625, 50.963623046875, 52.8701171875, 54.776611328125, 56.68310546875, 58.589599609375, 60.49609375, 62.402587890625, 64.30908203125, 66.215576171875, 68.1220703125, 70.028564453125, 71.93505859375, 73.841552734375, 75.748046875, 77.654541015625, 79.56103515625, 81.467529296875, 83.3740234375, 85.280517578125, 87.18701171875, 89.093505859375, 91.0]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 27.0, 114.0, 259.0, 312.0, 195.0, 67.0, 28.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.58467864990234, -83.49061584472656, -78.39655303955078, -73.302490234375, -68.20843505859375, -63.1143684387207, -58.02030944824219, -52.926246643066406, -47.832183837890625, -42.738121032714844, -37.64405822753906, -32.54999923706055, -27.455936431884766, -22.361873626708984, -17.267812728881836, -12.173751831054688, -7.079689025878906, -1.9856271743774414, 3.1084346771240234, 8.202496528625488, 13.296558380126953, 18.390621185302734, 23.484682083129883, 28.57874298095703, 33.67280578613281, 38.766868591308594, 43.860931396484375, 48.95499038696289, 54.04905319213867, 59.14311599731445, 64.23717498779297, 69.33123779296875, 74.42529296875, 79.51935577392578, 84.61341857910156, 89.70748138427734, 94.80154418945312, 99.89559936523438, 104.98966217041016, 110.08372497558594, 115.17778778076172, 120.2718505859375, 125.36591339111328, 130.45997619628906, 135.5540313720703, 140.64810180664062, 145.74215698242188, 150.83621215820312, 155.93028259277344, 161.0243377685547, 166.118408203125, 171.21246337890625, 176.30653381347656, 181.4005889892578, 186.49465942382812, 191.58871459960938, 196.68276977539062, 201.77682495117188, 206.8708953857422, 211.96495056152344, 217.05902099609375, 222.153076171875, 227.2471466064453, 232.34120178222656, 237.43527221679688]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 7.0, 6.0, 3.0, 13.0, 9.0, 13.0, 12.0, 23.0, 19.0, 16.0, 22.0, 23.0, 33.0, 25.0, 34.0, 30.0, 36.0, 42.0, 41.0, 42.0, 39.0, 38.0, 44.0, 34.0, 31.0, 43.0, 47.0, 37.0, 29.0, 31.0, 28.0, 19.0, 15.0, 16.0, 13.0, 17.0, 13.0, 11.0, 13.0, 9.0, 7.0, 3.0, 8.0, 5.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-39.76934814453125, -38.58564758300781, -37.401947021484375, -36.21824645996094, -35.0345458984375, -33.85084533691406, -32.667144775390625, -31.483444213867188, -30.29974365234375, -29.116043090820312, -27.932342529296875, -26.748641967773438, -25.56494140625, -24.381240844726562, -23.197540283203125, -22.013839721679688, -20.83013916015625, -19.646438598632812, -18.462738037109375, -17.279037475585938, -16.0953369140625, -14.911636352539062, -13.727935791015625, -12.544235229492188, -11.36053466796875, -10.176834106445312, -8.993133544921875, -7.8094329833984375, -6.625732421875, -5.4420318603515625, -4.258331298828125, -3.0746307373046875, -1.8909263610839844, -0.7072257995605469, 0.4764747619628906, 1.6601753234863281, 2.8438758850097656, 4.027576446533203, 5.211277008056641, 6.394977569580078, 7.578678131103516, 8.762378692626953, 9.94607925415039, 11.129779815673828, 12.313480377197266, 13.497180938720703, 14.68088150024414, 15.864582061767578, 17.048282623291016, 18.231983184814453, 19.41568374633789, 20.599384307861328, 21.783084869384766, 22.966785430908203, 24.15048599243164, 25.334186553955078, 26.517887115478516, 27.701587677001953, 28.88528823852539, 30.068988800048828, 31.252689361572266, 32.4363899230957, 33.62009048461914, 34.80379104614258, 35.987491607666016]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 3.0, 6.0, 11.0, 18.0, 7.0, 17.0, 16.0, 14.0, 16.0, 31.0, 20.0, 32.0, 27.0, 21.0, 28.0, 43.0, 34.0, 43.0, 40.0, 44.0, 48.0, 38.0, 46.0, 37.0, 35.0, 41.0, 32.0, 35.0, 24.0, 29.0, 32.0, 18.0, 20.0, 14.0, 15.0, 10.0, 9.0, 10.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.17578125, -5.01434326171875, -4.8529052734375, -4.69146728515625, -4.530029296875, -4.36859130859375, -4.2071533203125, -4.04571533203125, -3.88427734375, -3.72283935546875, -3.5614013671875, -3.39996337890625, -3.238525390625, -3.07708740234375, -2.9156494140625, -2.75421142578125, -2.5927734375, -2.43133544921875, -2.2698974609375, -2.10845947265625, -1.947021484375, -1.78558349609375, -1.6241455078125, -1.46270751953125, -1.30126953125, -1.13983154296875, -0.9783935546875, -0.81695556640625, -0.655517578125, -0.49407958984375, -0.3326416015625, -0.17120361328125, -0.009765625, 0.15167236328125, 0.3131103515625, 0.47454833984375, 0.635986328125, 0.79742431640625, 0.9588623046875, 1.12030029296875, 1.28173828125, 1.44317626953125, 1.6046142578125, 1.76605224609375, 1.927490234375, 2.08892822265625, 2.2503662109375, 2.41180419921875, 2.5732421875, 2.73468017578125, 2.8961181640625, 3.05755615234375, 3.218994140625, 3.38043212890625, 3.5418701171875, 3.70330810546875, 3.86474609375, 4.02618408203125, 4.1876220703125, 4.34906005859375, 4.510498046875, 4.67193603515625, 4.8333740234375, 4.99481201171875, 5.15625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 14.0, 12.0, 25.0, 37.0, 58.0, 91.0, 137.0, 252.0, 433.0, 738.0, 1345.0, 2658.0, 5236.0, 10704.0, 23636.0, 49380.0, 100370.0, 180733.0, 242356.0, 199882.0, 117378.0, 59165.0, 28170.0, 13032.0, 6077.0, 3049.0, 1572.0, 836.0, 475.0, 266.0, 153.0, 102.0, 67.0, 29.0, 28.0, 22.0, 10.0, 7.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.462890625, -3.341888427734375, -3.22088623046875, -3.099884033203125, -2.9788818359375, -2.857879638671875, -2.73687744140625, -2.615875244140625, -2.494873046875, -2.373870849609375, -2.25286865234375, -2.131866455078125, -2.0108642578125, -1.889862060546875, -1.76885986328125, -1.647857666015625, -1.52685546875, -1.405853271484375, -1.28485107421875, -1.163848876953125, -1.0428466796875, -0.921844482421875, -0.80084228515625, -0.679840087890625, -0.558837890625, -0.437835693359375, -0.31683349609375, -0.195831298828125, -0.0748291015625, 0.046173095703125, 0.16717529296875, 0.288177490234375, 0.4091796875, 0.530181884765625, 0.65118408203125, 0.772186279296875, 0.8931884765625, 1.014190673828125, 1.13519287109375, 1.256195068359375, 1.377197265625, 1.498199462890625, 1.61920166015625, 1.740203857421875, 1.8612060546875, 1.982208251953125, 2.10321044921875, 2.224212646484375, 2.34521484375, 2.466217041015625, 2.58721923828125, 2.708221435546875, 2.8292236328125, 2.950225830078125, 3.07122802734375, 3.192230224609375, 3.313232421875, 3.434234619140625, 3.55523681640625, 3.676239013671875, 3.7972412109375, 3.918243408203125, 4.03924560546875, 4.160247802734375, 4.28125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 2.0, 9.0, 14.0, 11.0, 22.0, 24.0, 33.0, 43.0, 52.0, 53.0, 61.0, 62.0, 55.0, 1096.0, 67.0, 59.0, 49.0, 50.0, 59.0, 39.0, 37.0, 25.0, 27.0, 24.0, 8.0, 13.0, 7.0, 7.0, 3.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8515625, -8.580810546875, -8.31005859375, -8.039306640625, -7.7685546875, -7.497802734375, -7.22705078125, -6.956298828125, -6.685546875, -6.414794921875, -6.14404296875, -5.873291015625, -5.6025390625, -5.331787109375, -5.06103515625, -4.790283203125, -4.51953125, -4.248779296875, -3.97802734375, -3.707275390625, -3.4365234375, -3.165771484375, -2.89501953125, -2.624267578125, -2.353515625, -2.082763671875, -1.81201171875, -1.541259765625, -1.2705078125, -0.999755859375, -0.72900390625, -0.458251953125, -0.1875, 0.083251953125, 0.35400390625, 0.624755859375, 0.8955078125, 1.166259765625, 1.43701171875, 1.707763671875, 1.978515625, 2.249267578125, 2.52001953125, 2.790771484375, 3.0615234375, 3.332275390625, 3.60302734375, 3.873779296875, 4.14453125, 4.415283203125, 4.68603515625, 4.956787109375, 5.2275390625, 5.498291015625, 5.76904296875, 6.039794921875, 6.310546875, 6.581298828125, 6.85205078125, 7.122802734375, 7.3935546875, 7.664306640625, 7.93505859375, 8.205810546875, 8.4765625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 9.0, 11.0, 17.0, 18.0, 29.0, 35.0, 53.0, 100.0, 151.0, 241.0, 386.0, 563.0, 885.0, 1621.0, 2948.0, 5085.0, 9277.0, 18567.0, 42339.0, 1047311.0, 885759.0, 42207.0, 17945.0, 9426.0, 5208.0, 2823.0, 1618.0, 926.0, 556.0, 359.0, 207.0, 153.0, 103.0, 54.0, 30.0, 33.0, 28.0, 22.0, 9.0, 12.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.37109375, -7.16046142578125, -6.9498291015625, -6.73919677734375, -6.528564453125, -6.31793212890625, -6.1072998046875, -5.89666748046875, -5.68603515625, -5.47540283203125, -5.2647705078125, -5.05413818359375, -4.843505859375, -4.63287353515625, -4.4222412109375, -4.21160888671875, -4.0009765625, -3.79034423828125, -3.5797119140625, -3.36907958984375, -3.158447265625, -2.94781494140625, -2.7371826171875, -2.52655029296875, -2.31591796875, -2.10528564453125, -1.8946533203125, -1.68402099609375, -1.473388671875, -1.26275634765625, -1.0521240234375, -0.84149169921875, -0.630859375, -0.42022705078125, -0.2095947265625, 0.00103759765625, 0.211669921875, 0.42230224609375, 0.6329345703125, 0.84356689453125, 1.05419921875, 1.26483154296875, 1.4754638671875, 1.68609619140625, 1.896728515625, 2.10736083984375, 2.3179931640625, 2.52862548828125, 2.7392578125, 2.94989013671875, 3.1605224609375, 3.37115478515625, 3.581787109375, 3.79241943359375, 4.0030517578125, 4.21368408203125, 4.42431640625, 4.63494873046875, 4.8455810546875, 5.05621337890625, 5.266845703125, 5.47747802734375, 5.6881103515625, 5.89874267578125, 6.109375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 5.0, 8.0, 18.0, 31.0, 28.0, 49.0, 54.0, 90.0, 110.0, 158.0, 120.0, 77.0, 59.0, 55.0, 43.0, 21.0, 15.0, 14.0, 10.0, 4.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.615234375, -0.5950546264648438, -0.5748748779296875, -0.5546951293945312, -0.534515380859375, -0.5143356323242188, -0.4941558837890625, -0.47397613525390625, -0.45379638671875, -0.43361663818359375, -0.4134368896484375, -0.39325714111328125, -0.373077392578125, -0.35289764404296875, -0.3327178955078125, -0.31253814697265625, -0.2923583984375, -0.27217864990234375, -0.2519989013671875, -0.23181915283203125, -0.211639404296875, -0.19145965576171875, -0.1712799072265625, -0.15110015869140625, -0.13092041015625, -0.11074066162109375, -0.0905609130859375, -0.07038116455078125, -0.050201416015625, -0.03002166748046875, -0.0098419189453125, 0.01033782958984375, 0.030517578125, 0.05069732666015625, 0.0708770751953125, 0.09105682373046875, 0.111236572265625, 0.13141632080078125, 0.1515960693359375, 0.17177581787109375, 0.19195556640625, 0.21213531494140625, 0.2323150634765625, 0.25249481201171875, 0.272674560546875, 0.29285430908203125, 0.3130340576171875, 0.33321380615234375, 0.3533935546875, 0.37357330322265625, 0.3937530517578125, 0.41393280029296875, 0.434112548828125, 0.45429229736328125, 0.4744720458984375, 0.49465179443359375, 0.51483154296875, 0.5350112915039062, 0.5551910400390625, 0.5753707885742188, 0.595550537109375, 0.6157302856445312, 0.6359100341796875, 0.6560897827148438, 0.67626953125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 4.0, 7.0, 12.0, 13.0, 23.0, 28.0, 71.0, 100.0, 149.0, 386.0, 4273.0, 1028403.0, 14097.0, 541.0, 171.0, 109.0, 44.0, 42.0, 32.0, 16.0, 6.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.71875, -13.310791015625, -12.90283203125, -12.494873046875, -12.0869140625, -11.678955078125, -11.27099609375, -10.863037109375, -10.455078125, -10.047119140625, -9.63916015625, -9.231201171875, -8.8232421875, -8.415283203125, -8.00732421875, -7.599365234375, -7.19140625, -6.783447265625, -6.37548828125, -5.967529296875, -5.5595703125, -5.151611328125, -4.74365234375, -4.335693359375, -3.927734375, -3.519775390625, -3.11181640625, -2.703857421875, -2.2958984375, -1.887939453125, -1.47998046875, -1.072021484375, -0.6640625, -0.256103515625, 0.15185546875, 0.559814453125, 0.9677734375, 1.375732421875, 1.78369140625, 2.191650390625, 2.599609375, 3.007568359375, 3.41552734375, 3.823486328125, 4.2314453125, 4.639404296875, 5.04736328125, 5.455322265625, 5.86328125, 6.271240234375, 6.67919921875, 7.087158203125, 7.4951171875, 7.903076171875, 8.31103515625, 8.718994140625, 9.126953125, 9.534912109375, 9.94287109375, 10.350830078125, 10.7587890625, 11.166748046875, 11.57470703125, 11.982666015625, 12.390625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 25.0, 75.0, 242.0, 443.0, 148.0, 50.0, 8.0, 7.0, 3.0, 0.0, 0.0, 2.0], "bins": [-10.14067268371582, -9.957185745239258, -9.773698806762695, -9.590211868286133, -9.406725883483887, -9.223238945007324, -9.039752006530762, -8.8562650680542, -8.672778129577637, -8.489291191101074, -8.305804252624512, -8.12231731414795, -7.938830852508545, -7.755343914031982, -7.571857452392578, -7.388370513916016, -7.204883575439453, -7.021396636962891, -6.837910175323486, -6.654423236846924, -6.470936298370361, -6.287449359893799, -6.1039628982543945, -5.920475959777832, -5.736989498138428, -5.553502559661865, -5.370016098022461, -5.186529159545898, -5.003042221069336, -4.819555282592773, -4.636068820953369, -4.452581882476807, -4.269095420837402, -4.08560848236084, -3.9021217823028564, -3.718635082244873, -3.5351481437683105, -3.351661443710327, -3.1681747436523438, -2.9846878051757812, -2.8012008666992188, -2.6177141666412354, -2.434227228164673, -2.2507405281066895, -2.067253589630127, -1.8837668895721436, -1.7002800703048706, -1.5167932510375977, -1.3333063125610352, -1.1498194932937622, -0.9663326740264893, -0.7828459143638611, -0.5993590950965881, -0.4158722758293152, -0.232385516166687, -0.04889869689941406, 0.1345881223678589, 0.31807494163513184, 0.5015617609024048, 0.685048520565033, 0.8685353398323059, 1.0520222187042236, 1.235508918762207, 1.41899573802948, 1.602482557296753]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 9.0, 16.0, 24.0, 20.0, 30.0, 50.0, 42.0, 52.0, 60.0, 48.0, 77.0, 84.0, 64.0, 65.0, 56.0, 62.0, 40.0, 48.0, 37.0, 35.0, 17.0, 19.0, 12.0, 12.0, 9.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6537468433380127, -1.590704321861267, -1.5276618003845215, -1.4646192789077759, -1.4015767574310303, -1.3385343551635742, -1.2754918336868286, -1.212449312210083, -1.1494067907333374, -1.0863642692565918, -1.0233217477798462, -0.9602792859077454, -0.8972367644309998, -0.8341942429542542, -0.7711517810821533, -0.7081092596054077, -0.6450667381286621, -0.5820242166519165, -0.5189816951751709, -0.45593923330307007, -0.39289671182632446, -0.32985419034957886, -0.26681169867515564, -0.20376920700073242, -0.14072668552398682, -0.0776841789484024, -0.014641672372817993, 0.04840083420276642, 0.11144334077835083, 0.17448586225509644, 0.23752835392951965, 0.30057084560394287, 0.3636131286621094, 0.426655650138855, 0.4896981418132782, 0.5527406334877014, 0.615783154964447, 0.6788256764411926, 0.7418681383132935, 0.8049106597900391, 0.8679531812667847, 0.9309957027435303, 0.9940382242202759, 1.0570807456970215, 1.1201231479644775, 1.1831657886505127, 1.2462081909179688, 1.3092507123947144, 1.37229323387146, 1.4353357553482056, 1.4983782768249512, 1.5614207983016968, 1.6244633197784424, 1.6875057220458984, 1.750548243522644, 1.8135907649993896, 1.8766332864761353, 1.9396758079528809, 2.002718210220337, 2.065760850906372, 2.128803253173828, 2.1918458938598633, 2.2548882961273193, 2.3179306983947754, 2.3809733390808105]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 6.0, 4.0, 10.0, 14.0, 12.0, 16.0, 20.0, 19.0, 26.0, 16.0, 18.0, 35.0, 36.0, 35.0, 33.0, 42.0, 47.0, 36.0, 40.0, 51.0, 39.0, 51.0, 50.0, 38.0, 36.0, 25.0, 28.0, 32.0, 26.0, 24.0, 29.0, 22.0, 16.0, 14.0, 8.0, 13.0, 3.0, 6.0, 7.0, 5.0, 6.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.45703125, -5.28802490234375, -5.1190185546875, -4.95001220703125, -4.781005859375, -4.61199951171875, -4.4429931640625, -4.27398681640625, -4.10498046875, -3.93597412109375, -3.7669677734375, -3.59796142578125, -3.428955078125, -3.25994873046875, -3.0909423828125, -2.92193603515625, -2.7529296875, -2.58392333984375, -2.4149169921875, -2.24591064453125, -2.076904296875, -1.90789794921875, -1.7388916015625, -1.56988525390625, -1.40087890625, -1.23187255859375, -1.0628662109375, -0.89385986328125, -0.724853515625, -0.55584716796875, -0.3868408203125, -0.21783447265625, -0.048828125, 0.12017822265625, 0.2891845703125, 0.45819091796875, 0.627197265625, 0.79620361328125, 0.9652099609375, 1.13421630859375, 1.30322265625, 1.47222900390625, 1.6412353515625, 1.81024169921875, 1.979248046875, 2.14825439453125, 2.3172607421875, 2.48626708984375, 2.6552734375, 2.82427978515625, 2.9932861328125, 3.16229248046875, 3.331298828125, 3.50030517578125, 3.6693115234375, 3.83831787109375, 4.00732421875, 4.17633056640625, 4.3453369140625, 4.51434326171875, 4.683349609375, 4.85235595703125, 5.0213623046875, 5.19036865234375, 5.359375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 6.0, 15.0, 9.0, 16.0, 28.0, 38.0, 57.0, 101.0, 136.0, 202.0, 328.0, 508.0, 826.0, 1324.0, 2304.0, 4008.0, 6952.0, 12486.0, 22494.0, 41532.0, 78176.0, 153843.0, 349894.0, 179891.0, 88615.0, 47178.0, 25296.0, 13717.0, 7706.0, 4338.0, 2611.0, 1463.0, 904.0, 548.0, 360.0, 226.0, 139.0, 104.0, 62.0, 41.0, 22.0, 14.0, 12.0, 6.0, 9.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.94140625, -5.75335693359375, -5.5653076171875, -5.37725830078125, -5.189208984375, -5.00115966796875, -4.8131103515625, -4.62506103515625, -4.43701171875, -4.24896240234375, -4.0609130859375, -3.87286376953125, -3.684814453125, -3.49676513671875, -3.3087158203125, -3.12066650390625, -2.9326171875, -2.74456787109375, -2.5565185546875, -2.36846923828125, -2.180419921875, -1.99237060546875, -1.8043212890625, -1.61627197265625, -1.42822265625, -1.24017333984375, -1.0521240234375, -0.86407470703125, -0.676025390625, -0.48797607421875, -0.2999267578125, -0.11187744140625, 0.076171875, 0.26422119140625, 0.4522705078125, 0.64031982421875, 0.828369140625, 1.01641845703125, 1.2044677734375, 1.39251708984375, 1.58056640625, 1.76861572265625, 1.9566650390625, 2.14471435546875, 2.332763671875, 2.52081298828125, 2.7088623046875, 2.89691162109375, 3.0849609375, 3.27301025390625, 3.4610595703125, 3.64910888671875, 3.837158203125, 4.02520751953125, 4.2132568359375, 4.40130615234375, 4.58935546875, 4.77740478515625, 4.9654541015625, 5.15350341796875, 5.341552734375, 5.52960205078125, 5.7176513671875, 5.90570068359375, 6.09375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 6.0, 10.0, 19.0, 23.0, 34.0, 41.0, 52.0, 66.0, 71.0, 128.0, 269.0, 1625.0, 226.0, 116.0, 82.0, 71.0, 53.0, 41.0, 26.0, 19.0, 21.0, 10.0, 11.0, 6.0, 4.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.15625, -31.10107421875, -30.0458984375, -28.99072265625, -27.935546875, -26.88037109375, -25.8251953125, -24.77001953125, -23.71484375, -22.65966796875, -21.6044921875, -20.54931640625, -19.494140625, -18.43896484375, -17.3837890625, -16.32861328125, -15.2734375, -14.21826171875, -13.1630859375, -12.10791015625, -11.052734375, -9.99755859375, -8.9423828125, -7.88720703125, -6.83203125, -5.77685546875, -4.7216796875, -3.66650390625, -2.611328125, -1.55615234375, -0.5009765625, 0.55419921875, 1.609375, 2.66455078125, 3.7197265625, 4.77490234375, 5.830078125, 6.88525390625, 7.9404296875, 8.99560546875, 10.05078125, 11.10595703125, 12.1611328125, 13.21630859375, 14.271484375, 15.32666015625, 16.3818359375, 17.43701171875, 18.4921875, 19.54736328125, 20.6025390625, 21.65771484375, 22.712890625, 23.76806640625, 24.8232421875, 25.87841796875, 26.93359375, 27.98876953125, 29.0439453125, 30.09912109375, 31.154296875, 32.20947265625, 33.2646484375, 34.31982421875, 35.375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 21.0, 49.0, 153.0, 652.0, 31044.0, 3111966.0, 1429.0, 242.0, 81.0, 19.0, 13.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-211.625, -204.837890625, -198.05078125, -191.263671875, -184.4765625, -177.689453125, -170.90234375, -164.115234375, -157.328125, -150.541015625, -143.75390625, -136.966796875, -130.1796875, -123.392578125, -116.60546875, -109.818359375, -103.03125, -96.244140625, -89.45703125, -82.669921875, -75.8828125, -69.095703125, -62.30859375, -55.521484375, -48.734375, -41.947265625, -35.16015625, -28.373046875, -21.5859375, -14.798828125, -8.01171875, -1.224609375, 5.5625, 12.349609375, 19.13671875, 25.923828125, 32.7109375, 39.498046875, 46.28515625, 53.072265625, 59.859375, 66.646484375, 73.43359375, 80.220703125, 87.0078125, 93.794921875, 100.58203125, 107.369140625, 114.15625, 120.943359375, 127.73046875, 134.517578125, 141.3046875, 148.091796875, 154.87890625, 161.666015625, 168.453125, 175.240234375, 182.02734375, 188.814453125, 195.6015625, 202.388671875, 209.17578125, 215.962890625, 222.75]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 735.0, 281.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1327.390625, -1304.853515625, -1282.3165283203125, -1259.7794189453125, -1237.2423095703125, -1214.705322265625, -1192.168212890625, -1169.631103515625, -1147.0941162109375, -1124.5570068359375, -1102.02001953125, -1079.48291015625, -1056.94580078125, -1034.4088134765625, -1011.8717041015625, -989.3346557617188, -966.7975463867188, -944.260498046875, -921.723388671875, -899.1863403320312, -876.6492919921875, -854.1121826171875, -831.5751342773438, -809.0380859375, -786.5009765625, -763.9639282226562, -741.4268188476562, -718.8897705078125, -696.3527221679688, -673.815673828125, -651.278564453125, -628.7415161132812, -606.2044677734375, -583.6674194335938, -561.1303100585938, -538.59326171875, -516.0562133789062, -493.5191345214844, -470.9820556640625, -448.44500732421875, -425.9079284667969, -403.370849609375, -380.83380126953125, -358.2967224121094, -335.7596435546875, -313.22259521484375, -290.6855163574219, -268.1484375, -245.61138916015625, -223.07432556152344, -200.53726196289062, -178.00018310546875, -155.46311950683594, -132.92605590820312, -110.38897705078125, -87.85191345214844, -65.31484985351562, -42.77778244018555, -20.24071502685547, 2.296356201171875, 24.833419799804688, 47.3704833984375, 69.90756225585938, 92.44462585449219, 114.981689453125]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 7.0, 9.0, 3.0, 8.0, 20.0, 16.0, 23.0, 24.0, 30.0, 28.0, 32.0, 48.0, 50.0, 49.0, 55.0, 55.0, 58.0, 61.0, 48.0, 63.0, 50.0, 33.0, 49.0, 31.0, 34.0, 34.0, 25.0, 13.0, 12.0, 12.0, 7.0, 4.0, 4.0, 0.0, 4.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.64471435546875, -74.57112884521484, -72.49754333496094, -70.42395782470703, -68.35037231445312, -66.27678680419922, -64.20320129394531, -62.129615783691406, -60.0560302734375, -57.982444763183594, -55.90885925292969, -53.83527374267578, -51.761688232421875, -49.68810272216797, -47.61451721191406, -45.540931701660156, -43.46734619140625, -41.393760681152344, -39.32017517089844, -37.24658966064453, -35.173004150390625, -33.09941864013672, -31.025833129882812, -28.952247619628906, -26.878662109375, -24.805076599121094, -22.731491088867188, -20.65790557861328, -18.584320068359375, -16.51073455810547, -14.437149047851562, -12.363563537597656, -10.289970397949219, -8.216384887695312, -6.142799377441406, -4.0692138671875, -1.9956283569335938, 0.0779571533203125, 2.1515426635742188, 4.225128173828125, 6.298713684082031, 8.372299194335938, 10.445884704589844, 12.51947021484375, 14.593055725097656, 16.666641235351562, 18.74022674560547, 20.813812255859375, 22.88739776611328, 24.960983276367188, 27.034568786621094, 29.108154296875, 31.181739807128906, 33.25532531738281, 35.32891082763672, 37.402496337890625, 39.47608184814453, 41.54966735839844, 43.623252868652344, 45.69683837890625, 47.770423889160156, 49.84400939941406, 51.91759490966797, 53.991180419921875, 56.06476593017578]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 2.0, 6.0, 11.0, 11.0, 15.0, 11.0, 20.0, 20.0, 12.0, 20.0, 24.0, 34.0, 40.0, 31.0, 37.0, 47.0, 42.0, 43.0, 43.0, 45.0, 43.0, 49.0, 42.0, 40.0, 32.0, 45.0, 31.0, 35.0, 22.0, 31.0, 17.0, 17.0, 16.0, 20.0, 12.0, 6.0, 3.0, 4.0, 4.0, 7.0, 4.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.96875, -5.7786865234375, -5.588623046875, -5.3985595703125, -5.20849609375, -5.0184326171875, -4.828369140625, -4.6383056640625, -4.4482421875, -4.2581787109375, -4.068115234375, -3.8780517578125, -3.68798828125, -3.4979248046875, -3.307861328125, -3.1177978515625, -2.927734375, -2.7376708984375, -2.547607421875, -2.3575439453125, -2.16748046875, -1.9774169921875, -1.787353515625, -1.5972900390625, -1.4072265625, -1.2171630859375, -1.027099609375, -0.8370361328125, -0.64697265625, -0.4569091796875, -0.266845703125, -0.0767822265625, 0.11328125, 0.3033447265625, 0.493408203125, 0.6834716796875, 0.87353515625, 1.0635986328125, 1.253662109375, 1.4437255859375, 1.6337890625, 1.8238525390625, 2.013916015625, 2.2039794921875, 2.39404296875, 2.5841064453125, 2.774169921875, 2.9642333984375, 3.154296875, 3.3443603515625, 3.534423828125, 3.7244873046875, 3.91455078125, 4.1046142578125, 4.294677734375, 4.4847412109375, 4.6748046875, 4.8648681640625, 5.054931640625, 5.2449951171875, 5.43505859375, 5.6251220703125, 5.815185546875, 6.0052490234375, 6.1953125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 6.0, 4.0, 15.0, 15.0, 34.0, 49.0, 87.0, 115.0, 210.0, 337.0, 579.0, 992.0, 1799.0, 3696.0, 8283.0, 22994.0, 88830.0, 515652.0, 2124130.0, 1166545.0, 195075.0, 41048.0, 12962.0, 5287.0, 2512.0, 1292.0, 705.0, 396.0, 237.0, 151.0, 78.0, 73.0, 36.0, 19.0, 17.0, 14.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.65625, -12.2918701171875, -11.927490234375, -11.5631103515625, -11.19873046875, -10.8343505859375, -10.469970703125, -10.1055908203125, -9.7412109375, -9.3768310546875, -9.012451171875, -8.6480712890625, -8.28369140625, -7.9193115234375, -7.554931640625, -7.1905517578125, -6.826171875, -6.4617919921875, -6.097412109375, -5.7330322265625, -5.36865234375, -5.0042724609375, -4.639892578125, -4.2755126953125, -3.9111328125, -3.5467529296875, -3.182373046875, -2.8179931640625, -2.45361328125, -2.0892333984375, -1.724853515625, -1.3604736328125, -0.99609375, -0.6317138671875, -0.267333984375, 0.0970458984375, 0.46142578125, 0.8258056640625, 1.190185546875, 1.5545654296875, 1.9189453125, 2.2833251953125, 2.647705078125, 3.0120849609375, 3.37646484375, 3.7408447265625, 4.105224609375, 4.4696044921875, 4.833984375, 5.1983642578125, 5.562744140625, 5.9271240234375, 6.29150390625, 6.6558837890625, 7.020263671875, 7.3846435546875, 7.7490234375, 8.1134033203125, 8.477783203125, 8.8421630859375, 9.20654296875, 9.5709228515625, 9.935302734375, 10.2996826171875, 10.6640625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 7.0, 10.0, 28.0, 41.0, 69.0, 136.0, 278.0, 535.0, 891.0, 947.0, 534.0, 294.0, 135.0, 69.0, 54.0, 23.0, 11.0, 5.0, 9.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.28125, -33.5194091796875, -32.757568359375, -31.9957275390625, -31.23388671875, -30.4720458984375, -29.710205078125, -28.9483642578125, -28.1865234375, -27.4246826171875, -26.662841796875, -25.9010009765625, -25.13916015625, -24.3773193359375, -23.615478515625, -22.8536376953125, -22.091796875, -21.3299560546875, -20.568115234375, -19.8062744140625, -19.04443359375, -18.2825927734375, -17.520751953125, -16.7589111328125, -15.9970703125, -15.2352294921875, -14.473388671875, -13.7115478515625, -12.94970703125, -12.1878662109375, -11.426025390625, -10.6641845703125, -9.90234375, -9.1405029296875, -8.378662109375, -7.6168212890625, -6.85498046875, -6.0931396484375, -5.331298828125, -4.5694580078125, -3.8076171875, -3.0457763671875, -2.283935546875, -1.5220947265625, -0.76025390625, 0.0015869140625, 0.763427734375, 1.5252685546875, 2.287109375, 3.0489501953125, 3.810791015625, 4.5726318359375, 5.33447265625, 6.0963134765625, 6.858154296875, 7.6199951171875, 8.3818359375, 9.1436767578125, 9.905517578125, 10.6673583984375, 11.42919921875, 12.1910400390625, 12.952880859375, 13.7147216796875, 14.4765625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 10.0, 7.0, 18.0, 40.0, 89.0, 147.0, 275.0, 868.0, 9351.0, 4124746.0, 56848.0, 1172.0, 369.0, 176.0, 75.0, 49.0, 21.0, 12.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.21875, -55.09619140625, -51.9736328125, -48.85107421875, -45.728515625, -42.60595703125, -39.4833984375, -36.36083984375, -33.23828125, -30.11572265625, -26.9931640625, -23.87060546875, -20.748046875, -17.62548828125, -14.5029296875, -11.38037109375, -8.2578125, -5.13525390625, -2.0126953125, 1.10986328125, 4.232421875, 7.35498046875, 10.4775390625, 13.60009765625, 16.72265625, 19.84521484375, 22.9677734375, 26.09033203125, 29.212890625, 32.33544921875, 35.4580078125, 38.58056640625, 41.703125, 44.82568359375, 47.9482421875, 51.07080078125, 54.193359375, 57.31591796875, 60.4384765625, 63.56103515625, 66.68359375, 69.80615234375, 72.9287109375, 76.05126953125, 79.173828125, 82.29638671875, 85.4189453125, 88.54150390625, 91.6640625, 94.78662109375, 97.9091796875, 101.03173828125, 104.154296875, 107.27685546875, 110.3994140625, 113.52197265625, 116.64453125, 119.76708984375, 122.8896484375, 126.01220703125, 129.134765625, 132.25732421875, 135.3798828125, 138.50244140625, 141.625]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 62.0, 354.0, 423.0, 140.0, 24.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-312.4545593261719, -304.0603942871094, -295.6662292480469, -287.27203369140625, -278.87786865234375, -270.48370361328125, -262.08953857421875, -253.6953582763672, -245.30117797851562, -236.90701293945312, -228.51283264160156, -220.11866760253906, -211.7244873046875, -203.330322265625, -194.9361572265625, -186.54197692871094, -178.14781188964844, -169.75364685058594, -161.35946655273438, -152.96530151367188, -144.5711212158203, -136.1769561767578, -127.78278350830078, -119.38861083984375, -110.99443817138672, -102.60026550292969, -94.20609283447266, -85.81192016601562, -77.41775512695312, -69.02357482910156, -60.62940979003906, -52.23523712158203, -43.841064453125, -35.44689178466797, -27.05272102355957, -18.658550262451172, -10.26437759399414, -1.8702049255371094, 6.523963928222656, 14.918136596679688, 23.31230926513672, 31.70648193359375, 40.10065460205078, 48.49482345581055, 56.88899612426758, 65.28317260742188, 73.67733764648438, 82.0715103149414, 90.46568298339844, 98.85985565185547, 107.2540283203125, 115.648193359375, 124.04237365722656, 132.43653869628906, 140.83071899414062, 149.22488403320312, 157.61904907226562, 166.01321411132812, 174.4073944091797, 182.8015594482422, 191.19573974609375, 199.58990478515625, 207.98406982421875, 216.3782501220703, 224.77243041992188]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 5.0, 3.0, 8.0, 6.0, 7.0, 7.0, 10.0, 16.0, 11.0, 15.0, 28.0, 11.0, 24.0, 33.0, 27.0, 29.0, 29.0, 40.0, 36.0, 35.0, 34.0, 44.0, 28.0, 40.0, 32.0, 34.0, 23.0, 27.0, 31.0, 44.0, 35.0, 26.0, 23.0, 26.0, 27.0, 21.0, 7.0, 14.0, 14.0, 15.0, 11.0, 11.0, 10.0, 12.0, 5.0, 3.0, 7.0, 4.0, 2.0, 4.0, 0.0, 4.0, 4.0, 0.0, 3.0], "bins": [-36.92861557006836, -35.834754943847656, -34.74089813232422, -33.647037506103516, -32.55318069458008, -31.459320068359375, -30.365461349487305, -29.271602630615234, -28.17774200439453, -27.08388328552246, -25.99002456665039, -24.896163940429688, -23.802305221557617, -22.708446502685547, -21.614587783813477, -20.520729064941406, -19.426870346069336, -18.333011627197266, -17.239152908325195, -16.145294189453125, -15.051433563232422, -13.957574844360352, -12.863716125488281, -11.769857406616211, -10.675997734069824, -9.582139015197754, -8.488279342651367, -7.394420623779297, -6.300561428070068, -5.20670223236084, -4.1128435134887695, -3.018984317779541, -1.9251251220703125, -0.8312660455703735, 0.26259303092956543, 1.3564519882202148, 2.4503111839294434, 3.544170379638672, 4.638029098510742, 5.731888294219971, 6.825747489929199, 7.919606685638428, 9.013465881347656, 10.107324600219727, 11.201183319091797, 12.295042991638184, 13.388901710510254, 14.48276138305664, 15.576620101928711, 16.67047882080078, 17.76433753967285, 18.858196258544922, 19.952056884765625, 21.045915603637695, 22.139774322509766, 23.233633041381836, 24.327491760253906, 25.421350479125977, 26.515209197998047, 27.60906982421875, 28.70292854309082, 29.79678726196289, 30.89064598083496, 31.98450469970703, 33.078365325927734]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 6.0, 3.0, 10.0, 14.0, 11.0, 10.0, 20.0, 26.0, 27.0, 20.0, 33.0, 26.0, 38.0, 40.0, 36.0, 42.0, 36.0, 41.0, 37.0, 53.0, 48.0, 40.0, 28.0, 38.0, 43.0, 33.0, 33.0, 31.0, 27.0, 23.0, 22.0, 15.0, 14.0, 18.0, 19.0, 9.0, 7.0, 3.0, 2.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.859375, -5.67730712890625, -5.4952392578125, -5.31317138671875, -5.131103515625, -4.94903564453125, -4.7669677734375, -4.58489990234375, -4.40283203125, -4.22076416015625, -4.0386962890625, -3.85662841796875, -3.674560546875, -3.49249267578125, -3.3104248046875, -3.12835693359375, -2.9462890625, -2.76422119140625, -2.5821533203125, -2.40008544921875, -2.218017578125, -2.03594970703125, -1.8538818359375, -1.67181396484375, -1.48974609375, -1.30767822265625, -1.1256103515625, -0.94354248046875, -0.761474609375, -0.57940673828125, -0.3973388671875, -0.21527099609375, -0.033203125, 0.14886474609375, 0.3309326171875, 0.51300048828125, 0.695068359375, 0.87713623046875, 1.0592041015625, 1.24127197265625, 1.42333984375, 1.60540771484375, 1.7874755859375, 1.96954345703125, 2.151611328125, 2.33367919921875, 2.5157470703125, 2.69781494140625, 2.8798828125, 3.06195068359375, 3.2440185546875, 3.42608642578125, 3.608154296875, 3.79022216796875, 3.9722900390625, 4.15435791015625, 4.33642578125, 4.51849365234375, 4.7005615234375, 4.88262939453125, 5.064697265625, 5.24676513671875, 5.4288330078125, 5.61090087890625, 5.79296875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 6.0, 7.0, 8.0, 20.0, 26.0, 33.0, 38.0, 70.0, 116.0, 165.0, 285.0, 412.0, 696.0, 1217.0, 2066.0, 3704.0, 6483.0, 11967.0, 22340.0, 40466.0, 72934.0, 123180.0, 187211.0, 206959.0, 154450.0, 94102.0, 53824.0, 29512.0, 16018.0, 8814.0, 4773.0, 2684.0, 1546.0, 889.0, 551.0, 314.0, 225.0, 137.0, 97.0, 66.0, 37.0, 34.0, 22.0, 17.0, 12.0, 6.0, 8.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-3.115234375, -3.026824951171875, -2.93841552734375, -2.850006103515625, -2.7615966796875, -2.673187255859375, -2.58477783203125, -2.496368408203125, -2.407958984375, -2.319549560546875, -2.23114013671875, -2.142730712890625, -2.0543212890625, -1.965911865234375, -1.87750244140625, -1.789093017578125, -1.70068359375, -1.612274169921875, -1.52386474609375, -1.435455322265625, -1.3470458984375, -1.258636474609375, -1.17022705078125, -1.081817626953125, -0.993408203125, -0.904998779296875, -0.81658935546875, -0.728179931640625, -0.6397705078125, -0.551361083984375, -0.46295166015625, -0.374542236328125, -0.2861328125, -0.197723388671875, -0.10931396484375, -0.020904541015625, 0.0675048828125, 0.155914306640625, 0.24432373046875, 0.332733154296875, 0.421142578125, 0.509552001953125, 0.59796142578125, 0.686370849609375, 0.7747802734375, 0.863189697265625, 0.95159912109375, 1.040008544921875, 1.12841796875, 1.216827392578125, 1.30523681640625, 1.393646240234375, 1.4820556640625, 1.570465087890625, 1.65887451171875, 1.747283935546875, 1.835693359375, 1.924102783203125, 2.01251220703125, 2.100921630859375, 2.1893310546875, 2.277740478515625, 2.36614990234375, 2.454559326171875, 2.54296875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 3.0, 4.0, 3.0, 8.0, 7.0, 7.0, 6.0, 9.0, 10.0, 13.0, 12.0, 17.0, 21.0, 23.0, 25.0, 14.0, 30.0, 36.0, 40.0, 40.0, 31.0, 49.0, 32.0, 28.0, 38.0, 1060.0, 33.0, 35.0, 46.0, 49.0, 31.0, 25.0, 33.0, 34.0, 15.0, 18.0, 12.0, 27.0, 13.0, 14.0, 10.0, 16.0, 12.0, 5.0, 5.0, 9.0, 5.0, 6.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.3828125, -4.24151611328125, -4.1002197265625, -3.95892333984375, -3.817626953125, -3.67633056640625, -3.5350341796875, -3.39373779296875, -3.25244140625, -3.11114501953125, -2.9698486328125, -2.82855224609375, -2.687255859375, -2.54595947265625, -2.4046630859375, -2.26336669921875, -2.1220703125, -1.98077392578125, -1.8394775390625, -1.69818115234375, -1.556884765625, -1.41558837890625, -1.2742919921875, -1.13299560546875, -0.99169921875, -0.85040283203125, -0.7091064453125, -0.56781005859375, -0.426513671875, -0.28521728515625, -0.1439208984375, -0.00262451171875, 0.138671875, 0.27996826171875, 0.4212646484375, 0.56256103515625, 0.703857421875, 0.84515380859375, 0.9864501953125, 1.12774658203125, 1.26904296875, 1.41033935546875, 1.5516357421875, 1.69293212890625, 1.834228515625, 1.97552490234375, 2.1168212890625, 2.25811767578125, 2.3994140625, 2.54071044921875, 2.6820068359375, 2.82330322265625, 2.964599609375, 3.10589599609375, 3.2471923828125, 3.38848876953125, 3.52978515625, 3.67108154296875, 3.8123779296875, 3.95367431640625, 4.094970703125, 4.23626708984375, 4.3775634765625, 4.51885986328125, 4.66015625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 8.0, 16.0, 17.0, 28.0, 50.0, 56.0, 87.0, 122.0, 164.0, 225.0, 357.0, 567.0, 856.0, 1321.0, 2105.0, 3292.0, 5334.0, 8737.0, 15516.0, 30245.0, 149775.0, 1740520.0, 78606.0, 24851.0, 13329.0, 7834.0, 4673.0, 2877.0, 1889.0, 1210.0, 825.0, 526.0, 332.0, 229.0, 175.0, 99.0, 76.0, 64.0, 39.0, 20.0, 15.0, 18.0, 13.0, 7.0, 4.0, 7.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-4.6640625, -4.5242919921875, -4.384521484375, -4.2447509765625, -4.10498046875, -3.9652099609375, -3.825439453125, -3.6856689453125, -3.5458984375, -3.4061279296875, -3.266357421875, -3.1265869140625, -2.98681640625, -2.8470458984375, -2.707275390625, -2.5675048828125, -2.427734375, -2.2879638671875, -2.148193359375, -2.0084228515625, -1.86865234375, -1.7288818359375, -1.589111328125, -1.4493408203125, -1.3095703125, -1.1697998046875, -1.030029296875, -0.8902587890625, -0.75048828125, -0.6107177734375, -0.470947265625, -0.3311767578125, -0.19140625, -0.0516357421875, 0.088134765625, 0.2279052734375, 0.36767578125, 0.5074462890625, 0.647216796875, 0.7869873046875, 0.9267578125, 1.0665283203125, 1.206298828125, 1.3460693359375, 1.48583984375, 1.6256103515625, 1.765380859375, 1.9051513671875, 2.044921875, 2.1846923828125, 2.324462890625, 2.4642333984375, 2.60400390625, 2.7437744140625, 2.883544921875, 3.0233154296875, 3.1630859375, 3.3028564453125, 3.442626953125, 3.5823974609375, 3.72216796875, 3.8619384765625, 4.001708984375, 4.1414794921875, 4.28125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 8.0, 12.0, 20.0, 20.0, 20.0, 22.0, 35.0, 32.0, 52.0, 53.0, 50.0, 70.0, 84.0, 99.0, 103.0, 60.0, 44.0, 39.0, 36.0, 31.0, 24.0, 19.0, 20.0, 13.0, 5.0, 5.0, 6.0, 10.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.304443359375, -0.2946662902832031, -0.28488922119140625, -0.2751121520996094, -0.2653350830078125, -0.2555580139160156, -0.24578094482421875, -0.23600387573242188, -0.226226806640625, -0.21644973754882812, -0.20667266845703125, -0.19689559936523438, -0.1871185302734375, -0.17734146118164062, -0.16756439208984375, -0.15778732299804688, -0.14801025390625, -0.13823318481445312, -0.12845611572265625, -0.11867904663085938, -0.1089019775390625, -0.09912490844726562, -0.08934783935546875, -0.07957077026367188, -0.069793701171875, -0.060016632080078125, -0.05023956298828125, -0.040462493896484375, -0.0306854248046875, -0.020908355712890625, -0.01113128662109375, -0.001354217529296875, 0.0084228515625, 0.018199920654296875, 0.02797698974609375, 0.037754058837890625, 0.0475311279296875, 0.057308197021484375, 0.06708526611328125, 0.07686233520507812, 0.086639404296875, 0.09641647338867188, 0.10619354248046875, 0.11597061157226562, 0.1257476806640625, 0.13552474975585938, 0.14530181884765625, 0.15507888793945312, 0.16485595703125, 0.17463302612304688, 0.18441009521484375, 0.19418716430664062, 0.2039642333984375, 0.21374130249023438, 0.22351837158203125, 0.23329544067382812, 0.243072509765625, 0.2528495788574219, 0.26262664794921875, 0.2724037170410156, 0.2821807861328125, 0.2919578552246094, 0.30173492431640625, 0.3115119934082031, 0.3212890625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 13.0, 2.0, 10.0, 20.0, 14.0, 24.0, 37.0, 46.0, 71.0, 118.0, 265.0, 951.0, 36052.0, 1006252.0, 3577.0, 562.0, 182.0, 113.0, 67.0, 39.0, 32.0, 21.0, 19.0, 20.0, 14.0, 13.0, 8.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5703125, -6.3729248046875, -6.175537109375, -5.9781494140625, -5.78076171875, -5.5833740234375, -5.385986328125, -5.1885986328125, -4.9912109375, -4.7938232421875, -4.596435546875, -4.3990478515625, -4.20166015625, -4.0042724609375, -3.806884765625, -3.6094970703125, -3.412109375, -3.2147216796875, -3.017333984375, -2.8199462890625, -2.62255859375, -2.4251708984375, -2.227783203125, -2.0303955078125, -1.8330078125, -1.6356201171875, -1.438232421875, -1.2408447265625, -1.04345703125, -0.8460693359375, -0.648681640625, -0.4512939453125, -0.25390625, -0.0565185546875, 0.140869140625, 0.3382568359375, 0.53564453125, 0.7330322265625, 0.930419921875, 1.1278076171875, 1.3251953125, 1.5225830078125, 1.719970703125, 1.9173583984375, 2.11474609375, 2.3121337890625, 2.509521484375, 2.7069091796875, 2.904296875, 3.1016845703125, 3.299072265625, 3.4964599609375, 3.69384765625, 3.8912353515625, 4.088623046875, 4.2860107421875, 4.4833984375, 4.6807861328125, 4.878173828125, 5.0755615234375, 5.27294921875, 5.4703369140625, 5.667724609375, 5.8651123046875, 6.0625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 18.0, 51.0, 193.0, 470.0, 200.0, 53.0, 18.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0992207527160645, -2.002164363861084, -1.905108094215393, -1.8080518245697021, -1.7109954357147217, -1.6139390468597412, -1.5168827772140503, -1.4198265075683594, -1.322770118713379, -1.2257137298583984, -1.1286574602127075, -1.0316011905670166, -0.9345448017120361, -0.8374884724617004, -0.7404321432113647, -0.643375813961029, -0.5463194847106934, -0.44926315546035767, -0.352206826210022, -0.2551504969596863, -0.15809416770935059, -0.06103783845901489, 0.0360184907913208, 0.1330748200416565, 0.2301311492919922, 0.3271874785423279, 0.4242438077926636, 0.5213001370429993, 0.618356466293335, 0.7154127955436707, 0.8124691247940063, 0.909525454044342, 1.0065817832946777, 1.1036381721496582, 1.2006944417953491, 1.29775071144104, 1.3948071002960205, 1.491863489151001, 1.588919758796692, 1.6859760284423828, 1.7830324172973633, 1.8800888061523438, 1.9771450757980347, 2.0742013454437256, 2.171257734298706, 2.2683141231536865, 2.365370273590088, 2.4624266624450684, 2.559483051300049, 2.6565394401550293, 2.7535958290100098, 2.850651979446411, 2.9477083683013916, 3.044764757156372, 3.1418209075927734, 3.238877296447754, 3.3359336853027344, 3.432990074157715, 3.5300464630126953, 3.6271026134490967, 3.724159002304077, 3.8212153911590576, 3.918271541595459, 4.0153279304504395, 4.11238431930542]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 8.0, 6.0, 10.0, 11.0, 17.0, 20.0, 25.0, 32.0, 42.0, 42.0, 46.0, 48.0, 51.0, 67.0, 56.0, 66.0, 52.0, 60.0, 67.0, 51.0, 44.0, 31.0, 44.0, 29.0, 26.0, 16.0, 11.0, 11.0, 8.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1282494068145752, -1.1000169515609741, -1.0717846155166626, -1.0435521602630615, -1.01531982421875, -0.9870874285697937, -0.9588550329208374, -0.9306225776672363, -0.9023902416229248, -0.8741578459739685, -0.8459254503250122, -0.8176930546760559, -0.7894606590270996, -0.7612282633781433, -0.732995867729187, -0.7047634124755859, -0.6765310168266296, -0.6482986211776733, -0.620066225528717, -0.5918338298797607, -0.5636014342308044, -0.5353690385818481, -0.5071365833282471, -0.47890421748161316, -0.45067182183265686, -0.42243942618370056, -0.39420703053474426, -0.3659746050834656, -0.3377422094345093, -0.309509813785553, -0.2812774181365967, -0.2530450224876404, -0.22481262683868408, -0.19658023118972778, -0.16834783554077148, -0.140115424990654, -0.11188302934169769, -0.0836506336927414, -0.0554182231426239, -0.027185827493667603, 0.0010465681552886963, 0.029278967529535294, 0.05751136690378189, 0.08574377000331879, 0.11397616565227509, 0.14220856130123138, 0.17044097185134888, 0.19867336750030518, 0.22690576314926147, 0.2551381587982178, 0.2833705544471741, 0.31160295009613037, 0.33983534574508667, 0.36806774139404297, 0.39630016684532166, 0.42453256249427795, 0.45276495814323425, 0.48099735379219055, 0.5092297792434692, 0.5374621748924255, 0.5656945705413818, 0.5939269661903381, 0.6221593618392944, 0.6503917574882507, 0.678624153137207]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 11.0, 7.0, 7.0, 14.0, 21.0, 29.0, 21.0, 28.0, 25.0, 37.0, 34.0, 38.0, 41.0, 47.0, 49.0, 58.0, 35.0, 59.0, 34.0, 41.0, 51.0, 42.0, 53.0, 37.0, 29.0, 26.0, 21.0, 17.0, 21.0, 16.0, 12.0, 10.0, 9.0, 4.0, 6.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3984375, -5.19683837890625, -4.9952392578125, -4.79364013671875, -4.592041015625, -4.39044189453125, -4.1888427734375, -3.98724365234375, -3.78564453125, -3.58404541015625, -3.3824462890625, -3.18084716796875, -2.979248046875, -2.77764892578125, -2.5760498046875, -2.37445068359375, -2.1728515625, -1.97125244140625, -1.7696533203125, -1.56805419921875, -1.366455078125, -1.16485595703125, -0.9632568359375, -0.76165771484375, -0.56005859375, -0.35845947265625, -0.1568603515625, 0.04473876953125, 0.246337890625, 0.44793701171875, 0.6495361328125, 0.85113525390625, 1.052734375, 1.25433349609375, 1.4559326171875, 1.65753173828125, 1.859130859375, 2.06072998046875, 2.2623291015625, 2.46392822265625, 2.66552734375, 2.86712646484375, 3.0687255859375, 3.27032470703125, 3.471923828125, 3.67352294921875, 3.8751220703125, 4.07672119140625, 4.2783203125, 4.47991943359375, 4.6815185546875, 4.88311767578125, 5.084716796875, 5.28631591796875, 5.4879150390625, 5.68951416015625, 5.89111328125, 6.09271240234375, 6.2943115234375, 6.49591064453125, 6.697509765625, 6.89910888671875, 7.1007080078125, 7.30230712890625, 7.50390625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 9.0, 8.0, 7.0, 12.0, 21.0, 30.0, 38.0, 72.0, 116.0, 234.0, 391.0, 664.0, 1304.0, 2490.0, 4869.0, 9568.0, 19488.0, 40868.0, 86637.0, 182318.0, 336625.0, 189651.0, 89611.0, 42679.0, 20356.0, 9804.0, 5064.0, 2574.0, 1354.0, 724.0, 374.0, 236.0, 125.0, 83.0, 43.0, 23.0, 21.0, 21.0, 14.0, 7.0, 11.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.5234375, -6.328857421875, -6.13427734375, -5.939697265625, -5.7451171875, -5.550537109375, -5.35595703125, -5.161376953125, -4.966796875, -4.772216796875, -4.57763671875, -4.383056640625, -4.1884765625, -3.993896484375, -3.79931640625, -3.604736328125, -3.41015625, -3.215576171875, -3.02099609375, -2.826416015625, -2.6318359375, -2.437255859375, -2.24267578125, -2.048095703125, -1.853515625, -1.658935546875, -1.46435546875, -1.269775390625, -1.0751953125, -0.880615234375, -0.68603515625, -0.491455078125, -0.296875, -0.102294921875, 0.09228515625, 0.286865234375, 0.4814453125, 0.676025390625, 0.87060546875, 1.065185546875, 1.259765625, 1.454345703125, 1.64892578125, 1.843505859375, 2.0380859375, 2.232666015625, 2.42724609375, 2.621826171875, 2.81640625, 3.010986328125, 3.20556640625, 3.400146484375, 3.5947265625, 3.789306640625, 3.98388671875, 4.178466796875, 4.373046875, 4.567626953125, 4.76220703125, 4.956787109375, 5.1513671875, 5.345947265625, 5.54052734375, 5.735107421875, 5.9296875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 7.0, 6.0, 8.0, 5.0, 6.0, 16.0, 22.0, 16.0, 13.0, 28.0, 32.0, 26.0, 37.0, 37.0, 54.0, 66.0, 78.0, 124.0, 231.0, 1375.0, 256.0, 127.0, 71.0, 51.0, 57.0, 51.0, 28.0, 32.0, 33.0, 25.0, 17.0, 19.0, 15.0, 13.0, 12.0, 14.0, 5.0, 12.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.4375, -18.820556640625, -18.20361328125, -17.586669921875, -16.9697265625, -16.352783203125, -15.73583984375, -15.118896484375, -14.501953125, -13.885009765625, -13.26806640625, -12.651123046875, -12.0341796875, -11.417236328125, -10.80029296875, -10.183349609375, -9.56640625, -8.949462890625, -8.33251953125, -7.715576171875, -7.0986328125, -6.481689453125, -5.86474609375, -5.247802734375, -4.630859375, -4.013916015625, -3.39697265625, -2.780029296875, -2.1630859375, -1.546142578125, -0.92919921875, -0.312255859375, 0.3046875, 0.921630859375, 1.53857421875, 2.155517578125, 2.7724609375, 3.389404296875, 4.00634765625, 4.623291015625, 5.240234375, 5.857177734375, 6.47412109375, 7.091064453125, 7.7080078125, 8.324951171875, 8.94189453125, 9.558837890625, 10.17578125, 10.792724609375, 11.40966796875, 12.026611328125, 12.6435546875, 13.260498046875, 13.87744140625, 14.494384765625, 15.111328125, 15.728271484375, 16.34521484375, 16.962158203125, 17.5791015625, 18.196044921875, 18.81298828125, 19.429931640625, 20.046875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 9.0, 10.0, 10.0, 15.0, 25.0, 31.0, 45.0, 73.0, 106.0, 174.0, 300.0, 586.0, 2582.0, 545355.0, 2590126.0, 4627.0, 753.0, 341.0, 176.0, 128.0, 78.0, 46.0, 34.0, 25.0, 16.0, 15.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.9375, -55.947265625, -53.95703125, -51.966796875, -49.9765625, -47.986328125, -45.99609375, -44.005859375, -42.015625, -40.025390625, -38.03515625, -36.044921875, -34.0546875, -32.064453125, -30.07421875, -28.083984375, -26.09375, -24.103515625, -22.11328125, -20.123046875, -18.1328125, -16.142578125, -14.15234375, -12.162109375, -10.171875, -8.181640625, -6.19140625, -4.201171875, -2.2109375, -0.220703125, 1.76953125, 3.759765625, 5.75, 7.740234375, 9.73046875, 11.720703125, 13.7109375, 15.701171875, 17.69140625, 19.681640625, 21.671875, 23.662109375, 25.65234375, 27.642578125, 29.6328125, 31.623046875, 33.61328125, 35.603515625, 37.59375, 39.583984375, 41.57421875, 43.564453125, 45.5546875, 47.544921875, 49.53515625, 51.525390625, 53.515625, 55.505859375, 57.49609375, 59.486328125, 61.4765625, 63.466796875, 65.45703125, 67.447265625, 69.4375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 828.0, 190.0], "bins": [-1736.7906494140625, -1709.169921875, -1681.5491943359375, -1653.928466796875, -1626.3077392578125, -1598.68701171875, -1571.066162109375, -1543.445556640625, -1515.82470703125, -1488.2039794921875, -1460.583251953125, -1432.9625244140625, -1405.341796875, -1377.7210693359375, -1350.100341796875, -1322.4794921875, -1294.85888671875, -1267.2381591796875, -1239.617431640625, -1211.9967041015625, -1184.3759765625, -1156.7552490234375, -1129.134521484375, -1101.513671875, -1073.8929443359375, -1046.272216796875, -1018.6514892578125, -991.03076171875, -963.4099731445312, -935.7892456054688, -908.1685180664062, -880.5477905273438, -852.927001953125, -825.3062744140625, -797.685546875, -770.0648193359375, -742.4440307617188, -714.8233032226562, -687.2025756835938, -659.5818481445312, -631.9611206054688, -604.3403930664062, -576.7196655273438, -549.098876953125, -521.4781494140625, -493.857421875, -466.2366943359375, -438.615966796875, -410.9952392578125, -383.37451171875, -355.7537536621094, -328.1330261230469, -300.5122985839844, -272.89154052734375, -245.27081298828125, -217.65008544921875, -190.02932739257812, -162.40858459472656, -134.78785705566406, -107.1671142578125, -79.54637908935547, -51.92564392089844, -24.304901123046875, 3.315826416015625, 30.936569213867188]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 11.0, 9.0, 12.0, 16.0, 20.0, 20.0, 17.0, 21.0, 26.0, 31.0, 41.0, 44.0, 50.0, 35.0, 47.0, 43.0, 50.0, 49.0, 43.0, 48.0, 56.0, 51.0, 38.0, 35.0, 26.0, 25.0, 30.0, 22.0, 18.0, 17.0, 8.0, 15.0, 3.0, 4.0, 2.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.147281646728516, -55.297386169433594, -53.447486877441406, -51.597591400146484, -49.74769592285156, -47.89780044555664, -46.04790496826172, -44.19800567626953, -42.34811019897461, -40.49821472167969, -38.6483154296875, -36.79841995239258, -34.948524475097656, -33.098628997802734, -31.24873161315918, -29.398834228515625, -27.548938751220703, -25.69904327392578, -23.849145889282227, -21.999248504638672, -20.14935302734375, -18.299457550048828, -16.449560165405273, -14.599663734436035, -12.749767303466797, -10.899870872497559, -9.04997444152832, -7.200078010559082, -5.350181579589844, -3.5002851486206055, -1.6503887176513672, 0.1995077133178711, 2.0494041442871094, 3.8993005752563477, 5.749197006225586, 7.599093437194824, 9.448989868164062, 11.2988862991333, 13.148782730102539, 14.998679161071777, 16.848575592041016, 18.698471069335938, 20.548368453979492, 22.398265838623047, 24.24816131591797, 26.09805679321289, 27.947954177856445, 29.7978515625, 31.647747039794922, 33.497642517089844, 35.34754180908203, 37.19743728637695, 39.047332763671875, 40.8972282409668, 42.74712371826172, 44.597023010253906, 46.44691848754883, 48.29681396484375, 50.14671325683594, 51.99660873413086, 53.84650421142578, 55.6963996887207, 57.546295166015625, 59.39619445800781, 61.246089935302734]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 3.0, 5.0, 10.0, 5.0, 7.0, 8.0, 7.0, 13.0, 13.0, 18.0, 16.0, 20.0, 27.0, 25.0, 24.0, 24.0, 33.0, 34.0, 25.0, 36.0, 33.0, 37.0, 44.0, 25.0, 24.0, 45.0, 40.0, 34.0, 36.0, 37.0, 30.0, 28.0, 32.0, 29.0, 25.0, 19.0, 22.0, 17.0, 19.0, 14.0, 11.0, 11.0, 11.0, 5.0, 3.0, 3.0, 7.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.25390625, -5.0843505859375, -4.914794921875, -4.7452392578125, -4.57568359375, -4.4061279296875, -4.236572265625, -4.0670166015625, -3.8974609375, -3.7279052734375, -3.558349609375, -3.3887939453125, -3.21923828125, -3.0496826171875, -2.880126953125, -2.7105712890625, -2.541015625, -2.3714599609375, -2.201904296875, -2.0323486328125, -1.86279296875, -1.6932373046875, -1.523681640625, -1.3541259765625, -1.1845703125, -1.0150146484375, -0.845458984375, -0.6759033203125, -0.50634765625, -0.3367919921875, -0.167236328125, 0.0023193359375, 0.171875, 0.3414306640625, 0.510986328125, 0.6805419921875, 0.85009765625, 1.0196533203125, 1.189208984375, 1.3587646484375, 1.5283203125, 1.6978759765625, 1.867431640625, 2.0369873046875, 2.20654296875, 2.3760986328125, 2.545654296875, 2.7152099609375, 2.884765625, 3.0543212890625, 3.223876953125, 3.3934326171875, 3.56298828125, 3.7325439453125, 3.902099609375, 4.0716552734375, 4.2412109375, 4.4107666015625, 4.580322265625, 4.7498779296875, 4.91943359375, 5.0889892578125, 5.258544921875, 5.4281005859375, 5.59765625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 7.0, 7.0, 7.0, 16.0, 22.0, 18.0, 43.0, 73.0, 88.0, 124.0, 178.0, 313.0, 431.0, 699.0, 1147.0, 1967.0, 3412.0, 6764.0, 14614.0, 39705.0, 144484.0, 664807.0, 1899957.0, 1073460.0, 241274.0, 60281.0, 20594.0, 8855.0, 4545.0, 2604.0, 1395.0, 846.0, 546.0, 324.0, 219.0, 128.0, 104.0, 69.0, 53.0, 35.0, 29.0, 18.0, 11.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0], "bins": [-11.3125, -11.0040283203125, -10.695556640625, -10.3870849609375, -10.07861328125, -9.7701416015625, -9.461669921875, -9.1531982421875, -8.8447265625, -8.5362548828125, -8.227783203125, -7.9193115234375, -7.61083984375, -7.3023681640625, -6.993896484375, -6.6854248046875, -6.376953125, -6.0684814453125, -5.760009765625, -5.4515380859375, -5.14306640625, -4.8345947265625, -4.526123046875, -4.2176513671875, -3.9091796875, -3.6007080078125, -3.292236328125, -2.9837646484375, -2.67529296875, -2.3668212890625, -2.058349609375, -1.7498779296875, -1.44140625, -1.1329345703125, -0.824462890625, -0.5159912109375, -0.20751953125, 0.1009521484375, 0.409423828125, 0.7178955078125, 1.0263671875, 1.3348388671875, 1.643310546875, 1.9517822265625, 2.26025390625, 2.5687255859375, 2.877197265625, 3.1856689453125, 3.494140625, 3.8026123046875, 4.111083984375, 4.4195556640625, 4.72802734375, 5.0364990234375, 5.344970703125, 5.6534423828125, 5.9619140625, 6.2703857421875, 6.578857421875, 6.8873291015625, 7.19580078125, 7.5042724609375, 7.812744140625, 8.1212158203125, 8.4296875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 8.0, 5.0, 5.0, 6.0, 12.0, 14.0, 23.0, 33.0, 45.0, 75.0, 89.0, 118.0, 162.0, 264.0, 400.0, 514.0, 618.0, 508.0, 379.0, 257.0, 167.0, 123.0, 71.0, 54.0, 45.0, 26.0, 17.0, 13.0, 4.0, 5.0, 7.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1875, -14.7586669921875, -14.329833984375, -13.9010009765625, -13.47216796875, -13.0433349609375, -12.614501953125, -12.1856689453125, -11.7568359375, -11.3280029296875, -10.899169921875, -10.4703369140625, -10.04150390625, -9.6126708984375, -9.183837890625, -8.7550048828125, -8.326171875, -7.8973388671875, -7.468505859375, -7.0396728515625, -6.61083984375, -6.1820068359375, -5.753173828125, -5.3243408203125, -4.8955078125, -4.4666748046875, -4.037841796875, -3.6090087890625, -3.18017578125, -2.7513427734375, -2.322509765625, -1.8936767578125, -1.46484375, -1.0360107421875, -0.607177734375, -0.1783447265625, 0.25048828125, 0.6793212890625, 1.108154296875, 1.5369873046875, 1.9658203125, 2.3946533203125, 2.823486328125, 3.2523193359375, 3.68115234375, 4.1099853515625, 4.538818359375, 4.9676513671875, 5.396484375, 5.8253173828125, 6.254150390625, 6.6829833984375, 7.11181640625, 7.5406494140625, 7.969482421875, 8.3983154296875, 8.8271484375, 9.2559814453125, 9.684814453125, 10.1136474609375, 10.54248046875, 10.9713134765625, 11.400146484375, 11.8289794921875, 12.2578125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 8.0, 4.0, 16.0, 10.0, 22.0, 42.0, 47.0, 66.0, 116.0, 184.0, 372.0, 830.0, 4671.0, 167986.0, 3943323.0, 72248.0, 2967.0, 601.0, 259.0, 148.0, 103.0, 83.0, 49.0, 34.0, 26.0, 16.0, 13.0, 9.0, 2.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.125, -48.4208984375, -46.716796875, -45.0126953125, -43.30859375, -41.6044921875, -39.900390625, -38.1962890625, -36.4921875, -34.7880859375, -33.083984375, -31.3798828125, -29.67578125, -27.9716796875, -26.267578125, -24.5634765625, -22.859375, -21.1552734375, -19.451171875, -17.7470703125, -16.04296875, -14.3388671875, -12.634765625, -10.9306640625, -9.2265625, -7.5224609375, -5.818359375, -4.1142578125, -2.41015625, -0.7060546875, 0.998046875, 2.7021484375, 4.40625, 6.1103515625, 7.814453125, 9.5185546875, 11.22265625, 12.9267578125, 14.630859375, 16.3349609375, 18.0390625, 19.7431640625, 21.447265625, 23.1513671875, 24.85546875, 26.5595703125, 28.263671875, 29.9677734375, 31.671875, 33.3759765625, 35.080078125, 36.7841796875, 38.48828125, 40.1923828125, 41.896484375, 43.6005859375, 45.3046875, 47.0087890625, 48.712890625, 50.4169921875, 52.12109375, 53.8251953125, 55.529296875, 57.2333984375, 58.9375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 16.0, 202.0, 593.0, 186.0, 16.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-368.457763671875, -358.08978271484375, -347.7218322753906, -337.3538513183594, -326.9858703613281, -316.617919921875, -306.24993896484375, -295.8819580078125, -285.5140075683594, -275.1460266113281, -264.778076171875, -254.41009521484375, -244.04212951660156, -233.67416381835938, -223.30618286132812, -212.93821716308594, -202.5702362060547, -192.2022705078125, -181.83428955078125, -171.46632385253906, -161.09835815429688, -150.73037719726562, -140.36241149902344, -129.99444580078125, -119.62647247314453, -109.25849914550781, -98.89053344726562, -88.5225601196289, -78.15458679199219, -67.78662109375, -57.41864776611328, -47.050682067871094, -36.682708740234375, -26.314739227294922, -15.946767807006836, -5.57879638671875, 4.789173126220703, 15.157142639160156, 25.525115966796875, 35.89308166503906, 46.26105499267578, 56.629024505615234, 66.99699401855469, 77.3649673461914, 87.73294067382812, 98.10090637207031, 108.46887969970703, 118.83684539794922, 129.20481872558594, 139.57278442382812, 149.94076538085938, 160.30873107910156, 170.67669677734375, 181.044677734375, 191.4126434326172, 201.78060913085938, 212.14859008789062, 222.5165557861328, 232.88453674316406, 243.25250244140625, 253.62046813964844, 263.9884338378906, 274.3564147949219, 284.724365234375, 295.09234619140625]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 2.0, 3.0, 1.0, 6.0, 9.0, 6.0, 13.0, 11.0, 12.0, 19.0, 11.0, 19.0, 23.0, 22.0, 26.0, 28.0, 33.0, 39.0, 33.0, 34.0, 43.0, 43.0, 54.0, 47.0, 44.0, 38.0, 43.0, 42.0, 38.0, 19.0, 34.0, 23.0, 20.0, 22.0, 19.0, 24.0, 21.0, 15.0, 11.0, 14.0, 10.0, 8.0, 4.0, 5.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-37.39897155761719, -36.17768096923828, -34.95639419555664, -33.735103607177734, -32.513816833496094, -31.292526245117188, -30.071237564086914, -28.84994888305664, -27.628660202026367, -26.407371520996094, -25.18608283996582, -23.964794158935547, -22.74350357055664, -21.522216796875, -20.300926208496094, -19.07963752746582, -17.858348846435547, -16.637060165405273, -15.415771484375, -14.19448184967041, -12.973193168640137, -11.751904487609863, -10.530614852905273, -9.309326171875, -8.088037490844727, -6.866748809814453, -5.6454596519470215, -4.42417049407959, -3.2028818130493164, -1.981593132019043, -0.7603039741516113, 0.4609851837158203, 1.6822738647460938, 2.9035627841949463, 4.124851703643799, 5.3461408615112305, 6.567429542541504, 7.788718223571777, 9.010007858276367, 10.23129653930664, 11.452585220336914, 12.673873901367188, 13.895162582397461, 15.11645221710205, 16.33774185180664, 17.55902862548828, 18.780319213867188, 20.00160789489746, 21.222896575927734, 22.444185256958008, 23.66547393798828, 24.886762619018555, 26.108051300048828, 27.329341888427734, 28.550630569458008, 29.77191925048828, 30.993207931518555, 32.21449661254883, 33.435787200927734, 34.657073974609375, 35.87836456298828, 37.09965133666992, 38.32094192504883, 39.54222869873047, 40.763519287109375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 11.0, 6.0, 9.0, 19.0, 17.0, 18.0, 24.0, 20.0, 26.0, 19.0, 36.0, 39.0, 42.0, 47.0, 44.0, 51.0, 40.0, 51.0, 41.0, 37.0, 43.0, 50.0, 34.0, 32.0, 40.0, 28.0, 27.0, 19.0, 18.0, 21.0, 21.0, 16.0, 9.0, 13.0, 7.0, 8.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.859375, -5.66741943359375, -5.4754638671875, -5.28350830078125, -5.091552734375, -4.89959716796875, -4.7076416015625, -4.51568603515625, -4.32373046875, -4.13177490234375, -3.9398193359375, -3.74786376953125, -3.555908203125, -3.36395263671875, -3.1719970703125, -2.98004150390625, -2.7880859375, -2.59613037109375, -2.4041748046875, -2.21221923828125, -2.020263671875, -1.82830810546875, -1.6363525390625, -1.44439697265625, -1.25244140625, -1.06048583984375, -0.8685302734375, -0.67657470703125, -0.484619140625, -0.29266357421875, -0.1007080078125, 0.09124755859375, 0.283203125, 0.47515869140625, 0.6671142578125, 0.85906982421875, 1.051025390625, 1.24298095703125, 1.4349365234375, 1.62689208984375, 1.81884765625, 2.01080322265625, 2.2027587890625, 2.39471435546875, 2.586669921875, 2.77862548828125, 2.9705810546875, 3.16253662109375, 3.3544921875, 3.54644775390625, 3.7384033203125, 3.93035888671875, 4.122314453125, 4.31427001953125, 4.5062255859375, 4.69818115234375, 4.89013671875, 5.08209228515625, 5.2740478515625, 5.46600341796875, 5.657958984375, 5.84991455078125, 6.0418701171875, 6.23382568359375, 6.42578125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 8.0, 9.0, 8.0, 12.0, 22.0, 37.0, 50.0, 94.0, 151.0, 254.0, 516.0, 907.0, 1833.0, 3678.0, 7796.0, 17036.0, 38201.0, 83980.0, 168786.0, 253959.0, 228126.0, 130465.0, 61408.0, 27483.0, 12251.0, 5733.0, 2817.0, 1336.0, 666.0, 369.0, 211.0, 141.0, 76.0, 41.0, 33.0, 24.0, 12.0, 13.0, 4.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.267578125, -3.1708984375, -3.07421875, -2.9775390625, -2.880859375, -2.7841796875, -2.6875, -2.5908203125, -2.494140625, -2.3974609375, -2.30078125, -2.2041015625, -2.107421875, -2.0107421875, -1.9140625, -1.8173828125, -1.720703125, -1.6240234375, -1.52734375, -1.4306640625, -1.333984375, -1.2373046875, -1.140625, -1.0439453125, -0.947265625, -0.8505859375, -0.75390625, -0.6572265625, -0.560546875, -0.4638671875, -0.3671875, -0.2705078125, -0.173828125, -0.0771484375, 0.01953125, 0.1162109375, 0.212890625, 0.3095703125, 0.40625, 0.5029296875, 0.599609375, 0.6962890625, 0.79296875, 0.8896484375, 0.986328125, 1.0830078125, 1.1796875, 1.2763671875, 1.373046875, 1.4697265625, 1.56640625, 1.6630859375, 1.759765625, 1.8564453125, 1.953125, 2.0498046875, 2.146484375, 2.2431640625, 2.33984375, 2.4365234375, 2.533203125, 2.6298828125, 2.7265625, 2.8232421875, 2.919921875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 6.0, 3.0, 11.0, 6.0, 4.0, 12.0, 5.0, 12.0, 12.0, 15.0, 7.0, 18.0, 20.0, 21.0, 17.0, 35.0, 43.0, 30.0, 33.0, 27.0, 41.0, 36.0, 52.0, 30.0, 1052.0, 36.0, 36.0, 37.0, 43.0, 36.0, 27.0, 21.0, 31.0, 35.0, 29.0, 21.0, 22.0, 14.0, 18.0, 20.0, 17.0, 8.0, 9.0, 6.0, 5.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.50390625, -4.3602294921875, -4.216552734375, -4.0728759765625, -3.92919921875, -3.7855224609375, -3.641845703125, -3.4981689453125, -3.3544921875, -3.2108154296875, -3.067138671875, -2.9234619140625, -2.77978515625, -2.6361083984375, -2.492431640625, -2.3487548828125, -2.205078125, -2.0614013671875, -1.917724609375, -1.7740478515625, -1.63037109375, -1.4866943359375, -1.343017578125, -1.1993408203125, -1.0556640625, -0.9119873046875, -0.768310546875, -0.6246337890625, -0.48095703125, -0.3372802734375, -0.193603515625, -0.0499267578125, 0.09375, 0.2374267578125, 0.381103515625, 0.5247802734375, 0.66845703125, 0.8121337890625, 0.955810546875, 1.0994873046875, 1.2431640625, 1.3868408203125, 1.530517578125, 1.6741943359375, 1.81787109375, 1.9615478515625, 2.105224609375, 2.2489013671875, 2.392578125, 2.5362548828125, 2.679931640625, 2.8236083984375, 2.96728515625, 3.1109619140625, 3.254638671875, 3.3983154296875, 3.5419921875, 3.6856689453125, 3.829345703125, 3.9730224609375, 4.11669921875, 4.2603759765625, 4.404052734375, 4.5477294921875, 4.69140625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 8.0, 19.0, 15.0, 28.0, 20.0, 54.0, 71.0, 118.0, 206.0, 320.0, 523.0, 878.0, 1510.0, 2781.0, 4871.0, 9146.0, 17905.0, 41059.0, 1098503.0, 840668.0, 40234.0, 17777.0, 9075.0, 4969.0, 2628.0, 1466.0, 918.0, 468.0, 339.0, 195.0, 135.0, 62.0, 52.0, 38.0, 29.0, 12.0, 13.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.44140625, -5.29022216796875, -5.1390380859375, -4.98785400390625, -4.836669921875, -4.68548583984375, -4.5343017578125, -4.38311767578125, -4.23193359375, -4.08074951171875, -3.9295654296875, -3.77838134765625, -3.627197265625, -3.47601318359375, -3.3248291015625, -3.17364501953125, -3.0224609375, -2.87127685546875, -2.7200927734375, -2.56890869140625, -2.417724609375, -2.26654052734375, -2.1153564453125, -1.96417236328125, -1.81298828125, -1.66180419921875, -1.5106201171875, -1.35943603515625, -1.208251953125, -1.05706787109375, -0.9058837890625, -0.75469970703125, -0.603515625, -0.45233154296875, -0.3011474609375, -0.14996337890625, 0.001220703125, 0.15240478515625, 0.3035888671875, 0.45477294921875, 0.60595703125, 0.75714111328125, 0.9083251953125, 1.05950927734375, 1.210693359375, 1.36187744140625, 1.5130615234375, 1.66424560546875, 1.8154296875, 1.96661376953125, 2.1177978515625, 2.26898193359375, 2.420166015625, 2.57135009765625, 2.7225341796875, 2.87371826171875, 3.02490234375, 3.17608642578125, 3.3272705078125, 3.47845458984375, 3.629638671875, 3.78082275390625, 3.9320068359375, 4.08319091796875, 4.234375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 5.0, 8.0, 8.0, 10.0, 14.0, 12.0, 40.0, 29.0, 37.0, 39.0, 46.0, 64.0, 77.0, 94.0, 92.0, 97.0, 80.0, 56.0, 32.0, 35.0, 24.0, 26.0, 14.0, 12.0, 12.0, 8.0, 7.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.310546875, -0.3016242980957031, -0.29270172119140625, -0.2837791442871094, -0.2748565673828125, -0.2659339904785156, -0.25701141357421875, -0.24808883666992188, -0.239166259765625, -0.23024368286132812, -0.22132110595703125, -0.21239852905273438, -0.2034759521484375, -0.19455337524414062, -0.18563079833984375, -0.17670822143554688, -0.16778564453125, -0.15886306762695312, -0.14994049072265625, -0.14101791381835938, -0.1320953369140625, -0.12317276000976562, -0.11425018310546875, -0.10532760620117188, -0.096405029296875, -0.08748245239257812, -0.07855987548828125, -0.06963729858398438, -0.0607147216796875, -0.051792144775390625, -0.04286956787109375, -0.033946990966796875, -0.0250244140625, -0.016101837158203125, -0.00717926025390625, 0.001743316650390625, 0.0106658935546875, 0.019588470458984375, 0.02851104736328125, 0.037433624267578125, 0.046356201171875, 0.055278778076171875, 0.06420135498046875, 0.07312393188476562, 0.0820465087890625, 0.09096908569335938, 0.09989166259765625, 0.10881423950195312, 0.11773681640625, 0.12665939331054688, 0.13558197021484375, 0.14450454711914062, 0.1534271240234375, 0.16234970092773438, 0.17127227783203125, 0.18019485473632812, 0.189117431640625, 0.19804000854492188, 0.20696258544921875, 0.21588516235351562, 0.2248077392578125, 0.23373031616210938, 0.24265289306640625, 0.2515754699707031, 0.260498046875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 7.0, 7.0, 8.0, 16.0, 17.0, 20.0, 33.0, 45.0, 70.0, 133.0, 242.0, 628.0, 14626.0, 1024806.0, 6815.0, 516.0, 208.0, 110.0, 56.0, 72.0, 30.0, 19.0, 16.0, 8.0, 13.0, 7.0, 4.0, 6.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.38671875, -5.20367431640625, -5.0206298828125, -4.83758544921875, -4.654541015625, -4.47149658203125, -4.2884521484375, -4.10540771484375, -3.92236328125, -3.73931884765625, -3.5562744140625, -3.37322998046875, -3.190185546875, -3.00714111328125, -2.8240966796875, -2.64105224609375, -2.4580078125, -2.27496337890625, -2.0919189453125, -1.90887451171875, -1.725830078125, -1.54278564453125, -1.3597412109375, -1.17669677734375, -0.99365234375, -0.81060791015625, -0.6275634765625, -0.44451904296875, -0.261474609375, -0.07843017578125, 0.1046142578125, 0.28765869140625, 0.470703125, 0.65374755859375, 0.8367919921875, 1.01983642578125, 1.202880859375, 1.38592529296875, 1.5689697265625, 1.75201416015625, 1.93505859375, 2.11810302734375, 2.3011474609375, 2.48419189453125, 2.667236328125, 2.85028076171875, 3.0333251953125, 3.21636962890625, 3.3994140625, 3.58245849609375, 3.7655029296875, 3.94854736328125, 4.131591796875, 4.31463623046875, 4.4976806640625, 4.68072509765625, 4.86376953125, 5.04681396484375, 5.2298583984375, 5.41290283203125, 5.595947265625, 5.77899169921875, 5.9620361328125, 6.14508056640625, 6.328125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 11.0, 33.0, 185.0, 498.0, 215.0, 52.0, 10.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5676462650299072, -2.4674689769744873, -2.3672919273376465, -2.2671146392822266, -2.1669373512268066, -2.066760301589966, -1.966583013534546, -1.8664058446884155, -1.7662286758422852, -1.6660515069961548, -1.5658743381500244, -1.4656970500946045, -1.3655198812484741, -1.2653427124023438, -1.1651654243469238, -1.0649882555007935, -0.9648110866546631, -0.8646339178085327, -0.7644566893577576, -0.6642794609069824, -0.564102292060852, -0.4639251232147217, -0.36374789476394653, -0.2635706663131714, -0.16339349746704102, -0.06321629881858826, 0.0369608998298645, 0.13713809847831726, 0.23731529712677002, 0.3374924659729004, 0.43766969442367554, 0.5378469228744507, 0.638024091720581, 0.7382012605667114, 0.8383784890174866, 0.9385557174682617, 1.038732886314392, 1.1389100551605225, 1.2390873432159424, 1.3392645120620728, 1.4394416809082031, 1.5396188497543335, 1.6397960186004639, 1.7399733066558838, 1.8401504755020142, 1.9403276443481445, 2.0405049324035645, 2.1406822204589844, 2.240859270095825, 2.341036558151245, 2.441213607788086, 2.541390895843506, 2.641568183898926, 2.7417452335357666, 2.8419225215911865, 2.9420995712280273, 3.0422768592834473, 3.142454147338867, 3.242631196975708, 3.342808485031128, 3.4429855346679688, 3.5431628227233887, 3.6433401107788086, 3.7435173988342285, 3.8436944484710693]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 8.0, 5.0, 13.0, 13.0, 20.0, 21.0, 31.0, 35.0, 52.0, 50.0, 54.0, 64.0, 64.0, 58.0, 69.0, 65.0, 78.0, 49.0, 51.0, 40.0, 31.0, 37.0, 24.0, 18.0, 24.0, 13.0, 8.0, 7.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2473028898239136, -1.2161965370178223, -1.1850900650024414, -1.15398371219635, -1.1228773593902588, -1.0917710065841675, -1.0606645345687866, -1.0295581817626953, -0.998451828956604, -0.9673454165458679, -0.9362390637397766, -0.9051326513290405, -0.8740262985229492, -0.8429198861122131, -0.811813473701477, -0.7807071208953857, -0.7496007084846497, -0.7184942960739136, -0.6873879432678223, -0.6562815308570862, -0.6251751780509949, -0.5940687656402588, -0.5629624128341675, -0.5318560004234314, -0.5007495880126953, -0.4696432054042816, -0.4385368227958679, -0.40743041038513184, -0.3763240575790405, -0.34521764516830444, -0.31411126255989075, -0.28300487995147705, -0.25189846754074097, -0.22079208493232727, -0.18968570232391357, -0.15857930481433868, -0.127472922205925, -0.09636653959751129, -0.0652601420879364, -0.034153759479522705, -0.003047376871109009, 0.028059009462594986, 0.05916539579629898, 0.09027178585529327, 0.12137816846370697, 0.15248455107212067, 0.18359094858169556, 0.21469733119010925, 0.24580371379852295, 0.27691009640693665, 0.30801647901535034, 0.3391228914260864, 0.37022924423217773, 0.4013356566429138, 0.4324420392513275, 0.4635484218597412, 0.4946548044681549, 0.5257611870765686, 0.5568675994873047, 0.587973952293396, 0.6190803647041321, 0.6501867175102234, 0.6812931299209595, 0.7123994827270508, 0.7435058951377869]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 3.0, 2.0, 5.0, 8.0, 3.0, 9.0, 12.0, 18.0, 9.0, 16.0, 23.0, 16.0, 27.0, 31.0, 35.0, 23.0, 28.0, 35.0, 49.0, 41.0, 37.0, 42.0, 45.0, 30.0, 35.0, 36.0, 50.0, 40.0, 38.0, 27.0, 30.0, 24.0, 27.0, 27.0, 13.0, 21.0, 20.0, 16.0, 11.0, 8.0, 7.0, 10.0, 2.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.80859375, -5.63671875, -5.46484375, -5.29296875, -5.12109375, -4.94921875, -4.77734375, -4.60546875, -4.43359375, -4.26171875, -4.08984375, -3.91796875, -3.74609375, -3.57421875, -3.40234375, -3.23046875, -3.05859375, -2.88671875, -2.71484375, -2.54296875, -2.37109375, -2.19921875, -2.02734375, -1.85546875, -1.68359375, -1.51171875, -1.33984375, -1.16796875, -0.99609375, -0.82421875, -0.65234375, -0.48046875, -0.30859375, -0.13671875, 0.03515625, 0.20703125, 0.37890625, 0.55078125, 0.72265625, 0.89453125, 1.06640625, 1.23828125, 1.41015625, 1.58203125, 1.75390625, 1.92578125, 2.09765625, 2.26953125, 2.44140625, 2.61328125, 2.78515625, 2.95703125, 3.12890625, 3.30078125, 3.47265625, 3.64453125, 3.81640625, 3.98828125, 4.16015625, 4.33203125, 4.50390625, 4.67578125, 4.84765625, 5.01953125, 5.19140625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 5.0, 2.0, 6.0, 3.0, 12.0, 19.0, 24.0, 25.0, 46.0, 80.0, 104.0, 155.0, 259.0, 483.0, 821.0, 1699.0, 3308.0, 7027.0, 15165.0, 33667.0, 74825.0, 156366.0, 340746.0, 220226.0, 104363.0, 48137.0, 21514.0, 9977.0, 4539.0, 2228.0, 1187.0, 594.0, 345.0, 219.0, 131.0, 86.0, 52.0, 30.0, 20.0, 15.0, 12.0, 15.0, 2.0, 7.0, 7.0, 4.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0390625, -5.82122802734375, -5.6033935546875, -5.38555908203125, -5.167724609375, -4.94989013671875, -4.7320556640625, -4.51422119140625, -4.29638671875, -4.07855224609375, -3.8607177734375, -3.64288330078125, -3.425048828125, -3.20721435546875, -2.9893798828125, -2.77154541015625, -2.5537109375, -2.33587646484375, -2.1180419921875, -1.90020751953125, -1.682373046875, -1.46453857421875, -1.2467041015625, -1.02886962890625, -0.81103515625, -0.59320068359375, -0.3753662109375, -0.15753173828125, 0.060302734375, 0.27813720703125, 0.4959716796875, 0.71380615234375, 0.931640625, 1.14947509765625, 1.3673095703125, 1.58514404296875, 1.802978515625, 2.02081298828125, 2.2386474609375, 2.45648193359375, 2.67431640625, 2.89215087890625, 3.1099853515625, 3.32781982421875, 3.545654296875, 3.76348876953125, 3.9813232421875, 4.19915771484375, 4.4169921875, 4.63482666015625, 4.8526611328125, 5.07049560546875, 5.288330078125, 5.50616455078125, 5.7239990234375, 5.94183349609375, 6.15966796875, 6.37750244140625, 6.5953369140625, 6.81317138671875, 7.031005859375, 7.24884033203125, 7.4666748046875, 7.68450927734375, 7.90234375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 5.0, 15.0, 18.0, 17.0, 29.0, 23.0, 23.0, 36.0, 37.0, 55.0, 57.0, 70.0, 108.0, 201.0, 1415.0, 307.0, 147.0, 100.0, 65.0, 55.0, 46.0, 37.0, 35.0, 28.0, 31.0, 20.0, 15.0, 12.0, 8.0, 3.0, 2.0, 5.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-24.859375, -24.145263671875, -23.43115234375, -22.717041015625, -22.0029296875, -21.288818359375, -20.57470703125, -19.860595703125, -19.146484375, -18.432373046875, -17.71826171875, -17.004150390625, -16.2900390625, -15.575927734375, -14.86181640625, -14.147705078125, -13.43359375, -12.719482421875, -12.00537109375, -11.291259765625, -10.5771484375, -9.863037109375, -9.14892578125, -8.434814453125, -7.720703125, -7.006591796875, -6.29248046875, -5.578369140625, -4.8642578125, -4.150146484375, -3.43603515625, -2.721923828125, -2.0078125, -1.293701171875, -0.57958984375, 0.134521484375, 0.8486328125, 1.562744140625, 2.27685546875, 2.990966796875, 3.705078125, 4.419189453125, 5.13330078125, 5.847412109375, 6.5615234375, 7.275634765625, 7.98974609375, 8.703857421875, 9.41796875, 10.132080078125, 10.84619140625, 11.560302734375, 12.2744140625, 12.988525390625, 13.70263671875, 14.416748046875, 15.130859375, 15.844970703125, 16.55908203125, 17.273193359375, 17.9873046875, 18.701416015625, 19.41552734375, 20.129638671875, 20.84375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 5.0, 6.0, 8.0, 15.0, 16.0, 23.0, 48.0, 67.0, 133.0, 226.0, 367.0, 1159.0, 10744.0, 3019355.0, 109565.0, 2708.0, 592.0, 261.0, 142.0, 92.0, 67.0, 40.0, 20.0, 16.0, 9.0, 7.0, 6.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-87.4375, -84.990234375, -82.54296875, -80.095703125, -77.6484375, -75.201171875, -72.75390625, -70.306640625, -67.859375, -65.412109375, -62.96484375, -60.517578125, -58.0703125, -55.623046875, -53.17578125, -50.728515625, -48.28125, -45.833984375, -43.38671875, -40.939453125, -38.4921875, -36.044921875, -33.59765625, -31.150390625, -28.703125, -26.255859375, -23.80859375, -21.361328125, -18.9140625, -16.466796875, -14.01953125, -11.572265625, -9.125, -6.677734375, -4.23046875, -1.783203125, 0.6640625, 3.111328125, 5.55859375, 8.005859375, 10.453125, 12.900390625, 15.34765625, 17.794921875, 20.2421875, 22.689453125, 25.13671875, 27.583984375, 30.03125, 32.478515625, 34.92578125, 37.373046875, 39.8203125, 42.267578125, 44.71484375, 47.162109375, 49.609375, 52.056640625, 54.50390625, 56.951171875, 59.3984375, 61.845703125, 64.29296875, 66.740234375, 69.1875]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 435.0, 566.0, 10.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-619.5796508789062, -608.3321533203125, -597.0846557617188, -585.837158203125, -574.5896606445312, -563.3421630859375, -552.0947265625, -540.84716796875, -529.5997314453125, -518.3522338867188, -507.104736328125, -495.85723876953125, -484.6097717285156, -473.3622741699219, -462.1147766113281, -450.8672790527344, -439.6197509765625, -428.37225341796875, -417.124755859375, -405.87725830078125, -394.6297912597656, -383.3822937011719, -372.1347961425781, -360.8872985839844, -349.63983154296875, -338.392333984375, -327.14483642578125, -315.8973388671875, -304.6498718261719, -293.4023742675781, -282.1548767089844, -270.9073791503906, -259.65985107421875, -248.412353515625, -237.1648712158203, -225.91737365722656, -214.6698760986328, -203.42239379882812, -192.17489624023438, -180.92739868164062, -169.67991638183594, -158.4324188232422, -147.1849365234375, -135.93743896484375, -124.68994140625, -113.44245147705078, -102.19496154785156, -90.94746398925781, -79.6999740600586, -68.45248413085938, -57.204986572265625, -45.957496643066406, -34.71000289916992, -23.462509155273438, -12.215019226074219, -0.9675216674804688, 10.27996826171875, 21.527462005615234, 32.77495574951172, 44.02244567871094, 55.26993942260742, 66.5174331665039, 77.76492309570312, 89.01242065429688, 100.2599105834961]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 8.0, 23.0, 21.0, 16.0, 21.0, 29.0, 46.0, 37.0, 50.0, 52.0, 64.0, 61.0, 78.0, 77.0, 79.0, 64.0, 46.0, 61.0, 32.0, 37.0, 25.0, 24.0, 11.0, 9.0, 13.0, 7.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-97.33786010742188, -94.95618438720703, -92.57450103759766, -90.19282531738281, -87.81114959716797, -85.42947387695312, -83.04779052734375, -80.6661148071289, -78.28443908691406, -75.90276336669922, -73.52108001708984, -71.139404296875, -68.75772857666016, -66.37605285644531, -63.99436950683594, -61.612693786621094, -59.23101043701172, -56.84933090209961, -54.467655181884766, -52.085975646972656, -49.70429992675781, -47.3226203918457, -44.940940856933594, -42.55926513671875, -40.17758560180664, -37.79590606689453, -35.41423034667969, -33.03255081176758, -30.6508731842041, -28.269195556640625, -25.887516021728516, -23.50583839416504, -21.12415313720703, -18.742475509643555, -16.360797882080078, -13.979118347167969, -11.597440719604492, -9.215763092041016, -6.834084510803223, -4.45240592956543, -2.070728302001953, 0.31094980239868164, 2.6926279067993164, 5.074306011199951, 7.455984115600586, 9.837661743164062, 12.219340324401855, 14.601018905639648, 16.982696533203125, 19.3643741607666, 21.746051788330078, 24.127731323242188, 26.509408950805664, 28.89108657836914, 31.27276611328125, 33.654441833496094, 36.0361213684082, 38.41780090332031, 40.799476623535156, 43.181156158447266, 45.562835693359375, 47.94451141357422, 50.32619094848633, 52.70787048339844, 55.08954620361328]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 14.0, 6.0, 12.0, 13.0, 12.0, 12.0, 15.0, 29.0, 26.0, 27.0, 22.0, 36.0, 29.0, 38.0, 32.0, 46.0, 36.0, 47.0, 47.0, 49.0, 34.0, 31.0, 54.0, 43.0, 43.0, 28.0, 35.0, 29.0, 20.0, 20.0, 20.0, 19.0, 16.0, 19.0, 10.0, 5.0, 4.0, 6.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.15234375, -5.95819091796875, -5.7640380859375, -5.56988525390625, -5.375732421875, -5.18157958984375, -4.9874267578125, -4.79327392578125, -4.59912109375, -4.40496826171875, -4.2108154296875, -4.01666259765625, -3.822509765625, -3.62835693359375, -3.4342041015625, -3.24005126953125, -3.0458984375, -2.85174560546875, -2.6575927734375, -2.46343994140625, -2.269287109375, -2.07513427734375, -1.8809814453125, -1.68682861328125, -1.49267578125, -1.29852294921875, -1.1043701171875, -0.91021728515625, -0.716064453125, -0.52191162109375, -0.3277587890625, -0.13360595703125, 0.060546875, 0.25469970703125, 0.4488525390625, 0.64300537109375, 0.837158203125, 1.03131103515625, 1.2254638671875, 1.41961669921875, 1.61376953125, 1.80792236328125, 2.0020751953125, 2.19622802734375, 2.390380859375, 2.58453369140625, 2.7786865234375, 2.97283935546875, 3.1669921875, 3.36114501953125, 3.5552978515625, 3.74945068359375, 3.943603515625, 4.13775634765625, 4.3319091796875, 4.52606201171875, 4.72021484375, 4.91436767578125, 5.1085205078125, 5.30267333984375, 5.496826171875, 5.69097900390625, 5.8851318359375, 6.07928466796875, 6.2734375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 6.0, 12.0, 18.0, 20.0, 28.0, 30.0, 57.0, 86.0, 118.0, 157.0, 242.0, 388.0, 552.0, 942.0, 1396.0, 2412.0, 4243.0, 8016.0, 17854.0, 48029.0, 183687.0, 883451.0, 2037270.0, 765260.0, 159983.0, 44344.0, 16988.0, 7995.0, 4215.0, 2373.0, 1434.0, 883.0, 604.0, 375.0, 260.0, 166.0, 121.0, 71.0, 47.0, 42.0, 28.0, 24.0, 11.0, 10.0, 11.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0], "bins": [-11.34375, -11.0238037109375, -10.703857421875, -10.3839111328125, -10.06396484375, -9.7440185546875, -9.424072265625, -9.1041259765625, -8.7841796875, -8.4642333984375, -8.144287109375, -7.8243408203125, -7.50439453125, -7.1844482421875, -6.864501953125, -6.5445556640625, -6.224609375, -5.9046630859375, -5.584716796875, -5.2647705078125, -4.94482421875, -4.6248779296875, -4.304931640625, -3.9849853515625, -3.6650390625, -3.3450927734375, -3.025146484375, -2.7052001953125, -2.38525390625, -2.0653076171875, -1.745361328125, -1.4254150390625, -1.10546875, -0.7855224609375, -0.465576171875, -0.1456298828125, 0.17431640625, 0.4942626953125, 0.814208984375, 1.1341552734375, 1.4541015625, 1.7740478515625, 2.093994140625, 2.4139404296875, 2.73388671875, 3.0538330078125, 3.373779296875, 3.6937255859375, 4.013671875, 4.3336181640625, 4.653564453125, 4.9735107421875, 5.29345703125, 5.6134033203125, 5.933349609375, 6.2532958984375, 6.5732421875, 6.8931884765625, 7.213134765625, 7.5330810546875, 7.85302734375, 8.1729736328125, 8.492919921875, 8.8128662109375, 9.1328125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 8.0, 15.0, 18.0, 18.0, 26.0, 36.0, 47.0, 86.0, 81.0, 117.0, 193.0, 273.0, 352.0, 478.0, 555.0, 492.0, 360.0, 248.0, 172.0, 124.0, 114.0, 57.0, 55.0, 34.0, 33.0, 21.0, 14.0, 10.0, 14.0, 4.0, 5.0, 3.0, 5.0, 0.0, 4.0, 3.0, 2.0], "bins": [-15.2265625, -14.8582763671875, -14.489990234375, -14.1217041015625, -13.75341796875, -13.3851318359375, -13.016845703125, -12.6485595703125, -12.2802734375, -11.9119873046875, -11.543701171875, -11.1754150390625, -10.80712890625, -10.4388427734375, -10.070556640625, -9.7022705078125, -9.333984375, -8.9656982421875, -8.597412109375, -8.2291259765625, -7.86083984375, -7.4925537109375, -7.124267578125, -6.7559814453125, -6.3876953125, -6.0194091796875, -5.651123046875, -5.2828369140625, -4.91455078125, -4.5462646484375, -4.177978515625, -3.8096923828125, -3.44140625, -3.0731201171875, -2.704833984375, -2.3365478515625, -1.96826171875, -1.5999755859375, -1.231689453125, -0.8634033203125, -0.4951171875, -0.1268310546875, 0.241455078125, 0.6097412109375, 0.97802734375, 1.3463134765625, 1.714599609375, 2.0828857421875, 2.451171875, 2.8194580078125, 3.187744140625, 3.5560302734375, 3.92431640625, 4.2926025390625, 4.660888671875, 5.0291748046875, 5.3974609375, 5.7657470703125, 6.134033203125, 6.5023193359375, 6.87060546875, 7.2388916015625, 7.607177734375, 7.9754638671875, 8.34375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 1.0, 6.0, 2.0, 8.0, 8.0, 13.0, 12.0, 21.0, 22.0, 34.0, 53.0, 62.0, 107.0, 140.0, 205.0, 351.0, 921.0, 11239.0, 2246422.0, 1922506.0, 10465.0, 834.0, 291.0, 178.0, 105.0, 84.0, 52.0, 39.0, 31.0, 24.0, 13.0, 13.0, 9.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.71875, -41.81689453125, -39.9150390625, -38.01318359375, -36.111328125, -34.20947265625, -32.3076171875, -30.40576171875, -28.50390625, -26.60205078125, -24.7001953125, -22.79833984375, -20.896484375, -18.99462890625, -17.0927734375, -15.19091796875, -13.2890625, -11.38720703125, -9.4853515625, -7.58349609375, -5.681640625, -3.77978515625, -1.8779296875, 0.02392578125, 1.92578125, 3.82763671875, 5.7294921875, 7.63134765625, 9.533203125, 11.43505859375, 13.3369140625, 15.23876953125, 17.140625, 19.04248046875, 20.9443359375, 22.84619140625, 24.748046875, 26.64990234375, 28.5517578125, 30.45361328125, 32.35546875, 34.25732421875, 36.1591796875, 38.06103515625, 39.962890625, 41.86474609375, 43.7666015625, 45.66845703125, 47.5703125, 49.47216796875, 51.3740234375, 53.27587890625, 55.177734375, 57.07958984375, 58.9814453125, 60.88330078125, 62.78515625, 64.68701171875, 66.5888671875, 68.49072265625, 70.392578125, 72.29443359375, 74.1962890625, 76.09814453125, 78.0]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 35.0, 232.0, 457.0, 229.0, 51.0, 10.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-342.3238525390625, -334.9528503417969, -327.58184814453125, -320.2108459472656, -312.83984375, -305.4688415527344, -298.09783935546875, -290.72686767578125, -283.3558349609375, -275.9848327636719, -268.61383056640625, -261.2428283691406, -253.871826171875, -246.50082397460938, -239.1298370361328, -231.7588348388672, -224.38784790039062, -217.016845703125, -209.64584350585938, -202.27484130859375, -194.90383911132812, -187.5328369140625, -180.16184997558594, -172.7908477783203, -165.4198455810547, -158.04884338378906, -150.67784118652344, -143.3068389892578, -135.93585205078125, -128.56484985351562, -121.19384765625, -113.82284545898438, -106.45185852050781, -99.08085632324219, -91.70985412597656, -84.33885955810547, -76.96785736083984, -69.59685516357422, -62.22585678100586, -54.8548583984375, -47.483856201171875, -40.11285400390625, -32.74185562133789, -25.3708553314209, -17.999855041503906, -10.628852844238281, -3.257854461669922, 4.1131439208984375, 11.484146118164062, 18.855146408081055, 26.226146697998047, 33.597145080566406, 40.96814727783203, 48.339149475097656, 55.710147857666016, 63.081146240234375, 70.4521484375, 77.82315063476562, 85.19415283203125, 92.56514739990234, 99.93614959716797, 107.3071517944336, 114.67814636230469, 122.04914855957031, 129.42015075683594]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 9.0, 6.0, 9.0, 10.0, 11.0, 18.0, 27.0, 30.0, 26.0, 21.0, 39.0, 28.0, 27.0, 31.0, 31.0, 45.0, 46.0, 41.0, 48.0, 35.0, 41.0, 35.0, 38.0, 35.0, 44.0, 38.0, 24.0, 32.0, 24.0, 26.0, 18.0, 17.0, 15.0, 18.0, 6.0, 12.0, 11.0, 8.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-37.58034133911133, -36.42027282714844, -35.26020050048828, -34.10013198852539, -32.940059661865234, -31.779991149902344, -30.61992073059082, -29.459850311279297, -28.299779891967773, -27.13970947265625, -25.979639053344727, -24.819568634033203, -23.659500122070312, -22.499427795410156, -21.339359283447266, -20.179288864135742, -19.01921844482422, -17.859148025512695, -16.699077606201172, -15.539008140563965, -14.378937721252441, -13.218867301940918, -12.058797836303711, -10.898727416992188, -9.738656997680664, -8.57858657836914, -7.418516635894775, -6.25844669342041, -5.098376274108887, -3.9383058547973633, -2.778235912322998, -1.6181659698486328, -0.45809173583984375, 0.7019784450531006, 1.862048625946045, 3.0221188068389893, 4.182188987731934, 5.342259407043457, 6.502329349517822, 7.6623992919921875, 8.822469711303711, 9.982540130615234, 11.142610549926758, 12.302680015563965, 13.462750434875488, 14.622820854187012, 15.782890319824219, 16.942960739135742, 18.103031158447266, 19.26310157775879, 20.423171997070312, 21.583242416381836, 22.74331283569336, 23.90338134765625, 25.063451766967773, 26.223522186279297, 27.38359260559082, 28.543663024902344, 29.703733444213867, 30.86380386352539, 32.02387237548828, 33.18394470214844, 34.34401321411133, 35.50408172607422, 36.664154052734375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 6.0, 9.0, 6.0, 11.0, 9.0, 11.0, 11.0, 13.0, 19.0, 27.0, 24.0, 27.0, 25.0, 33.0, 37.0, 33.0, 34.0, 37.0, 34.0, 54.0, 52.0, 34.0, 55.0, 42.0, 38.0, 34.0, 40.0, 31.0, 31.0, 25.0, 19.0, 23.0, 18.0, 20.0, 10.0, 16.0, 16.0, 9.0, 6.0, 7.0, 5.0, 5.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.8125, -5.6236572265625, -5.434814453125, -5.2459716796875, -5.05712890625, -4.8682861328125, -4.679443359375, -4.4906005859375, -4.3017578125, -4.1129150390625, -3.924072265625, -3.7352294921875, -3.54638671875, -3.3575439453125, -3.168701171875, -2.9798583984375, -2.791015625, -2.6021728515625, -2.413330078125, -2.2244873046875, -2.03564453125, -1.8468017578125, -1.657958984375, -1.4691162109375, -1.2802734375, -1.0914306640625, -0.902587890625, -0.7137451171875, -0.52490234375, -0.3360595703125, -0.147216796875, 0.0416259765625, 0.23046875, 0.4193115234375, 0.608154296875, 0.7969970703125, 0.98583984375, 1.1746826171875, 1.363525390625, 1.5523681640625, 1.7412109375, 1.9300537109375, 2.118896484375, 2.3077392578125, 2.49658203125, 2.6854248046875, 2.874267578125, 3.0631103515625, 3.251953125, 3.4407958984375, 3.629638671875, 3.8184814453125, 4.00732421875, 4.1961669921875, 4.385009765625, 4.5738525390625, 4.7626953125, 4.9515380859375, 5.140380859375, 5.3292236328125, 5.51806640625, 5.7069091796875, 5.895751953125, 6.0845947265625, 6.2734375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 1.0, 4.0, 5.0, 8.0, 10.0, 15.0, 42.0, 47.0, 95.0, 156.0, 292.0, 510.0, 947.0, 1709.0, 3451.0, 6391.0, 12613.0, 24689.0, 48016.0, 89242.0, 152397.0, 211540.0, 200008.0, 135320.0, 77120.0, 40713.0, 20881.0, 10662.0, 5501.0, 2839.0, 1505.0, 804.0, 453.0, 235.0, 141.0, 82.0, 48.0, 24.0, 14.0, 6.0, 8.0, 5.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0078125, -1.94482421875, -1.8818359375, -1.81884765625, -1.755859375, -1.69287109375, -1.6298828125, -1.56689453125, -1.50390625, -1.44091796875, -1.3779296875, -1.31494140625, -1.251953125, -1.18896484375, -1.1259765625, -1.06298828125, -1.0, -0.93701171875, -0.8740234375, -0.81103515625, -0.748046875, -0.68505859375, -0.6220703125, -0.55908203125, -0.49609375, -0.43310546875, -0.3701171875, -0.30712890625, -0.244140625, -0.18115234375, -0.1181640625, -0.05517578125, 0.0078125, 0.07080078125, 0.1337890625, 0.19677734375, 0.259765625, 0.32275390625, 0.3857421875, 0.44873046875, 0.51171875, 0.57470703125, 0.6376953125, 0.70068359375, 0.763671875, 0.82666015625, 0.8896484375, 0.95263671875, 1.015625, 1.07861328125, 1.1416015625, 1.20458984375, 1.267578125, 1.33056640625, 1.3935546875, 1.45654296875, 1.51953125, 1.58251953125, 1.6455078125, 1.70849609375, 1.771484375, 1.83447265625, 1.8974609375, 1.96044921875, 2.0234375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 2.0, 3.0, 14.0, 7.0, 12.0, 14.0, 19.0, 15.0, 27.0, 24.0, 22.0, 24.0, 25.0, 26.0, 38.0, 36.0, 36.0, 35.0, 41.0, 35.0, 1071.0, 50.0, 34.0, 40.0, 35.0, 39.0, 28.0, 29.0, 33.0, 23.0, 24.0, 24.0, 21.0, 19.0, 6.0, 26.0, 14.0, 12.0, 7.0, 10.0, 9.0, 4.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.84765625, -4.70489501953125, -4.5621337890625, -4.41937255859375, -4.276611328125, -4.13385009765625, -3.9910888671875, -3.84832763671875, -3.70556640625, -3.56280517578125, -3.4200439453125, -3.27728271484375, -3.134521484375, -2.99176025390625, -2.8489990234375, -2.70623779296875, -2.5634765625, -2.42071533203125, -2.2779541015625, -2.13519287109375, -1.992431640625, -1.84967041015625, -1.7069091796875, -1.56414794921875, -1.42138671875, -1.27862548828125, -1.1358642578125, -0.99310302734375, -0.850341796875, -0.70758056640625, -0.5648193359375, -0.42205810546875, -0.279296875, -0.13653564453125, 0.0062255859375, 0.14898681640625, 0.291748046875, 0.43450927734375, 0.5772705078125, 0.72003173828125, 0.86279296875, 1.00555419921875, 1.1483154296875, 1.29107666015625, 1.433837890625, 1.57659912109375, 1.7193603515625, 1.86212158203125, 2.0048828125, 2.14764404296875, 2.2904052734375, 2.43316650390625, 2.575927734375, 2.71868896484375, 2.8614501953125, 3.00421142578125, 3.14697265625, 3.28973388671875, 3.4324951171875, 3.57525634765625, 3.718017578125, 3.86077880859375, 4.0035400390625, 4.14630126953125, 4.2890625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 3.0, 9.0, 15.0, 25.0, 35.0, 55.0, 90.0, 116.0, 165.0, 254.0, 376.0, 588.0, 1002.0, 1583.0, 2646.0, 4282.0, 7385.0, 13178.0, 23738.0, 67909.0, 1719922.0, 182601.0, 31848.0, 16302.0, 9175.0, 5324.0, 3254.0, 1910.0, 1204.0, 758.0, 478.0, 318.0, 204.0, 132.0, 87.0, 56.0, 32.0, 19.0, 13.0, 15.0, 8.0, 5.0, 7.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.037109375, -2.9312744140625, -2.825439453125, -2.7196044921875, -2.61376953125, -2.5079345703125, -2.402099609375, -2.2962646484375, -2.1904296875, -2.0845947265625, -1.978759765625, -1.8729248046875, -1.76708984375, -1.6612548828125, -1.555419921875, -1.4495849609375, -1.34375, -1.2379150390625, -1.132080078125, -1.0262451171875, -0.92041015625, -0.8145751953125, -0.708740234375, -0.6029052734375, -0.4970703125, -0.3912353515625, -0.285400390625, -0.1795654296875, -0.07373046875, 0.0321044921875, 0.137939453125, 0.2437744140625, 0.349609375, 0.4554443359375, 0.561279296875, 0.6671142578125, 0.77294921875, 0.8787841796875, 0.984619140625, 1.0904541015625, 1.1962890625, 1.3021240234375, 1.407958984375, 1.5137939453125, 1.61962890625, 1.7254638671875, 1.831298828125, 1.9371337890625, 2.04296875, 2.1488037109375, 2.254638671875, 2.3604736328125, 2.46630859375, 2.5721435546875, 2.677978515625, 2.7838134765625, 2.8896484375, 2.9954833984375, 3.101318359375, 3.2071533203125, 3.31298828125, 3.4188232421875, 3.524658203125, 3.6304931640625, 3.736328125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 4.0, 2.0, 4.0, 9.0, 8.0, 10.0, 10.0, 13.0, 21.0, 47.0, 32.0, 37.0, 42.0, 51.0, 40.0, 60.0, 53.0, 53.0, 56.0, 57.0, 63.0, 41.0, 36.0, 52.0, 35.0, 32.0, 31.0, 24.0, 17.0, 14.0, 12.0, 10.0, 6.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.145751953125, -0.14133262634277344, -0.13691329956054688, -0.1324939727783203, -0.12807464599609375, -0.12365531921386719, -0.11923599243164062, -0.11481666564941406, -0.1103973388671875, -0.10597801208496094, -0.10155868530273438, -0.09713935852050781, -0.09272003173828125, -0.08830070495605469, -0.08388137817382812, -0.07946205139160156, -0.075042724609375, -0.07062339782714844, -0.06620407104492188, -0.06178474426269531, -0.05736541748046875, -0.05294609069824219, -0.048526763916015625, -0.04410743713378906, -0.0396881103515625, -0.03526878356933594, -0.030849456787109375, -0.026430130004882812, -0.02201080322265625, -0.017591476440429688, -0.013172149658203125, -0.008752822875976562, -0.00433349609375, 8.58306884765625e-05, 0.004505157470703125, 0.008924484252929688, 0.01334381103515625, 0.017763137817382812, 0.022182464599609375, 0.026601791381835938, 0.0310211181640625, 0.03544044494628906, 0.039859771728515625, 0.04427909851074219, 0.04869842529296875, 0.05311775207519531, 0.057537078857421875, 0.06195640563964844, 0.066375732421875, 0.07079505920410156, 0.07521438598632812, 0.07963371276855469, 0.08405303955078125, 0.08847236633300781, 0.09289169311523438, 0.09731101989746094, 0.1017303466796875, 0.10614967346191406, 0.11056900024414062, 0.11498832702636719, 0.11940765380859375, 0.12382698059082031, 0.12824630737304688, 0.13266563415527344, 0.1370849609375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 4.0, 6.0, 4.0, 10.0, 10.0, 19.0, 12.0, 23.0, 32.0, 38.0, 41.0, 58.0, 74.0, 130.0, 223.0, 556.0, 3843.0, 317247.0, 718392.0, 6387.0, 652.0, 269.0, 143.0, 91.0, 64.0, 45.0, 40.0, 40.0, 32.0, 12.0, 11.0, 10.0, 6.0, 9.0, 3.0, 6.0, 1.0, 3.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.650390625, -2.56512451171875, -2.4798583984375, -2.39459228515625, -2.309326171875, -2.22406005859375, -2.1387939453125, -2.05352783203125, -1.96826171875, -1.88299560546875, -1.7977294921875, -1.71246337890625, -1.627197265625, -1.54193115234375, -1.4566650390625, -1.37139892578125, -1.2861328125, -1.20086669921875, -1.1156005859375, -1.03033447265625, -0.945068359375, -0.85980224609375, -0.7745361328125, -0.68927001953125, -0.60400390625, -0.51873779296875, -0.4334716796875, -0.34820556640625, -0.262939453125, -0.17767333984375, -0.0924072265625, -0.00714111328125, 0.078125, 0.16339111328125, 0.2486572265625, 0.33392333984375, 0.419189453125, 0.50445556640625, 0.5897216796875, 0.67498779296875, 0.76025390625, 0.84552001953125, 0.9307861328125, 1.01605224609375, 1.101318359375, 1.18658447265625, 1.2718505859375, 1.35711669921875, 1.4423828125, 1.52764892578125, 1.6129150390625, 1.69818115234375, 1.783447265625, 1.86871337890625, 1.9539794921875, 2.03924560546875, 2.12451171875, 2.20977783203125, 2.2950439453125, 2.38031005859375, 2.465576171875, 2.55084228515625, 2.6361083984375, 2.72137451171875, 2.806640625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 1.0, 8.0, 8.0, 27.0, 44.0, 71.0, 201.0, 340.0, 169.0, 68.0, 35.0, 21.0, 8.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5958751440048218, -1.5508592128753662, -1.505843162536621, -1.4608272314071655, -1.41581130027771, -1.3707952499389648, -1.3257793188095093, -1.2807633876800537, -1.2357473373413086, -1.190731406211853, -1.145715355873108, -1.1006994247436523, -1.0556833744049072, -1.0106674432754517, -0.9656515121459961, -0.9206355214118958, -0.8756195306777954, -0.8306035399436951, -0.7855875492095947, -0.7405716180801392, -0.6955556273460388, -0.6505396366119385, -0.6055237054824829, -0.5605077147483826, -0.5154917240142822, -0.4704757332801819, -0.42545977234840393, -0.380443811416626, -0.33542782068252563, -0.2904118299484253, -0.24539586901664734, -0.20037990808486938, -0.1553640365600586, -0.11034806072711945, -0.0653320848941803, -0.02031610906124115, 0.024699866771697998, 0.06971584260463715, 0.1147318184375763, 0.15974777936935425, 0.2047637701034546, 0.24977974593639374, 0.2947957217693329, 0.33981168270111084, 0.3848276734352112, 0.4298436641693115, 0.4748596251010895, 0.5198755860328674, 0.5648915767669678, 0.6099075675010681, 0.6549235582351685, 0.699939489364624, 0.7449554800987244, 0.7899714708328247, 0.8349874019622803, 0.8800033926963806, 0.925019383430481, 0.9700353741645813, 1.0150513648986816, 1.0600672960281372, 1.1050832271575928, 1.150099277496338, 1.1951152086257935, 1.240131139755249, 1.2851471900939941]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 7.0, 7.0, 12.0, 15.0, 16.0, 21.0, 27.0, 35.0, 35.0, 36.0, 41.0, 59.0, 48.0, 43.0, 49.0, 58.0, 60.0, 50.0, 53.0, 40.0, 29.0, 44.0, 31.0, 42.0, 27.0, 33.0, 24.0, 18.0, 7.0, 13.0, 8.0, 5.0, 1.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3902274966239929, -0.3785134255886078, -0.36679935455322266, -0.35508525371551514, -0.34337118268013, -0.3316571116447449, -0.31994304060935974, -0.3082289695739746, -0.2965148687362671, -0.28480079770088196, -0.2730867266654968, -0.2613726258277893, -0.24965855479240417, -0.23794448375701904, -0.2262304127216339, -0.21451632678508759, -0.20280225574970245, -0.19108818471431732, -0.179374098777771, -0.16766002774238586, -0.15594594180583954, -0.1442318707704544, -0.13251778483390808, -0.12080371379852295, -0.10908963531255722, -0.09737555682659149, -0.08566147834062576, -0.07394739985466003, -0.062233325093984604, -0.050519246608018875, -0.038805171847343445, -0.027091093361377716, -0.015377014875411987, -0.003662937320768833, 0.008051140233874321, 0.0197652168571949, 0.03147929534316063, 0.04319337382912636, 0.05490744858980179, 0.06662152707576752, 0.07833560556173325, 0.09004968404769897, 0.1017637625336647, 0.11347784101963043, 0.12519191205501556, 0.1369059979915619, 0.14862006902694702, 0.16033414006233215, 0.17204822599887848, 0.1837622970342636, 0.19547638297080994, 0.20719045400619507, 0.2189045399427414, 0.23061861097812653, 0.24233269691467285, 0.254046767950058, 0.2657608389854431, 0.27747491002082825, 0.2891889810562134, 0.3009030818939209, 0.31261715292930603, 0.32433122396469116, 0.3360452950000763, 0.3477593660354614, 0.35947346687316895]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 7.0, 3.0, 10.0, 13.0, 10.0, 12.0, 11.0, 10.0, 23.0, 27.0, 23.0, 27.0, 37.0, 26.0, 31.0, 38.0, 29.0, 54.0, 52.0, 47.0, 50.0, 32.0, 51.0, 41.0, 40.0, 34.0, 38.0, 37.0, 26.0, 29.0, 22.0, 16.0, 15.0, 17.0, 13.0, 9.0, 14.0, 12.0, 7.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.9140625, -5.71826171875, -5.5224609375, -5.32666015625, -5.130859375, -4.93505859375, -4.7392578125, -4.54345703125, -4.34765625, -4.15185546875, -3.9560546875, -3.76025390625, -3.564453125, -3.36865234375, -3.1728515625, -2.97705078125, -2.78125, -2.58544921875, -2.3896484375, -2.19384765625, -1.998046875, -1.80224609375, -1.6064453125, -1.41064453125, -1.21484375, -1.01904296875, -0.8232421875, -0.62744140625, -0.431640625, -0.23583984375, -0.0400390625, 0.15576171875, 0.3515625, 0.54736328125, 0.7431640625, 0.93896484375, 1.134765625, 1.33056640625, 1.5263671875, 1.72216796875, 1.91796875, 2.11376953125, 2.3095703125, 2.50537109375, 2.701171875, 2.89697265625, 3.0927734375, 3.28857421875, 3.484375, 3.68017578125, 3.8759765625, 4.07177734375, 4.267578125, 4.46337890625, 4.6591796875, 4.85498046875, 5.05078125, 5.24658203125, 5.4423828125, 5.63818359375, 5.833984375, 6.02978515625, 6.2255859375, 6.42138671875, 6.6171875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 10.0, 10.0, 9.0, 13.0, 18.0, 29.0, 40.0, 60.0, 86.0, 122.0, 179.0, 284.0, 564.0, 1109.0, 2478.0, 6469.0, 18473.0, 54940.0, 161450.0, 431108.0, 243882.0, 82683.0, 28156.0, 9620.0, 3537.0, 1454.0, 705.0, 409.0, 208.0, 137.0, 94.0, 55.0, 40.0, 34.0, 16.0, 22.0, 13.0, 9.0, 12.0, 3.0, 2.0, 6.0, 1.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.3203125, -8.0491943359375, -7.778076171875, -7.5069580078125, -7.23583984375, -6.9647216796875, -6.693603515625, -6.4224853515625, -6.1513671875, -5.8802490234375, -5.609130859375, -5.3380126953125, -5.06689453125, -4.7957763671875, -4.524658203125, -4.2535400390625, -3.982421875, -3.7113037109375, -3.440185546875, -3.1690673828125, -2.89794921875, -2.6268310546875, -2.355712890625, -2.0845947265625, -1.8134765625, -1.5423583984375, -1.271240234375, -1.0001220703125, -0.72900390625, -0.4578857421875, -0.186767578125, 0.0843505859375, 0.35546875, 0.6265869140625, 0.897705078125, 1.1688232421875, 1.43994140625, 1.7110595703125, 1.982177734375, 2.2532958984375, 2.5244140625, 2.7955322265625, 3.066650390625, 3.3377685546875, 3.60888671875, 3.8800048828125, 4.151123046875, 4.4222412109375, 4.693359375, 4.9644775390625, 5.235595703125, 5.5067138671875, 5.77783203125, 6.0489501953125, 6.320068359375, 6.5911865234375, 6.8623046875, 7.1334228515625, 7.404541015625, 7.6756591796875, 7.94677734375, 8.2178955078125, 8.489013671875, 8.7601318359375, 9.03125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 8.0, 9.0, 13.0, 23.0, 19.0, 19.0, 13.0, 39.0, 41.0, 39.0, 53.0, 71.0, 69.0, 132.0, 210.0, 1428.0, 267.0, 138.0, 101.0, 65.0, 36.0, 35.0, 52.0, 32.0, 28.0, 22.0, 16.0, 19.0, 17.0, 7.0, 6.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.75, -22.006103515625, -21.26220703125, -20.518310546875, -19.7744140625, -19.030517578125, -18.28662109375, -17.542724609375, -16.798828125, -16.054931640625, -15.31103515625, -14.567138671875, -13.8232421875, -13.079345703125, -12.33544921875, -11.591552734375, -10.84765625, -10.103759765625, -9.35986328125, -8.615966796875, -7.8720703125, -7.128173828125, -6.38427734375, -5.640380859375, -4.896484375, -4.152587890625, -3.40869140625, -2.664794921875, -1.9208984375, -1.177001953125, -0.43310546875, 0.310791015625, 1.0546875, 1.798583984375, 2.54248046875, 3.286376953125, 4.0302734375, 4.774169921875, 5.51806640625, 6.261962890625, 7.005859375, 7.749755859375, 8.49365234375, 9.237548828125, 9.9814453125, 10.725341796875, 11.46923828125, 12.213134765625, 12.95703125, 13.700927734375, 14.44482421875, 15.188720703125, 15.9326171875, 16.676513671875, 17.42041015625, 18.164306640625, 18.908203125, 19.652099609375, 20.39599609375, 21.139892578125, 21.8837890625, 22.627685546875, 23.37158203125, 24.115478515625, 24.859375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 18.0, 26.0, 60.0, 70.0, 168.0, 383.0, 1766.0, 269865.0, 2869196.0, 3210.0, 510.0, 199.0, 98.0, 50.0, 35.0, 14.0, 12.0, 6.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.6875, -95.4111328125, -92.134765625, -88.8583984375, -85.58203125, -82.3056640625, -79.029296875, -75.7529296875, -72.4765625, -69.2001953125, -65.923828125, -62.6474609375, -59.37109375, -56.0947265625, -52.818359375, -49.5419921875, -46.265625, -42.9892578125, -39.712890625, -36.4365234375, -33.16015625, -29.8837890625, -26.607421875, -23.3310546875, -20.0546875, -16.7783203125, -13.501953125, -10.2255859375, -6.94921875, -3.6728515625, -0.396484375, 2.8798828125, 6.15625, 9.4326171875, 12.708984375, 15.9853515625, 19.26171875, 22.5380859375, 25.814453125, 29.0908203125, 32.3671875, 35.6435546875, 38.919921875, 42.1962890625, 45.47265625, 48.7490234375, 52.025390625, 55.3017578125, 58.578125, 61.8544921875, 65.130859375, 68.4072265625, 71.68359375, 74.9599609375, 78.236328125, 81.5126953125, 84.7890625, 88.0654296875, 91.341796875, 94.6181640625, 97.89453125, 101.1708984375, 104.447265625, 107.7236328125, 111.0]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 257.0, 757.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1223.1302490234375, -1202.4288330078125, -1181.7274169921875, -1161.02587890625, -1140.324462890625, -1119.623046875, -1098.921630859375, -1078.22021484375, -1057.518798828125, -1036.8173828125, -1016.1159057617188, -995.4144897460938, -974.7130126953125, -954.0115966796875, -933.3101806640625, -912.6087646484375, -891.9072265625, -871.205810546875, -850.5043334960938, -829.8029174804688, -809.1014404296875, -788.4000244140625, -767.6986083984375, -746.9971923828125, -726.2957153320312, -705.5942993164062, -684.892822265625, -664.19140625, -643.489990234375, -622.7885131835938, -602.0870971679688, -581.3856201171875, -560.6841430664062, -539.9827270507812, -519.28125, -498.579833984375, -477.8783874511719, -457.17694091796875, -436.47552490234375, -415.7740783691406, -395.0726318359375, -374.3711853027344, -353.66973876953125, -332.96832275390625, -312.2668762207031, -291.5654296875, -270.864013671875, -250.16256713867188, -229.46112060546875, -208.75967407226562, -188.05824279785156, -167.3568115234375, -146.65536499023438, -125.95392608642578, -105.25248718261719, -84.55105590820312, -63.84961700439453, -43.14817810058594, -22.446739196777344, -1.74530029296875, 18.956138610839844, 39.65757751464844, 60.35901641845703, 81.0604476928711, 101.76189422607422]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 9.0, 10.0, 18.0, 9.0, 9.0, 14.0, 17.0, 8.0, 21.0, 26.0, 35.0, 35.0, 37.0, 37.0, 32.0, 33.0, 37.0, 40.0, 41.0, 50.0, 27.0, 47.0, 43.0, 26.0, 39.0, 38.0, 31.0, 30.0, 30.0, 31.0, 21.0, 15.0, 20.0, 10.0, 13.0, 11.0, 5.0, 12.0, 8.0, 4.0, 3.0, 4.0, 3.0, 4.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0], "bins": [-56.05120849609375, -54.31155014038086, -52.57189178466797, -50.83222961425781, -49.09257125854492, -47.35291290283203, -45.61325454711914, -43.87359619140625, -42.133934020996094, -40.3942756652832, -38.65461730957031, -36.914955139160156, -35.175296783447266, -33.435638427734375, -31.695980072021484, -29.956321716308594, -28.216663360595703, -26.477005004882812, -24.73734474182129, -22.9976863861084, -21.258026123046875, -19.518367767333984, -17.778709411621094, -16.039051055908203, -14.29939079284668, -12.559731483459473, -10.820072174072266, -9.080413818359375, -7.340754508972168, -5.601095199584961, -3.8614368438720703, -2.1217775344848633, -0.3821144104003906, 1.3575446605682373, 3.0972037315368652, 4.836862564086914, 6.576521873474121, 8.316181182861328, 10.055839538574219, 11.795498847961426, 13.535158157348633, 15.27481746673584, 17.014476776123047, 18.754135131835938, 20.493793487548828, 22.23345375061035, 23.973112106323242, 25.712772369384766, 27.452430725097656, 29.192089080810547, 30.93174934387207, 32.671409606933594, 34.411067962646484, 36.150726318359375, 37.890384674072266, 39.630043029785156, 41.36970520019531, 43.1093635559082, 44.849021911621094, 46.58868408203125, 48.32834243774414, 50.06800079345703, 51.80765914916992, 53.54731750488281, 55.2869758605957]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 5.0, 7.0, 7.0, 20.0, 13.0, 12.0, 20.0, 26.0, 16.0, 22.0, 30.0, 38.0, 37.0, 41.0, 55.0, 53.0, 61.0, 52.0, 41.0, 45.0, 45.0, 52.0, 44.0, 42.0, 31.0, 25.0, 30.0, 25.0, 24.0, 20.0, 16.0, 11.0, 12.0, 10.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.44140625, -7.19964599609375, -6.9578857421875, -6.71612548828125, -6.474365234375, -6.23260498046875, -5.9908447265625, -5.74908447265625, -5.50732421875, -5.26556396484375, -5.0238037109375, -4.78204345703125, -4.540283203125, -4.29852294921875, -4.0567626953125, -3.81500244140625, -3.5732421875, -3.33148193359375, -3.0897216796875, -2.84796142578125, -2.606201171875, -2.36444091796875, -2.1226806640625, -1.88092041015625, -1.63916015625, -1.39739990234375, -1.1556396484375, -0.91387939453125, -0.672119140625, -0.43035888671875, -0.1885986328125, 0.05316162109375, 0.294921875, 0.53668212890625, 0.7784423828125, 1.02020263671875, 1.261962890625, 1.50372314453125, 1.7454833984375, 1.98724365234375, 2.22900390625, 2.47076416015625, 2.7125244140625, 2.95428466796875, 3.196044921875, 3.43780517578125, 3.6795654296875, 3.92132568359375, 4.1630859375, 4.40484619140625, 4.6466064453125, 4.88836669921875, 5.130126953125, 5.37188720703125, 5.6136474609375, 5.85540771484375, 6.09716796875, 6.33892822265625, 6.5806884765625, 6.82244873046875, 7.064208984375, 7.30596923828125, 7.5477294921875, 7.78948974609375, 8.03125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 7.0, 8.0, 15.0, 22.0, 20.0, 24.0, 45.0, 71.0, 78.0, 124.0, 163.0, 250.0, 380.0, 539.0, 927.0, 1475.0, 2583.0, 4987.0, 11022.0, 28109.0, 90206.0, 363572.0, 1306365.0, 1635709.0, 549640.0, 132441.0, 37548.0, 13684.0, 6258.0, 3143.0, 1731.0, 1077.0, 667.0, 399.0, 301.0, 188.0, 139.0, 105.0, 81.0, 48.0, 38.0, 30.0, 13.0, 21.0, 7.0, 9.0, 6.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.328125, -9.008056640625, -8.68798828125, -8.367919921875, -8.0478515625, -7.727783203125, -7.40771484375, -7.087646484375, -6.767578125, -6.447509765625, -6.12744140625, -5.807373046875, -5.4873046875, -5.167236328125, -4.84716796875, -4.527099609375, -4.20703125, -3.886962890625, -3.56689453125, -3.246826171875, -2.9267578125, -2.606689453125, -2.28662109375, -1.966552734375, -1.646484375, -1.326416015625, -1.00634765625, -0.686279296875, -0.3662109375, -0.046142578125, 0.27392578125, 0.593994140625, 0.9140625, 1.234130859375, 1.55419921875, 1.874267578125, 2.1943359375, 2.514404296875, 2.83447265625, 3.154541015625, 3.474609375, 3.794677734375, 4.11474609375, 4.434814453125, 4.7548828125, 5.074951171875, 5.39501953125, 5.715087890625, 6.03515625, 6.355224609375, 6.67529296875, 6.995361328125, 7.3154296875, 7.635498046875, 7.95556640625, 8.275634765625, 8.595703125, 8.915771484375, 9.23583984375, 9.555908203125, 9.8759765625, 10.196044921875, 10.51611328125, 10.836181640625, 11.15625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 13.0, 12.0, 27.0, 23.0, 26.0, 34.0, 41.0, 72.0, 108.0, 153.0, 169.0, 228.0, 318.0, 376.0, 445.0, 497.0, 403.0, 296.0, 233.0, 151.0, 105.0, 101.0, 51.0, 47.0, 39.0, 25.0, 19.0, 12.0, 9.0, 7.0, 7.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-13.640625, -13.259521484375, -12.87841796875, -12.497314453125, -12.1162109375, -11.735107421875, -11.35400390625, -10.972900390625, -10.591796875, -10.210693359375, -9.82958984375, -9.448486328125, -9.0673828125, -8.686279296875, -8.30517578125, -7.924072265625, -7.54296875, -7.161865234375, -6.78076171875, -6.399658203125, -6.0185546875, -5.637451171875, -5.25634765625, -4.875244140625, -4.494140625, -4.113037109375, -3.73193359375, -3.350830078125, -2.9697265625, -2.588623046875, -2.20751953125, -1.826416015625, -1.4453125, -1.064208984375, -0.68310546875, -0.302001953125, 0.0791015625, 0.460205078125, 0.84130859375, 1.222412109375, 1.603515625, 1.984619140625, 2.36572265625, 2.746826171875, 3.1279296875, 3.509033203125, 3.89013671875, 4.271240234375, 4.65234375, 5.033447265625, 5.41455078125, 5.795654296875, 6.1767578125, 6.557861328125, 6.93896484375, 7.320068359375, 7.701171875, 8.082275390625, 8.46337890625, 8.844482421875, 9.2255859375, 9.606689453125, 9.98779296875, 10.368896484375, 10.75]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 14.0, 12.0, 24.0, 27.0, 54.0, 101.0, 151.0, 300.0, 640.0, 1789.0, 25912.0, 3810552.0, 348468.0, 4438.0, 884.0, 387.0, 216.0, 114.0, 63.0, 36.0, 34.0, 25.0, 12.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.125, -38.1904296875, -36.255859375, -34.3212890625, -32.38671875, -30.4521484375, -28.517578125, -26.5830078125, -24.6484375, -22.7138671875, -20.779296875, -18.8447265625, -16.91015625, -14.9755859375, -13.041015625, -11.1064453125, -9.171875, -7.2373046875, -5.302734375, -3.3681640625, -1.43359375, 0.5009765625, 2.435546875, 4.3701171875, 6.3046875, 8.2392578125, 10.173828125, 12.1083984375, 14.04296875, 15.9775390625, 17.912109375, 19.8466796875, 21.78125, 23.7158203125, 25.650390625, 27.5849609375, 29.51953125, 31.4541015625, 33.388671875, 35.3232421875, 37.2578125, 39.1923828125, 41.126953125, 43.0615234375, 44.99609375, 46.9306640625, 48.865234375, 50.7998046875, 52.734375, 54.6689453125, 56.603515625, 58.5380859375, 60.47265625, 62.4072265625, 64.341796875, 66.2763671875, 68.2109375, 70.1455078125, 72.080078125, 74.0146484375, 75.94921875, 77.8837890625, 79.818359375, 81.7529296875, 83.6875]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 343.0, 660.0, 9.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-633.7293701171875, -615.1734008789062, -596.6173706054688, -578.0614013671875, -559.50537109375, -540.9494018554688, -522.3933715820312, -503.83740234375, -485.2813720703125, -466.7253723144531, -448.16937255859375, -429.6133728027344, -411.057373046875, -392.5013732910156, -373.94537353515625, -355.389404296875, -336.8334045410156, -318.27740478515625, -299.7214050292969, -281.1654052734375, -262.6094055175781, -244.05340576171875, -225.49742126464844, -206.94142150878906, -188.3854217529297, -169.8294219970703, -151.27342224121094, -132.71743774414062, -114.16143035888672, -95.60543060302734, -77.0494384765625, -58.493438720703125, -39.93743896484375, -21.381441116333008, -2.8254432678222656, 15.730552673339844, 34.28655242919922, 52.842552185058594, 71.39854431152344, 89.95454406738281, 108.51054382324219, 127.06654357910156, 145.62254333496094, 164.17852783203125, 182.73452758789062, 201.29052734375, 219.84652709960938, 238.40252685546875, 256.9585266113281, 275.5145263671875, 294.0705261230469, 312.62652587890625, 331.1825256347656, 349.738525390625, 368.29449462890625, 386.85052490234375, 405.406494140625, 423.9624938964844, 442.51849365234375, 461.0744934082031, 479.6304931640625, 498.1864929199219, 516.7424926757812, 535.2984619140625, 553.8544921875]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 6.0, 4.0, 5.0, 8.0, 10.0, 13.0, 16.0, 10.0, 18.0, 29.0, 26.0, 17.0, 31.0, 34.0, 32.0, 36.0, 42.0, 28.0, 39.0, 42.0, 40.0, 47.0, 38.0, 43.0, 35.0, 35.0, 35.0, 33.0, 33.0, 28.0, 27.0, 20.0, 30.0, 18.0, 10.0, 18.0, 15.0, 15.0, 11.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.11483383178711, -41.77745056152344, -40.44007110595703, -39.10268783569336, -37.76530838012695, -36.42792510986328, -35.090545654296875, -33.7531623840332, -32.4157829284668, -31.078401565551758, -29.74102020263672, -28.40363883972168, -27.06625747680664, -25.7288761138916, -24.391494750976562, -23.05411148071289, -21.71673011779785, -20.379348754882812, -19.041967391967773, -17.704586029052734, -16.367204666137695, -15.029823303222656, -13.6924409866333, -12.355059623718262, -11.017678260803223, -9.680296897888184, -8.342915534973145, -7.005533695220947, -5.668152332305908, -4.330770969390869, -2.993389129638672, -1.6560077667236328, -0.31862640380859375, 1.0187550783157349, 2.3561365604400635, 3.6935181617736816, 5.030899524688721, 6.36828088760376, 7.705662727355957, 9.043044090270996, 10.380425453186035, 11.717806816101074, 13.055188179016113, 14.392570495605469, 15.729951858520508, 17.067333221435547, 18.404714584350586, 19.742095947265625, 21.079477310180664, 22.416858673095703, 23.754240036010742, 25.09162139892578, 26.42900276184082, 27.76638412475586, 29.10376739501953, 30.441146850585938, 31.77853012084961, 33.11591339111328, 34.45329284667969, 35.79067611694336, 37.128055572509766, 38.46543884277344, 39.802818298339844, 41.140201568603516, 42.47758102416992]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 11.0, 3.0, 5.0, 8.0, 6.0, 10.0, 17.0, 13.0, 24.0, 28.0, 23.0, 28.0, 42.0, 40.0, 47.0, 54.0, 49.0, 51.0, 53.0, 50.0, 47.0, 54.0, 45.0, 44.0, 44.0, 40.0, 38.0, 26.0, 26.0, 22.0, 12.0, 10.0, 12.0, 9.0, 7.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.625, -7.38519287109375, -7.1453857421875, -6.90557861328125, -6.665771484375, -6.42596435546875, -6.1861572265625, -5.94635009765625, -5.70654296875, -5.46673583984375, -5.2269287109375, -4.98712158203125, -4.747314453125, -4.50750732421875, -4.2677001953125, -4.02789306640625, -3.7880859375, -3.54827880859375, -3.3084716796875, -3.06866455078125, -2.828857421875, -2.58905029296875, -2.3492431640625, -2.10943603515625, -1.86962890625, -1.62982177734375, -1.3900146484375, -1.15020751953125, -0.910400390625, -0.67059326171875, -0.4307861328125, -0.19097900390625, 0.048828125, 0.28863525390625, 0.5284423828125, 0.76824951171875, 1.008056640625, 1.24786376953125, 1.4876708984375, 1.72747802734375, 1.96728515625, 2.20709228515625, 2.4468994140625, 2.68670654296875, 2.926513671875, 3.16632080078125, 3.4061279296875, 3.64593505859375, 3.8857421875, 4.12554931640625, 4.3653564453125, 4.60516357421875, 4.844970703125, 5.08477783203125, 5.3245849609375, 5.56439208984375, 5.80419921875, 6.04400634765625, 6.2838134765625, 6.52362060546875, 6.763427734375, 7.00323486328125, 7.2430419921875, 7.48284912109375, 7.72265625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 8.0, 9.0, 11.0, 13.0, 29.0, 53.0, 48.0, 112.0, 146.0, 213.0, 394.0, 599.0, 928.0, 1596.0, 2680.0, 4424.0, 7649.0, 12980.0, 22251.0, 37959.0, 62812.0, 98962.0, 142252.0, 169506.0, 159391.0, 121405.0, 80478.0, 49914.0, 29550.0, 17221.0, 10165.0, 5898.0, 3483.0, 2045.0, 1292.0, 780.0, 478.0, 315.0, 173.0, 113.0, 78.0, 55.0, 32.0, 22.0, 11.0, 11.0, 7.0, 6.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.46875, -1.4252471923828125, -1.381744384765625, -1.3382415771484375, -1.29473876953125, -1.2512359619140625, -1.207733154296875, -1.1642303466796875, -1.1207275390625, -1.0772247314453125, -1.033721923828125, -0.9902191162109375, -0.94671630859375, -0.9032135009765625, -0.859710693359375, -0.8162078857421875, -0.772705078125, -0.7292022705078125, -0.685699462890625, -0.6421966552734375, -0.59869384765625, -0.5551910400390625, -0.511688232421875, -0.4681854248046875, -0.4246826171875, -0.3811798095703125, -0.337677001953125, -0.2941741943359375, -0.25067138671875, -0.2071685791015625, -0.163665771484375, -0.1201629638671875, -0.07666015625, -0.0331573486328125, 0.010345458984375, 0.0538482666015625, 0.09735107421875, 0.1408538818359375, 0.184356689453125, 0.2278594970703125, 0.2713623046875, 0.3148651123046875, 0.358367919921875, 0.4018707275390625, 0.44537353515625, 0.4888763427734375, 0.532379150390625, 0.5758819580078125, 0.619384765625, 0.6628875732421875, 0.706390380859375, 0.7498931884765625, 0.79339599609375, 0.8368988037109375, 0.880401611328125, 0.9239044189453125, 0.9674072265625, 1.0109100341796875, 1.054412841796875, 1.0979156494140625, 1.14141845703125, 1.1849212646484375, 1.228424072265625, 1.2719268798828125, 1.3154296875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 6.0, 2.0, 3.0, 8.0, 1.0, 8.0, 5.0, 11.0, 11.0, 13.0, 11.0, 16.0, 11.0, 29.0, 25.0, 34.0, 34.0, 26.0, 27.0, 39.0, 32.0, 52.0, 35.0, 32.0, 1065.0, 41.0, 41.0, 40.0, 32.0, 33.0, 44.0, 29.0, 26.0, 33.0, 25.0, 16.0, 18.0, 13.0, 23.0, 11.0, 13.0, 8.0, 7.0, 11.0, 9.0, 6.0, 5.0, 2.0, 7.0, 2.0, 0.0, 2.0, 4.0], "bins": [-4.98828125, -4.848541259765625, -4.70880126953125, -4.569061279296875, -4.4293212890625, -4.289581298828125, -4.14984130859375, -4.010101318359375, -3.870361328125, -3.730621337890625, -3.59088134765625, -3.451141357421875, -3.3114013671875, -3.171661376953125, -3.03192138671875, -2.892181396484375, -2.75244140625, -2.612701416015625, -2.47296142578125, -2.333221435546875, -2.1934814453125, -2.053741455078125, -1.91400146484375, -1.774261474609375, -1.634521484375, -1.494781494140625, -1.35504150390625, -1.215301513671875, -1.0755615234375, -0.935821533203125, -0.79608154296875, -0.656341552734375, -0.5166015625, -0.376861572265625, -0.23712158203125, -0.097381591796875, 0.0423583984375, 0.182098388671875, 0.32183837890625, 0.461578369140625, 0.601318359375, 0.741058349609375, 0.88079833984375, 1.020538330078125, 1.1602783203125, 1.300018310546875, 1.43975830078125, 1.579498291015625, 1.71923828125, 1.858978271484375, 1.99871826171875, 2.138458251953125, 2.2781982421875, 2.417938232421875, 2.55767822265625, 2.697418212890625, 2.837158203125, 2.976898193359375, 3.11663818359375, 3.256378173828125, 3.3961181640625, 3.535858154296875, 3.67559814453125, 3.815338134765625, 3.955078125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 11.0, 7.0, 14.0, 14.0, 27.0, 42.0, 43.0, 67.0, 90.0, 136.0, 209.0, 302.0, 415.0, 619.0, 898.0, 1263.0, 1938.0, 2870.0, 4240.0, 6260.0, 9376.0, 14328.0, 23431.0, 60576.0, 1415024.0, 446283.0, 46858.0, 21118.0, 13326.0, 8712.0, 5930.0, 4022.0, 2662.0, 1891.0, 1282.0, 881.0, 618.0, 381.0, 293.0, 201.0, 145.0, 103.0, 66.0, 38.0, 33.0, 22.0, 21.0, 17.0, 10.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.193359375, -2.126708984375, -2.06005859375, -1.993408203125, -1.9267578125, -1.860107421875, -1.79345703125, -1.726806640625, -1.66015625, -1.593505859375, -1.52685546875, -1.460205078125, -1.3935546875, -1.326904296875, -1.26025390625, -1.193603515625, -1.126953125, -1.060302734375, -0.99365234375, -0.927001953125, -0.8603515625, -0.793701171875, -0.72705078125, -0.660400390625, -0.59375, -0.527099609375, -0.46044921875, -0.393798828125, -0.3271484375, -0.260498046875, -0.19384765625, -0.127197265625, -0.060546875, 0.006103515625, 0.07275390625, 0.139404296875, 0.2060546875, 0.272705078125, 0.33935546875, 0.406005859375, 0.47265625, 0.539306640625, 0.60595703125, 0.672607421875, 0.7392578125, 0.805908203125, 0.87255859375, 0.939208984375, 1.005859375, 1.072509765625, 1.13916015625, 1.205810546875, 1.2724609375, 1.339111328125, 1.40576171875, 1.472412109375, 1.5390625, 1.605712890625, 1.67236328125, 1.739013671875, 1.8056640625, 1.872314453125, 1.93896484375, 2.005615234375, 2.072265625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 6.0, 14.0, 11.0, 21.0, 31.0, 36.0, 45.0, 54.0, 61.0, 79.0, 83.0, 82.0, 87.0, 67.0, 76.0, 58.0, 43.0, 33.0, 22.0, 16.0, 16.0, 9.0, 11.0, 7.0, 8.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1824951171875, -0.1771526336669922, -0.17181015014648438, -0.16646766662597656, -0.16112518310546875, -0.15578269958496094, -0.15044021606445312, -0.1450977325439453, -0.1397552490234375, -0.1344127655029297, -0.12907028198242188, -0.12372779846191406, -0.11838531494140625, -0.11304283142089844, -0.10770034790039062, -0.10235786437988281, -0.097015380859375, -0.09167289733886719, -0.08633041381835938, -0.08098793029785156, -0.07564544677734375, -0.07030296325683594, -0.06496047973632812, -0.05961799621582031, -0.0542755126953125, -0.04893302917480469, -0.043590545654296875, -0.03824806213378906, -0.03290557861328125, -0.027563095092773438, -0.022220611572265625, -0.016878128051757812, -0.01153564453125, -0.0061931610107421875, -0.000850677490234375, 0.0044918060302734375, 0.00983428955078125, 0.015176773071289062, 0.020519256591796875, 0.025861740112304688, 0.0312042236328125, 0.03654670715332031, 0.041889190673828125, 0.04723167419433594, 0.05257415771484375, 0.05791664123535156, 0.06325912475585938, 0.06860160827636719, 0.073944091796875, 0.07928657531738281, 0.08462905883789062, 0.08997154235839844, 0.09531402587890625, 0.10065650939941406, 0.10599899291992188, 0.11134147644042969, 0.1166839599609375, 0.12202644348144531, 0.12736892700195312, 0.13271141052246094, 0.13805389404296875, 0.14339637756347656, 0.14873886108398438, 0.1540813446044922, 0.159423828125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 4.0, 6.0, 9.0, 12.0, 14.0, 17.0, 24.0, 27.0, 34.0, 80.0, 128.0, 169.0, 395.0, 2905.0, 704222.0, 337790.0, 1917.0, 353.0, 143.0, 99.0, 56.0, 48.0, 35.0, 19.0, 8.0, 12.0, 7.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.337890625, -3.226409912109375, -3.11492919921875, -3.003448486328125, -2.8919677734375, -2.780487060546875, -2.66900634765625, -2.557525634765625, -2.446044921875, -2.334564208984375, -2.22308349609375, -2.111602783203125, -2.0001220703125, -1.888641357421875, -1.77716064453125, -1.665679931640625, -1.55419921875, -1.442718505859375, -1.33123779296875, -1.219757080078125, -1.1082763671875, -0.996795654296875, -0.88531494140625, -0.773834228515625, -0.662353515625, -0.550872802734375, -0.43939208984375, -0.327911376953125, -0.2164306640625, -0.104949951171875, 0.00653076171875, 0.118011474609375, 0.2294921875, 0.340972900390625, 0.45245361328125, 0.563934326171875, 0.6754150390625, 0.786895751953125, 0.89837646484375, 1.009857177734375, 1.121337890625, 1.232818603515625, 1.34429931640625, 1.455780029296875, 1.5672607421875, 1.678741455078125, 1.79022216796875, 1.901702880859375, 2.01318359375, 2.124664306640625, 2.23614501953125, 2.347625732421875, 2.4591064453125, 2.570587158203125, 2.68206787109375, 2.793548583984375, 2.905029296875, 3.016510009765625, 3.12799072265625, 3.239471435546875, 3.3509521484375, 3.462432861328125, 3.57391357421875, 3.685394287109375, 3.796875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 2.0, 4.0, 10.0, 8.0, 23.0, 37.0, 58.0, 111.0, 239.0, 230.0, 131.0, 63.0, 42.0, 20.0, 21.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9322048425674438, -0.9048234820365906, -0.8774421215057373, -0.850060760974884, -0.8226794004440308, -0.7952980399131775, -0.7679166793823242, -0.7405353784561157, -0.7131539583206177, -0.6857725977897644, -0.6583912372589111, -0.6310098767280579, -0.6036285161972046, -0.5762471556663513, -0.548865795135498, -0.5214844942092896, -0.4941031336784363, -0.466721773147583, -0.43934041261672974, -0.41195905208587646, -0.3845776915550232, -0.3571963310241699, -0.32981500029563904, -0.30243363976478577, -0.2750522792339325, -0.24767091870307922, -0.22028955817222595, -0.19290821254253387, -0.1655268520116806, -0.13814549148082733, -0.11076414585113525, -0.08338278532028198, -0.056001365184783936, -0.028620008379220963, -0.0012386515736579895, 0.026142701506614685, 0.05352406203746796, 0.08090542256832123, 0.1082867681980133, 0.13566812872886658, 0.16304948925971985, 0.19043084979057312, 0.2178122103214264, 0.24519355595111847, 0.27257490158081055, 0.2999562621116638, 0.3273376226425171, 0.35471898317337036, 0.38210034370422363, 0.4094817042350769, 0.4368630647659302, 0.46424442529678345, 0.4916257858276367, 0.51900714635849, 0.5463885068893433, 0.5737698078155518, 0.6011512279510498, 0.6285325884819031, 0.6559139490127563, 0.6832953095436096, 0.7106766700744629, 0.7380580306053162, 0.7654393911361694, 0.7928206920623779, 0.8202020525932312]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 8.0, 4.0, 3.0, 14.0, 5.0, 10.0, 12.0, 17.0, 22.0, 18.0, 10.0, 19.0, 30.0, 26.0, 32.0, 33.0, 31.0, 41.0, 32.0, 35.0, 48.0, 36.0, 45.0, 34.0, 30.0, 38.0, 36.0, 35.0, 33.0, 27.0, 27.0, 24.0, 28.0, 30.0, 14.0, 16.0, 11.0, 12.0, 19.0, 10.0, 4.0, 6.0, 6.0, 8.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.16295462846755981, -0.1579987108707428, -0.15304279327392578, -0.14808687567710876, -0.14313095808029175, -0.13817502558231354, -0.13321910798549652, -0.1282631903886795, -0.12330727279186249, -0.11835135519504547, -0.11339543759822845, -0.10843951255083084, -0.10348359495401382, -0.09852767735719681, -0.0935717523097992, -0.08861583471298218, -0.08365991711616516, -0.07870399951934814, -0.07374808192253113, -0.06879215687513351, -0.0638362392783165, -0.05888032168149948, -0.053924400359392166, -0.04896847903728485, -0.044012561440467834, -0.03905664384365082, -0.0341007225215435, -0.029144803062081337, -0.02418888360261917, -0.019232964143157005, -0.01427704468369484, -0.009321123361587524, -0.004365205764770508, 0.000590713694691658, 0.005546633154153824, 0.01050255261361599, 0.015458472073078156, 0.02041439153254032, 0.025370310992002487, 0.030326232314109802, 0.03528214991092682, 0.040238067507743835, 0.04519398882985115, 0.050149910151958466, 0.05510582774877548, 0.0600617453455925, 0.06501767039299011, 0.06997358798980713, 0.07492950558662415, 0.07988542318344116, 0.08484134078025818, 0.08979726582765579, 0.09475318342447281, 0.09970910102128983, 0.10466502606868744, 0.10962094366550446, 0.11457686126232147, 0.11953277885913849, 0.1244886964559555, 0.12944461405277252, 0.13440054655075073, 0.13935646414756775, 0.14431238174438477, 0.14926829934120178, 0.1542242169380188]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 5.0, 6.0, 10.0, 8.0, 10.0, 12.0, 20.0, 19.0, 18.0, 29.0, 47.0, 36.0, 41.0, 44.0, 44.0, 53.0, 45.0, 53.0, 56.0, 53.0, 51.0, 49.0, 40.0, 48.0, 47.0, 34.0, 25.0, 23.0, 10.0, 14.0, 15.0, 12.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75, -6.507080078125, -6.26416015625, -6.021240234375, -5.7783203125, -5.535400390625, -5.29248046875, -5.049560546875, -4.806640625, -4.563720703125, -4.32080078125, -4.077880859375, -3.8349609375, -3.592041015625, -3.34912109375, -3.106201171875, -2.86328125, -2.620361328125, -2.37744140625, -2.134521484375, -1.8916015625, -1.648681640625, -1.40576171875, -1.162841796875, -0.919921875, -0.677001953125, -0.43408203125, -0.191162109375, 0.0517578125, 0.294677734375, 0.53759765625, 0.780517578125, 1.0234375, 1.266357421875, 1.50927734375, 1.752197265625, 1.9951171875, 2.238037109375, 2.48095703125, 2.723876953125, 2.966796875, 3.209716796875, 3.45263671875, 3.695556640625, 3.9384765625, 4.181396484375, 4.42431640625, 4.667236328125, 4.91015625, 5.153076171875, 5.39599609375, 5.638916015625, 5.8818359375, 6.124755859375, 6.36767578125, 6.610595703125, 6.853515625, 7.096435546875, 7.33935546875, 7.582275390625, 7.8251953125, 8.068115234375, 8.31103515625, 8.553955078125, 8.796875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 1.0, 4.0, 3.0, 11.0, 9.0, 14.0, 23.0, 35.0, 65.0, 78.0, 118.0, 217.0, 325.0, 468.0, 700.0, 1207.0, 1839.0, 3026.0, 4915.0, 8183.0, 13982.0, 24078.0, 42878.0, 78294.0, 145891.0, 228460.0, 212770.0, 125003.0, 67043.0, 36764.0, 21172.0, 12035.0, 7320.0, 4351.0, 2685.0, 1659.0, 1038.0, 704.0, 423.0, 283.0, 143.0, 96.0, 88.0, 64.0, 27.0, 26.0, 21.0, 10.0, 6.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9609375, -4.78912353515625, -4.6173095703125, -4.44549560546875, -4.273681640625, -4.10186767578125, -3.9300537109375, -3.75823974609375, -3.58642578125, -3.41461181640625, -3.2427978515625, -3.07098388671875, -2.899169921875, -2.72735595703125, -2.5555419921875, -2.38372802734375, -2.2119140625, -2.04010009765625, -1.8682861328125, -1.69647216796875, -1.524658203125, -1.35284423828125, -1.1810302734375, -1.00921630859375, -0.83740234375, -0.66558837890625, -0.4937744140625, -0.32196044921875, -0.150146484375, 0.02166748046875, 0.1934814453125, 0.36529541015625, 0.537109375, 0.70892333984375, 0.8807373046875, 1.05255126953125, 1.224365234375, 1.39617919921875, 1.5679931640625, 1.73980712890625, 1.91162109375, 2.08343505859375, 2.2552490234375, 2.42706298828125, 2.598876953125, 2.77069091796875, 2.9425048828125, 3.11431884765625, 3.2861328125, 3.45794677734375, 3.6297607421875, 3.80157470703125, 3.973388671875, 4.14520263671875, 4.3170166015625, 4.48883056640625, 4.66064453125, 4.83245849609375, 5.0042724609375, 5.17608642578125, 5.347900390625, 5.51971435546875, 5.6915283203125, 5.86334228515625, 6.03515625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 12.0, 15.0, 16.0, 23.0, 19.0, 24.0, 39.0, 45.0, 42.0, 69.0, 82.0, 168.0, 346.0, 1467.0, 219.0, 104.0, 65.0, 52.0, 48.0, 41.0, 41.0, 18.0, 22.0, 17.0, 13.0, 14.0, 6.0, 3.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.265625, -28.409912109375, -27.55419921875, -26.698486328125, -25.8427734375, -24.987060546875, -24.13134765625, -23.275634765625, -22.419921875, -21.564208984375, -20.70849609375, -19.852783203125, -18.9970703125, -18.141357421875, -17.28564453125, -16.429931640625, -15.57421875, -14.718505859375, -13.86279296875, -13.007080078125, -12.1513671875, -11.295654296875, -10.43994140625, -9.584228515625, -8.728515625, -7.872802734375, -7.01708984375, -6.161376953125, -5.3056640625, -4.449951171875, -3.59423828125, -2.738525390625, -1.8828125, -1.027099609375, -0.17138671875, 0.684326171875, 1.5400390625, 2.395751953125, 3.25146484375, 4.107177734375, 4.962890625, 5.818603515625, 6.67431640625, 7.530029296875, 8.3857421875, 9.241455078125, 10.09716796875, 10.952880859375, 11.80859375, 12.664306640625, 13.52001953125, 14.375732421875, 15.2314453125, 16.087158203125, 16.94287109375, 17.798583984375, 18.654296875, 19.510009765625, 20.36572265625, 21.221435546875, 22.0771484375, 22.932861328125, 23.78857421875, 24.644287109375, 25.5]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 0.0, 5.0, 5.0, 8.0, 13.0, 16.0, 28.0, 43.0, 48.0, 75.0, 126.0, 229.0, 392.0, 1009.0, 8077.0, 424014.0, 2679362.0, 28902.0, 2015.0, 600.0, 279.0, 146.0, 101.0, 64.0, 38.0, 43.0, 23.0, 9.0, 11.0, 9.0, 7.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.34375, -43.04736328125, -41.7509765625, -40.45458984375, -39.158203125, -37.86181640625, -36.5654296875, -35.26904296875, -33.97265625, -32.67626953125, -31.3798828125, -30.08349609375, -28.787109375, -27.49072265625, -26.1943359375, -24.89794921875, -23.6015625, -22.30517578125, -21.0087890625, -19.71240234375, -18.416015625, -17.11962890625, -15.8232421875, -14.52685546875, -13.23046875, -11.93408203125, -10.6376953125, -9.34130859375, -8.044921875, -6.74853515625, -5.4521484375, -4.15576171875, -2.859375, -1.56298828125, -0.2666015625, 1.02978515625, 2.326171875, 3.62255859375, 4.9189453125, 6.21533203125, 7.51171875, 8.80810546875, 10.1044921875, 11.40087890625, 12.697265625, 13.99365234375, 15.2900390625, 16.58642578125, 17.8828125, 19.17919921875, 20.4755859375, 21.77197265625, 23.068359375, 24.36474609375, 25.6611328125, 26.95751953125, 28.25390625, 29.55029296875, 30.8466796875, 32.14306640625, 33.439453125, 34.73583984375, 36.0322265625, 37.32861328125, 38.625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 99.0, 901.0, 17.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-723.0773315429688, -710.251953125, -697.4265747070312, -684.6011352539062, -671.7757568359375, -658.9503784179688, -646.125, -633.299560546875, -620.4741821289062, -607.6488037109375, -594.8234252929688, -581.9979858398438, -569.172607421875, -556.3472290039062, -543.5218505859375, -530.6964111328125, -517.87109375, -505.04571533203125, -492.2203063964844, -479.3949279785156, -466.56951904296875, -453.744140625, -440.91876220703125, -428.0933532714844, -415.2679443359375, -402.44256591796875, -389.6171569824219, -376.7917785644531, -363.96636962890625, -351.1409912109375, -338.31561279296875, -325.4902038574219, -312.664794921875, -299.83941650390625, -287.0140075683594, -274.1886291503906, -261.36322021484375, -248.537841796875, -235.7124481201172, -222.88705444335938, -210.0616455078125, -197.2362518310547, -184.41085815429688, -171.58547973632812, -158.76007080078125, -145.9346923828125, -133.1092987060547, -120.28390502929688, -107.4585189819336, -94.63312530517578, -81.8077392578125, -68.98234558105469, -56.156951904296875, -43.33155822753906, -30.50617218017578, -17.68077850341797, -4.855384826660156, 7.970006942749023, 20.795398712158203, 33.62078857421875, 46.44618225097656, 59.271575927734375, 72.09696197509766, 84.92235565185547, 97.74774932861328]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 7.0, 9.0, 6.0, 7.0, 15.0, 10.0, 17.0, 15.0, 16.0, 20.0, 26.0, 23.0, 24.0, 32.0, 29.0, 43.0, 46.0, 41.0, 54.0, 44.0, 35.0, 35.0, 41.0, 46.0, 46.0, 35.0, 43.0, 25.0, 34.0, 26.0, 26.0, 25.0, 19.0, 19.0, 18.0, 12.0, 12.0, 8.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.41648864746094, -54.635276794433594, -52.854061126708984, -51.07284927368164, -49.29163360595703, -47.51042175292969, -45.729209899902344, -43.947994232177734, -42.16678237915039, -40.38557052612305, -38.60435485839844, -36.823143005371094, -35.041927337646484, -33.26071548461914, -31.479501724243164, -29.698287963867188, -27.91707420349121, -26.135860443115234, -24.354646682739258, -22.57343292236328, -20.792221069335938, -19.01100730895996, -17.229793548583984, -15.448580741882324, -13.667366981506348, -11.886153221130371, -10.104940414428711, -8.323726654052734, -6.542513370513916, -4.761300086975098, -2.980086326599121, -1.198873519897461, 0.5823402404785156, 2.363553524017334, 4.144766807556152, 5.925980567932129, 7.707193851470947, 9.488407135009766, 11.269620895385742, 13.050833702087402, 14.832047462463379, 16.61326026916504, 18.394474029541016, 20.175687789916992, 21.95690155029297, 23.738113403320312, 25.519329071044922, 27.300540924072266, 29.081754684448242, 30.86296844482422, 32.64418029785156, 34.42539596557617, 36.206607818603516, 37.987823486328125, 39.76903533935547, 41.55024719238281, 43.33146286010742, 45.112674713134766, 46.893890380859375, 48.67510223388672, 50.45631790161133, 52.23752975463867, 54.01874542236328, 55.799957275390625, 57.58116912841797]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 5.0, 6.0, 5.0, 4.0, 12.0, 10.0, 10.0, 15.0, 18.0, 21.0, 25.0, 21.0, 25.0, 20.0, 31.0, 44.0, 45.0, 43.0, 39.0, 51.0, 53.0, 47.0, 41.0, 38.0, 37.0, 50.0, 38.0, 34.0, 39.0, 25.0, 32.0, 23.0, 19.0, 21.0, 10.0, 8.0, 11.0, 9.0, 4.0, 4.0, 4.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.33984375, -7.1168212890625, -6.893798828125, -6.6707763671875, -6.44775390625, -6.2247314453125, -6.001708984375, -5.7786865234375, -5.5556640625, -5.3326416015625, -5.109619140625, -4.8865966796875, -4.66357421875, -4.4405517578125, -4.217529296875, -3.9945068359375, -3.771484375, -3.5484619140625, -3.325439453125, -3.1024169921875, -2.87939453125, -2.6563720703125, -2.433349609375, -2.2103271484375, -1.9873046875, -1.7642822265625, -1.541259765625, -1.3182373046875, -1.09521484375, -0.8721923828125, -0.649169921875, -0.4261474609375, -0.203125, 0.0198974609375, 0.242919921875, 0.4659423828125, 0.68896484375, 0.9119873046875, 1.135009765625, 1.3580322265625, 1.5810546875, 1.8040771484375, 2.027099609375, 2.2501220703125, 2.47314453125, 2.6961669921875, 2.919189453125, 3.1422119140625, 3.365234375, 3.5882568359375, 3.811279296875, 4.0343017578125, 4.25732421875, 4.4803466796875, 4.703369140625, 4.9263916015625, 5.1494140625, 5.3724365234375, 5.595458984375, 5.8184814453125, 6.04150390625, 6.2645263671875, 6.487548828125, 6.7105712890625, 6.93359375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 11.0, 8.0, 11.0, 24.0, 23.0, 27.0, 39.0, 47.0, 53.0, 98.0, 109.0, 160.0, 254.0, 388.0, 498.0, 713.0, 1155.0, 1875.0, 3281.0, 6216.0, 13762.0, 37305.0, 129912.0, 567255.0, 1898838.0, 1156242.0, 265972.0, 67434.0, 22087.0, 9217.0, 4403.0, 2500.0, 1535.0, 863.0, 585.0, 352.0, 291.0, 209.0, 142.0, 88.0, 65.0, 70.0, 36.0, 40.0, 33.0, 16.0, 15.0, 12.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-10.28125, -9.96728515625, -9.6533203125, -9.33935546875, -9.025390625, -8.71142578125, -8.3974609375, -8.08349609375, -7.76953125, -7.45556640625, -7.1416015625, -6.82763671875, -6.513671875, -6.19970703125, -5.8857421875, -5.57177734375, -5.2578125, -4.94384765625, -4.6298828125, -4.31591796875, -4.001953125, -3.68798828125, -3.3740234375, -3.06005859375, -2.74609375, -2.43212890625, -2.1181640625, -1.80419921875, -1.490234375, -1.17626953125, -0.8623046875, -0.54833984375, -0.234375, 0.07958984375, 0.3935546875, 0.70751953125, 1.021484375, 1.33544921875, 1.6494140625, 1.96337890625, 2.27734375, 2.59130859375, 2.9052734375, 3.21923828125, 3.533203125, 3.84716796875, 4.1611328125, 4.47509765625, 4.7890625, 5.10302734375, 5.4169921875, 5.73095703125, 6.044921875, 6.35888671875, 6.6728515625, 6.98681640625, 7.30078125, 7.61474609375, 7.9287109375, 8.24267578125, 8.556640625, 8.87060546875, 9.1845703125, 9.49853515625, 9.8125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 7.0, 10.0, 7.0, 9.0, 14.0, 11.0, 12.0, 20.0, 23.0, 37.0, 50.0, 62.0, 79.0, 116.0, 165.0, 186.0, 301.0, 360.0, 453.0, 511.0, 417.0, 316.0, 248.0, 160.0, 135.0, 85.0, 66.0, 49.0, 36.0, 29.0, 22.0, 16.0, 13.0, 18.0, 6.0, 8.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.7890625, -11.472412109375, -11.15576171875, -10.839111328125, -10.5224609375, -10.205810546875, -9.88916015625, -9.572509765625, -9.255859375, -8.939208984375, -8.62255859375, -8.305908203125, -7.9892578125, -7.672607421875, -7.35595703125, -7.039306640625, -6.72265625, -6.406005859375, -6.08935546875, -5.772705078125, -5.4560546875, -5.139404296875, -4.82275390625, -4.506103515625, -4.189453125, -3.872802734375, -3.55615234375, -3.239501953125, -2.9228515625, -2.606201171875, -2.28955078125, -1.972900390625, -1.65625, -1.339599609375, -1.02294921875, -0.706298828125, -0.3896484375, -0.072998046875, 0.24365234375, 0.560302734375, 0.876953125, 1.193603515625, 1.51025390625, 1.826904296875, 2.1435546875, 2.460205078125, 2.77685546875, 3.093505859375, 3.41015625, 3.726806640625, 4.04345703125, 4.360107421875, 4.6767578125, 4.993408203125, 5.31005859375, 5.626708984375, 5.943359375, 6.260009765625, 6.57666015625, 6.893310546875, 7.2099609375, 7.526611328125, 7.84326171875, 8.159912109375, 8.4765625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 6.0, 8.0, 11.0, 15.0, 21.0, 24.0, 25.0, 43.0, 64.0, 89.0, 128.0, 191.0, 294.0, 556.0, 1858.0, 12927.0, 264503.0, 3646264.0, 251983.0, 12148.0, 1660.0, 549.0, 287.0, 179.0, 116.0, 91.0, 56.0, 41.0, 29.0, 25.0, 8.0, 17.0, 18.0, 6.0, 9.0, 8.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.59375, -29.48095703125, -28.3681640625, -27.25537109375, -26.142578125, -25.02978515625, -23.9169921875, -22.80419921875, -21.69140625, -20.57861328125, -19.4658203125, -18.35302734375, -17.240234375, -16.12744140625, -15.0146484375, -13.90185546875, -12.7890625, -11.67626953125, -10.5634765625, -9.45068359375, -8.337890625, -7.22509765625, -6.1123046875, -4.99951171875, -3.88671875, -2.77392578125, -1.6611328125, -0.54833984375, 0.564453125, 1.67724609375, 2.7900390625, 3.90283203125, 5.015625, 6.12841796875, 7.2412109375, 8.35400390625, 9.466796875, 10.57958984375, 11.6923828125, 12.80517578125, 13.91796875, 15.03076171875, 16.1435546875, 17.25634765625, 18.369140625, 19.48193359375, 20.5947265625, 21.70751953125, 22.8203125, 23.93310546875, 25.0458984375, 26.15869140625, 27.271484375, 28.38427734375, 29.4970703125, 30.60986328125, 31.72265625, 32.83544921875, 33.9482421875, 35.06103515625, 36.173828125, 37.28662109375, 38.3994140625, 39.51220703125, 40.625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 31.0, 145.0, 420.0, 318.0, 80.0, 12.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-216.545166015625, -210.97146606445312, -205.39776611328125, -199.82408142089844, -194.25038146972656, -188.6766815185547, -183.10299682617188, -177.529296875, -171.95559692382812, -166.38189697265625, -160.80819702148438, -155.23451232910156, -149.6608123779297, -144.0871124267578, -138.513427734375, -132.93972778320312, -127.36602783203125, -121.79232788085938, -116.21863555908203, -110.64494323730469, -105.07124328613281, -99.49754333496094, -93.9238510131836, -88.35015869140625, -82.77645874023438, -77.2027587890625, -71.62906646728516, -66.05537414550781, -60.48167419433594, -54.90797805786133, -49.33428192138672, -43.76058578491211, -38.1868896484375, -32.61319351196289, -27.03949737548828, -21.465801239013672, -15.892105102539062, -10.318408966064453, -4.744712829589844, 0.8289833068847656, 6.402679443359375, 11.976375579833984, 17.550071716308594, 23.123767852783203, 28.697463989257812, 34.27116012573242, 39.84485626220703, 45.41855239868164, 50.99224853515625, 56.56594467163086, 62.13964080810547, 67.71333312988281, 73.28703308105469, 78.86073303222656, 84.4344253540039, 90.00811767578125, 95.58181762695312, 101.155517578125, 106.72920989990234, 112.30290222167969, 117.87660217285156, 123.45030212402344, 129.02398681640625, 134.59768676757812, 140.17138671875]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 6.0, 5.0, 4.0, 10.0, 10.0, 13.0, 14.0, 10.0, 18.0, 13.0, 10.0, 21.0, 30.0, 32.0, 34.0, 31.0, 45.0, 38.0, 32.0, 40.0, 33.0, 33.0, 43.0, 37.0, 43.0, 46.0, 45.0, 32.0, 40.0, 40.0, 30.0, 28.0, 41.0, 17.0, 19.0, 15.0, 15.0, 4.0, 8.0, 7.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.599456787109375, -39.386138916015625, -38.17281723022461, -36.95949935913086, -35.746177673339844, -34.532859802246094, -33.319541931152344, -32.106224060058594, -30.892902374267578, -29.679582595825195, -28.466262817382812, -27.252944946289062, -26.03962516784668, -24.826305389404297, -23.612987518310547, -22.399667739868164, -21.18634796142578, -19.9730281829834, -18.759708404541016, -17.546390533447266, -16.333070755004883, -15.1197509765625, -13.906432151794434, -12.693113327026367, -11.479793548583984, -10.266473770141602, -9.053154945373535, -7.8398356437683105, -6.626516342163086, -5.413197040557861, -4.199877738952637, -2.9865589141845703, -1.7732429504394531, -0.5599236488342285, 0.6533956527709961, 1.8667149543762207, 3.0800342559814453, 4.29335355758667, 5.5066728591918945, 6.719991683959961, 7.933311462402344, 9.146631240844727, 10.359950065612793, 11.57326889038086, 12.786588668823242, 13.999908447265625, 15.213227272033691, 16.426546096801758, 17.63986587524414, 18.853185653686523, 20.066505432128906, 21.279823303222656, 22.49314308166504, 23.706462860107422, 24.919780731201172, 26.133100509643555, 27.346420288085938, 28.55974006652832, 29.773059844970703, 30.986377716064453, 32.19969940185547, 33.41301727294922, 34.62633514404297, 35.83965301513672, 37.052974700927734]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 8.0, 5.0, 7.0, 6.0, 10.0, 20.0, 17.0, 17.0, 19.0, 20.0, 29.0, 38.0, 28.0, 26.0, 43.0, 43.0, 55.0, 36.0, 53.0, 39.0, 50.0, 37.0, 51.0, 42.0, 41.0, 43.0, 33.0, 32.0, 24.0, 25.0, 13.0, 24.0, 12.0, 18.0, 7.0, 9.0, 7.0, 6.0, 3.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.4375, -6.2255859375, -6.013671875, -5.8017578125, -5.58984375, -5.3779296875, -5.166015625, -4.9541015625, -4.7421875, -4.5302734375, -4.318359375, -4.1064453125, -3.89453125, -3.6826171875, -3.470703125, -3.2587890625, -3.046875, -2.8349609375, -2.623046875, -2.4111328125, -2.19921875, -1.9873046875, -1.775390625, -1.5634765625, -1.3515625, -1.1396484375, -0.927734375, -0.7158203125, -0.50390625, -0.2919921875, -0.080078125, 0.1318359375, 0.34375, 0.5556640625, 0.767578125, 0.9794921875, 1.19140625, 1.4033203125, 1.615234375, 1.8271484375, 2.0390625, 2.2509765625, 2.462890625, 2.6748046875, 2.88671875, 3.0986328125, 3.310546875, 3.5224609375, 3.734375, 3.9462890625, 4.158203125, 4.3701171875, 4.58203125, 4.7939453125, 5.005859375, 5.2177734375, 5.4296875, 5.6416015625, 5.853515625, 6.0654296875, 6.27734375, 6.4892578125, 6.701171875, 6.9130859375, 7.125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 12.0, 9.0, 24.0, 21.0, 35.0, 52.0, 74.0, 133.0, 170.0, 269.0, 384.0, 642.0, 1013.0, 1578.0, 2531.0, 4049.0, 6484.0, 10550.0, 16920.0, 27029.0, 43547.0, 65837.0, 96897.0, 129720.0, 149941.0, 143481.0, 115163.0, 82770.0, 55219.0, 35355.0, 22378.0, 13837.0, 8299.0, 5190.0, 3222.0, 2106.0, 1278.0, 830.0, 515.0, 352.0, 201.0, 131.0, 103.0, 68.0, 37.0, 31.0, 26.0, 17.0, 10.0, 6.0, 5.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.009765625, -0.976959228515625, -0.94415283203125, -0.911346435546875, -0.8785400390625, -0.845733642578125, -0.81292724609375, -0.780120849609375, -0.747314453125, -0.714508056640625, -0.68170166015625, -0.648895263671875, -0.6160888671875, -0.583282470703125, -0.55047607421875, -0.517669677734375, -0.48486328125, -0.452056884765625, -0.41925048828125, -0.386444091796875, -0.3536376953125, -0.320831298828125, -0.28802490234375, -0.255218505859375, -0.222412109375, -0.189605712890625, -0.15679931640625, -0.123992919921875, -0.0911865234375, -0.058380126953125, -0.02557373046875, 0.007232666015625, 0.0400390625, 0.072845458984375, 0.10565185546875, 0.138458251953125, 0.1712646484375, 0.204071044921875, 0.23687744140625, 0.269683837890625, 0.302490234375, 0.335296630859375, 0.36810302734375, 0.400909423828125, 0.4337158203125, 0.466522216796875, 0.49932861328125, 0.532135009765625, 0.56494140625, 0.597747802734375, 0.63055419921875, 0.663360595703125, 0.6961669921875, 0.728973388671875, 0.76177978515625, 0.794586181640625, 0.827392578125, 0.860198974609375, 0.89300537109375, 0.925811767578125, 0.9586181640625, 0.991424560546875, 1.02423095703125, 1.057037353515625, 1.08984375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 7.0, 9.0, 13.0, 14.0, 9.0, 16.0, 13.0, 16.0, 27.0, 21.0, 43.0, 21.0, 26.0, 40.0, 36.0, 39.0, 39.0, 52.0, 40.0, 1066.0, 31.0, 32.0, 44.0, 37.0, 42.0, 41.0, 27.0, 23.0, 29.0, 20.0, 18.0, 24.0, 18.0, 13.0, 15.0, 12.0, 8.0, 12.0, 3.0, 3.0, 6.0, 3.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-4.98046875, -4.837646484375, -4.69482421875, -4.552001953125, -4.4091796875, -4.266357421875, -4.12353515625, -3.980712890625, -3.837890625, -3.695068359375, -3.55224609375, -3.409423828125, -3.2666015625, -3.123779296875, -2.98095703125, -2.838134765625, -2.6953125, -2.552490234375, -2.40966796875, -2.266845703125, -2.1240234375, -1.981201171875, -1.83837890625, -1.695556640625, -1.552734375, -1.409912109375, -1.26708984375, -1.124267578125, -0.9814453125, -0.838623046875, -0.69580078125, -0.552978515625, -0.41015625, -0.267333984375, -0.12451171875, 0.018310546875, 0.1611328125, 0.303955078125, 0.44677734375, 0.589599609375, 0.732421875, 0.875244140625, 1.01806640625, 1.160888671875, 1.3037109375, 1.446533203125, 1.58935546875, 1.732177734375, 1.875, 2.017822265625, 2.16064453125, 2.303466796875, 2.4462890625, 2.589111328125, 2.73193359375, 2.874755859375, 3.017578125, 3.160400390625, 3.30322265625, 3.446044921875, 3.5888671875, 3.731689453125, 3.87451171875, 4.017333984375, 4.16015625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 3.0, 4.0, 4.0, 11.0, 12.0, 19.0, 31.0, 24.0, 47.0, 76.0, 121.0, 116.0, 227.0, 314.0, 446.0, 610.0, 976.0, 1375.0, 2014.0, 2945.0, 4181.0, 6641.0, 9611.0, 15430.0, 25728.0, 82611.0, 1662578.0, 194593.0, 34131.0, 17710.0, 11344.0, 7364.0, 5108.0, 3420.0, 2207.0, 1604.0, 1021.0, 751.0, 488.0, 420.0, 256.0, 168.0, 118.0, 90.0, 63.0, 49.0, 21.0, 17.0, 8.0, 14.0, 11.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.822265625, -1.7664947509765625, -1.710723876953125, -1.6549530029296875, -1.59918212890625, -1.5434112548828125, -1.487640380859375, -1.4318695068359375, -1.3760986328125, -1.3203277587890625, -1.264556884765625, -1.2087860107421875, -1.15301513671875, -1.0972442626953125, -1.041473388671875, -0.9857025146484375, -0.929931640625, -0.8741607666015625, -0.818389892578125, -0.7626190185546875, -0.70684814453125, -0.6510772705078125, -0.595306396484375, -0.5395355224609375, -0.4837646484375, -0.4279937744140625, -0.372222900390625, -0.3164520263671875, -0.26068115234375, -0.2049102783203125, -0.149139404296875, -0.0933685302734375, -0.03759765625, 0.0181732177734375, 0.073944091796875, 0.1297149658203125, 0.18548583984375, 0.2412567138671875, 0.297027587890625, 0.3527984619140625, 0.4085693359375, 0.4643402099609375, 0.520111083984375, 0.5758819580078125, 0.63165283203125, 0.6874237060546875, 0.743194580078125, 0.7989654541015625, 0.854736328125, 0.9105072021484375, 0.966278076171875, 1.0220489501953125, 1.07781982421875, 1.1335906982421875, 1.189361572265625, 1.2451324462890625, 1.3009033203125, 1.3566741943359375, 1.412445068359375, 1.4682159423828125, 1.52398681640625, 1.5797576904296875, 1.635528564453125, 1.6912994384765625, 1.7470703125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 5.0, 7.0, 3.0, 3.0, 1.0, 6.0, 4.0, 11.0, 7.0, 8.0, 15.0, 19.0, 16.0, 15.0, 22.0, 31.0, 32.0, 41.0, 41.0, 43.0, 51.0, 59.0, 64.0, 69.0, 61.0, 40.0, 64.0, 41.0, 38.0, 28.0, 26.0, 26.0, 18.0, 16.0, 16.0, 10.0, 9.0, 8.0, 8.0, 4.0, 2.0, 7.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11895751953125, -0.11484622955322266, -0.11073493957519531, -0.10662364959716797, -0.10251235961914062, -0.09840106964111328, -0.09428977966308594, -0.0901784896850586, -0.08606719970703125, -0.0819559097290039, -0.07784461975097656, -0.07373332977294922, -0.06962203979492188, -0.06551074981689453, -0.06139945983886719, -0.057288169860839844, -0.0531768798828125, -0.049065589904785156, -0.04495429992675781, -0.04084300994873047, -0.036731719970703125, -0.03262042999267578, -0.028509140014648438, -0.024397850036621094, -0.02028656005859375, -0.016175270080566406, -0.012063980102539062, -0.007952690124511719, -0.003841400146484375, 0.00026988983154296875, 0.0043811798095703125, 0.008492469787597656, 0.012603759765625, 0.016715049743652344, 0.020826339721679688, 0.02493762969970703, 0.029048919677734375, 0.03316020965576172, 0.03727149963378906, 0.041382789611816406, 0.04549407958984375, 0.049605369567871094, 0.05371665954589844, 0.05782794952392578, 0.061939239501953125, 0.06605052947998047, 0.07016181945800781, 0.07427310943603516, 0.0783843994140625, 0.08249568939208984, 0.08660697937011719, 0.09071826934814453, 0.09482955932617188, 0.09894084930419922, 0.10305213928222656, 0.1071634292602539, 0.11127471923828125, 0.1153860092163086, 0.11949729919433594, 0.12360858917236328, 0.12771987915039062, 0.13183116912841797, 0.1359424591064453, 0.14005374908447266, 0.1441650390625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 6.0, 6.0, 3.0, 6.0, 8.0, 10.0, 13.0, 12.0, 24.0, 33.0, 35.0, 46.0, 65.0, 90.0, 130.0, 208.0, 326.0, 704.0, 6760.0, 1026716.0, 11494.0, 755.0, 346.0, 218.0, 142.0, 103.0, 56.0, 52.0, 32.0, 39.0, 20.0, 23.0, 13.0, 9.0, 12.0, 7.0, 2.0, 4.0, 3.0, 4.0, 4.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-2.966796875, -2.883331298828125, -2.79986572265625, -2.716400146484375, -2.6329345703125, -2.549468994140625, -2.46600341796875, -2.382537841796875, -2.299072265625, -2.215606689453125, -2.13214111328125, -2.048675537109375, -1.9652099609375, -1.881744384765625, -1.79827880859375, -1.714813232421875, -1.63134765625, -1.547882080078125, -1.46441650390625, -1.380950927734375, -1.2974853515625, -1.214019775390625, -1.13055419921875, -1.047088623046875, -0.963623046875, -0.880157470703125, -0.79669189453125, -0.713226318359375, -0.6297607421875, -0.546295166015625, -0.46282958984375, -0.379364013671875, -0.2958984375, -0.212432861328125, -0.12896728515625, -0.045501708984375, 0.0379638671875, 0.121429443359375, 0.20489501953125, 0.288360595703125, 0.371826171875, 0.455291748046875, 0.53875732421875, 0.622222900390625, 0.7056884765625, 0.789154052734375, 0.87261962890625, 0.956085205078125, 1.03955078125, 1.123016357421875, 1.20648193359375, 1.289947509765625, 1.3734130859375, 1.456878662109375, 1.54034423828125, 1.623809814453125, 1.707275390625, 1.790740966796875, 1.87420654296875, 1.957672119140625, 2.0411376953125, 2.124603271484375, 2.20806884765625, 2.291534423828125, 2.375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 80.0, 663.0, 252.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.70831298828125, -1.664258599281311, -1.620204210281372, -1.5761499404907227, -1.5320955514907837, -1.4880411624908447, -1.4439868927001953, -1.3999325037002563, -1.3558781147003174, -1.3118237257003784, -1.2677693367004395, -1.22371506690979, -1.179660677909851, -1.135606288909912, -1.0915520191192627, -1.0474976301193237, -1.0034432411193848, -0.9593888521194458, -0.9153345227241516, -0.8712801933288574, -0.8272258043289185, -0.7831714153289795, -0.7391170859336853, -0.6950627565383911, -0.6510083675384521, -0.6069539785385132, -0.562899649143219, -0.5188453197479248, -0.47479093074798584, -0.43073657155036926, -0.3866822123527527, -0.3426278531551361, -0.29857349395751953, -0.25451913475990295, -0.21046477556228638, -0.1664104163646698, -0.12235605716705322, -0.07830169796943665, -0.03424733877182007, 0.009807020425796509, 0.053861379623413086, 0.09791573882102966, 0.14197009801864624, 0.18602445721626282, 0.2300788164138794, 0.27413317561149597, 0.31818753480911255, 0.3622418940067291, 0.4062962532043457, 0.4503506124019623, 0.49440497159957886, 0.538459300994873, 0.582513689994812, 0.626568078994751, 0.6706224083900452, 0.7146767377853394, 0.7587311267852783, 0.8027855157852173, 0.8468398451805115, 0.8908941745758057, 0.9349485635757446, 0.9790029525756836, 1.023057222366333, 1.067111611366272, 1.111166000366211]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 16.0, 18.0, 21.0, 40.0, 42.0, 52.0, 56.0, 50.0, 64.0, 83.0, 74.0, 70.0, 66.0, 61.0, 67.0, 54.0, 39.0, 43.0, 22.0, 17.0, 16.0, 11.0, 3.0, 8.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.26400524377822876, -0.2540777921676636, -0.2441503405570984, -0.2342229038476944, -0.2242954522371292, -0.21436800062656403, -0.20444056391716003, -0.19451311230659485, -0.18458566069602966, -0.17465820908546448, -0.1647307574748993, -0.1548033207654953, -0.14487586915493011, -0.13494841754436493, -0.12502098083496094, -0.11509352922439575, -0.10516607761383057, -0.09523862600326538, -0.08531118184328079, -0.0753837376832962, -0.06545628607273102, -0.05552883818745613, -0.045601390302181244, -0.035673946142196655, -0.02574649453163147, -0.015819046646356583, -0.0058915987610816956, 0.0040358491241931915, 0.013963297009468079, 0.023890744894742966, 0.03381819278001785, 0.04374563694000244, 0.05367308855056763, 0.06360054016113281, 0.0735279843211174, 0.08345542848110199, 0.09338288009166718, 0.10331033170223236, 0.11323777586221695, 0.12316522002220154, 0.13309267163276672, 0.1430201232433319, 0.1529475748538971, 0.1628750115633011, 0.17280246317386627, 0.18272991478443146, 0.19265735149383545, 0.20258480310440063, 0.21251225471496582, 0.222439706325531, 0.2323671579360962, 0.24229459464550018, 0.25222206115722656, 0.26214948296546936, 0.27207693457603455, 0.28200438618659973, 0.2919318377971649, 0.3018592894077301, 0.3117867410182953, 0.3217141926288605, 0.33164161443710327, 0.34156906604766846, 0.35149651765823364, 0.36142396926879883, 0.371351420879364]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 4.0, 7.0, 12.0, 12.0, 14.0, 17.0, 17.0, 14.0, 19.0, 33.0, 32.0, 26.0, 28.0, 42.0, 39.0, 50.0, 45.0, 55.0, 38.0, 52.0, 58.0, 41.0, 36.0, 42.0, 48.0, 27.0, 36.0, 31.0, 26.0, 17.0, 17.0, 9.0, 12.0, 12.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.09765625, -6.8800048828125, -6.662353515625, -6.4447021484375, -6.22705078125, -6.0093994140625, -5.791748046875, -5.5740966796875, -5.3564453125, -5.1387939453125, -4.921142578125, -4.7034912109375, -4.48583984375, -4.2681884765625, -4.050537109375, -3.8328857421875, -3.615234375, -3.3975830078125, -3.179931640625, -2.9622802734375, -2.74462890625, -2.5269775390625, -2.309326171875, -2.0916748046875, -1.8740234375, -1.6563720703125, -1.438720703125, -1.2210693359375, -1.00341796875, -0.7857666015625, -0.568115234375, -0.3504638671875, -0.1328125, 0.0848388671875, 0.302490234375, 0.5201416015625, 0.73779296875, 0.9554443359375, 1.173095703125, 1.3907470703125, 1.6083984375, 1.8260498046875, 2.043701171875, 2.2613525390625, 2.47900390625, 2.6966552734375, 2.914306640625, 3.1319580078125, 3.349609375, 3.5672607421875, 3.784912109375, 4.0025634765625, 4.22021484375, 4.4378662109375, 4.655517578125, 4.8731689453125, 5.0908203125, 5.3084716796875, 5.526123046875, 5.7437744140625, 5.96142578125, 6.1790771484375, 6.396728515625, 6.6143798828125, 6.83203125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 7.0, 13.0, 20.0, 19.0, 31.0, 45.0, 68.0, 115.0, 227.0, 432.0, 728.0, 1442.0, 3055.0, 6777.0, 17792.0, 54415.0, 203961.0, 487007.0, 191594.0, 51559.0, 16838.0, 6518.0, 2799.0, 1465.0, 719.0, 394.0, 212.0, 102.0, 77.0, 41.0, 32.0, 24.0, 10.0, 11.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.890625, -10.5552978515625, -10.219970703125, -9.8846435546875, -9.54931640625, -9.2139892578125, -8.878662109375, -8.5433349609375, -8.2080078125, -7.8726806640625, -7.537353515625, -7.2020263671875, -6.86669921875, -6.5313720703125, -6.196044921875, -5.8607177734375, -5.525390625, -5.1900634765625, -4.854736328125, -4.5194091796875, -4.18408203125, -3.8487548828125, -3.513427734375, -3.1781005859375, -2.8427734375, -2.5074462890625, -2.172119140625, -1.8367919921875, -1.50146484375, -1.1661376953125, -0.830810546875, -0.4954833984375, -0.16015625, 0.1751708984375, 0.510498046875, 0.8458251953125, 1.18115234375, 1.5164794921875, 1.851806640625, 2.1871337890625, 2.5224609375, 2.8577880859375, 3.193115234375, 3.5284423828125, 3.86376953125, 4.1990966796875, 4.534423828125, 4.8697509765625, 5.205078125, 5.5404052734375, 5.875732421875, 6.2110595703125, 6.54638671875, 6.8817138671875, 7.217041015625, 7.5523681640625, 7.8876953125, 8.2230224609375, 8.558349609375, 8.8936767578125, 9.22900390625, 9.5643310546875, 9.899658203125, 10.2349853515625, 10.5703125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 5.0, 12.0, 12.0, 15.0, 22.0, 17.0, 32.0, 20.0, 18.0, 19.0, 54.0, 43.0, 47.0, 42.0, 65.0, 99.0, 186.0, 1335.0, 324.0, 160.0, 99.0, 53.0, 44.0, 42.0, 49.0, 19.0, 32.0, 27.0, 22.0, 17.0, 12.0, 16.0, 15.0, 7.0, 12.0, 2.0, 13.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-20.109375, -19.532958984375, -18.95654296875, -18.380126953125, -17.8037109375, -17.227294921875, -16.65087890625, -16.074462890625, -15.498046875, -14.921630859375, -14.34521484375, -13.768798828125, -13.1923828125, -12.615966796875, -12.03955078125, -11.463134765625, -10.88671875, -10.310302734375, -9.73388671875, -9.157470703125, -8.5810546875, -8.004638671875, -7.42822265625, -6.851806640625, -6.275390625, -5.698974609375, -5.12255859375, -4.546142578125, -3.9697265625, -3.393310546875, -2.81689453125, -2.240478515625, -1.6640625, -1.087646484375, -0.51123046875, 0.065185546875, 0.6416015625, 1.218017578125, 1.79443359375, 2.370849609375, 2.947265625, 3.523681640625, 4.10009765625, 4.676513671875, 5.2529296875, 5.829345703125, 6.40576171875, 6.982177734375, 7.55859375, 8.135009765625, 8.71142578125, 9.287841796875, 9.8642578125, 10.440673828125, 11.01708984375, 11.593505859375, 12.169921875, 12.746337890625, 13.32275390625, 13.899169921875, 14.4755859375, 15.052001953125, 15.62841796875, 16.204833984375, 16.78125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 9.0, 8.0, 12.0, 13.0, 16.0, 30.0, 36.0, 33.0, 60.0, 61.0, 66.0, 98.0, 158.0, 236.0, 434.0, 983.0, 3585.0, 24664.0, 618120.0, 2417755.0, 68999.0, 7129.0, 1590.0, 545.0, 313.0, 201.0, 137.0, 88.0, 72.0, 47.0, 46.0, 33.0, 36.0, 21.0, 16.0, 10.0, 8.0, 11.0, 8.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.859375, -25.99853515625, -25.1376953125, -24.27685546875, -23.416015625, -22.55517578125, -21.6943359375, -20.83349609375, -19.97265625, -19.11181640625, -18.2509765625, -17.39013671875, -16.529296875, -15.66845703125, -14.8076171875, -13.94677734375, -13.0859375, -12.22509765625, -11.3642578125, -10.50341796875, -9.642578125, -8.78173828125, -7.9208984375, -7.06005859375, -6.19921875, -5.33837890625, -4.4775390625, -3.61669921875, -2.755859375, -1.89501953125, -1.0341796875, -0.17333984375, 0.6875, 1.54833984375, 2.4091796875, 3.27001953125, 4.130859375, 4.99169921875, 5.8525390625, 6.71337890625, 7.57421875, 8.43505859375, 9.2958984375, 10.15673828125, 11.017578125, 11.87841796875, 12.7392578125, 13.60009765625, 14.4609375, 15.32177734375, 16.1826171875, 17.04345703125, 17.904296875, 18.76513671875, 19.6259765625, 20.48681640625, 21.34765625, 22.20849609375, 23.0693359375, 23.93017578125, 24.791015625, 25.65185546875, 26.5126953125, 27.37353515625, 28.234375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 13.0, 39.0, 169.0, 312.0, 291.0, 128.0, 52.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.449399948120117, -24.695510864257812, -21.94162368774414, -19.18773651123047, -16.433847427368164, -13.679959297180176, -10.926071166992188, -8.172182083129883, -5.418294906616211, -2.6644067764282227, 0.08948135375976562, 2.843369483947754, 5.597257614135742, 8.35114574432373, 11.105033874511719, 13.858922958374023, 16.612810134887695, 19.36669921875, 22.120586395263672, 24.874473571777344, 27.62836265563965, 30.382251739501953, 33.136138916015625, 35.89002990722656, 38.64391326904297, 41.39780044555664, 44.15168762207031, 46.90557861328125, 49.65946578979492, 52.413352966308594, 55.16724395751953, 57.9211311340332, 60.675018310546875, 63.42890548706055, 66.18279266357422, 68.93668365478516, 71.69056701660156, 74.4444580078125, 77.19834899902344, 79.95223999023438, 82.70612335205078, 85.46001434326172, 88.21389770507812, 90.96778869628906, 93.7216796875, 96.4755630493164, 99.22945404052734, 101.98333740234375, 104.73722839355469, 107.49111938476562, 110.24500274658203, 112.99889373779297, 115.75277709960938, 118.50666809082031, 121.26055908203125, 124.01445007324219, 126.7683334350586, 129.522216796875, 132.27610778808594, 135.02999877929688, 137.7838897705078, 140.53778076171875, 143.29165649414062, 146.04554748535156, 148.7994384765625]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 10.0, 10.0, 13.0, 16.0, 26.0, 24.0, 22.0, 25.0, 52.0, 43.0, 40.0, 48.0, 52.0, 54.0, 46.0, 40.0, 37.0, 42.0, 44.0, 43.0, 36.0, 41.0, 32.0, 24.0, 30.0, 18.0, 20.0, 20.0, 12.0, 20.0, 16.0, 5.0, 7.0, 7.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-50.17162322998047, -48.43405532836914, -46.69648742675781, -44.95892333984375, -43.22135543823242, -41.483787536621094, -39.74622344970703, -38.0086555480957, -36.271087646484375, -34.53351974487305, -32.79595184326172, -31.058387756347656, -29.320819854736328, -27.583251953125, -25.845685958862305, -24.10811996459961, -22.37055206298828, -20.632984161376953, -18.895418167114258, -17.157852172851562, -15.420284271240234, -13.682717323303223, -11.945150375366211, -10.2075834274292, -8.470016479492188, -6.732449531555176, -4.994882583618164, -3.2573156356811523, -1.5197486877441406, 0.2178182601928711, 1.9553852081298828, 3.6929521560668945, 5.430515289306641, 7.168082237243652, 8.905649185180664, 10.643216133117676, 12.380783081054688, 14.1183500289917, 15.855916976928711, 17.593482971191406, 19.331050872802734, 21.068618774414062, 22.806184768676758, 24.543750762939453, 26.28131866455078, 28.01888656616211, 29.756452560424805, 31.4940185546875, 33.23158645629883, 34.969154357910156, 36.70671844482422, 38.44428634643555, 40.181854248046875, 41.9194221496582, 43.65699005126953, 45.394554138183594, 47.13212203979492, 48.86968994140625, 50.60725402832031, 52.34482192993164, 54.08238983154297, 55.8199577331543, 57.557525634765625, 59.29508972167969, 61.032657623291016]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 4.0, 13.0, 12.0, 12.0, 20.0, 26.0, 22.0, 26.0, 35.0, 24.0, 39.0, 42.0, 42.0, 43.0, 49.0, 67.0, 35.0, 63.0, 48.0, 53.0, 39.0, 46.0, 31.0, 33.0, 28.0, 29.0, 16.0, 15.0, 22.0, 14.0, 15.0, 6.0, 7.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.2421875, -8.00067138671875, -7.7591552734375, -7.51763916015625, -7.276123046875, -7.03460693359375, -6.7930908203125, -6.55157470703125, -6.31005859375, -6.06854248046875, -5.8270263671875, -5.58551025390625, -5.343994140625, -5.10247802734375, -4.8609619140625, -4.61944580078125, -4.3779296875, -4.13641357421875, -3.8948974609375, -3.65338134765625, -3.411865234375, -3.17034912109375, -2.9288330078125, -2.68731689453125, -2.44580078125, -2.20428466796875, -1.9627685546875, -1.72125244140625, -1.479736328125, -1.23822021484375, -0.9967041015625, -0.75518798828125, -0.513671875, -0.27215576171875, -0.0306396484375, 0.21087646484375, 0.452392578125, 0.69390869140625, 0.9354248046875, 1.17694091796875, 1.41845703125, 1.65997314453125, 1.9014892578125, 2.14300537109375, 2.384521484375, 2.62603759765625, 2.8675537109375, 3.10906982421875, 3.3505859375, 3.59210205078125, 3.8336181640625, 4.07513427734375, 4.316650390625, 4.55816650390625, 4.7996826171875, 5.04119873046875, 5.28271484375, 5.52423095703125, 5.7657470703125, 6.00726318359375, 6.248779296875, 6.49029541015625, 6.7318115234375, 6.97332763671875, 7.21484375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 5.0, 7.0, 19.0, 12.0, 24.0, 25.0, 29.0, 54.0, 68.0, 90.0, 112.0, 156.0, 229.0, 306.0, 429.0, 637.0, 923.0, 1448.0, 2697.0, 5139.0, 11399.0, 29661.0, 98179.0, 387919.0, 1401827.0, 1582304.0, 487248.0, 122185.0, 35701.0, 12771.0, 5542.0, 2765.0, 1556.0, 916.0, 593.0, 391.0, 260.0, 172.0, 120.0, 91.0, 67.0, 59.0, 41.0, 32.0, 20.0, 14.0, 9.0, 8.0, 7.0, 4.0, 2.0, 1.0, 4.0, 1.0], "bins": [-9.9296875, -9.6466064453125, -9.363525390625, -9.0804443359375, -8.79736328125, -8.5142822265625, -8.231201171875, -7.9481201171875, -7.6650390625, -7.3819580078125, -7.098876953125, -6.8157958984375, -6.53271484375, -6.2496337890625, -5.966552734375, -5.6834716796875, -5.400390625, -5.1173095703125, -4.834228515625, -4.5511474609375, -4.26806640625, -3.9849853515625, -3.701904296875, -3.4188232421875, -3.1357421875, -2.8526611328125, -2.569580078125, -2.2864990234375, -2.00341796875, -1.7203369140625, -1.437255859375, -1.1541748046875, -0.87109375, -0.5880126953125, -0.304931640625, -0.0218505859375, 0.26123046875, 0.5443115234375, 0.827392578125, 1.1104736328125, 1.3935546875, 1.6766357421875, 1.959716796875, 2.2427978515625, 2.52587890625, 2.8089599609375, 3.092041015625, 3.3751220703125, 3.658203125, 3.9412841796875, 4.224365234375, 4.5074462890625, 4.79052734375, 5.0736083984375, 5.356689453125, 5.6397705078125, 5.9228515625, 6.2059326171875, 6.489013671875, 6.7720947265625, 7.05517578125, 7.3382568359375, 7.621337890625, 7.9044189453125, 8.1875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 7.0, 6.0, 13.0, 19.0, 19.0, 20.0, 41.0, 41.0, 67.0, 94.0, 107.0, 167.0, 230.0, 312.0, 402.0, 508.0, 482.0, 384.0, 296.0, 212.0, 183.0, 116.0, 85.0, 63.0, 39.0, 37.0, 29.0, 28.0, 13.0, 8.0, 5.0, 10.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.734375, -9.4197998046875, -9.105224609375, -8.7906494140625, -8.47607421875, -8.1614990234375, -7.846923828125, -7.5323486328125, -7.2177734375, -6.9031982421875, -6.588623046875, -6.2740478515625, -5.95947265625, -5.6448974609375, -5.330322265625, -5.0157470703125, -4.701171875, -4.3865966796875, -4.072021484375, -3.7574462890625, -3.44287109375, -3.1282958984375, -2.813720703125, -2.4991455078125, -2.1845703125, -1.8699951171875, -1.555419921875, -1.2408447265625, -0.92626953125, -0.6116943359375, -0.297119140625, 0.0174560546875, 0.33203125, 0.6466064453125, 0.961181640625, 1.2757568359375, 1.59033203125, 1.9049072265625, 2.219482421875, 2.5340576171875, 2.8486328125, 3.1632080078125, 3.477783203125, 3.7923583984375, 4.10693359375, 4.4215087890625, 4.736083984375, 5.0506591796875, 5.365234375, 5.6798095703125, 5.994384765625, 6.3089599609375, 6.62353515625, 6.9381103515625, 7.252685546875, 7.5672607421875, 7.8818359375, 8.1964111328125, 8.510986328125, 8.8255615234375, 9.14013671875, 9.4547119140625, 9.769287109375, 10.0838623046875, 10.3984375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 8.0, 9.0, 13.0, 21.0, 29.0, 80.0, 104.0, 208.0, 410.0, 960.0, 5859.0, 174342.0, 3864821.0, 140727.0, 5042.0, 899.0, 342.0, 168.0, 94.0, 68.0, 31.0, 18.0, 7.0, 8.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.734375, -29.366943359375, -27.99951171875, -26.632080078125, -25.2646484375, -23.897216796875, -22.52978515625, -21.162353515625, -19.794921875, -18.427490234375, -17.06005859375, -15.692626953125, -14.3251953125, -12.957763671875, -11.59033203125, -10.222900390625, -8.85546875, -7.488037109375, -6.12060546875, -4.753173828125, -3.3857421875, -2.018310546875, -0.65087890625, 0.716552734375, 2.083984375, 3.451416015625, 4.81884765625, 6.186279296875, 7.5537109375, 8.921142578125, 10.28857421875, 11.656005859375, 13.0234375, 14.390869140625, 15.75830078125, 17.125732421875, 18.4931640625, 19.860595703125, 21.22802734375, 22.595458984375, 23.962890625, 25.330322265625, 26.69775390625, 28.065185546875, 29.4326171875, 30.800048828125, 32.16748046875, 33.534912109375, 34.90234375, 36.269775390625, 37.63720703125, 39.004638671875, 40.3720703125, 41.739501953125, 43.10693359375, 44.474365234375, 45.841796875, 47.209228515625, 48.57666015625, 49.944091796875, 51.3115234375, 52.678955078125, 54.04638671875, 55.413818359375, 56.78125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 21.0, 43.0, 89.0, 119.0, 175.0, 189.0, 155.0, 111.0, 48.0, 24.0, 12.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.9244384765625, -71.63594818115234, -69.34745025634766, -67.0589599609375, -64.77046966552734, -62.48197555541992, -60.1934814453125, -57.904991149902344, -55.61650085449219, -53.328006744384766, -51.03951644897461, -48.75102233886719, -46.46253204345703, -44.17403793334961, -41.88554382324219, -39.59705352783203, -37.30855941772461, -35.02006530761719, -32.73157501220703, -30.44308090209961, -28.154590606689453, -25.86609649658203, -23.577604293823242, -21.289112091064453, -19.000619888305664, -16.712127685546875, -14.423635482788086, -12.13514232635498, -9.846650123596191, -7.558157920837402, -5.269664764404297, -2.981172561645508, -0.6926803588867188, 1.5958120822906494, 3.8843045234680176, 6.172797203063965, 8.461289405822754, 10.749781608581543, 13.038274765014648, 15.326766967773438, 17.615259170532227, 19.903751373291016, 22.192243576049805, 24.480735778808594, 26.769229888916016, 29.057720184326172, 31.346214294433594, 33.63470458984375, 35.92319869995117, 38.211692810058594, 40.50018310546875, 42.78867721557617, 45.07716751098633, 47.36566162109375, 49.654151916503906, 51.94264602661133, 54.23114013671875, 56.51963424682617, 58.80812454223633, 61.09661865234375, 63.385108947753906, 65.67359924316406, 67.96209716796875, 70.2505874633789, 72.53907775878906]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 1.0, 7.0, 10.0, 4.0, 13.0, 8.0, 12.0, 14.0, 23.0, 17.0, 16.0, 24.0, 29.0, 32.0, 22.0, 27.0, 42.0, 27.0, 43.0, 34.0, 49.0, 39.0, 35.0, 52.0, 36.0, 32.0, 35.0, 34.0, 40.0, 23.0, 25.0, 26.0, 20.0, 22.0, 22.0, 12.0, 12.0, 13.0, 15.0, 6.0, 7.0, 10.0, 5.0, 4.0, 3.0, 9.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-32.83982467651367, -31.7388858795166, -30.6379451751709, -29.537006378173828, -28.436065673828125, -27.335126876831055, -26.234188079833984, -25.13324737548828, -24.032306671142578, -22.931367874145508, -21.830427169799805, -20.729488372802734, -19.62854766845703, -18.52760887145996, -17.42667007446289, -16.325729370117188, -15.224790573120117, -14.12385082244873, -13.022911071777344, -11.921972274780273, -10.82103157043457, -9.7200927734375, -8.619153022766113, -7.518213272094727, -6.41727352142334, -5.316333770751953, -4.215394020080566, -3.114454746246338, -2.013514995574951, -0.9125752449035645, 0.18836402893066406, 1.2893037796020508, 2.3902435302734375, 3.491183280944824, 4.592123031616211, 5.6930623054504395, 6.794002056121826, 7.894941806793213, 8.995881080627441, 10.096820831298828, 11.197760581970215, 12.298700332641602, 13.399640083312988, 14.500579833984375, 15.601518630981445, 16.70245933532715, 17.80339813232422, 18.904338836669922, 20.005277633666992, 21.106216430664062, 22.207157135009766, 23.308095932006836, 24.40903663635254, 25.50997543334961, 26.610916137695312, 27.711854934692383, 28.812793731689453, 29.913732528686523, 31.014673233032227, 32.1156120300293, 33.216552734375, 34.3174934387207, 35.41843032836914, 36.519371032714844, 37.62031173706055]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 7.0, 7.0, 10.0, 15.0, 10.0, 13.0, 24.0, 21.0, 30.0, 26.0, 46.0, 44.0, 38.0, 34.0, 46.0, 54.0, 45.0, 53.0, 48.0, 45.0, 44.0, 54.0, 34.0, 41.0, 35.0, 35.0, 35.0, 15.0, 14.0, 17.0, 16.0, 12.0, 4.0, 6.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.015625, -7.775634765625, -7.53564453125, -7.295654296875, -7.0556640625, -6.815673828125, -6.57568359375, -6.335693359375, -6.095703125, -5.855712890625, -5.61572265625, -5.375732421875, -5.1357421875, -4.895751953125, -4.65576171875, -4.415771484375, -4.17578125, -3.935791015625, -3.69580078125, -3.455810546875, -3.2158203125, -2.975830078125, -2.73583984375, -2.495849609375, -2.255859375, -2.015869140625, -1.77587890625, -1.535888671875, -1.2958984375, -1.055908203125, -0.81591796875, -0.575927734375, -0.3359375, -0.095947265625, 0.14404296875, 0.384033203125, 0.6240234375, 0.864013671875, 1.10400390625, 1.343994140625, 1.583984375, 1.823974609375, 2.06396484375, 2.303955078125, 2.5439453125, 2.783935546875, 3.02392578125, 3.263916015625, 3.50390625, 3.743896484375, 3.98388671875, 4.223876953125, 4.4638671875, 4.703857421875, 4.94384765625, 5.183837890625, 5.423828125, 5.663818359375, 5.90380859375, 6.143798828125, 6.3837890625, 6.623779296875, 6.86376953125, 7.103759765625, 7.34375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 6.0, 2.0, 3.0, 6.0, 6.0, 12.0, 17.0, 33.0, 45.0, 50.0, 80.0, 105.0, 178.0, 276.0, 408.0, 560.0, 849.0, 1330.0, 2033.0, 2830.0, 4299.0, 6550.0, 9897.0, 15366.0, 23192.0, 35433.0, 52616.0, 77172.0, 105756.0, 132011.0, 141480.0, 126875.0, 98218.0, 70017.0, 47792.0, 31598.0, 21103.0, 13841.0, 8921.0, 5768.0, 3875.0, 2643.0, 1716.0, 1186.0, 797.0, 529.0, 364.0, 247.0, 145.0, 99.0, 83.0, 48.0, 37.0, 23.0, 15.0, 12.0, 5.0, 6.0, 5.0, 0.0, 3.0, 2.0], "bins": [-0.99755859375, -0.9667434692382812, -0.9359283447265625, -0.9051132202148438, -0.874298095703125, -0.8434829711914062, -0.8126678466796875, -0.7818527221679688, -0.75103759765625, -0.7202224731445312, -0.6894073486328125, -0.6585922241210938, -0.627777099609375, -0.5969619750976562, -0.5661468505859375, -0.5353317260742188, -0.5045166015625, -0.47370147705078125, -0.4428863525390625, -0.41207122802734375, -0.381256103515625, -0.35044097900390625, -0.3196258544921875, -0.28881072998046875, -0.25799560546875, -0.22718048095703125, -0.1963653564453125, -0.16555023193359375, -0.134735107421875, -0.10391998291015625, -0.0731048583984375, -0.04228973388671875, -0.011474609375, 0.01934051513671875, 0.0501556396484375, 0.08097076416015625, 0.111785888671875, 0.14260101318359375, 0.1734161376953125, 0.20423126220703125, 0.23504638671875, 0.26586151123046875, 0.2966766357421875, 0.32749176025390625, 0.358306884765625, 0.38912200927734375, 0.4199371337890625, 0.45075225830078125, 0.4815673828125, 0.5123825073242188, 0.5431976318359375, 0.5740127563476562, 0.604827880859375, 0.6356430053710938, 0.6664581298828125, 0.6972732543945312, 0.72808837890625, 0.7589035034179688, 0.7897186279296875, 0.8205337524414062, 0.851348876953125, 0.8821640014648438, 0.9129791259765625, 0.9437942504882812, 0.974609375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 7.0, 6.0, 10.0, 12.0, 10.0, 18.0, 18.0, 12.0, 20.0, 25.0, 32.0, 25.0, 30.0, 34.0, 31.0, 30.0, 31.0, 29.0, 28.0, 32.0, 44.0, 1060.0, 44.0, 35.0, 34.0, 35.0, 28.0, 26.0, 23.0, 27.0, 34.0, 30.0, 9.0, 24.0, 15.0, 14.0, 15.0, 12.0, 15.0, 11.0, 9.0, 8.0, 4.0, 3.0, 5.0, 3.0, 4.0, 3.0, 2.0], "bins": [-5.5390625, -5.3856201171875, -5.232177734375, -5.0787353515625, -4.92529296875, -4.7718505859375, -4.618408203125, -4.4649658203125, -4.3115234375, -4.1580810546875, -4.004638671875, -3.8511962890625, -3.69775390625, -3.5443115234375, -3.390869140625, -3.2374267578125, -3.083984375, -2.9305419921875, -2.777099609375, -2.6236572265625, -2.47021484375, -2.3167724609375, -2.163330078125, -2.0098876953125, -1.8564453125, -1.7030029296875, -1.549560546875, -1.3961181640625, -1.24267578125, -1.0892333984375, -0.935791015625, -0.7823486328125, -0.62890625, -0.4754638671875, -0.322021484375, -0.1685791015625, -0.01513671875, 0.1383056640625, 0.291748046875, 0.4451904296875, 0.5986328125, 0.7520751953125, 0.905517578125, 1.0589599609375, 1.21240234375, 1.3658447265625, 1.519287109375, 1.6727294921875, 1.826171875, 1.9796142578125, 2.133056640625, 2.2864990234375, 2.43994140625, 2.5933837890625, 2.746826171875, 2.9002685546875, 3.0537109375, 3.2071533203125, 3.360595703125, 3.5140380859375, 3.66748046875, 3.8209228515625, 3.974365234375, 4.1278076171875, 4.28125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 10.0, 8.0, 8.0, 11.0, 26.0, 33.0, 40.0, 60.0, 76.0, 122.0, 143.0, 189.0, 245.0, 353.0, 452.0, 694.0, 877.0, 1267.0, 1741.0, 2556.0, 3698.0, 5042.0, 7281.0, 10471.0, 16380.0, 28945.0, 113453.0, 1656184.0, 159175.0, 32943.0, 17342.0, 11183.0, 7731.0, 5320.0, 3646.0, 2636.0, 1960.0, 1328.0, 939.0, 691.0, 504.0, 368.0, 289.0, 212.0, 132.0, 106.0, 73.0, 49.0, 32.0, 33.0, 27.0, 20.0, 11.0, 11.0, 7.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0], "bins": [-1.6318359375, -1.578460693359375, -1.52508544921875, -1.471710205078125, -1.4183349609375, -1.364959716796875, -1.31158447265625, -1.258209228515625, -1.204833984375, -1.151458740234375, -1.09808349609375, -1.044708251953125, -0.9913330078125, -0.937957763671875, -0.88458251953125, -0.831207275390625, -0.77783203125, -0.724456787109375, -0.67108154296875, -0.617706298828125, -0.5643310546875, -0.510955810546875, -0.45758056640625, -0.404205322265625, -0.350830078125, -0.297454833984375, -0.24407958984375, -0.190704345703125, -0.1373291015625, -0.083953857421875, -0.03057861328125, 0.022796630859375, 0.076171875, 0.129547119140625, 0.18292236328125, 0.236297607421875, 0.2896728515625, 0.343048095703125, 0.39642333984375, 0.449798583984375, 0.503173828125, 0.556549072265625, 0.60992431640625, 0.663299560546875, 0.7166748046875, 0.770050048828125, 0.82342529296875, 0.876800537109375, 0.93017578125, 0.983551025390625, 1.03692626953125, 1.090301513671875, 1.1436767578125, 1.197052001953125, 1.25042724609375, 1.303802490234375, 1.357177734375, 1.410552978515625, 1.46392822265625, 1.517303466796875, 1.5706787109375, 1.624053955078125, 1.67742919921875, 1.730804443359375, 1.7841796875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 1.0, 6.0, 2.0, 9.0, 15.0, 19.0, 14.0, 17.0, 25.0, 27.0, 36.0, 39.0, 47.0, 58.0, 61.0, 71.0, 63.0, 61.0, 57.0, 66.0, 55.0, 33.0, 41.0, 41.0, 28.0, 29.0, 11.0, 9.0, 16.0, 14.0, 6.0, 5.0, 3.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1766357421875, -0.17159080505371094, -0.16654586791992188, -0.1615009307861328, -0.15645599365234375, -0.1514110565185547, -0.14636611938476562, -0.14132118225097656, -0.1362762451171875, -0.13123130798339844, -0.12618637084960938, -0.12114143371582031, -0.11609649658203125, -0.11105155944824219, -0.10600662231445312, -0.10096168518066406, -0.095916748046875, -0.09087181091308594, -0.08582687377929688, -0.08078193664550781, -0.07573699951171875, -0.07069206237792969, -0.06564712524414062, -0.06060218811035156, -0.0555572509765625, -0.05051231384277344, -0.045467376708984375, -0.04042243957519531, -0.03537750244140625, -0.030332565307617188, -0.025287628173828125, -0.020242691040039062, -0.01519775390625, -0.010152816772460938, -0.005107879638671875, -6.29425048828125e-05, 0.00498199462890625, 0.010026931762695312, 0.015071868896484375, 0.020116806030273438, 0.0251617431640625, 0.030206680297851562, 0.035251617431640625, 0.04029655456542969, 0.04534149169921875, 0.05038642883300781, 0.055431365966796875, 0.06047630310058594, 0.065521240234375, 0.07056617736816406, 0.07561111450195312, 0.08065605163574219, 0.08570098876953125, 0.09074592590332031, 0.09579086303710938, 0.10083580017089844, 0.1058807373046875, 0.11092567443847656, 0.11597061157226562, 0.12101554870605469, 0.12606048583984375, 0.1311054229736328, 0.13615036010742188, 0.14119529724121094, 0.146240234375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 3.0, 4.0, 2.0, 5.0, 7.0, 9.0, 10.0, 21.0, 13.0, 24.0, 29.0, 63.0, 66.0, 97.0, 160.0, 294.0, 579.0, 3353.0, 1037323.0, 4937.0, 702.0, 320.0, 154.0, 107.0, 65.0, 60.0, 31.0, 33.0, 19.0, 15.0, 15.0, 10.0, 6.0, 4.0, 4.0, 5.0, 1.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08984375, -2.9815673828125, -2.873291015625, -2.7650146484375, -2.65673828125, -2.5484619140625, -2.440185546875, -2.3319091796875, -2.2236328125, -2.1153564453125, -2.007080078125, -1.8988037109375, -1.79052734375, -1.6822509765625, -1.573974609375, -1.4656982421875, -1.357421875, -1.2491455078125, -1.140869140625, -1.0325927734375, -0.92431640625, -0.8160400390625, -0.707763671875, -0.5994873046875, -0.4912109375, -0.3829345703125, -0.274658203125, -0.1663818359375, -0.05810546875, 0.0501708984375, 0.158447265625, 0.2667236328125, 0.375, 0.4832763671875, 0.591552734375, 0.6998291015625, 0.80810546875, 0.9163818359375, 1.024658203125, 1.1329345703125, 1.2412109375, 1.3494873046875, 1.457763671875, 1.5660400390625, 1.67431640625, 1.7825927734375, 1.890869140625, 1.9991455078125, 2.107421875, 2.2156982421875, 2.323974609375, 2.4322509765625, 2.54052734375, 2.6488037109375, 2.757080078125, 2.8653564453125, 2.9736328125, 3.0819091796875, 3.190185546875, 3.2984619140625, 3.40673828125, 3.5150146484375, 3.623291015625, 3.7315673828125, 3.83984375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 142.0, 865.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.7723889350891113, -3.706509590148926, -3.6406302452087402, -3.5747509002685547, -3.5088717937469482, -3.4429924488067627, -3.377113103866577, -3.3112337589263916, -3.245354413986206, -3.1794750690460205, -3.113595724105835, -3.0477166175842285, -2.981837272644043, -2.9159579277038574, -2.850078582763672, -2.7841992378234863, -2.718319892883301, -2.6524405479431152, -2.5865612030029297, -2.520681858062744, -2.4548027515411377, -2.388923406600952, -2.3230440616607666, -2.257164716720581, -2.1912856101989746, -2.125406265258789, -2.0595269203186035, -1.9936476945877075, -1.927768349647522, -1.861889123916626, -1.7960097789764404, -1.7301304340362549, -1.6642513275146484, -1.598371982574463, -1.532492756843567, -1.4666134119033813, -1.4007340669631958, -1.3348548412322998, -1.2689754962921143, -1.2030961513519287, -1.1372168064117432, -1.0713374614715576, -1.0054582357406616, -0.9395788908004761, -0.8736995458602905, -0.8078202605247498, -0.741940975189209, -0.6760616302490234, -0.6101823449134827, -0.5443030595779419, -0.47842371463775635, -0.4125444293022156, -0.3466651141643524, -0.28078579902648926, -0.2149065136909485, -0.14902719855308533, -0.08314788341522217, -0.017268575727939606, 0.04861073195934296, 0.11449003219604492, 0.18036934733390808, 0.24624866247177124, 0.312127947807312, 0.37800726294517517, 0.44388657808303833]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 13.0, 5.0, 11.0, 10.0, 17.0, 21.0, 32.0, 39.0, 58.0, 53.0, 52.0, 72.0, 72.0, 62.0, 47.0, 75.0, 65.0, 44.0, 60.0, 45.0, 30.0, 30.0, 24.0, 20.0, 14.0, 9.0, 11.0, 4.0, 8.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.23244065046310425, -0.22381605207920074, -0.21519143879413605, -0.20656684041023254, -0.19794222712516785, -0.18931762874126434, -0.18069303035736084, -0.17206841707229614, -0.16344381868839264, -0.15481922030448914, -0.14619460701942444, -0.13757000863552094, -0.12894541025161743, -0.12032079696655273, -0.11169619858264923, -0.10307159274816513, -0.09444698691368103, -0.08582238107919693, -0.07719777524471283, -0.06857317686080933, -0.059948571026325226, -0.051323965191841125, -0.042699363082647324, -0.03407476097345352, -0.02545015513896942, -0.01682555116713047, -0.00820094719529152, 0.00042365677654743195, 0.009048260748386383, 0.017672866582870483, 0.026297468692064285, 0.03492207080125809, 0.04354667663574219, 0.05217128247022629, 0.06079588457942009, 0.06942048668861389, 0.07804509252309799, 0.08666969835758209, 0.0952942967414856, 0.1039189025759697, 0.1125435084104538, 0.1211681142449379, 0.129792720079422, 0.1384173184633255, 0.147041916847229, 0.1556665301322937, 0.1642911285161972, 0.1729157269001007, 0.1815403401851654, 0.1901649385690689, 0.1987895518541336, 0.2074141502380371, 0.2160387635231018, 0.2246633619070053, 0.2332879602909088, 0.2419125735759735, 0.2505371570587158, 0.2591617703437805, 0.2677863538265228, 0.2764109671115875, 0.2850355803966522, 0.29366016387939453, 0.30228477716445923, 0.3109093904495239, 0.3195340037345886]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 5.0, 3.0, 10.0, 7.0, 13.0, 19.0, 17.0, 22.0, 24.0, 32.0, 31.0, 26.0, 52.0, 37.0, 43.0, 60.0, 54.0, 51.0, 57.0, 51.0, 47.0, 49.0, 49.0, 42.0, 37.0, 33.0, 23.0, 29.0, 17.0, 15.0, 12.0, 13.0, 9.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.98828125, -7.73614501953125, -7.4840087890625, -7.23187255859375, -6.979736328125, -6.72760009765625, -6.4754638671875, -6.22332763671875, -5.97119140625, -5.71905517578125, -5.4669189453125, -5.21478271484375, -4.962646484375, -4.71051025390625, -4.4583740234375, -4.20623779296875, -3.9541015625, -3.70196533203125, -3.4498291015625, -3.19769287109375, -2.945556640625, -2.69342041015625, -2.4412841796875, -2.18914794921875, -1.93701171875, -1.68487548828125, -1.4327392578125, -1.18060302734375, -0.928466796875, -0.67633056640625, -0.4241943359375, -0.17205810546875, 0.080078125, 0.33221435546875, 0.5843505859375, 0.83648681640625, 1.088623046875, 1.34075927734375, 1.5928955078125, 1.84503173828125, 2.09716796875, 2.34930419921875, 2.6014404296875, 2.85357666015625, 3.105712890625, 3.35784912109375, 3.6099853515625, 3.86212158203125, 4.1142578125, 4.36639404296875, 4.6185302734375, 4.87066650390625, 5.122802734375, 5.37493896484375, 5.6270751953125, 5.87921142578125, 6.13134765625, 6.38348388671875, 6.6356201171875, 6.88775634765625, 7.139892578125, 7.39202880859375, 7.6441650390625, 7.89630126953125, 8.1484375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 12.0, 23.0, 33.0, 47.0, 47.0, 85.0, 123.0, 217.0, 394.0, 830.0, 1816.0, 4648.0, 12274.0, 35884.0, 127003.0, 580980.0, 206291.0, 50362.0, 16647.0, 6139.0, 2433.0, 1046.0, 484.0, 289.0, 167.0, 93.0, 59.0, 49.0, 19.0, 19.0, 10.0, 9.0, 8.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.25, -11.790283203125, -11.33056640625, -10.870849609375, -10.4111328125, -9.951416015625, -9.49169921875, -9.031982421875, -8.572265625, -8.112548828125, -7.65283203125, -7.193115234375, -6.7333984375, -6.273681640625, -5.81396484375, -5.354248046875, -4.89453125, -4.434814453125, -3.97509765625, -3.515380859375, -3.0556640625, -2.595947265625, -2.13623046875, -1.676513671875, -1.216796875, -0.757080078125, -0.29736328125, 0.162353515625, 0.6220703125, 1.081787109375, 1.54150390625, 2.001220703125, 2.4609375, 2.920654296875, 3.38037109375, 3.840087890625, 4.2998046875, 4.759521484375, 5.21923828125, 5.678955078125, 6.138671875, 6.598388671875, 7.05810546875, 7.517822265625, 7.9775390625, 8.437255859375, 8.89697265625, 9.356689453125, 9.81640625, 10.276123046875, 10.73583984375, 11.195556640625, 11.6552734375, 12.114990234375, 12.57470703125, 13.034423828125, 13.494140625, 13.953857421875, 14.41357421875, 14.873291015625, 15.3330078125, 15.792724609375, 16.25244140625, 16.712158203125, 17.171875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 11.0, 15.0, 20.0, 14.0, 13.0, 22.0, 33.0, 26.0, 16.0, 33.0, 54.0, 53.0, 60.0, 95.0, 148.0, 1437.0, 390.0, 155.0, 91.0, 54.0, 40.0, 33.0, 48.0, 33.0, 23.0, 18.0, 32.0, 16.0, 19.0, 10.0, 12.0, 6.0, 2.0, 7.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.890625, -22.21630859375, -21.5419921875, -20.86767578125, -20.193359375, -19.51904296875, -18.8447265625, -18.17041015625, -17.49609375, -16.82177734375, -16.1474609375, -15.47314453125, -14.798828125, -14.12451171875, -13.4501953125, -12.77587890625, -12.1015625, -11.42724609375, -10.7529296875, -10.07861328125, -9.404296875, -8.72998046875, -8.0556640625, -7.38134765625, -6.70703125, -6.03271484375, -5.3583984375, -4.68408203125, -4.009765625, -3.33544921875, -2.6611328125, -1.98681640625, -1.3125, -0.63818359375, 0.0361328125, 0.71044921875, 1.384765625, 2.05908203125, 2.7333984375, 3.40771484375, 4.08203125, 4.75634765625, 5.4306640625, 6.10498046875, 6.779296875, 7.45361328125, 8.1279296875, 8.80224609375, 9.4765625, 10.15087890625, 10.8251953125, 11.49951171875, 12.173828125, 12.84814453125, 13.5224609375, 14.19677734375, 14.87109375, 15.54541015625, 16.2197265625, 16.89404296875, 17.568359375, 18.24267578125, 18.9169921875, 19.59130859375, 20.265625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 15.0, 10.0, 14.0, 16.0, 24.0, 37.0, 43.0, 71.0, 79.0, 128.0, 178.0, 330.0, 644.0, 1596.0, 6960.0, 55120.0, 2542073.0, 509803.0, 22446.0, 3745.0, 1095.0, 489.0, 255.0, 130.0, 94.0, 77.0, 65.0, 37.0, 28.0, 29.0, 24.0, 12.0, 8.0, 5.0, 1.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.03125, -31.054931640625, -30.07861328125, -29.102294921875, -28.1259765625, -27.149658203125, -26.17333984375, -25.197021484375, -24.220703125, -23.244384765625, -22.26806640625, -21.291748046875, -20.3154296875, -19.339111328125, -18.36279296875, -17.386474609375, -16.41015625, -15.433837890625, -14.45751953125, -13.481201171875, -12.5048828125, -11.528564453125, -10.55224609375, -9.575927734375, -8.599609375, -7.623291015625, -6.64697265625, -5.670654296875, -4.6943359375, -3.718017578125, -2.74169921875, -1.765380859375, -0.7890625, 0.187255859375, 1.16357421875, 2.139892578125, 3.1162109375, 4.092529296875, 5.06884765625, 6.045166015625, 7.021484375, 7.997802734375, 8.97412109375, 9.950439453125, 10.9267578125, 11.903076171875, 12.87939453125, 13.855712890625, 14.83203125, 15.808349609375, 16.78466796875, 17.760986328125, 18.7373046875, 19.713623046875, 20.68994140625, 21.666259765625, 22.642578125, 23.618896484375, 24.59521484375, 25.571533203125, 26.5478515625, 27.524169921875, 28.50048828125, 29.476806640625, 30.453125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 24.0, 263.0, 539.0, 175.0, 13.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-237.19248962402344, -232.1883544921875, -227.1842041015625, -222.18006896972656, -217.17593383789062, -212.1717987060547, -207.1676483154297, -202.16351318359375, -197.1593780517578, -192.15524291992188, -187.15109252929688, -182.14695739746094, -177.142822265625, -172.13868713378906, -167.13453674316406, -162.13040161132812, -157.12625122070312, -152.1221160888672, -147.1179656982422, -142.11383056640625, -137.1096954345703, -132.10556030273438, -127.10140991210938, -122.09727478027344, -117.0931396484375, -112.08899688720703, -107.0848617553711, -102.08071899414062, -97.07658386230469, -92.07244110107422, -87.06829833984375, -82.06416320800781, -77.06002807617188, -72.0558853149414, -67.05175018310547, -62.047607421875, -57.04347229003906, -52.039329528808594, -47.03519058227539, -42.03105163574219, -37.026912689208984, -32.02277374267578, -27.018634796142578, -22.014493942260742, -17.01035499572754, -12.006216049194336, -7.0020751953125, -1.9979362487792969, 3.0062026977539062, 8.01034164428711, 13.014481544494629, 18.01862144470215, 23.02276039123535, 28.026899337768555, 33.03104019165039, 38.035179138183594, 43.0393180847168, 48.04345703125, 53.0475959777832, 58.051734924316406, 63.055877685546875, 68.06001281738281, 73.06415557861328, 78.06829833984375, 83.07243347167969]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 9.0, 7.0, 10.0, 10.0, 13.0, 23.0, 22.0, 27.0, 33.0, 40.0, 37.0, 37.0, 43.0, 35.0, 32.0, 52.0, 39.0, 51.0, 53.0, 44.0, 37.0, 47.0, 42.0, 47.0, 30.0, 32.0, 24.0, 29.0, 26.0, 18.0, 15.0, 12.0, 8.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-66.27040100097656, -64.48889923095703, -62.707401275634766, -60.9259033203125, -59.144405364990234, -57.36290740966797, -55.58140563964844, -53.79990768432617, -52.018409729003906, -50.23691177368164, -48.45541000366211, -46.673912048339844, -44.89241409301758, -43.11091613769531, -41.32941436767578, -39.547916412353516, -37.766414642333984, -35.98491668701172, -34.20341491699219, -32.42191696166992, -30.640419006347656, -28.858919143676758, -27.07741928100586, -25.295921325683594, -23.514421463012695, -21.732921600341797, -19.95142364501953, -18.169923782348633, -16.388423919677734, -14.606925964355469, -12.82542610168457, -11.043927192687988, -9.262432098388672, -7.48093318939209, -5.69943380355835, -3.9179344177246094, -2.1364355087280273, -0.3549365997314453, 1.4265632629394531, 3.208062171936035, 4.989561080932617, 6.771059989929199, 8.552558898925781, 10.33405876159668, 12.115557670593262, 13.897056579589844, 15.678556442260742, 17.46005630493164, 19.241554260253906, 21.023054122924805, 22.80455207824707, 24.58605194091797, 26.367549896240234, 28.149049758911133, 29.93054962158203, 31.712047576904297, 33.49354553222656, 35.27504348754883, 37.05654525756836, 38.838043212890625, 40.61954116821289, 42.401039123535156, 44.18254089355469, 45.96403884887695, 47.745540618896484]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 5.0, 5.0, 5.0, 8.0, 6.0, 12.0, 11.0, 12.0, 15.0, 20.0, 18.0, 38.0, 21.0, 34.0, 40.0, 30.0, 35.0, 45.0, 55.0, 55.0, 63.0, 54.0, 36.0, 45.0, 46.0, 34.0, 37.0, 31.0, 24.0, 22.0, 21.0, 18.0, 18.0, 22.0, 12.0, 17.0, 16.0, 8.0, 7.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.55859375, -7.3201904296875, -7.081787109375, -6.8433837890625, -6.60498046875, -6.3665771484375, -6.128173828125, -5.8897705078125, -5.6513671875, -5.4129638671875, -5.174560546875, -4.9361572265625, -4.69775390625, -4.4593505859375, -4.220947265625, -3.9825439453125, -3.744140625, -3.5057373046875, -3.267333984375, -3.0289306640625, -2.79052734375, -2.5521240234375, -2.313720703125, -2.0753173828125, -1.8369140625, -1.5985107421875, -1.360107421875, -1.1217041015625, -0.88330078125, -0.6448974609375, -0.406494140625, -0.1680908203125, 0.0703125, 0.3087158203125, 0.547119140625, 0.7855224609375, 1.02392578125, 1.2623291015625, 1.500732421875, 1.7391357421875, 1.9775390625, 2.2159423828125, 2.454345703125, 2.6927490234375, 2.93115234375, 3.1695556640625, 3.407958984375, 3.6463623046875, 3.884765625, 4.1231689453125, 4.361572265625, 4.5999755859375, 4.83837890625, 5.0767822265625, 5.315185546875, 5.5535888671875, 5.7919921875, 6.0303955078125, 6.268798828125, 6.5072021484375, 6.74560546875, 6.9840087890625, 7.222412109375, 7.4608154296875, 7.69921875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 9.0, 17.0, 31.0, 37.0, 55.0, 84.0, 118.0, 218.0, 340.0, 611.0, 1098.0, 2230.0, 5054.0, 13569.0, 43970.0, 184173.0, 878098.0, 2042118.0, 793208.0, 168444.0, 39823.0, 12129.0, 4641.0, 1962.0, 947.0, 525.0, 283.0, 186.0, 108.0, 72.0, 48.0, 25.0, 24.0, 11.0, 4.0, 6.0, 3.0, 0.0, 1.0], "bins": [-13.6171875, -13.2965087890625, -12.975830078125, -12.6551513671875, -12.33447265625, -12.0137939453125, -11.693115234375, -11.3724365234375, -11.0517578125, -10.7310791015625, -10.410400390625, -10.0897216796875, -9.76904296875, -9.4483642578125, -9.127685546875, -8.8070068359375, -8.486328125, -8.1656494140625, -7.844970703125, -7.5242919921875, -7.20361328125, -6.8829345703125, -6.562255859375, -6.2415771484375, -5.9208984375, -5.6002197265625, -5.279541015625, -4.9588623046875, -4.63818359375, -4.3175048828125, -3.996826171875, -3.6761474609375, -3.35546875, -3.0347900390625, -2.714111328125, -2.3934326171875, -2.07275390625, -1.7520751953125, -1.431396484375, -1.1107177734375, -0.7900390625, -0.4693603515625, -0.148681640625, 0.1719970703125, 0.49267578125, 0.8133544921875, 1.134033203125, 1.4547119140625, 1.775390625, 2.0960693359375, 2.416748046875, 2.7374267578125, 3.05810546875, 3.3787841796875, 3.699462890625, 4.0201416015625, 4.3408203125, 4.6614990234375, 4.982177734375, 5.3028564453125, 5.62353515625, 5.9442138671875, 6.264892578125, 6.5855712890625, 6.90625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 6.0, 7.0, 7.0, 4.0, 15.0, 13.0, 27.0, 35.0, 42.0, 61.0, 74.0, 111.0, 184.0, 284.0, 380.0, 514.0, 618.0, 499.0, 366.0, 246.0, 173.0, 123.0, 72.0, 49.0, 49.0, 32.0, 17.0, 16.0, 13.0, 20.0, 4.0, 8.0, 1.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-14.296875, -13.923828125, -13.55078125, -13.177734375, -12.8046875, -12.431640625, -12.05859375, -11.685546875, -11.3125, -10.939453125, -10.56640625, -10.193359375, -9.8203125, -9.447265625, -9.07421875, -8.701171875, -8.328125, -7.955078125, -7.58203125, -7.208984375, -6.8359375, -6.462890625, -6.08984375, -5.716796875, -5.34375, -4.970703125, -4.59765625, -4.224609375, -3.8515625, -3.478515625, -3.10546875, -2.732421875, -2.359375, -1.986328125, -1.61328125, -1.240234375, -0.8671875, -0.494140625, -0.12109375, 0.251953125, 0.625, 0.998046875, 1.37109375, 1.744140625, 2.1171875, 2.490234375, 2.86328125, 3.236328125, 3.609375, 3.982421875, 4.35546875, 4.728515625, 5.1015625, 5.474609375, 5.84765625, 6.220703125, 6.59375, 6.966796875, 7.33984375, 7.712890625, 8.0859375, 8.458984375, 8.83203125, 9.205078125, 9.578125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 5.0, 11.0, 18.0, 44.0, 75.0, 235.0, 916.0, 15407.0, 4127258.0, 48806.0, 1106.0, 245.0, 98.0, 31.0, 16.0, 8.0, 5.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.53125, -41.84814453125, -39.1650390625, -36.48193359375, -33.798828125, -31.11572265625, -28.4326171875, -25.74951171875, -23.06640625, -20.38330078125, -17.7001953125, -15.01708984375, -12.333984375, -9.65087890625, -6.9677734375, -4.28466796875, -1.6015625, 1.08154296875, 3.7646484375, 6.44775390625, 9.130859375, 11.81396484375, 14.4970703125, 17.18017578125, 19.86328125, 22.54638671875, 25.2294921875, 27.91259765625, 30.595703125, 33.27880859375, 35.9619140625, 38.64501953125, 41.328125, 44.01123046875, 46.6943359375, 49.37744140625, 52.060546875, 54.74365234375, 57.4267578125, 60.10986328125, 62.79296875, 65.47607421875, 68.1591796875, 70.84228515625, 73.525390625, 76.20849609375, 78.8916015625, 81.57470703125, 84.2578125, 86.94091796875, 89.6240234375, 92.30712890625, 94.990234375, 97.67333984375, 100.3564453125, 103.03955078125, 105.72265625, 108.40576171875, 111.0888671875, 113.77197265625, 116.455078125, 119.13818359375, 121.8212890625, 124.50439453125, 127.1875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 18.0, 86.0, 299.0, 381.0, 164.0, 52.0, 10.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.99696350097656, -104.82659912109375, -99.65623474121094, -94.48587036132812, -89.31550598144531, -84.1451416015625, -78.97478485107422, -73.8044204711914, -68.6340560913086, -63.46369171142578, -58.29332733154297, -53.12296676635742, -47.95260238647461, -42.7822380065918, -37.61187744140625, -32.44151306152344, -27.271148681640625, -22.100784301757812, -16.930421829223633, -11.760058403015137, -6.589694976806641, -1.4193305969238281, 3.7510318756103516, 8.921394348144531, 14.091758728027344, 19.262123107910156, 24.432485580444336, 29.602848052978516, 34.77321243286133, 39.94357681274414, 45.11393737792969, 50.2843017578125, 55.454681396484375, 60.62504577636719, 65.79541015625, 70.96577453613281, 76.13613891601562, 81.30650329589844, 86.47686004638672, 91.64722442626953, 96.81758880615234, 101.98795318603516, 107.15831756591797, 112.32868194580078, 117.49903869628906, 122.66940307617188, 127.83976745605469, 133.0101318359375, 138.1804962158203, 143.35086059570312, 148.52122497558594, 153.69158935546875, 158.86195373535156, 164.03231811523438, 169.2026824951172, 174.373046875, 179.54339599609375, 184.71376037597656, 189.88412475585938, 195.0544891357422, 200.224853515625, 205.3952178955078, 210.56558227539062, 215.73593139648438, 220.90631103515625]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 10.0, 7.0, 5.0, 10.0, 14.0, 19.0, 24.0, 41.0, 38.0, 57.0, 49.0, 54.0, 53.0, 61.0, 57.0, 65.0, 73.0, 40.0, 50.0, 47.0, 49.0, 35.0, 34.0, 35.0, 16.0, 20.0, 14.0, 7.0, 11.0, 6.0, 2.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.226409912109375, -43.55092239379883, -41.87543487548828, -40.19994354248047, -38.52445602416992, -36.848968505859375, -35.17347717285156, -33.497989654541016, -31.82250213623047, -30.147014617919922, -28.471525192260742, -26.796035766601562, -25.120548248291016, -23.44506072998047, -21.76957130432129, -20.09408187866211, -18.418594360351562, -16.743106842041016, -15.067617416381836, -13.392128944396973, -11.71664047241211, -10.041152000427246, -8.365663528442383, -6.6901750564575195, -5.014686584472656, -3.339198112487793, -1.6637096405029297, 0.011778831481933594, 1.6872673034667969, 3.36275577545166, 5.038244247436523, 6.713732719421387, 8.389225006103516, 10.064713478088379, 11.740201950073242, 13.415690422058105, 15.091178894042969, 16.766666412353516, 18.442155838012695, 20.117645263671875, 21.793132781982422, 23.46862030029297, 25.14410972595215, 26.819599151611328, 28.495086669921875, 30.170574188232422, 31.8460636138916, 33.52155303955078, 35.19704055786133, 36.872528076171875, 38.54801940917969, 40.223506927490234, 41.89899444580078, 43.57448196411133, 45.249969482421875, 46.92546081542969, 48.600948333740234, 50.27643585205078, 51.951927185058594, 53.62741470336914, 55.30290222167969, 56.978389739990234, 58.65387725830078, 60.329368591308594, 62.00485610961914]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 4.0, 9.0, 4.0, 5.0, 8.0, 8.0, 17.0, 15.0, 17.0, 18.0, 30.0, 28.0, 28.0, 48.0, 37.0, 42.0, 40.0, 30.0, 54.0, 55.0, 36.0, 45.0, 47.0, 32.0, 36.0, 33.0, 28.0, 36.0, 33.0, 31.0, 35.0, 13.0, 13.0, 19.0, 20.0, 8.0, 7.0, 7.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.65234375, -6.4337158203125, -6.215087890625, -5.9964599609375, -5.77783203125, -5.5592041015625, -5.340576171875, -5.1219482421875, -4.9033203125, -4.6846923828125, -4.466064453125, -4.2474365234375, -4.02880859375, -3.8101806640625, -3.591552734375, -3.3729248046875, -3.154296875, -2.9356689453125, -2.717041015625, -2.4984130859375, -2.27978515625, -2.0611572265625, -1.842529296875, -1.6239013671875, -1.4052734375, -1.1866455078125, -0.968017578125, -0.7493896484375, -0.53076171875, -0.3121337890625, -0.093505859375, 0.1251220703125, 0.34375, 0.5623779296875, 0.781005859375, 0.9996337890625, 1.21826171875, 1.4368896484375, 1.655517578125, 1.8741455078125, 2.0927734375, 2.3114013671875, 2.530029296875, 2.7486572265625, 2.96728515625, 3.1859130859375, 3.404541015625, 3.6231689453125, 3.841796875, 4.0604248046875, 4.279052734375, 4.4976806640625, 4.71630859375, 4.9349365234375, 5.153564453125, 5.3721923828125, 5.5908203125, 5.8094482421875, 6.028076171875, 6.2467041015625, 6.46533203125, 6.6839599609375, 6.902587890625, 7.1212158203125, 7.33984375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 9.0, 15.0, 18.0, 28.0, 39.0, 69.0, 82.0, 147.0, 192.0, 291.0, 464.0, 648.0, 990.0, 1418.0, 2144.0, 3186.0, 4987.0, 7538.0, 11822.0, 18039.0, 27741.0, 42033.0, 62555.0, 90103.0, 120288.0, 143242.0, 140552.0, 114553.0, 84341.0, 58309.0, 39059.0, 25693.0, 16465.0, 10671.0, 7153.0, 4522.0, 3076.0, 2011.0, 1338.0, 876.0, 617.0, 407.0, 248.0, 176.0, 128.0, 88.0, 57.0, 40.0, 35.0, 14.0, 17.0, 11.0, 1.0, 6.0, 3.0, 1.0, 3.0], "bins": [-1.001953125, -0.9715042114257812, -0.9410552978515625, -0.9106063842773438, -0.880157470703125, -0.8497085571289062, -0.8192596435546875, -0.7888107299804688, -0.75836181640625, -0.7279129028320312, -0.6974639892578125, -0.6670150756835938, -0.636566162109375, -0.6061172485351562, -0.5756683349609375, -0.5452194213867188, -0.5147705078125, -0.48432159423828125, -0.4538726806640625, -0.42342376708984375, -0.392974853515625, -0.36252593994140625, -0.3320770263671875, -0.30162811279296875, -0.27117919921875, -0.24073028564453125, -0.2102813720703125, -0.17983245849609375, -0.149383544921875, -0.11893463134765625, -0.0884857177734375, -0.05803680419921875, -0.027587890625, 0.00286102294921875, 0.0333099365234375, 0.06375885009765625, 0.094207763671875, 0.12465667724609375, 0.1551055908203125, 0.18555450439453125, 0.21600341796875, 0.24645233154296875, 0.2769012451171875, 0.30735015869140625, 0.337799072265625, 0.36824798583984375, 0.3986968994140625, 0.42914581298828125, 0.4595947265625, 0.49004364013671875, 0.5204925537109375, 0.5509414672851562, 0.581390380859375, 0.6118392944335938, 0.6422882080078125, 0.6727371215820312, 0.70318603515625, 0.7336349487304688, 0.7640838623046875, 0.7945327758789062, 0.824981689453125, 0.8554306030273438, 0.8858795166015625, 0.9163284301757812, 0.94677734375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 6.0, 4.0, 9.0, 7.0, 17.0, 10.0, 18.0, 23.0, 23.0, 16.0, 19.0, 36.0, 25.0, 35.0, 24.0, 30.0, 34.0, 50.0, 36.0, 44.0, 30.0, 1070.0, 38.0, 41.0, 32.0, 38.0, 44.0, 33.0, 24.0, 16.0, 28.0, 22.0, 18.0, 20.0, 14.0, 14.0, 13.0, 10.0, 9.0, 13.0, 3.0, 7.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.18359375, -5.02191162109375, -4.8602294921875, -4.69854736328125, -4.536865234375, -4.37518310546875, -4.2135009765625, -4.05181884765625, -3.89013671875, -3.72845458984375, -3.5667724609375, -3.40509033203125, -3.243408203125, -3.08172607421875, -2.9200439453125, -2.75836181640625, -2.5966796875, -2.43499755859375, -2.2733154296875, -2.11163330078125, -1.949951171875, -1.78826904296875, -1.6265869140625, -1.46490478515625, -1.30322265625, -1.14154052734375, -0.9798583984375, -0.81817626953125, -0.656494140625, -0.49481201171875, -0.3331298828125, -0.17144775390625, -0.009765625, 0.15191650390625, 0.3135986328125, 0.47528076171875, 0.636962890625, 0.79864501953125, 0.9603271484375, 1.12200927734375, 1.28369140625, 1.44537353515625, 1.6070556640625, 1.76873779296875, 1.930419921875, 2.09210205078125, 2.2537841796875, 2.41546630859375, 2.5771484375, 2.73883056640625, 2.9005126953125, 3.06219482421875, 3.223876953125, 3.38555908203125, 3.5472412109375, 3.70892333984375, 3.87060546875, 4.03228759765625, 4.1939697265625, 4.35565185546875, 4.517333984375, 4.67901611328125, 4.8406982421875, 5.00238037109375, 5.1640625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 12.0, 10.0, 16.0, 15.0, 39.0, 48.0, 65.0, 101.0, 144.0, 185.0, 263.0, 380.0, 558.0, 784.0, 1169.0, 1734.0, 2479.0, 3645.0, 5475.0, 8291.0, 12797.0, 21414.0, 53041.0, 1468396.0, 419529.0, 41947.0, 19375.0, 11850.0, 7584.0, 5075.0, 3433.0, 2241.0, 1539.0, 1043.0, 712.0, 519.0, 365.0, 249.0, 176.0, 115.0, 86.0, 61.0, 59.0, 29.0, 25.0, 18.0, 13.0, 10.0, 7.0, 6.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.943359375, -1.8824615478515625, -1.821563720703125, -1.7606658935546875, -1.69976806640625, -1.6388702392578125, -1.577972412109375, -1.5170745849609375, -1.4561767578125, -1.3952789306640625, -1.334381103515625, -1.2734832763671875, -1.21258544921875, -1.1516876220703125, -1.090789794921875, -1.0298919677734375, -0.968994140625, -0.9080963134765625, -0.847198486328125, -0.7863006591796875, -0.72540283203125, -0.6645050048828125, -0.603607177734375, -0.5427093505859375, -0.4818115234375, -0.4209136962890625, -0.360015869140625, -0.2991180419921875, -0.23822021484375, -0.1773223876953125, -0.116424560546875, -0.0555267333984375, 0.00537109375, 0.0662689208984375, 0.127166748046875, 0.1880645751953125, 0.24896240234375, 0.3098602294921875, 0.370758056640625, 0.4316558837890625, 0.4925537109375, 0.5534515380859375, 0.614349365234375, 0.6752471923828125, 0.73614501953125, 0.7970428466796875, 0.857940673828125, 0.9188385009765625, 0.979736328125, 1.0406341552734375, 1.101531982421875, 1.1624298095703125, 1.22332763671875, 1.2842254638671875, 1.345123291015625, 1.4060211181640625, 1.4669189453125, 1.5278167724609375, 1.588714599609375, 1.6496124267578125, 1.71051025390625, 1.7714080810546875, 1.832305908203125, 1.8932037353515625, 1.9541015625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 8.0, 13.0, 6.0, 14.0, 10.0, 16.0, 18.0, 29.0, 24.0, 27.0, 34.0, 42.0, 30.0, 46.0, 54.0, 56.0, 59.0, 67.0, 62.0, 53.0, 34.0, 50.0, 36.0, 35.0, 28.0, 24.0, 19.0, 23.0, 17.0, 11.0, 10.0, 6.0, 2.0, 7.0, 5.0, 3.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1104736328125, -0.10691070556640625, -0.1033477783203125, -0.09978485107421875, -0.096221923828125, -0.09265899658203125, -0.0890960693359375, -0.08553314208984375, -0.08197021484375, -0.07840728759765625, -0.0748443603515625, -0.07128143310546875, -0.067718505859375, -0.06415557861328125, -0.0605926513671875, -0.05702972412109375, -0.053466796875, -0.04990386962890625, -0.0463409423828125, -0.04277801513671875, -0.039215087890625, -0.03565216064453125, -0.0320892333984375, -0.02852630615234375, -0.02496337890625, -0.02140045166015625, -0.0178375244140625, -0.01427459716796875, -0.010711669921875, -0.00714874267578125, -0.0035858154296875, -2.288818359375e-05, 0.0035400390625, 0.00710296630859375, 0.0106658935546875, 0.01422882080078125, 0.017791748046875, 0.02135467529296875, 0.0249176025390625, 0.02848052978515625, 0.03204345703125, 0.03560638427734375, 0.0391693115234375, 0.04273223876953125, 0.046295166015625, 0.04985809326171875, 0.0534210205078125, 0.05698394775390625, 0.060546875, 0.06410980224609375, 0.0676727294921875, 0.07123565673828125, 0.074798583984375, 0.07836151123046875, 0.0819244384765625, 0.08548736572265625, 0.08905029296875, 0.09261322021484375, 0.0961761474609375, 0.09973907470703125, 0.103302001953125, 0.10686492919921875, 0.1104278564453125, 0.11399078369140625, 0.1175537109375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 5.0, 3.0, 2.0, 6.0, 6.0, 5.0, 5.0, 12.0, 13.0, 22.0, 26.0, 41.0, 38.0, 50.0, 88.0, 99.0, 158.0, 264.0, 471.0, 1284.0, 309820.0, 733118.0, 1554.0, 553.0, 271.0, 186.0, 107.0, 83.0, 57.0, 53.0, 28.0, 26.0, 25.0, 16.0, 14.0, 10.0, 10.0, 8.0, 7.0, 3.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.4296875, -2.356201171875, -2.28271484375, -2.209228515625, -2.1357421875, -2.062255859375, -1.98876953125, -1.915283203125, -1.841796875, -1.768310546875, -1.69482421875, -1.621337890625, -1.5478515625, -1.474365234375, -1.40087890625, -1.327392578125, -1.25390625, -1.180419921875, -1.10693359375, -1.033447265625, -0.9599609375, -0.886474609375, -0.81298828125, -0.739501953125, -0.666015625, -0.592529296875, -0.51904296875, -0.445556640625, -0.3720703125, -0.298583984375, -0.22509765625, -0.151611328125, -0.078125, -0.004638671875, 0.06884765625, 0.142333984375, 0.2158203125, 0.289306640625, 0.36279296875, 0.436279296875, 0.509765625, 0.583251953125, 0.65673828125, 0.730224609375, 0.8037109375, 0.877197265625, 0.95068359375, 1.024169921875, 1.09765625, 1.171142578125, 1.24462890625, 1.318115234375, 1.3916015625, 1.465087890625, 1.53857421875, 1.612060546875, 1.685546875, 1.759033203125, 1.83251953125, 1.906005859375, 1.9794921875, 2.052978515625, 2.12646484375, 2.199951171875, 2.2734375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 946.0, 63.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.683729887008667, -3.6209278106689453, -3.5581257343292236, -3.495323657989502, -3.4325215816497803, -3.3697195053100586, -3.306917428970337, -3.2441153526306152, -3.1813132762908936, -3.118511199951172, -3.05570912361145, -2.9929070472717285, -2.930104970932007, -2.867302894592285, -2.8045008182525635, -2.741698741912842, -2.678896427154541, -2.6160943508148193, -2.5532922744750977, -2.490490198135376, -2.4276881217956543, -2.3648860454559326, -2.302083969116211, -2.2392818927764893, -2.1764798164367676, -2.113677740097046, -2.050875663757324, -1.9880735874176025, -1.9252715110778809, -1.8624694347381592, -1.7996673583984375, -1.7368652820587158, -1.674062967300415, -1.6112608909606934, -1.5484588146209717, -1.48565673828125, -1.4228546619415283, -1.3600525856018066, -1.297250509262085, -1.2344484329223633, -1.1716463565826416, -1.10884428024292, -1.0460422039031982, -0.9832401275634766, -0.9204380512237549, -0.8576359748840332, -0.7948338389396667, -0.7320317625999451, -0.6692296862602234, -0.6064276099205017, -0.54362553358078, -0.48082342743873596, -0.4180213510990143, -0.3552192747592926, -0.29241716861724854, -0.22961509227752686, -0.16681301593780518, -0.1040109321475029, -0.04120884835720062, 0.02159324288368225, 0.08439531922340393, 0.1471973955631256, 0.20999950170516968, 0.27280157804489136, 0.33560365438461304]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 6.0, 3.0, 8.0, 20.0, 9.0, 15.0, 18.0, 24.0, 28.0, 32.0, 25.0, 26.0, 41.0, 39.0, 40.0, 42.0, 44.0, 47.0, 38.0, 48.0, 44.0, 46.0, 40.0, 49.0, 46.0, 37.0, 36.0, 24.0, 24.0, 31.0, 16.0, 9.0, 10.0, 8.0, 5.0, 2.0, 7.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16095411777496338, -0.15575681626796722, -0.15055952966213226, -0.1453622281551361, -0.14016492664813995, -0.1349676251411438, -0.12977033853530884, -0.12457303702831268, -0.11937574297189713, -0.11417844891548157, -0.10898114740848541, -0.10378385335206985, -0.0985865592956543, -0.09338925778865814, -0.08819196373224258, -0.08299466967582703, -0.07779736816883087, -0.07260007411241531, -0.06740277260541916, -0.0622054785490036, -0.057008180767297745, -0.05181088298559189, -0.04661358892917633, -0.041416291147470474, -0.03621899336576462, -0.03102169558405876, -0.025824399664998055, -0.020627103745937347, -0.015429805964231491, -0.010232508182525635, -0.005035212263464928, 0.00016208365559577942, 0.005359381437301636, 0.010556678287684917, 0.0157539751380682, 0.020951271057128906, 0.026148568838834763, 0.03134586662054062, 0.03654316067695618, 0.04174045845866203, 0.04693775624036789, 0.052135054022073746, 0.0573323518037796, 0.06252964586019516, 0.06772693991661072, 0.07292424142360687, 0.07812153548002243, 0.08331882953643799, 0.08851613104343414, 0.0937134250998497, 0.09891072660684586, 0.10410802066326141, 0.10930532217025757, 0.11450261622667313, 0.11969991028308868, 0.12489721179008484, 0.1300944983959198, 0.13529179990291595, 0.14048908650875092, 0.14568638801574707, 0.15088368952274323, 0.15608099102973938, 0.16127827763557434, 0.1664755791425705, 0.17167288064956665]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 9.0, 10.0, 14.0, 20.0, 14.0, 36.0, 21.0, 39.0, 33.0, 36.0, 52.0, 51.0, 47.0, 46.0, 48.0, 40.0, 45.0, 45.0, 58.0, 46.0, 41.0, 30.0, 37.0, 39.0, 24.0, 22.0, 17.0, 9.0, 12.0, 12.0, 9.0, 6.0, 6.0, 5.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0234375, -7.7745361328125, -7.525634765625, -7.2767333984375, -7.02783203125, -6.7789306640625, -6.530029296875, -6.2811279296875, -6.0322265625, -5.7833251953125, -5.534423828125, -5.2855224609375, -5.03662109375, -4.7877197265625, -4.538818359375, -4.2899169921875, -4.041015625, -3.7921142578125, -3.543212890625, -3.2943115234375, -3.04541015625, -2.7965087890625, -2.547607421875, -2.2987060546875, -2.0498046875, -1.8009033203125, -1.552001953125, -1.3031005859375, -1.05419921875, -0.8052978515625, -0.556396484375, -0.3074951171875, -0.05859375, 0.1903076171875, 0.439208984375, 0.6881103515625, 0.93701171875, 1.1859130859375, 1.434814453125, 1.6837158203125, 1.9326171875, 2.1815185546875, 2.430419921875, 2.6793212890625, 2.92822265625, 3.1771240234375, 3.426025390625, 3.6749267578125, 3.923828125, 4.1727294921875, 4.421630859375, 4.6705322265625, 4.91943359375, 5.1683349609375, 5.417236328125, 5.6661376953125, 5.9150390625, 6.1639404296875, 6.412841796875, 6.6617431640625, 6.91064453125, 7.1595458984375, 7.408447265625, 7.6573486328125, 7.90625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 6.0, 3.0, 9.0, 3.0, 12.0, 12.0, 26.0, 21.0, 53.0, 58.0, 104.0, 148.0, 229.0, 394.0, 550.0, 870.0, 1433.0, 2320.0, 3585.0, 6245.0, 10751.0, 19015.0, 36311.0, 71291.0, 148423.0, 276723.0, 233807.0, 113701.0, 55590.0, 28877.0, 15650.0, 8921.0, 5127.0, 3051.0, 1921.0, 1160.0, 763.0, 486.0, 327.0, 171.0, 115.0, 96.0, 65.0, 42.0, 33.0, 20.0, 12.0, 10.0, 8.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.46875, -6.24432373046875, -6.0198974609375, -5.79547119140625, -5.571044921875, -5.34661865234375, -5.1221923828125, -4.89776611328125, -4.67333984375, -4.44891357421875, -4.2244873046875, -4.00006103515625, -3.775634765625, -3.55120849609375, -3.3267822265625, -3.10235595703125, -2.8779296875, -2.65350341796875, -2.4290771484375, -2.20465087890625, -1.980224609375, -1.75579833984375, -1.5313720703125, -1.30694580078125, -1.08251953125, -0.85809326171875, -0.6336669921875, -0.40924072265625, -0.184814453125, 0.03961181640625, 0.2640380859375, 0.48846435546875, 0.712890625, 0.93731689453125, 1.1617431640625, 1.38616943359375, 1.610595703125, 1.83502197265625, 2.0594482421875, 2.28387451171875, 2.50830078125, 2.73272705078125, 2.9571533203125, 3.18157958984375, 3.406005859375, 3.63043212890625, 3.8548583984375, 4.07928466796875, 4.3037109375, 4.52813720703125, 4.7525634765625, 4.97698974609375, 5.201416015625, 5.42584228515625, 5.6502685546875, 5.87469482421875, 6.09912109375, 6.32354736328125, 6.5479736328125, 6.77239990234375, 6.996826171875, 7.22125244140625, 7.4456787109375, 7.67010498046875, 7.89453125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 7.0, 13.0, 10.0, 9.0, 11.0, 13.0, 21.0, 20.0, 19.0, 22.0, 26.0, 30.0, 30.0, 37.0, 64.0, 50.0, 68.0, 112.0, 177.0, 1338.0, 270.0, 162.0, 85.0, 63.0, 53.0, 43.0, 41.0, 35.0, 34.0, 21.0, 26.0, 27.0, 12.0, 19.0, 11.0, 15.0, 6.0, 7.0, 11.0, 6.0, 7.0, 4.0, 3.0, 0.0, 0.0, 1.0, 5.0, 3.0, 0.0, 3.0, 2.0], "bins": [-18.140625, -17.589111328125, -17.03759765625, -16.486083984375, -15.9345703125, -15.383056640625, -14.83154296875, -14.280029296875, -13.728515625, -13.177001953125, -12.62548828125, -12.073974609375, -11.5224609375, -10.970947265625, -10.41943359375, -9.867919921875, -9.31640625, -8.764892578125, -8.21337890625, -7.661865234375, -7.1103515625, -6.558837890625, -6.00732421875, -5.455810546875, -4.904296875, -4.352783203125, -3.80126953125, -3.249755859375, -2.6982421875, -2.146728515625, -1.59521484375, -1.043701171875, -0.4921875, 0.059326171875, 0.61083984375, 1.162353515625, 1.7138671875, 2.265380859375, 2.81689453125, 3.368408203125, 3.919921875, 4.471435546875, 5.02294921875, 5.574462890625, 6.1259765625, 6.677490234375, 7.22900390625, 7.780517578125, 8.33203125, 8.883544921875, 9.43505859375, 9.986572265625, 10.5380859375, 11.089599609375, 11.64111328125, 12.192626953125, 12.744140625, 13.295654296875, 13.84716796875, 14.398681640625, 14.9501953125, 15.501708984375, 16.05322265625, 16.604736328125, 17.15625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 4.0, 6.0, 20.0, 26.0, 34.0, 51.0, 69.0, 101.0, 143.0, 239.0, 352.0, 670.0, 1842.0, 7089.0, 40309.0, 468771.0, 2438479.0, 160387.0, 20398.0, 4203.0, 1158.0, 500.0, 270.0, 174.0, 133.0, 71.0, 57.0, 44.0, 31.0, 18.0, 12.0, 13.0, 3.0, 8.0, 4.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.171875, -19.45947265625, -18.7470703125, -18.03466796875, -17.322265625, -16.60986328125, -15.8974609375, -15.18505859375, -14.47265625, -13.76025390625, -13.0478515625, -12.33544921875, -11.623046875, -10.91064453125, -10.1982421875, -9.48583984375, -8.7734375, -8.06103515625, -7.3486328125, -6.63623046875, -5.923828125, -5.21142578125, -4.4990234375, -3.78662109375, -3.07421875, -2.36181640625, -1.6494140625, -0.93701171875, -0.224609375, 0.48779296875, 1.2001953125, 1.91259765625, 2.625, 3.33740234375, 4.0498046875, 4.76220703125, 5.474609375, 6.18701171875, 6.8994140625, 7.61181640625, 8.32421875, 9.03662109375, 9.7490234375, 10.46142578125, 11.173828125, 11.88623046875, 12.5986328125, 13.31103515625, 14.0234375, 14.73583984375, 15.4482421875, 16.16064453125, 16.873046875, 17.58544921875, 18.2978515625, 19.01025390625, 19.72265625, 20.43505859375, 21.1474609375, 21.85986328125, 22.572265625, 23.28466796875, 23.9970703125, 24.70947265625, 25.421875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 15.0, 718.0, 282.0, 4.0], "bins": [-700.5646362304688, -689.233642578125, -677.9027099609375, -666.5717163085938, -655.24072265625, -643.9097900390625, -632.5787963867188, -621.247802734375, -609.9168701171875, -598.5858764648438, -587.2549438476562, -575.9239501953125, -564.5929565429688, -553.2620239257812, -541.9310302734375, -530.6000366210938, -519.26904296875, -507.9380798339844, -496.6070861816406, -485.276123046875, -473.94512939453125, -462.6141662597656, -451.283203125, -439.95220947265625, -428.6212463378906, -417.290283203125, -405.95928955078125, -394.6283264160156, -383.29736328125, -371.96636962890625, -360.6354064941406, -349.304443359375, -337.9734802246094, -326.64251708984375, -315.3115234375, -303.9805603027344, -292.64959716796875, -281.318603515625, -269.9876403808594, -258.65667724609375, -247.32568359375, -235.9947052001953, -224.66372680664062, -213.332763671875, -202.0017852783203, -190.67080688476562, -179.33984375, -168.0088653564453, -156.67788696289062, -145.34690856933594, -134.01593017578125, -122.68496704101562, -111.35398864746094, -100.02301025390625, -88.6920394897461, -77.36106872558594, -66.03009033203125, -54.69911575317383, -43.368141174316406, -32.037166595458984, -20.706192016601562, -9.37521743774414, 1.9557571411132812, 13.286727905273438, 24.617708206176758]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 5.0, 12.0, 10.0, 12.0, 14.0, 19.0, 24.0, 26.0, 26.0, 34.0, 35.0, 30.0, 42.0, 45.0, 51.0, 42.0, 41.0, 40.0, 36.0, 49.0, 54.0, 50.0, 36.0, 32.0, 43.0, 32.0, 31.0, 19.0, 19.0, 16.0, 16.0, 6.0, 14.0, 11.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-60.706729888916016, -59.10851287841797, -57.51029968261719, -55.91208267211914, -54.313865661621094, -52.71565246582031, -51.117435455322266, -49.51921844482422, -47.92100524902344, -46.32278823852539, -44.72457504272461, -43.12635803222656, -41.528141021728516, -39.92992401123047, -38.33171081542969, -36.73349380493164, -35.135276794433594, -33.53705978393555, -31.938844680786133, -30.34062957763672, -28.742412567138672, -27.144197463989258, -25.545982360839844, -23.947765350341797, -22.349550247192383, -20.75133514404297, -19.153118133544922, -17.554903030395508, -15.956686973571777, -14.358470916748047, -12.760255813598633, -11.162039756774902, -9.563827514648438, -7.965611457824707, -6.367395877838135, -4.7691802978515625, -3.170964241027832, -1.5727481842041016, 0.0254669189453125, 1.623682975769043, 3.2218990325927734, 4.820115089416504, 6.418330669403076, 8.016546249389648, 9.614762306213379, 11.21297836303711, 12.811193466186523, 14.409409523010254, 16.007625579833984, 17.6058406829834, 19.204057693481445, 20.80227279663086, 22.400489807128906, 23.99870491027832, 25.596920013427734, 27.19513702392578, 28.793352127075195, 30.39156723022461, 31.989784240722656, 33.58799743652344, 35.186214447021484, 36.78443145751953, 38.38264465332031, 39.98086166381836, 41.579078674316406]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 3.0, 5.0, 4.0, 7.0, 13.0, 10.0, 10.0, 15.0, 19.0, 18.0, 29.0, 33.0, 27.0, 35.0, 52.0, 43.0, 41.0, 43.0, 45.0, 44.0, 53.0, 31.0, 39.0, 57.0, 40.0, 39.0, 33.0, 30.0, 28.0, 28.0, 15.0, 25.0, 17.0, 17.0, 14.0, 14.0, 8.0, 2.0, 4.0, 7.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.81640625, -7.57904052734375, -7.3416748046875, -7.10430908203125, -6.866943359375, -6.62957763671875, -6.3922119140625, -6.15484619140625, -5.91748046875, -5.68011474609375, -5.4427490234375, -5.20538330078125, -4.968017578125, -4.73065185546875, -4.4932861328125, -4.25592041015625, -4.0185546875, -3.78118896484375, -3.5438232421875, -3.30645751953125, -3.069091796875, -2.83172607421875, -2.5943603515625, -2.35699462890625, -2.11962890625, -1.88226318359375, -1.6448974609375, -1.40753173828125, -1.170166015625, -0.93280029296875, -0.6954345703125, -0.45806884765625, -0.220703125, 0.01666259765625, 0.2540283203125, 0.49139404296875, 0.728759765625, 0.96612548828125, 1.2034912109375, 1.44085693359375, 1.67822265625, 1.91558837890625, 2.1529541015625, 2.39031982421875, 2.627685546875, 2.86505126953125, 3.1024169921875, 3.33978271484375, 3.5771484375, 3.81451416015625, 4.0518798828125, 4.28924560546875, 4.526611328125, 4.76397705078125, 5.0013427734375, 5.23870849609375, 5.47607421875, 5.71343994140625, 5.9508056640625, 6.18817138671875, 6.425537109375, 6.66290283203125, 6.9002685546875, 7.13763427734375, 7.375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 8.0, 16.0, 33.0, 40.0, 78.0, 167.0, 319.0, 638.0, 1768.0, 6084.0, 27754.0, 211573.0, 2085430.0, 1669090.0, 161283.0, 22317.0, 5081.0, 1513.0, 562.0, 250.0, 119.0, 74.0, 34.0, 31.0, 18.0, 8.0, 6.0, 1.0, 1.0], "bins": [-23.34375, -22.8568115234375, -22.369873046875, -21.8829345703125, -21.39599609375, -20.9090576171875, -20.422119140625, -19.9351806640625, -19.4482421875, -18.9613037109375, -18.474365234375, -17.9874267578125, -17.50048828125, -17.0135498046875, -16.526611328125, -16.0396728515625, -15.552734375, -15.0657958984375, -14.578857421875, -14.0919189453125, -13.60498046875, -13.1180419921875, -12.631103515625, -12.1441650390625, -11.6572265625, -11.1702880859375, -10.683349609375, -10.1964111328125, -9.70947265625, -9.2225341796875, -8.735595703125, -8.2486572265625, -7.76171875, -7.2747802734375, -6.787841796875, -6.3009033203125, -5.81396484375, -5.3270263671875, -4.840087890625, -4.3531494140625, -3.8662109375, -3.3792724609375, -2.892333984375, -2.4053955078125, -1.91845703125, -1.4315185546875, -0.944580078125, -0.4576416015625, 0.029296875, 0.5162353515625, 1.003173828125, 1.4901123046875, 1.97705078125, 2.4639892578125, 2.950927734375, 3.4378662109375, 3.9248046875, 4.4117431640625, 4.898681640625, 5.3856201171875, 5.87255859375, 6.3594970703125, 6.846435546875, 7.3333740234375, 7.8203125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 7.0, 10.0, 4.0, 5.0, 9.0, 16.0, 13.0, 25.0, 31.0, 34.0, 40.0, 66.0, 74.0, 95.0, 141.0, 212.0, 339.0, 415.0, 495.0, 496.0, 397.0, 335.0, 205.0, 168.0, 104.0, 80.0, 52.0, 49.0, 43.0, 21.0, 23.0, 14.0, 13.0, 7.0, 7.0, 7.0, 10.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.5411376953125, -8.246337890625, -7.9515380859375, -7.65673828125, -7.3619384765625, -7.067138671875, -6.7723388671875, -6.4775390625, -6.1827392578125, -5.887939453125, -5.5931396484375, -5.29833984375, -5.0035400390625, -4.708740234375, -4.4139404296875, -4.119140625, -3.8243408203125, -3.529541015625, -3.2347412109375, -2.93994140625, -2.6451416015625, -2.350341796875, -2.0555419921875, -1.7607421875, -1.4659423828125, -1.171142578125, -0.8763427734375, -0.58154296875, -0.2867431640625, 0.008056640625, 0.3028564453125, 0.59765625, 0.8924560546875, 1.187255859375, 1.4820556640625, 1.77685546875, 2.0716552734375, 2.366455078125, 2.6612548828125, 2.9560546875, 3.2508544921875, 3.545654296875, 3.8404541015625, 4.13525390625, 4.4300537109375, 4.724853515625, 5.0196533203125, 5.314453125, 5.6092529296875, 5.904052734375, 6.1988525390625, 6.49365234375, 6.7884521484375, 7.083251953125, 7.3780517578125, 7.6728515625, 7.9676513671875, 8.262451171875, 8.5572509765625, 8.85205078125, 9.1468505859375, 9.441650390625, 9.7364501953125, 10.03125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 5.0, 9.0, 12.0, 20.0, 32.0, 34.0, 52.0, 89.0, 146.0, 268.0, 544.0, 1381.0, 5039.0, 28924.0, 296165.0, 3282052.0, 527349.0, 42289.0, 6855.0, 1691.0, 592.0, 282.0, 187.0, 97.0, 54.0, 29.0, 33.0, 12.0, 19.0, 4.0, 5.0, 7.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.640625, -21.924072265625, -21.20751953125, -20.490966796875, -19.7744140625, -19.057861328125, -18.34130859375, -17.624755859375, -16.908203125, -16.191650390625, -15.47509765625, -14.758544921875, -14.0419921875, -13.325439453125, -12.60888671875, -11.892333984375, -11.17578125, -10.459228515625, -9.74267578125, -9.026123046875, -8.3095703125, -7.593017578125, -6.87646484375, -6.159912109375, -5.443359375, -4.726806640625, -4.01025390625, -3.293701171875, -2.5771484375, -1.860595703125, -1.14404296875, -0.427490234375, 0.2890625, 1.005615234375, 1.72216796875, 2.438720703125, 3.1552734375, 3.871826171875, 4.58837890625, 5.304931640625, 6.021484375, 6.738037109375, 7.45458984375, 8.171142578125, 8.8876953125, 9.604248046875, 10.32080078125, 11.037353515625, 11.75390625, 12.470458984375, 13.18701171875, 13.903564453125, 14.6201171875, 15.336669921875, 16.05322265625, 16.769775390625, 17.486328125, 18.202880859375, 18.91943359375, 19.635986328125, 20.3525390625, 21.069091796875, 21.78564453125, 22.502197265625, 23.21875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 23.0, 156.0, 357.0, 343.0, 112.0, 18.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-237.08856201171875, -232.3387451171875, -227.58892822265625, -222.839111328125, -218.08929443359375, -213.3394775390625, -208.58966064453125, -203.83984375, -199.09002685546875, -194.3402099609375, -189.59039306640625, -184.840576171875, -180.09075927734375, -175.3409423828125, -170.59112548828125, -165.84130859375, -161.09149169921875, -156.3416748046875, -151.59185791015625, -146.842041015625, -142.09222412109375, -137.3424072265625, -132.59259033203125, -127.8427734375, -123.09295654296875, -118.3431396484375, -113.59332275390625, -108.843505859375, -104.09368896484375, -99.3438720703125, -94.59405517578125, -89.84423828125, -85.09442138671875, -80.3446044921875, -75.59478759765625, -70.844970703125, -66.09515380859375, -61.3453369140625, -56.59552001953125, -51.845703125, -47.09588623046875, -42.3460693359375, -37.59625244140625, -32.846435546875, -28.09661865234375, -23.3468017578125, -18.59698486328125, -13.84716796875, -9.09735107421875, -4.3475341796875, 0.40228271484375, 5.152099609375, 9.90191650390625, 14.6517333984375, 19.40155029296875, 24.1513671875, 28.90118408203125, 33.6510009765625, 38.40081787109375, 43.150634765625, 47.90045166015625, 52.6502685546875, 57.40008544921875, 62.14990234375, 66.89971923828125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 8.0, 9.0, 7.0, 12.0, 9.0, 9.0, 15.0, 21.0, 22.0, 19.0, 22.0, 30.0, 28.0, 35.0, 37.0, 32.0, 37.0, 48.0, 44.0, 43.0, 28.0, 33.0, 38.0, 48.0, 42.0, 40.0, 35.0, 26.0, 23.0, 21.0, 24.0, 26.0, 22.0, 22.0, 11.0, 14.0, 14.0, 13.0, 7.0, 4.0, 4.0, 4.0, 5.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-37.77101135253906, -36.71135330200195, -35.651695251464844, -34.59203338623047, -33.53237533569336, -32.47271728515625, -31.41305923461914, -30.3533992767334, -29.293739318847656, -28.234081268310547, -27.174421310424805, -26.114763259887695, -25.055103302001953, -23.995445251464844, -22.935787200927734, -21.876127243041992, -20.816469192504883, -19.756811141967773, -18.69715118408203, -17.637493133544922, -16.57783317565918, -15.51817512512207, -14.458516120910645, -13.398857116699219, -12.339198112487793, -11.279539108276367, -10.219880104064941, -9.160221099853516, -8.100563049316406, -7.040903568267822, -5.981245040893555, -4.921586036682129, -3.861928939819336, -2.80226993560791, -1.7426111698150635, -0.6829524040222168, 0.376706600189209, 1.4363656044006348, 2.4960241317749023, 3.555683135986328, 4.615342140197754, 5.67500114440918, 6.7346601486206055, 7.794318675994873, 8.85397720336914, 9.913637161254883, 10.973295211791992, 12.032954216003418, 13.092613220214844, 14.15227222442627, 15.211931228637695, 16.271589279174805, 17.331249237060547, 18.390907287597656, 19.450565338134766, 20.510225296020508, 21.56988525390625, 22.62954330444336, 23.6892032623291, 24.74886131286621, 25.808521270751953, 26.868179321289062, 27.927837371826172, 28.987497329711914, 30.047155380249023]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 5.0, 6.0, 15.0, 12.0, 17.0, 15.0, 9.0, 27.0, 25.0, 25.0, 32.0, 21.0, 33.0, 25.0, 35.0, 38.0, 31.0, 47.0, 39.0, 36.0, 33.0, 31.0, 37.0, 45.0, 46.0, 35.0, 34.0, 28.0, 36.0, 26.0, 21.0, 23.0, 26.0, 19.0, 10.0, 12.0, 6.0, 5.0, 9.0, 7.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.828125, -6.6263427734375, -6.424560546875, -6.2227783203125, -6.02099609375, -5.8192138671875, -5.617431640625, -5.4156494140625, -5.2138671875, -5.0120849609375, -4.810302734375, -4.6085205078125, -4.40673828125, -4.2049560546875, -4.003173828125, -3.8013916015625, -3.599609375, -3.3978271484375, -3.196044921875, -2.9942626953125, -2.79248046875, -2.5906982421875, -2.388916015625, -2.1871337890625, -1.9853515625, -1.7835693359375, -1.581787109375, -1.3800048828125, -1.17822265625, -0.9764404296875, -0.774658203125, -0.5728759765625, -0.37109375, -0.1693115234375, 0.032470703125, 0.2342529296875, 0.43603515625, 0.6378173828125, 0.839599609375, 1.0413818359375, 1.2431640625, 1.4449462890625, 1.646728515625, 1.8485107421875, 2.05029296875, 2.2520751953125, 2.453857421875, 2.6556396484375, 2.857421875, 3.0592041015625, 3.260986328125, 3.4627685546875, 3.66455078125, 3.8663330078125, 4.068115234375, 4.2698974609375, 4.4716796875, 4.6734619140625, 4.875244140625, 5.0770263671875, 5.27880859375, 5.4805908203125, 5.682373046875, 5.8841552734375, 6.0859375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 4.0, 6.0, 10.0, 20.0, 33.0, 33.0, 75.0, 72.0, 153.0, 206.0, 290.0, 448.0, 679.0, 975.0, 1613.0, 2451.0, 3882.0, 6175.0, 9752.0, 15344.0, 24169.0, 38538.0, 60853.0, 92248.0, 132258.0, 161771.0, 155682.0, 118578.0, 80626.0, 52171.0, 32625.0, 20782.0, 13058.0, 8170.0, 5194.0, 3337.0, 2110.0, 1427.0, 913.0, 610.0, 401.0, 270.0, 159.0, 135.0, 69.0, 63.0, 41.0, 21.0, 16.0, 14.0, 8.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.08984375, -1.05560302734375, -1.0213623046875, -0.98712158203125, -0.952880859375, -0.91864013671875, -0.8843994140625, -0.85015869140625, -0.81591796875, -0.78167724609375, -0.7474365234375, -0.71319580078125, -0.678955078125, -0.64471435546875, -0.6104736328125, -0.57623291015625, -0.5419921875, -0.50775146484375, -0.4735107421875, -0.43927001953125, -0.405029296875, -0.37078857421875, -0.3365478515625, -0.30230712890625, -0.26806640625, -0.23382568359375, -0.1995849609375, -0.16534423828125, -0.131103515625, -0.09686279296875, -0.0626220703125, -0.02838134765625, 0.005859375, 0.04010009765625, 0.0743408203125, 0.10858154296875, 0.142822265625, 0.17706298828125, 0.2113037109375, 0.24554443359375, 0.27978515625, 0.31402587890625, 0.3482666015625, 0.38250732421875, 0.416748046875, 0.45098876953125, 0.4852294921875, 0.51947021484375, 0.5537109375, 0.58795166015625, 0.6221923828125, 0.65643310546875, 0.690673828125, 0.72491455078125, 0.7591552734375, 0.79339599609375, 0.82763671875, 0.86187744140625, 0.8961181640625, 0.93035888671875, 0.964599609375, 0.99884033203125, 1.0330810546875, 1.06732177734375, 1.1015625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 8.0, 10.0, 7.0, 17.0, 15.0, 17.0, 12.0, 19.0, 21.0, 22.0, 24.0, 32.0, 32.0, 37.0, 28.0, 36.0, 30.0, 40.0, 36.0, 1056.0, 47.0, 38.0, 31.0, 32.0, 39.0, 37.0, 37.0, 37.0, 28.0, 29.0, 23.0, 15.0, 27.0, 15.0, 12.0, 18.0, 14.0, 11.0, 6.0, 4.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.48828125, -5.32061767578125, -5.1529541015625, -4.98529052734375, -4.817626953125, -4.64996337890625, -4.4822998046875, -4.31463623046875, -4.14697265625, -3.97930908203125, -3.8116455078125, -3.64398193359375, -3.476318359375, -3.30865478515625, -3.1409912109375, -2.97332763671875, -2.8056640625, -2.63800048828125, -2.4703369140625, -2.30267333984375, -2.135009765625, -1.96734619140625, -1.7996826171875, -1.63201904296875, -1.46435546875, -1.29669189453125, -1.1290283203125, -0.96136474609375, -0.793701171875, -0.62603759765625, -0.4583740234375, -0.29071044921875, -0.123046875, 0.04461669921875, 0.2122802734375, 0.37994384765625, 0.547607421875, 0.71527099609375, 0.8829345703125, 1.05059814453125, 1.21826171875, 1.38592529296875, 1.5535888671875, 1.72125244140625, 1.888916015625, 2.05657958984375, 2.2242431640625, 2.39190673828125, 2.5595703125, 2.72723388671875, 2.8948974609375, 3.06256103515625, 3.230224609375, 3.39788818359375, 3.5655517578125, 3.73321533203125, 3.90087890625, 4.06854248046875, 4.2362060546875, 4.40386962890625, 4.571533203125, 4.73919677734375, 4.9068603515625, 5.07452392578125, 5.2421875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 7.0, 15.0, 17.0, 18.0, 40.0, 40.0, 70.0, 100.0, 148.0, 185.0, 266.0, 409.0, 556.0, 821.0, 1189.0, 1707.0, 2581.0, 3836.0, 5919.0, 9452.0, 15435.0, 29356.0, 135856.0, 1738968.0, 85340.0, 25192.0, 14268.0, 8623.0, 5522.0, 3622.0, 2434.0, 1591.0, 1075.0, 699.0, 495.0, 385.0, 255.0, 183.0, 132.0, 90.0, 82.0, 38.0, 36.0, 24.0, 17.0, 10.0, 9.0, 10.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1015625, -2.032440185546875, -1.96331787109375, -1.894195556640625, -1.8250732421875, -1.755950927734375, -1.68682861328125, -1.617706298828125, -1.548583984375, -1.479461669921875, -1.41033935546875, -1.341217041015625, -1.2720947265625, -1.202972412109375, -1.13385009765625, -1.064727783203125, -0.99560546875, -0.926483154296875, -0.85736083984375, -0.788238525390625, -0.7191162109375, -0.649993896484375, -0.58087158203125, -0.511749267578125, -0.442626953125, -0.373504638671875, -0.30438232421875, -0.235260009765625, -0.1661376953125, -0.097015380859375, -0.02789306640625, 0.041229248046875, 0.1103515625, 0.179473876953125, 0.24859619140625, 0.317718505859375, 0.3868408203125, 0.455963134765625, 0.52508544921875, 0.594207763671875, 0.663330078125, 0.732452392578125, 0.80157470703125, 0.870697021484375, 0.9398193359375, 1.008941650390625, 1.07806396484375, 1.147186279296875, 1.21630859375, 1.285430908203125, 1.35455322265625, 1.423675537109375, 1.4927978515625, 1.561920166015625, 1.63104248046875, 1.700164794921875, 1.769287109375, 1.838409423828125, 1.90753173828125, 1.976654052734375, 2.0457763671875, 2.114898681640625, 2.18402099609375, 2.253143310546875, 2.322265625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 6.0, 3.0, 10.0, 3.0, 11.0, 5.0, 11.0, 10.0, 7.0, 13.0, 22.0, 18.0, 20.0, 33.0, 33.0, 35.0, 45.0, 37.0, 43.0, 52.0, 49.0, 43.0, 49.0, 52.0, 45.0, 50.0, 31.0, 36.0, 36.0, 23.0, 32.0, 24.0, 13.0, 10.0, 17.0, 14.0, 12.0, 10.0, 5.0, 13.0, 6.0, 7.0, 2.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09228515625, -0.08918380737304688, -0.08608245849609375, -0.08298110961914062, -0.0798797607421875, -0.07677841186523438, -0.07367706298828125, -0.07057571411132812, -0.067474365234375, -0.06437301635742188, -0.06127166748046875, -0.058170318603515625, -0.0550689697265625, -0.051967620849609375, -0.04886627197265625, -0.045764923095703125, -0.04266357421875, -0.039562225341796875, -0.03646087646484375, -0.033359527587890625, -0.0302581787109375, -0.027156829833984375, -0.02405548095703125, -0.020954132080078125, -0.017852783203125, -0.014751434326171875, -0.01165008544921875, -0.008548736572265625, -0.0054473876953125, -0.002346038818359375, 0.00075531005859375, 0.003856658935546875, 0.0069580078125, 0.010059356689453125, 0.01316070556640625, 0.016262054443359375, 0.0193634033203125, 0.022464752197265625, 0.02556610107421875, 0.028667449951171875, 0.031768798828125, 0.034870147705078125, 0.03797149658203125, 0.041072845458984375, 0.0441741943359375, 0.047275543212890625, 0.05037689208984375, 0.053478240966796875, 0.05657958984375, 0.059680938720703125, 0.06278228759765625, 0.06588363647460938, 0.0689849853515625, 0.07208633422851562, 0.07518768310546875, 0.07828903198242188, 0.081390380859375, 0.08449172973632812, 0.08759307861328125, 0.09069442749023438, 0.0937957763671875, 0.09689712524414062, 0.09999847412109375, 0.10309982299804688, 0.106201171875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 9.0, 14.0, 7.0, 17.0, 16.0, 13.0, 24.0, 28.0, 35.0, 47.0, 56.0, 92.0, 101.0, 159.0, 242.0, 379.0, 685.0, 2524.0, 990008.0, 51544.0, 1009.0, 478.0, 310.0, 189.0, 131.0, 102.0, 74.0, 47.0, 43.0, 34.0, 21.0, 20.0, 17.0, 8.0, 10.0, 9.0, 11.0, 7.0, 4.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0], "bins": [-2.177734375, -2.1150360107421875, -2.052337646484375, -1.9896392822265625, -1.92694091796875, -1.8642425537109375, -1.801544189453125, -1.7388458251953125, -1.6761474609375, -1.6134490966796875, -1.550750732421875, -1.4880523681640625, -1.42535400390625, -1.3626556396484375, -1.299957275390625, -1.2372589111328125, -1.174560546875, -1.1118621826171875, -1.049163818359375, -0.9864654541015625, -0.92376708984375, -0.8610687255859375, -0.798370361328125, -0.7356719970703125, -0.6729736328125, -0.6102752685546875, -0.547576904296875, -0.4848785400390625, -0.42218017578125, -0.3594818115234375, -0.296783447265625, -0.2340850830078125, -0.17138671875, -0.1086883544921875, -0.045989990234375, 0.0167083740234375, 0.07940673828125, 0.1421051025390625, 0.204803466796875, 0.2675018310546875, 0.3302001953125, 0.3928985595703125, 0.455596923828125, 0.5182952880859375, 0.58099365234375, 0.6436920166015625, 0.706390380859375, 0.7690887451171875, 0.831787109375, 0.8944854736328125, 0.957183837890625, 1.0198822021484375, 1.08258056640625, 1.1452789306640625, 1.207977294921875, 1.2706756591796875, 1.3333740234375, 1.3960723876953125, 1.458770751953125, 1.5214691162109375, 1.58416748046875, 1.6468658447265625, 1.709564208984375, 1.7722625732421875, 1.8349609375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 47.0, 788.0, 175.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.682706356048584, -1.6507647037506104, -1.6188229322433472, -1.5868812799453735, -1.5549396276474, -1.5229978561401367, -1.491056203842163, -1.4591145515441895, -1.4271728992462158, -1.3952312469482422, -1.363289475440979, -1.3313478231430054, -1.2994061708450317, -1.2674643993377686, -1.235522747039795, -1.2035810947418213, -1.171639323234558, -1.1396976709365845, -1.1077558994293213, -1.0758142471313477, -1.043872594833374, -1.0119309425354004, -0.9799891710281372, -0.9480475187301636, -0.9161058068275452, -0.8841640949249268, -0.8522224426269531, -0.8202807307243347, -0.7883390188217163, -0.7563973665237427, -0.7244556546211243, -0.6925139427185059, -0.6605724096298218, -0.6286306977272034, -0.5966890454292297, -0.5647473335266113, -0.5328056812286377, -0.5008639693260193, -0.4689222574234009, -0.43698057532310486, -0.40503889322280884, -0.3730972111225128, -0.3411555290222168, -0.3092138171195984, -0.27727213501930237, -0.24533045291900635, -0.21338875591754913, -0.18144705891609192, -0.1495053768157959, -0.11756368726491928, -0.08562199771404266, -0.053680308163166046, -0.02173861861228943, 0.010203063488006592, 0.042144760489463806, 0.07408645749092102, 0.10602813959121704, 0.13796982169151306, 0.16991151869297028, 0.2018532156944275, 0.2337948977947235, 0.26573657989501953, 0.29767829179763794, 0.32961997389793396, 0.36156165599823]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 9.0, 10.0, 10.0, 15.0, 21.0, 31.0, 26.0, 28.0, 50.0, 48.0, 52.0, 41.0, 53.0, 59.0, 59.0, 60.0, 70.0, 63.0, 47.0, 50.0, 36.0, 40.0, 24.0, 23.0, 23.0, 20.0, 7.0, 12.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14378100633621216, -0.1384156048297882, -0.13305020332336426, -0.1276847869157791, -0.12231938540935516, -0.11695398390293121, -0.11158857494592667, -0.10622316598892212, -0.10085776448249817, -0.09549236297607422, -0.09012695401906967, -0.08476154506206512, -0.07939614355564117, -0.07403074204921722, -0.06866533309221268, -0.06329992413520813, -0.05793452262878418, -0.05256911739706993, -0.04720371216535568, -0.041838306933641434, -0.036472901701927185, -0.031107496470212936, -0.025742091238498688, -0.02037668600678444, -0.01501128077507019, -0.009645875543355942, -0.004280470311641693, 0.0010849349200725555, 0.006450340151786804, 0.011815745383501053, 0.0171811506152153, 0.02254655584692955, 0.0279119610786438, 0.03327736631035805, 0.038642771542072296, 0.044008176773786545, 0.04937358200550079, 0.05473898723721504, 0.06010439246892929, 0.06546980142593384, 0.07083520293235779, 0.07620060443878174, 0.08156601339578629, 0.08693142235279083, 0.09229682385921478, 0.09766222536563873, 0.10302763432264328, 0.10839304327964783, 0.11375844478607178, 0.11912384629249573, 0.12448925524950027, 0.12985466420650482, 0.13522006571292877, 0.14058546721935272, 0.14595088362693787, 0.15131628513336182, 0.15668168663978577, 0.16204708814620972, 0.16741248965263367, 0.1727779060602188, 0.17814330756664276, 0.1835087090730667, 0.18887412548065186, 0.1942395269870758, 0.19960492849349976]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 9.0, 4.0, 11.0, 6.0, 12.0, 17.0, 13.0, 20.0, 25.0, 18.0, 27.0, 23.0, 26.0, 46.0, 24.0, 44.0, 34.0, 38.0, 35.0, 42.0, 50.0, 40.0, 45.0, 36.0, 35.0, 28.0, 41.0, 32.0, 30.0, 28.0, 35.0, 17.0, 20.0, 19.0, 16.0, 14.0, 10.0, 9.0, 5.0, 4.0, 6.0, 6.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-6.6796875, -6.4727783203125, -6.265869140625, -6.0589599609375, -5.85205078125, -5.6451416015625, -5.438232421875, -5.2313232421875, -5.0244140625, -4.8175048828125, -4.610595703125, -4.4036865234375, -4.19677734375, -3.9898681640625, -3.782958984375, -3.5760498046875, -3.369140625, -3.1622314453125, -2.955322265625, -2.7484130859375, -2.54150390625, -2.3345947265625, -2.127685546875, -1.9207763671875, -1.7138671875, -1.5069580078125, -1.300048828125, -1.0931396484375, -0.88623046875, -0.6793212890625, -0.472412109375, -0.2655029296875, -0.05859375, 0.1483154296875, 0.355224609375, 0.5621337890625, 0.76904296875, 0.9759521484375, 1.182861328125, 1.3897705078125, 1.5966796875, 1.8035888671875, 2.010498046875, 2.2174072265625, 2.42431640625, 2.6312255859375, 2.838134765625, 3.0450439453125, 3.251953125, 3.4588623046875, 3.665771484375, 3.8726806640625, 4.07958984375, 4.2864990234375, 4.493408203125, 4.7003173828125, 4.9072265625, 5.1141357421875, 5.321044921875, 5.5279541015625, 5.73486328125, 5.9417724609375, 6.148681640625, 6.3555908203125, 6.5625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 18.0, 16.0, 17.0, 22.0, 42.0, 66.0, 96.0, 155.0, 250.0, 383.0, 605.0, 996.0, 1802.0, 3250.0, 6050.0, 11702.0, 22747.0, 44746.0, 91945.0, 195407.0, 295321.0, 191415.0, 90409.0, 44067.0, 22064.0, 11250.0, 6021.0, 3226.0, 1827.0, 1049.0, 601.0, 339.0, 224.0, 133.0, 83.0, 59.0, 56.0, 34.0, 27.0, 11.0, 8.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53125, -7.29205322265625, -7.0528564453125, -6.81365966796875, -6.574462890625, -6.33526611328125, -6.0960693359375, -5.85687255859375, -5.61767578125, -5.37847900390625, -5.1392822265625, -4.90008544921875, -4.660888671875, -4.42169189453125, -4.1824951171875, -3.94329833984375, -3.7041015625, -3.46490478515625, -3.2257080078125, -2.98651123046875, -2.747314453125, -2.50811767578125, -2.2689208984375, -2.02972412109375, -1.79052734375, -1.55133056640625, -1.3121337890625, -1.07293701171875, -0.833740234375, -0.59454345703125, -0.3553466796875, -0.11614990234375, 0.123046875, 0.36224365234375, 0.6014404296875, 0.84063720703125, 1.079833984375, 1.31903076171875, 1.5582275390625, 1.79742431640625, 2.03662109375, 2.27581787109375, 2.5150146484375, 2.75421142578125, 2.993408203125, 3.23260498046875, 3.4718017578125, 3.71099853515625, 3.9501953125, 4.18939208984375, 4.4285888671875, 4.66778564453125, 4.906982421875, 5.14617919921875, 5.3853759765625, 5.62457275390625, 5.86376953125, 6.10296630859375, 6.3421630859375, 6.58135986328125, 6.820556640625, 7.05975341796875, 7.2989501953125, 7.53814697265625, 7.77734375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 6.0, 7.0, 7.0, 6.0, 8.0, 9.0, 11.0, 18.0, 19.0, 16.0, 28.0, 29.0, 29.0, 32.0, 40.0, 49.0, 42.0, 63.0, 80.0, 157.0, 245.0, 1314.0, 233.0, 126.0, 77.0, 53.0, 45.0, 39.0, 28.0, 25.0, 27.0, 32.0, 24.0, 22.0, 10.0, 7.0, 8.0, 16.0, 10.0, 8.0, 8.0, 9.0, 7.0, 5.0, 2.0, 4.0, 3.0, 4.0, 3.0, 1.0], "bins": [-16.921875, -16.4429931640625, -15.964111328125, -15.4852294921875, -15.00634765625, -14.5274658203125, -14.048583984375, -13.5697021484375, -13.0908203125, -12.6119384765625, -12.133056640625, -11.6541748046875, -11.17529296875, -10.6964111328125, -10.217529296875, -9.7386474609375, -9.259765625, -8.7808837890625, -8.302001953125, -7.8231201171875, -7.34423828125, -6.8653564453125, -6.386474609375, -5.9075927734375, -5.4287109375, -4.9498291015625, -4.470947265625, -3.9920654296875, -3.51318359375, -3.0343017578125, -2.555419921875, -2.0765380859375, -1.59765625, -1.1187744140625, -0.639892578125, -0.1610107421875, 0.31787109375, 0.7967529296875, 1.275634765625, 1.7545166015625, 2.2333984375, 2.7122802734375, 3.191162109375, 3.6700439453125, 4.14892578125, 4.6278076171875, 5.106689453125, 5.5855712890625, 6.064453125, 6.5433349609375, 7.022216796875, 7.5010986328125, 7.97998046875, 8.4588623046875, 8.937744140625, 9.4166259765625, 9.8955078125, 10.3743896484375, 10.853271484375, 11.3321533203125, 11.81103515625, 12.2899169921875, 12.768798828125, 13.2476806640625, 13.7265625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 4.0, 5.0, 11.0, 12.0, 20.0, 21.0, 27.0, 38.0, 50.0, 65.0, 104.0, 135.0, 196.0, 232.0, 322.0, 647.0, 1682.0, 7879.0, 58258.0, 1552826.0, 1456066.0, 56167.0, 7367.0, 1635.0, 601.0, 385.0, 268.0, 173.0, 133.0, 95.0, 69.0, 35.0, 43.0, 33.0, 21.0, 18.0, 7.0, 14.0, 10.0, 6.0, 5.0, 2.0, 4.0, 3.0, 5.0, 3.0, 3.0], "bins": [-25.59375, -24.90185546875, -24.2099609375, -23.51806640625, -22.826171875, -22.13427734375, -21.4423828125, -20.75048828125, -20.05859375, -19.36669921875, -18.6748046875, -17.98291015625, -17.291015625, -16.59912109375, -15.9072265625, -15.21533203125, -14.5234375, -13.83154296875, -13.1396484375, -12.44775390625, -11.755859375, -11.06396484375, -10.3720703125, -9.68017578125, -8.98828125, -8.29638671875, -7.6044921875, -6.91259765625, -6.220703125, -5.52880859375, -4.8369140625, -4.14501953125, -3.453125, -2.76123046875, -2.0693359375, -1.37744140625, -0.685546875, 0.00634765625, 0.6982421875, 1.39013671875, 2.08203125, 2.77392578125, 3.4658203125, 4.15771484375, 4.849609375, 5.54150390625, 6.2333984375, 6.92529296875, 7.6171875, 8.30908203125, 9.0009765625, 9.69287109375, 10.384765625, 11.07666015625, 11.7685546875, 12.46044921875, 13.15234375, 13.84423828125, 14.5361328125, 15.22802734375, 15.919921875, 16.61181640625, 17.3037109375, 17.99560546875, 18.6875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 91.0, 911.0, 16.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-570.0995483398438, -556.6431884765625, -543.1868896484375, -529.7305297851562, -516.274169921875, -502.8178405761719, -489.36151123046875, -475.9051513671875, -462.44879150390625, -448.9924621582031, -435.5361022949219, -422.07977294921875, -408.6234130859375, -395.1670837402344, -381.71075439453125, -368.25439453125, -354.7980651855469, -341.34173583984375, -327.8853759765625, -314.4290466308594, -300.9726867675781, -287.516357421875, -274.05999755859375, -260.6036682128906, -247.14732360839844, -233.69097900390625, -220.23463439941406, -206.77828979492188, -193.32196044921875, -179.8656005859375, -166.40927124023438, -152.9529266357422, -139.49658203125, -126.04023742675781, -112.58389282226562, -99.12755584716797, -85.67121124267578, -72.2148666381836, -58.75852966308594, -45.30218505859375, -31.845840454101562, -18.389497756958008, -4.933155059814453, 8.523185729980469, 21.979530334472656, 35.435874938964844, 48.8922119140625, 62.34855651855469, 75.80490112304688, 89.26124572753906, 102.71759033203125, 116.1739273071289, 129.63027954101562, 143.08660888671875, 156.54295349121094, 169.99929809570312, 183.4556427001953, 196.9119873046875, 210.3683319091797, 223.82467651367188, 237.281005859375, 250.73736572265625, 264.1936950683594, 277.6500244140625, 291.10638427734375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 8.0, 5.0, 6.0, 8.0, 5.0, 10.0, 8.0, 11.0, 13.0, 18.0, 30.0, 28.0, 32.0, 25.0, 34.0, 36.0, 38.0, 44.0, 42.0, 40.0, 53.0, 33.0, 43.0, 42.0, 36.0, 38.0, 27.0, 30.0, 29.0, 23.0, 28.0, 34.0, 20.0, 28.0, 19.0, 21.0, 10.0, 10.0, 8.0, 9.0, 8.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0], "bins": [-47.68923568725586, -46.34653091430664, -45.00382614135742, -43.66112518310547, -42.31842041015625, -40.97571563720703, -39.63301086425781, -38.290306091308594, -36.947601318359375, -35.604896545410156, -34.26219177246094, -32.91948699951172, -31.576786041259766, -30.234081268310547, -28.891376495361328, -27.54867172241211, -26.205970764160156, -24.863265991210938, -23.52056312561035, -22.177858352661133, -20.835155487060547, -19.492450714111328, -18.14974594116211, -16.80704116821289, -15.464338302612305, -14.121634483337402, -12.7789306640625, -11.436225891113281, -10.093522071838379, -8.750818252563477, -7.408113479614258, -6.0654096603393555, -4.722705841064453, -3.3800017833709717, -2.0372977256774902, -0.6945934295654297, 0.6481103897094727, 1.990814208984375, 3.3335189819335938, 4.676222801208496, 6.018926620483398, 7.361630439758301, 8.704334259033203, 10.047039031982422, 11.389742851257324, 12.732446670532227, 14.075151443481445, 15.417855262756348, 16.76055908203125, 18.10326385498047, 19.445966720581055, 20.788671493530273, 22.13137435913086, 23.474079132080078, 24.816783905029297, 26.159488677978516, 27.5021915435791, 28.84489631652832, 30.187599182128906, 31.530303955078125, 32.873008728027344, 34.21571350097656, 35.55841827392578, 36.901119232177734, 38.24382400512695]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 9.0, 7.0, 12.0, 10.0, 11.0, 10.0, 19.0, 20.0, 18.0, 30.0, 33.0, 25.0, 36.0, 32.0, 51.0, 31.0, 35.0, 42.0, 48.0, 37.0, 47.0, 38.0, 45.0, 49.0, 32.0, 29.0, 26.0, 32.0, 30.0, 34.0, 24.0, 18.0, 18.0, 12.0, 7.0, 7.0, 9.0, 6.0, 7.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.63671875, -7.4149169921875, -7.193115234375, -6.9713134765625, -6.74951171875, -6.5277099609375, -6.305908203125, -6.0841064453125, -5.8623046875, -5.6405029296875, -5.418701171875, -5.1968994140625, -4.97509765625, -4.7532958984375, -4.531494140625, -4.3096923828125, -4.087890625, -3.8660888671875, -3.644287109375, -3.4224853515625, -3.20068359375, -2.9788818359375, -2.757080078125, -2.5352783203125, -2.3134765625, -2.0916748046875, -1.869873046875, -1.6480712890625, -1.42626953125, -1.2044677734375, -0.982666015625, -0.7608642578125, -0.5390625, -0.3172607421875, -0.095458984375, 0.1263427734375, 0.34814453125, 0.5699462890625, 0.791748046875, 1.0135498046875, 1.2353515625, 1.4571533203125, 1.678955078125, 1.9007568359375, 2.12255859375, 2.3443603515625, 2.566162109375, 2.7879638671875, 3.009765625, 3.2315673828125, 3.453369140625, 3.6751708984375, 3.89697265625, 4.1187744140625, 4.340576171875, 4.5623779296875, 4.7841796875, 5.0059814453125, 5.227783203125, 5.4495849609375, 5.67138671875, 5.8931884765625, 6.114990234375, 6.3367919921875, 6.55859375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 10.0, 13.0, 16.0, 26.0, 29.0, 56.0, 90.0, 137.0, 308.0, 546.0, 4177.0, 4185537.0, 2223.0, 501.0, 256.0, 143.0, 77.0, 53.0, 38.0, 18.0, 14.0, 7.0, 5.0, 8.0, 2.0, 1.0, 0.0, 1.0], "bins": [-197.875, -193.7041015625, -189.533203125, -185.3623046875, -181.19140625, -177.0205078125, -172.849609375, -168.6787109375, -164.5078125, -160.3369140625, -156.166015625, -151.9951171875, -147.82421875, -143.6533203125, -139.482421875, -135.3115234375, -131.140625, -126.9697265625, -122.798828125, -118.6279296875, -114.45703125, -110.2861328125, -106.115234375, -101.9443359375, -97.7734375, -93.6025390625, -89.431640625, -85.2607421875, -81.08984375, -76.9189453125, -72.748046875, -68.5771484375, -64.40625, -60.2353515625, -56.064453125, -51.8935546875, -47.72265625, -43.5517578125, -39.380859375, -35.2099609375, -31.0390625, -26.8681640625, -22.697265625, -18.5263671875, -14.35546875, -10.1845703125, -6.013671875, -1.8427734375, 2.328125, 6.4990234375, 10.669921875, 14.8408203125, 19.01171875, 23.1826171875, 27.353515625, 31.5244140625, 35.6953125, 39.8662109375, 44.037109375, 48.2080078125, 52.37890625, 56.5498046875, 60.720703125, 64.8916015625, 69.0625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 9.0, 10.0, 12.0, 18.0, 19.0, 24.0, 47.0, 48.0, 83.0, 117.0, 141.0, 262.0, 429.0, 548.0, 603.0, 516.0, 386.0, 196.0, 155.0, 102.0, 84.0, 62.0, 37.0, 36.0, 23.0, 20.0, 19.0, 16.0, 8.0, 11.0, 9.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3046875, -8.9884033203125, -8.672119140625, -8.3558349609375, -8.03955078125, -7.7232666015625, -7.406982421875, -7.0906982421875, -6.7744140625, -6.4581298828125, -6.141845703125, -5.8255615234375, -5.50927734375, -5.1929931640625, -4.876708984375, -4.5604248046875, -4.244140625, -3.9278564453125, -3.611572265625, -3.2952880859375, -2.97900390625, -2.6627197265625, -2.346435546875, -2.0301513671875, -1.7138671875, -1.3975830078125, -1.081298828125, -0.7650146484375, -0.44873046875, -0.1324462890625, 0.183837890625, 0.5001220703125, 0.81640625, 1.1326904296875, 1.448974609375, 1.7652587890625, 2.08154296875, 2.3978271484375, 2.714111328125, 3.0303955078125, 3.3466796875, 3.6629638671875, 3.979248046875, 4.2955322265625, 4.61181640625, 4.9281005859375, 5.244384765625, 5.5606689453125, 5.876953125, 6.1932373046875, 6.509521484375, 6.8258056640625, 7.14208984375, 7.4583740234375, 7.774658203125, 8.0909423828125, 8.4072265625, 8.7235107421875, 9.039794921875, 9.3560791015625, 9.67236328125, 9.9886474609375, 10.304931640625, 10.6212158203125, 10.9375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 12.0, 25.0, 42.0, 83.0, 216.0, 886.0, 496558.0, 3694482.0, 1638.0, 231.0, 79.0, 21.0, 8.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.25, -123.38720703125, -120.5244140625, -117.66162109375, -114.798828125, -111.93603515625, -109.0732421875, -106.21044921875, -103.34765625, -100.48486328125, -97.6220703125, -94.75927734375, -91.896484375, -89.03369140625, -86.1708984375, -83.30810546875, -80.4453125, -77.58251953125, -74.7197265625, -71.85693359375, -68.994140625, -66.13134765625, -63.2685546875, -60.40576171875, -57.54296875, -54.68017578125, -51.8173828125, -48.95458984375, -46.091796875, -43.22900390625, -40.3662109375, -37.50341796875, -34.640625, -31.77783203125, -28.9150390625, -26.05224609375, -23.189453125, -20.32666015625, -17.4638671875, -14.60107421875, -11.73828125, -8.87548828125, -6.0126953125, -3.14990234375, -0.287109375, 2.57568359375, 5.4384765625, 8.30126953125, 11.1640625, 14.02685546875, 16.8896484375, 19.75244140625, 22.615234375, 25.47802734375, 28.3408203125, 31.20361328125, 34.06640625, 36.92919921875, 39.7919921875, 42.65478515625, 45.517578125, 48.38037109375, 51.2431640625, 54.10595703125, 56.96875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 10.0, 60.0, 261.0, 367.0, 233.0, 68.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-221.9549102783203, -217.72549438476562, -213.49607849121094, -209.26666259765625, -205.0372314453125, -200.8078155517578, -196.57839965820312, -192.34898376464844, -188.11956787109375, -183.89015197753906, -179.66073608398438, -175.43130493164062, -171.20188903808594, -166.97247314453125, -162.74305725097656, -158.51364135742188, -154.28421020507812, -150.05479431152344, -145.82537841796875, -141.595947265625, -137.3665313720703, -133.13711547851562, -128.90769958496094, -124.67828369140625, -120.44886779785156, -116.21945190429688, -111.99002838134766, -107.76061248779297, -103.53119659423828, -99.30177307128906, -95.07235717773438, -90.84294128417969, -86.613525390625, -82.38410949707031, -78.1546859741211, -73.9252700805664, -69.69585418701172, -65.4664306640625, -61.23701477050781, -57.007598876953125, -52.77818298339844, -48.548763275146484, -44.3193473815918, -40.089927673339844, -35.860511779785156, -31.631092071533203, -27.40167236328125, -23.17225456237793, -18.94283676147461, -14.713418960571289, -10.484000205993652, -6.254581451416016, -2.0251636505126953, 2.204254150390625, 6.433673858642578, 10.663091659545898, 14.892509460449219, 19.12192726135254, 23.35134506225586, 27.580764770507812, 31.810182571411133, 36.03960037231445, 40.269020080566406, 44.498435974121094, 48.72785568237305]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 4.0, 5.0, 10.0, 12.0, 10.0, 10.0, 16.0, 11.0, 27.0, 23.0, 34.0, 34.0, 18.0, 35.0, 32.0, 23.0, 31.0, 38.0, 43.0, 41.0, 44.0, 43.0, 36.0, 44.0, 35.0, 34.0, 37.0, 32.0, 29.0, 32.0, 31.0, 29.0, 23.0, 14.0, 15.0, 8.0, 8.0, 10.0, 11.0, 9.0, 3.0, 1.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-32.18357467651367, -31.2036190032959, -30.223663330078125, -29.24370765686035, -28.263751983642578, -27.283794403076172, -26.3038387298584, -25.323883056640625, -24.34392738342285, -23.363971710205078, -22.384016036987305, -21.40406036376953, -20.424102783203125, -19.444149017333984, -18.464191436767578, -17.484235763549805, -16.50428009033203, -15.524324417114258, -14.544368743896484, -13.564412117004395, -12.584456443786621, -11.604500770568848, -10.624544143676758, -9.644588470458984, -8.664632797241211, -7.6846771240234375, -6.704720973968506, -5.724764823913574, -4.744809150695801, -3.7648534774780273, -2.7848973274230957, -1.804941177368164, -0.8249874114990234, 0.1549685001373291, 1.1349244117736816, 2.114880323410034, 3.0948362350463867, 4.07479190826416, 5.054748058319092, 6.034704208374023, 7.014659881591797, 7.99461555480957, 8.974571228027344, 9.954527854919434, 10.934483528137207, 11.91443920135498, 12.89439582824707, 13.874351501464844, 14.854307174682617, 15.83426284790039, 16.814218521118164, 17.794174194335938, 18.774131774902344, 19.754085540771484, 20.73404312133789, 21.713998794555664, 22.693954467773438, 23.67391014099121, 24.653865814208984, 25.633821487426758, 26.61377716064453, 27.593734741210938, 28.57369041442871, 29.553646087646484, 30.533601760864258]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 4.0, 8.0, 7.0, 17.0, 13.0, 15.0, 26.0, 31.0, 25.0, 42.0, 29.0, 46.0, 45.0, 41.0, 53.0, 53.0, 55.0, 45.0, 53.0, 55.0, 48.0, 44.0, 44.0, 35.0, 37.0, 26.0, 23.0, 17.0, 15.0, 17.0, 11.0, 8.0, 4.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.8155517578125, -7.568603515625, -7.3216552734375, -7.07470703125, -6.8277587890625, -6.580810546875, -6.3338623046875, -6.0869140625, -5.8399658203125, -5.593017578125, -5.3460693359375, -5.09912109375, -4.8521728515625, -4.605224609375, -4.3582763671875, -4.111328125, -3.8643798828125, -3.617431640625, -3.3704833984375, -3.12353515625, -2.8765869140625, -2.629638671875, -2.3826904296875, -2.1357421875, -1.8887939453125, -1.641845703125, -1.3948974609375, -1.14794921875, -0.9010009765625, -0.654052734375, -0.4071044921875, -0.16015625, 0.0867919921875, 0.333740234375, 0.5806884765625, 0.82763671875, 1.0745849609375, 1.321533203125, 1.5684814453125, 1.8154296875, 2.0623779296875, 2.309326171875, 2.5562744140625, 2.80322265625, 3.0501708984375, 3.297119140625, 3.5440673828125, 3.791015625, 4.0379638671875, 4.284912109375, 4.5318603515625, 4.77880859375, 5.0257568359375, 5.272705078125, 5.5196533203125, 5.7666015625, 6.0135498046875, 6.260498046875, 6.5074462890625, 6.75439453125, 7.0013427734375, 7.248291015625, 7.4952392578125, 7.7421875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 11.0, 9.0, 27.0, 28.0, 42.0, 64.0, 126.0, 202.0, 374.0, 659.0, 1061.0, 1942.0, 3393.0, 6354.0, 11566.0, 21118.0, 38791.0, 68829.0, 116123.0, 174424.0, 202551.0, 161965.0, 103742.0, 60032.0, 33777.0, 18486.0, 10249.0, 5615.0, 3094.0, 1659.0, 977.0, 504.0, 316.0, 176.0, 95.0, 55.0, 39.0, 30.0, 22.0, 9.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.53515625, -1.4929656982421875, -1.450775146484375, -1.4085845947265625, -1.36639404296875, -1.3242034912109375, -1.282012939453125, -1.2398223876953125, -1.1976318359375, -1.1554412841796875, -1.113250732421875, -1.0710601806640625, -1.02886962890625, -0.9866790771484375, -0.944488525390625, -0.9022979736328125, -0.860107421875, -0.8179168701171875, -0.775726318359375, -0.7335357666015625, -0.69134521484375, -0.6491546630859375, -0.606964111328125, -0.5647735595703125, -0.5225830078125, -0.4803924560546875, -0.438201904296875, -0.3960113525390625, -0.35382080078125, -0.3116302490234375, -0.269439697265625, -0.2272491455078125, -0.18505859375, -0.1428680419921875, -0.100677490234375, -0.0584869384765625, -0.01629638671875, 0.0258941650390625, 0.068084716796875, 0.1102752685546875, 0.1524658203125, 0.1946563720703125, 0.236846923828125, 0.2790374755859375, 0.32122802734375, 0.3634185791015625, 0.405609130859375, 0.4477996826171875, 0.489990234375, 0.5321807861328125, 0.574371337890625, 0.6165618896484375, 0.65875244140625, 0.7009429931640625, 0.743133544921875, 0.7853240966796875, 0.8275146484375, 0.8697052001953125, 0.911895751953125, 0.9540863037109375, 0.99627685546875, 1.0384674072265625, 1.080657958984375, 1.1228485107421875, 1.1650390625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 8.0, 7.0, 4.0, 7.0, 12.0, 10.0, 12.0, 11.0, 10.0, 19.0, 23.0, 25.0, 23.0, 24.0, 33.0, 27.0, 33.0, 44.0, 30.0, 39.0, 49.0, 36.0, 1060.0, 36.0, 26.0, 35.0, 38.0, 26.0, 42.0, 31.0, 29.0, 20.0, 30.0, 22.0, 21.0, 15.0, 19.0, 10.0, 20.0, 5.0, 7.0, 10.0, 7.0, 4.0, 6.0, 5.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.21484375, -4.07281494140625, -3.9307861328125, -3.78875732421875, -3.646728515625, -3.50469970703125, -3.3626708984375, -3.22064208984375, -3.07861328125, -2.93658447265625, -2.7945556640625, -2.65252685546875, -2.510498046875, -2.36846923828125, -2.2264404296875, -2.08441162109375, -1.9423828125, -1.80035400390625, -1.6583251953125, -1.51629638671875, -1.374267578125, -1.23223876953125, -1.0902099609375, -0.94818115234375, -0.80615234375, -0.66412353515625, -0.5220947265625, -0.38006591796875, -0.238037109375, -0.09600830078125, 0.0460205078125, 0.18804931640625, 0.330078125, 0.47210693359375, 0.6141357421875, 0.75616455078125, 0.898193359375, 1.04022216796875, 1.1822509765625, 1.32427978515625, 1.46630859375, 1.60833740234375, 1.7503662109375, 1.89239501953125, 2.034423828125, 2.17645263671875, 2.3184814453125, 2.46051025390625, 2.6025390625, 2.74456787109375, 2.8865966796875, 3.02862548828125, 3.170654296875, 3.31268310546875, 3.4547119140625, 3.59674072265625, 3.73876953125, 3.88079833984375, 4.0228271484375, 4.16485595703125, 4.306884765625, 4.44891357421875, 4.5909423828125, 4.73297119140625, 4.875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 9.0, 11.0, 22.0, 29.0, 31.0, 54.0, 63.0, 78.0, 107.0, 170.0, 226.0, 344.0, 478.0, 702.0, 943.0, 1373.0, 1920.0, 2899.0, 4155.0, 6040.0, 8959.0, 13918.0, 23274.0, 64526.0, 1578499.0, 294204.0, 39040.0, 18630.0, 11643.0, 7666.0, 5166.0, 3671.0, 2413.0, 1674.0, 1194.0, 856.0, 630.0, 467.0, 310.0, 204.0, 163.0, 110.0, 79.0, 75.0, 32.0, 23.0, 15.0, 16.0, 7.0, 5.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0], "bins": [-1.7421875, -1.6874237060546875, -1.632659912109375, -1.5778961181640625, -1.52313232421875, -1.4683685302734375, -1.413604736328125, -1.3588409423828125, -1.3040771484375, -1.2493133544921875, -1.194549560546875, -1.1397857666015625, -1.08502197265625, -1.0302581787109375, -0.975494384765625, -0.9207305908203125, -0.865966796875, -0.8112030029296875, -0.756439208984375, -0.7016754150390625, -0.64691162109375, -0.5921478271484375, -0.537384033203125, -0.4826202392578125, -0.4278564453125, -0.3730926513671875, -0.318328857421875, -0.2635650634765625, -0.20880126953125, -0.1540374755859375, -0.099273681640625, -0.0445098876953125, 0.01025390625, 0.0650177001953125, 0.119781494140625, 0.1745452880859375, 0.22930908203125, 0.2840728759765625, 0.338836669921875, 0.3936004638671875, 0.4483642578125, 0.5031280517578125, 0.557891845703125, 0.6126556396484375, 0.66741943359375, 0.7221832275390625, 0.776947021484375, 0.8317108154296875, 0.886474609375, 0.9412384033203125, 0.996002197265625, 1.0507659912109375, 1.10552978515625, 1.1602935791015625, 1.215057373046875, 1.2698211669921875, 1.3245849609375, 1.3793487548828125, 1.434112548828125, 1.4888763427734375, 1.54364013671875, 1.5984039306640625, 1.653167724609375, 1.7079315185546875, 1.7626953125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 6.0, 3.0, 6.0, 3.0, 6.0, 14.0, 17.0, 18.0, 18.0, 15.0, 25.0, 23.0, 38.0, 50.0, 50.0, 52.0, 65.0, 58.0, 66.0, 55.0, 53.0, 55.0, 49.0, 58.0, 44.0, 32.0, 22.0, 22.0, 22.0, 13.0, 17.0, 13.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1358642578125, -0.1310901641845703, -0.12631607055664062, -0.12154197692871094, -0.11676788330078125, -0.11199378967285156, -0.10721969604492188, -0.10244560241699219, -0.0976715087890625, -0.09289741516113281, -0.08812332153320312, -0.08334922790527344, -0.07857513427734375, -0.07380104064941406, -0.06902694702148438, -0.06425285339355469, -0.059478759765625, -0.05470466613769531, -0.049930572509765625, -0.04515647888183594, -0.04038238525390625, -0.03560829162597656, -0.030834197998046875, -0.026060104370117188, -0.0212860107421875, -0.016511917114257812, -0.011737823486328125, -0.0069637298583984375, -0.00218963623046875, 0.0025844573974609375, 0.007358551025390625, 0.012132644653320312, 0.01690673828125, 0.021680831909179688, 0.026454925537109375, 0.031229019165039062, 0.03600311279296875, 0.04077720642089844, 0.045551300048828125, 0.05032539367675781, 0.0550994873046875, 0.05987358093261719, 0.06464767456054688, 0.06942176818847656, 0.07419586181640625, 0.07896995544433594, 0.08374404907226562, 0.08851814270019531, 0.093292236328125, 0.09806632995605469, 0.10284042358398438, 0.10761451721191406, 0.11238861083984375, 0.11716270446777344, 0.12193679809570312, 0.1267108917236328, 0.1314849853515625, 0.1362590789794922, 0.14103317260742188, 0.14580726623535156, 0.15058135986328125, 0.15535545349121094, 0.16012954711914062, 0.1649036407470703, 0.169677734375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 10.0, 11.0, 19.0, 15.0, 20.0, 33.0, 34.0, 55.0, 74.0, 119.0, 153.0, 271.0, 490.0, 1026.0, 24828.0, 1017988.0, 1779.0, 642.0, 339.0, 192.0, 135.0, 91.0, 53.0, 37.0, 29.0, 22.0, 28.0, 18.0, 9.0, 8.0, 5.0, 7.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.388671875, -3.292510986328125, -3.19635009765625, -3.100189208984375, -3.0040283203125, -2.907867431640625, -2.81170654296875, -2.715545654296875, -2.619384765625, -2.523223876953125, -2.42706298828125, -2.330902099609375, -2.2347412109375, -2.138580322265625, -2.04241943359375, -1.946258544921875, -1.85009765625, -1.753936767578125, -1.65777587890625, -1.561614990234375, -1.4654541015625, -1.369293212890625, -1.27313232421875, -1.176971435546875, -1.080810546875, -0.984649658203125, -0.88848876953125, -0.792327880859375, -0.6961669921875, -0.600006103515625, -0.50384521484375, -0.407684326171875, -0.3115234375, -0.215362548828125, -0.11920166015625, -0.023040771484375, 0.0731201171875, 0.169281005859375, 0.26544189453125, 0.361602783203125, 0.457763671875, 0.553924560546875, 0.65008544921875, 0.746246337890625, 0.8424072265625, 0.938568115234375, 1.03472900390625, 1.130889892578125, 1.22705078125, 1.323211669921875, 1.41937255859375, 1.515533447265625, 1.6116943359375, 1.707855224609375, 1.80401611328125, 1.900177001953125, 1.996337890625, 2.092498779296875, 2.18865966796875, 2.284820556640625, 2.3809814453125, 2.477142333984375, 2.57330322265625, 2.669464111328125, 2.765625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 16.0, 630.0, 359.0, 8.0, 2.0], "bins": [-2.2640185356140137, -2.226835012435913, -2.1896514892578125, -2.152468204498291, -2.1152846813201904, -2.07810115814209, -2.0409176349639893, -2.0037343502044678, -1.9665508270263672, -1.9293673038482666, -1.8921838998794556, -1.855000376701355, -1.817816972732544, -1.7806334495544434, -1.7434500455856323, -1.7062665224075317, -1.6690831184387207, -1.6318995952606201, -1.594716191291809, -1.5575326681137085, -1.5203492641448975, -1.4831657409667969, -1.4459823369979858, -1.4087988138198853, -1.3716152906417847, -1.334431767463684, -1.297248363494873, -1.2600648403167725, -1.2228814363479614, -1.1856979131698608, -1.1485145092010498, -1.1113309860229492, -1.0741475820541382, -1.0369640588760376, -0.9997806549072266, -0.9625971913337708, -0.9254137277603149, -0.8882302641868591, -0.8510468006134033, -0.8138632774353027, -0.7766798734664917, -0.7394964098930359, -0.7023129463195801, -0.6651294827461243, -0.6279460191726685, -0.5907625555992126, -0.5535790920257568, -0.5163955688476562, -0.4792121350765228, -0.442028671503067, -0.4048452079296112, -0.367661714553833, -0.3304782509803772, -0.2932947874069214, -0.2561113238334656, -0.21892786026000977, -0.18174439668655396, -0.14456093311309814, -0.10737746208906174, -0.07019399106502533, -0.03301052749156952, 0.0041729360818862915, 0.041356414556503296, 0.0785398781299591, 0.11572334170341492]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 8.0, 13.0, 13.0, 18.0, 12.0, 18.0, 19.0, 28.0, 25.0, 31.0, 23.0, 23.0, 42.0, 39.0, 31.0, 45.0, 35.0, 44.0, 44.0, 52.0, 50.0, 31.0, 31.0, 34.0, 40.0, 29.0, 33.0, 21.0, 27.0, 24.0, 21.0, 16.0, 14.0, 14.0, 6.0, 4.0, 12.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1762499213218689, -0.17074425518512726, -0.16523858904838562, -0.15973293781280518, -0.15422727167606354, -0.1487216055393219, -0.14321595430374146, -0.13771028816699982, -0.13220462203025818, -0.12669895589351654, -0.1211932972073555, -0.11568763852119446, -0.11018197238445282, -0.10467630624771118, -0.09917064756155014, -0.0936649888753891, -0.08815932273864746, -0.08265365660190582, -0.07714799791574478, -0.07164233922958374, -0.0661366730928421, -0.06063101068139076, -0.05512534826993942, -0.04961968585848808, -0.04411402344703674, -0.0386083610355854, -0.033102698624134064, -0.027597036212682724, -0.022091373801231384, -0.016585711389780045, -0.011080048978328705, -0.005574386566877365, -6.872415542602539e-05, 0.005436938256025314, 0.010942600667476654, 0.016448263078927994, 0.021953925490379333, 0.027459587901830673, 0.03296525031328201, 0.03847091272473335, 0.04397657513618469, 0.04948223754763603, 0.05498789995908737, 0.06049356237053871, 0.06599922478199005, 0.07150489091873169, 0.07701054960489273, 0.08251620829105377, 0.08802187442779541, 0.09352754056453705, 0.09903319925069809, 0.10453885793685913, 0.11004452407360077, 0.11555019021034241, 0.12105584889650345, 0.1265615075826645, 0.13206717371940613, 0.13757283985614777, 0.1430785059928894, 0.14858415722846985, 0.1540898233652115, 0.15959548950195312, 0.16510114073753357, 0.1706068068742752, 0.17611247301101685]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 4.0, 8.0, 7.0, 11.0, 9.0, 17.0, 26.0, 27.0, 29.0, 36.0, 26.0, 36.0, 33.0, 36.0, 52.0, 42.0, 37.0, 42.0, 54.0, 40.0, 46.0, 43.0, 37.0, 35.0, 38.0, 39.0, 27.0, 36.0, 26.0, 15.0, 21.0, 20.0, 5.0, 9.0, 8.0, 4.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.68359375, -7.46966552734375, -7.2557373046875, -7.04180908203125, -6.827880859375, -6.61395263671875, -6.4000244140625, -6.18609619140625, -5.97216796875, -5.75823974609375, -5.5443115234375, -5.33038330078125, -5.116455078125, -4.90252685546875, -4.6885986328125, -4.47467041015625, -4.2607421875, -4.04681396484375, -3.8328857421875, -3.61895751953125, -3.405029296875, -3.19110107421875, -2.9771728515625, -2.76324462890625, -2.54931640625, -2.33538818359375, -2.1214599609375, -1.90753173828125, -1.693603515625, -1.47967529296875, -1.2657470703125, -1.05181884765625, -0.837890625, -0.62396240234375, -0.4100341796875, -0.19610595703125, 0.017822265625, 0.23175048828125, 0.4456787109375, 0.65960693359375, 0.87353515625, 1.08746337890625, 1.3013916015625, 1.51531982421875, 1.729248046875, 1.94317626953125, 2.1571044921875, 2.37103271484375, 2.5849609375, 2.79888916015625, 3.0128173828125, 3.22674560546875, 3.440673828125, 3.65460205078125, 3.8685302734375, 4.08245849609375, 4.29638671875, 4.51031494140625, 4.7242431640625, 4.93817138671875, 5.152099609375, 5.36602783203125, 5.5799560546875, 5.79388427734375, 6.0078125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 2.0, 5.0, 6.0, 15.0, 17.0, 23.0, 33.0, 43.0, 56.0, 108.0, 156.0, 236.0, 430.0, 749.0, 1281.0, 2692.0, 5461.0, 12160.0, 27558.0, 62841.0, 149292.0, 334467.0, 261377.0, 106010.0, 45782.0, 20041.0, 8986.0, 4106.0, 2004.0, 1044.0, 601.0, 332.0, 200.0, 151.0, 105.0, 54.0, 46.0, 34.0, 18.0, 10.0, 12.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8125, -7.5504150390625, -7.288330078125, -7.0262451171875, -6.76416015625, -6.5020751953125, -6.239990234375, -5.9779052734375, -5.7158203125, -5.4537353515625, -5.191650390625, -4.9295654296875, -4.66748046875, -4.4053955078125, -4.143310546875, -3.8812255859375, -3.619140625, -3.3570556640625, -3.094970703125, -2.8328857421875, -2.57080078125, -2.3087158203125, -2.046630859375, -1.7845458984375, -1.5224609375, -1.2603759765625, -0.998291015625, -0.7362060546875, -0.47412109375, -0.2120361328125, 0.050048828125, 0.3121337890625, 0.57421875, 0.8363037109375, 1.098388671875, 1.3604736328125, 1.62255859375, 1.8846435546875, 2.146728515625, 2.4088134765625, 2.6708984375, 2.9329833984375, 3.195068359375, 3.4571533203125, 3.71923828125, 3.9813232421875, 4.243408203125, 4.5054931640625, 4.767578125, 5.0296630859375, 5.291748046875, 5.5538330078125, 5.81591796875, 6.0780029296875, 6.340087890625, 6.6021728515625, 6.8642578125, 7.1263427734375, 7.388427734375, 7.6505126953125, 7.91259765625, 8.1746826171875, 8.436767578125, 8.6988525390625, 8.9609375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 4.0, 8.0, 12.0, 13.0, 15.0, 21.0, 17.0, 29.0, 32.0, 53.0, 58.0, 72.0, 100.0, 167.0, 341.0, 1436.0, 195.0, 104.0, 71.0, 52.0, 50.0, 44.0, 34.0, 30.0, 23.0, 11.0, 15.0, 10.0, 9.0, 8.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-24.359375, -23.703857421875, -23.04833984375, -22.392822265625, -21.7373046875, -21.081787109375, -20.42626953125, -19.770751953125, -19.115234375, -18.459716796875, -17.80419921875, -17.148681640625, -16.4931640625, -15.837646484375, -15.18212890625, -14.526611328125, -13.87109375, -13.215576171875, -12.56005859375, -11.904541015625, -11.2490234375, -10.593505859375, -9.93798828125, -9.282470703125, -8.626953125, -7.971435546875, -7.31591796875, -6.660400390625, -6.0048828125, -5.349365234375, -4.69384765625, -4.038330078125, -3.3828125, -2.727294921875, -2.07177734375, -1.416259765625, -0.7607421875, -0.105224609375, 0.55029296875, 1.205810546875, 1.861328125, 2.516845703125, 3.17236328125, 3.827880859375, 4.4833984375, 5.138916015625, 5.79443359375, 6.449951171875, 7.10546875, 7.760986328125, 8.41650390625, 9.072021484375, 9.7275390625, 10.383056640625, 11.03857421875, 11.694091796875, 12.349609375, 13.005126953125, 13.66064453125, 14.316162109375, 14.9716796875, 15.627197265625, 16.28271484375, 16.938232421875, 17.59375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 8.0, 14.0, 12.0, 11.0, 20.0, 29.0, 40.0, 58.0, 68.0, 124.0, 189.0, 274.0, 430.0, 743.0, 1556.0, 23440.0, 3101183.0, 14123.0, 1480.0, 677.0, 392.0, 240.0, 173.0, 114.0, 75.0, 54.0, 44.0, 22.0, 24.0, 23.0, 11.0, 12.0, 14.0, 8.0, 8.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-64.4375, -62.71728515625, -60.9970703125, -59.27685546875, -57.556640625, -55.83642578125, -54.1162109375, -52.39599609375, -50.67578125, -48.95556640625, -47.2353515625, -45.51513671875, -43.794921875, -42.07470703125, -40.3544921875, -38.63427734375, -36.9140625, -35.19384765625, -33.4736328125, -31.75341796875, -30.033203125, -28.31298828125, -26.5927734375, -24.87255859375, -23.15234375, -21.43212890625, -19.7119140625, -17.99169921875, -16.271484375, -14.55126953125, -12.8310546875, -11.11083984375, -9.390625, -7.67041015625, -5.9501953125, -4.22998046875, -2.509765625, -0.78955078125, 0.9306640625, 2.65087890625, 4.37109375, 6.09130859375, 7.8115234375, 9.53173828125, 11.251953125, 12.97216796875, 14.6923828125, 16.41259765625, 18.1328125, 19.85302734375, 21.5732421875, 23.29345703125, 25.013671875, 26.73388671875, 28.4541015625, 30.17431640625, 31.89453125, 33.61474609375, 35.3349609375, 37.05517578125, 38.775390625, 40.49560546875, 42.2158203125, 43.93603515625, 45.65625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 821.0, 185.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-691.927001953125, -678.8102416992188, -665.6934814453125, -652.5767822265625, -639.4600219726562, -626.34326171875, -613.2265014648438, -600.1097412109375, -586.9929809570312, -573.876220703125, -560.7594604492188, -547.6427001953125, -534.5260009765625, -521.4092407226562, -508.29248046875, -495.17572021484375, -482.0589904785156, -468.9422302246094, -455.82550048828125, -442.708740234375, -429.59197998046875, -416.4752197265625, -403.3584899902344, -390.2417297363281, -377.125, -364.00823974609375, -350.8915100097656, -337.7747497558594, -324.6579895019531, -311.541259765625, -298.42449951171875, -285.3077392578125, -272.19097900390625, -259.07421875, -245.9574737548828, -232.84072875976562, -219.72396850585938, -206.6072235107422, -193.490478515625, -180.37371826171875, -167.25697326660156, -154.14022827148438, -141.02346801757812, -127.90672302246094, -114.78997039794922, -101.6732177734375, -88.55647277832031, -75.4397201538086, -62.322967529296875, -49.206214904785156, -36.0894660949707, -22.97271728515625, -9.855964660644531, 3.2607879638671875, 16.377532958984375, 29.494285583496094, 42.61103820800781, 55.72779083251953, 68.84454345703125, 81.96128845214844, 95.07804107666016, 108.19479370117188, 121.31153869628906, 134.42828369140625, 147.5450439453125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 9.0, 12.0, 10.0, 12.0, 17.0, 23.0, 13.0, 18.0, 21.0, 44.0, 35.0, 32.0, 32.0, 41.0, 33.0, 46.0, 55.0, 42.0, 47.0, 52.0, 48.0, 34.0, 40.0, 38.0, 30.0, 23.0, 25.0, 26.0, 19.0, 26.0, 15.0, 19.0, 16.0, 10.0, 11.0, 7.0, 7.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-56.578216552734375, -55.04109573364258, -53.50397491455078, -51.96685791015625, -50.42973709106445, -48.892616271972656, -47.355499267578125, -45.81837844848633, -44.28125762939453, -42.744136810302734, -41.20701599121094, -39.669898986816406, -38.13277816772461, -36.59565734863281, -35.05854034423828, -33.521419525146484, -31.984298706054688, -30.44717788696289, -28.910058975219727, -27.372940063476562, -25.835819244384766, -24.29869842529297, -22.761579513549805, -21.22446060180664, -19.687339782714844, -18.150218963623047, -16.613100051879883, -15.075980186462402, -13.538860321044922, -12.001740455627441, -10.464620590209961, -8.92750072479248, -7.390377044677734, -5.853257179260254, -4.316137313842773, -2.779017448425293, -1.2418975830078125, 0.29522228240966797, 1.8323421478271484, 3.369462013244629, 4.906581878662109, 6.44370174407959, 7.98082160949707, 9.51794147491455, 11.055061340332031, 12.592181205749512, 14.129301071166992, 15.666420936584473, 17.203540802001953, 18.74066162109375, 20.277780532836914, 21.814899444580078, 23.352020263671875, 24.889141082763672, 26.426259994506836, 27.96337890625, 29.500499725341797, 31.037620544433594, 32.574737548828125, 34.11185836791992, 35.64897918701172, 37.186100006103516, 38.72322082519531, 40.260337829589844, 41.79745864868164]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 5.0, 5.0, 8.0, 9.0, 11.0, 11.0, 12.0, 16.0, 13.0, 19.0, 24.0, 31.0, 50.0, 31.0, 41.0, 34.0, 39.0, 29.0, 40.0, 47.0, 40.0, 49.0, 45.0, 47.0, 42.0, 33.0, 36.0, 28.0, 18.0, 32.0, 24.0, 24.0, 16.0, 18.0, 10.0, 9.0, 9.0, 4.0, 7.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.35546875, -6.15582275390625, -5.9561767578125, -5.75653076171875, -5.556884765625, -5.35723876953125, -5.1575927734375, -4.95794677734375, -4.75830078125, -4.55865478515625, -4.3590087890625, -4.15936279296875, -3.959716796875, -3.76007080078125, -3.5604248046875, -3.36077880859375, -3.1611328125, -2.96148681640625, -2.7618408203125, -2.56219482421875, -2.362548828125, -2.16290283203125, -1.9632568359375, -1.76361083984375, -1.56396484375, -1.36431884765625, -1.1646728515625, -0.96502685546875, -0.765380859375, -0.56573486328125, -0.3660888671875, -0.16644287109375, 0.033203125, 0.23284912109375, 0.4324951171875, 0.63214111328125, 0.831787109375, 1.03143310546875, 1.2310791015625, 1.43072509765625, 1.63037109375, 1.83001708984375, 2.0296630859375, 2.22930908203125, 2.428955078125, 2.62860107421875, 2.8282470703125, 3.02789306640625, 3.2275390625, 3.42718505859375, 3.6268310546875, 3.82647705078125, 4.026123046875, 4.22576904296875, 4.4254150390625, 4.62506103515625, 4.82470703125, 5.02435302734375, 5.2239990234375, 5.42364501953125, 5.623291015625, 5.82293701171875, 6.0225830078125, 6.22222900390625, 6.421875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 0.0, 3.0, 5.0, 4.0, 12.0, 14.0, 19.0, 33.0, 47.0, 52.0, 94.0, 119.0, 175.0, 273.0, 425.0, 691.0, 1260.0, 2512.0, 5919.0, 19497.0, 104903.0, 730645.0, 2332147.0, 836621.0, 124575.0, 21860.0, 6381.0, 2671.0, 1315.0, 715.0, 426.0, 269.0, 193.0, 143.0, 83.0, 63.0, 37.0, 34.0, 16.0, 15.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-14.6484375, -14.2779541015625, -13.907470703125, -13.5369873046875, -13.16650390625, -12.7960205078125, -12.425537109375, -12.0550537109375, -11.6845703125, -11.3140869140625, -10.943603515625, -10.5731201171875, -10.20263671875, -9.8321533203125, -9.461669921875, -9.0911865234375, -8.720703125, -8.3502197265625, -7.979736328125, -7.6092529296875, -7.23876953125, -6.8682861328125, -6.497802734375, -6.1273193359375, -5.7568359375, -5.3863525390625, -5.015869140625, -4.6453857421875, -4.27490234375, -3.9044189453125, -3.533935546875, -3.1634521484375, -2.79296875, -2.4224853515625, -2.052001953125, -1.6815185546875, -1.31103515625, -0.9405517578125, -0.570068359375, -0.1995849609375, 0.1708984375, 0.5413818359375, 0.911865234375, 1.2823486328125, 1.65283203125, 2.0233154296875, 2.393798828125, 2.7642822265625, 3.134765625, 3.5052490234375, 3.875732421875, 4.2462158203125, 4.61669921875, 4.9871826171875, 5.357666015625, 5.7281494140625, 6.0986328125, 6.4691162109375, 6.839599609375, 7.2100830078125, 7.58056640625, 7.9510498046875, 8.321533203125, 8.6920166015625, 9.0625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 8.0, 13.0, 20.0, 38.0, 47.0, 80.0, 125.0, 198.0, 331.0, 640.0, 891.0, 655.0, 394.0, 235.0, 151.0, 89.0, 54.0, 36.0, 35.0, 14.0, 9.0, 9.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.859375, -23.2850341796875, -22.710693359375, -22.1363525390625, -21.56201171875, -20.9876708984375, -20.413330078125, -19.8389892578125, -19.2646484375, -18.6903076171875, -18.115966796875, -17.5416259765625, -16.96728515625, -16.3929443359375, -15.818603515625, -15.2442626953125, -14.669921875, -14.0955810546875, -13.521240234375, -12.9468994140625, -12.37255859375, -11.7982177734375, -11.223876953125, -10.6495361328125, -10.0751953125, -9.5008544921875, -8.926513671875, -8.3521728515625, -7.77783203125, -7.2034912109375, -6.629150390625, -6.0548095703125, -5.48046875, -4.9061279296875, -4.331787109375, -3.7574462890625, -3.18310546875, -2.6087646484375, -2.034423828125, -1.4600830078125, -0.8857421875, -0.3114013671875, 0.262939453125, 0.8372802734375, 1.41162109375, 1.9859619140625, 2.560302734375, 3.1346435546875, 3.708984375, 4.2833251953125, 4.857666015625, 5.4320068359375, 6.00634765625, 6.5806884765625, 7.155029296875, 7.7293701171875, 8.3037109375, 8.8780517578125, 9.452392578125, 10.0267333984375, 10.60107421875, 11.1754150390625, 11.749755859375, 12.3240966796875, 12.8984375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 8.0, 19.0, 59.0, 126.0, 676.0, 3821.0, 1654251.0, 2530281.0, 4233.0, 579.0, 133.0, 53.0, 12.0, 7.0, 8.0, 2.0, 4.0, 6.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.0, -49.921875, -47.84375, -45.765625, -43.6875, -41.609375, -39.53125, -37.453125, -35.375, -33.296875, -31.21875, -29.140625, -27.0625, -24.984375, -22.90625, -20.828125, -18.75, -16.671875, -14.59375, -12.515625, -10.4375, -8.359375, -6.28125, -4.203125, -2.125, -0.046875, 2.03125, 4.109375, 6.1875, 8.265625, 10.34375, 12.421875, 14.5, 16.578125, 18.65625, 20.734375, 22.8125, 24.890625, 26.96875, 29.046875, 31.125, 33.203125, 35.28125, 37.359375, 39.4375, 41.515625, 43.59375, 45.671875, 47.75, 49.828125, 51.90625, 53.984375, 56.0625, 58.140625, 60.21875, 62.296875, 64.375, 66.453125, 68.53125, 70.609375, 72.6875, 74.765625, 76.84375, 78.921875, 81.0]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 81.0, 697.0, 228.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-496.9566650390625, -486.74383544921875, -476.531005859375, -466.3182067871094, -456.1053771972656, -445.8925476074219, -435.6797180175781, -425.4669189453125, -415.25408935546875, -405.041259765625, -394.82843017578125, -384.6156311035156, -374.4028015136719, -364.1899719238281, -353.9771423339844, -343.76434326171875, -333.551513671875, -323.33868408203125, -313.1258544921875, -302.9130554199219, -292.7002258300781, -282.4873962402344, -272.2745666503906, -262.061767578125, -251.84890747070312, -241.63607788085938, -231.4232635498047, -221.21043395996094, -210.99761962890625, -200.7847900390625, -190.57196044921875, -180.35914611816406, -170.14634704589844, -159.9335174560547, -149.720703125, -139.50787353515625, -129.29505920410156, -119.08222961425781, -108.8694076538086, -98.65658569335938, -88.44376373291016, -78.23094177246094, -68.01811981201172, -57.805294036865234, -47.592472076416016, -37.3796501159668, -27.166824340820312, -16.954002380371094, -6.741180419921875, 3.47164249420166, 13.684465408325195, 23.897289276123047, 34.110111236572266, 44.322933197021484, 54.53575897216797, 64.74858093261719, 74.9614028930664, 85.17422485351562, 95.38704681396484, 105.59986877441406, 115.81269836425781, 126.0255126953125, 136.23834228515625, 146.451171875, 156.6639862060547]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 17.0, 14.0, 25.0, 36.0, 51.0, 66.0, 69.0, 75.0, 90.0, 98.0, 85.0, 79.0, 77.0, 64.0, 54.0, 38.0, 30.0, 14.0, 15.0, 6.0, 5.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.463279724121094, -58.66629409790039, -55.86930847167969, -53.072322845458984, -50.27533721923828, -47.47835159301758, -44.681365966796875, -41.88438034057617, -39.08739471435547, -36.290409088134766, -33.49342346191406, -30.69643783569336, -27.899452209472656, -25.102466583251953, -22.30548095703125, -19.508495330810547, -16.711509704589844, -13.91452407836914, -11.117538452148438, -8.320552825927734, -5.523567199707031, -2.726581573486328, 0.070404052734375, 2.867389678955078, 5.664375305175781, 8.461360931396484, 11.258346557617188, 14.05533218383789, 16.852317810058594, 19.649303436279297, 22.4462890625, 25.243274688720703, 28.040260314941406, 30.83724594116211, 33.63423156738281, 36.431217193603516, 39.22820281982422, 42.02518844604492, 44.822174072265625, 47.61915969848633, 50.41614532470703, 53.213130950927734, 56.01011657714844, 58.80710220336914, 61.604087829589844, 64.40107727050781, 67.19805908203125, 69.99504089355469, 72.79203033447266, 75.58901977539062, 78.38600158691406, 81.1829833984375, 83.97997283935547, 86.77696228027344, 89.57394409179688, 92.37092590332031, 95.16791534423828, 97.96490478515625, 100.76188659667969, 103.55886840820312, 106.3558578491211, 109.15284729003906, 111.9498291015625, 114.74681091308594, 117.5438003540039]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 8.0, 6.0, 8.0, 14.0, 20.0, 23.0, 31.0, 43.0, 47.0, 56.0, 56.0, 70.0, 74.0, 64.0, 64.0, 68.0, 66.0, 62.0, 45.0, 49.0, 27.0, 25.0, 21.0, 22.0, 13.0, 9.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7265625, -8.46826171875, -8.2099609375, -7.95166015625, -7.693359375, -7.43505859375, -7.1767578125, -6.91845703125, -6.66015625, -6.40185546875, -6.1435546875, -5.88525390625, -5.626953125, -5.36865234375, -5.1103515625, -4.85205078125, -4.59375, -4.33544921875, -4.0771484375, -3.81884765625, -3.560546875, -3.30224609375, -3.0439453125, -2.78564453125, -2.52734375, -2.26904296875, -2.0107421875, -1.75244140625, -1.494140625, -1.23583984375, -0.9775390625, -0.71923828125, -0.4609375, -0.20263671875, 0.0556640625, 0.31396484375, 0.572265625, 0.83056640625, 1.0888671875, 1.34716796875, 1.60546875, 1.86376953125, 2.1220703125, 2.38037109375, 2.638671875, 2.89697265625, 3.1552734375, 3.41357421875, 3.671875, 3.93017578125, 4.1884765625, 4.44677734375, 4.705078125, 4.96337890625, 5.2216796875, 5.47998046875, 5.73828125, 5.99658203125, 6.2548828125, 6.51318359375, 6.771484375, 7.02978515625, 7.2880859375, 7.54638671875, 7.8046875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 9.0, 10.0, 16.0, 11.0, 18.0, 44.0, 40.0, 82.0, 110.0, 211.0, 317.0, 627.0, 985.0, 1928.0, 3248.0, 5655.0, 9790.0, 17764.0, 30356.0, 52097.0, 87060.0, 135199.0, 181442.0, 180442.0, 133828.0, 85674.0, 51097.0, 30368.0, 17321.0, 9754.0, 5622.0, 3067.0, 1848.0, 1002.0, 573.0, 351.0, 209.0, 144.0, 60.0, 58.0, 25.0, 30.0, 23.0, 16.0, 9.0, 2.0, 4.0, 7.0, 3.0, 2.0, 0.0, 0.0, 4.0], "bins": [-0.9775390625, -0.9487762451171875, -0.920013427734375, -0.8912506103515625, -0.86248779296875, -0.8337249755859375, -0.804962158203125, -0.7761993408203125, -0.7474365234375, -0.7186737060546875, -0.689910888671875, -0.6611480712890625, -0.63238525390625, -0.6036224365234375, -0.574859619140625, -0.5460968017578125, -0.517333984375, -0.4885711669921875, -0.459808349609375, -0.4310455322265625, -0.40228271484375, -0.3735198974609375, -0.344757080078125, -0.3159942626953125, -0.2872314453125, -0.2584686279296875, -0.229705810546875, -0.2009429931640625, -0.17218017578125, -0.1434173583984375, -0.114654541015625, -0.0858917236328125, -0.05712890625, -0.0283660888671875, 0.000396728515625, 0.0291595458984375, 0.05792236328125, 0.0866851806640625, 0.115447998046875, 0.1442108154296875, 0.1729736328125, 0.2017364501953125, 0.230499267578125, 0.2592620849609375, 0.28802490234375, 0.3167877197265625, 0.345550537109375, 0.3743133544921875, 0.403076171875, 0.4318389892578125, 0.460601806640625, 0.4893646240234375, 0.51812744140625, 0.5468902587890625, 0.575653076171875, 0.6044158935546875, 0.6331787109375, 0.6619415283203125, 0.690704345703125, 0.7194671630859375, 0.74822998046875, 0.7769927978515625, 0.805755615234375, 0.8345184326171875, 0.86328125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 6.0, 11.0, 12.0, 13.0, 11.0, 24.0, 31.0, 34.0, 31.0, 33.0, 40.0, 35.0, 43.0, 43.0, 38.0, 37.0, 1077.0, 44.0, 44.0, 39.0, 50.0, 45.0, 51.0, 23.0, 24.0, 35.0, 19.0, 24.0, 17.0, 20.0, 13.0, 12.0, 9.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.578125, -4.42327880859375, -4.2684326171875, -4.11358642578125, -3.958740234375, -3.80389404296875, -3.6490478515625, -3.49420166015625, -3.33935546875, -3.18450927734375, -3.0296630859375, -2.87481689453125, -2.719970703125, -2.56512451171875, -2.4102783203125, -2.25543212890625, -2.1005859375, -1.94573974609375, -1.7908935546875, -1.63604736328125, -1.481201171875, -1.32635498046875, -1.1715087890625, -1.01666259765625, -0.86181640625, -0.70697021484375, -0.5521240234375, -0.39727783203125, -0.242431640625, -0.08758544921875, 0.0672607421875, 0.22210693359375, 0.376953125, 0.53179931640625, 0.6866455078125, 0.84149169921875, 0.996337890625, 1.15118408203125, 1.3060302734375, 1.46087646484375, 1.61572265625, 1.77056884765625, 1.9254150390625, 2.08026123046875, 2.235107421875, 2.38995361328125, 2.5447998046875, 2.69964599609375, 2.8544921875, 3.00933837890625, 3.1641845703125, 3.31903076171875, 3.473876953125, 3.62872314453125, 3.7835693359375, 3.93841552734375, 4.09326171875, 4.24810791015625, 4.4029541015625, 4.55780029296875, 4.712646484375, 4.86749267578125, 5.0223388671875, 5.17718505859375, 5.33203125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 7.0, 6.0, 14.0, 19.0, 38.0, 50.0, 101.0, 128.0, 229.0, 368.0, 553.0, 963.0, 1603.0, 2753.0, 4936.0, 8749.0, 15901.0, 34403.0, 319131.0, 1618469.0, 46048.0, 18876.0, 10088.0, 5720.0, 3154.0, 1888.0, 1135.0, 706.0, 410.0, 251.0, 161.0, 92.0, 65.0, 47.0, 34.0, 12.0, 10.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.140228271484375, -2.07147216796875, -2.002716064453125, -1.9339599609375, -1.865203857421875, -1.79644775390625, -1.727691650390625, -1.658935546875, -1.590179443359375, -1.52142333984375, -1.452667236328125, -1.3839111328125, -1.315155029296875, -1.24639892578125, -1.177642822265625, -1.10888671875, -1.040130615234375, -0.97137451171875, -0.902618408203125, -0.8338623046875, -0.765106201171875, -0.69635009765625, -0.627593994140625, -0.558837890625, -0.490081787109375, -0.42132568359375, -0.352569580078125, -0.2838134765625, -0.215057373046875, -0.14630126953125, -0.077545166015625, -0.0087890625, 0.059967041015625, 0.12872314453125, 0.197479248046875, 0.2662353515625, 0.334991455078125, 0.40374755859375, 0.472503662109375, 0.541259765625, 0.610015869140625, 0.67877197265625, 0.747528076171875, 0.8162841796875, 0.885040283203125, 0.95379638671875, 1.022552490234375, 1.09130859375, 1.160064697265625, 1.22882080078125, 1.297576904296875, 1.3663330078125, 1.435089111328125, 1.50384521484375, 1.572601318359375, 1.641357421875, 1.710113525390625, 1.77886962890625, 1.847625732421875, 1.9163818359375, 1.985137939453125, 2.05389404296875, 2.122650146484375, 2.19140625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 3.0, 9.0, 8.0, 13.0, 12.0, 16.0, 22.0, 23.0, 35.0, 33.0, 64.0, 58.0, 53.0, 70.0, 83.0, 72.0, 56.0, 92.0, 48.0, 52.0, 48.0, 24.0, 25.0, 25.0, 15.0, 11.0, 9.0, 6.0, 3.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11505126953125, -0.1102304458618164, -0.10540962219238281, -0.10058879852294922, -0.09576797485351562, -0.09094715118408203, -0.08612632751464844, -0.08130550384521484, -0.07648468017578125, -0.07166385650634766, -0.06684303283691406, -0.06202220916748047, -0.057201385498046875, -0.05238056182861328, -0.04755973815917969, -0.042738914489746094, -0.0379180908203125, -0.033097267150878906, -0.028276443481445312, -0.02345561981201172, -0.018634796142578125, -0.013813972473144531, -0.008993148803710938, -0.004172325134277344, 0.00064849853515625, 0.005469322204589844, 0.010290145874023438, 0.015110969543457031, 0.019931793212890625, 0.02475261688232422, 0.029573440551757812, 0.034394264221191406, 0.039215087890625, 0.044035911560058594, 0.04885673522949219, 0.05367755889892578, 0.058498382568359375, 0.06331920623779297, 0.06814002990722656, 0.07296085357666016, 0.07778167724609375, 0.08260250091552734, 0.08742332458496094, 0.09224414825439453, 0.09706497192382812, 0.10188579559326172, 0.10670661926269531, 0.1115274429321289, 0.1163482666015625, 0.1211690902709961, 0.1259899139404297, 0.13081073760986328, 0.13563156127929688, 0.14045238494873047, 0.14527320861816406, 0.15009403228759766, 0.15491485595703125, 0.15973567962646484, 0.16455650329589844, 0.16937732696533203, 0.17419815063476562, 0.17901897430419922, 0.1838397979736328, 0.1886606216430664, 0.1934814453125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 7.0, 3.0, 10.0, 14.0, 10.0, 22.0, 33.0, 53.0, 54.0, 99.0, 136.0, 202.0, 401.0, 819.0, 4767.0, 1038027.0, 2285.0, 665.0, 333.0, 221.0, 116.0, 66.0, 54.0, 48.0, 27.0, 24.0, 19.0, 11.0, 11.0, 4.0, 5.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.859375, -3.763824462890625, -3.66827392578125, -3.572723388671875, -3.4771728515625, -3.381622314453125, -3.28607177734375, -3.190521240234375, -3.094970703125, -2.999420166015625, -2.90386962890625, -2.808319091796875, -2.7127685546875, -2.617218017578125, -2.52166748046875, -2.426116943359375, -2.33056640625, -2.235015869140625, -2.13946533203125, -2.043914794921875, -1.9483642578125, -1.852813720703125, -1.75726318359375, -1.661712646484375, -1.566162109375, -1.470611572265625, -1.37506103515625, -1.279510498046875, -1.1839599609375, -1.088409423828125, -0.99285888671875, -0.897308349609375, -0.8017578125, -0.706207275390625, -0.61065673828125, -0.515106201171875, -0.4195556640625, -0.324005126953125, -0.22845458984375, -0.132904052734375, -0.037353515625, 0.058197021484375, 0.15374755859375, 0.249298095703125, 0.3448486328125, 0.440399169921875, 0.53594970703125, 0.631500244140625, 0.72705078125, 0.822601318359375, 0.91815185546875, 1.013702392578125, 1.1092529296875, 1.204803466796875, 1.30035400390625, 1.395904541015625, 1.491455078125, 1.587005615234375, 1.68255615234375, 1.778106689453125, 1.8736572265625, 1.969207763671875, 2.06475830078125, 2.160308837890625, 2.255859375]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 14.0, 984.0, 17.0, 3.0, 1.0], "bins": [-3.56630277633667, -3.507347345352173, -3.448392152786255, -3.389436721801758, -3.3304812908172607, -3.2715258598327637, -3.2125706672668457, -3.1536152362823486, -3.0946598052978516, -3.0357043743133545, -2.9767491817474365, -2.9177937507629395, -2.8588383197784424, -2.7998828887939453, -2.7409276962280273, -2.6819722652435303, -2.6230170726776123, -2.5640616416931152, -2.5051064491271973, -2.4461510181427, -2.387195587158203, -2.328240394592285, -2.269284963607788, -2.210329532623291, -2.151374340057373, -2.092418909072876, -2.033463716506958, -1.974508285522461, -1.9155528545379639, -1.8565975427627563, -1.7976422309875488, -1.7386868000030518, -1.6797313690185547, -1.6207760572433472, -1.56182062625885, -1.5028653144836426, -1.4439098834991455, -1.384954571723938, -1.3259992599487305, -1.2670438289642334, -1.2080885171890259, -1.1491332054138184, -1.0901777744293213, -1.0312224626541138, -0.9722670912742615, -0.9133117198944092, -0.8543564081192017, -0.7954010367393494, -0.7364456057548523, -0.677490234375, -0.6185349225997925, -0.5595795512199402, -0.5006241798400879, -0.4416688084602356, -0.3827134668827057, -0.3237581253051758, -0.2648027539253235, -0.20584739744663239, -0.14689204096794128, -0.08793668448925018, -0.028981328010559082, 0.029974043369293213, 0.08892938494682312, 0.14788472652435303, 0.20684008300304413]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 5.0, 13.0, 12.0, 13.0, 9.0, 17.0, 15.0, 23.0, 24.0, 32.0, 29.0, 30.0, 47.0, 43.0, 42.0, 39.0, 50.0, 46.0, 37.0, 47.0, 33.0, 45.0, 44.0, 39.0, 34.0, 18.0, 35.0, 29.0, 28.0, 19.0, 18.0, 15.0, 11.0, 8.0, 11.0, 9.0, 4.0, 1.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.15697723627090454, -0.15180335938930511, -0.1466294825077057, -0.14145560562610626, -0.13628172874450684, -0.13110783696174622, -0.1259339600801468, -0.12076008319854736, -0.11558620631694794, -0.11041232943534851, -0.10523845255374908, -0.10006456822156906, -0.09489069133996964, -0.08971681445837021, -0.08454293012619019, -0.07936905324459076, -0.07419517636299133, -0.0690212994813919, -0.06384742259979248, -0.05867353826761246, -0.05349966138601303, -0.048325784504413605, -0.04315190389752388, -0.037978023290634155, -0.03280414640903473, -0.027630267664790154, -0.022456388920545578, -0.017282510176301003, -0.012108631432056427, -0.0069347526878118515, -0.001760873943567276, 0.0034130066633224487, 0.008586883544921875, 0.01376076228916645, 0.018934641033411026, 0.0241085197776556, 0.029282398521900177, 0.0344562754034996, 0.03963015601038933, 0.04480403661727905, 0.04997791349887848, 0.055151790380477905, 0.06032567098736763, 0.06549955159425735, 0.07067342847585678, 0.07584730535745621, 0.08102118968963623, 0.08619506657123566, 0.09136894345283508, 0.09654282033443451, 0.10171669721603394, 0.10689058154821396, 0.11206445842981339, 0.11723833531141281, 0.12241221964359283, 0.12758609652519226, 0.1327599734067917, 0.1379338502883911, 0.14310772716999054, 0.14828160405158997, 0.15345549583435059, 0.15862937271595, 0.16380324959754944, 0.16897712647914886, 0.1741510033607483]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 10.0, 5.0, 7.0, 6.0, 9.0, 16.0, 17.0, 20.0, 19.0, 26.0, 30.0, 26.0, 48.0, 40.0, 53.0, 43.0, 43.0, 35.0, 43.0, 34.0, 52.0, 53.0, 40.0, 31.0, 39.0, 47.0, 27.0, 34.0, 26.0, 15.0, 17.0, 16.0, 13.0, 17.0, 8.0, 7.0, 4.0, 8.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.6171875, -5.4510498046875, -5.284912109375, -5.1187744140625, -4.95263671875, -4.7864990234375, -4.620361328125, -4.4542236328125, -4.2880859375, -4.1219482421875, -3.955810546875, -3.7896728515625, -3.62353515625, -3.4573974609375, -3.291259765625, -3.1251220703125, -2.958984375, -2.7928466796875, -2.626708984375, -2.4605712890625, -2.29443359375, -2.1282958984375, -1.962158203125, -1.7960205078125, -1.6298828125, -1.4637451171875, -1.297607421875, -1.1314697265625, -0.96533203125, -0.7991943359375, -0.633056640625, -0.4669189453125, -0.30078125, -0.1346435546875, 0.031494140625, 0.1976318359375, 0.36376953125, 0.5299072265625, 0.696044921875, 0.8621826171875, 1.0283203125, 1.1944580078125, 1.360595703125, 1.5267333984375, 1.69287109375, 1.8590087890625, 2.025146484375, 2.1912841796875, 2.357421875, 2.5235595703125, 2.689697265625, 2.8558349609375, 3.02197265625, 3.1881103515625, 3.354248046875, 3.5203857421875, 3.6865234375, 3.8526611328125, 4.018798828125, 4.1849365234375, 4.35107421875, 4.5172119140625, 4.683349609375, 4.8494873046875, 5.015625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 7.0, 13.0, 22.0, 29.0, 28.0, 27.0, 63.0, 75.0, 112.0, 155.0, 253.0, 367.0, 608.0, 1121.0, 2107.0, 4690.0, 11760.0, 34054.0, 115145.0, 467906.0, 296780.0, 73822.0, 23351.0, 8525.0, 3482.0, 1613.0, 872.0, 535.0, 335.0, 215.0, 126.0, 106.0, 73.0, 52.0, 27.0, 21.0, 19.0, 15.0, 10.0, 9.0, 9.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.5546875, -9.272216796875, -8.98974609375, -8.707275390625, -8.4248046875, -8.142333984375, -7.85986328125, -7.577392578125, -7.294921875, -7.012451171875, -6.72998046875, -6.447509765625, -6.1650390625, -5.882568359375, -5.60009765625, -5.317626953125, -5.03515625, -4.752685546875, -4.47021484375, -4.187744140625, -3.9052734375, -3.622802734375, -3.34033203125, -3.057861328125, -2.775390625, -2.492919921875, -2.21044921875, -1.927978515625, -1.6455078125, -1.363037109375, -1.08056640625, -0.798095703125, -0.515625, -0.233154296875, 0.04931640625, 0.331787109375, 0.6142578125, 0.896728515625, 1.17919921875, 1.461669921875, 1.744140625, 2.026611328125, 2.30908203125, 2.591552734375, 2.8740234375, 3.156494140625, 3.43896484375, 3.721435546875, 4.00390625, 4.286376953125, 4.56884765625, 4.851318359375, 5.1337890625, 5.416259765625, 5.69873046875, 5.981201171875, 6.263671875, 6.546142578125, 6.82861328125, 7.111083984375, 7.3935546875, 7.676025390625, 7.95849609375, 8.240966796875, 8.5234375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 8.0, 9.0, 11.0, 14.0, 19.0, 23.0, 27.0, 49.0, 46.0, 60.0, 98.0, 177.0, 1538.0, 461.0, 178.0, 89.0, 53.0, 42.0, 42.0, 34.0, 23.0, 7.0, 9.0, 14.0, 10.0, 4.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.125, -21.431640625, -20.73828125, -20.044921875, -19.3515625, -18.658203125, -17.96484375, -17.271484375, -16.578125, -15.884765625, -15.19140625, -14.498046875, -13.8046875, -13.111328125, -12.41796875, -11.724609375, -11.03125, -10.337890625, -9.64453125, -8.951171875, -8.2578125, -7.564453125, -6.87109375, -6.177734375, -5.484375, -4.791015625, -4.09765625, -3.404296875, -2.7109375, -2.017578125, -1.32421875, -0.630859375, 0.0625, 0.755859375, 1.44921875, 2.142578125, 2.8359375, 3.529296875, 4.22265625, 4.916015625, 5.609375, 6.302734375, 6.99609375, 7.689453125, 8.3828125, 9.076171875, 9.76953125, 10.462890625, 11.15625, 11.849609375, 12.54296875, 13.236328125, 13.9296875, 14.623046875, 15.31640625, 16.009765625, 16.703125, 17.396484375, 18.08984375, 18.783203125, 19.4765625, 20.169921875, 20.86328125, 21.556640625, 22.25]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 10.0, 8.0, 12.0, 27.0, 47.0, 78.0, 125.0, 244.0, 426.0, 1089.0, 8802.0, 3128743.0, 4245.0, 893.0, 431.0, 212.0, 126.0, 56.0, 39.0, 32.0, 9.0, 10.0, 10.0, 11.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.125, -71.837890625, -69.55078125, -67.263671875, -64.9765625, -62.689453125, -60.40234375, -58.115234375, -55.828125, -53.541015625, -51.25390625, -48.966796875, -46.6796875, -44.392578125, -42.10546875, -39.818359375, -37.53125, -35.244140625, -32.95703125, -30.669921875, -28.3828125, -26.095703125, -23.80859375, -21.521484375, -19.234375, -16.947265625, -14.66015625, -12.373046875, -10.0859375, -7.798828125, -5.51171875, -3.224609375, -0.9375, 1.349609375, 3.63671875, 5.923828125, 8.2109375, 10.498046875, 12.78515625, 15.072265625, 17.359375, 19.646484375, 21.93359375, 24.220703125, 26.5078125, 28.794921875, 31.08203125, 33.369140625, 35.65625, 37.943359375, 40.23046875, 42.517578125, 44.8046875, 47.091796875, 49.37890625, 51.666015625, 53.953125, 56.240234375, 58.52734375, 60.814453125, 63.1015625, 65.388671875, 67.67578125, 69.962890625, 72.25]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 14.0, 199.0, 587.0, 203.0, 9.0, 0.0, 0.0, 1.0], "bins": [-347.1723327636719, -341.2425231933594, -335.3127136230469, -329.3829040527344, -323.4530944824219, -317.5233154296875, -311.593505859375, -305.6636962890625, -299.73388671875, -293.8040771484375, -287.874267578125, -281.9444580078125, -276.0146484375, -270.0848388671875, -264.155029296875, -258.2252502441406, -252.29542541503906, -246.36561584472656, -240.43580627441406, -234.50601196289062, -228.57620239257812, -222.64639282226562, -216.71658325195312, -210.78677368164062, -204.85696411132812, -198.92715454101562, -192.99734497070312, -187.06753540039062, -181.1377410888672, -175.2079315185547, -169.2781219482422, -163.3483123779297, -157.41851806640625, -151.48870849609375, -145.55889892578125, -139.62908935546875, -133.6992950439453, -127.76948547363281, -121.83967590332031, -115.90986633300781, -109.98005676269531, -104.05024719238281, -98.12044525146484, -92.19063568115234, -86.26083374023438, -80.33102416992188, -74.40121459960938, -68.47140502929688, -62.54160690307617, -56.61180114746094, -50.68199157714844, -44.7521858215332, -38.82238006591797, -32.892574310302734, -26.962764739990234, -21.032958984375, -15.103153228759766, -9.173346519470215, -3.243539810180664, 2.686267852783203, 8.616073608398438, 14.545879364013672, 20.475688934326172, 26.405494689941406, 32.33530044555664]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 10.0, 8.0, 7.0, 13.0, 17.0, 23.0, 21.0, 31.0, 21.0, 22.0, 36.0, 35.0, 30.0, 36.0, 44.0, 40.0, 34.0, 49.0, 52.0, 57.0, 48.0, 46.0, 30.0, 30.0, 26.0, 39.0, 41.0, 25.0, 20.0, 21.0, 24.0, 10.0, 14.0, 16.0, 6.0, 2.0, 3.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-51.750999450683594, -50.345767974853516, -48.9405403137207, -47.535308837890625, -46.13008117675781, -44.724849700927734, -43.319618225097656, -41.914390563964844, -40.509159088134766, -39.10392761230469, -37.698699951171875, -36.2934684753418, -34.88823699951172, -33.483009338378906, -32.07777786254883, -30.672548294067383, -29.267318725585938, -27.862089157104492, -26.456859588623047, -25.05162811279297, -23.646398544311523, -22.241168975830078, -20.8359375, -19.430707931518555, -18.02547836303711, -16.620248794555664, -15.215018272399902, -13.80978775024414, -12.404558181762695, -10.99932861328125, -9.594098091125488, -8.188867568969727, -6.783634185791016, -5.378404140472412, -3.9731740951538086, -2.567944049835205, -1.1627140045166016, 0.24251604080200195, 1.6477460861206055, 3.052976608276367, 4.4582061767578125, 5.863436222076416, 7.2686662673950195, 8.673896789550781, 10.079126358032227, 11.484355926513672, 12.889586448669434, 14.294816970825195, 15.70004653930664, 17.105276107788086, 18.51050567626953, 19.91573715209961, 21.320966720581055, 22.7261962890625, 24.131427764892578, 25.536657333374023, 26.94188690185547, 28.347116470336914, 29.75234603881836, 31.157577514648438, 32.56280517578125, 33.96803665161133, 35.373268127441406, 36.77849578857422, 38.1837272644043]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 13.0, 4.0, 8.0, 9.0, 15.0, 17.0, 9.0, 20.0, 25.0, 22.0, 23.0, 42.0, 34.0, 33.0, 44.0, 39.0, 42.0, 37.0, 32.0, 40.0, 53.0, 45.0, 39.0, 40.0, 33.0, 35.0, 32.0, 25.0, 26.0, 35.0, 23.0, 19.0, 18.0, 9.0, 14.0, 13.0, 2.0, 5.0, 10.0, 2.0, 6.0, 1.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.8203125, -5.6474609375, -5.474609375, -5.3017578125, -5.12890625, -4.9560546875, -4.783203125, -4.6103515625, -4.4375, -4.2646484375, -4.091796875, -3.9189453125, -3.74609375, -3.5732421875, -3.400390625, -3.2275390625, -3.0546875, -2.8818359375, -2.708984375, -2.5361328125, -2.36328125, -2.1904296875, -2.017578125, -1.8447265625, -1.671875, -1.4990234375, -1.326171875, -1.1533203125, -0.98046875, -0.8076171875, -0.634765625, -0.4619140625, -0.2890625, -0.1162109375, 0.056640625, 0.2294921875, 0.40234375, 0.5751953125, 0.748046875, 0.9208984375, 1.09375, 1.2666015625, 1.439453125, 1.6123046875, 1.78515625, 1.9580078125, 2.130859375, 2.3037109375, 2.4765625, 2.6494140625, 2.822265625, 2.9951171875, 3.16796875, 3.3408203125, 3.513671875, 3.6865234375, 3.859375, 4.0322265625, 4.205078125, 4.3779296875, 4.55078125, 4.7236328125, 4.896484375, 5.0693359375, 5.2421875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 7.0, 11.0, 7.0, 7.0, 11.0, 16.0, 23.0, 39.0, 39.0, 70.0, 94.0, 135.0, 171.0, 290.0, 473.0, 918.0, 1707.0, 3301.0, 7512.0, 21661.0, 109686.0, 835583.0, 2382313.0, 705378.0, 91359.0, 19557.0, 6912.0, 3125.0, 1629.0, 831.0, 474.0, 292.0, 201.0, 136.0, 81.0, 53.0, 46.0, 37.0, 23.0, 20.0, 16.0, 10.0, 7.0, 3.0, 9.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.9921875, -9.6529541015625, -9.313720703125, -8.9744873046875, -8.63525390625, -8.2960205078125, -7.956787109375, -7.6175537109375, -7.2783203125, -6.9390869140625, -6.599853515625, -6.2606201171875, -5.92138671875, -5.5821533203125, -5.242919921875, -4.9036865234375, -4.564453125, -4.2252197265625, -3.885986328125, -3.5467529296875, -3.20751953125, -2.8682861328125, -2.529052734375, -2.1898193359375, -1.8505859375, -1.5113525390625, -1.172119140625, -0.8328857421875, -0.49365234375, -0.1544189453125, 0.184814453125, 0.5240478515625, 0.86328125, 1.2025146484375, 1.541748046875, 1.8809814453125, 2.22021484375, 2.5594482421875, 2.898681640625, 3.2379150390625, 3.5771484375, 3.9163818359375, 4.255615234375, 4.5948486328125, 4.93408203125, 5.2733154296875, 5.612548828125, 5.9517822265625, 6.291015625, 6.6302490234375, 6.969482421875, 7.3087158203125, 7.64794921875, 7.9871826171875, 8.326416015625, 8.6656494140625, 9.0048828125, 9.3441162109375, 9.683349609375, 10.0225830078125, 10.36181640625, 10.7010498046875, 11.040283203125, 11.3795166015625, 11.71875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 6.0, 13.0, 15.0, 13.0, 24.0, 43.0, 84.0, 120.0, 175.0, 258.0, 436.0, 640.0, 731.0, 555.0, 344.0, 220.0, 146.0, 88.0, 61.0, 31.0, 13.0, 7.0, 14.0, 4.0, 1.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.7109375, -14.2681884765625, -13.825439453125, -13.3826904296875, -12.93994140625, -12.4971923828125, -12.054443359375, -11.6116943359375, -11.1689453125, -10.7261962890625, -10.283447265625, -9.8406982421875, -9.39794921875, -8.9552001953125, -8.512451171875, -8.0697021484375, -7.626953125, -7.1842041015625, -6.741455078125, -6.2987060546875, -5.85595703125, -5.4132080078125, -4.970458984375, -4.5277099609375, -4.0849609375, -3.6422119140625, -3.199462890625, -2.7567138671875, -2.31396484375, -1.8712158203125, -1.428466796875, -0.9857177734375, -0.54296875, -0.1002197265625, 0.342529296875, 0.7852783203125, 1.22802734375, 1.6707763671875, 2.113525390625, 2.5562744140625, 2.9990234375, 3.4417724609375, 3.884521484375, 4.3272705078125, 4.77001953125, 5.2127685546875, 5.655517578125, 6.0982666015625, 6.541015625, 6.9837646484375, 7.426513671875, 7.8692626953125, 8.31201171875, 8.7547607421875, 9.197509765625, 9.6402587890625, 10.0830078125, 10.5257568359375, 10.968505859375, 11.4112548828125, 11.85400390625, 12.2967529296875, 12.739501953125, 13.1822509765625, 13.625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 7.0, 9.0, 6.0, 15.0, 25.0, 34.0, 54.0, 76.0, 187.0, 410.0, 1089.0, 4588.0, 115132.0, 3990254.0, 76536.0, 4016.0, 1036.0, 357.0, 171.0, 100.0, 46.0, 28.0, 27.0, 23.0, 9.0, 6.0, 10.0, 1.0, 2.0, 7.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-38.8125, -37.718017578125, -36.62353515625, -35.529052734375, -34.4345703125, -33.340087890625, -32.24560546875, -31.151123046875, -30.056640625, -28.962158203125, -27.86767578125, -26.773193359375, -25.6787109375, -24.584228515625, -23.48974609375, -22.395263671875, -21.30078125, -20.206298828125, -19.11181640625, -18.017333984375, -16.9228515625, -15.828369140625, -14.73388671875, -13.639404296875, -12.544921875, -11.450439453125, -10.35595703125, -9.261474609375, -8.1669921875, -7.072509765625, -5.97802734375, -4.883544921875, -3.7890625, -2.694580078125, -1.60009765625, -0.505615234375, 0.5888671875, 1.683349609375, 2.77783203125, 3.872314453125, 4.966796875, 6.061279296875, 7.15576171875, 8.250244140625, 9.3447265625, 10.439208984375, 11.53369140625, 12.628173828125, 13.72265625, 14.817138671875, 15.91162109375, 17.006103515625, 18.1005859375, 19.195068359375, 20.28955078125, 21.384033203125, 22.478515625, 23.572998046875, 24.66748046875, 25.761962890625, 26.8564453125, 27.950927734375, 29.04541015625, 30.139892578125, 31.234375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 356.0, 644.0, 9.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-763.1830444335938, -749.0755004882812, -734.9678955078125, -720.8603515625, -706.7527465820312, -692.6452026367188, -678.53759765625, -664.4300537109375, -650.322509765625, -636.2149658203125, -622.1073608398438, -607.9998168945312, -593.8922119140625, -579.78466796875, -565.6771240234375, -551.5695190429688, -537.4619140625, -523.3543701171875, -509.24676513671875, -495.13922119140625, -481.0316467285156, -466.924072265625, -452.8164978027344, -438.70892333984375, -424.60137939453125, -410.4938049316406, -396.38623046875, -382.2786865234375, -368.1711120605469, -354.06353759765625, -339.9559631347656, -325.848388671875, -311.7408752441406, -297.63330078125, -283.5257263183594, -269.41815185546875, -255.31060791015625, -241.20303344726562, -227.095458984375, -212.98788452148438, -198.8803253173828, -184.7727508544922, -170.66519165039062, -156.5576171875, -142.45004272460938, -128.3424835205078, -114.23490905761719, -100.1273422241211, -86.019775390625, -71.9122085571289, -57.80463790893555, -43.69706726074219, -29.589500427246094, -15.48193359375, -1.374359130859375, 12.733207702636719, 26.840774536132812, 40.948341369628906, 55.055912017822266, 69.16348266601562, 83.27104949951172, 97.37861633300781, 111.48619079589844, 125.59375762939453, 139.70132446289062]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 4.0, 6.0, 17.0, 33.0, 30.0, 57.0, 65.0, 79.0, 101.0, 89.0, 97.0, 94.0, 85.0, 80.0, 50.0, 47.0, 31.0, 19.0, 15.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.440521240234375, -59.84383773803711, -57.247154235839844, -54.65047073364258, -52.05378723144531, -49.45710372924805, -46.86042022705078, -44.263736724853516, -41.66705322265625, -39.070369720458984, -36.47368621826172, -33.87700271606445, -31.280319213867188, -28.683635711669922, -26.086952209472656, -23.49026870727539, -20.893585205078125, -18.29690170288086, -15.700218200683594, -13.103534698486328, -10.506851196289062, -7.910167694091797, -5.313484191894531, -2.7168006896972656, -0.1201171875, 2.4765663146972656, 5.073249816894531, 7.669933319091797, 10.266616821289062, 12.863300323486328, 15.459983825683594, 18.05666732788086, 20.653350830078125, 23.25003433227539, 25.846717834472656, 28.443401336669922, 31.040084838867188, 33.63676834106445, 36.23345184326172, 38.830135345458984, 41.42681884765625, 44.023502349853516, 46.62018585205078, 49.21686935424805, 51.81355285644531, 54.41023635864258, 57.006919860839844, 59.60360336303711, 62.200286865234375, 64.79696655273438, 67.3936538696289, 69.99034118652344, 72.58702087402344, 75.18370056152344, 77.78038787841797, 80.3770751953125, 82.9737548828125, 85.5704345703125, 88.16712188720703, 90.76380920410156, 93.36048889160156, 95.95716857910156, 98.5538558959961, 101.15054321289062, 103.74722290039062]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 6.0, 4.0, 9.0, 10.0, 14.0, 15.0, 15.0, 16.0, 26.0, 23.0, 28.0, 31.0, 42.0, 37.0, 40.0, 41.0, 38.0, 45.0, 51.0, 51.0, 41.0, 51.0, 56.0, 48.0, 33.0, 30.0, 32.0, 34.0, 22.0, 18.0, 18.0, 14.0, 12.0, 15.0, 9.0, 6.0, 5.0, 2.0, 8.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.234375, -4.0889892578125, -3.943603515625, -3.7982177734375, -3.65283203125, -3.5074462890625, -3.362060546875, -3.2166748046875, -3.0712890625, -2.9259033203125, -2.780517578125, -2.6351318359375, -2.48974609375, -2.3443603515625, -2.198974609375, -2.0535888671875, -1.908203125, -1.7628173828125, -1.617431640625, -1.4720458984375, -1.32666015625, -1.1812744140625, -1.035888671875, -0.8905029296875, -0.7451171875, -0.5997314453125, -0.454345703125, -0.3089599609375, -0.16357421875, -0.0181884765625, 0.127197265625, 0.2725830078125, 0.41796875, 0.5633544921875, 0.708740234375, 0.8541259765625, 0.99951171875, 1.1448974609375, 1.290283203125, 1.4356689453125, 1.5810546875, 1.7264404296875, 1.871826171875, 2.0172119140625, 2.16259765625, 2.3079833984375, 2.453369140625, 2.5987548828125, 2.744140625, 2.8895263671875, 3.034912109375, 3.1802978515625, 3.32568359375, 3.4710693359375, 3.616455078125, 3.7618408203125, 3.9072265625, 4.0526123046875, 4.197998046875, 4.3433837890625, 4.48876953125, 4.6341552734375, 4.779541015625, 4.9249267578125, 5.0703125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 5.0, 7.0, 5.0, 9.0, 12.0, 27.0, 28.0, 49.0, 57.0, 112.0, 134.0, 191.0, 314.0, 453.0, 587.0, 922.0, 1279.0, 1856.0, 2693.0, 4074.0, 6046.0, 9017.0, 13217.0, 19664.0, 29028.0, 42719.0, 62271.0, 88433.0, 116197.0, 136808.0, 134764.0, 111173.0, 83237.0, 58948.0, 40132.0, 27136.0, 18374.0, 12489.0, 8427.0, 5648.0, 3846.0, 2559.0, 1795.0, 1196.0, 837.0, 569.0, 398.0, 255.0, 179.0, 124.0, 93.0, 49.0, 44.0, 29.0, 15.0, 17.0, 11.0, 8.0, 0.0, 3.0, 3.0], "bins": [-0.5791015625, -0.5615081787109375, -0.543914794921875, -0.5263214111328125, -0.50872802734375, -0.4911346435546875, -0.473541259765625, -0.4559478759765625, -0.4383544921875, -0.4207611083984375, -0.403167724609375, -0.3855743408203125, -0.36798095703125, -0.3503875732421875, -0.332794189453125, -0.3152008056640625, -0.297607421875, -0.2800140380859375, -0.262420654296875, -0.2448272705078125, -0.22723388671875, -0.2096405029296875, -0.192047119140625, -0.1744537353515625, -0.1568603515625, -0.1392669677734375, -0.121673583984375, -0.1040802001953125, -0.08648681640625, -0.0688934326171875, -0.051300048828125, -0.0337066650390625, -0.01611328125, 0.0014801025390625, 0.019073486328125, 0.0366668701171875, 0.05426025390625, 0.0718536376953125, 0.089447021484375, 0.1070404052734375, 0.1246337890625, 0.1422271728515625, 0.159820556640625, 0.1774139404296875, 0.19500732421875, 0.2126007080078125, 0.230194091796875, 0.2477874755859375, 0.265380859375, 0.2829742431640625, 0.300567626953125, 0.3181610107421875, 0.33575439453125, 0.3533477783203125, 0.370941162109375, 0.3885345458984375, 0.4061279296875, 0.4237213134765625, 0.441314697265625, 0.4589080810546875, 0.47650146484375, 0.4940948486328125, 0.511688232421875, 0.5292816162109375, 0.546875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 7.0, 12.0, 8.0, 9.0, 10.0, 18.0, 20.0, 19.0, 21.0, 23.0, 25.0, 26.0, 33.0, 33.0, 37.0, 50.0, 47.0, 41.0, 45.0, 1059.0, 41.0, 50.0, 35.0, 36.0, 33.0, 39.0, 25.0, 33.0, 30.0, 19.0, 23.0, 20.0, 17.0, 12.0, 13.0, 15.0, 8.0, 4.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.025390625, -2.922271728515625, -2.81915283203125, -2.716033935546875, -2.6129150390625, -2.509796142578125, -2.40667724609375, -2.303558349609375, -2.200439453125, -2.097320556640625, -1.99420166015625, -1.891082763671875, -1.7879638671875, -1.684844970703125, -1.58172607421875, -1.478607177734375, -1.37548828125, -1.272369384765625, -1.16925048828125, -1.066131591796875, -0.9630126953125, -0.859893798828125, -0.75677490234375, -0.653656005859375, -0.550537109375, -0.447418212890625, -0.34429931640625, -0.241180419921875, -0.1380615234375, -0.034942626953125, 0.06817626953125, 0.171295166015625, 0.2744140625, 0.377532958984375, 0.48065185546875, 0.583770751953125, 0.6868896484375, 0.790008544921875, 0.89312744140625, 0.996246337890625, 1.099365234375, 1.202484130859375, 1.30560302734375, 1.408721923828125, 1.5118408203125, 1.614959716796875, 1.71807861328125, 1.821197509765625, 1.92431640625, 2.027435302734375, 2.13055419921875, 2.233673095703125, 2.3367919921875, 2.439910888671875, 2.54302978515625, 2.646148681640625, 2.749267578125, 2.852386474609375, 2.95550537109375, 3.058624267578125, 3.1617431640625, 3.264862060546875, 3.36798095703125, 3.471099853515625, 3.57421875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 8.0, 10.0, 31.0, 33.0, 46.0, 72.0, 87.0, 141.0, 228.0, 328.0, 536.0, 815.0, 1283.0, 2003.0, 3013.0, 4805.0, 7799.0, 12603.0, 21864.0, 53731.0, 1579338.0, 323962.0, 36971.0, 18195.0, 10918.0, 6764.0, 4099.0, 2727.0, 1637.0, 1044.0, 677.0, 468.0, 290.0, 206.0, 137.0, 77.0, 53.0, 40.0, 32.0, 21.0, 6.0, 12.0, 7.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.44921875, -1.4051055908203125, -1.360992431640625, -1.3168792724609375, -1.27276611328125, -1.2286529541015625, -1.184539794921875, -1.1404266357421875, -1.0963134765625, -1.0522003173828125, -1.008087158203125, -0.9639739990234375, -0.91986083984375, -0.8757476806640625, -0.831634521484375, -0.7875213623046875, -0.743408203125, -0.6992950439453125, -0.655181884765625, -0.6110687255859375, -0.56695556640625, -0.5228424072265625, -0.478729248046875, -0.4346160888671875, -0.3905029296875, -0.3463897705078125, -0.302276611328125, -0.2581634521484375, -0.21405029296875, -0.1699371337890625, -0.125823974609375, -0.0817108154296875, -0.03759765625, 0.0065155029296875, 0.050628662109375, 0.0947418212890625, 0.13885498046875, 0.1829681396484375, 0.227081298828125, 0.2711944580078125, 0.3153076171875, 0.3594207763671875, 0.403533935546875, 0.4476470947265625, 0.49176025390625, 0.5358734130859375, 0.579986572265625, 0.6240997314453125, 0.668212890625, 0.7123260498046875, 0.756439208984375, 0.8005523681640625, 0.84466552734375, 0.8887786865234375, 0.932891845703125, 0.9770050048828125, 1.0211181640625, 1.0652313232421875, 1.109344482421875, 1.1534576416015625, 1.19757080078125, 1.2416839599609375, 1.285797119140625, 1.3299102783203125, 1.3740234375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 5.0, 3.0, 9.0, 11.0, 8.0, 12.0, 15.0, 23.0, 23.0, 39.0, 39.0, 48.0, 52.0, 63.0, 75.0, 64.0, 79.0, 67.0, 61.0, 49.0, 64.0, 40.0, 29.0, 27.0, 20.0, 13.0, 19.0, 13.0, 6.0, 9.0, 6.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08160400390625, -0.07870960235595703, -0.07581520080566406, -0.0729207992553711, -0.07002639770507812, -0.06713199615478516, -0.06423759460449219, -0.06134319305419922, -0.05844879150390625, -0.05555438995361328, -0.05265998840332031, -0.049765586853027344, -0.046871185302734375, -0.043976783752441406, -0.04108238220214844, -0.03818798065185547, -0.0352935791015625, -0.03239917755126953, -0.029504776000976562, -0.026610374450683594, -0.023715972900390625, -0.020821571350097656, -0.017927169799804688, -0.015032768249511719, -0.01213836669921875, -0.009243965148925781, -0.0063495635986328125, -0.0034551620483398438, -0.000560760498046875, 0.0023336410522460938, 0.0052280426025390625, 0.008122444152832031, 0.011016845703125, 0.013911247253417969, 0.016805648803710938, 0.019700050354003906, 0.022594451904296875, 0.025488853454589844, 0.028383255004882812, 0.03127765655517578, 0.03417205810546875, 0.03706645965576172, 0.03996086120605469, 0.042855262756347656, 0.045749664306640625, 0.048644065856933594, 0.05153846740722656, 0.05443286895751953, 0.0573272705078125, 0.06022167205810547, 0.06311607360839844, 0.0660104751586914, 0.06890487670898438, 0.07179927825927734, 0.07469367980957031, 0.07758808135986328, 0.08048248291015625, 0.08337688446044922, 0.08627128601074219, 0.08916568756103516, 0.09206008911132812, 0.0949544906616211, 0.09784889221191406, 0.10074329376220703, 0.1036376953125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 11.0, 19.0, 22.0, 35.0, 35.0, 38.0, 57.0, 69.0, 99.0, 150.0, 212.0, 347.0, 536.0, 1085.0, 9817.0, 1022480.0, 10766.0, 1058.0, 570.0, 299.0, 193.0, 160.0, 126.0, 96.0, 55.0, 38.0, 34.0, 32.0, 17.0, 27.0, 11.0, 3.0, 11.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.4013671875, -1.3595428466796875, -1.317718505859375, -1.2758941650390625, -1.23406982421875, -1.1922454833984375, -1.150421142578125, -1.1085968017578125, -1.0667724609375, -1.0249481201171875, -0.983123779296875, -0.9412994384765625, -0.89947509765625, -0.8576507568359375, -0.815826416015625, -0.7740020751953125, -0.732177734375, -0.6903533935546875, -0.648529052734375, -0.6067047119140625, -0.56488037109375, -0.5230560302734375, -0.481231689453125, -0.4394073486328125, -0.3975830078125, -0.3557586669921875, -0.313934326171875, -0.2721099853515625, -0.23028564453125, -0.1884613037109375, -0.146636962890625, -0.1048126220703125, -0.06298828125, -0.0211639404296875, 0.020660400390625, 0.0624847412109375, 0.10430908203125, 0.1461334228515625, 0.187957763671875, 0.2297821044921875, 0.2716064453125, 0.3134307861328125, 0.355255126953125, 0.3970794677734375, 0.43890380859375, 0.4807281494140625, 0.522552490234375, 0.5643768310546875, 0.606201171875, 0.6480255126953125, 0.689849853515625, 0.7316741943359375, 0.77349853515625, 0.8153228759765625, 0.857147216796875, 0.8989715576171875, 0.9407958984375, 0.9826202392578125, 1.024444580078125, 1.0662689208984375, 1.10809326171875, 1.1499176025390625, 1.191741943359375, 1.2335662841796875, 1.275390625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 74.0, 895.0, 42.0], "bins": [-2.1489078998565674, -2.1144659519195557, -2.080024003982544, -2.0455820560455322, -2.0111401081085205, -1.9766981601715088, -1.942256212234497, -1.9078142642974854, -1.8733723163604736, -1.838930368423462, -1.8044884204864502, -1.7700464725494385, -1.7356045246124268, -1.701162576675415, -1.6667206287384033, -1.6322786808013916, -1.5978368520736694, -1.5633949041366577, -1.528952956199646, -1.4945110082626343, -1.4600690603256226, -1.4256271123886108, -1.3911851644515991, -1.356743335723877, -1.3223013877868652, -1.2878594398498535, -1.2534174919128418, -1.21897554397583, -1.1845335960388184, -1.1500916481018066, -1.115649700164795, -1.0812077522277832, -1.046765685081482, -1.0123237371444702, -0.9778817892074585, -0.9434398412704468, -0.9089978933334351, -0.8745559453964233, -0.8401140570640564, -0.8056721091270447, -0.7712302207946777, -0.736788272857666, -0.7023463249206543, -0.6679043769836426, -0.6334624290466309, -0.5990204811096191, -0.5645785927772522, -0.5301366448402405, -0.49569466710090637, -0.46125271916389465, -0.4268108010292053, -0.3923688530921936, -0.3579269051551819, -0.32348495721817017, -0.28904300928115845, -0.2546010911464691, -0.2201591432094574, -0.18571719527244568, -0.15127526223659515, -0.11683332175016403, -0.08239138126373291, -0.04794943332672119, -0.013507500290870667, 0.02093443274497986, 0.05537638068199158]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 0.0, 6.0, 4.0, 7.0, 10.0, 4.0, 16.0, 15.0, 20.0, 25.0, 25.0, 28.0, 39.0, 37.0, 44.0, 44.0, 42.0, 47.0, 49.0, 59.0, 57.0, 59.0, 47.0, 48.0, 38.0, 37.0, 35.0, 37.0, 26.0, 21.0, 19.0, 10.0, 16.0, 10.0, 7.0, 6.0, 7.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15559381246566772, -0.15094004571437836, -0.14628629386425018, -0.14163252711296082, -0.13697877526283264, -0.13232500851154327, -0.1276712566614151, -0.12301748991012573, -0.11836373060941696, -0.11370997130870819, -0.10905621200799942, -0.10440245270729065, -0.09974868595600128, -0.09509493410587311, -0.09044116735458374, -0.08578740805387497, -0.0811336487531662, -0.07647988945245743, -0.07182613015174866, -0.06717237085103989, -0.06251861155033112, -0.057864848524332047, -0.05321108549833298, -0.04855732619762421, -0.043903566896915436, -0.039249807596206665, -0.034596048295497894, -0.029942285269498825, -0.025288525968790054, -0.020634766668081284, -0.015981005504727364, -0.011327244341373444, -0.006673485040664673, -0.0020197248086333275, 0.002634035423398018, 0.007287795655429363, 0.011941555887460709, 0.01659531518816948, 0.0212490763515234, 0.02590283751487732, 0.03055659681558609, 0.03521035611629486, 0.03986411541700363, 0.0445178784430027, 0.04917163774371147, 0.05382539704442024, 0.05847916007041931, 0.06313291937112808, 0.06778667867183685, 0.07244043797254562, 0.0770941972732544, 0.08174795657396317, 0.08640171587467194, 0.0910554826259613, 0.09570924192667007, 0.10036300122737885, 0.10501676052808762, 0.10967051982879639, 0.11432427912950516, 0.11897803843021393, 0.1236318051815033, 0.12828555703163147, 0.13293932378292084, 0.1375930905342102, 0.14224684238433838]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 12.0, 4.0, 9.0, 16.0, 11.0, 23.0, 18.0, 22.0, 23.0, 23.0, 30.0, 32.0, 33.0, 30.0, 41.0, 46.0, 29.0, 38.0, 51.0, 45.0, 50.0, 48.0, 38.0, 40.0, 39.0, 31.0, 33.0, 27.0, 23.0, 25.0, 12.0, 18.0, 15.0, 12.0, 7.0, 8.0, 7.0, 6.0, 5.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.84375, -3.7098388671875, -3.575927734375, -3.4420166015625, -3.30810546875, -3.1741943359375, -3.040283203125, -2.9063720703125, -2.7724609375, -2.6385498046875, -2.504638671875, -2.3707275390625, -2.23681640625, -2.1029052734375, -1.968994140625, -1.8350830078125, -1.701171875, -1.5672607421875, -1.433349609375, -1.2994384765625, -1.16552734375, -1.0316162109375, -0.897705078125, -0.7637939453125, -0.6298828125, -0.4959716796875, -0.362060546875, -0.2281494140625, -0.09423828125, 0.0396728515625, 0.173583984375, 0.3074951171875, 0.44140625, 0.5753173828125, 0.709228515625, 0.8431396484375, 0.97705078125, 1.1109619140625, 1.244873046875, 1.3787841796875, 1.5126953125, 1.6466064453125, 1.780517578125, 1.9144287109375, 2.04833984375, 2.1822509765625, 2.316162109375, 2.4500732421875, 2.583984375, 2.7178955078125, 2.851806640625, 2.9857177734375, 3.11962890625, 3.2535400390625, 3.387451171875, 3.5213623046875, 3.6552734375, 3.7891845703125, 3.923095703125, 4.0570068359375, 4.19091796875, 4.3248291015625, 4.458740234375, 4.5926513671875, 4.7265625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 6.0, 4.0, 10.0, 16.0, 11.0, 23.0, 21.0, 22.0, 41.0, 48.0, 75.0, 97.0, 136.0, 204.0, 273.0, 434.0, 655.0, 1084.0, 1975.0, 3976.0, 8845.0, 22129.0, 63701.0, 213659.0, 433719.0, 199032.0, 60195.0, 20902.0, 8512.0, 3889.0, 1908.0, 1041.0, 607.0, 352.0, 237.0, 181.0, 120.0, 105.0, 71.0, 53.0, 36.0, 46.0, 31.0, 25.0, 11.0, 7.0, 9.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.1015625, -4.93414306640625, -4.7667236328125, -4.59930419921875, -4.431884765625, -4.26446533203125, -4.0970458984375, -3.92962646484375, -3.76220703125, -3.59478759765625, -3.4273681640625, -3.25994873046875, -3.092529296875, -2.92510986328125, -2.7576904296875, -2.59027099609375, -2.4228515625, -2.25543212890625, -2.0880126953125, -1.92059326171875, -1.753173828125, -1.58575439453125, -1.4183349609375, -1.25091552734375, -1.08349609375, -0.91607666015625, -0.7486572265625, -0.58123779296875, -0.413818359375, -0.24639892578125, -0.0789794921875, 0.08843994140625, 0.255859375, 0.42327880859375, 0.5906982421875, 0.75811767578125, 0.925537109375, 1.09295654296875, 1.2603759765625, 1.42779541015625, 1.59521484375, 1.76263427734375, 1.9300537109375, 2.09747314453125, 2.264892578125, 2.43231201171875, 2.5997314453125, 2.76715087890625, 2.9345703125, 3.10198974609375, 3.2694091796875, 3.43682861328125, 3.604248046875, 3.77166748046875, 3.9390869140625, 4.10650634765625, 4.27392578125, 4.44134521484375, 4.6087646484375, 4.77618408203125, 4.943603515625, 5.11102294921875, 5.2784423828125, 5.44586181640625, 5.61328125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 1.0, 4.0, 1.0, 6.0, 7.0, 12.0, 17.0, 16.0, 22.0, 25.0, 37.0, 45.0, 46.0, 74.0, 84.0, 152.0, 304.0, 1414.0, 270.0, 145.0, 76.0, 63.0, 58.0, 31.0, 35.0, 21.0, 24.0, 17.0, 10.0, 3.0, 9.0, 5.0, 3.0, 4.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.8671875, -14.3621826171875, -13.857177734375, -13.3521728515625, -12.84716796875, -12.3421630859375, -11.837158203125, -11.3321533203125, -10.8271484375, -10.3221435546875, -9.817138671875, -9.3121337890625, -8.80712890625, -8.3021240234375, -7.797119140625, -7.2921142578125, -6.787109375, -6.2821044921875, -5.777099609375, -5.2720947265625, -4.76708984375, -4.2620849609375, -3.757080078125, -3.2520751953125, -2.7470703125, -2.2420654296875, -1.737060546875, -1.2320556640625, -0.72705078125, -0.2220458984375, 0.282958984375, 0.7879638671875, 1.29296875, 1.7979736328125, 2.302978515625, 2.8079833984375, 3.31298828125, 3.8179931640625, 4.322998046875, 4.8280029296875, 5.3330078125, 5.8380126953125, 6.343017578125, 6.8480224609375, 7.35302734375, 7.8580322265625, 8.363037109375, 8.8680419921875, 9.373046875, 9.8780517578125, 10.383056640625, 10.8880615234375, 11.39306640625, 11.8980712890625, 12.403076171875, 12.9080810546875, 13.4130859375, 13.9180908203125, 14.423095703125, 14.9281005859375, 15.43310546875, 15.9381103515625, 16.443115234375, 16.9481201171875, 17.453125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 9.0, 14.0, 10.0, 9.0, 16.0, 25.0, 44.0, 68.0, 97.0, 121.0, 256.0, 537.0, 1642.0, 45002.0, 3086468.0, 9209.0, 1097.0, 451.0, 191.0, 117.0, 97.0, 60.0, 38.0, 33.0, 21.0, 15.0, 16.0, 11.0, 3.0, 2.0, 9.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-30.71875, -29.671875, -28.625, -27.578125, -26.53125, -25.484375, -24.4375, -23.390625, -22.34375, -21.296875, -20.25, -19.203125, -18.15625, -17.109375, -16.0625, -15.015625, -13.96875, -12.921875, -11.875, -10.828125, -9.78125, -8.734375, -7.6875, -6.640625, -5.59375, -4.546875, -3.5, -2.453125, -1.40625, -0.359375, 0.6875, 1.734375, 2.78125, 3.828125, 4.875, 5.921875, 6.96875, 8.015625, 9.0625, 10.109375, 11.15625, 12.203125, 13.25, 14.296875, 15.34375, 16.390625, 17.4375, 18.484375, 19.53125, 20.578125, 21.625, 22.671875, 23.71875, 24.765625, 25.8125, 26.859375, 27.90625, 28.953125, 30.0, 31.046875, 32.09375, 33.140625, 34.1875, 35.234375, 36.28125]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 305.0, 690.0, 15.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-424.4847412109375, -416.5041809082031, -408.5236511230469, -400.5430908203125, -392.56256103515625, -384.5820007324219, -376.6014404296875, -368.62091064453125, -360.6403503417969, -352.6597900390625, -344.67926025390625, -336.6986999511719, -328.7181701660156, -320.73760986328125, -312.7570495605469, -304.7765197753906, -296.79595947265625, -288.8153991699219, -280.8348693847656, -272.85430908203125, -264.873779296875, -256.8932189941406, -248.9126739501953, -240.93212890625, -232.9515838623047, -224.97103881835938, -216.99049377441406, -209.0099334716797, -201.02938842773438, -193.04884338378906, -185.06829833984375, -177.08773803710938, -169.107177734375, -161.1266326904297, -153.14608764648438, -145.16552734375, -137.1849822998047, -129.20443725585938, -121.22389221191406, -113.24333953857422, -105.26280212402344, -97.28225708007812, -89.30170440673828, -81.32115936279297, -73.34060668945312, -65.36006164550781, -57.379512786865234, -49.398963928222656, -41.41841125488281, -33.437862396240234, -25.457313537597656, -17.47676658630371, -9.496217727661133, -1.5156707763671875, 6.464878082275391, 14.445426940917969, 22.425975799560547, 30.406524658203125, 38.3870735168457, 46.36762237548828, 54.348167419433594, 62.32871627807617, 70.30926513671875, 78.28981018066406, 86.2703628540039]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 9.0, 10.0, 8.0, 6.0, 9.0, 12.0, 23.0, 19.0, 28.0, 35.0, 38.0, 37.0, 48.0, 24.0, 45.0, 41.0, 47.0, 58.0, 45.0, 31.0, 38.0, 44.0, 40.0, 43.0, 32.0, 31.0, 24.0, 38.0, 25.0, 14.0, 12.0, 25.0, 14.0, 11.0, 9.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.00141525268555, -33.01638412475586, -32.03135681152344, -31.04632568359375, -30.061296463012695, -29.07626724243164, -28.091238021850586, -27.10620880126953, -26.121177673339844, -25.13614845275879, -24.151119232177734, -23.166088104248047, -22.181058883666992, -21.196029663085938, -20.211000442504883, -19.225971221923828, -18.240942001342773, -17.25591278076172, -16.270883560180664, -15.285853385925293, -14.300823211669922, -13.315793991088867, -12.330764770507812, -11.345735549926758, -10.360705375671387, -9.375676155090332, -8.390645980834961, -7.405616760253906, -6.420587062835693, -5.4355573654174805, -4.450528144836426, -3.465498447418213, -2.48046875, -1.4954391717910767, -0.5104095935821533, 0.47461986541748047, 1.4596495628356934, 2.4446792602539062, 3.429708480834961, 4.414738178253174, 5.399767875671387, 6.3847975730896, 7.3698272705078125, 8.354856491088867, 9.339885711669922, 10.324915885925293, 11.309945106506348, 12.294975280761719, 13.280004501342773, 14.265033721923828, 15.2500638961792, 16.235092163085938, 17.220123291015625, 18.20515251159668, 19.190181732177734, 20.17521095275879, 21.160240173339844, 22.1452693939209, 23.130298614501953, 24.11532974243164, 25.100358963012695, 26.08538818359375, 27.070417404174805, 28.05544662475586, 29.040477752685547]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 8.0, 5.0, 3.0, 4.0, 10.0, 7.0, 13.0, 14.0, 13.0, 20.0, 18.0, 16.0, 25.0, 31.0, 31.0, 28.0, 34.0, 51.0, 38.0, 45.0, 43.0, 49.0, 53.0, 39.0, 38.0, 41.0, 42.0, 23.0, 36.0, 29.0, 24.0, 25.0, 26.0, 28.0, 18.0, 18.0, 12.0, 12.0, 7.0, 5.0, 5.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-5.1640625, -5.00732421875, -4.8505859375, -4.69384765625, -4.537109375, -4.38037109375, -4.2236328125, -4.06689453125, -3.91015625, -3.75341796875, -3.5966796875, -3.43994140625, -3.283203125, -3.12646484375, -2.9697265625, -2.81298828125, -2.65625, -2.49951171875, -2.3427734375, -2.18603515625, -2.029296875, -1.87255859375, -1.7158203125, -1.55908203125, -1.40234375, -1.24560546875, -1.0888671875, -0.93212890625, -0.775390625, -0.61865234375, -0.4619140625, -0.30517578125, -0.1484375, 0.00830078125, 0.1650390625, 0.32177734375, 0.478515625, 0.63525390625, 0.7919921875, 0.94873046875, 1.10546875, 1.26220703125, 1.4189453125, 1.57568359375, 1.732421875, 1.88916015625, 2.0458984375, 2.20263671875, 2.359375, 2.51611328125, 2.6728515625, 2.82958984375, 2.986328125, 3.14306640625, 3.2998046875, 3.45654296875, 3.61328125, 3.77001953125, 3.9267578125, 4.08349609375, 4.240234375, 4.39697265625, 4.5537109375, 4.71044921875, 4.8671875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 2.0, 4.0, 8.0, 18.0, 20.0, 31.0, 50.0, 65.0, 103.0, 171.0, 236.0, 443.0, 733.0, 1301.0, 4065.0, 59406.0, 3901202.0, 216827.0, 5896.0, 1566.0, 853.0, 473.0, 305.0, 194.0, 129.0, 86.0, 47.0, 25.0, 12.0, 10.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.84375, -23.57763671875, -22.3115234375, -21.04541015625, -19.779296875, -18.51318359375, -17.2470703125, -15.98095703125, -14.71484375, -13.44873046875, -12.1826171875, -10.91650390625, -9.650390625, -8.38427734375, -7.1181640625, -5.85205078125, -4.5859375, -3.31982421875, -2.0537109375, -0.78759765625, 0.478515625, 1.74462890625, 3.0107421875, 4.27685546875, 5.54296875, 6.80908203125, 8.0751953125, 9.34130859375, 10.607421875, 11.87353515625, 13.1396484375, 14.40576171875, 15.671875, 16.93798828125, 18.2041015625, 19.47021484375, 20.736328125, 22.00244140625, 23.2685546875, 24.53466796875, 25.80078125, 27.06689453125, 28.3330078125, 29.59912109375, 30.865234375, 32.13134765625, 33.3974609375, 34.66357421875, 35.9296875, 37.19580078125, 38.4619140625, 39.72802734375, 40.994140625, 42.26025390625, 43.5263671875, 44.79248046875, 46.05859375, 47.32470703125, 48.5908203125, 49.85693359375, 51.123046875, 52.38916015625, 53.6552734375, 54.92138671875, 56.1875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 9.0, 8.0, 12.0, 38.0, 48.0, 99.0, 193.0, 321.0, 563.0, 671.0, 704.0, 525.0, 363.0, 236.0, 108.0, 78.0, 46.0, 26.0, 15.0, 8.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.0625, -13.6224365234375, -13.182373046875, -12.7423095703125, -12.30224609375, -11.8621826171875, -11.422119140625, -10.9820556640625, -10.5419921875, -10.1019287109375, -9.661865234375, -9.2218017578125, -8.78173828125, -8.3416748046875, -7.901611328125, -7.4615478515625, -7.021484375, -6.5814208984375, -6.141357421875, -5.7012939453125, -5.26123046875, -4.8211669921875, -4.381103515625, -3.9410400390625, -3.5009765625, -3.0609130859375, -2.620849609375, -2.1807861328125, -1.74072265625, -1.3006591796875, -0.860595703125, -0.4205322265625, 0.01953125, 0.4595947265625, 0.899658203125, 1.3397216796875, 1.77978515625, 2.2198486328125, 2.659912109375, 3.0999755859375, 3.5400390625, 3.9801025390625, 4.420166015625, 4.8602294921875, 5.30029296875, 5.7403564453125, 6.180419921875, 6.6204833984375, 7.060546875, 7.5006103515625, 7.940673828125, 8.3807373046875, 8.82080078125, 9.2608642578125, 9.700927734375, 10.1409912109375, 10.5810546875, 11.0211181640625, 11.461181640625, 11.9012451171875, 12.34130859375, 12.7813720703125, 13.221435546875, 13.6614990234375, 14.1015625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 5.0, 2.0, 10.0, 9.0, 8.0, 21.0, 38.0, 87.0, 155.0, 282.0, 588.0, 1667.0, 7468.0, 94415.0, 2132306.0, 1868452.0, 79260.0, 6711.0, 1586.0, 571.0, 325.0, 155.0, 75.0, 34.0, 27.0, 7.0, 9.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.640625, -17.121337890625, -16.60205078125, -16.082763671875, -15.5634765625, -15.044189453125, -14.52490234375, -14.005615234375, -13.486328125, -12.967041015625, -12.44775390625, -11.928466796875, -11.4091796875, -10.889892578125, -10.37060546875, -9.851318359375, -9.33203125, -8.812744140625, -8.29345703125, -7.774169921875, -7.2548828125, -6.735595703125, -6.21630859375, -5.697021484375, -5.177734375, -4.658447265625, -4.13916015625, -3.619873046875, -3.1005859375, -2.581298828125, -2.06201171875, -1.542724609375, -1.0234375, -0.504150390625, 0.01513671875, 0.534423828125, 1.0537109375, 1.572998046875, 2.09228515625, 2.611572265625, 3.130859375, 3.650146484375, 4.16943359375, 4.688720703125, 5.2080078125, 5.727294921875, 6.24658203125, 6.765869140625, 7.28515625, 7.804443359375, 8.32373046875, 8.843017578125, 9.3623046875, 9.881591796875, 10.40087890625, 10.920166015625, 11.439453125, 11.958740234375, 12.47802734375, 12.997314453125, 13.5166015625, 14.035888671875, 14.55517578125, 15.074462890625, 15.59375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 8.0, 12.0, 17.0, 25.0, 35.0, 29.0, 35.0, 66.0, 67.0, 106.0, 95.0, 102.0, 89.0, 76.0, 65.0, 49.0, 28.0, 28.0, 24.0, 15.0, 9.0, 6.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-52.5525016784668, -50.56928253173828, -48.5860595703125, -46.602840423583984, -44.61962127685547, -42.63639831542969, -40.65317916870117, -38.669960021972656, -36.686737060546875, -34.70351791381836, -32.72029495239258, -30.737075805664062, -28.753856658935547, -26.7706356048584, -24.78741455078125, -22.804195404052734, -20.82097625732422, -18.83775520324707, -16.854536056518555, -14.871315002441406, -12.888094902038574, -10.904874801635742, -8.921653747558594, -6.938433647155762, -4.95521354675293, -2.9719932079315186, -0.9887728691101074, 0.9944477081298828, 2.977667808532715, 4.960887908935547, 6.944108963012695, 8.927329063415527, 10.910552978515625, 12.893773078918457, 14.876993179321289, 16.860214233398438, 18.843433380126953, 20.8266544342041, 22.80987548828125, 24.793094635009766, 26.776315689086914, 28.759536743164062, 30.742755889892578, 32.725975036621094, 34.709197998046875, 36.69241714477539, 38.675636291503906, 40.65885925292969, 42.6420783996582, 44.62529754638672, 46.6085205078125, 48.591739654541016, 50.57495880126953, 52.55818176269531, 54.54140090942383, 56.524620056152344, 58.507843017578125, 60.49106216430664, 62.47428512573242, 64.45750427246094, 66.44072723388672, 68.42394256591797, 70.40716552734375, 72.39038848876953, 74.37360382080078]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 3.0, 9.0, 18.0, 18.0, 21.0, 25.0, 26.0, 38.0, 39.0, 44.0, 53.0, 70.0, 51.0, 58.0, 67.0, 64.0, 60.0, 49.0, 39.0, 46.0, 37.0, 33.0, 39.0, 19.0, 13.0, 19.0, 8.0, 13.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.976768493652344, -47.36441421508789, -45.7520637512207, -44.13970947265625, -42.52735900878906, -40.91500473022461, -39.302650451660156, -37.69029998779297, -36.077945709228516, -34.46559143066406, -32.853240966796875, -31.240886688232422, -29.6285343170166, -28.01618194580078, -26.403827667236328, -24.791475296020508, -23.179122924804688, -21.566770553588867, -19.954418182373047, -18.342063903808594, -16.729711532592773, -15.117359161376953, -13.505005836486816, -11.89265251159668, -10.28030014038086, -8.667947769165039, -7.055594444274902, -5.443241596221924, -3.8308887481689453, -2.218536376953125, -0.6061830520629883, 1.0061702728271484, 2.6185226440429688, 4.230875492095947, 5.843228340148926, 7.455581188201904, 9.067934036254883, 10.680286407470703, 12.29263973236084, 13.904993057250977, 15.517345428466797, 17.129697799682617, 18.742050170898438, 20.35440444946289, 21.96675682067871, 23.57910919189453, 25.191463470458984, 26.803815841674805, 28.416168212890625, 30.028520584106445, 31.640872955322266, 33.25322723388672, 34.865577697753906, 36.47793197631836, 38.09028625488281, 39.70263671875, 41.31499099731445, 42.927345275878906, 44.539695739746094, 46.15205001831055, 47.764404296875, 49.37675476074219, 50.98910903930664, 52.601463317871094, 54.21381378173828]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 7.0, 8.0, 7.0, 12.0, 12.0, 18.0, 16.0, 15.0, 24.0, 27.0, 23.0, 42.0, 38.0, 46.0, 56.0, 43.0, 51.0, 55.0, 48.0, 47.0, 43.0, 31.0, 46.0, 41.0, 28.0, 36.0, 45.0, 21.0, 18.0, 16.0, 18.0, 13.0, 11.0, 12.0, 8.0, 5.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-102.0625, -99.390625, -96.71875, -94.046875, -91.375, -88.703125, -86.03125, -83.359375, -80.6875, -78.015625, -75.34375, -72.671875, -70.0, -67.328125, -64.65625, -61.984375, -59.3125, -56.640625, -53.96875, -51.296875, -48.625, -45.953125, -43.28125, -40.609375, -37.9375, -35.265625, -32.59375, -29.921875, -27.25, -24.578125, -21.90625, -19.234375, -16.5625, -13.890625, -11.21875, -8.546875, -5.875, -3.203125, -0.53125, 2.140625, 4.8125, 7.484375, 10.15625, 12.828125, 15.5, 18.171875, 20.84375, 23.515625, 26.1875, 28.859375, 31.53125, 34.203125, 36.875, 39.546875, 42.21875, 44.890625, 47.5625, 50.234375, 52.90625, 55.578125, 58.25, 60.921875, 63.59375, 66.265625, 68.9375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 1.0, 5.0, 14.0, 15.0, 16.0, 40.0, 50.0, 85.0, 139.0, 255.0, 359.0, 618.0, 1039.0, 1697.0, 3024.0, 4945.0, 8297.0, 13584.0, 22492.0, 37079.0, 58908.0, 90191.0, 127530.0, 158439.0, 156226.0, 126189.0, 88365.0, 57338.0, 36042.0, 22038.0, 13476.0, 8091.0, 4749.0, 2892.0, 1757.0, 1031.0, 615.0, 359.0, 210.0, 144.0, 69.0, 56.0, 27.0, 24.0, 19.0, 5.0, 4.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.3359375, -6.143798828125, -5.95166015625, -5.759521484375, -5.5673828125, -5.375244140625, -5.18310546875, -4.990966796875, -4.798828125, -4.606689453125, -4.41455078125, -4.222412109375, -4.0302734375, -3.838134765625, -3.64599609375, -3.453857421875, -3.26171875, -3.069580078125, -2.87744140625, -2.685302734375, -2.4931640625, -2.301025390625, -2.10888671875, -1.916748046875, -1.724609375, -1.532470703125, -1.34033203125, -1.148193359375, -0.9560546875, -0.763916015625, -0.57177734375, -0.379638671875, -0.1875, 0.004638671875, 0.19677734375, 0.388916015625, 0.5810546875, 0.773193359375, 0.96533203125, 1.157470703125, 1.349609375, 1.541748046875, 1.73388671875, 1.926025390625, 2.1181640625, 2.310302734375, 2.50244140625, 2.694580078125, 2.88671875, 3.078857421875, 3.27099609375, 3.463134765625, 3.6552734375, 3.847412109375, 4.03955078125, 4.231689453125, 4.423828125, 4.615966796875, 4.80810546875, 5.000244140625, 5.1923828125, 5.384521484375, 5.57666015625, 5.768798828125, 5.9609375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 4.0, 6.0, 5.0, 10.0, 13.0, 14.0, 11.0, 14.0, 24.0, 17.0, 31.0, 23.0, 19.0, 31.0, 38.0, 32.0, 33.0, 35.0, 29.0, 30.0, 42.0, 1067.0, 43.0, 46.0, 36.0, 39.0, 34.0, 37.0, 35.0, 30.0, 26.0, 19.0, 25.0, 11.0, 17.0, 18.0, 10.0, 6.0, 10.0, 9.0, 9.0, 4.0, 5.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.90625, -36.669921875, -35.43359375, -34.197265625, -32.9609375, -31.724609375, -30.48828125, -29.251953125, -28.015625, -26.779296875, -25.54296875, -24.306640625, -23.0703125, -21.833984375, -20.59765625, -19.361328125, -18.125, -16.888671875, -15.65234375, -14.416015625, -13.1796875, -11.943359375, -10.70703125, -9.470703125, -8.234375, -6.998046875, -5.76171875, -4.525390625, -3.2890625, -2.052734375, -0.81640625, 0.419921875, 1.65625, 2.892578125, 4.12890625, 5.365234375, 6.6015625, 7.837890625, 9.07421875, 10.310546875, 11.546875, 12.783203125, 14.01953125, 15.255859375, 16.4921875, 17.728515625, 18.96484375, 20.201171875, 21.4375, 22.673828125, 23.91015625, 25.146484375, 26.3828125, 27.619140625, 28.85546875, 30.091796875, 31.328125, 32.564453125, 33.80078125, 35.037109375, 36.2734375, 37.509765625, 38.74609375, 39.982421875, 41.21875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 11.0, 10.0, 13.0, 27.0, 23.0, 54.0, 73.0, 104.0, 152.0, 220.0, 309.0, 474.0, 652.0, 988.0, 1389.0, 2069.0, 2789.0, 4181.0, 5875.0, 8515.0, 12252.0, 19121.0, 37299.0, 173895.0, 1592407.0, 142850.0, 34514.0, 18258.0, 11858.0, 8178.0, 5741.0, 3922.0, 2714.0, 1878.0, 1376.0, 930.0, 635.0, 410.0, 288.0, 216.0, 159.0, 104.0, 63.0, 54.0, 33.0, 22.0, 6.0, 4.0, 12.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-11.421875, -11.0699462890625, -10.718017578125, -10.3660888671875, -10.01416015625, -9.6622314453125, -9.310302734375, -8.9583740234375, -8.6064453125, -8.2545166015625, -7.902587890625, -7.5506591796875, -7.19873046875, -6.8468017578125, -6.494873046875, -6.1429443359375, -5.791015625, -5.4390869140625, -5.087158203125, -4.7352294921875, -4.38330078125, -4.0313720703125, -3.679443359375, -3.3275146484375, -2.9755859375, -2.6236572265625, -2.271728515625, -1.9197998046875, -1.56787109375, -1.2159423828125, -0.864013671875, -0.5120849609375, -0.16015625, 0.1917724609375, 0.543701171875, 0.8956298828125, 1.24755859375, 1.5994873046875, 1.951416015625, 2.3033447265625, 2.6552734375, 3.0072021484375, 3.359130859375, 3.7110595703125, 4.06298828125, 4.4149169921875, 4.766845703125, 5.1187744140625, 5.470703125, 5.8226318359375, 6.174560546875, 6.5264892578125, 6.87841796875, 7.2303466796875, 7.582275390625, 7.9342041015625, 8.2861328125, 8.6380615234375, 8.989990234375, 9.3419189453125, 9.69384765625, 10.0457763671875, 10.397705078125, 10.7496337890625, 11.1015625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 7.0, 7.0, 8.0, 9.0, 8.0, 15.0, 11.0, 13.0, 23.0, 24.0, 24.0, 31.0, 43.0, 51.0, 44.0, 62.0, 48.0, 46.0, 57.0, 47.0, 37.0, 46.0, 46.0, 48.0, 42.0, 34.0, 25.0, 27.0, 14.0, 15.0, 23.0, 7.0, 13.0, 8.0, 7.0, 12.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.374267578125, -0.3628196716308594, -0.35137176513671875, -0.3399238586425781, -0.3284759521484375, -0.3170280456542969, -0.30558013916015625, -0.2941322326660156, -0.282684326171875, -0.2712364196777344, -0.25978851318359375, -0.24834060668945312, -0.2368927001953125, -0.22544479370117188, -0.21399688720703125, -0.20254898071289062, -0.19110107421875, -0.17965316772460938, -0.16820526123046875, -0.15675735473632812, -0.1453094482421875, -0.13386154174804688, -0.12241363525390625, -0.11096572875976562, -0.099517822265625, -0.08806991577148438, -0.07662200927734375, -0.06517410278320312, -0.0537261962890625, -0.042278289794921875, -0.03083038330078125, -0.019382476806640625, -0.0079345703125, 0.003513336181640625, 0.01496124267578125, 0.026409149169921875, 0.0378570556640625, 0.049304962158203125, 0.06075286865234375, 0.07220077514648438, 0.083648681640625, 0.09509658813476562, 0.10654449462890625, 0.11799240112304688, 0.1294403076171875, 0.14088821411132812, 0.15233612060546875, 0.16378402709960938, 0.17523193359375, 0.18667984008789062, 0.19812774658203125, 0.20957565307617188, 0.2210235595703125, 0.23247146606445312, 0.24391937255859375, 0.2553672790527344, 0.266815185546875, 0.2782630920410156, 0.28971099853515625, 0.3011589050292969, 0.3126068115234375, 0.3240547180175781, 0.33550262451171875, 0.3469505310058594, 0.3583984375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 7.0, 10.0, 10.0, 14.0, 22.0, 32.0, 35.0, 42.0, 57.0, 88.0, 119.0, 161.0, 241.0, 311.0, 471.0, 654.0, 1110.0, 1884.0, 3290.0, 6636.0, 14564.0, 35126.0, 83697.0, 177229.0, 269168.0, 230742.0, 125322.0, 54190.0, 22509.0, 9622.0, 4685.0, 2481.0, 1355.0, 824.0, 496.0, 343.0, 286.0, 181.0, 143.0, 95.0, 74.0, 57.0, 46.0, 29.0, 22.0, 21.0, 16.0, 9.0, 8.0, 4.0, 9.0, 4.0, 1.0, 3.0, 2.0, 2.0], "bins": [-1.43359375, -1.3898162841796875, -1.346038818359375, -1.3022613525390625, -1.25848388671875, -1.2147064208984375, -1.170928955078125, -1.1271514892578125, -1.0833740234375, -1.0395965576171875, -0.995819091796875, -0.9520416259765625, -0.90826416015625, -0.8644866943359375, -0.820709228515625, -0.7769317626953125, -0.733154296875, -0.6893768310546875, -0.645599365234375, -0.6018218994140625, -0.55804443359375, -0.5142669677734375, -0.470489501953125, -0.4267120361328125, -0.3829345703125, -0.3391571044921875, -0.295379638671875, -0.2516021728515625, -0.20782470703125, -0.1640472412109375, -0.120269775390625, -0.0764923095703125, -0.03271484375, 0.0110626220703125, 0.054840087890625, 0.0986175537109375, 0.14239501953125, 0.1861724853515625, 0.229949951171875, 0.2737274169921875, 0.3175048828125, 0.3612823486328125, 0.405059814453125, 0.4488372802734375, 0.49261474609375, 0.5363922119140625, 0.580169677734375, 0.6239471435546875, 0.667724609375, 0.7115020751953125, 0.755279541015625, 0.7990570068359375, 0.84283447265625, 0.8866119384765625, 0.930389404296875, 0.9741668701171875, 1.0179443359375, 1.0617218017578125, 1.105499267578125, 1.1492767333984375, 1.19305419921875, 1.2368316650390625, 1.280609130859375, 1.3243865966796875, 1.3681640625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 10.0, 17.0, 25.0, 35.0, 46.0, 77.0, 103.0, 156.0, 159.0, 144.0, 83.0, 67.0, 31.0, 19.0, 8.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9699581265449524, -0.939214825630188, -0.9084715247154236, -0.8777282238006592, -0.8469849228858948, -0.8162416219711304, -0.785498321056366, -0.7547550201416016, -0.7240117192268372, -0.6932684183120728, -0.6625251173973083, -0.631781816482544, -0.6010385155677795, -0.5702952146530151, -0.5395519137382507, -0.5088086128234863, -0.47806528210639954, -0.44732198119163513, -0.4165786802768707, -0.3858353793621063, -0.3550920784473419, -0.3243487477302551, -0.2936054468154907, -0.2628621459007263, -0.2321188598871231, -0.2013755589723587, -0.1706322580575943, -0.1398889422416687, -0.1091456487774849, -0.07840234041213989, -0.04765903949737549, -0.016915738582611084, 0.01382756233215332, 0.044570863246917725, 0.07531416416168213, 0.10605747252702713, 0.13680076599121094, 0.16754408180713654, 0.19828738272190094, 0.22903068363666534, 0.25977396965026855, 0.29051727056503296, 0.32126057147979736, 0.35200387239456177, 0.38274717330932617, 0.4134904742240906, 0.444233775138855, 0.4749770760536194, 0.5057203769683838, 0.5364636778831482, 0.5672069787979126, 0.597950279712677, 0.6286935806274414, 0.6594368815422058, 0.6901801824569702, 0.7209234833717346, 0.7516668438911438, 0.7824101448059082, 0.8131534457206726, 0.843896746635437, 0.8746400475502014, 0.9053833484649658, 0.9361266493797302, 0.9668699502944946, 0.997613251209259]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 11.0, 7.0, 7.0, 16.0, 12.0, 23.0, 12.0, 22.0, 23.0, 24.0, 27.0, 39.0, 35.0, 31.0, 35.0, 46.0, 51.0, 63.0, 43.0, 46.0, 45.0, 39.0, 39.0, 36.0, 33.0, 21.0, 32.0, 31.0, 24.0, 18.0, 27.0, 16.0, 19.0, 10.0, 7.0, 8.0, 11.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4439167380332947, -0.42715683579444885, -0.410396933555603, -0.3936370313167572, -0.3768771290779114, -0.36011719703674316, -0.34335729479789734, -0.3265973925590515, -0.3098374903202057, -0.29307758808135986, -0.27631768584251404, -0.2595577836036682, -0.2427978664636612, -0.22603796422481537, -0.20927804708480835, -0.19251814484596252, -0.1757582426071167, -0.15899834036827087, -0.14223843812942505, -0.12547852098941803, -0.1087186187505722, -0.09195871651172638, -0.07519880682229996, -0.058438897132873535, -0.04167899489402771, -0.024919088929891586, -0.008159182965755463, 0.008600722998380661, 0.025360628962516785, 0.04212053120136261, 0.05888044089078903, 0.07564035058021545, 0.09240031242370605, 0.10916021466255188, 0.1259201169013977, 0.14268003404140472, 0.15943993628025055, 0.17619983851909637, 0.1929597556591034, 0.20971965789794922, 0.22647956013679504, 0.24323946237564087, 0.2599993646144867, 0.2767592668533325, 0.29351919889450073, 0.31027907133102417, 0.3270390033721924, 0.3437989056110382, 0.36055880784988403, 0.37731871008872986, 0.3940786123275757, 0.4108385145664215, 0.42759841680526733, 0.44435834884643555, 0.46111825108528137, 0.4778781533241272, 0.494638055562973, 0.5113979578018188, 0.5281578898429871, 0.5449177622795105, 0.5616776943206787, 0.5784375667572021, 0.5951974987983704, 0.6119574308395386, 0.628717303276062]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 9.0, 9.0, 6.0, 10.0, 16.0, 16.0, 18.0, 21.0, 30.0, 23.0, 36.0, 43.0, 30.0, 44.0, 54.0, 44.0, 64.0, 58.0, 49.0, 47.0, 50.0, 42.0, 42.0, 30.0, 38.0, 32.0, 21.0, 27.0, 16.0, 22.0, 21.0, 13.0, 10.0, 6.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-109.5625, -106.7236328125, -103.884765625, -101.0458984375, -98.20703125, -95.3681640625, -92.529296875, -89.6904296875, -86.8515625, -84.0126953125, -81.173828125, -78.3349609375, -75.49609375, -72.6572265625, -69.818359375, -66.9794921875, -64.140625, -61.3017578125, -58.462890625, -55.6240234375, -52.78515625, -49.9462890625, -47.107421875, -44.2685546875, -41.4296875, -38.5908203125, -35.751953125, -32.9130859375, -30.07421875, -27.2353515625, -24.396484375, -21.5576171875, -18.71875, -15.8798828125, -13.041015625, -10.2021484375, -7.36328125, -4.5244140625, -1.685546875, 1.1533203125, 3.9921875, 6.8310546875, 9.669921875, 12.5087890625, 15.34765625, 18.1865234375, 21.025390625, 23.8642578125, 26.703125, 29.5419921875, 32.380859375, 35.2197265625, 38.05859375, 40.8974609375, 43.736328125, 46.5751953125, 49.4140625, 52.2529296875, 55.091796875, 57.9306640625, 60.76953125, 63.6083984375, 66.447265625, 69.2861328125, 72.125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 9.0, 11.0, 11.0, 15.0, 19.0, 32.0, 33.0, 37.0, 42.0, 58.0, 86.0, 125.0, 218.0, 381.0, 1244.0, 7623.0, 115856.0, 734626.0, 174421.0, 10967.0, 1502.0, 472.0, 227.0, 145.0, 96.0, 59.0, 48.0, 30.0, 36.0, 30.0, 26.0, 19.0, 8.0, 12.0, 7.0, 8.0, 2.0, 2.0, 6.0, 0.0, 2.0, 1.0, 1.0], "bins": [-21.390625, -20.8360595703125, -20.281494140625, -19.7269287109375, -19.17236328125, -18.6177978515625, -18.063232421875, -17.5086669921875, -16.9541015625, -16.3995361328125, -15.844970703125, -15.2904052734375, -14.73583984375, -14.1812744140625, -13.626708984375, -13.0721435546875, -12.517578125, -11.9630126953125, -11.408447265625, -10.8538818359375, -10.29931640625, -9.7447509765625, -9.190185546875, -8.6356201171875, -8.0810546875, -7.5264892578125, -6.971923828125, -6.4173583984375, -5.86279296875, -5.3082275390625, -4.753662109375, -4.1990966796875, -3.64453125, -3.0899658203125, -2.535400390625, -1.9808349609375, -1.42626953125, -0.8717041015625, -0.317138671875, 0.2374267578125, 0.7919921875, 1.3465576171875, 1.901123046875, 2.4556884765625, 3.01025390625, 3.5648193359375, 4.119384765625, 4.6739501953125, 5.228515625, 5.7830810546875, 6.337646484375, 6.8922119140625, 7.44677734375, 8.0013427734375, 8.555908203125, 9.1104736328125, 9.6650390625, 10.2196044921875, 10.774169921875, 11.3287353515625, 11.88330078125, 12.4378662109375, 12.992431640625, 13.5469970703125, 14.1015625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 5.0, 5.0, 11.0, 27.0, 21.0, 52.0, 58.0, 73.0, 106.0, 114.0, 2144.0, 100.0, 103.0, 72.0, 65.0, 34.0, 22.0, 14.0, 9.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-228.875, -221.041015625, -213.20703125, -205.373046875, -197.5390625, -189.705078125, -181.87109375, -174.037109375, -166.203125, -158.369140625, -150.53515625, -142.701171875, -134.8671875, -127.033203125, -119.19921875, -111.365234375, -103.53125, -95.697265625, -87.86328125, -80.029296875, -72.1953125, -64.361328125, -56.52734375, -48.693359375, -40.859375, -33.025390625, -25.19140625, -17.357421875, -9.5234375, -1.689453125, 6.14453125, 13.978515625, 21.8125, 29.646484375, 37.48046875, 45.314453125, 53.1484375, 60.982421875, 68.81640625, 76.650390625, 84.484375, 92.318359375, 100.15234375, 107.986328125, 115.8203125, 123.654296875, 131.48828125, 139.322265625, 147.15625, 154.990234375, 162.82421875, 170.658203125, 178.4921875, 186.326171875, 194.16015625, 201.994140625, 209.828125, 217.662109375, 225.49609375, 233.330078125, 241.1640625, 248.998046875, 256.83203125, 264.666015625, 272.5]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 7.0, 8.0, 10.0, 20.0, 22.0, 38.0, 56.0, 134.0, 288.0, 744.0, 2090.0, 9612.0, 386070.0, 2727523.0, 14956.0, 2614.0, 826.0, 328.0, 144.0, 75.0, 36.0, 19.0, 14.0, 10.0, 7.0, 14.0, 6.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-28.625, -27.831787109375, -27.03857421875, -26.245361328125, -25.4521484375, -24.658935546875, -23.86572265625, -23.072509765625, -22.279296875, -21.486083984375, -20.69287109375, -19.899658203125, -19.1064453125, -18.313232421875, -17.52001953125, -16.726806640625, -15.93359375, -15.140380859375, -14.34716796875, -13.553955078125, -12.7607421875, -11.967529296875, -11.17431640625, -10.381103515625, -9.587890625, -8.794677734375, -8.00146484375, -7.208251953125, -6.4150390625, -5.621826171875, -4.82861328125, -4.035400390625, -3.2421875, -2.448974609375, -1.65576171875, -0.862548828125, -0.0693359375, 0.723876953125, 1.51708984375, 2.310302734375, 3.103515625, 3.896728515625, 4.68994140625, 5.483154296875, 6.2763671875, 7.069580078125, 7.86279296875, 8.656005859375, 9.44921875, 10.242431640625, 11.03564453125, 11.828857421875, 12.6220703125, 13.415283203125, 14.20849609375, 15.001708984375, 15.794921875, 16.588134765625, 17.38134765625, 18.174560546875, 18.9677734375, 19.760986328125, 20.55419921875, 21.347412109375, 22.140625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 34.0, 73.0, 182.0, 251.0, 216.0, 114.0, 50.0, 21.0, 12.0, 12.0, 8.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-174.75625610351562, -165.95217895507812, -157.14808654785156, -148.343994140625, -139.5399169921875, -130.73583984375, -121.93174743652344, -113.1276626586914, -104.32357788085938, -95.51949310302734, -86.71540832519531, -77.91132354736328, -69.10723876953125, -60.30315399169922, -51.49906921386719, -42.694984436035156, -33.890899658203125, -25.086814880371094, -16.282730102539062, -7.478645324707031, 1.325439453125, 10.129524230957031, 18.933609008789062, 27.737693786621094, 36.541778564453125, 45.345863342285156, 54.14994812011719, 62.95403289794922, 71.75811767578125, 80.56220245361328, 89.36628723144531, 98.17037200927734, 106.97442626953125, 115.77851104736328, 124.58259582519531, 133.38668823242188, 142.19076538085938, 150.99484252929688, 159.79893493652344, 168.60302734375, 177.4071044921875, 186.211181640625, 195.01527404785156, 203.81936645507812, 212.62344360351562, 221.42752075195312, 230.2316131591797, 239.03570556640625, 247.83978271484375, 256.64385986328125, 265.44793701171875, 274.2520446777344, 283.0561218261719, 291.8601989746094, 300.664306640625, 309.4683837890625, 318.2724609375, 327.0765380859375, 335.880615234375, 344.6847229003906, 353.4888000488281, 362.2928771972656, 371.09698486328125, 379.90106201171875, 388.70513916015625]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 6.0, 3.0, 2.0, 11.0, 4.0, 12.0, 11.0, 7.0, 17.0, 17.0, 21.0, 30.0, 24.0, 32.0, 34.0, 29.0, 40.0, 38.0, 43.0, 39.0, 53.0, 44.0, 50.0, 43.0, 33.0, 47.0, 50.0, 39.0, 36.0, 28.0, 28.0, 25.0, 13.0, 18.0, 13.0, 13.0, 8.0, 7.0, 13.0, 11.0, 1.0, 3.0, 6.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-188.64398193359375, -183.0454559326172, -177.44692993164062, -171.84840393066406, -166.2498779296875, -160.65135192871094, -155.05282592773438, -149.45431518554688, -143.85577392578125, -138.2572479248047, -132.65872192382812, -127.06019592285156, -121.461669921875, -115.86314392089844, -110.2646255493164, -104.66609954833984, -99.06758117675781, -93.46905517578125, -87.87052917480469, -82.27200317382812, -76.67347717285156, -71.074951171875, -65.47643280029297, -59.877906799316406, -54.279380798339844, -48.68085479736328, -43.08232879638672, -37.48380661010742, -31.88528060913086, -26.286754608154297, -20.688232421875, -15.089706420898438, -9.491165161132812, -3.8926401138305664, 1.7058849334716797, 7.304409027099609, 12.902935028076172, 18.501461029052734, 24.09998321533203, 29.698509216308594, 35.297035217285156, 40.89556121826172, 46.49408721923828, 52.09260940551758, 57.69113540649414, 63.2896614074707, 68.88818359375, 74.48670959472656, 80.08523559570312, 85.68376159667969, 91.28228759765625, 96.88081359863281, 102.47933959960938, 108.07786560058594, 113.67638397216797, 119.27490997314453, 124.8734359741211, 130.47195434570312, 136.0704803466797, 141.66900634765625, 147.2675323486328, 152.86605834960938, 158.46458435058594, 164.0631103515625, 169.66163635253906]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 11.0, 4.0, 7.0, 14.0, 20.0, 15.0, 29.0, 31.0, 46.0, 82.0, 76.0, 119.0, 178.0, 255.0, 355.0, 510.0, 748.0, 1204.0, 1816.0, 2633.0, 3966.0, 6172.0, 1006232.0, 8309.0, 5166.0, 3501.0, 2324.0, 1535.0, 980.0, 702.0, 448.0, 320.0, 216.0, 168.0, 102.0, 82.0, 48.0, 43.0, 33.0, 20.0, 15.0, 10.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.26542091369629, -25.465192794799805, -24.66496467590332, -23.864736557006836, -23.06450843811035, -22.264280319213867, -21.464054107666016, -20.66382598876953, -19.863597869873047, -19.063369750976562, -18.263141632080078, -17.462913513183594, -16.66268539428711, -15.862457275390625, -15.062230110168457, -14.262001991271973, -13.461772918701172, -12.661544799804688, -11.861316680908203, -11.061088562011719, -10.260860443115234, -9.46063232421875, -8.660405158996582, -7.860177040100098, -7.059948921203613, -6.259720802307129, -5.4594926834106445, -4.659265041351318, -3.859036922454834, -3.0588088035583496, -2.2585811614990234, -1.458353042602539, -0.6581249237060547, 0.14210307598114014, 0.942331075668335, 1.7425589561462402, 2.5427870750427246, 3.343015193939209, 4.143242835998535, 4.9434709548950195, 5.743699073791504, 6.543927192687988, 7.344155311584473, 8.14438247680664, 8.944610595703125, 9.74483871459961, 10.545066833496094, 11.345294952392578, 12.145523071289062, 12.945751190185547, 13.745979309082031, 14.546207427978516, 15.346435546875, 16.146663665771484, 16.94689178466797, 17.747119903564453, 18.547348022460938, 19.347576141357422, 20.147804260253906, 20.94803237915039, 21.748260498046875, 22.54848861694336, 23.348716735839844, 24.148944854736328, 24.94917106628418]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 3.0, 5.0, 3.0, 6.0, 15.0, 13.0, 23.0, 20.0, 62.0, 149.0, 7628.0, 51454360.0, 669.0, 97.0, 34.0, 17.0, 13.0, 8.0, 9.0, 5.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-926.5679931640625, -883.014892578125, -839.4617919921875, -795.9086303710938, -752.3555297851562, -708.8024291992188, -665.249267578125, -621.6961669921875, -578.14306640625, -534.5899658203125, -491.0368347167969, -447.48370361328125, -403.93060302734375, -360.37750244140625, -316.8243713378906, -273.271240234375, -229.7181396484375, -186.16502380371094, -142.61190795898438, -99.05879211425781, -55.50567626953125, -11.952560424804688, 31.600555419921875, 75.1536865234375, 118.706787109375, 162.25990295410156, 205.81301879882812, 249.3661346435547, 292.91925048828125, 336.47235107421875, 380.0254821777344, 423.57861328125, 467.1317138671875, 510.684814453125, 554.2379150390625, 597.7910766601562, 641.3441772460938, 684.8972778320312, 728.450439453125, 772.0035400390625, 815.556640625, 859.1097412109375, 902.662841796875, 946.2160034179688, 989.7691040039062, 1033.322265625, 1076.8753662109375, 1120.428466796875, 1163.9815673828125, 1207.53466796875, 1251.0877685546875, 1294.640869140625, 1338.194091796875, 1381.7471923828125, 1425.30029296875, 1468.8533935546875, 1512.406494140625, 1555.9595947265625, 1599.5126953125, 1643.0657958984375, 1686.618896484375, 1730.172119140625, 1773.7252197265625, 1817.2783203125, 1860.8314208984375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 2.0, 5.0, 6.0, 7.0, 7.0, 9.0, 14.0, 21.0, 32.0, 32.0, 43.0, 80.0, 133.0, 159.0, 130.0, 88.0, 79.0, 49.0, 27.0, 25.0, 14.0, 8.0, 7.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.30743408203125, -186.0612030029297, -179.81497192382812, -173.56875610351562, -167.32252502441406, -161.0762939453125, -154.830078125, -148.58384704589844, -142.33761596679688, -136.0913848876953, -129.84515380859375, -123.59893798828125, -117.35270690917969, -111.10647583007812, -104.8602523803711, -98.61402893066406, -92.3677978515625, -86.12156677246094, -79.8753433227539, -73.62911987304688, -67.38288879394531, -61.136661529541016, -54.89043426513672, -48.64420700073242, -42.397979736328125, -36.15175247192383, -29.90552520751953, -23.659297943115234, -17.413070678710938, -11.16684341430664, -4.920616149902344, 1.3256111145019531, 7.5718231201171875, 13.818050384521484, 20.06427764892578, 26.310504913330078, 32.556732177734375, 38.80295944213867, 45.04918670654297, 51.295413970947266, 57.54164123535156, 63.78786849975586, 70.03409576416016, 76.28031921386719, 82.52655029296875, 88.77278137207031, 95.01900482177734, 101.26522827148438, 107.51145935058594, 113.7576904296875, 120.00391387939453, 126.25013732910156, 132.49636840820312, 138.7425994873047, 144.98883056640625, 151.23504638671875, 157.4812774658203, 163.72750854492188, 169.97372436523438, 176.21995544433594, 182.4661865234375, 188.71241760253906, 194.95864868164062, 201.20486450195312, 207.4510955810547]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 7.0, 6.0, 9.0, 13.0, 17.0, 25.0, 15.0, 30.0, 42.0, 44.0, 73.0, 62.0, 59.0, 78.0, 75.0, 63.0, 63.0, 56.0, 40.0, 52.0, 33.0, 30.0, 17.0, 27.0, 18.0, 10.0, 8.0, 10.0, 4.0, 5.0, 4.0, 0.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-213.3799285888672, -207.8774871826172, -202.3750457763672, -196.87258911132812, -191.37014770507812, -185.86770629882812, -180.36526489257812, -174.86282348632812, -169.36038208007812, -163.85794067382812, -158.35549926757812, -152.85305786132812, -147.35060119628906, -141.84815979003906, -136.34571838378906, -130.84327697753906, -125.3408203125, -119.83837890625, -114.33592987060547, -108.83348846435547, -103.33103942871094, -97.82859802246094, -92.32615661621094, -86.82371520996094, -81.3212661743164, -75.8188247680664, -70.31637573242188, -64.81393432617188, -59.31148910522461, -53.809043884277344, -48.306602478027344, -42.80415725708008, -37.30171203613281, -31.799266815185547, -26.296823501586914, -20.79438018798828, -15.291934967041016, -9.78948974609375, -4.28704833984375, 1.2153968811035156, 6.717842102050781, 12.22028636932373, 17.72273063659668, 23.225173950195312, 28.727619171142578, 34.230064392089844, 39.732505798339844, 45.23495101928711, 50.737396240234375, 56.23984146118164, 61.742286682128906, 67.2447280883789, 72.74717712402344, 78.24961853027344, 83.75205993652344, 89.25450134277344, 94.75695037841797, 100.25939178466797, 105.7618408203125, 111.2642822265625, 116.7667236328125, 122.26917266845703, 127.77161407470703, 133.27406311035156, 138.77650451660156]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 6.0, 9.0, 9.0, 14.0, 22.0, 25.0, 41.0, 66.0, 87.0, 127.0, 195.0, 301.0, 463.0, 701.0, 1176.0, 1924.0, 3300.0, 5980.0, 11477.0, 25959.0, 81600.0, 3169954.0, 792002.0, 61843.0, 18838.0, 8139.0, 4190.0, 2293.0, 1330.0, 824.0, 489.0, 319.0, 197.0, 138.0, 103.0, 47.0, 31.0, 21.0, 13.0, 12.0, 10.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.125, -8.870849609375, -8.61669921875, -8.362548828125, -8.1083984375, -7.854248046875, -7.60009765625, -7.345947265625, -7.091796875, -6.837646484375, -6.58349609375, -6.329345703125, -6.0751953125, -5.821044921875, -5.56689453125, -5.312744140625, -5.05859375, -4.804443359375, -4.55029296875, -4.296142578125, -4.0419921875, -3.787841796875, -3.53369140625, -3.279541015625, -3.025390625, -2.771240234375, -2.51708984375, -2.262939453125, -2.0087890625, -1.754638671875, -1.50048828125, -1.246337890625, -0.9921875, -0.738037109375, -0.48388671875, -0.229736328125, 0.0244140625, 0.278564453125, 0.53271484375, 0.786865234375, 1.041015625, 1.295166015625, 1.54931640625, 1.803466796875, 2.0576171875, 2.311767578125, 2.56591796875, 2.820068359375, 3.07421875, 3.328369140625, 3.58251953125, 3.836669921875, 4.0908203125, 4.344970703125, 4.59912109375, 4.853271484375, 5.107421875, 5.361572265625, 5.61572265625, 5.869873046875, 6.1240234375, 6.378173828125, 6.63232421875, 6.886474609375, 7.140625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 2.0, 4.0, 6.0, 2.0, 6.0, 5.0, 11.0, 7.0, 9.0, 12.0, 21.0, 36.0, 54.0, 101.0, 169.0, 176.0, 142.0, 90.0, 55.0, 28.0, 16.0, 6.0, 9.0, 3.0, 3.0, 4.0, 4.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.1396484375, -1.1080322265625, -1.076416015625, -1.0447998046875, -1.01318359375, -0.9815673828125, -0.949951171875, -0.9183349609375, -0.88671875, -0.8551025390625, -0.823486328125, -0.7918701171875, -0.76025390625, -0.7286376953125, -0.697021484375, -0.6654052734375, -0.6337890625, -0.6021728515625, -0.570556640625, -0.5389404296875, -0.50732421875, -0.4757080078125, -0.444091796875, -0.4124755859375, -0.380859375, -0.3492431640625, -0.317626953125, -0.2860107421875, -0.25439453125, -0.2227783203125, -0.191162109375, -0.1595458984375, -0.1279296875, -0.0963134765625, -0.064697265625, -0.0330810546875, -0.00146484375, 0.0301513671875, 0.061767578125, 0.0933837890625, 0.125, 0.1566162109375, 0.188232421875, 0.2198486328125, 0.25146484375, 0.2830810546875, 0.314697265625, 0.3463134765625, 0.3779296875, 0.4095458984375, 0.441162109375, 0.4727783203125, 0.50439453125, 0.5360107421875, 0.567626953125, 0.5992431640625, 0.630859375, 0.6624755859375, 0.694091796875, 0.7257080078125, 0.75732421875, 0.7889404296875, 0.820556640625, 0.8521728515625, 0.8837890625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 5.0, 3.0, 3.0, 4.0, 5.0, 10.0, 13.0, 18.0, 16.0, 31.0, 46.0, 57.0, 95.0, 153.0, 205.0, 337.0, 529.0, 904.0, 1677.0, 3070.0, 6355.0, 14575.0, 40161.0, 151783.0, 1230401.0, 2464175.0, 196737.0, 49177.0, 17375.0, 7490.0, 3723.0, 1924.0, 1126.0, 665.0, 460.0, 275.0, 188.0, 120.0, 114.0, 72.0, 52.0, 40.0, 37.0, 27.0, 16.0, 12.0, 5.0, 10.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.171875, -4.97357177734375, -4.7752685546875, -4.57696533203125, -4.378662109375, -4.18035888671875, -3.9820556640625, -3.78375244140625, -3.58544921875, -3.38714599609375, -3.1888427734375, -2.99053955078125, -2.792236328125, -2.59393310546875, -2.3956298828125, -2.19732666015625, -1.9990234375, -1.80072021484375, -1.6024169921875, -1.40411376953125, -1.205810546875, -1.00750732421875, -0.8092041015625, -0.61090087890625, -0.41259765625, -0.21429443359375, -0.0159912109375, 0.18231201171875, 0.380615234375, 0.57891845703125, 0.7772216796875, 0.97552490234375, 1.173828125, 1.37213134765625, 1.5704345703125, 1.76873779296875, 1.967041015625, 2.16534423828125, 2.3636474609375, 2.56195068359375, 2.76025390625, 2.95855712890625, 3.1568603515625, 3.35516357421875, 3.553466796875, 3.75177001953125, 3.9500732421875, 4.14837646484375, 4.3466796875, 4.54498291015625, 4.7432861328125, 4.94158935546875, 5.139892578125, 5.33819580078125, 5.5364990234375, 5.73480224609375, 5.93310546875, 6.13140869140625, 6.3297119140625, 6.52801513671875, 6.726318359375, 6.92462158203125, 7.1229248046875, 7.32122802734375, 7.51953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 6.0, 14.0, 18.0, 23.0, 28.0, 51.0, 65.0, 105.0, 147.0, 234.0, 358.0, 944.0, 961.0, 385.0, 229.0, 135.0, 106.0, 65.0, 64.0, 35.0, 24.0, 12.0, 17.0, 14.0, 8.0, 9.0, 5.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4091796875, -1.3549957275390625, -1.300811767578125, -1.2466278076171875, -1.19244384765625, -1.1382598876953125, -1.084075927734375, -1.0298919677734375, -0.9757080078125, -0.9215240478515625, -0.867340087890625, -0.8131561279296875, -0.75897216796875, -0.7047882080078125, -0.650604248046875, -0.5964202880859375, -0.542236328125, -0.4880523681640625, -0.433868408203125, -0.3796844482421875, -0.32550048828125, -0.2713165283203125, -0.217132568359375, -0.1629486083984375, -0.1087646484375, -0.0545806884765625, -0.000396728515625, 0.0537872314453125, 0.10797119140625, 0.1621551513671875, 0.216339111328125, 0.2705230712890625, 0.32470703125, 0.3788909912109375, 0.433074951171875, 0.4872589111328125, 0.54144287109375, 0.5956268310546875, 0.649810791015625, 0.7039947509765625, 0.7581787109375, 0.8123626708984375, 0.866546630859375, 0.9207305908203125, 0.97491455078125, 1.0290985107421875, 1.083282470703125, 1.1374664306640625, 1.191650390625, 1.2458343505859375, 1.300018310546875, 1.3542022705078125, 1.40838623046875, 1.4625701904296875, 1.516754150390625, 1.5709381103515625, 1.6251220703125, 1.6793060302734375, 1.733489990234375, 1.7876739501953125, 1.84185791015625, 1.8960418701171875, 1.950225830078125, 2.0044097900390625, 2.05859375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 17.0, 35.0, 73.0, 162.0, 258.0, 214.0, 120.0, 46.0, 27.0, 13.0, 11.0, 7.0, 7.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.495975494384766, -35.5299186706543, -34.56386184692383, -33.597801208496094, -32.631744384765625, -31.665687561035156, -30.699630737304688, -29.73357391357422, -28.76751708984375, -27.80146026611328, -26.83540153503418, -25.86934471130371, -24.903287887573242, -23.93722915649414, -22.971172332763672, -22.005115509033203, -21.0390567779541, -20.072999954223633, -19.10694122314453, -18.140884399414062, -17.174827575683594, -16.208770751953125, -15.242712020874023, -14.276655197143555, -13.31059741973877, -12.344539642333984, -11.378482818603516, -10.41242504119873, -9.446367263793945, -8.480310440063477, -7.514252662658691, -6.5481953620910645, -5.58213996887207, -4.616082668304443, -3.6500251293182373, -2.6839675903320312, -1.7179102897644043, -0.7518529891967773, 0.2142047882080078, 1.1802620887756348, 2.1463193893432617, 3.1123766899108887, 4.078433990478516, 5.044491767883301, 6.010549068450928, 6.976606369018555, 7.94266414642334, 8.908721923828125, 9.874778747558594, 10.840836524963379, 11.806893348693848, 12.772951126098633, 13.739007949829102, 14.705065727233887, 15.671123504638672, 16.63718032836914, 17.60323715209961, 18.569293975830078, 19.53535270690918, 20.50140953063965, 21.467466354370117, 22.43352508544922, 23.399581909179688, 24.365638732910156, 25.331697463989258]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 11.0, 10.0, 14.0, 16.0, 17.0, 17.0, 32.0, 40.0, 53.0, 47.0, 63.0, 63.0, 79.0, 59.0, 71.0, 59.0, 52.0, 55.0, 45.0, 48.0, 41.0, 25.0, 19.0, 11.0, 6.0, 20.0, 7.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.673098087310791, -7.379970073699951, -7.0868425369262695, -6.79371452331543, -6.50058650970459, -6.207458972930908, -5.914330959320068, -5.621203422546387, -5.328075408935547, -5.034947395324707, -4.741819858551025, -4.4486918449401855, -4.155564308166504, -3.862436294555664, -3.569308280944824, -3.2761805057525635, -2.9830527305603027, -2.689924955368042, -2.3967971801757812, -2.1036691665649414, -1.8105413913726807, -1.51741361618042, -1.2242857217788696, -0.9311578273773193, -0.6380300521850586, -0.3449022173881531, -0.05177438259124756, 0.24135345220565796, 0.5344812870025635, 0.8276090621948242, 1.1207369565963745, 1.4138648509979248, 1.7069921493530273, 2.000119924545288, 2.293247699737549, 2.5863757133483887, 2.8795034885406494, 3.17263126373291, 3.46575927734375, 3.7588870525360107, 4.0520148277282715, 4.345142841339111, 4.638270378112793, 4.931398391723633, 5.224526405334473, 5.517653942108154, 5.810781955718994, 6.103909492492676, 6.397037506103516, 6.6901655197143555, 6.983293056488037, 7.276421070098877, 7.569548606872559, 7.862676620483398, 8.155804634094238, 8.448932647705078, 8.742059707641602, 9.035187721252441, 9.328315734863281, 9.621442794799805, 9.914570808410645, 10.207698822021484, 10.500826835632324, 10.793954849243164, 11.087082862854004]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 4.0, 14.0, 7.0, 15.0, 17.0, 32.0, 34.0, 45.0, 70.0, 108.0, 184.0, 244.0, 390.0, 633.0, 931.0, 1470.0, 2362.0, 3990.0, 6574.0, 10693.0, 20003.0, 45725.0, 154756.0, 442291.0, 236558.0, 63845.0, 24869.0, 13044.0, 7420.0, 4630.0, 2746.0, 1745.0, 1094.0, 692.0, 458.0, 287.0, 198.0, 126.0, 97.0, 49.0, 35.0, 23.0, 13.0, 14.0, 8.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 5.0, 0.0, 2.0], "bins": [-4.48828125, -4.35491943359375, -4.2215576171875, -4.08819580078125, -3.954833984375, -3.82147216796875, -3.6881103515625, -3.55474853515625, -3.42138671875, -3.28802490234375, -3.1546630859375, -3.02130126953125, -2.887939453125, -2.75457763671875, -2.6212158203125, -2.48785400390625, -2.3544921875, -2.22113037109375, -2.0877685546875, -1.95440673828125, -1.821044921875, -1.68768310546875, -1.5543212890625, -1.42095947265625, -1.28759765625, -1.15423583984375, -1.0208740234375, -0.88751220703125, -0.754150390625, -0.62078857421875, -0.4874267578125, -0.35406494140625, -0.220703125, -0.08734130859375, 0.0460205078125, 0.17938232421875, 0.312744140625, 0.44610595703125, 0.5794677734375, 0.71282958984375, 0.84619140625, 0.97955322265625, 1.1129150390625, 1.24627685546875, 1.379638671875, 1.51300048828125, 1.6463623046875, 1.77972412109375, 1.9130859375, 2.04644775390625, 2.1798095703125, 2.31317138671875, 2.446533203125, 2.57989501953125, 2.7132568359375, 2.84661865234375, 2.97998046875, 3.11334228515625, 3.2467041015625, 3.38006591796875, 3.513427734375, 3.64678955078125, 3.7801513671875, 3.91351318359375, 4.046875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 13.0, 13.0, 19.0, 23.0, 30.0, 58.0, 101.0, 150.0, 165.0, 147.0, 85.0, 59.0, 37.0, 14.0, 16.0, 8.0, 7.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.173828125, -1.1413192749023438, -1.1088104248046875, -1.0763015747070312, -1.043792724609375, -1.0112838745117188, -0.9787750244140625, -0.9462661743164062, -0.91375732421875, -0.8812484741210938, -0.8487396240234375, -0.8162307739257812, -0.783721923828125, -0.7512130737304688, -0.7187042236328125, -0.6861953735351562, -0.6536865234375, -0.6211776733398438, -0.5886688232421875, -0.5561599731445312, -0.523651123046875, -0.49114227294921875, -0.4586334228515625, -0.42612457275390625, -0.39361572265625, -0.36110687255859375, -0.3285980224609375, -0.29608917236328125, -0.263580322265625, -0.23107147216796875, -0.1985626220703125, -0.16605377197265625, -0.133544921875, -0.10103607177734375, -0.0685272216796875, -0.03601837158203125, -0.003509521484375, 0.02899932861328125, 0.0615081787109375, 0.09401702880859375, 0.12652587890625, 0.15903472900390625, 0.1915435791015625, 0.22405242919921875, 0.256561279296875, 0.28907012939453125, 0.3215789794921875, 0.35408782958984375, 0.3865966796875, 0.41910552978515625, 0.4516143798828125, 0.48412322998046875, 0.516632080078125, 0.5491409301757812, 0.5816497802734375, 0.6141586303710938, 0.64666748046875, 0.6791763305664062, 0.7116851806640625, 0.7441940307617188, 0.776702880859375, 0.8092117309570312, 0.8417205810546875, 0.8742294311523438, 0.90673828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 9.0, 7.0, 20.0, 21.0, 30.0, 47.0, 66.0, 96.0, 122.0, 205.0, 301.0, 424.0, 616.0, 946.0, 1430.0, 2408.0, 3749.0, 6269.0, 11044.0, 20576.0, 39949.0, 81377.0, 162527.0, 262792.0, 216999.0, 115320.0, 56280.0, 28464.0, 14934.0, 8290.0, 4812.0, 2996.0, 1839.0, 1157.0, 798.0, 498.0, 364.0, 261.0, 165.0, 110.0, 85.0, 42.0, 41.0, 22.0, 14.0, 8.0, 8.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 6.0, 1.0], "bins": [-2.99609375, -2.90460205078125, -2.8131103515625, -2.72161865234375, -2.630126953125, -2.53863525390625, -2.4471435546875, -2.35565185546875, -2.26416015625, -2.17266845703125, -2.0811767578125, -1.98968505859375, -1.898193359375, -1.80670166015625, -1.7152099609375, -1.62371826171875, -1.5322265625, -1.44073486328125, -1.3492431640625, -1.25775146484375, -1.166259765625, -1.07476806640625, -0.9832763671875, -0.89178466796875, -0.80029296875, -0.70880126953125, -0.6173095703125, -0.52581787109375, -0.434326171875, -0.34283447265625, -0.2513427734375, -0.15985107421875, -0.068359375, 0.02313232421875, 0.1146240234375, 0.20611572265625, 0.297607421875, 0.38909912109375, 0.4805908203125, 0.57208251953125, 0.66357421875, 0.75506591796875, 0.8465576171875, 0.93804931640625, 1.029541015625, 1.12103271484375, 1.2125244140625, 1.30401611328125, 1.3955078125, 1.48699951171875, 1.5784912109375, 1.66998291015625, 1.761474609375, 1.85296630859375, 1.9444580078125, 2.03594970703125, 2.12744140625, 2.21893310546875, 2.3104248046875, 2.40191650390625, 2.493408203125, 2.58489990234375, 2.6763916015625, 2.76788330078125, 2.859375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 7.0, 8.0, 13.0, 14.0, 12.0, 8.0, 14.0, 12.0, 15.0, 21.0, 26.0, 25.0, 30.0, 25.0, 40.0, 29.0, 32.0, 41.0, 48.0, 34.0, 36.0, 39.0, 46.0, 31.0, 24.0, 45.0, 37.0, 35.0, 24.0, 27.0, 23.0, 19.0, 20.0, 20.0, 20.0, 16.0, 15.0, 13.0, 8.0, 8.0, 11.0, 5.0, 8.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.013671875, -2.914520263671875, -2.81536865234375, -2.716217041015625, -2.6170654296875, -2.517913818359375, -2.41876220703125, -2.319610595703125, -2.220458984375, -2.121307373046875, -2.02215576171875, -1.923004150390625, -1.8238525390625, -1.724700927734375, -1.62554931640625, -1.526397705078125, -1.42724609375, -1.328094482421875, -1.22894287109375, -1.129791259765625, -1.0306396484375, -0.931488037109375, -0.83233642578125, -0.733184814453125, -0.634033203125, -0.534881591796875, -0.43572998046875, -0.336578369140625, -0.2374267578125, -0.138275146484375, -0.03912353515625, 0.060028076171875, 0.1591796875, 0.258331298828125, 0.35748291015625, 0.456634521484375, 0.5557861328125, 0.654937744140625, 0.75408935546875, 0.853240966796875, 0.952392578125, 1.051544189453125, 1.15069580078125, 1.249847412109375, 1.3489990234375, 1.448150634765625, 1.54730224609375, 1.646453857421875, 1.74560546875, 1.844757080078125, 1.94390869140625, 2.043060302734375, 2.1422119140625, 2.241363525390625, 2.34051513671875, 2.439666748046875, 2.538818359375, 2.637969970703125, 2.73712158203125, 2.836273193359375, 2.9354248046875, 3.034576416015625, 3.13372802734375, 3.232879638671875, 3.33203125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 10.0, 9.0, 6.0, 15.0, 26.0, 43.0, 64.0, 99.0, 161.0, 324.0, 609.0, 1199.0, 2693.0, 7313.0, 28740.0, 327453.0, 621690.0, 42217.0, 9642.0, 3338.0, 1356.0, 645.0, 351.0, 200.0, 137.0, 80.0, 36.0, 23.0, 20.0, 13.0, 6.0, 9.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.734375, -20.06787109375, -19.4013671875, -18.73486328125, -18.068359375, -17.40185546875, -16.7353515625, -16.06884765625, -15.40234375, -14.73583984375, -14.0693359375, -13.40283203125, -12.736328125, -12.06982421875, -11.4033203125, -10.73681640625, -10.0703125, -9.40380859375, -8.7373046875, -8.07080078125, -7.404296875, -6.73779296875, -6.0712890625, -5.40478515625, -4.73828125, -4.07177734375, -3.4052734375, -2.73876953125, -2.072265625, -1.40576171875, -0.7392578125, -0.07275390625, 0.59375, 1.26025390625, 1.9267578125, 2.59326171875, 3.259765625, 3.92626953125, 4.5927734375, 5.25927734375, 5.92578125, 6.59228515625, 7.2587890625, 7.92529296875, 8.591796875, 9.25830078125, 9.9248046875, 10.59130859375, 11.2578125, 11.92431640625, 12.5908203125, 13.25732421875, 13.923828125, 14.59033203125, 15.2568359375, 15.92333984375, 16.58984375, 17.25634765625, 17.9228515625, 18.58935546875, 19.255859375, 19.92236328125, 20.5888671875, 21.25537109375, 21.921875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 6.0, 4.0, 1.0, 10.0, 3.0, 14.0, 28.0, 35.0, 45.0, 55.0, 82.0, 128.0, 160.0, 113.0, 84.0, 64.0, 54.0, 40.0, 26.0, 15.0, 15.0, 9.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001918792724609375, -0.0018633753061294556, -0.0018079578876495361, -0.0017525404691696167, -0.0016971230506896973, -0.0016417056322097778, -0.0015862882137298584, -0.001530870795249939, -0.0014754533767700195, -0.0014200359582901, -0.0013646185398101807, -0.0013092011213302612, -0.0012537837028503418, -0.0011983662843704224, -0.001142948865890503, -0.0010875314474105835, -0.001032114028930664, -0.0009766966104507446, -0.0009212791919708252, -0.0008658617734909058, -0.0008104443550109863, -0.0007550269365310669, -0.0006996095180511475, -0.000644192099571228, -0.0005887746810913086, -0.0005333572626113892, -0.0004779398441314697, -0.0004225224256515503, -0.00036710500717163086, -0.0003116875886917114, -0.000256270170211792, -0.00020085275173187256, -0.00014543533325195312, -9.001791477203369e-05, -3.460049629211426e-05, 2.0816922187805176e-05, 7.623434066772461e-05, 0.00013165175914764404, 0.00018706917762756348, 0.0002424865961074829, 0.00029790401458740234, 0.0003533214330673218, 0.0004087388515472412, 0.00046415627002716064, 0.0005195736885070801, 0.0005749911069869995, 0.0006304085254669189, 0.0006858259439468384, 0.0007412433624267578, 0.0007966607809066772, 0.0008520781993865967, 0.0009074956178665161, 0.0009629130363464355, 0.001018330454826355, 0.0010737478733062744, 0.0011291652917861938, 0.0011845827102661133, 0.0012400001287460327, 0.0012954175472259521, 0.0013508349657058716, 0.001406252384185791, 0.0014616698026657104, 0.0015170872211456299, 0.0015725046396255493, 0.0016279220581054688]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 8.0, 17.0, 20.0, 37.0, 43.0, 73.0, 103.0, 162.0, 230.0, 448.0, 666.0, 1374.0, 2659.0, 5656.0, 14044.0, 45551.0, 253835.0, 573483.0, 106757.0, 25572.0, 9220.0, 4156.0, 1920.0, 1027.0, 584.0, 325.0, 201.0, 130.0, 71.0, 48.0, 43.0, 26.0, 18.0, 10.0, 7.0, 3.0, 3.0, 4.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.4140625, -9.139404296875, -8.86474609375, -8.590087890625, -8.3154296875, -8.040771484375, -7.76611328125, -7.491455078125, -7.216796875, -6.942138671875, -6.66748046875, -6.392822265625, -6.1181640625, -5.843505859375, -5.56884765625, -5.294189453125, -5.01953125, -4.744873046875, -4.47021484375, -4.195556640625, -3.9208984375, -3.646240234375, -3.37158203125, -3.096923828125, -2.822265625, -2.547607421875, -2.27294921875, -1.998291015625, -1.7236328125, -1.448974609375, -1.17431640625, -0.899658203125, -0.625, -0.350341796875, -0.07568359375, 0.198974609375, 0.4736328125, 0.748291015625, 1.02294921875, 1.297607421875, 1.572265625, 1.846923828125, 2.12158203125, 2.396240234375, 2.6708984375, 2.945556640625, 3.22021484375, 3.494873046875, 3.76953125, 4.044189453125, 4.31884765625, 4.593505859375, 4.8681640625, 5.142822265625, 5.41748046875, 5.692138671875, 5.966796875, 6.241455078125, 6.51611328125, 6.790771484375, 7.0654296875, 7.340087890625, 7.61474609375, 7.889404296875, 8.1640625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 8.0, 10.0, 10.0, 19.0, 23.0, 32.0, 48.0, 55.0, 75.0, 87.0, 100.0, 115.0, 96.0, 87.0, 73.0, 48.0, 29.0, 22.0, 22.0, 9.0, 7.0, 7.0, 7.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09765625, -5.87347412109375, -5.6492919921875, -5.42510986328125, -5.200927734375, -4.97674560546875, -4.7525634765625, -4.52838134765625, -4.30419921875, -4.08001708984375, -3.8558349609375, -3.63165283203125, -3.407470703125, -3.18328857421875, -2.9591064453125, -2.73492431640625, -2.5107421875, -2.28656005859375, -2.0623779296875, -1.83819580078125, -1.614013671875, -1.38983154296875, -1.1656494140625, -0.94146728515625, -0.71728515625, -0.49310302734375, -0.2689208984375, -0.04473876953125, 0.179443359375, 0.40362548828125, 0.6278076171875, 0.85198974609375, 1.076171875, 1.30035400390625, 1.5245361328125, 1.74871826171875, 1.972900390625, 2.19708251953125, 2.4212646484375, 2.64544677734375, 2.86962890625, 3.09381103515625, 3.3179931640625, 3.54217529296875, 3.766357421875, 3.99053955078125, 4.2147216796875, 4.43890380859375, 4.6630859375, 4.88726806640625, 5.1114501953125, 5.33563232421875, 5.559814453125, 5.78399658203125, 6.0081787109375, 6.23236083984375, 6.45654296875, 6.68072509765625, 6.9049072265625, 7.12908935546875, 7.353271484375, 7.57745361328125, 7.8016357421875, 8.02581787109375, 8.25]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 9.0, 16.0, 20.0, 38.0, 84.0, 170.0, 218.0, 217.0, 111.0, 63.0, 24.0, 15.0, 7.0, 5.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.45306396484375, -166.38182067871094, -162.3105926513672, -158.23934936523438, -154.16812133789062, -150.0968780517578, -146.025634765625, -141.95440673828125, -137.88316345214844, -133.81192016601562, -129.74069213867188, -125.66944885253906, -121.59821319580078, -117.5269775390625, -113.45573425292969, -109.3844985961914, -105.31326293945312, -101.24202728271484, -97.17079162597656, -93.09954833984375, -89.02831268310547, -84.95707702636719, -80.88583374023438, -76.8145980834961, -72.74336242675781, -68.67212677001953, -64.60089111328125, -60.52964782714844, -56.458412170410156, -52.387176513671875, -48.31593704223633, -44.24469757080078, -40.17345428466797, -36.10221862792969, -32.03097915649414, -27.959741592407227, -23.888504028320312, -19.8172664642334, -15.746028900146484, -11.67479133605957, -7.603553771972656, -3.532316207885742, 0.5389213562011719, 4.610158920288086, 8.681396484375, 12.752634048461914, 16.823871612548828, 20.895109176635742, 24.966346740722656, 29.03758430480957, 33.108821868896484, 37.18006134033203, 41.25129699707031, 45.322532653808594, 49.39377212524414, 53.46501159667969, 57.53624725341797, 61.60748291015625, 65.67872619628906, 69.74996185302734, 73.82119750976562, 77.8924331665039, 81.96366882324219, 86.034912109375, 90.10614776611328]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 3.0, 11.0, 7.0, 6.0, 7.0, 11.0, 28.0, 52.0, 65.0, 97.0, 117.0, 165.0, 107.0, 99.0, 73.0, 39.0, 22.0, 14.0, 9.0, 9.0, 6.0, 7.0, 6.0, 6.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.25209045410156, -62.070133209228516, -59.88817596435547, -57.70621871948242, -55.524261474609375, -53.34230041503906, -51.160343170166016, -48.97838592529297, -46.79642868041992, -44.614471435546875, -42.43251419067383, -40.25055694580078, -38.06859588623047, -35.88664245605469, -33.704681396484375, -31.522724151611328, -29.34076690673828, -27.158809661865234, -24.976852416992188, -22.794893264770508, -20.61293601989746, -18.430978775024414, -16.249019622802734, -14.067062377929688, -11.88510513305664, -9.703147888183594, -7.5211896896362305, -5.339231967926025, -3.1572742462158203, -0.9753170013427734, 1.2066411972045898, 3.388599395751953, 5.570556640625, 7.752514362335205, 9.93447208404541, 12.116430282592773, 14.29838752746582, 16.480344772338867, 18.662303924560547, 20.844261169433594, 23.02621841430664, 25.208175659179688, 27.390132904052734, 29.572092056274414, 31.75404930114746, 33.936004638671875, 36.11796569824219, 38.299922943115234, 40.48188018798828, 42.66383743286133, 44.845794677734375, 47.02775192260742, 49.20970916748047, 51.39167022705078, 53.57362747192383, 55.755584716796875, 57.93754196166992, 60.11949920654297, 62.301456451416016, 64.48341369628906, 66.66537475585938, 68.84732818603516, 71.02928924560547, 73.21124267578125, 75.39320373535156]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 4.0, 10.0, 10.0, 7.0, 16.0, 22.0, 28.0, 36.0, 65.0, 73.0, 113.0, 226.0, 350.0, 557.0, 1037.0, 1839.0, 3827.0, 9098.0, 28327.0, 177571.0, 3737603.0, 187437.0, 29096.0, 8955.0, 3744.0, 1796.0, 942.0, 540.0, 336.0, 221.0, 102.0, 89.0, 61.0, 32.0, 22.0, 23.0, 12.0, 10.0, 8.0, 3.0, 5.0, 6.0, 3.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.3984375, -12.0284423828125, -11.658447265625, -11.2884521484375, -10.91845703125, -10.5484619140625, -10.178466796875, -9.8084716796875, -9.4384765625, -9.0684814453125, -8.698486328125, -8.3284912109375, -7.95849609375, -7.5885009765625, -7.218505859375, -6.8485107421875, -6.478515625, -6.1085205078125, -5.738525390625, -5.3685302734375, -4.99853515625, -4.6285400390625, -4.258544921875, -3.8885498046875, -3.5185546875, -3.1485595703125, -2.778564453125, -2.4085693359375, -2.03857421875, -1.6685791015625, -1.298583984375, -0.9285888671875, -0.55859375, -0.1885986328125, 0.181396484375, 0.5513916015625, 0.92138671875, 1.2913818359375, 1.661376953125, 2.0313720703125, 2.4013671875, 2.7713623046875, 3.141357421875, 3.5113525390625, 3.88134765625, 4.2513427734375, 4.621337890625, 4.9913330078125, 5.361328125, 5.7313232421875, 6.101318359375, 6.4713134765625, 6.84130859375, 7.2113037109375, 7.581298828125, 7.9512939453125, 8.3212890625, 8.6912841796875, 9.061279296875, 9.4312744140625, 9.80126953125, 10.1712646484375, 10.541259765625, 10.9112548828125, 11.28125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 9.0, 8.0, 19.0, 21.0, 33.0, 40.0, 60.0, 90.0, 131.0, 157.0, 119.0, 97.0, 70.0, 42.0, 33.0, 19.0, 7.0, 8.0, 4.0, 7.0, 1.0, 3.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0], "bins": [-1.3193359375, -1.287567138671875, -1.25579833984375, -1.224029541015625, -1.1922607421875, -1.160491943359375, -1.12872314453125, -1.096954345703125, -1.065185546875, -1.033416748046875, -1.00164794921875, -0.969879150390625, -0.9381103515625, -0.906341552734375, -0.87457275390625, -0.842803955078125, -0.81103515625, -0.779266357421875, -0.74749755859375, -0.715728759765625, -0.6839599609375, -0.652191162109375, -0.62042236328125, -0.588653564453125, -0.556884765625, -0.525115966796875, -0.49334716796875, -0.461578369140625, -0.4298095703125, -0.398040771484375, -0.36627197265625, -0.334503173828125, -0.302734375, -0.270965576171875, -0.23919677734375, -0.207427978515625, -0.1756591796875, -0.143890380859375, -0.11212158203125, -0.080352783203125, -0.048583984375, -0.016815185546875, 0.01495361328125, 0.046722412109375, 0.0784912109375, 0.110260009765625, 0.14202880859375, 0.173797607421875, 0.20556640625, 0.237335205078125, 0.26910400390625, 0.300872802734375, 0.3326416015625, 0.364410400390625, 0.39617919921875, 0.427947998046875, 0.459716796875, 0.491485595703125, 0.52325439453125, 0.555023193359375, 0.5867919921875, 0.618560791015625, 0.65032958984375, 0.682098388671875, 0.7138671875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 7.0, 8.0, 15.0, 24.0, 33.0, 42.0, 86.0, 146.0, 263.0, 469.0, 919.0, 1773.0, 3770.0, 8893.0, 23713.0, 77533.0, 362418.0, 3059849.0, 510645.0, 96867.0, 28191.0, 10428.0, 4273.0, 1922.0, 956.0, 452.0, 255.0, 141.0, 75.0, 49.0, 26.0, 19.0, 14.0, 6.0, 8.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.21484375, -6.95330810546875, -6.6917724609375, -6.43023681640625, -6.168701171875, -5.90716552734375, -5.6456298828125, -5.38409423828125, -5.12255859375, -4.86102294921875, -4.5994873046875, -4.33795166015625, -4.076416015625, -3.81488037109375, -3.5533447265625, -3.29180908203125, -3.0302734375, -2.76873779296875, -2.5072021484375, -2.24566650390625, -1.984130859375, -1.72259521484375, -1.4610595703125, -1.19952392578125, -0.93798828125, -0.67645263671875, -0.4149169921875, -0.15338134765625, 0.108154296875, 0.36968994140625, 0.6312255859375, 0.89276123046875, 1.154296875, 1.41583251953125, 1.6773681640625, 1.93890380859375, 2.200439453125, 2.46197509765625, 2.7235107421875, 2.98504638671875, 3.24658203125, 3.50811767578125, 3.7696533203125, 4.03118896484375, 4.292724609375, 4.55426025390625, 4.8157958984375, 5.07733154296875, 5.3388671875, 5.60040283203125, 5.8619384765625, 6.12347412109375, 6.385009765625, 6.64654541015625, 6.9080810546875, 7.16961669921875, 7.43115234375, 7.69268798828125, 7.9542236328125, 8.21575927734375, 8.477294921875, 8.73883056640625, 9.0003662109375, 9.26190185546875, 9.5234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 2.0, 8.0, 5.0, 23.0, 19.0, 31.0, 28.0, 44.0, 63.0, 98.0, 127.0, 189.0, 351.0, 798.0, 1247.0, 412.0, 193.0, 149.0, 89.0, 62.0, 36.0, 31.0, 27.0, 15.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4521484375, -1.4130096435546875, -1.373870849609375, -1.3347320556640625, -1.29559326171875, -1.2564544677734375, -1.217315673828125, -1.1781768798828125, -1.1390380859375, -1.0998992919921875, -1.060760498046875, -1.0216217041015625, -0.98248291015625, -0.9433441162109375, -0.904205322265625, -0.8650665283203125, -0.825927734375, -0.7867889404296875, -0.747650146484375, -0.7085113525390625, -0.66937255859375, -0.6302337646484375, -0.591094970703125, -0.5519561767578125, -0.5128173828125, -0.4736785888671875, -0.434539794921875, -0.3954010009765625, -0.35626220703125, -0.3171234130859375, -0.277984619140625, -0.2388458251953125, -0.19970703125, -0.1605682373046875, -0.121429443359375, -0.0822906494140625, -0.04315185546875, -0.0040130615234375, 0.035125732421875, 0.0742645263671875, 0.1134033203125, 0.1525421142578125, 0.191680908203125, 0.2308197021484375, 0.26995849609375, 0.3090972900390625, 0.348236083984375, 0.3873748779296875, 0.426513671875, 0.4656524658203125, 0.504791259765625, 0.5439300537109375, 0.58306884765625, 0.6222076416015625, 0.661346435546875, 0.7004852294921875, 0.7396240234375, 0.7787628173828125, 0.817901611328125, 0.8570404052734375, 0.89617919921875, 0.9353179931640625, 0.974456787109375, 1.0135955810546875, 1.052734375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 13.0, 13.0, 33.0, 77.0, 191.0, 257.0, 232.0, 121.0, 39.0, 14.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-30.0752010345459, -29.470487594604492, -28.865772247314453, -28.261058807373047, -27.65634536743164, -27.0516300201416, -26.446916580200195, -25.842201232910156, -25.23748779296875, -24.632774353027344, -24.028059005737305, -23.4233455657959, -22.81863021850586, -22.213916778564453, -21.609203338623047, -21.00448989868164, -20.3997745513916, -19.795061111450195, -19.190345764160156, -18.58563232421875, -17.980918884277344, -17.376203536987305, -16.7714900970459, -16.16677474975586, -15.562061309814453, -14.95734691619873, -14.352632522583008, -13.747919082641602, -13.143204689025879, -12.538490295410156, -11.93377685546875, -11.329062461853027, -10.724347114562988, -10.119632720947266, -9.51491928100586, -8.910204887390137, -8.305490493774414, -7.700776100158691, -7.096062183380127, -6.4913482666015625, -5.88663387298584, -5.281919479370117, -4.677205562591553, -4.072491645812988, -3.4677772521972656, -2.863063097000122, -2.2583489418029785, -1.653635025024414, -1.0489206314086914, -0.44420647621154785, 0.1605076789855957, 0.7652218341827393, 1.3699359893798828, 1.9746501445770264, 2.57936429977417, 3.1840782165527344, 3.788792610168457, 4.39350700378418, 4.998220920562744, 5.602934837341309, 6.207649230957031, 6.812363624572754, 7.417077541351318, 8.021791458129883, 8.626505851745605]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 10.0, 13.0, 20.0, 29.0, 39.0, 50.0, 47.0, 82.0, 79.0, 83.0, 86.0, 89.0, 79.0, 75.0, 58.0, 54.0, 35.0, 21.0, 21.0, 12.0, 6.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.822272777557373, -7.562080383300781, -7.301888465881348, -7.041696548461914, -6.781504154205322, -6.5213117599487305, -6.261119842529297, -6.000927925109863, -5.7407355308532715, -5.48054313659668, -5.220351219177246, -4.9601593017578125, -4.699966907501221, -4.439774513244629, -4.179582595825195, -3.9193904399871826, -3.65919828414917, -3.3990061283111572, -3.1388139724731445, -2.878621816635132, -2.618429660797119, -2.3582375049591064, -2.0980453491210938, -1.837853193283081, -1.5776610374450684, -1.3174688816070557, -1.057276725769043, -0.7970845699310303, -0.5368924140930176, -0.2767002582550049, -0.016508102416992188, 0.2436840534210205, 0.5038766860961914, 0.7640688419342041, 1.0242609977722168, 1.2844531536102295, 1.5446453094482422, 1.8048374652862549, 2.0650296211242676, 2.3252217769622803, 2.585413932800293, 2.8456060886383057, 3.1057982444763184, 3.365990400314331, 3.6261825561523438, 3.8863747119903564, 4.146566867828369, 4.406759262084961, 4.6669511795043945, 4.927143096923828, 5.18733549118042, 5.447527885437012, 5.707719802856445, 5.967911720275879, 6.228104114532471, 6.4882965087890625, 6.748488426208496, 7.00868034362793, 7.2688727378845215, 7.529065132141113, 7.789257049560547, 8.04944896697998, 8.309640884399414, 8.569833755493164, 8.830025672912598]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 8.0, 15.0, 16.0, 41.0, 48.0, 91.0, 124.0, 214.0, 456.0, 914.0, 2056.0, 5061.0, 13185.0, 43253.0, 198338.0, 521980.0, 197243.0, 43121.0, 13356.0, 5127.0, 2070.0, 834.0, 432.0, 230.0, 127.0, 68.0, 52.0, 18.0, 21.0, 10.0, 12.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7265625, -6.49853515625, -6.2705078125, -6.04248046875, -5.814453125, -5.58642578125, -5.3583984375, -5.13037109375, -4.90234375, -4.67431640625, -4.4462890625, -4.21826171875, -3.990234375, -3.76220703125, -3.5341796875, -3.30615234375, -3.078125, -2.85009765625, -2.6220703125, -2.39404296875, -2.166015625, -1.93798828125, -1.7099609375, -1.48193359375, -1.25390625, -1.02587890625, -0.7978515625, -0.56982421875, -0.341796875, -0.11376953125, 0.1142578125, 0.34228515625, 0.5703125, 0.79833984375, 1.0263671875, 1.25439453125, 1.482421875, 1.71044921875, 1.9384765625, 2.16650390625, 2.39453125, 2.62255859375, 2.8505859375, 3.07861328125, 3.306640625, 3.53466796875, 3.7626953125, 3.99072265625, 4.21875, 4.44677734375, 4.6748046875, 4.90283203125, 5.130859375, 5.35888671875, 5.5869140625, 5.81494140625, 6.04296875, 6.27099609375, 6.4990234375, 6.72705078125, 6.955078125, 7.18310546875, 7.4111328125, 7.63916015625, 7.8671875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 11.0, 9.0, 12.0, 19.0, 28.0, 58.0, 74.0, 129.0, 152.0, 148.0, 114.0, 97.0, 57.0, 37.0, 21.0, 6.0, 6.0, 4.0, 4.0, 4.0, 2.0, 7.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4453125, -1.4091720581054688, -1.3730316162109375, -1.3368911743164062, -1.300750732421875, -1.2646102905273438, -1.2284698486328125, -1.1923294067382812, -1.15618896484375, -1.1200485229492188, -1.0839080810546875, -1.0477676391601562, -1.011627197265625, -0.9754867553710938, -0.9393463134765625, -0.9032058715820312, -0.8670654296875, -0.8309249877929688, -0.7947845458984375, -0.7586441040039062, -0.722503662109375, -0.6863632202148438, -0.6502227783203125, -0.6140823364257812, -0.57794189453125, -0.5418014526367188, -0.5056610107421875, -0.46952056884765625, -0.433380126953125, -0.39723968505859375, -0.3610992431640625, -0.32495880126953125, -0.288818359375, -0.25267791748046875, -0.2165374755859375, -0.18039703369140625, -0.144256591796875, -0.10811614990234375, -0.0719757080078125, -0.03583526611328125, 0.00030517578125, 0.03644561767578125, 0.0725860595703125, 0.10872650146484375, 0.144866943359375, 0.18100738525390625, 0.2171478271484375, 0.25328826904296875, 0.2894287109375, 0.32556915283203125, 0.3617095947265625, 0.39785003662109375, 0.433990478515625, 0.47013092041015625, 0.5062713623046875, 0.5424118041992188, 0.57855224609375, 0.6146926879882812, 0.6508331298828125, 0.6869735717773438, 0.723114013671875, 0.7592544555664062, 0.7953948974609375, 0.8315353393554688, 0.86767578125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 6.0, 9.0, 10.0, 26.0, 24.0, 44.0, 79.0, 118.0, 230.0, 358.0, 629.0, 1168.0, 2160.0, 4293.0, 8829.0, 19937.0, 48213.0, 120627.0, 258592.0, 303497.0, 163155.0, 65673.0, 27216.0, 11879.0, 5680.0, 2714.0, 1429.0, 835.0, 437.0, 262.0, 162.0, 110.0, 47.0, 36.0, 23.0, 21.0, 12.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.8203125, -3.701568603515625, -3.58282470703125, -3.464080810546875, -3.3453369140625, -3.226593017578125, -3.10784912109375, -2.989105224609375, -2.870361328125, -2.751617431640625, -2.63287353515625, -2.514129638671875, -2.3953857421875, -2.276641845703125, -2.15789794921875, -2.039154052734375, -1.92041015625, -1.801666259765625, -1.68292236328125, -1.564178466796875, -1.4454345703125, -1.326690673828125, -1.20794677734375, -1.089202880859375, -0.970458984375, -0.851715087890625, -0.73297119140625, -0.614227294921875, -0.4954833984375, -0.376739501953125, -0.25799560546875, -0.139251708984375, -0.0205078125, 0.098236083984375, 0.21697998046875, 0.335723876953125, 0.4544677734375, 0.573211669921875, 0.69195556640625, 0.810699462890625, 0.929443359375, 1.048187255859375, 1.16693115234375, 1.285675048828125, 1.4044189453125, 1.523162841796875, 1.64190673828125, 1.760650634765625, 1.87939453125, 1.998138427734375, 2.11688232421875, 2.235626220703125, 2.3543701171875, 2.473114013671875, 2.59185791015625, 2.710601806640625, 2.829345703125, 2.948089599609375, 3.06683349609375, 3.185577392578125, 3.3043212890625, 3.423065185546875, 3.54180908203125, 3.660552978515625, 3.779296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 4.0, 4.0, 7.0, 14.0, 10.0, 20.0, 16.0, 23.0, 23.0, 25.0, 33.0, 25.0, 36.0, 44.0, 48.0, 51.0, 36.0, 41.0, 40.0, 47.0, 51.0, 49.0, 48.0, 55.0, 46.0, 28.0, 35.0, 22.0, 13.0, 25.0, 18.0, 16.0, 9.0, 4.0, 11.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.263671875, -3.171112060546875, -3.07855224609375, -2.985992431640625, -2.8934326171875, -2.800872802734375, -2.70831298828125, -2.615753173828125, -2.523193359375, -2.430633544921875, -2.33807373046875, -2.245513916015625, -2.1529541015625, -2.060394287109375, -1.96783447265625, -1.875274658203125, -1.78271484375, -1.690155029296875, -1.59759521484375, -1.505035400390625, -1.4124755859375, -1.319915771484375, -1.22735595703125, -1.134796142578125, -1.042236328125, -0.949676513671875, -0.85711669921875, -0.764556884765625, -0.6719970703125, -0.579437255859375, -0.48687744140625, -0.394317626953125, -0.3017578125, -0.209197998046875, -0.11663818359375, -0.024078369140625, 0.0684814453125, 0.161041259765625, 0.25360107421875, 0.346160888671875, 0.438720703125, 0.531280517578125, 0.62384033203125, 0.716400146484375, 0.8089599609375, 0.901519775390625, 0.99407958984375, 1.086639404296875, 1.17919921875, 1.271759033203125, 1.36431884765625, 1.456878662109375, 1.5494384765625, 1.641998291015625, 1.73455810546875, 1.827117919921875, 1.919677734375, 2.012237548828125, 2.10479736328125, 2.197357177734375, 2.2899169921875, 2.382476806640625, 2.47503662109375, 2.567596435546875, 2.66015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 5.0, 1.0, 3.0, 6.0, 3.0, 13.0, 28.0, 35.0, 49.0, 70.0, 127.0, 271.0, 504.0, 1128.0, 3108.0, 10627.0, 51590.0, 380583.0, 507342.0, 72816.0, 13812.0, 3859.0, 1364.0, 574.0, 264.0, 143.0, 96.0, 48.0, 34.0, 13.0, 21.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 5.0, 1.0, 2.0, 1.0], "bins": [-16.171875, -15.7783203125, -15.384765625, -14.9912109375, -14.59765625, -14.2041015625, -13.810546875, -13.4169921875, -13.0234375, -12.6298828125, -12.236328125, -11.8427734375, -11.44921875, -11.0556640625, -10.662109375, -10.2685546875, -9.875, -9.4814453125, -9.087890625, -8.6943359375, -8.30078125, -7.9072265625, -7.513671875, -7.1201171875, -6.7265625, -6.3330078125, -5.939453125, -5.5458984375, -5.15234375, -4.7587890625, -4.365234375, -3.9716796875, -3.578125, -3.1845703125, -2.791015625, -2.3974609375, -2.00390625, -1.6103515625, -1.216796875, -0.8232421875, -0.4296875, -0.0361328125, 0.357421875, 0.7509765625, 1.14453125, 1.5380859375, 1.931640625, 2.3251953125, 2.71875, 3.1123046875, 3.505859375, 3.8994140625, 4.29296875, 4.6865234375, 5.080078125, 5.4736328125, 5.8671875, 6.2607421875, 6.654296875, 7.0478515625, 7.44140625, 7.8349609375, 8.228515625, 8.6220703125, 9.015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 9.0, 10.0, 8.0, 22.0, 12.0, 30.0, 38.0, 42.0, 46.0, 54.0, 99.0, 95.0, 116.0, 93.0, 63.0, 55.0, 48.0, 25.0, 30.0, 21.0, 19.0, 17.0, 10.0, 9.0, 9.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000732421875, -0.0007079392671585083, -0.0006834566593170166, -0.0006589740514755249, -0.0006344914436340332, -0.0006100088357925415, -0.0005855262279510498, -0.0005610436201095581, -0.0005365610122680664, -0.0005120784044265747, -0.000487595796585083, -0.0004631131887435913, -0.0004386305809020996, -0.0004141479730606079, -0.0003896653652191162, -0.0003651827573776245, -0.0003407001495361328, -0.0003162175416946411, -0.0002917349338531494, -0.0002672523260116577, -0.00024276971817016602, -0.00021828711032867432, -0.00019380450248718262, -0.00016932189464569092, -0.00014483928680419922, -0.00012035667896270752, -9.587407112121582e-05, -7.139146327972412e-05, -4.690885543823242e-05, -2.2426247596740723e-05, 2.0563602447509766e-06, 2.6538968086242676e-05, 5.1021575927734375e-05, 7.550418376922607e-05, 9.998679161071777e-05, 0.00012446939945220947, 0.00014895200729370117, 0.00017343461513519287, 0.00019791722297668457, 0.00022239983081817627, 0.00024688243865966797, 0.00027136504650115967, 0.00029584765434265137, 0.00032033026218414307, 0.00034481287002563477, 0.00036929547786712646, 0.00039377808570861816, 0.00041826069355010986, 0.00044274330139160156, 0.00046722590923309326, 0.000491708517074585, 0.0005161911249160767, 0.0005406737327575684, 0.0005651563405990601, 0.0005896389484405518, 0.0006141215562820435, 0.0006386041641235352, 0.0006630867719650269, 0.0006875693798065186, 0.0007120519876480103, 0.000736534595489502, 0.0007610172033309937, 0.0007854998111724854, 0.000809982419013977, 0.0008344650268554688]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 9.0, 10.0, 12.0, 21.0, 16.0, 32.0, 54.0, 81.0, 135.0, 213.0, 392.0, 640.0, 1229.0, 2580.0, 5583.0, 14237.0, 42067.0, 148273.0, 408255.0, 295250.0, 85815.0, 25888.0, 9439.0, 4084.0, 1860.0, 1035.0, 525.0, 304.0, 176.0, 112.0, 63.0, 48.0, 33.0, 21.0, 19.0, 10.0, 6.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5859375, -6.38507080078125, -6.1842041015625, -5.98333740234375, -5.782470703125, -5.58160400390625, -5.3807373046875, -5.17987060546875, -4.97900390625, -4.77813720703125, -4.5772705078125, -4.37640380859375, -4.175537109375, -3.97467041015625, -3.7738037109375, -3.57293701171875, -3.3720703125, -3.17120361328125, -2.9703369140625, -2.76947021484375, -2.568603515625, -2.36773681640625, -2.1668701171875, -1.96600341796875, -1.76513671875, -1.56427001953125, -1.3634033203125, -1.16253662109375, -0.961669921875, -0.76080322265625, -0.5599365234375, -0.35906982421875, -0.158203125, 0.04266357421875, 0.2435302734375, 0.44439697265625, 0.645263671875, 0.84613037109375, 1.0469970703125, 1.24786376953125, 1.44873046875, 1.64959716796875, 1.8504638671875, 2.05133056640625, 2.252197265625, 2.45306396484375, 2.6539306640625, 2.85479736328125, 3.0556640625, 3.25653076171875, 3.4573974609375, 3.65826416015625, 3.859130859375, 4.05999755859375, 4.2608642578125, 4.46173095703125, 4.66259765625, 4.86346435546875, 5.0643310546875, 5.26519775390625, 5.466064453125, 5.66693115234375, 5.8677978515625, 6.06866455078125, 6.26953125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 13.0, 5.0, 19.0, 17.0, 19.0, 21.0, 35.0, 45.0, 35.0, 55.0, 71.0, 63.0, 65.0, 75.0, 80.0, 64.0, 67.0, 52.0, 37.0, 46.0, 28.0, 19.0, 21.0, 15.0, 7.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.837890625, -2.73736572265625, -2.6368408203125, -2.53631591796875, -2.435791015625, -2.33526611328125, -2.2347412109375, -2.13421630859375, -2.03369140625, -1.93316650390625, -1.8326416015625, -1.73211669921875, -1.631591796875, -1.53106689453125, -1.4305419921875, -1.33001708984375, -1.2294921875, -1.12896728515625, -1.0284423828125, -0.92791748046875, -0.827392578125, -0.72686767578125, -0.6263427734375, -0.52581787109375, -0.42529296875, -0.32476806640625, -0.2242431640625, -0.12371826171875, -0.023193359375, 0.07733154296875, 0.1778564453125, 0.27838134765625, 0.37890625, 0.47943115234375, 0.5799560546875, 0.68048095703125, 0.781005859375, 0.88153076171875, 0.9820556640625, 1.08258056640625, 1.18310546875, 1.28363037109375, 1.3841552734375, 1.48468017578125, 1.585205078125, 1.68572998046875, 1.7862548828125, 1.88677978515625, 1.9873046875, 2.08782958984375, 2.1883544921875, 2.28887939453125, 2.389404296875, 2.48992919921875, 2.5904541015625, 2.69097900390625, 2.79150390625, 2.89202880859375, 2.9925537109375, 3.09307861328125, 3.193603515625, 3.29412841796875, 3.3946533203125, 3.49517822265625, 3.595703125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 7.0, 29.0, 107.0, 242.0, 320.0, 188.0, 61.0, 22.0, 4.0, 9.0, 5.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.324310302734375, -51.54138946533203, -48.75846862792969, -45.975547790527344, -43.192630767822266, -40.40970993041992, -37.62678909301758, -34.8438720703125, -32.060951232910156, -29.278030395507812, -26.4951114654541, -23.712190628051758, -20.929271697998047, -18.146350860595703, -15.36343002319336, -12.580511093139648, -9.797588348388672, -7.0146684646606445, -4.231748104095459, -1.4488277435302734, 1.334092140197754, 4.117012023925781, 6.899932861328125, 9.682851791381836, 12.46577262878418, 15.248692512512207, 18.031612396240234, 20.814533233642578, 23.597454071044922, 26.380373001098633, 29.163293838500977, 31.946212768554688, 34.72913360595703, 37.512054443359375, 40.29497528076172, 43.07789611816406, 45.86081314086914, 48.643733978271484, 51.42665481567383, 54.209571838378906, 56.99249267578125, 59.775413513183594, 62.55833435058594, 65.34125518798828, 68.12417602539062, 70.90708923339844, 73.69001770019531, 76.47293090820312, 79.255859375, 82.03878021240234, 84.82170104980469, 87.60462188720703, 90.38754272460938, 93.17045593261719, 95.95338439941406, 98.73629760742188, 101.51921844482422, 104.30213928222656, 107.0850601196289, 109.86798095703125, 112.6509017944336, 115.43382263183594, 118.21673583984375, 120.9996566772461, 123.78257751464844]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 8.0, 11.0, 12.0, 21.0, 32.0, 35.0, 58.0, 66.0, 72.0, 99.0, 100.0, 98.0, 91.0, 76.0, 65.0, 38.0, 27.0, 24.0, 19.0, 14.0, 7.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.320899963378906, -31.104799270629883, -29.888696670532227, -28.672595977783203, -27.45649528503418, -26.240394592285156, -25.0242919921875, -23.808191299438477, -22.592090606689453, -21.37598991394043, -20.159887313842773, -18.94378662109375, -17.727685928344727, -16.511585235595703, -15.295482635498047, -14.079381942749023, -12.863279342651367, -11.647177696228027, -10.431077003479004, -9.214975357055664, -7.998874187469482, -6.782773017883301, -5.566671371459961, -4.3505706787109375, -3.1344690322875977, -1.9183677434921265, -0.7022664546966553, 0.5138349533081055, 1.729936122894287, 2.9460372924804688, 4.162138938903809, 5.378239631652832, 6.594341278076172, 7.8104424476623535, 9.026543617248535, 10.242645263671875, 11.458745956420898, 12.674847602844238, 13.890949249267578, 15.107049942016602, 16.323150634765625, 17.53925132751465, 18.755353927612305, 19.971454620361328, 21.18755531311035, 22.403656005859375, 23.61975860595703, 24.835859298706055, 26.05196189880371, 27.268062591552734, 28.48416519165039, 29.700265884399414, 30.916366577148438, 32.132469177246094, 33.34857177734375, 34.56467056274414, 35.7807731628418, 36.99687576293945, 38.212974548339844, 39.4290771484375, 40.645179748535156, 41.86127853393555, 43.0773811340332, 44.293479919433594, 45.50958251953125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 10.0, 6.0, 12.0, 14.0, 20.0, 41.0, 40.0, 49.0, 73.0, 140.0, 170.0, 318.0, 482.0, 904.0, 1680.0, 3628.0, 9180.0, 29101.0, 143850.0, 3469167.0, 454213.0, 55592.0, 14966.0, 5435.0, 2400.0, 1185.0, 625.0, 349.0, 200.0, 135.0, 99.0, 55.0, 45.0, 27.0, 25.0, 13.0, 9.0, 7.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.578125, -11.2447509765625, -10.911376953125, -10.5780029296875, -10.24462890625, -9.9112548828125, -9.577880859375, -9.2445068359375, -8.9111328125, -8.5777587890625, -8.244384765625, -7.9110107421875, -7.57763671875, -7.2442626953125, -6.910888671875, -6.5775146484375, -6.244140625, -5.9107666015625, -5.577392578125, -5.2440185546875, -4.91064453125, -4.5772705078125, -4.243896484375, -3.9105224609375, -3.5771484375, -3.2437744140625, -2.910400390625, -2.5770263671875, -2.24365234375, -1.9102783203125, -1.576904296875, -1.2435302734375, -0.91015625, -0.5767822265625, -0.243408203125, 0.0899658203125, 0.42333984375, 0.7567138671875, 1.090087890625, 1.4234619140625, 1.7568359375, 2.0902099609375, 2.423583984375, 2.7569580078125, 3.09033203125, 3.4237060546875, 3.757080078125, 4.0904541015625, 4.423828125, 4.7572021484375, 5.090576171875, 5.4239501953125, 5.75732421875, 6.0906982421875, 6.424072265625, 6.7574462890625, 7.0908203125, 7.4241943359375, 7.757568359375, 8.0909423828125, 8.42431640625, 8.7576904296875, 9.091064453125, 9.4244384765625, 9.7578125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 3.0, 10.0, 9.0, 25.0, 40.0, 84.0, 116.0, 146.0, 136.0, 145.0, 103.0, 77.0, 43.0, 25.0, 10.0, 10.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.478515625, -1.4389495849609375, -1.399383544921875, -1.3598175048828125, -1.32025146484375, -1.2806854248046875, -1.241119384765625, -1.2015533447265625, -1.1619873046875, -1.1224212646484375, -1.082855224609375, -1.0432891845703125, -1.00372314453125, -0.9641571044921875, -0.924591064453125, -0.8850250244140625, -0.845458984375, -0.8058929443359375, -0.766326904296875, -0.7267608642578125, -0.68719482421875, -0.6476287841796875, -0.608062744140625, -0.5684967041015625, -0.5289306640625, -0.4893646240234375, -0.449798583984375, -0.4102325439453125, -0.37066650390625, -0.3311004638671875, -0.291534423828125, -0.2519683837890625, -0.21240234375, -0.1728363037109375, -0.133270263671875, -0.0937042236328125, -0.05413818359375, -0.0145721435546875, 0.024993896484375, 0.0645599365234375, 0.1041259765625, 0.1436920166015625, 0.183258056640625, 0.2228240966796875, 0.26239013671875, 0.3019561767578125, 0.341522216796875, 0.3810882568359375, 0.420654296875, 0.4602203369140625, 0.499786376953125, 0.5393524169921875, 0.57891845703125, 0.6184844970703125, 0.658050537109375, 0.6976165771484375, 0.7371826171875, 0.7767486572265625, 0.816314697265625, 0.8558807373046875, 0.89544677734375, 0.9350128173828125, 0.974578857421875, 1.0141448974609375, 1.0537109375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 6.0, 6.0, 9.0, 22.0, 36.0, 40.0, 81.0, 161.0, 353.0, 790.0, 2141.0, 6351.0, 23811.0, 143330.0, 3106437.0, 819496.0, 69742.0, 14539.0, 4288.0, 1486.0, 633.0, 256.0, 127.0, 64.0, 28.0, 17.0, 15.0, 9.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.78125, -15.374755859375, -14.96826171875, -14.561767578125, -14.1552734375, -13.748779296875, -13.34228515625, -12.935791015625, -12.529296875, -12.122802734375, -11.71630859375, -11.309814453125, -10.9033203125, -10.496826171875, -10.09033203125, -9.683837890625, -9.27734375, -8.870849609375, -8.46435546875, -8.057861328125, -7.6513671875, -7.244873046875, -6.83837890625, -6.431884765625, -6.025390625, -5.618896484375, -5.21240234375, -4.805908203125, -4.3994140625, -3.992919921875, -3.58642578125, -3.179931640625, -2.7734375, -2.366943359375, -1.96044921875, -1.553955078125, -1.1474609375, -0.740966796875, -0.33447265625, 0.072021484375, 0.478515625, 0.885009765625, 1.29150390625, 1.697998046875, 2.1044921875, 2.510986328125, 2.91748046875, 3.323974609375, 3.73046875, 4.136962890625, 4.54345703125, 4.949951171875, 5.3564453125, 5.762939453125, 6.16943359375, 6.575927734375, 6.982421875, 7.388916015625, 7.79541015625, 8.201904296875, 8.6083984375, 9.014892578125, 9.42138671875, 9.827880859375, 10.234375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 6.0, 10.0, 8.0, 11.0, 15.0, 20.0, 31.0, 59.0, 71.0, 118.0, 179.0, 273.0, 476.0, 1270.0, 649.0, 345.0, 168.0, 112.0, 69.0, 55.0, 40.0, 16.0, 17.0, 20.0, 6.0, 5.0, 6.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.541015625, -1.4952545166015625, -1.449493408203125, -1.4037322998046875, -1.35797119140625, -1.3122100830078125, -1.266448974609375, -1.2206878662109375, -1.1749267578125, -1.1291656494140625, -1.083404541015625, -1.0376434326171875, -0.99188232421875, -0.9461212158203125, -0.900360107421875, -0.8545989990234375, -0.808837890625, -0.7630767822265625, -0.717315673828125, -0.6715545654296875, -0.62579345703125, -0.5800323486328125, -0.534271240234375, -0.4885101318359375, -0.4427490234375, -0.3969879150390625, -0.351226806640625, -0.3054656982421875, -0.25970458984375, -0.2139434814453125, -0.168182373046875, -0.1224212646484375, -0.07666015625, -0.0308990478515625, 0.014862060546875, 0.0606231689453125, 0.10638427734375, 0.1521453857421875, 0.197906494140625, 0.2436676025390625, 0.2894287109375, 0.3351898193359375, 0.380950927734375, 0.4267120361328125, 0.47247314453125, 0.5182342529296875, 0.563995361328125, 0.6097564697265625, 0.655517578125, 0.7012786865234375, 0.747039794921875, 0.7928009033203125, 0.83856201171875, 0.8843231201171875, 0.930084228515625, 0.9758453369140625, 1.0216064453125, 1.0673675537109375, 1.113128662109375, 1.1588897705078125, 1.20465087890625, 1.2504119873046875, 1.296173095703125, 1.3419342041015625, 1.3876953125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 2.0, 8.0, 7.0, 7.0, 17.0, 26.0, 30.0, 37.0, 61.0, 75.0, 88.0, 97.0, 118.0, 96.0, 76.0, 64.0, 50.0, 41.0, 30.0, 15.0, 13.0, 8.0, 9.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.100502014160156, -9.841887474060059, -9.583273887634277, -9.32465934753418, -9.066045761108398, -8.8074312210083, -8.54881763458252, -8.290203094482422, -8.03158950805664, -7.772975444793701, -7.514361381530762, -7.255747318267822, -6.997133255004883, -6.738518714904785, -6.479904651641846, -6.221290588378906, -5.962676048278809, -5.704061985015869, -5.44544792175293, -5.18683385848999, -4.928219795227051, -4.669605255126953, -4.410991191864014, -4.152377128601074, -3.8937630653381348, -3.6351490020751953, -3.376534938812256, -3.1179206371307373, -2.859306573867798, -2.6006925106048584, -2.34207820892334, -2.0834641456604004, -1.824850082397461, -1.5662360191345215, -1.3076218366622925, -1.0490076541900635, -0.790393590927124, -0.5317795276641846, -0.27316534519195557, -0.014551162719726562, 0.2440629005432129, 0.5026770234107971, 0.7612911462783813, 1.0199053287506104, 1.2785193920135498, 1.5371334552764893, 1.7957476377487183, 2.0543618202209473, 2.3129758834838867, 2.571589946746826, 2.8302040100097656, 3.088818311691284, 3.3474323749542236, 3.606046438217163, 3.8646607398986816, 4.123274803161621, 4.3818888664245605, 4.6405029296875, 4.8991169929504395, 5.157731056213379, 5.416345596313477, 5.674959182739258, 5.9335737228393555, 6.192187786102295, 6.450801849365234]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 11.0, 17.0, 13.0, 22.0, 18.0, 32.0, 21.0, 33.0, 36.0, 44.0, 50.0, 59.0, 50.0, 47.0, 42.0, 49.0, 42.0, 47.0, 43.0, 41.0, 41.0, 29.0, 36.0, 32.0, 25.0, 11.0, 20.0, 14.0, 13.0, 9.0, 9.0, 8.0, 8.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4482879638671875, -5.276656627655029, -5.105024814605713, -4.933393478393555, -4.761761665344238, -4.59013032913208, -4.418498992919922, -4.2468671798706055, -4.075235843658447, -3.90360426902771, -3.7319726943969727, -3.5603413581848145, -3.388709783554077, -3.21707820892334, -3.0454466342926025, -2.8738150596618652, -2.702183485031128, -2.5305519104003906, -2.3589203357696533, -2.187288761138916, -2.015657424926758, -1.8440258502960205, -1.6723942756652832, -1.5007628202438354, -1.3291312456130981, -1.1574996709823608, -0.9858682155609131, -0.8142366409301758, -0.6426051259040833, -0.4709736108779907, -0.2993420362472534, -0.12771058082580566, 0.04392099380493164, 0.21555252373218536, 0.3871840536594391, 0.558815598487854, 0.7304471135139465, 0.9020786285400391, 1.0737102031707764, 1.2453416585922241, 1.4169732332229614, 1.5886048078536987, 1.7602362632751465, 1.9318678379058838, 2.103499412536621, 2.2751307487487793, 2.4467625617980957, 2.618393898010254, 2.790025472640991, 2.9616570472717285, 3.133288621902466, 3.304920196533203, 3.4765515327453613, 3.6481831073760986, 3.819814682006836, 3.991446018218994, 4.1630778312683105, 4.334709167480469, 4.506340980529785, 4.677972316741943, 4.84960412979126, 5.021235466003418, 5.192867279052734, 5.364498615264893, 5.536129951477051]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 6.0, 8.0, 18.0, 28.0, 45.0, 85.0, 132.0, 254.0, 474.0, 886.0, 2334.0, 6849.0, 24144.0, 108753.0, 418421.0, 368351.0, 87631.0, 20349.0, 5834.0, 2157.0, 856.0, 404.0, 204.0, 131.0, 76.0, 44.0, 22.0, 21.0, 9.0, 9.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.55279541015625, -8.2930908203125, -8.03338623046875, -7.773681640625, -7.51397705078125, -7.2542724609375, -6.99456787109375, -6.73486328125, -6.47515869140625, -6.2154541015625, -5.95574951171875, -5.696044921875, -5.43634033203125, -5.1766357421875, -4.91693115234375, -4.6572265625, -4.39752197265625, -4.1378173828125, -3.87811279296875, -3.618408203125, -3.35870361328125, -3.0989990234375, -2.83929443359375, -2.57958984375, -2.31988525390625, -2.0601806640625, -1.80047607421875, -1.540771484375, -1.28106689453125, -1.0213623046875, -0.76165771484375, -0.501953125, -0.24224853515625, 0.0174560546875, 0.27716064453125, 0.536865234375, 0.79656982421875, 1.0562744140625, 1.31597900390625, 1.57568359375, 1.83538818359375, 2.0950927734375, 2.35479736328125, 2.614501953125, 2.87420654296875, 3.1339111328125, 3.39361572265625, 3.6533203125, 3.91302490234375, 4.1727294921875, 4.43243408203125, 4.692138671875, 4.95184326171875, 5.2115478515625, 5.47125244140625, 5.73095703125, 5.99066162109375, 6.2503662109375, 6.51007080078125, 6.769775390625, 7.02947998046875, 7.2891845703125, 7.54888916015625, 7.80859375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 5.0, 18.0, 24.0, 39.0, 59.0, 109.0, 138.0, 130.0, 127.0, 110.0, 84.0, 67.0, 41.0, 17.0, 6.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.40234375, -1.3630828857421875, -1.323822021484375, -1.2845611572265625, -1.24530029296875, -1.2060394287109375, -1.166778564453125, -1.1275177001953125, -1.0882568359375, -1.0489959716796875, -1.009735107421875, -0.9704742431640625, -0.93121337890625, -0.8919525146484375, -0.852691650390625, -0.8134307861328125, -0.774169921875, -0.7349090576171875, -0.695648193359375, -0.6563873291015625, -0.61712646484375, -0.5778656005859375, -0.538604736328125, -0.4993438720703125, -0.4600830078125, -0.4208221435546875, -0.381561279296875, -0.3423004150390625, -0.30303955078125, -0.2637786865234375, -0.224517822265625, -0.1852569580078125, -0.14599609375, -0.1067352294921875, -0.067474365234375, -0.0282135009765625, 0.01104736328125, 0.0503082275390625, 0.089569091796875, 0.1288299560546875, 0.1680908203125, 0.2073516845703125, 0.246612548828125, 0.2858734130859375, 0.32513427734375, 0.3643951416015625, 0.403656005859375, 0.4429168701171875, 0.482177734375, 0.5214385986328125, 0.560699462890625, 0.5999603271484375, 0.63922119140625, 0.6784820556640625, 0.717742919921875, 0.7570037841796875, 0.7962646484375, 0.8355255126953125, 0.874786376953125, 0.9140472412109375, 0.95330810546875, 0.9925689697265625, 1.031829833984375, 1.0710906982421875, 1.1103515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 9.0, 7.0, 22.0, 37.0, 42.0, 55.0, 85.0, 109.0, 202.0, 292.0, 462.0, 779.0, 1214.0, 2489.0, 6067.0, 16981.0, 53954.0, 170948.0, 368392.0, 278883.0, 98972.0, 30227.0, 9926.0, 4003.0, 1772.0, 950.0, 538.0, 359.0, 258.0, 164.0, 99.0, 80.0, 52.0, 40.0, 22.0, 16.0, 13.0, 9.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.7578125, -6.551513671875, -6.34521484375, -6.138916015625, -5.9326171875, -5.726318359375, -5.52001953125, -5.313720703125, -5.107421875, -4.901123046875, -4.69482421875, -4.488525390625, -4.2822265625, -4.075927734375, -3.86962890625, -3.663330078125, -3.45703125, -3.250732421875, -3.04443359375, -2.838134765625, -2.6318359375, -2.425537109375, -2.21923828125, -2.012939453125, -1.806640625, -1.600341796875, -1.39404296875, -1.187744140625, -0.9814453125, -0.775146484375, -0.56884765625, -0.362548828125, -0.15625, 0.050048828125, 0.25634765625, 0.462646484375, 0.6689453125, 0.875244140625, 1.08154296875, 1.287841796875, 1.494140625, 1.700439453125, 1.90673828125, 2.113037109375, 2.3193359375, 2.525634765625, 2.73193359375, 2.938232421875, 3.14453125, 3.350830078125, 3.55712890625, 3.763427734375, 3.9697265625, 4.176025390625, 4.38232421875, 4.588623046875, 4.794921875, 5.001220703125, 5.20751953125, 5.413818359375, 5.6201171875, 5.826416015625, 6.03271484375, 6.239013671875, 6.4453125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 4.0, 5.0, 9.0, 10.0, 11.0, 19.0, 15.0, 24.0, 23.0, 21.0, 30.0, 31.0, 28.0, 33.0, 39.0, 48.0, 53.0, 49.0, 54.0, 51.0, 41.0, 40.0, 43.0, 38.0, 41.0, 21.0, 28.0, 34.0, 18.0, 23.0, 24.0, 16.0, 15.0, 12.0, 7.0, 9.0, 4.0, 2.0, 7.0, 7.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.68359375, -3.564361572265625, -3.44512939453125, -3.325897216796875, -3.2066650390625, -3.087432861328125, -2.96820068359375, -2.848968505859375, -2.729736328125, -2.610504150390625, -2.49127197265625, -2.372039794921875, -2.2528076171875, -2.133575439453125, -2.01434326171875, -1.895111083984375, -1.77587890625, -1.656646728515625, -1.53741455078125, -1.418182373046875, -1.2989501953125, -1.179718017578125, -1.06048583984375, -0.941253662109375, -0.822021484375, -0.702789306640625, -0.58355712890625, -0.464324951171875, -0.3450927734375, -0.225860595703125, -0.10662841796875, 0.012603759765625, 0.1318359375, 0.251068115234375, 0.37030029296875, 0.489532470703125, 0.6087646484375, 0.727996826171875, 0.84722900390625, 0.966461181640625, 1.085693359375, 1.204925537109375, 1.32415771484375, 1.443389892578125, 1.5626220703125, 1.681854248046875, 1.80108642578125, 1.920318603515625, 2.03955078125, 2.158782958984375, 2.27801513671875, 2.397247314453125, 2.5164794921875, 2.635711669921875, 2.75494384765625, 2.874176025390625, 2.993408203125, 3.112640380859375, 3.23187255859375, 3.351104736328125, 3.4703369140625, 3.589569091796875, 3.70880126953125, 3.828033447265625, 3.947265625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 3.0, 4.0, 9.0, 11.0, 23.0, 20.0, 33.0, 58.0, 74.0, 118.0, 177.0, 299.0, 571.0, 1076.0, 2255.0, 5103.0, 12366.0, 35080.0, 109650.0, 297068.0, 351405.0, 154474.0, 49332.0, 16894.0, 6539.0, 2803.0, 1374.0, 684.0, 386.0, 241.0, 152.0, 92.0, 45.0, 40.0, 21.0, 15.0, 14.0, 5.0, 7.0, 9.0, 6.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.94140625, -4.7923583984375, -4.643310546875, -4.4942626953125, -4.34521484375, -4.1961669921875, -4.047119140625, -3.8980712890625, -3.7490234375, -3.5999755859375, -3.450927734375, -3.3018798828125, -3.15283203125, -3.0037841796875, -2.854736328125, -2.7056884765625, -2.556640625, -2.4075927734375, -2.258544921875, -2.1094970703125, -1.96044921875, -1.8114013671875, -1.662353515625, -1.5133056640625, -1.3642578125, -1.2152099609375, -1.066162109375, -0.9171142578125, -0.76806640625, -0.6190185546875, -0.469970703125, -0.3209228515625, -0.171875, -0.0228271484375, 0.126220703125, 0.2752685546875, 0.42431640625, 0.5733642578125, 0.722412109375, 0.8714599609375, 1.0205078125, 1.1695556640625, 1.318603515625, 1.4676513671875, 1.61669921875, 1.7657470703125, 1.914794921875, 2.0638427734375, 2.212890625, 2.3619384765625, 2.510986328125, 2.6600341796875, 2.80908203125, 2.9581298828125, 3.107177734375, 3.2562255859375, 3.4052734375, 3.5543212890625, 3.703369140625, 3.8524169921875, 4.00146484375, 4.1505126953125, 4.299560546875, 4.4486083984375, 4.59765625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 0.0, 3.0, 2.0, 3.0, 3.0, 9.0, 6.0, 12.0, 15.0, 10.0, 20.0, 17.0, 27.0, 26.0, 36.0, 35.0, 42.0, 34.0, 62.0, 44.0, 50.0, 57.0, 55.0, 50.0, 53.0, 47.0, 46.0, 42.0, 21.0, 24.0, 32.0, 20.0, 13.0, 21.0, 16.0, 14.0, 7.0, 6.0, 5.0, 9.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0005354881286621094, -0.0005205534398555756, -0.0005056187510490417, -0.0004906840622425079, -0.0004757493734359741, -0.0004608146846294403, -0.0004458799958229065, -0.0004309453070163727, -0.00041601061820983887, -0.00040107592940330505, -0.00038614124059677124, -0.0003712065517902374, -0.0003562718629837036, -0.0003413371741771698, -0.000326402485370636, -0.00031146779656410217, -0.00029653310775756836, -0.00028159841895103455, -0.00026666373014450073, -0.0002517290413379669, -0.0002367943525314331, -0.0002218596637248993, -0.00020692497491836548, -0.00019199028611183167, -0.00017705559730529785, -0.00016212090849876404, -0.00014718621969223022, -0.0001322515308856964, -0.0001173168420791626, -0.00010238215327262878, -8.744746446609497e-05, -7.251277565956116e-05, -5.7578086853027344e-05, -4.264339804649353e-05, -2.7708709239959717e-05, -1.2774020433425903e-05, 2.16066837310791e-06, 1.7095357179641724e-05, 3.203004598617554e-05, 4.696473479270935e-05, 6.189942359924316e-05, 7.683411240577698e-05, 9.176880121231079e-05, 0.0001067034900188446, 0.00012163817882537842, 0.00013657286763191223, 0.00015150755643844604, 0.00016644224524497986, 0.00018137693405151367, 0.00019631162285804749, 0.0002112463116645813, 0.0002261810004711151, 0.00024111568927764893, 0.00025605037808418274, 0.00027098506689071655, 0.00028591975569725037, 0.0003008544445037842, 0.000315789133310318, 0.0003307238221168518, 0.0003456585109233856, 0.00036059319972991943, 0.00037552788853645325, 0.00039046257734298706, 0.0004053972661495209, 0.0004203319549560547]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 7.0, 14.0, 23.0, 31.0, 49.0, 70.0, 117.0, 203.0, 348.0, 648.0, 1301.0, 2836.0, 7641.0, 26269.0, 124825.0, 536696.0, 275997.0, 50166.0, 12976.0, 4352.0, 1884.0, 894.0, 490.0, 262.0, 153.0, 99.0, 63.0, 35.0, 23.0, 22.0, 12.0, 10.0, 4.0, 7.0, 5.0, 7.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4765625, -8.217529296875, -7.95849609375, -7.699462890625, -7.4404296875, -7.181396484375, -6.92236328125, -6.663330078125, -6.404296875, -6.145263671875, -5.88623046875, -5.627197265625, -5.3681640625, -5.109130859375, -4.85009765625, -4.591064453125, -4.33203125, -4.072998046875, -3.81396484375, -3.554931640625, -3.2958984375, -3.036865234375, -2.77783203125, -2.518798828125, -2.259765625, -2.000732421875, -1.74169921875, -1.482666015625, -1.2236328125, -0.964599609375, -0.70556640625, -0.446533203125, -0.1875, 0.071533203125, 0.33056640625, 0.589599609375, 0.8486328125, 1.107666015625, 1.36669921875, 1.625732421875, 1.884765625, 2.143798828125, 2.40283203125, 2.661865234375, 2.9208984375, 3.179931640625, 3.43896484375, 3.697998046875, 3.95703125, 4.216064453125, 4.47509765625, 4.734130859375, 4.9931640625, 5.252197265625, 5.51123046875, 5.770263671875, 6.029296875, 6.288330078125, 6.54736328125, 6.806396484375, 7.0654296875, 7.324462890625, 7.58349609375, 7.842529296875, 8.1015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 7.0, 6.0, 15.0, 19.0, 27.0, 29.0, 29.0, 55.0, 64.0, 76.0, 75.0, 71.0, 75.0, 83.0, 65.0, 64.0, 52.0, 44.0, 24.0, 25.0, 18.0, 22.0, 10.0, 7.0, 4.0, 6.0, 8.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.212890625, -3.10235595703125, -2.9918212890625, -2.88128662109375, -2.770751953125, -2.66021728515625, -2.5496826171875, -2.43914794921875, -2.32861328125, -2.21807861328125, -2.1075439453125, -1.99700927734375, -1.886474609375, -1.77593994140625, -1.6654052734375, -1.55487060546875, -1.4443359375, -1.33380126953125, -1.2232666015625, -1.11273193359375, -1.002197265625, -0.89166259765625, -0.7811279296875, -0.67059326171875, -0.56005859375, -0.44952392578125, -0.3389892578125, -0.22845458984375, -0.117919921875, -0.00738525390625, 0.1031494140625, 0.21368408203125, 0.32421875, 0.43475341796875, 0.5452880859375, 0.65582275390625, 0.766357421875, 0.87689208984375, 0.9874267578125, 1.09796142578125, 1.20849609375, 1.31903076171875, 1.4295654296875, 1.54010009765625, 1.650634765625, 1.76116943359375, 1.8717041015625, 1.98223876953125, 2.0927734375, 2.20330810546875, 2.3138427734375, 2.42437744140625, 2.534912109375, 2.64544677734375, 2.7559814453125, 2.86651611328125, 2.97705078125, 3.08758544921875, 3.1981201171875, 3.30865478515625, 3.419189453125, 3.52972412109375, 3.6402587890625, 3.75079345703125, 3.861328125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 29.0, 116.0, 441.0, 338.0, 64.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.31819152832031, -95.00203704833984, -89.68588256835938, -84.36973571777344, -79.05358123779297, -73.7374267578125, -68.42127990722656, -63.105125427246094, -57.788970947265625, -52.472816467285156, -47.15666580200195, -41.84051513671875, -36.52436065673828, -31.208208084106445, -25.89205551147461, -20.575904846191406, -15.259750366210938, -9.943597793579102, -4.627445220947266, 0.6887073516845703, 6.004859924316406, 11.321012496948242, 16.637165069580078, 21.95331573486328, 27.26947021484375, 32.58562469482422, 37.90177536010742, 43.217926025390625, 48.534080505371094, 53.85023498535156, 59.166385650634766, 64.48253631591797, 69.7987060546875, 75.11486053466797, 80.43101501464844, 85.74716186523438, 91.06331634521484, 96.37947082519531, 101.69561767578125, 107.01177215576172, 112.32792663574219, 117.64408111572266, 122.96023559570312, 128.27638244628906, 133.592529296875, 138.90869140625, 144.22483825683594, 149.54098510742188, 154.85714721679688, 160.1732940673828, 165.4894561767578, 170.80560302734375, 176.12176513671875, 181.4379119873047, 186.75405883789062, 192.07022094726562, 197.38636779785156, 202.7025146484375, 208.0186767578125, 213.33482360839844, 218.65097045898438, 223.96713256835938, 229.2832794189453, 234.59942626953125, 239.91558837890625]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 3.0, 9.0, 10.0, 15.0, 15.0, 27.0, 37.0, 50.0, 46.0, 62.0, 74.0, 83.0, 97.0, 67.0, 68.0, 68.0, 63.0, 43.0, 30.0, 40.0, 19.0, 17.0, 18.0, 14.0, 4.0, 3.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.222166061401367, -29.89703369140625, -28.571903228759766, -27.24677276611328, -25.921640396118164, -24.596508026123047, -23.271377563476562, -21.946247100830078, -20.62111473083496, -19.295982360839844, -17.97085189819336, -16.645721435546875, -15.320589065551758, -13.995457649230957, -12.670326232910156, -11.345194816589355, -10.020063400268555, -8.694931983947754, -7.369800567626953, -6.044669151306152, -4.719537734985352, -3.394406318664551, -2.06927490234375, -0.7441434860229492, 0.5809879302978516, 1.9061193466186523, 3.231250762939453, 4.556382179260254, 5.881513595581055, 7.2066450119018555, 8.531776428222656, 9.856907844543457, 11.182037353515625, 12.507168769836426, 13.832300186157227, 15.157431602478027, 16.482563018798828, 17.807693481445312, 19.13282585144043, 20.457958221435547, 21.78308868408203, 23.108219146728516, 24.433351516723633, 25.75848388671875, 27.083614349365234, 28.40874481201172, 29.733877182006836, 31.059009552001953, 32.38414001464844, 33.70927047729492, 35.034400939941406, 36.359535217285156, 37.68466567993164, 39.009796142578125, 40.334930419921875, 41.66006088256836, 42.985191345214844, 44.31032180786133, 45.63545227050781, 46.96058654785156, 48.28571701049805, 49.61084747314453, 50.93598175048828, 52.261112213134766, 53.58624267578125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 10.0, 5.0, 7.0, 18.0, 24.0, 52.0, 90.0, 178.0, 374.0, 1107.0, 6165.0, 161941.0, 3995346.0, 25752.0, 2344.0, 503.0, 191.0, 80.0, 41.0, 18.0, 10.0, 11.0, 10.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.59375, -25.83984375, -25.0859375, -24.33203125, -23.578125, -22.82421875, -22.0703125, -21.31640625, -20.5625, -19.80859375, -19.0546875, -18.30078125, -17.546875, -16.79296875, -16.0390625, -15.28515625, -14.53125, -13.77734375, -13.0234375, -12.26953125, -11.515625, -10.76171875, -10.0078125, -9.25390625, -8.5, -7.74609375, -6.9921875, -6.23828125, -5.484375, -4.73046875, -3.9765625, -3.22265625, -2.46875, -1.71484375, -0.9609375, -0.20703125, 0.546875, 1.30078125, 2.0546875, 2.80859375, 3.5625, 4.31640625, 5.0703125, 5.82421875, 6.578125, 7.33203125, 8.0859375, 8.83984375, 9.59375, 10.34765625, 11.1015625, 11.85546875, 12.609375, 13.36328125, 14.1171875, 14.87109375, 15.625, 16.37890625, 17.1328125, 17.88671875, 18.640625, 19.39453125, 20.1484375, 20.90234375, 21.65625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 8.0, 17.0, 27.0, 26.0, 54.0, 110.0, 108.0, 133.0, 141.0, 129.0, 104.0, 49.0, 42.0, 22.0, 10.0, 7.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.775390625, -1.7244415283203125, -1.673492431640625, -1.6225433349609375, -1.57159423828125, -1.5206451416015625, -1.469696044921875, -1.4187469482421875, -1.3677978515625, -1.3168487548828125, -1.265899658203125, -1.2149505615234375, -1.16400146484375, -1.1130523681640625, -1.062103271484375, -1.0111541748046875, -0.960205078125, -0.9092559814453125, -0.858306884765625, -0.8073577880859375, -0.75640869140625, -0.7054595947265625, -0.654510498046875, -0.6035614013671875, -0.5526123046875, -0.5016632080078125, -0.450714111328125, -0.3997650146484375, -0.34881591796875, -0.2978668212890625, -0.246917724609375, -0.1959686279296875, -0.14501953125, -0.0940704345703125, -0.043121337890625, 0.0078277587890625, 0.05877685546875, 0.1097259521484375, 0.160675048828125, 0.2116241455078125, 0.2625732421875, 0.3135223388671875, 0.364471435546875, 0.4154205322265625, 0.46636962890625, 0.5173187255859375, 0.568267822265625, 0.6192169189453125, 0.670166015625, 0.7211151123046875, 0.772064208984375, 0.8230133056640625, 0.87396240234375, 0.9249114990234375, 0.975860595703125, 1.0268096923828125, 1.0777587890625, 1.1287078857421875, 1.179656982421875, 1.2306060791015625, 1.28155517578125, 1.3325042724609375, 1.383453369140625, 1.4344024658203125, 1.4853515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 5.0, 4.0, 7.0, 9.0, 12.0, 13.0, 33.0, 43.0, 55.0, 106.0, 207.0, 435.0, 1224.0, 3752.0, 13331.0, 62779.0, 543615.0, 3295557.0, 224766.0, 35757.0, 8526.0, 2396.0, 851.0, 341.0, 153.0, 96.0, 57.0, 39.0, 31.0, 16.0, 19.0, 9.0, 10.0, 5.0, 4.0, 5.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.8828125, -7.5833740234375, -7.283935546875, -6.9844970703125, -6.68505859375, -6.3856201171875, -6.086181640625, -5.7867431640625, -5.4873046875, -5.1878662109375, -4.888427734375, -4.5889892578125, -4.28955078125, -3.9901123046875, -3.690673828125, -3.3912353515625, -3.091796875, -2.7923583984375, -2.492919921875, -2.1934814453125, -1.89404296875, -1.5946044921875, -1.295166015625, -0.9957275390625, -0.6962890625, -0.3968505859375, -0.097412109375, 0.2020263671875, 0.50146484375, 0.8009033203125, 1.100341796875, 1.3997802734375, 1.69921875, 1.9986572265625, 2.298095703125, 2.5975341796875, 2.89697265625, 3.1964111328125, 3.495849609375, 3.7952880859375, 4.0947265625, 4.3941650390625, 4.693603515625, 4.9930419921875, 5.29248046875, 5.5919189453125, 5.891357421875, 6.1907958984375, 6.490234375, 6.7896728515625, 7.089111328125, 7.3885498046875, 7.68798828125, 7.9874267578125, 8.286865234375, 8.5863037109375, 8.8857421875, 9.1851806640625, 9.484619140625, 9.7840576171875, 10.08349609375, 10.3829345703125, 10.682373046875, 10.9818115234375, 11.28125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 10.0, 14.0, 20.0, 29.0, 31.0, 62.0, 92.0, 178.0, 303.0, 730.0, 1521.0, 499.0, 217.0, 135.0, 76.0, 56.0, 31.0, 23.0, 12.0, 13.0, 4.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3125, -1.25079345703125, -1.1890869140625, -1.12738037109375, -1.065673828125, -1.00396728515625, -0.9422607421875, -0.88055419921875, -0.81884765625, -0.75714111328125, -0.6954345703125, -0.63372802734375, -0.572021484375, -0.51031494140625, -0.4486083984375, -0.38690185546875, -0.3251953125, -0.26348876953125, -0.2017822265625, -0.14007568359375, -0.078369140625, -0.01666259765625, 0.0450439453125, 0.10675048828125, 0.16845703125, 0.23016357421875, 0.2918701171875, 0.35357666015625, 0.415283203125, 0.47698974609375, 0.5386962890625, 0.60040283203125, 0.662109375, 0.72381591796875, 0.7855224609375, 0.84722900390625, 0.908935546875, 0.97064208984375, 1.0323486328125, 1.09405517578125, 1.15576171875, 1.21746826171875, 1.2791748046875, 1.34088134765625, 1.402587890625, 1.46429443359375, 1.5260009765625, 1.58770751953125, 1.6494140625, 1.71112060546875, 1.7728271484375, 1.83453369140625, 1.896240234375, 1.95794677734375, 2.0196533203125, 2.08135986328125, 2.14306640625, 2.20477294921875, 2.2664794921875, 2.32818603515625, 2.389892578125, 2.45159912109375, 2.5133056640625, 2.57501220703125, 2.63671875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 18.0, 29.0, 46.0, 84.0, 120.0, 167.0, 175.0, 121.0, 103.0, 55.0, 26.0, 17.0, 8.0, 9.0, 7.0, 2.0, 1.0, 0.0, 2.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.369020462036133, -7.928933143615723, -7.4888458251953125, -7.048758506774902, -6.60867166519165, -6.16858434677124, -5.72849702835083, -5.288410186767578, -4.848322868347168, -4.408235549926758, -3.9681484699249268, -3.5280611515045166, -3.0879740715026855, -2.6478867530822754, -2.2077994346618652, -1.7677123546600342, -1.327624797821045, -0.8875375986099243, -0.44745033979415894, -0.007363080978393555, 0.43272411823272705, 0.8728113174438477, 1.3128986358642578, 1.7529857158660889, 2.193073034286499, 2.633160352706909, 3.0732474327087402, 3.5133347511291504, 3.9534220695495605, 4.3935089111328125, 4.833596229553223, 5.273683547973633, 5.713770866394043, 6.153858184814453, 6.593945503234863, 7.034032821655273, 7.474119663238525, 7.9142069816589355, 8.354293823242188, 8.794381141662598, 9.234468460083008, 9.674555778503418, 10.114643096923828, 10.554730415344238, 10.994817733764648, 11.434904098510742, 11.874992370605469, 12.315078735351562, 12.755167007446289, 13.1952543258667, 13.63534164428711, 14.07542896270752, 14.51551628112793, 14.955602645874023, 15.39569091796875, 15.835777282714844, 16.275863647460938, 16.71595001220703, 17.156038284301758, 17.59612464904785, 18.036212921142578, 18.476299285888672, 18.9163875579834, 19.356473922729492, 19.79656219482422]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 5.0, 6.0, 8.0, 9.0, 10.0, 8.0, 15.0, 22.0, 18.0, 25.0, 21.0, 24.0, 33.0, 35.0, 39.0, 45.0, 49.0, 42.0, 52.0, 44.0, 38.0, 44.0, 55.0, 37.0, 43.0, 32.0, 36.0, 22.0, 25.0, 24.0, 22.0, 23.0, 18.0, 13.0, 17.0, 7.0, 9.0, 4.0, 8.0, 7.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-5.768826961517334, -5.593883991241455, -5.418941020965576, -5.243998050689697, -5.069055557250977, -4.894112586975098, -4.719169616699219, -4.54422664642334, -4.369283676147461, -4.194340705871582, -4.019397735595703, -3.8444550037384033, -3.6695120334625244, -3.4945690631866455, -3.3196263313293457, -3.144683361053467, -2.969740390777588, -2.794797420501709, -2.61985445022583, -2.4449117183685303, -2.2699687480926514, -2.0950257778167725, -1.920082926750183, -1.7451400756835938, -1.5701971054077148, -1.395254135131836, -1.2203112840652466, -1.0453684329986572, -0.8704254627227783, -0.6954825520515442, -0.5205396413803101, -0.3455967903137207, -0.1706533432006836, 0.004289567470550537, 0.17923247814178467, 0.3541753888130188, 0.5291182994842529, 0.7040612101554871, 0.8790041208267212, 1.0539469718933105, 1.2288899421691895, 1.4038329124450684, 1.5787757635116577, 1.753718614578247, 1.928661584854126, 2.103604555130005, 2.2785472869873047, 2.4534902572631836, 2.6284332275390625, 2.8033761978149414, 2.9783191680908203, 3.15326189994812, 3.328204870223999, 3.503147840499878, 3.6780905723571777, 3.8530335426330566, 4.0279765129089355, 4.2029194831848145, 4.377862453460693, 4.552805423736572, 4.727747917175293, 4.902690887451172, 5.077633857727051, 5.25257682800293, 5.427519798278809]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 9.0, 6.0, 15.0, 16.0, 28.0, 30.0, 52.0, 79.0, 118.0, 181.0, 290.0, 507.0, 1013.0, 1971.0, 4633.0, 12775.0, 43554.0, 151959.0, 357852.0, 310783.0, 113659.0, 31888.0, 9878.0, 3678.0, 1621.0, 825.0, 392.0, 270.0, 178.0, 94.0, 69.0, 40.0, 20.0, 21.0, 10.0, 7.0, 13.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.54296875, -6.33770751953125, -6.1324462890625, -5.92718505859375, -5.721923828125, -5.51666259765625, -5.3114013671875, -5.10614013671875, -4.90087890625, -4.69561767578125, -4.4903564453125, -4.28509521484375, -4.079833984375, -3.87457275390625, -3.6693115234375, -3.46405029296875, -3.2587890625, -3.05352783203125, -2.8482666015625, -2.64300537109375, -2.437744140625, -2.23248291015625, -2.0272216796875, -1.82196044921875, -1.61669921875, -1.41143798828125, -1.2061767578125, -1.00091552734375, -0.795654296875, -0.59039306640625, -0.3851318359375, -0.17987060546875, 0.025390625, 0.23065185546875, 0.4359130859375, 0.64117431640625, 0.846435546875, 1.05169677734375, 1.2569580078125, 1.46221923828125, 1.66748046875, 1.87274169921875, 2.0780029296875, 2.28326416015625, 2.488525390625, 2.69378662109375, 2.8990478515625, 3.10430908203125, 3.3095703125, 3.51483154296875, 3.7200927734375, 3.92535400390625, 4.130615234375, 4.33587646484375, 4.5411376953125, 4.74639892578125, 4.95166015625, 5.15692138671875, 5.3621826171875, 5.56744384765625, 5.772705078125, 5.97796630859375, 6.1832275390625, 6.38848876953125, 6.59375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 12.0, 19.0, 28.0, 43.0, 62.0, 96.0, 104.0, 122.0, 128.0, 111.0, 87.0, 74.0, 41.0, 29.0, 16.0, 7.0, 10.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.591796875, -1.5447235107421875, -1.497650146484375, -1.4505767822265625, -1.40350341796875, -1.3564300537109375, -1.309356689453125, -1.2622833251953125, -1.2152099609375, -1.1681365966796875, -1.121063232421875, -1.0739898681640625, -1.02691650390625, -0.9798431396484375, -0.932769775390625, -0.8856964111328125, -0.838623046875, -0.7915496826171875, -0.744476318359375, -0.6974029541015625, -0.65032958984375, -0.6032562255859375, -0.556182861328125, -0.5091094970703125, -0.4620361328125, -0.4149627685546875, -0.367889404296875, -0.3208160400390625, -0.27374267578125, -0.2266693115234375, -0.179595947265625, -0.1325225830078125, -0.08544921875, -0.0383758544921875, 0.008697509765625, 0.0557708740234375, 0.10284423828125, 0.1499176025390625, 0.196990966796875, 0.2440643310546875, 0.2911376953125, 0.3382110595703125, 0.385284423828125, 0.4323577880859375, 0.47943115234375, 0.5265045166015625, 0.573577880859375, 0.6206512451171875, 0.667724609375, 0.7147979736328125, 0.761871337890625, 0.8089447021484375, 0.85601806640625, 0.9030914306640625, 0.950164794921875, 0.9972381591796875, 1.0443115234375, 1.0913848876953125, 1.138458251953125, 1.1855316162109375, 1.23260498046875, 1.2796783447265625, 1.326751708984375, 1.3738250732421875, 1.4208984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 7.0, 8.0, 6.0, 8.0, 17.0, 21.0, 37.0, 50.0, 76.0, 102.0, 148.0, 252.0, 370.0, 576.0, 976.0, 1808.0, 4077.0, 11865.0, 43690.0, 160824.0, 372104.0, 305203.0, 104140.0, 27636.0, 7915.0, 2906.0, 1426.0, 802.0, 518.0, 321.0, 201.0, 140.0, 87.0, 78.0, 51.0, 37.0, 24.0, 18.0, 11.0, 15.0, 4.0, 1.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.64453125, -6.428955078125, -6.21337890625, -5.997802734375, -5.7822265625, -5.566650390625, -5.35107421875, -5.135498046875, -4.919921875, -4.704345703125, -4.48876953125, -4.273193359375, -4.0576171875, -3.842041015625, -3.62646484375, -3.410888671875, -3.1953125, -2.979736328125, -2.76416015625, -2.548583984375, -2.3330078125, -2.117431640625, -1.90185546875, -1.686279296875, -1.470703125, -1.255126953125, -1.03955078125, -0.823974609375, -0.6083984375, -0.392822265625, -0.17724609375, 0.038330078125, 0.25390625, 0.469482421875, 0.68505859375, 0.900634765625, 1.1162109375, 1.331787109375, 1.54736328125, 1.762939453125, 1.978515625, 2.194091796875, 2.40966796875, 2.625244140625, 2.8408203125, 3.056396484375, 3.27197265625, 3.487548828125, 3.703125, 3.918701171875, 4.13427734375, 4.349853515625, 4.5654296875, 4.781005859375, 4.99658203125, 5.212158203125, 5.427734375, 5.643310546875, 5.85888671875, 6.074462890625, 6.2900390625, 6.505615234375, 6.72119140625, 6.936767578125, 7.15234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 3.0, 6.0, 5.0, 16.0, 22.0, 12.0, 24.0, 24.0, 30.0, 37.0, 31.0, 37.0, 47.0, 49.0, 58.0, 45.0, 46.0, 60.0, 46.0, 39.0, 42.0, 38.0, 41.0, 35.0, 31.0, 26.0, 26.0, 13.0, 17.0, 20.0, 7.0, 11.0, 12.0, 8.0, 7.0, 6.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.77734375, -4.64227294921875, -4.5072021484375, -4.37213134765625, -4.237060546875, -4.10198974609375, -3.9669189453125, -3.83184814453125, -3.69677734375, -3.56170654296875, -3.4266357421875, -3.29156494140625, -3.156494140625, -3.02142333984375, -2.8863525390625, -2.75128173828125, -2.6162109375, -2.48114013671875, -2.3460693359375, -2.21099853515625, -2.075927734375, -1.94085693359375, -1.8057861328125, -1.67071533203125, -1.53564453125, -1.40057373046875, -1.2655029296875, -1.13043212890625, -0.995361328125, -0.86029052734375, -0.7252197265625, -0.59014892578125, -0.455078125, -0.32000732421875, -0.1849365234375, -0.04986572265625, 0.085205078125, 0.22027587890625, 0.3553466796875, 0.49041748046875, 0.62548828125, 0.76055908203125, 0.8956298828125, 1.03070068359375, 1.165771484375, 1.30084228515625, 1.4359130859375, 1.57098388671875, 1.7060546875, 1.84112548828125, 1.9761962890625, 2.11126708984375, 2.246337890625, 2.38140869140625, 2.5164794921875, 2.65155029296875, 2.78662109375, 2.92169189453125, 3.0567626953125, 3.19183349609375, 3.326904296875, 3.46197509765625, 3.5970458984375, 3.73211669921875, 3.8671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 10.0, 10.0, 5.0, 16.0, 15.0, 21.0, 36.0, 56.0, 68.0, 168.0, 266.0, 529.0, 1093.0, 2380.0, 6756.0, 23873.0, 97593.0, 355485.0, 397704.0, 120582.0, 28515.0, 7921.0, 2858.0, 1209.0, 580.0, 298.0, 188.0, 113.0, 61.0, 46.0, 26.0, 21.0, 13.0, 10.0, 11.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.802734375, -3.662261962890625, -3.52178955078125, -3.381317138671875, -3.2408447265625, -3.100372314453125, -2.95989990234375, -2.819427490234375, -2.678955078125, -2.538482666015625, -2.39801025390625, -2.257537841796875, -2.1170654296875, -1.976593017578125, -1.83612060546875, -1.695648193359375, -1.55517578125, -1.414703369140625, -1.27423095703125, -1.133758544921875, -0.9932861328125, -0.852813720703125, -0.71234130859375, -0.571868896484375, -0.431396484375, -0.290924072265625, -0.15045166015625, -0.009979248046875, 0.1304931640625, 0.270965576171875, 0.41143798828125, 0.551910400390625, 0.6923828125, 0.832855224609375, 0.97332763671875, 1.113800048828125, 1.2542724609375, 1.394744873046875, 1.53521728515625, 1.675689697265625, 1.816162109375, 1.956634521484375, 2.09710693359375, 2.237579345703125, 2.3780517578125, 2.518524169921875, 2.65899658203125, 2.799468994140625, 2.93994140625, 3.080413818359375, 3.22088623046875, 3.361358642578125, 3.5018310546875, 3.642303466796875, 3.78277587890625, 3.923248291015625, 4.063720703125, 4.204193115234375, 4.34466552734375, 4.485137939453125, 4.6256103515625, 4.766082763671875, 4.90655517578125, 5.047027587890625, 5.1875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 7.0, 2.0, 5.0, 8.0, 8.0, 11.0, 12.0, 17.0, 27.0, 20.0, 30.0, 36.0, 40.0, 47.0, 57.0, 68.0, 50.0, 60.0, 50.0, 50.0, 55.0, 48.0, 54.0, 34.0, 37.0, 27.0, 33.0, 24.0, 9.0, 10.0, 11.0, 8.0, 11.0, 12.0, 6.0, 1.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004258155822753906, -0.0004119984805583954, -0.00039818137884140015, -0.0003843642771244049, -0.00037054717540740967, -0.00035673007369041443, -0.0003429129719734192, -0.00032909587025642395, -0.0003152787685394287, -0.00030146166682243347, -0.00028764456510543823, -0.000273827463388443, -0.00026001036167144775, -0.0002461932599544525, -0.00023237615823745728, -0.00021855905652046204, -0.0002047419548034668, -0.00019092485308647156, -0.00017710775136947632, -0.00016329064965248108, -0.00014947354793548584, -0.0001356564462184906, -0.00012183934450149536, -0.00010802224278450012, -9.420514106750488e-05, -8.038803935050964e-05, -6.65709376335144e-05, -5.2753835916519165e-05, -3.8936734199523926e-05, -2.5119632482528687e-05, -1.1302530765533447e-05, 2.514570951461792e-06, 1.633167266845703e-05, 3.014877438545227e-05, 4.396587610244751e-05, 5.778297781944275e-05, 7.160007953643799e-05, 8.541718125343323e-05, 9.923428297042847e-05, 0.0001130513846874237, 0.00012686848640441895, 0.00014068558812141418, 0.00015450268983840942, 0.00016831979155540466, 0.0001821368932723999, 0.00019595399498939514, 0.00020977109670639038, 0.00022358819842338562, 0.00023740530014038086, 0.0002512224018573761, 0.00026503950357437134, 0.0002788566052913666, 0.0002926737070083618, 0.00030649080872535706, 0.0003203079104423523, 0.00033412501215934753, 0.0003479421138763428, 0.000361759215593338, 0.00037557631731033325, 0.0003893934190273285, 0.00040321052074432373, 0.00041702762246131897, 0.0004308447241783142, 0.00044466182589530945, 0.0004584789276123047]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 14.0, 15.0, 16.0, 25.0, 34.0, 53.0, 87.0, 105.0, 152.0, 263.0, 419.0, 678.0, 1241.0, 2427.0, 5714.0, 15922.0, 53461.0, 194337.0, 433311.0, 239830.0, 67778.0, 19689.0, 6773.0, 2829.0, 1383.0, 709.0, 444.0, 267.0, 168.0, 131.0, 64.0, 45.0, 51.0, 22.0, 21.0, 22.0, 10.0, 12.0, 5.0, 2.0, 3.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.10546875, -3.9794921875, -3.853515625, -3.7275390625, -3.6015625, -3.4755859375, -3.349609375, -3.2236328125, -3.09765625, -2.9716796875, -2.845703125, -2.7197265625, -2.59375, -2.4677734375, -2.341796875, -2.2158203125, -2.08984375, -1.9638671875, -1.837890625, -1.7119140625, -1.5859375, -1.4599609375, -1.333984375, -1.2080078125, -1.08203125, -0.9560546875, -0.830078125, -0.7041015625, -0.578125, -0.4521484375, -0.326171875, -0.2001953125, -0.07421875, 0.0517578125, 0.177734375, 0.3037109375, 0.4296875, 0.5556640625, 0.681640625, 0.8076171875, 0.93359375, 1.0595703125, 1.185546875, 1.3115234375, 1.4375, 1.5634765625, 1.689453125, 1.8154296875, 1.94140625, 2.0673828125, 2.193359375, 2.3193359375, 2.4453125, 2.5712890625, 2.697265625, 2.8232421875, 2.94921875, 3.0751953125, 3.201171875, 3.3271484375, 3.453125, 3.5791015625, 3.705078125, 3.8310546875, 3.95703125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 8.0, 10.0, 17.0, 21.0, 24.0, 29.0, 28.0, 40.0, 41.0, 67.0, 75.0, 90.0, 80.0, 72.0, 67.0, 71.0, 54.0, 49.0, 36.0, 20.0, 20.0, 20.0, 13.0, 9.0, 11.0, 4.0, 7.0, 9.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.41796875, -3.32720947265625, -3.2364501953125, -3.14569091796875, -3.054931640625, -2.96417236328125, -2.8734130859375, -2.78265380859375, -2.69189453125, -2.60113525390625, -2.5103759765625, -2.41961669921875, -2.328857421875, -2.23809814453125, -2.1473388671875, -2.05657958984375, -1.9658203125, -1.87506103515625, -1.7843017578125, -1.69354248046875, -1.602783203125, -1.51202392578125, -1.4212646484375, -1.33050537109375, -1.23974609375, -1.14898681640625, -1.0582275390625, -0.96746826171875, -0.876708984375, -0.78594970703125, -0.6951904296875, -0.60443115234375, -0.513671875, -0.42291259765625, -0.3321533203125, -0.24139404296875, -0.150634765625, -0.05987548828125, 0.0308837890625, 0.12164306640625, 0.21240234375, 0.30316162109375, 0.3939208984375, 0.48468017578125, 0.575439453125, 0.66619873046875, 0.7569580078125, 0.84771728515625, 0.9384765625, 1.02923583984375, 1.1199951171875, 1.21075439453125, 1.301513671875, 1.39227294921875, 1.4830322265625, 1.57379150390625, 1.66455078125, 1.75531005859375, 1.8460693359375, 1.93682861328125, 2.027587890625, 2.11834716796875, 2.2091064453125, 2.29986572265625, 2.390625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 25.0, 67.0, 159.0, 305.0, 247.0, 140.0, 40.0, 14.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.303070068359375, -36.24065017700195, -33.178226470947266, -30.115806579589844, -27.05338478088379, -23.990962982177734, -20.928543090820312, -17.866121292114258, -14.803699493408203, -11.741277694702148, -8.67885684967041, -5.616436004638672, -2.554014205932617, 0.5084075927734375, 3.5708274841308594, 6.633249282836914, 9.695671081542969, 12.758092880249023, 15.820513725280762, 18.8829345703125, 21.945356369018555, 25.00777816772461, 28.07019805908203, 31.132619857788086, 34.19504165649414, 37.25746154785156, 40.31988525390625, 43.38230514526367, 46.444725036621094, 49.50714874267578, 52.5695686340332, 55.631988525390625, 58.69441223144531, 61.756832122802734, 64.81925201416016, 67.88167572021484, 70.94409942626953, 74.00651550292969, 77.06893920898438, 80.13136291503906, 83.19378662109375, 86.25621032714844, 89.3186264038086, 92.38105010986328, 95.44347381591797, 98.50588989257812, 101.56831359863281, 104.6307373046875, 107.69315338134766, 110.75557708740234, 113.8179931640625, 116.88041687011719, 119.94284057617188, 123.00526428222656, 126.06768035888672, 129.13009643554688, 132.19252014160156, 135.25494384765625, 138.31736755371094, 141.37979125976562, 144.44219970703125, 147.50462341308594, 150.56704711914062, 153.6294708251953, 156.69189453125]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 1.0, 5.0, 9.0, 9.0, 14.0, 16.0, 23.0, 21.0, 6.0, 24.0, 22.0, 36.0, 30.0, 41.0, 36.0, 41.0, 51.0, 43.0, 42.0, 53.0, 41.0, 28.0, 27.0, 43.0, 35.0, 41.0, 37.0, 33.0, 23.0, 26.0, 19.0, 18.0, 24.0, 14.0, 5.0, 11.0, 10.0, 6.0, 9.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.380706787109375, -25.531200408935547, -24.68169403076172, -23.83218765258789, -22.982681274414062, -22.133174896240234, -21.28367042541504, -20.43416404724121, -19.584657669067383, -18.735151290893555, -17.885644912719727, -17.0361385345459, -16.186634063720703, -15.337126731872559, -14.487621307373047, -13.638114929199219, -12.78860855102539, -11.939102172851562, -11.089595794677734, -10.240090370178223, -9.390583992004395, -8.541077613830566, -7.6915717124938965, -6.842065811157227, -5.992559432983398, -5.14305305480957, -4.2935471534729, -3.4440410137176514, -2.5945348739624023, -1.7450284957885742, -0.8955225944519043, -0.046016693115234375, 0.8034896850585938, 1.6529958248138428, 2.502501964569092, 3.352008104324341, 4.20151424407959, 5.051020622253418, 5.900526523590088, 6.750032424926758, 7.599538803100586, 8.449045181274414, 9.298551559448242, 10.148056983947754, 10.997563362121582, 11.84706974029541, 12.696575164794922, 13.54608154296875, 14.395587921142578, 15.245094299316406, 16.094600677490234, 16.944107055664062, 17.79361343383789, 18.64311981201172, 19.492624282836914, 20.342130661010742, 21.19163703918457, 22.0411434173584, 22.890649795532227, 23.740156173706055, 24.58966064453125, 25.439167022705078, 26.288673400878906, 27.138179779052734, 27.987686157226562]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 10.0, 12.0, 14.0, 21.0, 42.0, 57.0, 95.0, 152.0, 225.0, 404.0, 875.0, 2009.0, 5681.0, 21796.0, 151195.0, 3639388.0, 326193.0, 34438.0, 7380.0, 2339.0, 942.0, 454.0, 219.0, 131.0, 71.0, 43.0, 27.0, 15.0, 13.0, 9.0, 8.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.56524658203125, -8.3179931640625, -8.07073974609375, -7.823486328125, -7.57623291015625, -7.3289794921875, -7.08172607421875, -6.83447265625, -6.58721923828125, -6.3399658203125, -6.09271240234375, -5.845458984375, -5.59820556640625, -5.3509521484375, -5.10369873046875, -4.8564453125, -4.60919189453125, -4.3619384765625, -4.11468505859375, -3.867431640625, -3.62017822265625, -3.3729248046875, -3.12567138671875, -2.87841796875, -2.63116455078125, -2.3839111328125, -2.13665771484375, -1.889404296875, -1.64215087890625, -1.3948974609375, -1.14764404296875, -0.900390625, -0.65313720703125, -0.4058837890625, -0.15863037109375, 0.088623046875, 0.33587646484375, 0.5831298828125, 0.83038330078125, 1.07763671875, 1.32489013671875, 1.5721435546875, 1.81939697265625, 2.066650390625, 2.31390380859375, 2.5611572265625, 2.80841064453125, 3.0556640625, 3.30291748046875, 3.5501708984375, 3.79742431640625, 4.044677734375, 4.29193115234375, 4.5391845703125, 4.78643798828125, 5.03369140625, 5.28094482421875, 5.5281982421875, 5.77545166015625, 6.022705078125, 6.26995849609375, 6.5172119140625, 6.76446533203125, 7.01171875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 6.0, 11.0, 22.0, 16.0, 35.0, 55.0, 75.0, 80.0, 104.0, 96.0, 109.0, 92.0, 89.0, 67.0, 52.0, 36.0, 21.0, 14.0, 10.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.732421875, -1.679534912109375, -1.62664794921875, -1.573760986328125, -1.5208740234375, -1.467987060546875, -1.41510009765625, -1.362213134765625, -1.309326171875, -1.256439208984375, -1.20355224609375, -1.150665283203125, -1.0977783203125, -1.044891357421875, -0.99200439453125, -0.939117431640625, -0.88623046875, -0.833343505859375, -0.78045654296875, -0.727569580078125, -0.6746826171875, -0.621795654296875, -0.56890869140625, -0.516021728515625, -0.463134765625, -0.410247802734375, -0.35736083984375, -0.304473876953125, -0.2515869140625, -0.198699951171875, -0.14581298828125, -0.092926025390625, -0.0400390625, 0.012847900390625, 0.06573486328125, 0.118621826171875, 0.1715087890625, 0.224395751953125, 0.27728271484375, 0.330169677734375, 0.383056640625, 0.435943603515625, 0.48883056640625, 0.541717529296875, 0.5946044921875, 0.647491455078125, 0.70037841796875, 0.753265380859375, 0.80615234375, 0.859039306640625, 0.91192626953125, 0.964813232421875, 1.0177001953125, 1.070587158203125, 1.12347412109375, 1.176361083984375, 1.229248046875, 1.282135009765625, 1.33502197265625, 1.387908935546875, 1.4407958984375, 1.493682861328125, 1.54656982421875, 1.599456787109375, 1.65234375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 7.0, 8.0, 14.0, 21.0, 25.0, 40.0, 52.0, 74.0, 144.0, 243.0, 581.0, 1531.0, 5464.0, 29730.0, 329183.0, 3584263.0, 213075.0, 22748.0, 4573.0, 1354.0, 541.0, 243.0, 147.0, 91.0, 46.0, 33.0, 14.0, 13.0, 13.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8671875, -10.5843505859375, -10.301513671875, -10.0186767578125, -9.73583984375, -9.4530029296875, -9.170166015625, -8.8873291015625, -8.6044921875, -8.3216552734375, -8.038818359375, -7.7559814453125, -7.47314453125, -7.1903076171875, -6.907470703125, -6.6246337890625, -6.341796875, -6.0589599609375, -5.776123046875, -5.4932861328125, -5.21044921875, -4.9276123046875, -4.644775390625, -4.3619384765625, -4.0791015625, -3.7962646484375, -3.513427734375, -3.2305908203125, -2.94775390625, -2.6649169921875, -2.382080078125, -2.0992431640625, -1.81640625, -1.5335693359375, -1.250732421875, -0.9678955078125, -0.68505859375, -0.4022216796875, -0.119384765625, 0.1634521484375, 0.4462890625, 0.7291259765625, 1.011962890625, 1.2947998046875, 1.57763671875, 1.8604736328125, 2.143310546875, 2.4261474609375, 2.708984375, 2.9918212890625, 3.274658203125, 3.5574951171875, 3.84033203125, 4.1231689453125, 4.406005859375, 4.6888427734375, 4.9716796875, 5.2545166015625, 5.537353515625, 5.8201904296875, 6.10302734375, 6.3858642578125, 6.668701171875, 6.9515380859375, 7.234375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 8.0, 13.0, 21.0, 56.0, 92.0, 222.0, 513.0, 1981.0, 665.0, 243.0, 129.0, 62.0, 25.0, 13.0, 14.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.6875, -3.6009063720703125, -3.514312744140625, -3.4277191162109375, -3.34112548828125, -3.2545318603515625, -3.167938232421875, -3.0813446044921875, -2.9947509765625, -2.9081573486328125, -2.821563720703125, -2.7349700927734375, -2.64837646484375, -2.5617828369140625, -2.475189208984375, -2.3885955810546875, -2.302001953125, -2.2154083251953125, -2.128814697265625, -2.0422210693359375, -1.95562744140625, -1.8690338134765625, -1.782440185546875, -1.6958465576171875, -1.6092529296875, -1.5226593017578125, -1.436065673828125, -1.3494720458984375, -1.26287841796875, -1.1762847900390625, -1.089691162109375, -1.0030975341796875, -0.91650390625, -0.8299102783203125, -0.743316650390625, -0.6567230224609375, -0.57012939453125, -0.4835357666015625, -0.396942138671875, -0.3103485107421875, -0.2237548828125, -0.1371612548828125, -0.050567626953125, 0.0360260009765625, 0.12261962890625, 0.2092132568359375, 0.295806884765625, 0.3824005126953125, 0.468994140625, 0.5555877685546875, 0.642181396484375, 0.7287750244140625, 0.81536865234375, 0.9019622802734375, 0.988555908203125, 1.0751495361328125, 1.1617431640625, 1.2483367919921875, 1.334930419921875, 1.4215240478515625, 1.50811767578125, 1.5947113037109375, 1.681304931640625, 1.7678985595703125, 1.8544921875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 10.0, 29.0, 71.0, 144.0, 241.0, 219.0, 162.0, 67.0, 36.0, 14.0, 11.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.246376037597656, -12.619275093078613, -11.99217414855957, -11.365072250366211, -10.737971305847168, -10.110870361328125, -9.483768463134766, -8.856667518615723, -8.22956657409668, -7.602465629577637, -6.9753642082214355, -6.348262786865234, -5.721161842346191, -5.094060897827148, -4.466959476470947, -3.839858055114746, -3.212757110595703, -2.585655927658081, -1.958554744720459, -1.331453561782837, -0.7043523788452148, -0.07725119590759277, 0.5498499870300293, 1.1769514083862305, 1.8040523529052734, 2.4311535358428955, 3.0582547187805176, 3.6853559017181396, 4.312457084655762, 4.939558029174805, 5.566659450531006, 6.193760871887207, 6.820859909057617, 7.44796085357666, 8.075061798095703, 8.702163696289062, 9.329264640808105, 9.956365585327148, 10.583467483520508, 11.21056842803955, 11.837669372558594, 12.464770317077637, 13.09187126159668, 13.718973159790039, 14.346074104309082, 14.973175048828125, 15.600276947021484, 16.227378845214844, 16.85447883605957, 17.48158073425293, 18.108680725097656, 18.735782623291016, 19.362884521484375, 19.9899845123291, 20.61708641052246, 21.244186401367188, 21.871288299560547, 22.498390197753906, 23.125490188598633, 23.752592086791992, 24.37969207763672, 25.006793975830078, 25.633895874023438, 26.260997772216797, 26.888097763061523]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 1.0, 5.0, 4.0, 5.0, 3.0, 10.0, 10.0, 16.0, 24.0, 13.0, 22.0, 34.0, 19.0, 33.0, 29.0, 43.0, 50.0, 47.0, 42.0, 38.0, 51.0, 43.0, 51.0, 40.0, 48.0, 42.0, 44.0, 41.0, 29.0, 34.0, 22.0, 13.0, 25.0, 10.0, 11.0, 8.0, 20.0, 4.0, 5.0, 5.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.204717636108398, -6.021749019622803, -5.838780403137207, -5.6558122634887695, -5.472843647003174, -5.289875030517578, -5.106906414031982, -4.923937797546387, -4.740969657897949, -4.5580010414123535, -4.375032424926758, -4.19206428527832, -4.009095668792725, -3.826127052307129, -3.643158435821533, -3.4601900577545166, -3.277221441268921, -3.094252824783325, -2.9112844467163086, -2.728315830230713, -2.5453474521636963, -2.3623788356781006, -2.179410457611084, -1.9964418411254883, -1.8134733438491821, -1.630504846572876, -1.4475363492965698, -1.2645678520202637, -1.081599235534668, -0.8986307978630066, -0.7156622409820557, -0.5326937437057495, -0.34972524642944336, -0.166756734251976, 0.016211777925491333, 0.19918030500411987, 0.382148802280426, 0.5651172995567322, 0.7480858564376831, 0.9310543537139893, 1.1140228509902954, 1.2969913482666016, 1.4799598455429077, 1.6629283428192139, 1.8458969593048096, 2.028865337371826, 2.211833953857422, 2.3948025703430176, 2.577770948410034, 2.76073956489563, 2.9437079429626465, 3.126676559448242, 3.309644937515259, 3.4926135540008545, 3.675581932067871, 3.858550548553467, 4.0415191650390625, 4.224487781524658, 4.407456398010254, 4.590424537658691, 4.773393154144287, 4.956361770629883, 5.1393303871154785, 5.322299003601074, 5.505267143249512]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 3.0, 7.0, 14.0, 18.0, 16.0, 22.0, 24.0, 56.0, 65.0, 99.0, 117.0, 185.0, 296.0, 487.0, 872.0, 1674.0, 3482.0, 7533.0, 17608.0, 41852.0, 97969.0, 204265.0, 289638.0, 207118.0, 99788.0, 42247.0, 17883.0, 7681.0, 3463.0, 1695.0, 955.0, 509.0, 302.0, 204.0, 115.0, 90.0, 66.0, 37.0, 26.0, 20.0, 18.0, 10.0, 12.0, 8.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.53515625, -4.407440185546875, -4.27972412109375, -4.152008056640625, -4.0242919921875, -3.896575927734375, -3.76885986328125, -3.641143798828125, -3.513427734375, -3.385711669921875, -3.25799560546875, -3.130279541015625, -3.0025634765625, -2.874847412109375, -2.74713134765625, -2.619415283203125, -2.49169921875, -2.363983154296875, -2.23626708984375, -2.108551025390625, -1.9808349609375, -1.853118896484375, -1.72540283203125, -1.597686767578125, -1.469970703125, -1.342254638671875, -1.21453857421875, -1.086822509765625, -0.9591064453125, -0.831390380859375, -0.70367431640625, -0.575958251953125, -0.4482421875, -0.320526123046875, -0.19281005859375, -0.065093994140625, 0.0626220703125, 0.190338134765625, 0.31805419921875, 0.445770263671875, 0.573486328125, 0.701202392578125, 0.82891845703125, 0.956634521484375, 1.0843505859375, 1.212066650390625, 1.33978271484375, 1.467498779296875, 1.59521484375, 1.722930908203125, 1.85064697265625, 1.978363037109375, 2.1060791015625, 2.233795166015625, 2.36151123046875, 2.489227294921875, 2.616943359375, 2.744659423828125, 2.87237548828125, 3.000091552734375, 3.1278076171875, 3.255523681640625, 3.38323974609375, 3.510955810546875, 3.638671875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 10.0, 12.0, 15.0, 23.0, 30.0, 43.0, 56.0, 85.0, 72.0, 115.0, 114.0, 105.0, 75.0, 75.0, 65.0, 37.0, 30.0, 18.0, 12.0, 9.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7783203125, -1.7247161865234375, -1.671112060546875, -1.6175079345703125, -1.56390380859375, -1.5102996826171875, -1.456695556640625, -1.4030914306640625, -1.3494873046875, -1.2958831787109375, -1.242279052734375, -1.1886749267578125, -1.13507080078125, -1.0814666748046875, -1.027862548828125, -0.9742584228515625, -0.920654296875, -0.8670501708984375, -0.813446044921875, -0.7598419189453125, -0.70623779296875, -0.6526336669921875, -0.599029541015625, -0.5454254150390625, -0.4918212890625, -0.4382171630859375, -0.384613037109375, -0.3310089111328125, -0.27740478515625, -0.2238006591796875, -0.170196533203125, -0.1165924072265625, -0.06298828125, -0.0093841552734375, 0.044219970703125, 0.0978240966796875, 0.15142822265625, 0.2050323486328125, 0.258636474609375, 0.3122406005859375, 0.3658447265625, 0.4194488525390625, 0.473052978515625, 0.5266571044921875, 0.58026123046875, 0.6338653564453125, 0.687469482421875, 0.7410736083984375, 0.794677734375, 0.8482818603515625, 0.901885986328125, 0.9554901123046875, 1.00909423828125, 1.0626983642578125, 1.116302490234375, 1.1699066162109375, 1.2235107421875, 1.2771148681640625, 1.330718994140625, 1.3843231201171875, 1.43792724609375, 1.4915313720703125, 1.545135498046875, 1.5987396240234375, 1.65234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 1.0, 10.0, 5.0, 9.0, 11.0, 15.0, 27.0, 34.0, 45.0, 49.0, 63.0, 112.0, 123.0, 158.0, 257.0, 335.0, 468.0, 638.0, 1102.0, 2002.0, 4614.0, 12974.0, 40334.0, 124363.0, 290632.0, 327491.0, 160029.0, 53618.0, 16842.0, 5862.0, 2532.0, 1231.0, 766.0, 475.0, 347.0, 274.0, 168.0, 146.0, 116.0, 69.0, 64.0, 32.0, 20.0, 23.0, 21.0, 13.0, 10.0, 6.0, 8.0, 4.0, 5.0, 0.0, 2.0, 1.0, 1.0], "bins": [-5.3046875, -5.14923095703125, -4.9937744140625, -4.83831787109375, -4.682861328125, -4.52740478515625, -4.3719482421875, -4.21649169921875, -4.06103515625, -3.90557861328125, -3.7501220703125, -3.59466552734375, -3.439208984375, -3.28375244140625, -3.1282958984375, -2.97283935546875, -2.8173828125, -2.66192626953125, -2.5064697265625, -2.35101318359375, -2.195556640625, -2.04010009765625, -1.8846435546875, -1.72918701171875, -1.57373046875, -1.41827392578125, -1.2628173828125, -1.10736083984375, -0.951904296875, -0.79644775390625, -0.6409912109375, -0.48553466796875, -0.330078125, -0.17462158203125, -0.0191650390625, 0.13629150390625, 0.291748046875, 0.44720458984375, 0.6026611328125, 0.75811767578125, 0.91357421875, 1.06903076171875, 1.2244873046875, 1.37994384765625, 1.535400390625, 1.69085693359375, 1.8463134765625, 2.00177001953125, 2.1572265625, 2.31268310546875, 2.4681396484375, 2.62359619140625, 2.779052734375, 2.93450927734375, 3.0899658203125, 3.24542236328125, 3.40087890625, 3.55633544921875, 3.7117919921875, 3.86724853515625, 4.022705078125, 4.17816162109375, 4.3336181640625, 4.48907470703125, 4.64453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 6.0, 10.0, 15.0, 6.0, 24.0, 20.0, 23.0, 23.0, 33.0, 24.0, 35.0, 27.0, 30.0, 57.0, 47.0, 66.0, 43.0, 52.0, 47.0, 48.0, 56.0, 34.0, 44.0, 32.0, 33.0, 33.0, 19.0, 17.0, 19.0, 10.0, 18.0, 7.0, 11.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.67578125, -5.51336669921875, -5.3509521484375, -5.18853759765625, -5.026123046875, -4.86370849609375, -4.7012939453125, -4.53887939453125, -4.37646484375, -4.21405029296875, -4.0516357421875, -3.88922119140625, -3.726806640625, -3.56439208984375, -3.4019775390625, -3.23956298828125, -3.0771484375, -2.91473388671875, -2.7523193359375, -2.58990478515625, -2.427490234375, -2.26507568359375, -2.1026611328125, -1.94024658203125, -1.77783203125, -1.61541748046875, -1.4530029296875, -1.29058837890625, -1.128173828125, -0.96575927734375, -0.8033447265625, -0.64093017578125, -0.478515625, -0.31610107421875, -0.1536865234375, 0.00872802734375, 0.171142578125, 0.33355712890625, 0.4959716796875, 0.65838623046875, 0.82080078125, 0.98321533203125, 1.1456298828125, 1.30804443359375, 1.470458984375, 1.63287353515625, 1.7952880859375, 1.95770263671875, 2.1201171875, 2.28253173828125, 2.4449462890625, 2.60736083984375, 2.769775390625, 2.93218994140625, 3.0946044921875, 3.25701904296875, 3.41943359375, 3.58184814453125, 3.7442626953125, 3.90667724609375, 4.069091796875, 4.23150634765625, 4.3939208984375, 4.55633544921875, 4.71875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 2.0, 9.0, 6.0, 14.0, 11.0, 15.0, 11.0, 21.0, 33.0, 41.0, 65.0, 103.0, 153.0, 197.0, 375.0, 726.0, 1426.0, 3081.0, 7524.0, 20307.0, 62461.0, 220450.0, 441496.0, 201150.0, 57199.0, 18640.0, 7075.0, 2943.0, 1302.0, 676.0, 359.0, 223.0, 131.0, 93.0, 68.0, 46.0, 32.0, 21.0, 13.0, 16.0, 12.0, 9.0, 4.0, 6.0, 6.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.74609375, -2.6588134765625, -2.571533203125, -2.4842529296875, -2.39697265625, -2.3096923828125, -2.222412109375, -2.1351318359375, -2.0478515625, -1.9605712890625, -1.873291015625, -1.7860107421875, -1.69873046875, -1.6114501953125, -1.524169921875, -1.4368896484375, -1.349609375, -1.2623291015625, -1.175048828125, -1.0877685546875, -1.00048828125, -0.9132080078125, -0.825927734375, -0.7386474609375, -0.6513671875, -0.5640869140625, -0.476806640625, -0.3895263671875, -0.30224609375, -0.2149658203125, -0.127685546875, -0.0404052734375, 0.046875, 0.1341552734375, 0.221435546875, 0.3087158203125, 0.39599609375, 0.4832763671875, 0.570556640625, 0.6578369140625, 0.7451171875, 0.8323974609375, 0.919677734375, 1.0069580078125, 1.09423828125, 1.1815185546875, 1.268798828125, 1.3560791015625, 1.443359375, 1.5306396484375, 1.617919921875, 1.7052001953125, 1.79248046875, 1.8797607421875, 1.967041015625, 2.0543212890625, 2.1416015625, 2.2288818359375, 2.316162109375, 2.4034423828125, 2.49072265625, 2.5780029296875, 2.665283203125, 2.7525634765625, 2.83984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 6.0, 8.0, 5.0, 17.0, 16.0, 19.0, 16.0, 28.0, 31.0, 26.0, 39.0, 43.0, 56.0, 69.0, 83.0, 84.0, 71.0, 66.0, 64.0, 50.0, 39.0, 25.0, 23.0, 23.0, 11.0, 12.0, 13.0, 15.0, 6.0, 8.0, 6.0, 5.0, 7.0, 7.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004036426544189453, -0.0003899820148944855, -0.00037632137537002563, -0.0003626607358455658, -0.00034900009632110596, -0.0003353394567966461, -0.0003216788172721863, -0.00030801817774772644, -0.0002943575382232666, -0.00028069689869880676, -0.0002670362591743469, -0.0002533756196498871, -0.00023971498012542725, -0.0002260543406009674, -0.00021239370107650757, -0.00019873306155204773, -0.0001850724220275879, -0.00017141178250312805, -0.0001577511429786682, -0.00014409050345420837, -0.00013042986392974854, -0.0001167692244052887, -0.00010310858488082886, -8.944794535636902e-05, -7.578730583190918e-05, -6.212666630744934e-05, -4.84660267829895e-05, -3.480538725852966e-05, -2.1144747734069824e-05, -7.484108209609985e-06, 6.1765313148498535e-06, 1.9837170839309692e-05, 3.349781036376953e-05, 4.715844988822937e-05, 6.081908941268921e-05, 7.447972893714905e-05, 8.814036846160889e-05, 0.00010180100798606873, 0.00011546164751052856, 0.0001291222870349884, 0.00014278292655944824, 0.00015644356608390808, 0.00017010420560836792, 0.00018376484513282776, 0.0001974254846572876, 0.00021108612418174744, 0.00022474676370620728, 0.00023840740323066711, 0.00025206804275512695, 0.0002657286822795868, 0.00027938932180404663, 0.00029304996132850647, 0.0003067106008529663, 0.00032037124037742615, 0.000334031879901886, 0.0003476925194263458, 0.00036135315895080566, 0.0003750137984752655, 0.00038867443799972534, 0.0004023350775241852, 0.000415995717048645, 0.00042965635657310486, 0.0004433169960975647, 0.00045697763562202454, 0.0004706382751464844]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 6.0, 9.0, 13.0, 13.0, 21.0, 33.0, 46.0, 65.0, 81.0, 153.0, 256.0, 423.0, 792.0, 1694.0, 4213.0, 13479.0, 54330.0, 315889.0, 521657.0, 101940.0, 22197.0, 6356.0, 2524.0, 989.0, 535.0, 279.0, 164.0, 126.0, 74.0, 53.0, 35.0, 30.0, 13.0, 8.0, 9.0, 11.0, 12.0, 7.0, 6.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.892578125, -3.763641357421875, -3.63470458984375, -3.505767822265625, -3.3768310546875, -3.247894287109375, -3.11895751953125, -2.990020751953125, -2.861083984375, -2.732147216796875, -2.60321044921875, -2.474273681640625, -2.3453369140625, -2.216400146484375, -2.08746337890625, -1.958526611328125, -1.82958984375, -1.700653076171875, -1.57171630859375, -1.442779541015625, -1.3138427734375, -1.184906005859375, -1.05596923828125, -0.927032470703125, -0.798095703125, -0.669158935546875, -0.54022216796875, -0.411285400390625, -0.2823486328125, -0.153411865234375, -0.02447509765625, 0.104461669921875, 0.2333984375, 0.362335205078125, 0.49127197265625, 0.620208740234375, 0.7491455078125, 0.878082275390625, 1.00701904296875, 1.135955810546875, 1.264892578125, 1.393829345703125, 1.52276611328125, 1.651702880859375, 1.7806396484375, 1.909576416015625, 2.03851318359375, 2.167449951171875, 2.29638671875, 2.425323486328125, 2.55426025390625, 2.683197021484375, 2.8121337890625, 2.941070556640625, 3.07000732421875, 3.198944091796875, 3.327880859375, 3.456817626953125, 3.58575439453125, 3.714691162109375, 3.8436279296875, 3.972564697265625, 4.10150146484375, 4.230438232421875, 4.359375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 5.0, 8.0, 11.0, 10.0, 16.0, 20.0, 24.0, 28.0, 39.0, 27.0, 42.0, 60.0, 53.0, 75.0, 72.0, 73.0, 65.0, 61.0, 39.0, 50.0, 29.0, 27.0, 27.0, 22.0, 22.0, 13.0, 11.0, 10.0, 8.0, 8.0, 7.0, 9.0, 5.0, 7.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6220703125, -1.5624542236328125, -1.502838134765625, -1.4432220458984375, -1.38360595703125, -1.3239898681640625, -1.264373779296875, -1.2047576904296875, -1.1451416015625, -1.0855255126953125, -1.025909423828125, -0.9662933349609375, -0.90667724609375, -0.8470611572265625, -0.787445068359375, -0.7278289794921875, -0.668212890625, -0.6085968017578125, -0.548980712890625, -0.4893646240234375, -0.42974853515625, -0.3701324462890625, -0.310516357421875, -0.2509002685546875, -0.1912841796875, -0.1316680908203125, -0.072052001953125, -0.0124359130859375, 0.04718017578125, 0.1067962646484375, 0.166412353515625, 0.2260284423828125, 0.28564453125, 0.3452606201171875, 0.404876708984375, 0.4644927978515625, 0.52410888671875, 0.5837249755859375, 0.643341064453125, 0.7029571533203125, 0.7625732421875, 0.8221893310546875, 0.881805419921875, 0.9414215087890625, 1.00103759765625, 1.0606536865234375, 1.120269775390625, 1.1798858642578125, 1.239501953125, 1.2991180419921875, 1.358734130859375, 1.4183502197265625, 1.47796630859375, 1.5375823974609375, 1.597198486328125, 1.6568145751953125, 1.7164306640625, 1.7760467529296875, 1.835662841796875, 1.8952789306640625, 1.95489501953125, 2.0145111083984375, 2.074127197265625, 2.1337432861328125, 2.193359375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 5.0, 26.0, 50.0, 74.0, 132.0, 196.0, 196.0, 149.0, 86.0, 47.0, 23.0, 9.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.794200897216797, -16.93906021118164, -15.083918571472168, -13.228776931762695, -11.373636245727539, -9.518495559692383, -7.66335391998291, -5.8082122802734375, -3.9530715942382812, -2.097930431365967, -0.24278926849365234, 1.612351894378662, 3.4674930572509766, 5.322633743286133, 7.1777753829956055, 9.032917022705078, 10.888057708740234, 12.74319839477539, 14.598340034484863, 16.453481674194336, 18.308622360229492, 20.16376304626465, 22.018905639648438, 23.874046325683594, 25.72918701171875, 27.584327697753906, 29.439468383789062, 31.29461097717285, 33.149749755859375, 35.00489044189453, 36.86003494262695, 38.71517562866211, 40.5703125, 42.425453186035156, 44.28059387207031, 46.13573455810547, 47.990875244140625, 49.84601593017578, 51.7011604309082, 53.55630111694336, 55.411441802978516, 57.26658248901367, 59.12172317504883, 60.976863861083984, 62.832008361816406, 64.68714904785156, 66.54228973388672, 68.39743041992188, 70.25257110595703, 72.10771179199219, 73.96285247802734, 75.8179931640625, 77.67313385009766, 79.52827453613281, 81.38341522216797, 83.23855590820312, 85.09370422363281, 86.94884490966797, 88.80398559570312, 90.65912628173828, 92.51426696777344, 94.3694076538086, 96.22454833984375, 98.07969665527344, 99.93482971191406]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 3.0, 4.0, 8.0, 9.0, 3.0, 12.0, 13.0, 12.0, 18.0, 23.0, 37.0, 34.0, 39.0, 30.0, 35.0, 44.0, 38.0, 48.0, 41.0, 63.0, 48.0, 46.0, 38.0, 51.0, 48.0, 38.0, 42.0, 29.0, 32.0, 19.0, 20.0, 18.0, 10.0, 14.0, 9.0, 13.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.29789733886719, -34.340919494628906, -33.38393783569336, -32.42695999145508, -31.469982147216797, -30.513002395629883, -29.55602264404297, -28.599044799804688, -27.642065048217773, -26.68508529663086, -25.728107452392578, -24.771127700805664, -23.81414794921875, -22.85717010498047, -21.900190353393555, -20.94321060180664, -19.98623275756836, -19.029253005981445, -18.072275161743164, -17.11529541015625, -16.15831756591797, -15.201337814331055, -14.24435806274414, -13.287379264831543, -12.330400466918945, -11.373421669006348, -10.41644287109375, -9.459463119506836, -8.502484321594238, -7.545505523681641, -6.588526248931885, -5.631546974182129, -4.674568176269531, -3.7175891399383545, -2.7606101036071777, -1.803631067276001, -0.8466520309448242, 0.11032676696777344, 1.0673060417175293, 2.024285316467285, 2.981264114379883, 3.9382431507110596, 4.895222187042236, 5.852201461791992, 6.80918025970459, 7.7661590576171875, 8.723138809204102, 9.6801176071167, 10.637096405029297, 11.594075202941895, 12.551054000854492, 13.508033752441406, 14.465012550354004, 15.421991348266602, 16.378971099853516, 17.335948944091797, 18.29292869567871, 19.249908447265625, 20.206886291503906, 21.16386604309082, 22.120845794677734, 23.077823638916016, 24.03480339050293, 24.991783142089844, 25.948760986328125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 10.0, 12.0, 14.0, 12.0, 20.0, 42.0, 55.0, 96.0, 181.0, 348.0, 666.0, 1398.0, 3277.0, 8566.0, 28740.0, 172449.0, 3632601.0, 289333.0, 39073.0, 10327.0, 3913.0, 1564.0, 760.0, 357.0, 184.0, 104.0, 67.0, 29.0, 24.0, 15.0, 8.0, 8.0, 8.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-7.3359375, -7.15069580078125, -6.9654541015625, -6.78021240234375, -6.594970703125, -6.40972900390625, -6.2244873046875, -6.03924560546875, -5.85400390625, -5.66876220703125, -5.4835205078125, -5.29827880859375, -5.113037109375, -4.92779541015625, -4.7425537109375, -4.55731201171875, -4.3720703125, -4.18682861328125, -4.0015869140625, -3.81634521484375, -3.631103515625, -3.44586181640625, -3.2606201171875, -3.07537841796875, -2.89013671875, -2.70489501953125, -2.5196533203125, -2.33441162109375, -2.149169921875, -1.96392822265625, -1.7786865234375, -1.59344482421875, -1.408203125, -1.22296142578125, -1.0377197265625, -0.85247802734375, -0.667236328125, -0.48199462890625, -0.2967529296875, -0.11151123046875, 0.07373046875, 0.25897216796875, 0.4442138671875, 0.62945556640625, 0.814697265625, 0.99993896484375, 1.1851806640625, 1.37042236328125, 1.5556640625, 1.74090576171875, 1.9261474609375, 2.11138916015625, 2.296630859375, 2.48187255859375, 2.6671142578125, 2.85235595703125, 3.03759765625, 3.22283935546875, 3.4080810546875, 3.59332275390625, 3.778564453125, 3.96380615234375, 4.1490478515625, 4.33428955078125, 4.51953125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 6.0, 9.0, 18.0, 21.0, 35.0, 46.0, 54.0, 47.0, 76.0, 85.0, 82.0, 85.0, 83.0, 78.0, 66.0, 48.0, 46.0, 33.0, 27.0, 18.0, 13.0, 8.0, 3.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5712890625, -1.5207061767578125, -1.470123291015625, -1.4195404052734375, -1.36895751953125, -1.3183746337890625, -1.267791748046875, -1.2172088623046875, -1.1666259765625, -1.1160430908203125, -1.065460205078125, -1.0148773193359375, -0.96429443359375, -0.9137115478515625, -0.863128662109375, -0.8125457763671875, -0.761962890625, -0.7113800048828125, -0.660797119140625, -0.6102142333984375, -0.55963134765625, -0.5090484619140625, -0.458465576171875, -0.4078826904296875, -0.3572998046875, -0.3067169189453125, -0.256134033203125, -0.2055511474609375, -0.15496826171875, -0.1043853759765625, -0.053802490234375, -0.0032196044921875, 0.04736328125, 0.0979461669921875, 0.148529052734375, 0.1991119384765625, 0.24969482421875, 0.3002777099609375, 0.350860595703125, 0.4014434814453125, 0.4520263671875, 0.5026092529296875, 0.553192138671875, 0.6037750244140625, 0.65435791015625, 0.7049407958984375, 0.755523681640625, 0.8061065673828125, 0.856689453125, 0.9072723388671875, 0.957855224609375, 1.0084381103515625, 1.05902099609375, 1.1096038818359375, 1.160186767578125, 1.2107696533203125, 1.2613525390625, 1.3119354248046875, 1.362518310546875, 1.4131011962890625, 1.46368408203125, 1.5142669677734375, 1.564849853515625, 1.6154327392578125, 1.666015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 8.0, 13.0, 15.0, 25.0, 63.0, 114.0, 205.0, 359.0, 832.0, 1953.0, 4956.0, 14762.0, 54506.0, 290995.0, 3107649.0, 592755.0, 90359.0, 22492.0, 7164.0, 2795.0, 1189.0, 522.0, 239.0, 130.0, 72.0, 42.0, 25.0, 15.0, 7.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.59698486328125, -4.4517822265625, -4.30657958984375, -4.161376953125, -4.01617431640625, -3.8709716796875, -3.72576904296875, -3.58056640625, -3.43536376953125, -3.2901611328125, -3.14495849609375, -2.999755859375, -2.85455322265625, -2.7093505859375, -2.56414794921875, -2.4189453125, -2.27374267578125, -2.1285400390625, -1.98333740234375, -1.838134765625, -1.69293212890625, -1.5477294921875, -1.40252685546875, -1.25732421875, -1.11212158203125, -0.9669189453125, -0.82171630859375, -0.676513671875, -0.53131103515625, -0.3861083984375, -0.24090576171875, -0.095703125, 0.04949951171875, 0.1947021484375, 0.33990478515625, 0.485107421875, 0.63031005859375, 0.7755126953125, 0.92071533203125, 1.06591796875, 1.21112060546875, 1.3563232421875, 1.50152587890625, 1.646728515625, 1.79193115234375, 1.9371337890625, 2.08233642578125, 2.2275390625, 2.37274169921875, 2.5179443359375, 2.66314697265625, 2.808349609375, 2.95355224609375, 3.0987548828125, 3.24395751953125, 3.38916015625, 3.53436279296875, 3.6795654296875, 3.82476806640625, 3.969970703125, 4.11517333984375, 4.2603759765625, 4.40557861328125, 4.55078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 3.0, 4.0, 6.0, 6.0, 10.0, 4.0, 11.0, 18.0, 21.0, 39.0, 50.0, 72.0, 122.0, 180.0, 334.0, 663.0, 1279.0, 485.0, 256.0, 157.0, 101.0, 69.0, 51.0, 35.0, 26.0, 17.0, 19.0, 11.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.26171875, -1.2226409912109375, -1.183563232421875, -1.1444854736328125, -1.10540771484375, -1.0663299560546875, -1.027252197265625, -0.9881744384765625, -0.9490966796875, -0.9100189208984375, -0.870941162109375, -0.8318634033203125, -0.79278564453125, -0.7537078857421875, -0.714630126953125, -0.6755523681640625, -0.636474609375, -0.5973968505859375, -0.558319091796875, -0.5192413330078125, -0.48016357421875, -0.4410858154296875, -0.402008056640625, -0.3629302978515625, -0.3238525390625, -0.2847747802734375, -0.245697021484375, -0.2066192626953125, -0.16754150390625, -0.1284637451171875, -0.089385986328125, -0.0503082275390625, -0.01123046875, 0.0278472900390625, 0.066925048828125, 0.1060028076171875, 0.14508056640625, 0.1841583251953125, 0.223236083984375, 0.2623138427734375, 0.3013916015625, 0.3404693603515625, 0.379547119140625, 0.4186248779296875, 0.45770263671875, 0.4967803955078125, 0.535858154296875, 0.5749359130859375, 0.614013671875, 0.6530914306640625, 0.692169189453125, 0.7312469482421875, 0.77032470703125, 0.8094024658203125, 0.848480224609375, 0.8875579833984375, 0.9266357421875, 0.9657135009765625, 1.004791259765625, 1.0438690185546875, 1.08294677734375, 1.1220245361328125, 1.161102294921875, 1.2001800537109375, 1.2392578125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 10.0, 14.0, 38.0, 58.0, 124.0, 150.0, 174.0, 175.0, 125.0, 69.0, 31.0, 18.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.773329734802246, -8.382299423217773, -7.991269588470459, -7.6002397537231445, -7.209209442138672, -6.818179130554199, -6.427149295806885, -6.03611946105957, -5.645089149475098, -5.254058837890625, -4.8630290031433105, -4.471999168395996, -4.080968856811523, -3.68993878364563, -3.2989087104797363, -2.9078786373138428, -2.516848564147949, -2.1258184909820557, -1.734788417816162, -1.3437583446502686, -0.952728271484375, -0.5616981983184814, -0.1706681251525879, 0.22036194801330566, 0.6113920211791992, 1.0024220943450928, 1.3934521675109863, 1.7844822406768799, 2.1755123138427734, 2.566542387008667, 2.9575724601745605, 3.348602533340454, 3.739633560180664, 4.130663871765137, 4.521693706512451, 4.912723541259766, 5.303753852844238, 5.694784164428711, 6.085813999176025, 6.47684383392334, 6.8678741455078125, 7.258904457092285, 7.6499342918396, 8.040964126586914, 8.431994438171387, 8.82302474975586, 9.214054107666016, 9.605084419250488, 9.996114730834961, 10.387145042419434, 10.778175354003906, 11.169204711914062, 11.560235023498535, 11.951265335083008, 12.342294692993164, 12.733325004577637, 13.12435531616211, 13.515385627746582, 13.906415939331055, 14.297445297241211, 14.688475608825684, 15.079505920410156, 15.470535278320312, 15.861565589904785, 16.252595901489258]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 7.0, 11.0, 14.0, 17.0, 20.0, 17.0, 25.0, 25.0, 23.0, 28.0, 21.0, 34.0, 35.0, 48.0, 43.0, 41.0, 37.0, 41.0, 62.0, 47.0, 36.0, 36.0, 37.0, 36.0, 29.0, 33.0, 34.0, 26.0, 29.0, 18.0, 19.0, 8.0, 13.0, 11.0, 7.0, 5.0, 5.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8656554222106934, -3.7314722537994385, -3.5972890853881836, -3.4631059169769287, -3.328922748565674, -3.194739580154419, -3.060556411743164, -2.92637300491333, -2.7921900749206543, -2.6580069065093994, -2.5238237380981445, -2.3896405696868896, -2.2554574012756348, -2.12127423286438, -1.9870909452438354, -1.8529077768325806, -1.7187244892120361, -1.5845413208007812, -1.4503581523895264, -1.3161749839782715, -1.1819918155670166, -1.0478086471557617, -0.9136253595352173, -0.7794421911239624, -0.6452590227127075, -0.5110758543014526, -0.37689265608787537, -0.2427094578742981, -0.10852628946304321, 0.02565687894821167, 0.15984010696411133, 0.2940232753753662, 0.4282064437866211, 0.562389612197876, 0.6965727806091309, 0.8307560086250305, 0.9649391770362854, 1.0991222858428955, 1.23330557346344, 1.3674887418746948, 1.5016719102859497, 1.6358550786972046, 1.7700382471084595, 1.904221534729004, 2.038404703140259, 2.1725878715515137, 2.3067710399627686, 2.4409542083740234, 2.5751373767852783, 2.709320545196533, 2.843503713607788, 2.977686882019043, 3.111870050430298, 3.2460532188415527, 3.3802366256713867, 3.5144195556640625, 3.6486029624938965, 3.7827861309051514, 3.9169692993164062, 4.05115270614624, 4.185335636138916, 4.31951904296875, 4.453701972961426, 4.58788537979126, 4.7220683097839355]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 9.0, 15.0, 18.0, 16.0, 40.0, 58.0, 113.0, 165.0, 295.0, 656.0, 1316.0, 3231.0, 8552.0, 29626.0, 123639.0, 391629.0, 350966.0, 100966.0, 24666.0, 7402.0, 2712.0, 1230.0, 564.0, 283.0, 160.0, 86.0, 46.0, 34.0, 18.0, 14.0, 10.0, 10.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.77734375, -6.58331298828125, -6.3892822265625, -6.19525146484375, -6.001220703125, -5.80718994140625, -5.6131591796875, -5.41912841796875, -5.22509765625, -5.03106689453125, -4.8370361328125, -4.64300537109375, -4.448974609375, -4.25494384765625, -4.0609130859375, -3.86688232421875, -3.6728515625, -3.47882080078125, -3.2847900390625, -3.09075927734375, -2.896728515625, -2.70269775390625, -2.5086669921875, -2.31463623046875, -2.12060546875, -1.92657470703125, -1.7325439453125, -1.53851318359375, -1.344482421875, -1.15045166015625, -0.9564208984375, -0.76239013671875, -0.568359375, -0.37432861328125, -0.1802978515625, 0.01373291015625, 0.207763671875, 0.40179443359375, 0.5958251953125, 0.78985595703125, 0.98388671875, 1.17791748046875, 1.3719482421875, 1.56597900390625, 1.760009765625, 1.95404052734375, 2.1480712890625, 2.34210205078125, 2.5361328125, 2.73016357421875, 2.9241943359375, 3.11822509765625, 3.312255859375, 3.50628662109375, 3.7003173828125, 3.89434814453125, 4.08837890625, 4.28240966796875, 4.4764404296875, 4.67047119140625, 4.864501953125, 5.05853271484375, 5.2525634765625, 5.44659423828125, 5.640625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 8.0, 6.0, 11.0, 11.0, 21.0, 31.0, 41.0, 51.0, 64.0, 66.0, 85.0, 92.0, 88.0, 95.0, 77.0, 72.0, 45.0, 39.0, 39.0, 20.0, 24.0, 10.0, 6.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.73828125, -1.68414306640625, -1.6300048828125, -1.57586669921875, -1.521728515625, -1.46759033203125, -1.4134521484375, -1.35931396484375, -1.30517578125, -1.25103759765625, -1.1968994140625, -1.14276123046875, -1.088623046875, -1.03448486328125, -0.9803466796875, -0.92620849609375, -0.8720703125, -0.81793212890625, -0.7637939453125, -0.70965576171875, -0.655517578125, -0.60137939453125, -0.5472412109375, -0.49310302734375, -0.43896484375, -0.38482666015625, -0.3306884765625, -0.27655029296875, -0.222412109375, -0.16827392578125, -0.1141357421875, -0.05999755859375, -0.005859375, 0.04827880859375, 0.1024169921875, 0.15655517578125, 0.210693359375, 0.26483154296875, 0.3189697265625, 0.37310791015625, 0.42724609375, 0.48138427734375, 0.5355224609375, 0.58966064453125, 0.643798828125, 0.69793701171875, 0.7520751953125, 0.80621337890625, 0.8603515625, 0.91448974609375, 0.9686279296875, 1.02276611328125, 1.076904296875, 1.13104248046875, 1.1851806640625, 1.23931884765625, 1.29345703125, 1.34759521484375, 1.4017333984375, 1.45587158203125, 1.510009765625, 1.56414794921875, 1.6182861328125, 1.67242431640625, 1.7265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 6.0, 4.0, 6.0, 19.0, 27.0, 40.0, 67.0, 76.0, 113.0, 208.0, 298.0, 474.0, 831.0, 1745.0, 5428.0, 27809.0, 201790.0, 582260.0, 191637.0, 26494.0, 5291.0, 1696.0, 857.0, 485.0, 302.0, 214.0, 119.0, 94.0, 63.0, 36.0, 31.0, 12.0, 9.0, 9.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.1484375, -7.8896484375, -7.630859375, -7.3720703125, -7.11328125, -6.8544921875, -6.595703125, -6.3369140625, -6.078125, -5.8193359375, -5.560546875, -5.3017578125, -5.04296875, -4.7841796875, -4.525390625, -4.2666015625, -4.0078125, -3.7490234375, -3.490234375, -3.2314453125, -2.97265625, -2.7138671875, -2.455078125, -2.1962890625, -1.9375, -1.6787109375, -1.419921875, -1.1611328125, -0.90234375, -0.6435546875, -0.384765625, -0.1259765625, 0.1328125, 0.3916015625, 0.650390625, 0.9091796875, 1.16796875, 1.4267578125, 1.685546875, 1.9443359375, 2.203125, 2.4619140625, 2.720703125, 2.9794921875, 3.23828125, 3.4970703125, 3.755859375, 4.0146484375, 4.2734375, 4.5322265625, 4.791015625, 5.0498046875, 5.30859375, 5.5673828125, 5.826171875, 6.0849609375, 6.34375, 6.6025390625, 6.861328125, 7.1201171875, 7.37890625, 7.6376953125, 7.896484375, 8.1552734375, 8.4140625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 4.0, 8.0, 9.0, 5.0, 11.0, 12.0, 26.0, 23.0, 29.0, 39.0, 32.0, 25.0, 45.0, 41.0, 44.0, 38.0, 45.0, 51.0, 41.0, 46.0, 49.0, 59.0, 43.0, 50.0, 43.0, 25.0, 18.0, 19.0, 18.0, 24.0, 6.0, 16.0, 12.0, 9.0, 2.0, 8.0, 4.0, 3.0, 5.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.31640625, -5.1365966796875, -4.956787109375, -4.7769775390625, -4.59716796875, -4.4173583984375, -4.237548828125, -4.0577392578125, -3.8779296875, -3.6981201171875, -3.518310546875, -3.3385009765625, -3.15869140625, -2.9788818359375, -2.799072265625, -2.6192626953125, -2.439453125, -2.2596435546875, -2.079833984375, -1.9000244140625, -1.72021484375, -1.5404052734375, -1.360595703125, -1.1807861328125, -1.0009765625, -0.8211669921875, -0.641357421875, -0.4615478515625, -0.28173828125, -0.1019287109375, 0.077880859375, 0.2576904296875, 0.4375, 0.6173095703125, 0.797119140625, 0.9769287109375, 1.15673828125, 1.3365478515625, 1.516357421875, 1.6961669921875, 1.8759765625, 2.0557861328125, 2.235595703125, 2.4154052734375, 2.59521484375, 2.7750244140625, 2.954833984375, 3.1346435546875, 3.314453125, 3.4942626953125, 3.674072265625, 3.8538818359375, 4.03369140625, 4.2135009765625, 4.393310546875, 4.5731201171875, 4.7529296875, 4.9327392578125, 5.112548828125, 5.2923583984375, 5.47216796875, 5.6519775390625, 5.831787109375, 6.0115966796875, 6.19140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 13.0, 7.0, 10.0, 9.0, 13.0, 22.0, 23.0, 48.0, 78.0, 104.0, 221.0, 553.0, 1702.0, 7351.0, 54445.0, 801185.0, 165220.0, 13232.0, 2767.0, 857.0, 306.0, 145.0, 82.0, 48.0, 31.0, 20.0, 18.0, 15.0, 8.0, 5.0, 7.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.046875, -7.7928466796875, -7.538818359375, -7.2847900390625, -7.03076171875, -6.7767333984375, -6.522705078125, -6.2686767578125, -6.0146484375, -5.7606201171875, -5.506591796875, -5.2525634765625, -4.99853515625, -4.7445068359375, -4.490478515625, -4.2364501953125, -3.982421875, -3.7283935546875, -3.474365234375, -3.2203369140625, -2.96630859375, -2.7122802734375, -2.458251953125, -2.2042236328125, -1.9501953125, -1.6961669921875, -1.442138671875, -1.1881103515625, -0.93408203125, -0.6800537109375, -0.426025390625, -0.1719970703125, 0.08203125, 0.3360595703125, 0.590087890625, 0.8441162109375, 1.09814453125, 1.3521728515625, 1.606201171875, 1.8602294921875, 2.1142578125, 2.3682861328125, 2.622314453125, 2.8763427734375, 3.13037109375, 3.3843994140625, 3.638427734375, 3.8924560546875, 4.146484375, 4.4005126953125, 4.654541015625, 4.9085693359375, 5.16259765625, 5.4166259765625, 5.670654296875, 5.9246826171875, 6.1787109375, 6.4327392578125, 6.686767578125, 6.9407958984375, 7.19482421875, 7.4488525390625, 7.702880859375, 7.9569091796875, 8.2109375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 9.0, 14.0, 16.0, 21.0, 24.0, 40.0, 64.0, 95.0, 113.0, 138.0, 115.0, 91.0, 56.0, 47.0, 45.0, 30.0, 28.0, 9.0, 13.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0007061958312988281, -0.0006851628422737122, -0.0006641298532485962, -0.0006430968642234802, -0.0006220638751983643, -0.0006010308861732483, -0.0005799978971481323, -0.0005589649081230164, -0.0005379319190979004, -0.0005168989300727844, -0.0004958659410476685, -0.0004748329520225525, -0.0004537999629974365, -0.00043276697397232056, -0.0004117339849472046, -0.0003907009959220886, -0.00036966800689697266, -0.0003486350178718567, -0.0003276020288467407, -0.00030656903982162476, -0.0002855360507965088, -0.0002645030617713928, -0.00024347007274627686, -0.0002224370837211609, -0.00020140409469604492, -0.00018037110567092896, -0.000159338116645813, -0.00013830512762069702, -0.00011727213859558105, -9.623914957046509e-05, -7.520616054534912e-05, -5.4173171520233154e-05, -3.314018249511719e-05, -1.210719347000122e-05, 8.925795555114746e-06, 2.9958784580230713e-05, 5.099177360534668e-05, 7.202476263046265e-05, 9.305775165557861e-05, 0.00011409074068069458, 0.00013512372970581055, 0.00015615671873092651, 0.00017718970775604248, 0.00019822269678115845, 0.00021925568580627441, 0.00024028867483139038, 0.00026132166385650635, 0.0002823546528816223, 0.0003033876419067383, 0.00032442063093185425, 0.0003454536199569702, 0.0003664866089820862, 0.00038751959800720215, 0.0004085525870323181, 0.0004295855760574341, 0.00045061856508255005, 0.000471651554107666, 0.000492684543132782, 0.000513717532157898, 0.0005347505211830139, 0.0005557835102081299, 0.0005768164992332458, 0.0005978494882583618, 0.0006188824772834778, 0.0006399154663085938]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 3.0, 7.0, 15.0, 16.0, 18.0, 21.0, 25.0, 40.0, 55.0, 79.0, 133.0, 192.0, 353.0, 800.0, 1637.0, 4142.0, 13504.0, 107529.0, 818814.0, 82337.0, 11859.0, 3743.0, 1540.0, 712.0, 352.0, 195.0, 117.0, 73.0, 52.0, 39.0, 31.0, 29.0, 14.0, 11.0, 10.0, 10.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.47265625, -6.24517822265625, -6.0177001953125, -5.79022216796875, -5.562744140625, -5.33526611328125, -5.1077880859375, -4.88031005859375, -4.65283203125, -4.42535400390625, -4.1978759765625, -3.97039794921875, -3.742919921875, -3.51544189453125, -3.2879638671875, -3.06048583984375, -2.8330078125, -2.60552978515625, -2.3780517578125, -2.15057373046875, -1.923095703125, -1.69561767578125, -1.4681396484375, -1.24066162109375, -1.01318359375, -0.78570556640625, -0.5582275390625, -0.33074951171875, -0.103271484375, 0.12420654296875, 0.3516845703125, 0.57916259765625, 0.806640625, 1.03411865234375, 1.2615966796875, 1.48907470703125, 1.716552734375, 1.94403076171875, 2.1715087890625, 2.39898681640625, 2.62646484375, 2.85394287109375, 3.0814208984375, 3.30889892578125, 3.536376953125, 3.76385498046875, 3.9913330078125, 4.21881103515625, 4.4462890625, 4.67376708984375, 4.9012451171875, 5.12872314453125, 5.356201171875, 5.58367919921875, 5.8111572265625, 6.03863525390625, 6.26611328125, 6.49359130859375, 6.7210693359375, 6.94854736328125, 7.176025390625, 7.40350341796875, 7.6309814453125, 7.85845947265625, 8.0859375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 7.0, 8.0, 13.0, 14.0, 15.0, 39.0, 52.0, 110.0, 224.0, 203.0, 138.0, 63.0, 34.0, 20.0, 9.0, 16.0, 4.0, 7.0, 9.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.93359375, -7.71380615234375, -7.4940185546875, -7.27423095703125, -7.054443359375, -6.83465576171875, -6.6148681640625, -6.39508056640625, -6.17529296875, -5.95550537109375, -5.7357177734375, -5.51593017578125, -5.296142578125, -5.07635498046875, -4.8565673828125, -4.63677978515625, -4.4169921875, -4.19720458984375, -3.9774169921875, -3.75762939453125, -3.537841796875, -3.31805419921875, -3.0982666015625, -2.87847900390625, -2.65869140625, -2.43890380859375, -2.2191162109375, -1.99932861328125, -1.779541015625, -1.55975341796875, -1.3399658203125, -1.12017822265625, -0.900390625, -0.68060302734375, -0.4608154296875, -0.24102783203125, -0.021240234375, 0.19854736328125, 0.4183349609375, 0.63812255859375, 0.85791015625, 1.07769775390625, 1.2974853515625, 1.51727294921875, 1.737060546875, 1.95684814453125, 2.1766357421875, 2.39642333984375, 2.6162109375, 2.83599853515625, 3.0557861328125, 3.27557373046875, 3.495361328125, 3.71514892578125, 3.9349365234375, 4.15472412109375, 4.37451171875, 4.59429931640625, 4.8140869140625, 5.03387451171875, 5.253662109375, 5.47344970703125, 5.6932373046875, 5.91302490234375, 6.1328125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 1.0, 7.0, 24.0, 53.0, 163.0, 208.0, 246.0, 169.0, 79.0, 29.0, 8.0, 8.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.39131164550781, -75.95218658447266, -73.5130615234375, -71.07394409179688, -68.63481903076172, -66.19569396972656, -63.75657272338867, -61.31745147705078, -58.878326416015625, -56.43920135498047, -54.00008010864258, -51.56095886230469, -49.12183380126953, -46.682708740234375, -44.243587493896484, -41.804466247558594, -39.36534118652344, -36.92621612548828, -34.48709487915039, -32.0479736328125, -29.608848571777344, -27.16972541809082, -24.730602264404297, -22.291479110717773, -19.85235595703125, -17.413232803344727, -14.974109649658203, -12.53498649597168, -10.095863342285156, -7.656740188598633, -5.217617034912109, -2.778493881225586, -0.33937835693359375, 2.0997447967529297, 4.538867950439453, 6.977991104125977, 9.4171142578125, 11.856237411499023, 14.295360565185547, 16.73448371887207, 19.173606872558594, 21.612730026245117, 24.05185317993164, 26.490976333618164, 28.930099487304688, 31.36922264099121, 33.808345794677734, 36.247467041015625, 38.68659210205078, 41.12571716308594, 43.56483840942383, 46.00395965576172, 48.443084716796875, 50.88220977783203, 53.32133102416992, 55.76045227050781, 58.19957733154297, 60.638702392578125, 63.077823638916016, 65.5169448852539, 67.95606994628906, 70.39519500732422, 72.83432006835938, 75.2734375, 77.71256256103516]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 8.0, 2.0, 11.0, 17.0, 15.0, 13.0, 14.0, 28.0, 31.0, 34.0, 36.0, 35.0, 44.0, 40.0, 44.0, 46.0, 50.0, 52.0, 41.0, 46.0, 31.0, 47.0, 38.0, 49.0, 31.0, 26.0, 27.0, 27.0, 22.0, 19.0, 9.0, 16.0, 5.0, 9.0, 8.0, 4.0, 5.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.32813262939453, -32.218753814697266, -31.109373092651367, -29.9999942779541, -28.890613555908203, -27.781234741210938, -26.671855926513672, -25.562477111816406, -24.453096389770508, -23.343717575073242, -22.234336853027344, -21.124958038330078, -20.015579223632812, -18.906198501586914, -17.79681968688965, -16.68743896484375, -15.578060150146484, -14.468680381774902, -13.35930061340332, -12.249921798706055, -11.140542030334473, -10.03116226196289, -8.921783447265625, -7.812403678894043, -6.703023910522461, -5.593644142150879, -4.484264850616455, -3.374885320663452, -2.265505790710449, -1.1561260223388672, -0.04674673080444336, 1.0626325607299805, 2.172016143798828, 3.281395673751831, 4.390775203704834, 5.500154495239258, 6.60953426361084, 7.718914031982422, 8.828292846679688, 9.93767261505127, 11.047052383422852, 12.156432151794434, 13.265811920166016, 14.375190734863281, 15.484570503234863, 16.593950271606445, 17.70332908630371, 18.81270980834961, 19.922088623046875, 21.03146743774414, 22.14084815979004, 23.250226974487305, 24.359607696533203, 25.46898651123047, 26.578365325927734, 27.687744140625, 28.7971248626709, 29.906503677368164, 31.015884399414062, 32.12526321411133, 33.234642028808594, 34.344024658203125, 35.45340347290039, 36.562782287597656, 37.67216110229492]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 9.0, 10.0, 8.0, 15.0, 27.0, 37.0, 50.0, 81.0, 120.0, 197.0, 299.0, 522.0, 937.0, 1778.0, 4050.0, 10181.0, 32481.0, 149093.0, 2410315.0, 1413184.0, 126241.0, 28676.0, 8855.0, 3492.0, 1617.0, 813.0, 477.0, 256.0, 159.0, 107.0, 59.0, 36.0, 24.0, 18.0, 13.0, 12.0, 9.0, 9.0, 5.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.7265625, -4.58734130859375, -4.4481201171875, -4.30889892578125, -4.169677734375, -4.03045654296875, -3.8912353515625, -3.75201416015625, -3.61279296875, -3.47357177734375, -3.3343505859375, -3.19512939453125, -3.055908203125, -2.91668701171875, -2.7774658203125, -2.63824462890625, -2.4990234375, -2.35980224609375, -2.2205810546875, -2.08135986328125, -1.942138671875, -1.80291748046875, -1.6636962890625, -1.52447509765625, -1.38525390625, -1.24603271484375, -1.1068115234375, -0.96759033203125, -0.828369140625, -0.68914794921875, -0.5499267578125, -0.41070556640625, -0.271484375, -0.13226318359375, 0.0069580078125, 0.14617919921875, 0.285400390625, 0.42462158203125, 0.5638427734375, 0.70306396484375, 0.84228515625, 0.98150634765625, 1.1207275390625, 1.25994873046875, 1.399169921875, 1.53839111328125, 1.6776123046875, 1.81683349609375, 1.9560546875, 2.09527587890625, 2.2344970703125, 2.37371826171875, 2.512939453125, 2.65216064453125, 2.7913818359375, 2.93060302734375, 3.06982421875, 3.20904541015625, 3.3482666015625, 3.48748779296875, 3.626708984375, 3.76593017578125, 3.9051513671875, 4.04437255859375, 4.18359375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 12.0, 8.0, 11.0, 17.0, 26.0, 33.0, 30.0, 60.0, 58.0, 74.0, 74.0, 78.0, 85.0, 74.0, 57.0, 73.0, 61.0, 44.0, 40.0, 22.0, 19.0, 14.0, 8.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6318359375, -1.580810546875, -1.52978515625, -1.478759765625, -1.427734375, -1.376708984375, -1.32568359375, -1.274658203125, -1.2236328125, -1.172607421875, -1.12158203125, -1.070556640625, -1.01953125, -0.968505859375, -0.91748046875, -0.866455078125, -0.8154296875, -0.764404296875, -0.71337890625, -0.662353515625, -0.611328125, -0.560302734375, -0.50927734375, -0.458251953125, -0.4072265625, -0.356201171875, -0.30517578125, -0.254150390625, -0.203125, -0.152099609375, -0.10107421875, -0.050048828125, 0.0009765625, 0.052001953125, 0.10302734375, 0.154052734375, 0.205078125, 0.256103515625, 0.30712890625, 0.358154296875, 0.4091796875, 0.460205078125, 0.51123046875, 0.562255859375, 0.61328125, 0.664306640625, 0.71533203125, 0.766357421875, 0.8173828125, 0.868408203125, 0.91943359375, 0.970458984375, 1.021484375, 1.072509765625, 1.12353515625, 1.174560546875, 1.2255859375, 1.276611328125, 1.32763671875, 1.378662109375, 1.4296875, 1.480712890625, 1.53173828125, 1.582763671875, 1.6337890625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 4.0, 6.0, 2.0, 3.0, 9.0, 7.0, 28.0, 24.0, 26.0, 66.0, 128.0, 263.0, 564.0, 1309.0, 3499.0, 12071.0, 60964.0, 527940.0, 3193904.0, 334579.0, 44289.0, 9598.0, 2820.0, 1131.0, 514.0, 264.0, 100.0, 75.0, 31.0, 26.0, 13.0, 10.0, 6.0, 4.0, 2.0, 7.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.04296875, -4.87713623046875, -4.7113037109375, -4.54547119140625, -4.379638671875, -4.21380615234375, -4.0479736328125, -3.88214111328125, -3.71630859375, -3.55047607421875, -3.3846435546875, -3.21881103515625, -3.052978515625, -2.88714599609375, -2.7213134765625, -2.55548095703125, -2.3896484375, -2.22381591796875, -2.0579833984375, -1.89215087890625, -1.726318359375, -1.56048583984375, -1.3946533203125, -1.22882080078125, -1.06298828125, -0.89715576171875, -0.7313232421875, -0.56549072265625, -0.399658203125, -0.23382568359375, -0.0679931640625, 0.09783935546875, 0.263671875, 0.42950439453125, 0.5953369140625, 0.76116943359375, 0.927001953125, 1.09283447265625, 1.2586669921875, 1.42449951171875, 1.59033203125, 1.75616455078125, 1.9219970703125, 2.08782958984375, 2.253662109375, 2.41949462890625, 2.5853271484375, 2.75115966796875, 2.9169921875, 3.08282470703125, 3.2486572265625, 3.41448974609375, 3.580322265625, 3.74615478515625, 3.9119873046875, 4.07781982421875, 4.24365234375, 4.40948486328125, 4.5753173828125, 4.74114990234375, 4.906982421875, 5.07281494140625, 5.2386474609375, 5.40447998046875, 5.5703125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 3.0, 7.0, 7.0, 7.0, 9.0, 18.0, 20.0, 21.0, 43.0, 57.0, 77.0, 142.0, 155.0, 262.0, 392.0, 871.0, 773.0, 415.0, 270.0, 145.0, 112.0, 56.0, 55.0, 43.0, 27.0, 20.0, 10.0, 11.0, 14.0, 5.0, 3.0, 3.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.5615234375, -1.5110626220703125, -1.460601806640625, -1.4101409912109375, -1.35968017578125, -1.3092193603515625, -1.258758544921875, -1.2082977294921875, -1.1578369140625, -1.1073760986328125, -1.056915283203125, -1.0064544677734375, -0.95599365234375, -0.9055328369140625, -0.855072021484375, -0.8046112060546875, -0.754150390625, -0.7036895751953125, -0.653228759765625, -0.6027679443359375, -0.55230712890625, -0.5018463134765625, -0.451385498046875, -0.4009246826171875, -0.3504638671875, -0.3000030517578125, -0.249542236328125, -0.1990814208984375, -0.14862060546875, -0.0981597900390625, -0.047698974609375, 0.0027618408203125, 0.05322265625, 0.1036834716796875, 0.154144287109375, 0.2046051025390625, 0.25506591796875, 0.3055267333984375, 0.355987548828125, 0.4064483642578125, 0.4569091796875, 0.5073699951171875, 0.557830810546875, 0.6082916259765625, 0.65875244140625, 0.7092132568359375, 0.759674072265625, 0.8101348876953125, 0.860595703125, 0.9110565185546875, 0.961517333984375, 1.0119781494140625, 1.06243896484375, 1.1128997802734375, 1.163360595703125, 1.2138214111328125, 1.2642822265625, 1.3147430419921875, 1.365203857421875, 1.4156646728515625, 1.46612548828125, 1.5165863037109375, 1.567047119140625, 1.6175079345703125, 1.66796875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 13.0, 25.0, 74.0, 156.0, 215.0, 231.0, 169.0, 71.0, 34.0, 6.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.77429962158203, -33.968894958496094, -33.16348648071289, -32.35808181762695, -31.552677154541016, -30.747270584106445, -29.941864013671875, -29.136459350585938, -28.331052780151367, -27.525646209716797, -26.72024154663086, -25.91483497619629, -25.10943031311035, -24.30402374267578, -23.498619079589844, -22.693212509155273, -21.887805938720703, -21.082399368286133, -20.276994705200195, -19.471588134765625, -18.666183471679688, -17.860776901245117, -17.055370330810547, -16.24996566772461, -15.444561004638672, -14.639155387878418, -13.833749771118164, -13.028343200683594, -12.22293758392334, -11.417531967163086, -10.612126350402832, -9.806720733642578, -9.001314163208008, -8.195908546447754, -7.390502452850342, -6.585096836090088, -5.779690742492676, -4.974285125732422, -4.168879508972168, -3.363473415374756, -2.558067798614502, -1.752661943435669, -0.9472562074661255, -0.14185047149658203, 0.663555383682251, 1.468961238861084, 2.274366855621338, 3.07977294921875, 3.885178565979004, 4.690584182739258, 5.49599027633667, 6.301395893096924, 7.106801986694336, 7.91220760345459, 8.717613220214844, 9.523019790649414, 10.328424453735352, 11.133830070495605, 11.93923568725586, 12.74464225769043, 13.550047874450684, 14.355453491210938, 15.160859107971191, 15.966264724731445, 16.771671295166016]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 9.0, 13.0, 11.0, 23.0, 21.0, 24.0, 32.0, 35.0, 39.0, 49.0, 58.0, 54.0, 68.0, 62.0, 67.0, 65.0, 60.0, 48.0, 49.0, 36.0, 31.0, 27.0, 21.0, 28.0, 17.0, 16.0, 9.0, 4.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.636529922485352, -9.343158721923828, -9.049787521362305, -8.756416320800781, -8.463045120239258, -8.169673919677734, -7.876302719116211, -7.5829315185546875, -7.289560317993164, -6.996189117431641, -6.702817916870117, -6.409446716308594, -6.11607551574707, -5.822704315185547, -5.529333114624023, -5.2359619140625, -4.942590713500977, -4.649219512939453, -4.35584831237793, -4.062477111816406, -3.769105911254883, -3.4757347106933594, -3.182363510131836, -2.8889923095703125, -2.595621109008789, -2.3022499084472656, -2.008878707885742, -1.7155075073242188, -1.4221363067626953, -1.1287651062011719, -0.8353939056396484, -0.542022705078125, -0.24865055084228516, 0.04472064971923828, 0.3380918502807617, 0.6314630508422852, 0.9248342514038086, 1.218205451965332, 1.5115766525268555, 1.804947853088379, 2.0983190536499023, 2.391690254211426, 2.685061454772949, 2.9784326553344727, 3.271803855895996, 3.5651750564575195, 3.858546257019043, 4.151917457580566, 4.44528865814209, 4.738659858703613, 5.032031059265137, 5.32540225982666, 5.618773460388184, 5.912144660949707, 6.2055158615112305, 6.498887062072754, 6.792258262634277, 7.085629463195801, 7.379000663757324, 7.672371864318848, 7.965743064880371, 8.259114265441895, 8.552485466003418, 8.845856666564941, 9.139227867126465]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 1.0, 10.0, 9.0, 15.0, 18.0, 20.0, 32.0, 49.0, 47.0, 133.0, 142.0, 241.0, 357.0, 525.0, 905.0, 1588.0, 2867.0, 5567.0, 11134.0, 22890.0, 48226.0, 102057.0, 200511.0, 277077.0, 190049.0, 95572.0, 45082.0, 21544.0, 10268.0, 5128.0, 2650.0, 1491.0, 893.0, 465.0, 315.0, 227.0, 123.0, 106.0, 60.0, 53.0, 30.0, 27.0, 18.0, 9.0, 6.0, 2.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.38671875, -3.271728515625, -3.15673828125, -3.041748046875, -2.9267578125, -2.811767578125, -2.69677734375, -2.581787109375, -2.466796875, -2.351806640625, -2.23681640625, -2.121826171875, -2.0068359375, -1.891845703125, -1.77685546875, -1.661865234375, -1.546875, -1.431884765625, -1.31689453125, -1.201904296875, -1.0869140625, -0.971923828125, -0.85693359375, -0.741943359375, -0.626953125, -0.511962890625, -0.39697265625, -0.281982421875, -0.1669921875, -0.052001953125, 0.06298828125, 0.177978515625, 0.29296875, 0.407958984375, 0.52294921875, 0.637939453125, 0.7529296875, 0.867919921875, 0.98291015625, 1.097900390625, 1.212890625, 1.327880859375, 1.44287109375, 1.557861328125, 1.6728515625, 1.787841796875, 1.90283203125, 2.017822265625, 2.1328125, 2.247802734375, 2.36279296875, 2.477783203125, 2.5927734375, 2.707763671875, 2.82275390625, 2.937744140625, 3.052734375, 3.167724609375, 3.28271484375, 3.397705078125, 3.5126953125, 3.627685546875, 3.74267578125, 3.857666015625, 3.97265625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 5.0, 17.0, 13.0, 13.0, 30.0, 31.0, 39.0, 47.0, 74.0, 84.0, 61.0, 88.0, 75.0, 79.0, 78.0, 68.0, 46.0, 42.0, 44.0, 18.0, 14.0, 12.0, 4.0, 6.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.67578125, -1.6231231689453125, -1.570465087890625, -1.5178070068359375, -1.46514892578125, -1.4124908447265625, -1.359832763671875, -1.3071746826171875, -1.2545166015625, -1.2018585205078125, -1.149200439453125, -1.0965423583984375, -1.04388427734375, -0.9912261962890625, -0.938568115234375, -0.8859100341796875, -0.833251953125, -0.7805938720703125, -0.727935791015625, -0.6752777099609375, -0.62261962890625, -0.5699615478515625, -0.517303466796875, -0.4646453857421875, -0.4119873046875, -0.3593292236328125, -0.306671142578125, -0.2540130615234375, -0.20135498046875, -0.1486968994140625, -0.096038818359375, -0.0433807373046875, 0.00927734375, 0.0619354248046875, 0.114593505859375, 0.1672515869140625, 0.21990966796875, 0.2725677490234375, 0.325225830078125, 0.3778839111328125, 0.4305419921875, 0.4832000732421875, 0.535858154296875, 0.5885162353515625, 0.64117431640625, 0.6938323974609375, 0.746490478515625, 0.7991485595703125, 0.851806640625, 0.9044647216796875, 0.957122802734375, 1.0097808837890625, 1.06243896484375, 1.1150970458984375, 1.167755126953125, 1.2204132080078125, 1.2730712890625, 1.3257293701171875, 1.378387451171875, 1.4310455322265625, 1.48370361328125, 1.5363616943359375, 1.589019775390625, 1.6416778564453125, 1.6943359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 6.0, 6.0, 6.0, 12.0, 17.0, 24.0, 50.0, 61.0, 91.0, 138.0, 221.0, 391.0, 696.0, 1511.0, 3443.0, 10755.0, 47708.0, 216434.0, 489736.0, 212765.0, 47288.0, 10814.0, 3308.0, 1347.0, 714.0, 389.0, 221.0, 147.0, 93.0, 52.0, 29.0, 21.0, 17.0, 11.0, 8.0, 7.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.34765625, -6.1461181640625, -5.944580078125, -5.7430419921875, -5.54150390625, -5.3399658203125, -5.138427734375, -4.9368896484375, -4.7353515625, -4.5338134765625, -4.332275390625, -4.1307373046875, -3.92919921875, -3.7276611328125, -3.526123046875, -3.3245849609375, -3.123046875, -2.9215087890625, -2.719970703125, -2.5184326171875, -2.31689453125, -2.1153564453125, -1.913818359375, -1.7122802734375, -1.5107421875, -1.3092041015625, -1.107666015625, -0.9061279296875, -0.70458984375, -0.5030517578125, -0.301513671875, -0.0999755859375, 0.1015625, 0.3031005859375, 0.504638671875, 0.7061767578125, 0.90771484375, 1.1092529296875, 1.310791015625, 1.5123291015625, 1.7138671875, 1.9154052734375, 2.116943359375, 2.3184814453125, 2.52001953125, 2.7215576171875, 2.923095703125, 3.1246337890625, 3.326171875, 3.5277099609375, 3.729248046875, 3.9307861328125, 4.13232421875, 4.3338623046875, 4.535400390625, 4.7369384765625, 4.9384765625, 5.1400146484375, 5.341552734375, 5.5430908203125, 5.74462890625, 5.9461669921875, 6.147705078125, 6.3492431640625, 6.55078125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 7.0, 7.0, 8.0, 9.0, 17.0, 18.0, 20.0, 19.0, 38.0, 42.0, 61.0, 59.0, 52.0, 53.0, 87.0, 57.0, 58.0, 61.0, 61.0, 51.0, 50.0, 44.0, 34.0, 34.0, 10.0, 17.0, 11.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.50390625, -6.27142333984375, -6.0389404296875, -5.80645751953125, -5.573974609375, -5.34149169921875, -5.1090087890625, -4.87652587890625, -4.64404296875, -4.41156005859375, -4.1790771484375, -3.94659423828125, -3.714111328125, -3.48162841796875, -3.2491455078125, -3.01666259765625, -2.7841796875, -2.55169677734375, -2.3192138671875, -2.08673095703125, -1.854248046875, -1.62176513671875, -1.3892822265625, -1.15679931640625, -0.92431640625, -0.69183349609375, -0.4593505859375, -0.22686767578125, 0.005615234375, 0.23809814453125, 0.4705810546875, 0.70306396484375, 0.935546875, 1.16802978515625, 1.4005126953125, 1.63299560546875, 1.865478515625, 2.09796142578125, 2.3304443359375, 2.56292724609375, 2.79541015625, 3.02789306640625, 3.2603759765625, 3.49285888671875, 3.725341796875, 3.95782470703125, 4.1903076171875, 4.42279052734375, 4.6552734375, 4.88775634765625, 5.1202392578125, 5.35272216796875, 5.585205078125, 5.81768798828125, 6.0501708984375, 6.28265380859375, 6.51513671875, 6.74761962890625, 6.9801025390625, 7.21258544921875, 7.445068359375, 7.67755126953125, 7.9100341796875, 8.14251708984375, 8.375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 7.0, 1.0, 7.0, 12.0, 16.0, 39.0, 43.0, 82.0, 126.0, 227.0, 534.0, 1212.0, 3188.0, 9742.0, 38393.0, 240373.0, 581227.0, 137218.0, 24740.0, 7065.0, 2385.0, 957.0, 434.0, 206.0, 127.0, 69.0, 43.0, 26.0, 18.0, 13.0, 9.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.58984375, -3.4586181640625, -3.327392578125, -3.1961669921875, -3.06494140625, -2.9337158203125, -2.802490234375, -2.6712646484375, -2.5400390625, -2.4088134765625, -2.277587890625, -2.1463623046875, -2.01513671875, -1.8839111328125, -1.752685546875, -1.6214599609375, -1.490234375, -1.3590087890625, -1.227783203125, -1.0965576171875, -0.96533203125, -0.8341064453125, -0.702880859375, -0.5716552734375, -0.4404296875, -0.3092041015625, -0.177978515625, -0.0467529296875, 0.08447265625, 0.2156982421875, 0.346923828125, 0.4781494140625, 0.609375, 0.7406005859375, 0.871826171875, 1.0030517578125, 1.13427734375, 1.2655029296875, 1.396728515625, 1.5279541015625, 1.6591796875, 1.7904052734375, 1.921630859375, 2.0528564453125, 2.18408203125, 2.3153076171875, 2.446533203125, 2.5777587890625, 2.708984375, 2.8402099609375, 2.971435546875, 3.1026611328125, 3.23388671875, 3.3651123046875, 3.496337890625, 3.6275634765625, 3.7587890625, 3.8900146484375, 4.021240234375, 4.1524658203125, 4.28369140625, 4.4149169921875, 4.546142578125, 4.6773681640625, 4.80859375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 8.0, 13.0, 23.0, 30.0, 44.0, 68.0, 78.0, 118.0, 139.0, 145.0, 88.0, 62.0, 48.0, 29.0, 24.0, 24.0, 12.0, 6.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007429122924804688, -0.0007203072309494019, -0.000697702169418335, -0.0006750971078872681, -0.0006524920463562012, -0.0006298869848251343, -0.0006072819232940674, -0.0005846768617630005, -0.0005620718002319336, -0.0005394667387008667, -0.0005168616771697998, -0.0004942566156387329, -0.000471651554107666, -0.0004490464925765991, -0.0004264414310455322, -0.00040383636951446533, -0.00038123130798339844, -0.00035862624645233154, -0.00033602118492126465, -0.00031341612339019775, -0.00029081106185913086, -0.00026820600032806396, -0.00024560093879699707, -0.00022299587726593018, -0.00020039081573486328, -0.0001777857542037964, -0.0001551806926727295, -0.0001325756311416626, -0.0001099705696105957, -8.736550807952881e-05, -6.476044654846191e-05, -4.215538501739502e-05, -1.9550323486328125e-05, 3.0547380447387695e-06, 2.5659799575805664e-05, 4.826486110687256e-05, 7.086992263793945e-05, 9.347498416900635e-05, 0.00011608004570007324, 0.00013868510723114014, 0.00016129016876220703, 0.00018389523029327393, 0.00020650029182434082, 0.00022910535335540771, 0.0002517104148864746, 0.0002743154764175415, 0.0002969205379486084, 0.0003195255994796753, 0.0003421306610107422, 0.0003647357225418091, 0.000387340784072876, 0.00040994584560394287, 0.00043255090713500977, 0.00045515596866607666, 0.00047776103019714355, 0.0005003660917282104, 0.0005229711532592773, 0.0005455762147903442, 0.0005681812763214111, 0.000590786337852478, 0.0006133913993835449, 0.0006359964609146118, 0.0006586015224456787, 0.0006812065839767456, 0.0007038116455078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 12.0, 24.0, 27.0, 53.0, 74.0, 141.0, 215.0, 478.0, 1103.0, 3194.0, 11406.0, 67787.0, 595059.0, 324421.0, 33693.0, 7183.0, 2138.0, 731.0, 338.0, 208.0, 86.0, 71.0, 31.0, 19.0, 13.0, 12.0, 11.0, 9.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2578125, -4.10479736328125, -3.9517822265625, -3.79876708984375, -3.645751953125, -3.49273681640625, -3.3397216796875, -3.18670654296875, -3.03369140625, -2.88067626953125, -2.7276611328125, -2.57464599609375, -2.421630859375, -2.26861572265625, -2.1156005859375, -1.96258544921875, -1.8095703125, -1.65655517578125, -1.5035400390625, -1.35052490234375, -1.197509765625, -1.04449462890625, -0.8914794921875, -0.73846435546875, -0.58544921875, -0.43243408203125, -0.2794189453125, -0.12640380859375, 0.026611328125, 0.17962646484375, 0.3326416015625, 0.48565673828125, 0.638671875, 0.79168701171875, 0.9447021484375, 1.09771728515625, 1.250732421875, 1.40374755859375, 1.5567626953125, 1.70977783203125, 1.86279296875, 2.01580810546875, 2.1688232421875, 2.32183837890625, 2.474853515625, 2.62786865234375, 2.7808837890625, 2.93389892578125, 3.0869140625, 3.23992919921875, 3.3929443359375, 3.54595947265625, 3.698974609375, 3.85198974609375, 4.0050048828125, 4.15802001953125, 4.31103515625, 4.46405029296875, 4.6170654296875, 4.77008056640625, 4.923095703125, 5.07611083984375, 5.2291259765625, 5.38214111328125, 5.53515625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 8.0, 15.0, 10.0, 16.0, 34.0, 29.0, 59.0, 57.0, 73.0, 93.0, 86.0, 104.0, 68.0, 83.0, 51.0, 42.0, 27.0, 31.0, 25.0, 13.0, 14.0, 9.0, 6.0, 3.0, 6.0, 2.0, 1.0, 6.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.599609375, -2.520416259765625, -2.44122314453125, -2.362030029296875, -2.2828369140625, -2.203643798828125, -2.12445068359375, -2.045257568359375, -1.966064453125, -1.886871337890625, -1.80767822265625, -1.728485107421875, -1.6492919921875, -1.570098876953125, -1.49090576171875, -1.411712646484375, -1.33251953125, -1.253326416015625, -1.17413330078125, -1.094940185546875, -1.0157470703125, -0.936553955078125, -0.85736083984375, -0.778167724609375, -0.698974609375, -0.619781494140625, -0.54058837890625, -0.461395263671875, -0.3822021484375, -0.303009033203125, -0.22381591796875, -0.144622802734375, -0.0654296875, 0.013763427734375, 0.09295654296875, 0.172149658203125, 0.2513427734375, 0.330535888671875, 0.40972900390625, 0.488922119140625, 0.568115234375, 0.647308349609375, 0.72650146484375, 0.805694580078125, 0.8848876953125, 0.964080810546875, 1.04327392578125, 1.122467041015625, 1.20166015625, 1.280853271484375, 1.36004638671875, 1.439239501953125, 1.5184326171875, 1.597625732421875, 1.67681884765625, 1.756011962890625, 1.835205078125, 1.914398193359375, 1.99359130859375, 2.072784423828125, 2.1519775390625, 2.231170654296875, 2.31036376953125, 2.389556884765625, 2.46875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 16.0, 45.0, 110.0, 171.0, 229.0, 199.0, 122.0, 61.0, 23.0, 12.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.80559158325195, -35.671939849853516, -33.538291931152344, -31.404640197753906, -29.2709903717041, -27.137340545654297, -25.00368881225586, -22.870038986206055, -20.73638916015625, -18.602739334106445, -16.46908950805664, -14.335437774658203, -12.201787948608398, -10.068138122558594, -7.934487342834473, -5.800836563110352, -3.667186737060547, -1.533536434173584, 0.6001138687133789, 2.733764171600342, 4.867414474487305, 7.001064300537109, 9.13471508026123, 11.268365859985352, 13.402015686035156, 15.535665512084961, 17.669315338134766, 19.802967071533203, 21.936616897583008, 24.070266723632812, 26.20391845703125, 28.337568283081055, 30.471221923828125, 32.60487365722656, 34.738521575927734, 36.87217330932617, 39.005821228027344, 41.13947296142578, 43.27312469482422, 45.406776428222656, 47.54042434692383, 49.674076080322266, 51.80772399902344, 53.941375732421875, 56.07502746582031, 58.208675384521484, 60.34232711791992, 62.475975036621094, 64.60962677001953, 66.74327850341797, 68.8769302368164, 71.01057434082031, 73.14422607421875, 75.27787780761719, 77.41152954101562, 79.54518127441406, 81.6788330078125, 83.81248474121094, 85.94613647460938, 88.07978057861328, 90.21343231201172, 92.34708404541016, 94.4807357788086, 96.61438751220703, 98.74803161621094]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 6.0, 3.0, 9.0, 14.0, 20.0, 29.0, 26.0, 35.0, 33.0, 38.0, 40.0, 49.0, 54.0, 46.0, 47.0, 69.0, 52.0, 47.0, 58.0, 51.0, 45.0, 37.0, 39.0, 30.0, 20.0, 24.0, 20.0, 12.0, 11.0, 9.0, 9.0, 6.0, 1.0, 7.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-39.06858825683594, -37.94551086425781, -36.82243347167969, -35.69935989379883, -34.5762825012207, -33.45320510864258, -32.33013153076172, -31.207054138183594, -30.08397674560547, -28.960899353027344, -27.83782386779785, -26.71474838256836, -25.591670989990234, -24.46859359741211, -23.345518112182617, -22.222442626953125, -21.099365234375, -19.976287841796875, -18.853212356567383, -17.73013687133789, -16.607059478759766, -15.483983039855957, -14.360906600952148, -13.23783016204834, -12.114753723144531, -10.991677284240723, -9.868600845336914, -8.745524406433105, -7.622447967529297, -6.499371528625488, -5.37629508972168, -4.253218650817871, -3.1301422119140625, -2.007065773010254, -0.8839893341064453, 0.23908710479736328, 1.3621635437011719, 2.4852399826049805, 3.608316421508789, 4.731392860412598, 5.854469299316406, 6.977545738220215, 8.100622177124023, 9.223698616027832, 10.34677505493164, 11.46985149383545, 12.592927932739258, 13.716004371643066, 14.839080810546875, 15.962157249450684, 17.085233688354492, 18.208309173583984, 19.33138656616211, 20.454463958740234, 21.577539443969727, 22.70061492919922, 23.823692321777344, 24.94676971435547, 26.06984519958496, 27.192920684814453, 28.315998077392578, 29.439075469970703, 30.562150955200195, 31.685226440429688, 32.80830383300781]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 5.0, 9.0, 12.0, 17.0, 24.0, 43.0, 65.0, 154.0, 266.0, 500.0, 1092.0, 2833.0, 9144.0, 35144.0, 250335.0, 3645401.0, 205385.0, 31370.0, 7972.0, 2648.0, 938.0, 426.0, 222.0, 111.0, 66.0, 37.0, 27.0, 8.0, 6.0, 7.0, 7.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.41796875, -6.241943359375, -6.06591796875, -5.889892578125, -5.7138671875, -5.537841796875, -5.36181640625, -5.185791015625, -5.009765625, -4.833740234375, -4.65771484375, -4.481689453125, -4.3056640625, -4.129638671875, -3.95361328125, -3.777587890625, -3.6015625, -3.425537109375, -3.24951171875, -3.073486328125, -2.8974609375, -2.721435546875, -2.54541015625, -2.369384765625, -2.193359375, -2.017333984375, -1.84130859375, -1.665283203125, -1.4892578125, -1.313232421875, -1.13720703125, -0.961181640625, -0.78515625, -0.609130859375, -0.43310546875, -0.257080078125, -0.0810546875, 0.094970703125, 0.27099609375, 0.447021484375, 0.623046875, 0.799072265625, 0.97509765625, 1.151123046875, 1.3271484375, 1.503173828125, 1.67919921875, 1.855224609375, 2.03125, 2.207275390625, 2.38330078125, 2.559326171875, 2.7353515625, 2.911376953125, 3.08740234375, 3.263427734375, 3.439453125, 3.615478515625, 3.79150390625, 3.967529296875, 4.1435546875, 4.319580078125, 4.49560546875, 4.671630859375, 4.84765625]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 8.0, 14.0, 12.0, 9.0, 26.0, 30.0, 39.0, 50.0, 57.0, 60.0, 63.0, 69.0, 63.0, 69.0, 74.0, 60.0, 60.0, 52.0, 44.0, 39.0, 27.0, 26.0, 11.0, 7.0, 6.0, 8.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5439453125, -1.4937591552734375, -1.443572998046875, -1.3933868408203125, -1.34320068359375, -1.2930145263671875, -1.242828369140625, -1.1926422119140625, -1.1424560546875, -1.0922698974609375, -1.042083740234375, -0.9918975830078125, -0.94171142578125, -0.8915252685546875, -0.841339111328125, -0.7911529541015625, -0.740966796875, -0.6907806396484375, -0.640594482421875, -0.5904083251953125, -0.54022216796875, -0.4900360107421875, -0.439849853515625, -0.3896636962890625, -0.3394775390625, -0.2892913818359375, -0.239105224609375, -0.1889190673828125, -0.13873291015625, -0.0885467529296875, -0.038360595703125, 0.0118255615234375, 0.06201171875, 0.1121978759765625, 0.162384033203125, 0.2125701904296875, 0.26275634765625, 0.3129425048828125, 0.363128662109375, 0.4133148193359375, 0.4635009765625, 0.5136871337890625, 0.563873291015625, 0.6140594482421875, 0.66424560546875, 0.7144317626953125, 0.764617919921875, 0.8148040771484375, 0.864990234375, 0.9151763916015625, 0.965362548828125, 1.0155487060546875, 1.06573486328125, 1.1159210205078125, 1.166107177734375, 1.2162933349609375, 1.2664794921875, 1.3166656494140625, 1.366851806640625, 1.4170379638671875, 1.46722412109375, 1.5174102783203125, 1.567596435546875, 1.6177825927734375, 1.66796875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 11.0, 22.0, 27.0, 35.0, 98.0, 209.0, 585.0, 1827.0, 8614.0, 55531.0, 1100046.0, 2925953.0, 85766.0, 11843.0, 2433.0, 736.0, 290.0, 129.0, 60.0, 30.0, 18.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.38671875, -5.16314697265625, -4.9395751953125, -4.71600341796875, -4.492431640625, -4.26885986328125, -4.0452880859375, -3.82171630859375, -3.59814453125, -3.37457275390625, -3.1510009765625, -2.92742919921875, -2.703857421875, -2.48028564453125, -2.2567138671875, -2.03314208984375, -1.8095703125, -1.58599853515625, -1.3624267578125, -1.13885498046875, -0.915283203125, -0.69171142578125, -0.4681396484375, -0.24456787109375, -0.02099609375, 0.20257568359375, 0.4261474609375, 0.64971923828125, 0.873291015625, 1.09686279296875, 1.3204345703125, 1.54400634765625, 1.767578125, 1.99114990234375, 2.2147216796875, 2.43829345703125, 2.661865234375, 2.88543701171875, 3.1090087890625, 3.33258056640625, 3.55615234375, 3.77972412109375, 4.0032958984375, 4.22686767578125, 4.450439453125, 4.67401123046875, 4.8975830078125, 5.12115478515625, 5.3447265625, 5.56829833984375, 5.7918701171875, 6.01544189453125, 6.239013671875, 6.46258544921875, 6.6861572265625, 6.90972900390625, 7.13330078125, 7.35687255859375, 7.5804443359375, 7.80401611328125, 8.027587890625, 8.25115966796875, 8.4747314453125, 8.69830322265625, 8.921875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 7.0, 5.0, 6.0, 16.0, 18.0, 30.0, 36.0, 63.0, 88.0, 140.0, 273.0, 596.0, 1442.0, 632.0, 288.0, 162.0, 84.0, 56.0, 33.0, 22.0, 25.0, 16.0, 6.0, 8.0, 6.0, 5.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.45703125, -1.397613525390625, -1.33819580078125, -1.278778076171875, -1.2193603515625, -1.159942626953125, -1.10052490234375, -1.041107177734375, -0.981689453125, -0.922271728515625, -0.86285400390625, -0.803436279296875, -0.7440185546875, -0.684600830078125, -0.62518310546875, -0.565765380859375, -0.50634765625, -0.446929931640625, -0.38751220703125, -0.328094482421875, -0.2686767578125, -0.209259033203125, -0.14984130859375, -0.090423583984375, -0.031005859375, 0.028411865234375, 0.08782958984375, 0.147247314453125, 0.2066650390625, 0.266082763671875, 0.32550048828125, 0.384918212890625, 0.4443359375, 0.503753662109375, 0.56317138671875, 0.622589111328125, 0.6820068359375, 0.741424560546875, 0.80084228515625, 0.860260009765625, 0.919677734375, 0.979095458984375, 1.03851318359375, 1.097930908203125, 1.1573486328125, 1.216766357421875, 1.27618408203125, 1.335601806640625, 1.39501953125, 1.454437255859375, 1.51385498046875, 1.573272705078125, 1.6326904296875, 1.692108154296875, 1.75152587890625, 1.810943603515625, 1.870361328125, 1.929779052734375, 1.98919677734375, 2.048614501953125, 2.1080322265625, 2.167449951171875, 2.22686767578125, 2.286285400390625, 2.345703125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 20.0, 39.0, 65.0, 101.0, 141.0, 151.0, 134.0, 108.0, 100.0, 56.0, 35.0, 17.0, 6.0, 6.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.562813758850098, -9.159013748168945, -8.755213737487793, -8.35141372680664, -7.947612762451172, -7.5438127517700195, -7.140012741088867, -6.736212730407715, -6.332412242889404, -5.928612232208252, -5.524811744689941, -5.121011734008789, -4.717211723327637, -4.313411235809326, -3.909611225128174, -3.5058109760284424, -3.102010726928711, -2.6982104778289795, -2.294410228729248, -1.8906102180480957, -1.4868099689483643, -1.0830097198486328, -0.6792097091674805, -0.275409460067749, 0.12839078903198242, 0.5321909785270691, 0.9359911680221558, 1.3397912979125977, 1.743591547012329, 2.1473917961120605, 2.551191806793213, 2.9549920558929443, 3.358793258666992, 3.7625935077667236, 4.166393756866455, 4.570193767547607, 4.973994255065918, 5.37779426574707, 5.781594276428223, 6.185394287109375, 6.5891947746276855, 6.992994785308838, 7.396795272827148, 7.800595283508301, 8.204395294189453, 8.608196258544922, 9.011995315551758, 9.415796279907227, 9.819596290588379, 10.223396301269531, 10.627196311950684, 11.030996322631836, 11.434797286987305, 11.838597297668457, 12.24239730834961, 12.646197319030762, 13.049997329711914, 13.453797340393066, 13.857597351074219, 14.261398315429688, 14.66519832611084, 15.068998336791992, 15.472798347473145, 15.876598358154297, 16.280399322509766]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 9.0, 9.0, 13.0, 17.0, 15.0, 16.0, 26.0, 28.0, 32.0, 37.0, 41.0, 48.0, 51.0, 59.0, 47.0, 64.0, 54.0, 40.0, 55.0, 49.0, 47.0, 33.0, 35.0, 34.0, 25.0, 23.0, 24.0, 13.0, 14.0, 9.0, 11.0, 6.0, 9.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.883063316345215, -5.672290802001953, -5.46151876449585, -5.250746250152588, -5.039973735809326, -4.829201698303223, -4.618429183959961, -4.407656669616699, -4.1968841552734375, -3.986111879348755, -3.775339365005493, -3.5645670890808105, -3.353794574737549, -3.143022298812866, -2.9322500228881836, -2.721477508544922, -2.5107052326202393, -2.2999329566955566, -2.089160442352295, -1.8783881664276123, -1.6676156520843506, -1.456843376159668, -1.2460709810256958, -1.0352985858917236, -0.8245261907577515, -0.6137537956237793, -0.4029814302921295, -0.19220906496047974, 0.01856333017349243, 0.22933566570281982, 0.440108060836792, 0.6508804559707642, 0.8616528511047363, 1.0724252462387085, 1.2831976413726807, 1.4939699172973633, 1.704742431640625, 1.9155147075653076, 2.1262869834899902, 2.337059497833252, 2.5478320121765137, 2.7586042881011963, 2.969376802444458, 3.1801490783691406, 3.3909215927124023, 3.601693868637085, 3.8124661445617676, 4.023238658905029, 4.234010696411133, 4.4447832107543945, 4.655555248260498, 4.86632776260376, 5.0771002769470215, 5.287872314453125, 5.498644828796387, 5.709417343139648, 5.92018985748291, 6.130962371826172, 6.341734409332275, 6.552506923675537, 6.763279438018799, 6.974051475524902, 7.184823989868164, 7.395596504211426, 7.6063690185546875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 3.0, 6.0, 4.0, 16.0, 12.0, 23.0, 32.0, 53.0, 77.0, 104.0, 186.0, 264.0, 412.0, 701.0, 1196.0, 2165.0, 4154.0, 8442.0, 16539.0, 35518.0, 78876.0, 172826.0, 294396.0, 227836.0, 109830.0, 48936.0, 22612.0, 11027.0, 5517.0, 2939.0, 1565.0, 912.0, 498.0, 308.0, 194.0, 129.0, 82.0, 52.0, 31.0, 27.0, 13.0, 13.0, 15.0, 9.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.48046875, -4.3475341796875, -4.214599609375, -4.0816650390625, -3.94873046875, -3.8157958984375, -3.682861328125, -3.5499267578125, -3.4169921875, -3.2840576171875, -3.151123046875, -3.0181884765625, -2.88525390625, -2.7523193359375, -2.619384765625, -2.4864501953125, -2.353515625, -2.2205810546875, -2.087646484375, -1.9547119140625, -1.82177734375, -1.6888427734375, -1.555908203125, -1.4229736328125, -1.2900390625, -1.1571044921875, -1.024169921875, -0.8912353515625, -0.75830078125, -0.6253662109375, -0.492431640625, -0.3594970703125, -0.2265625, -0.0936279296875, 0.039306640625, 0.1722412109375, 0.30517578125, 0.4381103515625, 0.571044921875, 0.7039794921875, 0.8369140625, 0.9698486328125, 1.102783203125, 1.2357177734375, 1.36865234375, 1.5015869140625, 1.634521484375, 1.7674560546875, 1.900390625, 2.0333251953125, 2.166259765625, 2.2991943359375, 2.43212890625, 2.5650634765625, 2.697998046875, 2.8309326171875, 2.9638671875, 3.0968017578125, 3.229736328125, 3.3626708984375, 3.49560546875, 3.6285400390625, 3.761474609375, 3.8944091796875, 4.02734375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 1.0, 15.0, 17.0, 17.0, 16.0, 35.0, 40.0, 44.0, 41.0, 70.0, 62.0, 64.0, 78.0, 58.0, 70.0, 57.0, 66.0, 56.0, 43.0, 43.0, 27.0, 25.0, 15.0, 6.0, 9.0, 9.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.583984375, -1.534271240234375, -1.48455810546875, -1.434844970703125, -1.3851318359375, -1.335418701171875, -1.28570556640625, -1.235992431640625, -1.186279296875, -1.136566162109375, -1.08685302734375, -1.037139892578125, -0.9874267578125, -0.937713623046875, -0.88800048828125, -0.838287353515625, -0.78857421875, -0.738861083984375, -0.68914794921875, -0.639434814453125, -0.5897216796875, -0.540008544921875, -0.49029541015625, -0.440582275390625, -0.390869140625, -0.341156005859375, -0.29144287109375, -0.241729736328125, -0.1920166015625, -0.142303466796875, -0.09259033203125, -0.042877197265625, 0.0068359375, 0.056549072265625, 0.10626220703125, 0.155975341796875, 0.2056884765625, 0.255401611328125, 0.30511474609375, 0.354827880859375, 0.404541015625, 0.454254150390625, 0.50396728515625, 0.553680419921875, 0.6033935546875, 0.653106689453125, 0.70281982421875, 0.752532958984375, 0.80224609375, 0.851959228515625, 0.90167236328125, 0.951385498046875, 1.0010986328125, 1.050811767578125, 1.10052490234375, 1.150238037109375, 1.199951171875, 1.249664306640625, 1.29937744140625, 1.349090576171875, 1.3988037109375, 1.448516845703125, 1.49822998046875, 1.547943115234375, 1.59765625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 2.0, 7.0, 3.0, 10.0, 20.0, 22.0, 33.0, 37.0, 62.0, 80.0, 119.0, 155.0, 279.0, 350.0, 597.0, 1040.0, 2362.0, 8545.0, 54496.0, 384701.0, 496717.0, 81034.0, 11973.0, 2927.0, 1184.0, 617.0, 370.0, 249.0, 167.0, 112.0, 85.0, 54.0, 44.0, 26.0, 26.0, 12.0, 5.0, 5.0, 9.0, 4.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0], "bins": [-9.8125, -9.5406494140625, -9.268798828125, -8.9969482421875, -8.72509765625, -8.4532470703125, -8.181396484375, -7.9095458984375, -7.6376953125, -7.3658447265625, -7.093994140625, -6.8221435546875, -6.55029296875, -6.2784423828125, -6.006591796875, -5.7347412109375, -5.462890625, -5.1910400390625, -4.919189453125, -4.6473388671875, -4.37548828125, -4.1036376953125, -3.831787109375, -3.5599365234375, -3.2880859375, -3.0162353515625, -2.744384765625, -2.4725341796875, -2.20068359375, -1.9288330078125, -1.656982421875, -1.3851318359375, -1.11328125, -0.8414306640625, -0.569580078125, -0.2977294921875, -0.02587890625, 0.2459716796875, 0.517822265625, 0.7896728515625, 1.0615234375, 1.3333740234375, 1.605224609375, 1.8770751953125, 2.14892578125, 2.4207763671875, 2.692626953125, 2.9644775390625, 3.236328125, 3.5081787109375, 3.780029296875, 4.0518798828125, 4.32373046875, 4.5955810546875, 4.867431640625, 5.1392822265625, 5.4111328125, 5.6829833984375, 5.954833984375, 6.2266845703125, 6.49853515625, 6.7703857421875, 7.042236328125, 7.3140869140625, 7.5859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 2.0, 6.0, 6.0, 10.0, 13.0, 18.0, 26.0, 25.0, 38.0, 29.0, 62.0, 59.0, 53.0, 65.0, 81.0, 76.0, 57.0, 72.0, 56.0, 50.0, 34.0, 42.0, 28.0, 22.0, 24.0, 12.0, 12.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8828125, -8.6058349609375, -8.328857421875, -8.0518798828125, -7.77490234375, -7.4979248046875, -7.220947265625, -6.9439697265625, -6.6669921875, -6.3900146484375, -6.113037109375, -5.8360595703125, -5.55908203125, -5.2821044921875, -5.005126953125, -4.7281494140625, -4.451171875, -4.1741943359375, -3.897216796875, -3.6202392578125, -3.34326171875, -3.0662841796875, -2.789306640625, -2.5123291015625, -2.2353515625, -1.9583740234375, -1.681396484375, -1.4044189453125, -1.12744140625, -0.8504638671875, -0.573486328125, -0.2965087890625, -0.01953125, 0.2574462890625, 0.534423828125, 0.8114013671875, 1.08837890625, 1.3653564453125, 1.642333984375, 1.9193115234375, 2.1962890625, 2.4732666015625, 2.750244140625, 3.0272216796875, 3.30419921875, 3.5811767578125, 3.858154296875, 4.1351318359375, 4.412109375, 4.6890869140625, 4.966064453125, 5.2430419921875, 5.52001953125, 5.7969970703125, 6.073974609375, 6.3509521484375, 6.6279296875, 6.9049072265625, 7.181884765625, 7.4588623046875, 7.73583984375, 8.0128173828125, 8.289794921875, 8.5667724609375, 8.84375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 6.0, 7.0, 8.0, 9.0, 14.0, 19.0, 36.0, 57.0, 78.0, 129.0, 202.0, 332.0, 661.0, 1178.0, 2572.0, 6134.0, 16909.0, 58034.0, 312105.0, 509611.0, 99568.0, 25327.0, 8475.0, 3474.0, 1709.0, 823.0, 452.0, 215.0, 155.0, 71.0, 55.0, 37.0, 28.0, 19.0, 9.0, 15.0, 6.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.40234375, -4.2696533203125, -4.136962890625, -4.0042724609375, -3.87158203125, -3.7388916015625, -3.606201171875, -3.4735107421875, -3.3408203125, -3.2081298828125, -3.075439453125, -2.9427490234375, -2.81005859375, -2.6773681640625, -2.544677734375, -2.4119873046875, -2.279296875, -2.1466064453125, -2.013916015625, -1.8812255859375, -1.74853515625, -1.6158447265625, -1.483154296875, -1.3504638671875, -1.2177734375, -1.0850830078125, -0.952392578125, -0.8197021484375, -0.68701171875, -0.5543212890625, -0.421630859375, -0.2889404296875, -0.15625, -0.0235595703125, 0.109130859375, 0.2418212890625, 0.37451171875, 0.5072021484375, 0.639892578125, 0.7725830078125, 0.9052734375, 1.0379638671875, 1.170654296875, 1.3033447265625, 1.43603515625, 1.5687255859375, 1.701416015625, 1.8341064453125, 1.966796875, 2.0994873046875, 2.232177734375, 2.3648681640625, 2.49755859375, 2.6302490234375, 2.762939453125, 2.8956298828125, 3.0283203125, 3.1610107421875, 3.293701171875, 3.4263916015625, 3.55908203125, 3.6917724609375, 3.824462890625, 3.9571533203125, 4.08984375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 9.0, 7.0, 6.0, 16.0, 12.0, 17.0, 15.0, 24.0, 41.0, 47.0, 58.0, 97.0, 110.0, 112.0, 94.0, 77.0, 58.0, 41.0, 43.0, 18.0, 23.0, 14.0, 14.0, 4.0, 6.0, 10.0, 7.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005793571472167969, -0.0005596056580543518, -0.0005398541688919067, -0.0005201026797294617, -0.0005003511905670166, -0.00048059970140457153, -0.00046084821224212646, -0.0004410967230796814, -0.00042134523391723633, -0.00040159374475479126, -0.0003818422555923462, -0.0003620907664299011, -0.00034233927726745605, -0.000322587788105011, -0.0003028362989425659, -0.00028308480978012085, -0.0002633333206176758, -0.0002435818314552307, -0.00022383034229278564, -0.00020407885313034058, -0.0001843273639678955, -0.00016457587480545044, -0.00014482438564300537, -0.0001250728964805603, -0.00010532140731811523, -8.556991815567017e-05, -6.58184289932251e-05, -4.606693983078003e-05, -2.631545066833496e-05, -6.563961505889893e-06, 1.3187527656555176e-05, 3.2939016819000244e-05, 5.269050598144531e-05, 7.244199514389038e-05, 9.219348430633545e-05, 0.00011194497346878052, 0.00013169646263122559, 0.00015144795179367065, 0.00017119944095611572, 0.0001909509301185608, 0.00021070241928100586, 0.00023045390844345093, 0.000250205397605896, 0.00026995688676834106, 0.00028970837593078613, 0.0003094598650932312, 0.00032921135425567627, 0.00034896284341812134, 0.0003687143325805664, 0.0003884658217430115, 0.00040821731090545654, 0.0004279688000679016, 0.0004477202892303467, 0.00046747177839279175, 0.0004872232675552368, 0.0005069747567176819, 0.000526726245880127, 0.000546477735042572, 0.0005662292242050171, 0.0005859807133674622, 0.0006057322025299072, 0.0006254836916923523, 0.0006452351808547974, 0.0006649866700172424, 0.0006847381591796875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 6.0, 2.0, 6.0, 4.0, 7.0, 8.0, 18.0, 19.0, 28.0, 25.0, 44.0, 52.0, 107.0, 164.0, 268.0, 529.0, 1180.0, 3202.0, 13236.0, 88951.0, 750564.0, 162951.0, 20020.0, 4351.0, 1395.0, 573.0, 316.0, 195.0, 111.0, 76.0, 41.0, 27.0, 19.0, 16.0, 6.0, 12.0, 8.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-6.87890625, -6.685791015625, -6.49267578125, -6.299560546875, -6.1064453125, -5.913330078125, -5.72021484375, -5.527099609375, -5.333984375, -5.140869140625, -4.94775390625, -4.754638671875, -4.5615234375, -4.368408203125, -4.17529296875, -3.982177734375, -3.7890625, -3.595947265625, -3.40283203125, -3.209716796875, -3.0166015625, -2.823486328125, -2.63037109375, -2.437255859375, -2.244140625, -2.051025390625, -1.85791015625, -1.664794921875, -1.4716796875, -1.278564453125, -1.08544921875, -0.892333984375, -0.69921875, -0.506103515625, -0.31298828125, -0.119873046875, 0.0732421875, 0.266357421875, 0.45947265625, 0.652587890625, 0.845703125, 1.038818359375, 1.23193359375, 1.425048828125, 1.6181640625, 1.811279296875, 2.00439453125, 2.197509765625, 2.390625, 2.583740234375, 2.77685546875, 2.969970703125, 3.1630859375, 3.356201171875, 3.54931640625, 3.742431640625, 3.935546875, 4.128662109375, 4.32177734375, 4.514892578125, 4.7080078125, 4.901123046875, 5.09423828125, 5.287353515625, 5.48046875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 2.0, 3.0, 7.0, 8.0, 13.0, 9.0, 8.0, 20.0, 24.0, 30.0, 40.0, 55.0, 70.0, 83.0, 100.0, 122.0, 108.0, 71.0, 51.0, 46.0, 25.0, 21.0, 18.0, 16.0, 15.0, 11.0, 4.0, 10.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.171875, -4.065338134765625, -3.95880126953125, -3.852264404296875, -3.7457275390625, -3.639190673828125, -3.53265380859375, -3.426116943359375, -3.319580078125, -3.213043212890625, -3.10650634765625, -2.999969482421875, -2.8934326171875, -2.786895751953125, -2.68035888671875, -2.573822021484375, -2.46728515625, -2.360748291015625, -2.25421142578125, -2.147674560546875, -2.0411376953125, -1.934600830078125, -1.82806396484375, -1.721527099609375, -1.614990234375, -1.508453369140625, -1.40191650390625, -1.295379638671875, -1.1888427734375, -1.082305908203125, -0.97576904296875, -0.869232177734375, -0.7626953125, -0.656158447265625, -0.54962158203125, -0.443084716796875, -0.3365478515625, -0.230010986328125, -0.12347412109375, -0.016937255859375, 0.089599609375, 0.196136474609375, 0.30267333984375, 0.409210205078125, 0.5157470703125, 0.622283935546875, 0.72882080078125, 0.835357666015625, 0.94189453125, 1.048431396484375, 1.15496826171875, 1.261505126953125, 1.3680419921875, 1.474578857421875, 1.58111572265625, 1.687652587890625, 1.794189453125, 1.900726318359375, 2.00726318359375, 2.113800048828125, 2.2203369140625, 2.326873779296875, 2.43341064453125, 2.539947509765625, 2.646484375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 14.0, 57.0, 127.0, 232.0, 260.0, 186.0, 75.0, 30.0, 11.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.7146224975586, -92.82970428466797, -89.94478607177734, -87.05986785888672, -84.17495727539062, -81.2900390625, -78.40512084960938, -75.52020263671875, -72.63528442382812, -69.7503662109375, -66.86544799804688, -63.980533599853516, -61.09561538696289, -58.210697174072266, -55.325782775878906, -52.44086456298828, -49.555946350097656, -46.67102813720703, -43.786109924316406, -40.90119552612305, -38.01627731323242, -35.1313591003418, -32.24644470214844, -29.361526489257812, -26.476608276367188, -23.591690063476562, -20.70677375793457, -17.821857452392578, -14.936939239501953, -12.052021980285645, -9.167104721069336, -6.282188415527344, -3.39727783203125, -0.5123605728149414, 2.372556686401367, 5.257473945617676, 8.142391204833984, 11.027308464050293, 13.912225723266602, 16.797142028808594, 19.68206024169922, 22.566978454589844, 25.451894760131836, 28.336811065673828, 31.221729278564453, 34.10664749145508, 36.99156188964844, 39.87648010253906, 42.76139831542969, 45.64631652832031, 48.53123474121094, 51.4161491394043, 54.30106735229492, 57.18598556518555, 60.070899963378906, 62.95581817626953, 65.84073638916016, 68.72565460205078, 71.6105728149414, 74.49549102783203, 77.38040161132812, 80.26531982421875, 83.15023803710938, 86.03515625, 88.92007446289062]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 5.0, 8.0, 18.0, 16.0, 13.0, 18.0, 11.0, 21.0, 31.0, 40.0, 25.0, 43.0, 32.0, 48.0, 46.0, 52.0, 44.0, 40.0, 53.0, 40.0, 44.0, 47.0, 49.0, 33.0, 34.0, 31.0, 37.0, 23.0, 21.0, 14.0, 14.0, 11.0, 11.0, 8.0, 4.0, 5.0, 7.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.924861907958984, -33.75464630126953, -32.584434509277344, -31.414220809936523, -30.244007110595703, -29.07379150390625, -27.90357780456543, -26.73336410522461, -25.56315040588379, -24.39293670654297, -23.22272300720215, -22.052509307861328, -20.882293701171875, -19.712081909179688, -18.541866302490234, -17.371652603149414, -16.201438903808594, -15.031225204467773, -13.861011505126953, -12.690796852111816, -11.520583152770996, -10.350369453430176, -9.180154800415039, -8.009941101074219, -6.839727401733398, -5.669513702392578, -4.4992995262146, -3.3290855884552, -2.158871650695801, -0.9886579513549805, 0.18155622482299805, 1.3517704010009766, 2.5219802856445312, 3.6921942234039307, 4.86240816116333, 6.032622337341309, 7.202836036682129, 8.37304973602295, 9.543264389038086, 10.713478088378906, 11.883691787719727, 13.053905487060547, 14.224119186401367, 15.394333839416504, 16.56454849243164, 17.734760284423828, 18.90497589111328, 20.0751895904541, 21.245403289794922, 22.415616989135742, 23.585830688476562, 24.756044387817383, 25.926258087158203, 27.096473693847656, 28.266687393188477, 29.436901092529297, 30.607114791870117, 31.777328491210938, 32.94754409790039, 34.11775588989258, 35.28797149658203, 36.45818328857422, 37.62839889526367, 38.798614501953125, 39.96882629394531]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 6.0, 2.0, 6.0, 12.0, 34.0, 36.0, 53.0, 107.0, 157.0, 306.0, 648.0, 1386.0, 3791.0, 13152.0, 64147.0, 832857.0, 3146873.0, 103454.0, 19161.0, 4906.0, 1716.0, 708.0, 332.0, 172.0, 95.0, 67.0, 36.0, 23.0, 19.0, 4.0, 2.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0703125, -4.88336181640625, -4.6964111328125, -4.50946044921875, -4.322509765625, -4.13555908203125, -3.9486083984375, -3.76165771484375, -3.57470703125, -3.38775634765625, -3.2008056640625, -3.01385498046875, -2.826904296875, -2.63995361328125, -2.4530029296875, -2.26605224609375, -2.0791015625, -1.89215087890625, -1.7052001953125, -1.51824951171875, -1.331298828125, -1.14434814453125, -0.9573974609375, -0.77044677734375, -0.58349609375, -0.39654541015625, -0.2095947265625, -0.02264404296875, 0.164306640625, 0.35125732421875, 0.5382080078125, 0.72515869140625, 0.912109375, 1.09906005859375, 1.2860107421875, 1.47296142578125, 1.659912109375, 1.84686279296875, 2.0338134765625, 2.22076416015625, 2.40771484375, 2.59466552734375, 2.7816162109375, 2.96856689453125, 3.155517578125, 3.34246826171875, 3.5294189453125, 3.71636962890625, 3.9033203125, 4.09027099609375, 4.2772216796875, 4.46417236328125, 4.651123046875, 4.83807373046875, 5.0250244140625, 5.21197509765625, 5.39892578125, 5.58587646484375, 5.7728271484375, 5.95977783203125, 6.146728515625, 6.33367919921875, 6.5206298828125, 6.70758056640625, 6.89453125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 7.0, 4.0, 3.0, 6.0, 18.0, 13.0, 18.0, 30.0, 33.0, 34.0, 49.0, 67.0, 60.0, 71.0, 68.0, 72.0, 58.0, 69.0, 67.0, 51.0, 41.0, 48.0, 29.0, 26.0, 11.0, 21.0, 12.0, 10.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9322509765625, -1.874267578125, -1.8162841796875, -1.75830078125, -1.7003173828125, -1.642333984375, -1.5843505859375, -1.5263671875, -1.4683837890625, -1.410400390625, -1.3524169921875, -1.29443359375, -1.2364501953125, -1.178466796875, -1.1204833984375, -1.0625, -1.0045166015625, -0.946533203125, -0.8885498046875, -0.83056640625, -0.7725830078125, -0.714599609375, -0.6566162109375, -0.5986328125, -0.5406494140625, -0.482666015625, -0.4246826171875, -0.36669921875, -0.3087158203125, -0.250732421875, -0.1927490234375, -0.134765625, -0.0767822265625, -0.018798828125, 0.0391845703125, 0.09716796875, 0.1551513671875, 0.213134765625, 0.2711181640625, 0.3291015625, 0.3870849609375, 0.445068359375, 0.5030517578125, 0.56103515625, 0.6190185546875, 0.677001953125, 0.7349853515625, 0.79296875, 0.8509521484375, 0.908935546875, 0.9669189453125, 1.02490234375, 1.0828857421875, 1.140869140625, 1.1988525390625, 1.2568359375, 1.3148193359375, 1.372802734375, 1.4307861328125, 1.48876953125, 1.5467529296875, 1.604736328125, 1.6627197265625, 1.720703125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 1.0, 9.0, 6.0, 7.0, 16.0, 14.0, 48.0, 63.0, 110.0, 244.0, 414.0, 901.0, 2130.0, 5298.0, 15886.0, 61680.0, 387324.0, 3239836.0, 392160.0, 62899.0, 15965.0, 5412.0, 2048.0, 880.0, 447.0, 212.0, 106.0, 71.0, 30.0, 27.0, 10.0, 13.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.59765625, -5.4522705078125, -5.306884765625, -5.1614990234375, -5.01611328125, -4.8707275390625, -4.725341796875, -4.5799560546875, -4.4345703125, -4.2891845703125, -4.143798828125, -3.9984130859375, -3.85302734375, -3.7076416015625, -3.562255859375, -3.4168701171875, -3.271484375, -3.1260986328125, -2.980712890625, -2.8353271484375, -2.68994140625, -2.5445556640625, -2.399169921875, -2.2537841796875, -2.1083984375, -1.9630126953125, -1.817626953125, -1.6722412109375, -1.52685546875, -1.3814697265625, -1.236083984375, -1.0906982421875, -0.9453125, -0.7999267578125, -0.654541015625, -0.5091552734375, -0.36376953125, -0.2183837890625, -0.072998046875, 0.0723876953125, 0.2177734375, 0.3631591796875, 0.508544921875, 0.6539306640625, 0.79931640625, 0.9447021484375, 1.090087890625, 1.2354736328125, 1.380859375, 1.5262451171875, 1.671630859375, 1.8170166015625, 1.96240234375, 2.1077880859375, 2.253173828125, 2.3985595703125, 2.5439453125, 2.6893310546875, 2.834716796875, 2.9801025390625, 3.12548828125, 3.2708740234375, 3.416259765625, 3.5616455078125, 3.70703125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 1.0, 3.0, 3.0, 9.0, 7.0, 9.0, 15.0, 19.0, 37.0, 45.0, 70.0, 116.0, 246.0, 472.0, 1336.0, 833.0, 373.0, 156.0, 100.0, 70.0, 51.0, 22.0, 18.0, 22.0, 10.0, 10.0, 8.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.49072265625, -2.4169921875, -2.34326171875, -2.26953125, -2.19580078125, -2.1220703125, -2.04833984375, -1.974609375, -1.90087890625, -1.8271484375, -1.75341796875, -1.6796875, -1.60595703125, -1.5322265625, -1.45849609375, -1.384765625, -1.31103515625, -1.2373046875, -1.16357421875, -1.08984375, -1.01611328125, -0.9423828125, -0.86865234375, -0.794921875, -0.72119140625, -0.6474609375, -0.57373046875, -0.5, -0.42626953125, -0.3525390625, -0.27880859375, -0.205078125, -0.13134765625, -0.0576171875, 0.01611328125, 0.08984375, 0.16357421875, 0.2373046875, 0.31103515625, 0.384765625, 0.45849609375, 0.5322265625, 0.60595703125, 0.6796875, 0.75341796875, 0.8271484375, 0.90087890625, 0.974609375, 1.04833984375, 1.1220703125, 1.19580078125, 1.26953125, 1.34326171875, 1.4169921875, 1.49072265625, 1.564453125, 1.63818359375, 1.7119140625, 1.78564453125, 1.859375, 1.93310546875, 2.0068359375, 2.08056640625, 2.154296875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 18.0, 31.0, 79.0, 110.0, 143.0, 185.0, 165.0, 118.0, 69.0, 41.0, 23.0, 8.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.505436897277832, -12.955610275268555, -12.405782699584961, -11.855955123901367, -11.30612850189209, -10.756301879882812, -10.206474304199219, -9.656646728515625, -9.106820106506348, -8.55699348449707, -8.007165908813477, -7.457338809967041, -6.9075117111206055, -6.35768461227417, -5.807857513427734, -5.258030414581299, -4.708203315734863, -4.158376216888428, -3.608549118041992, -3.0587220191955566, -2.508894920349121, -1.9590678215026855, -1.40924072265625, -0.8594136238098145, -0.3095865249633789, 0.24024057388305664, 0.7900676727294922, 1.3398947715759277, 1.8897218704223633, 2.439548969268799, 2.9893760681152344, 3.53920316696167, 4.089031219482422, 4.638858318328857, 5.188685417175293, 5.7385125160217285, 6.288339614868164, 6.8381667137146, 7.387993812561035, 7.937820911407471, 8.487648010253906, 9.0374755859375, 9.587302207946777, 10.137128829956055, 10.686956405639648, 11.236783981323242, 11.78661060333252, 12.336437225341797, 12.88626480102539, 13.436092376708984, 13.985918998718262, 14.535745620727539, 15.085573196411133, 15.635400772094727, 16.185226440429688, 16.73505401611328, 17.284881591796875, 17.83470916748047, 18.384536743164062, 18.934362411499023, 19.484189987182617, 20.03401756286621, 20.583843231201172, 21.133670806884766, 21.68349838256836]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 7.0, 7.0, 17.0, 16.0, 17.0, 22.0, 15.0, 19.0, 19.0, 43.0, 42.0, 35.0, 44.0, 43.0, 36.0, 45.0, 51.0, 35.0, 49.0, 59.0, 42.0, 34.0, 34.0, 39.0, 39.0, 28.0, 20.0, 24.0, 27.0, 13.0, 14.0, 10.0, 10.0, 13.0, 8.0, 5.0, 5.0, 1.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-8.615545272827148, -8.376341819763184, -8.137138366699219, -7.897934913635254, -7.658731460571289, -7.419528007507324, -7.180324554443359, -6.9411211013793945, -6.70191764831543, -6.462714195251465, -6.2235107421875, -5.984307289123535, -5.74510383605957, -5.5059003829956055, -5.266696929931641, -5.027493476867676, -4.788290023803711, -4.549086570739746, -4.309883117675781, -4.070679664611816, -3.8314762115478516, -3.5922727584838867, -3.353069305419922, -3.113865852355957, -2.874661922454834, -2.635458469390869, -2.3962550163269043, -2.1570515632629395, -1.9178481101989746, -1.6786445379257202, -1.4394410848617554, -1.2002376317977905, -0.9610342979431152, -0.7218308448791504, -0.48262736201286316, -0.24342387914657593, -0.004220426082611084, 0.23498308658599854, 0.4741865396499634, 0.7133899927139282, 0.9525934457778931, 1.191796898841858, 1.4310003519058228, 1.6702039241790771, 1.909407377243042, 2.148610830307007, 2.3878142833709717, 2.6270177364349365, 2.8662211894989014, 3.105424642562866, 3.344628095626831, 3.583831548690796, 3.8230350017547607, 4.062238693237305, 4.3014421463012695, 4.540645599365234, 4.779849052429199, 5.019052505493164, 5.258255958557129, 5.497459411621094, 5.736662864685059, 5.975866317749023, 6.215069770812988, 6.454273223876953, 6.693476676940918]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 11.0, 10.0, 24.0, 24.0, 30.0, 48.0, 75.0, 96.0, 156.0, 225.0, 318.0, 467.0, 786.0, 1319.0, 2094.0, 3535.0, 6423.0, 11349.0, 21342.0, 42072.0, 91235.0, 286800.0, 359274.0, 115476.0, 49347.0, 24815.0, 13297.0, 7332.0, 4099.0, 2430.0, 1478.0, 877.0, 574.0, 323.0, 221.0, 161.0, 104.0, 82.0, 75.0, 34.0, 34.0, 16.0, 16.0, 15.0, 9.0, 5.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-3.9296875, -3.80340576171875, -3.6771240234375, -3.55084228515625, -3.424560546875, -3.29827880859375, -3.1719970703125, -3.04571533203125, -2.91943359375, -2.79315185546875, -2.6668701171875, -2.54058837890625, -2.414306640625, -2.28802490234375, -2.1617431640625, -2.03546142578125, -1.9091796875, -1.78289794921875, -1.6566162109375, -1.53033447265625, -1.404052734375, -1.27777099609375, -1.1514892578125, -1.02520751953125, -0.89892578125, -0.77264404296875, -0.6463623046875, -0.52008056640625, -0.393798828125, -0.26751708984375, -0.1412353515625, -0.01495361328125, 0.111328125, 0.23760986328125, 0.3638916015625, 0.49017333984375, 0.616455078125, 0.74273681640625, 0.8690185546875, 0.99530029296875, 1.12158203125, 1.24786376953125, 1.3741455078125, 1.50042724609375, 1.626708984375, 1.75299072265625, 1.8792724609375, 2.00555419921875, 2.1318359375, 2.25811767578125, 2.3843994140625, 2.51068115234375, 2.636962890625, 2.76324462890625, 2.8895263671875, 3.01580810546875, 3.14208984375, 3.26837158203125, 3.3946533203125, 3.52093505859375, 3.647216796875, 3.77349853515625, 3.8997802734375, 4.02606201171875, 4.15234375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 16.0, 14.0, 25.0, 30.0, 31.0, 42.0, 39.0, 51.0, 62.0, 65.0, 54.0, 74.0, 56.0, 44.0, 68.0, 44.0, 51.0, 45.0, 35.0, 31.0, 21.0, 12.0, 18.0, 16.0, 9.0, 10.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6787109375, -1.6273040771484375, -1.575897216796875, -1.5244903564453125, -1.47308349609375, -1.4216766357421875, -1.370269775390625, -1.3188629150390625, -1.2674560546875, -1.2160491943359375, -1.164642333984375, -1.1132354736328125, -1.06182861328125, -1.0104217529296875, -0.959014892578125, -0.9076080322265625, -0.856201171875, -0.8047943115234375, -0.753387451171875, -0.7019805908203125, -0.65057373046875, -0.5991668701171875, -0.547760009765625, -0.4963531494140625, -0.4449462890625, -0.3935394287109375, -0.342132568359375, -0.2907257080078125, -0.23931884765625, -0.1879119873046875, -0.136505126953125, -0.0850982666015625, -0.03369140625, 0.0177154541015625, 0.069122314453125, 0.1205291748046875, 0.17193603515625, 0.2233428955078125, 0.274749755859375, 0.3261566162109375, 0.3775634765625, 0.4289703369140625, 0.480377197265625, 0.5317840576171875, 0.58319091796875, 0.6345977783203125, 0.686004638671875, 0.7374114990234375, 0.788818359375, 0.8402252197265625, 0.891632080078125, 0.9430389404296875, 0.99444580078125, 1.0458526611328125, 1.097259521484375, 1.1486663818359375, 1.2000732421875, 1.2514801025390625, 1.302886962890625, 1.3542938232421875, 1.40570068359375, 1.4571075439453125, 1.508514404296875, 1.5599212646484375, 1.611328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 4.0, 6.0, 7.0, 15.0, 13.0, 27.0, 26.0, 38.0, 56.0, 68.0, 89.0, 130.0, 197.0, 260.0, 414.0, 666.0, 1592.0, 4699.0, 22018.0, 174659.0, 743921.0, 81093.0, 12576.0, 3052.0, 1129.0, 605.0, 357.0, 230.0, 161.0, 126.0, 84.0, 71.0, 44.0, 31.0, 17.0, 15.0, 13.0, 10.0, 4.0, 5.0, 5.0, 5.0, 7.0, 2.0, 5.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.428466796875, -9.08349609375, -8.738525390625, -8.3935546875, -8.048583984375, -7.70361328125, -7.358642578125, -7.013671875, -6.668701171875, -6.32373046875, -5.978759765625, -5.6337890625, -5.288818359375, -4.94384765625, -4.598876953125, -4.25390625, -3.908935546875, -3.56396484375, -3.218994140625, -2.8740234375, -2.529052734375, -2.18408203125, -1.839111328125, -1.494140625, -1.149169921875, -0.80419921875, -0.459228515625, -0.1142578125, 0.230712890625, 0.57568359375, 0.920654296875, 1.265625, 1.610595703125, 1.95556640625, 2.300537109375, 2.6455078125, 2.990478515625, 3.33544921875, 3.680419921875, 4.025390625, 4.370361328125, 4.71533203125, 5.060302734375, 5.4052734375, 5.750244140625, 6.09521484375, 6.440185546875, 6.78515625, 7.130126953125, 7.47509765625, 7.820068359375, 8.1650390625, 8.510009765625, 8.85498046875, 9.199951171875, 9.544921875, 9.889892578125, 10.23486328125, 10.579833984375, 10.9248046875, 11.269775390625, 11.61474609375, 11.959716796875, 12.3046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 4.0, 6.0, 2.0, 13.0, 13.0, 24.0, 18.0, 25.0, 37.0, 56.0, 53.0, 51.0, 64.0, 63.0, 73.0, 77.0, 68.0, 61.0, 61.0, 42.0, 46.0, 38.0, 24.0, 15.0, 8.0, 16.0, 13.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0234375, -9.7059326171875, -9.388427734375, -9.0709228515625, -8.75341796875, -8.4359130859375, -8.118408203125, -7.8009033203125, -7.4833984375, -7.1658935546875, -6.848388671875, -6.5308837890625, -6.21337890625, -5.8958740234375, -5.578369140625, -5.2608642578125, -4.943359375, -4.6258544921875, -4.308349609375, -3.9908447265625, -3.67333984375, -3.3558349609375, -3.038330078125, -2.7208251953125, -2.4033203125, -2.0858154296875, -1.768310546875, -1.4508056640625, -1.13330078125, -0.8157958984375, -0.498291015625, -0.1807861328125, 0.13671875, 0.4542236328125, 0.771728515625, 1.0892333984375, 1.40673828125, 1.7242431640625, 2.041748046875, 2.3592529296875, 2.6767578125, 2.9942626953125, 3.311767578125, 3.6292724609375, 3.94677734375, 4.2642822265625, 4.581787109375, 4.8992919921875, 5.216796875, 5.5343017578125, 5.851806640625, 6.1693115234375, 6.48681640625, 6.8043212890625, 7.121826171875, 7.4393310546875, 7.7568359375, 8.0743408203125, 8.391845703125, 8.7093505859375, 9.02685546875, 9.3443603515625, 9.661865234375, 9.9793701171875, 10.296875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 4.0, 4.0, 6.0, 8.0, 15.0, 21.0, 39.0, 58.0, 113.0, 221.0, 556.0, 1738.0, 6581.0, 35956.0, 647516.0, 323599.0, 24780.0, 5048.0, 1340.0, 480.0, 215.0, 89.0, 56.0, 37.0, 21.0, 19.0, 10.0, 10.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.625, -7.385986328125, -7.14697265625, -6.907958984375, -6.6689453125, -6.429931640625, -6.19091796875, -5.951904296875, -5.712890625, -5.473876953125, -5.23486328125, -4.995849609375, -4.7568359375, -4.517822265625, -4.27880859375, -4.039794921875, -3.80078125, -3.561767578125, -3.32275390625, -3.083740234375, -2.8447265625, -2.605712890625, -2.36669921875, -2.127685546875, -1.888671875, -1.649658203125, -1.41064453125, -1.171630859375, -0.9326171875, -0.693603515625, -0.45458984375, -0.215576171875, 0.0234375, 0.262451171875, 0.50146484375, 0.740478515625, 0.9794921875, 1.218505859375, 1.45751953125, 1.696533203125, 1.935546875, 2.174560546875, 2.41357421875, 2.652587890625, 2.8916015625, 3.130615234375, 3.36962890625, 3.608642578125, 3.84765625, 4.086669921875, 4.32568359375, 4.564697265625, 4.8037109375, 5.042724609375, 5.28173828125, 5.520751953125, 5.759765625, 5.998779296875, 6.23779296875, 6.476806640625, 6.7158203125, 6.954833984375, 7.19384765625, 7.432861328125, 7.671875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 2.0, 7.0, 11.0, 17.0, 17.0, 26.0, 25.0, 62.0, 164.0, 328.0, 149.0, 60.0, 39.0, 22.0, 26.0, 14.0, 9.0, 8.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013980865478515625, -0.0013626813888549805, -0.0013272762298583984, -0.0012918710708618164, -0.0012564659118652344, -0.0012210607528686523, -0.0011856555938720703, -0.0011502504348754883, -0.0011148452758789062, -0.0010794401168823242, -0.0010440349578857422, -0.0010086297988891602, -0.0009732246398925781, -0.0009378194808959961, -0.0009024143218994141, -0.000867009162902832, -0.00083160400390625, -0.000796198844909668, -0.0007607936859130859, -0.0007253885269165039, -0.0006899833679199219, -0.0006545782089233398, -0.0006191730499267578, -0.0005837678909301758, -0.0005483627319335938, -0.0005129575729370117, -0.0004775524139404297, -0.00044214725494384766, -0.0004067420959472656, -0.0003713369369506836, -0.00033593177795410156, -0.00030052661895751953, -0.0002651214599609375, -0.00022971630096435547, -0.00019431114196777344, -0.0001589059829711914, -0.00012350082397460938, -8.809566497802734e-05, -5.269050598144531e-05, -1.728534698486328e-05, 1.811981201171875e-05, 5.352497100830078e-05, 8.893013000488281e-05, 0.00012433528900146484, 0.00015974044799804688, 0.0001951456069946289, 0.00023055076599121094, 0.00026595592498779297, 0.000301361083984375, 0.00033676624298095703, 0.00037217140197753906, 0.0004075765609741211, 0.0004429817199707031, 0.00047838687896728516, 0.0005137920379638672, 0.0005491971969604492, 0.0005846023559570312, 0.0006200075149536133, 0.0006554126739501953, 0.0006908178329467773, 0.0007262229919433594, 0.0007616281509399414, 0.0007970333099365234, 0.0008324384689331055, 0.0008678436279296875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 6.0, 9.0, 15.0, 25.0, 20.0, 32.0, 44.0, 66.0, 74.0, 98.0, 157.0, 249.0, 376.0, 803.0, 1972.0, 6522.0, 26612.0, 226530.0, 719006.0, 49839.0, 10611.0, 2966.0, 1112.0, 472.0, 258.0, 182.0, 113.0, 90.0, 67.0, 59.0, 39.0, 24.0, 28.0, 16.0, 16.0, 5.0, 7.0, 13.0, 4.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.59765625, -5.4122314453125, -5.226806640625, -5.0413818359375, -4.85595703125, -4.6705322265625, -4.485107421875, -4.2996826171875, -4.1142578125, -3.9288330078125, -3.743408203125, -3.5579833984375, -3.37255859375, -3.1871337890625, -3.001708984375, -2.8162841796875, -2.630859375, -2.4454345703125, -2.260009765625, -2.0745849609375, -1.88916015625, -1.7037353515625, -1.518310546875, -1.3328857421875, -1.1474609375, -0.9620361328125, -0.776611328125, -0.5911865234375, -0.40576171875, -0.2203369140625, -0.034912109375, 0.1505126953125, 0.3359375, 0.5213623046875, 0.706787109375, 0.8922119140625, 1.07763671875, 1.2630615234375, 1.448486328125, 1.6339111328125, 1.8193359375, 2.0047607421875, 2.190185546875, 2.3756103515625, 2.56103515625, 2.7464599609375, 2.931884765625, 3.1173095703125, 3.302734375, 3.4881591796875, 3.673583984375, 3.8590087890625, 4.04443359375, 4.2298583984375, 4.415283203125, 4.6007080078125, 4.7861328125, 4.9715576171875, 5.156982421875, 5.3424072265625, 5.52783203125, 5.7132568359375, 5.898681640625, 6.0841064453125, 6.26953125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 4.0, 8.0, 5.0, 13.0, 17.0, 24.0, 32.0, 58.0, 90.0, 147.0, 172.0, 149.0, 102.0, 65.0, 32.0, 17.0, 9.0, 8.0, 7.0, 12.0, 3.0, 4.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.9375, -4.7904052734375, -4.643310546875, -4.4962158203125, -4.34912109375, -4.2020263671875, -4.054931640625, -3.9078369140625, -3.7607421875, -3.6136474609375, -3.466552734375, -3.3194580078125, -3.17236328125, -3.0252685546875, -2.878173828125, -2.7310791015625, -2.583984375, -2.4368896484375, -2.289794921875, -2.1427001953125, -1.99560546875, -1.8485107421875, -1.701416015625, -1.5543212890625, -1.4072265625, -1.2601318359375, -1.113037109375, -0.9659423828125, -0.81884765625, -0.6717529296875, -0.524658203125, -0.3775634765625, -0.23046875, -0.0833740234375, 0.063720703125, 0.2108154296875, 0.35791015625, 0.5050048828125, 0.652099609375, 0.7991943359375, 0.9462890625, 1.0933837890625, 1.240478515625, 1.3875732421875, 1.53466796875, 1.6817626953125, 1.828857421875, 1.9759521484375, 2.123046875, 2.2701416015625, 2.417236328125, 2.5643310546875, 2.71142578125, 2.8585205078125, 3.005615234375, 3.1527099609375, 3.2998046875, 3.4468994140625, 3.593994140625, 3.7410888671875, 3.88818359375, 4.0352783203125, 4.182373046875, 4.3294677734375, 4.4765625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 36.0, 175.0, 422.0, 283.0, 67.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-160.450439453125, -155.81964111328125, -151.1888427734375, -146.55804443359375, -141.92724609375, -137.2964630126953, -132.66566467285156, -128.0348663330078, -123.40406799316406, -118.77326965332031, -114.14247131347656, -109.51168060302734, -104.8808822631836, -100.25008392333984, -95.61929321289062, -90.98849487304688, -86.35769653320312, -81.72689819335938, -77.09609985351562, -72.4653091430664, -67.83451080322266, -63.203712463378906, -58.57291793823242, -53.94212341308594, -49.31132507324219, -44.68052673339844, -40.04973220825195, -35.41893768310547, -30.78813934326172, -26.1573429107666, -21.526546478271484, -16.895751953125, -12.26495361328125, -7.634157180786133, -3.0033607482910156, 1.6274356842041016, 6.258232116699219, 10.889028549194336, 15.519824981689453, 20.150619506835938, 24.781417846679688, 29.412214279174805, 34.04301071166992, 38.673805236816406, 43.304603576660156, 47.935401916503906, 52.56619644165039, 57.196990966796875, 61.827789306640625, 66.45858764648438, 71.08938598632812, 75.72017669677734, 80.3509750366211, 84.98177337646484, 89.61256408691406, 94.24336242675781, 98.87416076660156, 103.50495910644531, 108.13575744628906, 112.76654815673828, 117.39734649658203, 122.02814483642578, 126.658935546875, 131.28973388671875, 135.9205322265625]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 7.0, 7.0, 10.0, 15.0, 15.0, 27.0, 38.0, 28.0, 43.0, 41.0, 43.0, 61.0, 45.0, 50.0, 53.0, 67.0, 59.0, 41.0, 50.0, 51.0, 50.0, 36.0, 26.0, 26.0, 26.0, 20.0, 15.0, 17.0, 9.0, 11.0, 3.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.61328125, -43.15272903442383, -41.69218063354492, -40.23162841796875, -38.771080017089844, -37.31052780151367, -35.8499755859375, -34.389427185058594, -32.92887496948242, -31.468324661254883, -30.007774353027344, -28.547222137451172, -27.086671829223633, -25.626121520996094, -24.165571212768555, -22.705020904541016, -21.244470596313477, -19.783920288085938, -18.3233699798584, -16.86281967163086, -15.402267456054688, -13.941717147827148, -12.48116683959961, -11.020615577697754, -9.560065269470215, -8.099514961242676, -6.63896369934082, -5.178413391113281, -3.717862606048584, -2.2573118209838867, -0.7967615127563477, 0.6637897491455078, 2.124340057373047, 3.584890842437744, 5.045441627502441, 6.5059919357299805, 7.966542720794678, 9.427093505859375, 10.887643814086914, 12.34819507598877, 13.808745384216309, 15.269295692443848, 16.729846954345703, 18.190397262573242, 19.65094757080078, 21.111499786376953, 22.57204818725586, 24.03260040283203, 25.49315071105957, 26.95370101928711, 28.41425132751465, 29.874801635742188, 31.33535385131836, 32.79590606689453, 34.25645446777344, 35.71700668334961, 37.177555084228516, 38.63810729980469, 40.098655700683594, 41.559207916259766, 43.01975631713867, 44.480308532714844, 45.94085693359375, 47.40140914916992, 48.861961364746094]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 3.0, 6.0, 11.0, 15.0, 23.0, 38.0, 45.0, 74.0, 107.0, 197.0, 333.0, 587.0, 1242.0, 2622.0, 6112.0, 17054.0, 59514.0, 376817.0, 3461937.0, 203479.0, 41504.0, 13111.0, 5184.0, 2143.0, 955.0, 521.0, 288.0, 134.0, 72.0, 50.0, 35.0, 20.0, 11.0, 10.0, 11.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5625, -5.390625, -5.21875, -5.046875, -4.875, -4.703125, -4.53125, -4.359375, -4.1875, -4.015625, -3.84375, -3.671875, -3.5, -3.328125, -3.15625, -2.984375, -2.8125, -2.640625, -2.46875, -2.296875, -2.125, -1.953125, -1.78125, -1.609375, -1.4375, -1.265625, -1.09375, -0.921875, -0.75, -0.578125, -0.40625, -0.234375, -0.0625, 0.109375, 0.28125, 0.453125, 0.625, 0.796875, 0.96875, 1.140625, 1.3125, 1.484375, 1.65625, 1.828125, 2.0, 2.171875, 2.34375, 2.515625, 2.6875, 2.859375, 3.03125, 3.203125, 3.375, 3.546875, 3.71875, 3.890625, 4.0625, 4.234375, 4.40625, 4.578125, 4.75, 4.921875, 5.09375, 5.265625, 5.4375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 7.0, 5.0, 4.0, 8.0, 19.0, 34.0, 35.0, 49.0, 61.0, 90.0, 92.0, 82.0, 101.0, 89.0, 63.0, 74.0, 63.0, 38.0, 34.0, 27.0, 13.0, 7.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.361328125, -3.27545166015625, -3.1895751953125, -3.10369873046875, -3.017822265625, -2.93194580078125, -2.8460693359375, -2.76019287109375, -2.67431640625, -2.58843994140625, -2.5025634765625, -2.41668701171875, -2.330810546875, -2.24493408203125, -2.1590576171875, -2.07318115234375, -1.9873046875, -1.90142822265625, -1.8155517578125, -1.72967529296875, -1.643798828125, -1.55792236328125, -1.4720458984375, -1.38616943359375, -1.30029296875, -1.21441650390625, -1.1285400390625, -1.04266357421875, -0.956787109375, -0.87091064453125, -0.7850341796875, -0.69915771484375, -0.61328125, -0.52740478515625, -0.4415283203125, -0.35565185546875, -0.269775390625, -0.18389892578125, -0.0980224609375, -0.01214599609375, 0.07373046875, 0.15960693359375, 0.2454833984375, 0.33135986328125, 0.417236328125, 0.50311279296875, 0.5889892578125, 0.67486572265625, 0.7607421875, 0.84661865234375, 0.9324951171875, 1.01837158203125, 1.104248046875, 1.19012451171875, 1.2760009765625, 1.36187744140625, 1.44775390625, 1.53363037109375, 1.6195068359375, 1.70538330078125, 1.791259765625, 1.87713623046875, 1.9630126953125, 2.04888916015625, 2.134765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 3.0, 3.0, 15.0, 24.0, 25.0, 49.0, 70.0, 111.0, 167.0, 316.0, 582.0, 1065.0, 2085.0, 4797.0, 13142.0, 47084.0, 288439.0, 3373105.0, 381400.0, 56486.0, 14944.0, 5388.0, 2324.0, 1106.0, 653.0, 382.0, 188.0, 121.0, 80.0, 41.0, 32.0, 16.0, 8.0, 12.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.62890625, -4.4609375, -4.29296875, -4.125, -3.95703125, -3.7890625, -3.62109375, -3.453125, -3.28515625, -3.1171875, -2.94921875, -2.78125, -2.61328125, -2.4453125, -2.27734375, -2.109375, -1.94140625, -1.7734375, -1.60546875, -1.4375, -1.26953125, -1.1015625, -0.93359375, -0.765625, -0.59765625, -0.4296875, -0.26171875, -0.09375, 0.07421875, 0.2421875, 0.41015625, 0.578125, 0.74609375, 0.9140625, 1.08203125, 1.25, 1.41796875, 1.5859375, 1.75390625, 1.921875, 2.08984375, 2.2578125, 2.42578125, 2.59375, 2.76171875, 2.9296875, 3.09765625, 3.265625, 3.43359375, 3.6015625, 3.76953125, 3.9375, 4.10546875, 4.2734375, 4.44140625, 4.609375, 4.77734375, 4.9453125, 5.11328125, 5.28125, 5.44921875, 5.6171875, 5.78515625, 5.953125, 6.12109375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 12.0, 16.0, 16.0, 27.0, 30.0, 75.0, 106.0, 210.0, 440.0, 1439.0, 954.0, 289.0, 170.0, 103.0, 39.0, 31.0, 25.0, 24.0, 15.0, 7.0, 10.0, 6.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.353515625, -2.277313232421875, -2.20111083984375, -2.124908447265625, -2.0487060546875, -1.972503662109375, -1.89630126953125, -1.820098876953125, -1.743896484375, -1.667694091796875, -1.59149169921875, -1.515289306640625, -1.4390869140625, -1.362884521484375, -1.28668212890625, -1.210479736328125, -1.13427734375, -1.058074951171875, -0.98187255859375, -0.905670166015625, -0.8294677734375, -0.753265380859375, -0.67706298828125, -0.600860595703125, -0.524658203125, -0.448455810546875, -0.37225341796875, -0.296051025390625, -0.2198486328125, -0.143646240234375, -0.06744384765625, 0.008758544921875, 0.0849609375, 0.161163330078125, 0.23736572265625, 0.313568115234375, 0.3897705078125, 0.465972900390625, 0.54217529296875, 0.618377685546875, 0.694580078125, 0.770782470703125, 0.84698486328125, 0.923187255859375, 0.9993896484375, 1.075592041015625, 1.15179443359375, 1.227996826171875, 1.30419921875, 1.380401611328125, 1.45660400390625, 1.532806396484375, 1.6090087890625, 1.685211181640625, 1.76141357421875, 1.837615966796875, 1.913818359375, 1.990020751953125, 2.06622314453125, 2.142425537109375, 2.2186279296875, 2.294830322265625, 2.37103271484375, 2.447235107421875, 2.5234375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 15.0, 38.0, 146.0, 244.0, 259.0, 175.0, 87.0, 21.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.4846076965332, -36.58036804199219, -35.676124572753906, -34.77188491821289, -33.86764144897461, -32.963401794433594, -32.05915832519531, -31.154918670654297, -30.25067901611328, -29.346437454223633, -28.442195892333984, -27.53795623779297, -26.63371467590332, -25.729473114013672, -24.825231552124023, -23.920989990234375, -23.016748428344727, -22.112506866455078, -21.20826530456543, -20.30402374267578, -19.399784088134766, -18.495542526245117, -17.59130096435547, -16.68705940246582, -15.782818794250488, -14.87857723236084, -13.974336624145508, -13.07009506225586, -12.165853500366211, -11.261612892150879, -10.35737133026123, -9.453130722045898, -8.54888916015625, -7.64464807510376, -6.7404069900512695, -5.836165428161621, -4.931924343109131, -4.027683258056641, -3.123441696166992, -2.219200611114502, -1.3149595260620117, -0.41071832180023193, 0.49352288246154785, 1.3977642059326172, 2.3020052909851074, 3.2062463760375977, 4.110487937927246, 5.014729022979736, 5.918970108032227, 6.823211193084717, 7.727452278137207, 8.631693840026855, 9.535934448242188, 10.440176010131836, 11.344417572021484, 12.248659133911133, 13.152899742126465, 14.057141304016113, 14.961381912231445, 15.865623474121094, 16.769865036010742, 17.67410659790039, 18.578346252441406, 19.482587814331055, 20.386829376220703]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 8.0, 12.0, 11.0, 30.0, 27.0, 41.0, 43.0, 63.0, 57.0, 80.0, 75.0, 76.0, 75.0, 76.0, 65.0, 67.0, 46.0, 30.0, 32.0, 30.0, 18.0, 9.0, 14.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.544825553894043, -9.139784812927246, -8.734743118286133, -8.329702377319336, -7.924661636352539, -7.519620895385742, -7.114579677581787, -6.709538459777832, -6.304497718811035, -5.899456977844238, -5.494415760040283, -5.089374542236328, -4.684333801269531, -4.279293060302734, -3.8742518424987793, -3.4692108631134033, -3.0641698837280273, -2.6591289043426514, -2.2540879249572754, -1.8490469455718994, -1.4440059661865234, -1.0389649868011475, -0.6339240074157715, -0.2288830280303955, 0.17615795135498047, 0.5811989307403564, 0.9862399101257324, 1.3912808895111084, 1.7963218688964844, 2.2013628482818604, 2.6064038276672363, 3.0114448070526123, 3.416484832763672, 3.821525812149048, 4.226566791534424, 4.631608009338379, 5.036648750305176, 5.441689491271973, 5.846730709075928, 6.251771926879883, 6.65681266784668, 7.061853408813477, 7.466894626617432, 7.871935844421387, 8.276976585388184, 8.68201732635498, 9.087059020996094, 9.49209976196289, 9.897140502929688, 10.302181243896484, 10.707221984863281, 11.112263679504395, 11.517304420471191, 11.922345161437988, 12.327386856079102, 12.732427597045898, 13.137468338012695, 13.542509078979492, 13.947549819946289, 14.352591514587402, 14.7576322555542, 15.162672996520996, 15.56771469116211, 15.972755432128906, 16.377796173095703]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 8.0, 11.0, 19.0, 40.0, 39.0, 64.0, 104.0, 141.0, 242.0, 434.0, 876.0, 1903.0, 4532.0, 11538.0, 30348.0, 87544.0, 345274.0, 404301.0, 103879.0, 34531.0, 13155.0, 5156.0, 2144.0, 980.0, 511.0, 268.0, 181.0, 101.0, 77.0, 55.0, 26.0, 22.0, 18.0, 6.0, 5.0, 5.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.765625, -4.61224365234375, -4.4588623046875, -4.30548095703125, -4.152099609375, -3.99871826171875, -3.8453369140625, -3.69195556640625, -3.53857421875, -3.38519287109375, -3.2318115234375, -3.07843017578125, -2.925048828125, -2.77166748046875, -2.6182861328125, -2.46490478515625, -2.3115234375, -2.15814208984375, -2.0047607421875, -1.85137939453125, -1.697998046875, -1.54461669921875, -1.3912353515625, -1.23785400390625, -1.08447265625, -0.93109130859375, -0.7777099609375, -0.62432861328125, -0.470947265625, -0.31756591796875, -0.1641845703125, -0.01080322265625, 0.142578125, 0.29595947265625, 0.4493408203125, 0.60272216796875, 0.756103515625, 0.90948486328125, 1.0628662109375, 1.21624755859375, 1.36962890625, 1.52301025390625, 1.6763916015625, 1.82977294921875, 1.983154296875, 2.13653564453125, 2.2899169921875, 2.44329833984375, 2.5966796875, 2.75006103515625, 2.9034423828125, 3.05682373046875, 3.210205078125, 3.36358642578125, 3.5169677734375, 3.67034912109375, 3.82373046875, 3.97711181640625, 4.1304931640625, 4.28387451171875, 4.437255859375, 4.59063720703125, 4.7440185546875, 4.89739990234375, 5.05078125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 5.0, 3.0, 9.0, 16.0, 18.0, 28.0, 35.0, 36.0, 60.0, 45.0, 80.0, 74.0, 52.0, 90.0, 66.0, 68.0, 63.0, 53.0, 46.0, 43.0, 29.0, 22.0, 15.0, 15.0, 13.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.158203125, -2.08935546875, -2.0205078125, -1.95166015625, -1.8828125, -1.81396484375, -1.7451171875, -1.67626953125, -1.607421875, -1.53857421875, -1.4697265625, -1.40087890625, -1.33203125, -1.26318359375, -1.1943359375, -1.12548828125, -1.056640625, -0.98779296875, -0.9189453125, -0.85009765625, -0.78125, -0.71240234375, -0.6435546875, -0.57470703125, -0.505859375, -0.43701171875, -0.3681640625, -0.29931640625, -0.23046875, -0.16162109375, -0.0927734375, -0.02392578125, 0.044921875, 0.11376953125, 0.1826171875, 0.25146484375, 0.3203125, 0.38916015625, 0.4580078125, 0.52685546875, 0.595703125, 0.66455078125, 0.7333984375, 0.80224609375, 0.87109375, 0.93994140625, 1.0087890625, 1.07763671875, 1.146484375, 1.21533203125, 1.2841796875, 1.35302734375, 1.421875, 1.49072265625, 1.5595703125, 1.62841796875, 1.697265625, 1.76611328125, 1.8349609375, 1.90380859375, 1.97265625, 2.04150390625, 2.1103515625, 2.17919921875, 2.248046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 4.0, 5.0, 12.0, 10.0, 14.0, 21.0, 33.0, 35.0, 34.0, 36.0, 66.0, 90.0, 112.0, 180.0, 322.0, 537.0, 1136.0, 2568.0, 7141.0, 22232.0, 75731.0, 393498.0, 427585.0, 80483.0, 23558.0, 7588.0, 2807.0, 1127.0, 512.0, 307.0, 197.0, 140.0, 106.0, 55.0, 66.0, 47.0, 32.0, 24.0, 30.0, 19.0, 7.0, 7.0, 10.0, 8.0, 4.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.31640625, -5.13934326171875, -4.9622802734375, -4.78521728515625, -4.608154296875, -4.43109130859375, -4.2540283203125, -4.07696533203125, -3.89990234375, -3.72283935546875, -3.5457763671875, -3.36871337890625, -3.191650390625, -3.01458740234375, -2.8375244140625, -2.66046142578125, -2.4833984375, -2.30633544921875, -2.1292724609375, -1.95220947265625, -1.775146484375, -1.59808349609375, -1.4210205078125, -1.24395751953125, -1.06689453125, -0.88983154296875, -0.7127685546875, -0.53570556640625, -0.358642578125, -0.18157958984375, -0.0045166015625, 0.17254638671875, 0.349609375, 0.52667236328125, 0.7037353515625, 0.88079833984375, 1.057861328125, 1.23492431640625, 1.4119873046875, 1.58905029296875, 1.76611328125, 1.94317626953125, 2.1202392578125, 2.29730224609375, 2.474365234375, 2.65142822265625, 2.8284912109375, 3.00555419921875, 3.1826171875, 3.35968017578125, 3.5367431640625, 3.71380615234375, 3.890869140625, 4.06793212890625, 4.2449951171875, 4.42205810546875, 4.59912109375, 4.77618408203125, 4.9532470703125, 5.13031005859375, 5.307373046875, 5.48443603515625, 5.6614990234375, 5.83856201171875, 6.015625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 5.0, 5.0, 3.0, 9.0, 10.0, 8.0, 13.0, 11.0, 15.0, 21.0, 20.0, 29.0, 32.0, 43.0, 44.0, 41.0, 41.0, 49.0, 55.0, 54.0, 49.0, 54.0, 46.0, 45.0, 41.0, 38.0, 40.0, 27.0, 30.0, 19.0, 16.0, 19.0, 5.0, 11.0, 9.0, 9.0, 9.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.7421875, -6.5362548828125, -6.330322265625, -6.1243896484375, -5.91845703125, -5.7125244140625, -5.506591796875, -5.3006591796875, -5.0947265625, -4.8887939453125, -4.682861328125, -4.4769287109375, -4.27099609375, -4.0650634765625, -3.859130859375, -3.6531982421875, -3.447265625, -3.2413330078125, -3.035400390625, -2.8294677734375, -2.62353515625, -2.4176025390625, -2.211669921875, -2.0057373046875, -1.7998046875, -1.5938720703125, -1.387939453125, -1.1820068359375, -0.97607421875, -0.7701416015625, -0.564208984375, -0.3582763671875, -0.15234375, 0.0535888671875, 0.259521484375, 0.4654541015625, 0.67138671875, 0.8773193359375, 1.083251953125, 1.2891845703125, 1.4951171875, 1.7010498046875, 1.906982421875, 2.1129150390625, 2.31884765625, 2.5247802734375, 2.730712890625, 2.9366455078125, 3.142578125, 3.3485107421875, 3.554443359375, 3.7603759765625, 3.96630859375, 4.1722412109375, 4.378173828125, 4.5841064453125, 4.7900390625, 4.9959716796875, 5.201904296875, 5.4078369140625, 5.61376953125, 5.8197021484375, 6.025634765625, 6.2315673828125, 6.4375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 5.0, 11.0, 7.0, 11.0, 27.0, 22.0, 39.0, 82.0, 116.0, 211.0, 396.0, 764.0, 1609.0, 3579.0, 8511.0, 20865.0, 53863.0, 179511.0, 504714.0, 182410.0, 54867.0, 21428.0, 8554.0, 3739.0, 1527.0, 750.0, 396.0, 176.0, 122.0, 87.0, 41.0, 39.0, 29.0, 14.0, 14.0, 10.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.99609375, -1.9327392578125, -1.869384765625, -1.8060302734375, -1.74267578125, -1.6793212890625, -1.615966796875, -1.5526123046875, -1.4892578125, -1.4259033203125, -1.362548828125, -1.2991943359375, -1.23583984375, -1.1724853515625, -1.109130859375, -1.0457763671875, -0.982421875, -0.9190673828125, -0.855712890625, -0.7923583984375, -0.72900390625, -0.6656494140625, -0.602294921875, -0.5389404296875, -0.4755859375, -0.4122314453125, -0.348876953125, -0.2855224609375, -0.22216796875, -0.1588134765625, -0.095458984375, -0.0321044921875, 0.03125, 0.0946044921875, 0.157958984375, 0.2213134765625, 0.28466796875, 0.3480224609375, 0.411376953125, 0.4747314453125, 0.5380859375, 0.6014404296875, 0.664794921875, 0.7281494140625, 0.79150390625, 0.8548583984375, 0.918212890625, 0.9815673828125, 1.044921875, 1.1082763671875, 1.171630859375, 1.2349853515625, 1.29833984375, 1.3616943359375, 1.425048828125, 1.4884033203125, 1.5517578125, 1.6151123046875, 1.678466796875, 1.7418212890625, 1.80517578125, 1.8685302734375, 1.931884765625, 1.9952392578125, 2.05859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 9.0, 14.0, 19.0, 10.0, 20.0, 26.0, 36.0, 82.0, 227.0, 271.0, 114.0, 52.0, 32.0, 19.0, 15.0, 8.0, 11.0, 12.0, 3.0, 4.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007982254028320312, -0.0007708445191383362, -0.0007434636354446411, -0.000716082751750946, -0.000688701868057251, -0.0006613209843635559, -0.0006339401006698608, -0.0006065592169761658, -0.0005791783332824707, -0.0005517974495887756, -0.0005244165658950806, -0.0004970356822013855, -0.00046965479850769043, -0.00044227391481399536, -0.0004148930311203003, -0.0003875121474266052, -0.00036013126373291016, -0.0003327503800392151, -0.00030536949634552, -0.00027798861265182495, -0.0002506077289581299, -0.00022322684526443481, -0.00019584596157073975, -0.00016846507787704468, -0.0001410841941833496, -0.00011370331048965454, -8.632242679595947e-05, -5.8941543102264404e-05, -3.1560659408569336e-05, -4.179775714874268e-06, 2.32011079788208e-05, 5.058199167251587e-05, 7.796287536621094e-05, 0.000105343759059906, 0.00013272464275360107, 0.00016010552644729614, 0.0001874864101409912, 0.00021486729383468628, 0.00024224817752838135, 0.0002696290612220764, 0.0002970099449157715, 0.00032439082860946655, 0.0003517717123031616, 0.0003791525959968567, 0.00040653347969055176, 0.0004339143633842468, 0.0004612952470779419, 0.000488676130771637, 0.000516057014465332, 0.0005434378981590271, 0.0005708187818527222, 0.0005981996655464172, 0.0006255805492401123, 0.0006529614329338074, 0.0006803423166275024, 0.0007077232003211975, 0.0007351040840148926, 0.0007624849677085876, 0.0007898658514022827, 0.0008172467350959778, 0.0008446276187896729, 0.0008720085024833679, 0.000899389386177063, 0.0009267702698707581, 0.0009541511535644531]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 10.0, 11.0, 24.0, 38.0, 69.0, 151.0, 247.0, 464.0, 1042.0, 2880.0, 10405.0, 47986.0, 365536.0, 533803.0, 66088.0, 13717.0, 3706.0, 1202.0, 542.0, 267.0, 145.0, 96.0, 42.0, 31.0, 20.0, 6.0, 6.0, 5.0, 4.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.845703125, -2.747894287109375, -2.65008544921875, -2.552276611328125, -2.4544677734375, -2.356658935546875, -2.25885009765625, -2.161041259765625, -2.063232421875, -1.965423583984375, -1.86761474609375, -1.769805908203125, -1.6719970703125, -1.574188232421875, -1.47637939453125, -1.378570556640625, -1.28076171875, -1.182952880859375, -1.08514404296875, -0.987335205078125, -0.8895263671875, -0.791717529296875, -0.69390869140625, -0.596099853515625, -0.498291015625, -0.400482177734375, -0.30267333984375, -0.204864501953125, -0.1070556640625, -0.009246826171875, 0.08856201171875, 0.186370849609375, 0.2841796875, 0.381988525390625, 0.47979736328125, 0.577606201171875, 0.6754150390625, 0.773223876953125, 0.87103271484375, 0.968841552734375, 1.066650390625, 1.164459228515625, 1.26226806640625, 1.360076904296875, 1.4578857421875, 1.555694580078125, 1.65350341796875, 1.751312255859375, 1.84912109375, 1.946929931640625, 2.04473876953125, 2.142547607421875, 2.2403564453125, 2.338165283203125, 2.43597412109375, 2.533782958984375, 2.631591796875, 2.729400634765625, 2.82720947265625, 2.925018310546875, 3.0228271484375, 3.120635986328125, 3.21844482421875, 3.316253662109375, 3.4140625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 3.0, 8.0, 10.0, 21.0, 19.0, 28.0, 35.0, 37.0, 37.0, 61.0, 85.0, 101.0, 86.0, 88.0, 70.0, 74.0, 46.0, 34.0, 29.0, 30.0, 16.0, 14.0, 12.0, 11.0, 0.0, 8.0, 4.0, 4.0, 5.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.92578125, -1.862030029296875, -1.79827880859375, -1.734527587890625, -1.6707763671875, -1.607025146484375, -1.54327392578125, -1.479522705078125, -1.415771484375, -1.352020263671875, -1.28826904296875, -1.224517822265625, -1.1607666015625, -1.097015380859375, -1.03326416015625, -0.969512939453125, -0.90576171875, -0.842010498046875, -0.77825927734375, -0.714508056640625, -0.6507568359375, -0.587005615234375, -0.52325439453125, -0.459503173828125, -0.395751953125, -0.332000732421875, -0.26824951171875, -0.204498291015625, -0.1407470703125, -0.076995849609375, -0.01324462890625, 0.050506591796875, 0.1142578125, 0.178009033203125, 0.24176025390625, 0.305511474609375, 0.3692626953125, 0.433013916015625, 0.49676513671875, 0.560516357421875, 0.624267578125, 0.688018798828125, 0.75177001953125, 0.815521240234375, 0.8792724609375, 0.943023681640625, 1.00677490234375, 1.070526123046875, 1.13427734375, 1.198028564453125, 1.26177978515625, 1.325531005859375, 1.3892822265625, 1.453033447265625, 1.51678466796875, 1.580535888671875, 1.644287109375, 1.708038330078125, 1.77178955078125, 1.835540771484375, 1.8992919921875, 1.963043212890625, 2.02679443359375, 2.090545654296875, 2.154296875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 4.0, 8.0, 8.0, 30.0, 30.0, 58.0, 73.0, 103.0, 138.0, 123.0, 123.0, 94.0, 75.0, 44.0, 52.0, 24.0, 4.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.062045097351074, -12.923528671264648, -11.785013198852539, -10.646496772766113, -9.507980346679688, -8.369464874267578, -7.230948448181152, -6.092432498931885, -4.953916549682617, -3.8154006004333496, -2.676884412765503, -1.5383682250976562, -0.39985227584838867, 0.7386636734008789, 1.8771800994873047, 3.0156960487365723, 4.15421199798584, 5.292727947235107, 6.431243896484375, 7.569760322570801, 8.708276748657227, 9.846792221069336, 10.985308647155762, 12.123825073242188, 13.262340545654297, 14.400856971740723, 15.539372444152832, 16.677888870239258, 17.816404342651367, 18.95492172241211, 20.09343719482422, 21.231952667236328, 22.370471954345703, 23.508987426757812, 24.647504806518555, 25.786020278930664, 26.924535751342773, 28.063053131103516, 29.201568603515625, 30.340084075927734, 31.478599548339844, 32.61711502075195, 33.75563049316406, 34.89414978027344, 36.03266525268555, 37.171180725097656, 38.309696197509766, 39.448211669921875, 40.58673095703125, 41.72524642944336, 42.86376190185547, 44.002281188964844, 45.14079666137695, 46.27931213378906, 47.41782760620117, 48.55634307861328, 49.69485855102539, 50.8333740234375, 51.97188949584961, 53.11040496826172, 54.248924255371094, 55.3874397277832, 56.52595520019531, 57.66447067260742, 58.80298614501953]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 10.0, 10.0, 8.0, 15.0, 15.0, 8.0, 12.0, 24.0, 19.0, 26.0, 21.0, 31.0, 39.0, 30.0, 43.0, 44.0, 51.0, 43.0, 31.0, 49.0, 50.0, 37.0, 36.0, 45.0, 38.0, 43.0, 29.0, 23.0, 27.0, 23.0, 23.0, 15.0, 15.0, 13.0, 10.0, 7.0, 7.0, 6.0, 3.0, 6.0, 3.0, 5.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-30.50589370727539, -29.586015701293945, -28.666139602661133, -27.746261596679688, -26.826385498046875, -25.90650749206543, -24.986629486083984, -24.066753387451172, -23.14687728881836, -22.226999282836914, -21.3071231842041, -20.387245178222656, -19.467369079589844, -18.5474910736084, -17.627613067626953, -16.70773696899414, -15.787858963012695, -14.867981910705566, -13.948104858398438, -13.028226852416992, -12.10835075378418, -11.188472747802734, -10.268595695495605, -9.348718643188477, -8.428841590881348, -7.508964538574219, -6.58908748626709, -5.669209957122803, -4.749332904815674, -3.829455852508545, -2.909578323364258, -1.989701271057129, -1.0698261260986328, -0.14994895458221436, 0.7699282169342041, 1.689805507659912, 2.609682559967041, 3.52955961227417, 4.449437141418457, 5.369314193725586, 6.289191246032715, 7.209068298339844, 8.128945350646973, 9.048822402954102, 9.968700408935547, 10.88857650756836, 11.808454513549805, 12.728331565856934, 13.648208618164062, 14.568085670471191, 15.48796272277832, 16.407840728759766, 17.327716827392578, 18.247594833374023, 19.16747283935547, 20.08734893798828, 21.007225036621094, 21.92710304260254, 22.84697914123535, 23.766857147216797, 24.68673324584961, 25.606611251831055, 26.5264892578125, 27.446365356445312, 28.366243362426758]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 6.0, 11.0, 7.0, 18.0, 24.0, 37.0, 82.0, 146.0, 230.0, 452.0, 1176.0, 3013.0, 9854.0, 43983.0, 397290.0, 3577626.0, 128615.0, 22310.0, 5843.0, 1995.0, 784.0, 365.0, 183.0, 98.0, 55.0, 25.0, 20.0, 17.0, 10.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.698486328125, -8.42041015625, -8.142333984375, -7.8642578125, -7.586181640625, -7.30810546875, -7.030029296875, -6.751953125, -6.473876953125, -6.19580078125, -5.917724609375, -5.6396484375, -5.361572265625, -5.08349609375, -4.805419921875, -4.52734375, -4.249267578125, -3.97119140625, -3.693115234375, -3.4150390625, -3.136962890625, -2.85888671875, -2.580810546875, -2.302734375, -2.024658203125, -1.74658203125, -1.468505859375, -1.1904296875, -0.912353515625, -0.63427734375, -0.356201171875, -0.078125, 0.199951171875, 0.47802734375, 0.756103515625, 1.0341796875, 1.312255859375, 1.59033203125, 1.868408203125, 2.146484375, 2.424560546875, 2.70263671875, 2.980712890625, 3.2587890625, 3.536865234375, 3.81494140625, 4.093017578125, 4.37109375, 4.649169921875, 4.92724609375, 5.205322265625, 5.4833984375, 5.761474609375, 6.03955078125, 6.317626953125, 6.595703125, 6.873779296875, 7.15185546875, 7.429931640625, 7.7080078125, 7.986083984375, 8.26416015625, 8.542236328125, 8.8203125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 9.0, 8.0, 21.0, 27.0, 39.0, 54.0, 65.0, 67.0, 77.0, 98.0, 79.0, 89.0, 86.0, 67.0, 50.0, 48.0, 37.0, 22.0, 22.0, 13.0, 13.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.990234375, -2.905914306640625, -2.82159423828125, -2.737274169921875, -2.6529541015625, -2.568634033203125, -2.48431396484375, -2.399993896484375, -2.315673828125, -2.231353759765625, -2.14703369140625, -2.062713623046875, -1.9783935546875, -1.894073486328125, -1.80975341796875, -1.725433349609375, -1.64111328125, -1.556793212890625, -1.47247314453125, -1.388153076171875, -1.3038330078125, -1.219512939453125, -1.13519287109375, -1.050872802734375, -0.966552734375, -0.882232666015625, -0.79791259765625, -0.713592529296875, -0.6292724609375, -0.544952392578125, -0.46063232421875, -0.376312255859375, -0.2919921875, -0.207672119140625, -0.12335205078125, -0.039031982421875, 0.0452880859375, 0.129608154296875, 0.21392822265625, 0.298248291015625, 0.382568359375, 0.466888427734375, 0.55120849609375, 0.635528564453125, 0.7198486328125, 0.804168701171875, 0.88848876953125, 0.972808837890625, 1.05712890625, 1.141448974609375, 1.22576904296875, 1.310089111328125, 1.3944091796875, 1.478729248046875, 1.56304931640625, 1.647369384765625, 1.731689453125, 1.816009521484375, 1.90032958984375, 1.984649658203125, 2.0689697265625, 2.153289794921875, 2.23760986328125, 2.321929931640625, 2.40625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 7.0, 5.0, 9.0, 19.0, 23.0, 31.0, 36.0, 58.0, 72.0, 140.0, 184.0, 342.0, 641.0, 1400.0, 3347.0, 9663.0, 31624.0, 145182.0, 2913963.0, 953561.0, 97520.0, 23630.0, 7537.0, 2788.0, 1120.0, 549.0, 310.0, 169.0, 120.0, 67.0, 62.0, 44.0, 19.0, 19.0, 8.0, 7.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-8.40625, -8.1900634765625, -7.973876953125, -7.7576904296875, -7.54150390625, -7.3253173828125, -7.109130859375, -6.8929443359375, -6.6767578125, -6.4605712890625, -6.244384765625, -6.0281982421875, -5.81201171875, -5.5958251953125, -5.379638671875, -5.1634521484375, -4.947265625, -4.7310791015625, -4.514892578125, -4.2987060546875, -4.08251953125, -3.8663330078125, -3.650146484375, -3.4339599609375, -3.2177734375, -3.0015869140625, -2.785400390625, -2.5692138671875, -2.35302734375, -2.1368408203125, -1.920654296875, -1.7044677734375, -1.48828125, -1.2720947265625, -1.055908203125, -0.8397216796875, -0.62353515625, -0.4073486328125, -0.191162109375, 0.0250244140625, 0.2412109375, 0.4573974609375, 0.673583984375, 0.8897705078125, 1.10595703125, 1.3221435546875, 1.538330078125, 1.7545166015625, 1.970703125, 2.1868896484375, 2.403076171875, 2.6192626953125, 2.83544921875, 3.0516357421875, 3.267822265625, 3.4840087890625, 3.7001953125, 3.9163818359375, 4.132568359375, 4.3487548828125, 4.56494140625, 4.7811279296875, 4.997314453125, 5.2135009765625, 5.4296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 4.0, 4.0, 10.0, 16.0, 26.0, 27.0, 54.0, 71.0, 182.0, 356.0, 1953.0, 792.0, 258.0, 118.0, 68.0, 40.0, 30.0, 19.0, 13.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.298828125, -3.184234619140625, -3.06964111328125, -2.955047607421875, -2.8404541015625, -2.725860595703125, -2.61126708984375, -2.496673583984375, -2.382080078125, -2.267486572265625, -2.15289306640625, -2.038299560546875, -1.9237060546875, -1.809112548828125, -1.69451904296875, -1.579925537109375, -1.46533203125, -1.350738525390625, -1.23614501953125, -1.121551513671875, -1.0069580078125, -0.892364501953125, -0.77777099609375, -0.663177490234375, -0.548583984375, -0.433990478515625, -0.31939697265625, -0.204803466796875, -0.0902099609375, 0.024383544921875, 0.13897705078125, 0.253570556640625, 0.3681640625, 0.482757568359375, 0.59735107421875, 0.711944580078125, 0.8265380859375, 0.941131591796875, 1.05572509765625, 1.170318603515625, 1.284912109375, 1.399505615234375, 1.51409912109375, 1.628692626953125, 1.7432861328125, 1.857879638671875, 1.97247314453125, 2.087066650390625, 2.20166015625, 2.316253662109375, 2.43084716796875, 2.545440673828125, 2.6600341796875, 2.774627685546875, 2.88922119140625, 3.003814697265625, 3.118408203125, 3.233001708984375, 3.34759521484375, 3.462188720703125, 3.5767822265625, 3.691375732421875, 3.80596923828125, 3.920562744140625, 4.03515625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 31.0, 75.0, 161.0, 259.0, 229.0, 137.0, 64.0, 24.0, 6.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.901268005371094, -32.962127685546875, -32.02299118041992, -31.083850860595703, -30.144712448120117, -29.20557403564453, -28.266435623168945, -27.32729721069336, -26.38815689086914, -25.449018478393555, -24.50988006591797, -23.57073974609375, -22.631601333618164, -21.692462921142578, -20.753324508666992, -19.814186096191406, -18.87504768371582, -17.935909271240234, -16.99677085876465, -16.057632446289062, -15.118492126464844, -14.179353713989258, -13.240215301513672, -12.301076889038086, -11.361937522888184, -10.422799110412598, -9.483659744262695, -8.54452133178711, -7.605382442474365, -6.666243553161621, -5.727105140686035, -4.787966251373291, -3.848825454711914, -2.90968656539917, -1.9705479145050049, -1.0314092636108398, -0.0922703742980957, 0.8468685150146484, 1.7860069274902344, 2.7251458168029785, 3.6642847061157227, 4.603423595428467, 5.542562484741211, 6.481700897216797, 7.420839786529541, 8.359978675842285, 9.299117088317871, 10.238256454467773, 11.17739486694336, 12.116533279418945, 13.055672645568848, 13.994811058044434, 14.933950424194336, 15.873088836669922, 16.812227249145508, 17.751365661621094, 18.690505981445312, 19.6296443939209, 20.568782806396484, 21.507923126220703, 22.44706153869629, 23.386199951171875, 24.32533836364746, 25.264476776123047, 26.203615188598633]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 8.0, 19.0, 33.0, 23.0, 41.0, 36.0, 43.0, 59.0, 66.0, 77.0, 78.0, 74.0, 79.0, 57.0, 50.0, 69.0, 44.0, 26.0, 29.0, 27.0, 21.0, 9.0, 9.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.98840045928955, -14.559985160827637, -14.131569862365723, -13.703154563903809, -13.274739265441895, -12.84632396697998, -12.41790771484375, -11.989492416381836, -11.561077117919922, -11.132661819458008, -10.704246520996094, -10.27583122253418, -9.847415924072266, -9.419000625610352, -8.990585327148438, -8.562170028686523, -8.13375473022461, -7.705339431762695, -7.276924133300781, -6.848508834838867, -6.420093536376953, -5.991678237915039, -5.563262462615967, -5.134847164154053, -4.706431865692139, -4.278016567230225, -3.8496012687683105, -3.4211857318878174, -2.9927704334259033, -2.5643551349639893, -2.135939598083496, -1.707524299621582, -1.2791080474853516, -0.8506926894187927, -0.4222773313522339, 0.0061380863189697266, 0.4345533847808838, 0.8629686832427979, 1.291384220123291, 1.719799518585205, 2.148214817047119, 2.576630115509033, 3.0050454139709473, 3.4334609508514404, 3.8618762493133545, 4.290291786193848, 4.718707084655762, 5.147122383117676, 5.57553768157959, 6.003952980041504, 6.432368278503418, 6.860783576965332, 7.289198875427246, 7.71761417388916, 8.14603042602539, 8.574445724487305, 9.002861022949219, 9.431276321411133, 9.859691619873047, 10.288106918334961, 10.716522216796875, 11.144937515258789, 11.573352813720703, 12.001768112182617, 12.430183410644531]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 6.0, 8.0, 8.0, 15.0, 25.0, 44.0, 67.0, 76.0, 128.0, 177.0, 299.0, 497.0, 867.0, 1499.0, 2962.0, 6057.0, 13621.0, 29586.0, 65467.0, 133748.0, 284623.0, 269018.0, 126163.0, 61239.0, 27987.0, 12424.0, 5689.0, 2729.0, 1441.0, 801.0, 412.0, 288.0, 174.0, 118.0, 96.0, 56.0, 39.0, 25.0, 21.0, 11.0, 9.0, 7.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.37890625, -4.23272705078125, -4.0865478515625, -3.94036865234375, -3.794189453125, -3.64801025390625, -3.5018310546875, -3.35565185546875, -3.20947265625, -3.06329345703125, -2.9171142578125, -2.77093505859375, -2.624755859375, -2.47857666015625, -2.3323974609375, -2.18621826171875, -2.0400390625, -1.89385986328125, -1.7476806640625, -1.60150146484375, -1.455322265625, -1.30914306640625, -1.1629638671875, -1.01678466796875, -0.87060546875, -0.72442626953125, -0.5782470703125, -0.43206787109375, -0.285888671875, -0.13970947265625, 0.0064697265625, 0.15264892578125, 0.298828125, 0.44500732421875, 0.5911865234375, 0.73736572265625, 0.883544921875, 1.02972412109375, 1.1759033203125, 1.32208251953125, 1.46826171875, 1.61444091796875, 1.7606201171875, 1.90679931640625, 2.052978515625, 2.19915771484375, 2.3453369140625, 2.49151611328125, 2.6376953125, 2.78387451171875, 2.9300537109375, 3.07623291015625, 3.222412109375, 3.36859130859375, 3.5147705078125, 3.66094970703125, 3.80712890625, 3.95330810546875, 4.0994873046875, 4.24566650390625, 4.391845703125, 4.53802490234375, 4.6842041015625, 4.83038330078125, 4.9765625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 5.0, 5.0, 8.0, 11.0, 24.0, 22.0, 34.0, 49.0, 47.0, 45.0, 58.0, 79.0, 79.0, 77.0, 73.0, 78.0, 61.0, 57.0, 39.0, 44.0, 24.0, 21.0, 22.0, 14.0, 12.0, 11.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.275390625, -2.20318603515625, -2.1309814453125, -2.05877685546875, -1.986572265625, -1.91436767578125, -1.8421630859375, -1.76995849609375, -1.69775390625, -1.62554931640625, -1.5533447265625, -1.48114013671875, -1.408935546875, -1.33673095703125, -1.2645263671875, -1.19232177734375, -1.1201171875, -1.04791259765625, -0.9757080078125, -0.90350341796875, -0.831298828125, -0.75909423828125, -0.6868896484375, -0.61468505859375, -0.54248046875, -0.47027587890625, -0.3980712890625, -0.32586669921875, -0.253662109375, -0.18145751953125, -0.1092529296875, -0.03704833984375, 0.03515625, 0.10736083984375, 0.1795654296875, 0.25177001953125, 0.323974609375, 0.39617919921875, 0.4683837890625, 0.54058837890625, 0.61279296875, 0.68499755859375, 0.7572021484375, 0.82940673828125, 0.901611328125, 0.97381591796875, 1.0460205078125, 1.11822509765625, 1.1904296875, 1.26263427734375, 1.3348388671875, 1.40704345703125, 1.479248046875, 1.55145263671875, 1.6236572265625, 1.69586181640625, 1.76806640625, 1.84027099609375, 1.9124755859375, 1.98468017578125, 2.056884765625, 2.12908935546875, 2.2012939453125, 2.27349853515625, 2.345703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 0.0, 11.0, 15.0, 29.0, 31.0, 37.0, 71.0, 92.0, 145.0, 231.0, 325.0, 548.0, 901.0, 2309.0, 12086.0, 137102.0, 743249.0, 134653.0, 12039.0, 2236.0, 939.0, 524.0, 330.0, 209.0, 143.0, 96.0, 70.0, 46.0, 40.0, 15.0, 12.0, 10.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.90625, -10.49462890625, -10.0830078125, -9.67138671875, -9.259765625, -8.84814453125, -8.4365234375, -8.02490234375, -7.61328125, -7.20166015625, -6.7900390625, -6.37841796875, -5.966796875, -5.55517578125, -5.1435546875, -4.73193359375, -4.3203125, -3.90869140625, -3.4970703125, -3.08544921875, -2.673828125, -2.26220703125, -1.8505859375, -1.43896484375, -1.02734375, -0.61572265625, -0.2041015625, 0.20751953125, 0.619140625, 1.03076171875, 1.4423828125, 1.85400390625, 2.265625, 2.67724609375, 3.0888671875, 3.50048828125, 3.912109375, 4.32373046875, 4.7353515625, 5.14697265625, 5.55859375, 5.97021484375, 6.3818359375, 6.79345703125, 7.205078125, 7.61669921875, 8.0283203125, 8.43994140625, 8.8515625, 9.26318359375, 9.6748046875, 10.08642578125, 10.498046875, 10.90966796875, 11.3212890625, 11.73291015625, 12.14453125, 12.55615234375, 12.9677734375, 13.37939453125, 13.791015625, 14.20263671875, 14.6142578125, 15.02587890625, 15.4375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 10.0, 5.0, 17.0, 12.0, 18.0, 15.0, 31.0, 42.0, 28.0, 36.0, 39.0, 44.0, 64.0, 62.0, 67.0, 63.0, 60.0, 57.0, 57.0, 51.0, 27.0, 40.0, 31.0, 22.0, 27.0, 9.0, 13.0, 8.0, 11.0, 11.0, 5.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4375, -11.135498046875, -10.83349609375, -10.531494140625, -10.2294921875, -9.927490234375, -9.62548828125, -9.323486328125, -9.021484375, -8.719482421875, -8.41748046875, -8.115478515625, -7.8134765625, -7.511474609375, -7.20947265625, -6.907470703125, -6.60546875, -6.303466796875, -6.00146484375, -5.699462890625, -5.3974609375, -5.095458984375, -4.79345703125, -4.491455078125, -4.189453125, -3.887451171875, -3.58544921875, -3.283447265625, -2.9814453125, -2.679443359375, -2.37744140625, -2.075439453125, -1.7734375, -1.471435546875, -1.16943359375, -0.867431640625, -0.5654296875, -0.263427734375, 0.03857421875, 0.340576171875, 0.642578125, 0.944580078125, 1.24658203125, 1.548583984375, 1.8505859375, 2.152587890625, 2.45458984375, 2.756591796875, 3.05859375, 3.360595703125, 3.66259765625, 3.964599609375, 4.2666015625, 4.568603515625, 4.87060546875, 5.172607421875, 5.474609375, 5.776611328125, 6.07861328125, 6.380615234375, 6.6826171875, 6.984619140625, 7.28662109375, 7.588623046875, 7.890625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 11.0, 4.0, 10.0, 26.0, 37.0, 67.0, 125.0, 206.0, 423.0, 1156.0, 4807.0, 41824.0, 731836.0, 246546.0, 17304.0, 2725.0, 741.0, 296.0, 143.0, 99.0, 63.0, 31.0, 23.0, 16.0, 9.0, 7.0, 0.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6015625, -7.318115234375, -7.03466796875, -6.751220703125, -6.4677734375, -6.184326171875, -5.90087890625, -5.617431640625, -5.333984375, -5.050537109375, -4.76708984375, -4.483642578125, -4.2001953125, -3.916748046875, -3.63330078125, -3.349853515625, -3.06640625, -2.782958984375, -2.49951171875, -2.216064453125, -1.9326171875, -1.649169921875, -1.36572265625, -1.082275390625, -0.798828125, -0.515380859375, -0.23193359375, 0.051513671875, 0.3349609375, 0.618408203125, 0.90185546875, 1.185302734375, 1.46875, 1.752197265625, 2.03564453125, 2.319091796875, 2.6025390625, 2.885986328125, 3.16943359375, 3.452880859375, 3.736328125, 4.019775390625, 4.30322265625, 4.586669921875, 4.8701171875, 5.153564453125, 5.43701171875, 5.720458984375, 6.00390625, 6.287353515625, 6.57080078125, 6.854248046875, 7.1376953125, 7.421142578125, 7.70458984375, 7.988037109375, 8.271484375, 8.554931640625, 8.83837890625, 9.121826171875, 9.4052734375, 9.688720703125, 9.97216796875, 10.255615234375, 10.5390625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 2.0, 5.0, 10.0, 11.0, 8.0, 13.0, 20.0, 23.0, 27.0, 26.0, 42.0, 34.0, 53.0, 69.0, 131.0, 157.0, 73.0, 45.0, 45.0, 31.0, 30.0, 21.0, 18.0, 17.0, 20.0, 13.0, 15.0, 10.0, 9.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008115768432617188, -0.0007890611886978149, -0.0007665455341339111, -0.0007440298795700073, -0.0007215142250061035, -0.0006989985704421997, -0.0006764829158782959, -0.0006539672613143921, -0.0006314516067504883, -0.0006089359521865845, -0.0005864202976226807, -0.0005639046430587769, -0.000541388988494873, -0.0005188733339309692, -0.0004963576793670654, -0.0004738420248031616, -0.0004513263702392578, -0.000428810715675354, -0.0004062950611114502, -0.0003837794065475464, -0.0003612637519836426, -0.00033874809741973877, -0.00031623244285583496, -0.00029371678829193115, -0.00027120113372802734, -0.00024868547916412354, -0.00022616982460021973, -0.00020365417003631592, -0.0001811385154724121, -0.0001586228609085083, -0.0001361072063446045, -0.00011359155178070068, -9.107589721679688e-05, -6.856024265289307e-05, -4.604458808898926e-05, -2.352893352508545e-05, -1.0132789611816406e-06, 2.1502375602722168e-05, 4.4018030166625977e-05, 6.653368473052979e-05, 8.90493392944336e-05, 0.0001115649938583374, 0.0001340806484222412, 0.00015659630298614502, 0.00017911195755004883, 0.00020162761211395264, 0.00022414326667785645, 0.00024665892124176025, 0.00026917457580566406, 0.00029169023036956787, 0.0003142058849334717, 0.0003367215394973755, 0.0003592371940612793, 0.0003817528486251831, 0.0004042685031890869, 0.0004267841577529907, 0.00044929981231689453, 0.00047181546688079834, 0.0004943311214447021, 0.000516846776008606, 0.0005393624305725098, 0.0005618780851364136, 0.0005843937397003174, 0.0006069093942642212, 0.000629425048828125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 5.0, 6.0, 3.0, 11.0, 20.0, 32.0, 56.0, 129.0, 242.0, 609.0, 1883.0, 14377.0, 784188.0, 238246.0, 6536.0, 1314.0, 465.0, 208.0, 101.0, 62.0, 24.0, 18.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.2515869140625, -9.839111328125, -9.4266357421875, -9.01416015625, -8.6016845703125, -8.189208984375, -7.7767333984375, -7.3642578125, -6.9517822265625, -6.539306640625, -6.1268310546875, -5.71435546875, -5.3018798828125, -4.889404296875, -4.4769287109375, -4.064453125, -3.6519775390625, -3.239501953125, -2.8270263671875, -2.41455078125, -2.0020751953125, -1.589599609375, -1.1771240234375, -0.7646484375, -0.3521728515625, 0.060302734375, 0.4727783203125, 0.88525390625, 1.2977294921875, 1.710205078125, 2.1226806640625, 2.53515625, 2.9476318359375, 3.360107421875, 3.7725830078125, 4.18505859375, 4.5975341796875, 5.010009765625, 5.4224853515625, 5.8349609375, 6.2474365234375, 6.659912109375, 7.0723876953125, 7.48486328125, 7.8973388671875, 8.309814453125, 8.7222900390625, 9.134765625, 9.5472412109375, 9.959716796875, 10.3721923828125, 10.78466796875, 11.1971435546875, 11.609619140625, 12.0220947265625, 12.4345703125, 12.8470458984375, 13.259521484375, 13.6719970703125, 14.08447265625, 14.4969482421875, 14.909423828125, 15.3218994140625, 15.734375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 6.0, 3.0, 7.0, 16.0, 16.0, 24.0, 52.0, 89.0, 158.0, 201.0, 182.0, 102.0, 46.0, 46.0, 25.0, 10.0, 11.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5, -6.23583984375, -5.9716796875, -5.70751953125, -5.443359375, -5.17919921875, -4.9150390625, -4.65087890625, -4.38671875, -4.12255859375, -3.8583984375, -3.59423828125, -3.330078125, -3.06591796875, -2.8017578125, -2.53759765625, -2.2734375, -2.00927734375, -1.7451171875, -1.48095703125, -1.216796875, -0.95263671875, -0.6884765625, -0.42431640625, -0.16015625, 0.10400390625, 0.3681640625, 0.63232421875, 0.896484375, 1.16064453125, 1.4248046875, 1.68896484375, 1.953125, 2.21728515625, 2.4814453125, 2.74560546875, 3.009765625, 3.27392578125, 3.5380859375, 3.80224609375, 4.06640625, 4.33056640625, 4.5947265625, 4.85888671875, 5.123046875, 5.38720703125, 5.6513671875, 5.91552734375, 6.1796875, 6.44384765625, 6.7080078125, 6.97216796875, 7.236328125, 7.50048828125, 7.7646484375, 8.02880859375, 8.29296875, 8.55712890625, 8.8212890625, 9.08544921875, 9.349609375, 9.61376953125, 9.8779296875, 10.14208984375, 10.40625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 16.0, 128.0, 492.0, 341.0, 29.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.72306823730469, -94.0143814086914, -85.30569458007812, -76.59701538085938, -67.88832092285156, -59.17963790893555, -50.47095489501953, -41.76226806640625, -33.05358123779297, -24.344894409179688, -15.636209487915039, -6.927524566650391, 1.7811622619628906, 10.489849090576172, 19.198532104492188, 27.90721893310547, 36.61590576171875, 45.32459259033203, 54.03327941894531, 62.74196243286133, 71.45065307617188, 80.15933227539062, 88.8680191040039, 97.57670593261719, 106.28539276123047, 114.99407958984375, 123.70276641845703, 132.4114532470703, 141.12013244628906, 149.82882690429688, 158.53750610351562, 167.24618530273438, 175.95486450195312, 184.66354370117188, 193.3722381591797, 202.08091735839844, 210.78961181640625, 219.498291015625, 228.20697021484375, 236.91566467285156, 245.62435913085938, 254.33303833007812, 263.0417175292969, 271.75042724609375, 280.4591064453125, 289.16778564453125, 297.87646484375, 306.58514404296875, 315.2938232421875, 324.00250244140625, 332.711181640625, 341.4198913574219, 350.1285705566406, 358.8372497558594, 367.5459289550781, 376.254638671875, 384.96331787109375, 393.6719970703125, 402.38067626953125, 411.0893859863281, 419.7980651855469, 428.5067443847656, 437.2154235839844, 445.92413330078125, 454.6328125]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 1.0, 4.0, 5.0, 8.0, 9.0, 8.0, 10.0, 6.0, 19.0, 21.0, 13.0, 17.0, 29.0, 25.0, 31.0, 34.0, 36.0, 37.0, 36.0, 51.0, 43.0, 52.0, 40.0, 47.0, 52.0, 54.0, 46.0, 35.0, 32.0, 39.0, 21.0, 28.0, 18.0, 11.0, 13.0, 13.0, 20.0, 11.0, 7.0, 5.0, 3.0, 3.0, 1.0, 5.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.50923156738281, -39.20338821411133, -37.89754104614258, -36.591697692871094, -35.28585433959961, -33.980010986328125, -32.674163818359375, -31.36832046508789, -30.062475204467773, -28.756629943847656, -27.450786590576172, -26.144941329956055, -24.839096069335938, -23.533252716064453, -22.227407455444336, -20.92156219482422, -19.615718841552734, -18.309873580932617, -17.004030227661133, -15.698184967041016, -14.392340660095215, -13.086496353149414, -11.780651092529297, -10.474806785583496, -9.168962478637695, -7.8631181716918945, -6.5572733879089355, -5.251428604125977, -3.945584297180176, -2.639739990234375, -1.333895206451416, -0.02805042266845703, 1.2777938842773438, 2.5836384296417236, 3.8894829750061035, 5.1953277587890625, 6.501172065734863, 7.807016372680664, 9.112861633300781, 10.418705940246582, 11.724550247192383, 13.030394554138184, 14.336238861083984, 15.642084121704102, 16.94792938232422, 18.253772735595703, 19.55961799621582, 20.865463256835938, 22.171306610107422, 23.47715187072754, 24.782995223999023, 26.08884048461914, 27.394683837890625, 28.700529098510742, 30.00637435913086, 31.312217712402344, 32.618064880371094, 33.92390823364258, 35.22975540161133, 36.53559875488281, 37.8414421081543, 39.14728546142578, 40.45313262939453, 41.758975982666016, 43.0648193359375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 11.0, 15.0, 26.0, 30.0, 39.0, 64.0, 83.0, 142.0, 223.0, 379.0, 673.0, 1225.0, 2226.0, 4550.0, 9945.0, 24933.0, 72816.0, 294221.0, 2996457.0, 607158.0, 116974.0, 35890.0, 13793.0, 5894.0, 2830.0, 1458.0, 833.0, 488.0, 285.0, 177.0, 138.0, 99.0, 61.0, 36.0, 25.0, 12.0, 19.0, 13.0, 9.0, 8.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-4.84375, -4.68060302734375, -4.5174560546875, -4.35430908203125, -4.191162109375, -4.02801513671875, -3.8648681640625, -3.70172119140625, -3.53857421875, -3.37542724609375, -3.2122802734375, -3.04913330078125, -2.885986328125, -2.72283935546875, -2.5596923828125, -2.39654541015625, -2.2333984375, -2.07025146484375, -1.9071044921875, -1.74395751953125, -1.580810546875, -1.41766357421875, -1.2545166015625, -1.09136962890625, -0.92822265625, -0.76507568359375, -0.6019287109375, -0.43878173828125, -0.275634765625, -0.11248779296875, 0.0506591796875, 0.21380615234375, 0.376953125, 0.54010009765625, 0.7032470703125, 0.86639404296875, 1.029541015625, 1.19268798828125, 1.3558349609375, 1.51898193359375, 1.68212890625, 1.84527587890625, 2.0084228515625, 2.17156982421875, 2.334716796875, 2.49786376953125, 2.6610107421875, 2.82415771484375, 2.9873046875, 3.15045166015625, 3.3135986328125, 3.47674560546875, 3.639892578125, 3.80303955078125, 3.9661865234375, 4.12933349609375, 4.29248046875, 4.45562744140625, 4.6187744140625, 4.78192138671875, 4.945068359375, 5.10821533203125, 5.2713623046875, 5.43450927734375, 5.59765625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 13.0, 11.0, 16.0, 13.0, 31.0, 36.0, 33.0, 48.0, 46.0, 60.0, 57.0, 70.0, 68.0, 69.0, 82.0, 55.0, 35.0, 59.0, 33.0, 43.0, 27.0, 21.0, 19.0, 20.0, 8.0, 6.0, 4.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0078125, -1.933074951171875, -1.85833740234375, -1.783599853515625, -1.7088623046875, -1.634124755859375, -1.55938720703125, -1.484649658203125, -1.409912109375, -1.335174560546875, -1.26043701171875, -1.185699462890625, -1.1109619140625, -1.036224365234375, -0.96148681640625, -0.886749267578125, -0.81201171875, -0.737274169921875, -0.66253662109375, -0.587799072265625, -0.5130615234375, -0.438323974609375, -0.36358642578125, -0.288848876953125, -0.214111328125, -0.139373779296875, -0.06463623046875, 0.010101318359375, 0.0848388671875, 0.159576416015625, 0.23431396484375, 0.309051513671875, 0.3837890625, 0.458526611328125, 0.53326416015625, 0.608001708984375, 0.6827392578125, 0.757476806640625, 0.83221435546875, 0.906951904296875, 0.981689453125, 1.056427001953125, 1.13116455078125, 1.205902099609375, 1.2806396484375, 1.355377197265625, 1.43011474609375, 1.504852294921875, 1.57958984375, 1.654327392578125, 1.72906494140625, 1.803802490234375, 1.8785400390625, 1.953277587890625, 2.02801513671875, 2.102752685546875, 2.177490234375, 2.252227783203125, 2.32696533203125, 2.401702880859375, 2.4764404296875, 2.551177978515625, 2.62591552734375, 2.700653076171875, 2.775390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 3.0, 8.0, 13.0, 8.0, 17.0, 17.0, 21.0, 27.0, 33.0, 55.0, 77.0, 111.0, 141.0, 218.0, 347.0, 595.0, 1103.0, 2345.0, 5719.0, 15984.0, 58237.0, 316670.0, 3144478.0, 531754.0, 82130.0, 21080.0, 7051.0, 2818.0, 1307.0, 675.0, 374.0, 248.0, 152.0, 120.0, 85.0, 61.0, 47.0, 35.0, 24.0, 13.0, 16.0, 15.0, 12.0, 8.0, 6.0, 4.0, 7.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.046875, -6.830810546875, -6.61474609375, -6.398681640625, -6.1826171875, -5.966552734375, -5.75048828125, -5.534423828125, -5.318359375, -5.102294921875, -4.88623046875, -4.670166015625, -4.4541015625, -4.238037109375, -4.02197265625, -3.805908203125, -3.58984375, -3.373779296875, -3.15771484375, -2.941650390625, -2.7255859375, -2.509521484375, -2.29345703125, -2.077392578125, -1.861328125, -1.645263671875, -1.42919921875, -1.213134765625, -0.9970703125, -0.781005859375, -0.56494140625, -0.348876953125, -0.1328125, 0.083251953125, 0.29931640625, 0.515380859375, 0.7314453125, 0.947509765625, 1.16357421875, 1.379638671875, 1.595703125, 1.811767578125, 2.02783203125, 2.243896484375, 2.4599609375, 2.676025390625, 2.89208984375, 3.108154296875, 3.32421875, 3.540283203125, 3.75634765625, 3.972412109375, 4.1884765625, 4.404541015625, 4.62060546875, 4.836669921875, 5.052734375, 5.268798828125, 5.48486328125, 5.700927734375, 5.9169921875, 6.133056640625, 6.34912109375, 6.565185546875, 6.78125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 7.0, 3.0, 2.0, 2.0, 6.0, 9.0, 20.0, 15.0, 37.0, 49.0, 70.0, 157.0, 339.0, 866.0, 1519.0, 465.0, 220.0, 89.0, 75.0, 46.0, 20.0, 21.0, 11.0, 12.0, 13.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44140625, -4.2943115234375, -4.147216796875, -4.0001220703125, -3.85302734375, -3.7059326171875, -3.558837890625, -3.4117431640625, -3.2646484375, -3.1175537109375, -2.970458984375, -2.8233642578125, -2.67626953125, -2.5291748046875, -2.382080078125, -2.2349853515625, -2.087890625, -1.9407958984375, -1.793701171875, -1.6466064453125, -1.49951171875, -1.3524169921875, -1.205322265625, -1.0582275390625, -0.9111328125, -0.7640380859375, -0.616943359375, -0.4698486328125, -0.32275390625, -0.1756591796875, -0.028564453125, 0.1185302734375, 0.265625, 0.4127197265625, 0.559814453125, 0.7069091796875, 0.85400390625, 1.0010986328125, 1.148193359375, 1.2952880859375, 1.4423828125, 1.5894775390625, 1.736572265625, 1.8836669921875, 2.03076171875, 2.1778564453125, 2.324951171875, 2.4720458984375, 2.619140625, 2.7662353515625, 2.913330078125, 3.0604248046875, 3.20751953125, 3.3546142578125, 3.501708984375, 3.6488037109375, 3.7958984375, 3.9429931640625, 4.090087890625, 4.2371826171875, 4.38427734375, 4.5313720703125, 4.678466796875, 4.8255615234375, 4.97265625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 9.0, 23.0, 73.0, 147.0, 259.0, 252.0, 141.0, 72.0, 20.0, 10.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.7510986328125, -26.18678855895996, -24.622478485107422, -23.058170318603516, -21.493860244750977, -19.929550170898438, -18.36524200439453, -16.800931930541992, -15.236621856689453, -13.672311782836914, -12.108002662658691, -10.543693542480469, -8.97938346862793, -7.415073871612549, -5.850764274597168, -4.286455154418945, -2.7221450805664062, -1.1578354835510254, 0.40647411346435547, 1.9707837104797363, 3.535093307495117, 5.099402904510498, 6.663712501525879, 8.228021621704102, 9.79233169555664, 11.35664176940918, 12.920950889587402, 14.485260009765625, 16.049570083618164, 17.613880157470703, 19.17818832397461, 20.74249839782715, 22.306808471679688, 23.871118545532227, 25.435428619384766, 26.999736785888672, 28.56404685974121, 30.12835693359375, 31.692665100097656, 33.25697326660156, 34.821285247802734, 36.38559341430664, 37.94990539550781, 39.51421356201172, 41.078521728515625, 42.6428337097168, 44.2071418762207, 45.771453857421875, 47.33576202392578, 48.90007019042969, 50.46438217163086, 52.028690338134766, 53.59300231933594, 55.157310485839844, 56.72161865234375, 58.285926818847656, 59.85023880004883, 61.414546966552734, 62.978858947753906, 64.54316711425781, 66.10747528076172, 67.67178344726562, 69.23609924316406, 70.80040740966797, 72.36471557617188]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 7.0, 2.0, 3.0, 5.0, 11.0, 6.0, 20.0, 16.0, 14.0, 15.0, 34.0, 28.0, 33.0, 32.0, 41.0, 44.0, 50.0, 43.0, 48.0, 58.0, 51.0, 43.0, 51.0, 58.0, 36.0, 33.0, 29.0, 33.0, 18.0, 28.0, 21.0, 17.0, 19.0, 11.0, 10.0, 10.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0396728515625, -14.59972858428955, -14.159783363342285, -13.719839096069336, -13.279894828796387, -12.839950561523438, -12.400005340576172, -11.960061073303223, -11.520116806030273, -11.080172538757324, -10.640227317810059, -10.20028305053711, -9.76033878326416, -9.320394515991211, -8.880449295043945, -8.440505027770996, -8.00055980682373, -7.560615062713623, -7.120670795440674, -6.680726051330566, -6.240781784057617, -5.80083703994751, -5.360892295837402, -4.920948028564453, -4.481003284454346, -4.041058540344238, -3.601114273071289, -3.1611695289611816, -2.7212250232696533, -2.281280517578125, -1.8413357734680176, -1.4013912677764893, -0.9614458084106445, -0.5215012431144714, -0.08155667781829834, 0.35838794708251953, 0.7983324527740479, 1.2382769584655762, 1.6782217025756836, 2.118166208267212, 2.5581107139587402, 2.9980552196502686, 3.437999725341797, 3.8779444694519043, 4.317889213562012, 4.757833480834961, 5.197778224945068, 5.637722969055176, 6.077667236328125, 6.517611980438232, 6.957556247711182, 7.397500991821289, 7.837445259094238, 8.277389526367188, 8.717334747314453, 9.157279014587402, 9.597223281860352, 10.0371675491333, 10.477112770080566, 10.917057037353516, 11.357001304626465, 11.796945571899414, 12.23689079284668, 12.676835060119629, 13.116780281066895]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 14.0, 17.0, 19.0, 35.0, 37.0, 72.0, 90.0, 143.0, 212.0, 321.0, 583.0, 962.0, 1841.0, 3654.0, 7559.0, 16539.0, 37897.0, 87269.0, 180744.0, 266960.0, 225658.0, 119967.0, 54132.0, 23138.0, 10414.0, 4774.0, 2345.0, 1241.0, 706.0, 398.0, 267.0, 185.0, 100.0, 88.0, 49.0, 35.0, 24.0, 18.0, 9.0, 10.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2265625, -4.06829833984375, -3.9100341796875, -3.75177001953125, -3.593505859375, -3.43524169921875, -3.2769775390625, -3.11871337890625, -2.96044921875, -2.80218505859375, -2.6439208984375, -2.48565673828125, -2.327392578125, -2.16912841796875, -2.0108642578125, -1.85260009765625, -1.6943359375, -1.53607177734375, -1.3778076171875, -1.21954345703125, -1.061279296875, -0.90301513671875, -0.7447509765625, -0.58648681640625, -0.42822265625, -0.26995849609375, -0.1116943359375, 0.04656982421875, 0.204833984375, 0.36309814453125, 0.5213623046875, 0.67962646484375, 0.837890625, 0.99615478515625, 1.1544189453125, 1.31268310546875, 1.470947265625, 1.62921142578125, 1.7874755859375, 1.94573974609375, 2.10400390625, 2.26226806640625, 2.4205322265625, 2.57879638671875, 2.737060546875, 2.89532470703125, 3.0535888671875, 3.21185302734375, 3.3701171875, 3.52838134765625, 3.6866455078125, 3.84490966796875, 4.003173828125, 4.16143798828125, 4.3197021484375, 4.47796630859375, 4.63623046875, 4.79449462890625, 4.9527587890625, 5.11102294921875, 5.269287109375, 5.42755126953125, 5.5858154296875, 5.74407958984375, 5.90234375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 6.0, 4.0, 3.0, 13.0, 11.0, 18.0, 19.0, 26.0, 31.0, 32.0, 47.0, 47.0, 49.0, 58.0, 61.0, 64.0, 57.0, 57.0, 46.0, 58.0, 49.0, 46.0, 37.0, 39.0, 20.0, 22.0, 12.0, 19.0, 14.0, 6.0, 7.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.841796875, -1.774200439453125, -1.70660400390625, -1.639007568359375, -1.5714111328125, -1.503814697265625, -1.43621826171875, -1.368621826171875, -1.301025390625, -1.233428955078125, -1.16583251953125, -1.098236083984375, -1.0306396484375, -0.963043212890625, -0.89544677734375, -0.827850341796875, -0.76025390625, -0.692657470703125, -0.62506103515625, -0.557464599609375, -0.4898681640625, -0.422271728515625, -0.35467529296875, -0.287078857421875, -0.219482421875, -0.151885986328125, -0.08428955078125, -0.016693115234375, 0.0509033203125, 0.118499755859375, 0.18609619140625, 0.253692626953125, 0.3212890625, 0.388885498046875, 0.45648193359375, 0.524078369140625, 0.5916748046875, 0.659271240234375, 0.72686767578125, 0.794464111328125, 0.862060546875, 0.929656982421875, 0.99725341796875, 1.064849853515625, 1.1324462890625, 1.200042724609375, 1.26763916015625, 1.335235595703125, 1.40283203125, 1.470428466796875, 1.53802490234375, 1.605621337890625, 1.6732177734375, 1.740814208984375, 1.80841064453125, 1.876007080078125, 1.943603515625, 2.011199951171875, 2.07879638671875, 2.146392822265625, 2.2139892578125, 2.281585693359375, 2.34918212890625, 2.416778564453125, 2.484375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 9.0, 5.0, 6.0, 8.0, 16.0, 18.0, 18.0, 44.0, 54.0, 65.0, 136.0, 192.0, 307.0, 560.0, 1062.0, 2444.0, 11569.0, 167021.0, 760598.0, 92060.0, 8020.0, 2095.0, 905.0, 524.0, 270.0, 194.0, 128.0, 67.0, 40.0, 32.0, 25.0, 18.0, 11.0, 12.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-21.046875, -20.498779296875, -19.95068359375, -19.402587890625, -18.8544921875, -18.306396484375, -17.75830078125, -17.210205078125, -16.662109375, -16.114013671875, -15.56591796875, -15.017822265625, -14.4697265625, -13.921630859375, -13.37353515625, -12.825439453125, -12.27734375, -11.729248046875, -11.18115234375, -10.633056640625, -10.0849609375, -9.536865234375, -8.98876953125, -8.440673828125, -7.892578125, -7.344482421875, -6.79638671875, -6.248291015625, -5.7001953125, -5.152099609375, -4.60400390625, -4.055908203125, -3.5078125, -2.959716796875, -2.41162109375, -1.863525390625, -1.3154296875, -0.767333984375, -0.21923828125, 0.328857421875, 0.876953125, 1.425048828125, 1.97314453125, 2.521240234375, 3.0693359375, 3.617431640625, 4.16552734375, 4.713623046875, 5.26171875, 5.809814453125, 6.35791015625, 6.906005859375, 7.4541015625, 8.002197265625, 8.55029296875, 9.098388671875, 9.646484375, 10.194580078125, 10.74267578125, 11.290771484375, 11.8388671875, 12.386962890625, 12.93505859375, 13.483154296875, 14.03125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 7.0, 5.0, 6.0, 14.0, 2.0, 14.0, 13.0, 20.0, 21.0, 28.0, 30.0, 34.0, 55.0, 61.0, 44.0, 63.0, 51.0, 65.0, 66.0, 57.0, 64.0, 38.0, 54.0, 40.0, 34.0, 26.0, 23.0, 17.0, 13.0, 10.0, 10.0, 6.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-14.8125, -14.35595703125, -13.8994140625, -13.44287109375, -12.986328125, -12.52978515625, -12.0732421875, -11.61669921875, -11.16015625, -10.70361328125, -10.2470703125, -9.79052734375, -9.333984375, -8.87744140625, -8.4208984375, -7.96435546875, -7.5078125, -7.05126953125, -6.5947265625, -6.13818359375, -5.681640625, -5.22509765625, -4.7685546875, -4.31201171875, -3.85546875, -3.39892578125, -2.9423828125, -2.48583984375, -2.029296875, -1.57275390625, -1.1162109375, -0.65966796875, -0.203125, 0.25341796875, 0.7099609375, 1.16650390625, 1.623046875, 2.07958984375, 2.5361328125, 2.99267578125, 3.44921875, 3.90576171875, 4.3623046875, 4.81884765625, 5.275390625, 5.73193359375, 6.1884765625, 6.64501953125, 7.1015625, 7.55810546875, 8.0146484375, 8.47119140625, 8.927734375, 9.38427734375, 9.8408203125, 10.29736328125, 10.75390625, 11.21044921875, 11.6669921875, 12.12353515625, 12.580078125, 13.03662109375, 13.4931640625, 13.94970703125, 14.40625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 5.0, 7.0, 7.0, 11.0, 19.0, 27.0, 45.0, 58.0, 96.0, 160.0, 307.0, 585.0, 1312.0, 3613.0, 11332.0, 51965.0, 308619.0, 535187.0, 106050.0, 19958.0, 5554.0, 1904.0, 795.0, 369.0, 200.0, 114.0, 62.0, 44.0, 33.0, 28.0, 17.0, 11.0, 6.0, 9.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.328125, -6.12530517578125, -5.9224853515625, -5.71966552734375, -5.516845703125, -5.31402587890625, -5.1112060546875, -4.90838623046875, -4.70556640625, -4.50274658203125, -4.2999267578125, -4.09710693359375, -3.894287109375, -3.69146728515625, -3.4886474609375, -3.28582763671875, -3.0830078125, -2.88018798828125, -2.6773681640625, -2.47454833984375, -2.271728515625, -2.06890869140625, -1.8660888671875, -1.66326904296875, -1.46044921875, -1.25762939453125, -1.0548095703125, -0.85198974609375, -0.649169921875, -0.44635009765625, -0.2435302734375, -0.04071044921875, 0.162109375, 0.36492919921875, 0.5677490234375, 0.77056884765625, 0.973388671875, 1.17620849609375, 1.3790283203125, 1.58184814453125, 1.78466796875, 1.98748779296875, 2.1903076171875, 2.39312744140625, 2.595947265625, 2.79876708984375, 3.0015869140625, 3.20440673828125, 3.4072265625, 3.61004638671875, 3.8128662109375, 4.01568603515625, 4.218505859375, 4.42132568359375, 4.6241455078125, 4.82696533203125, 5.02978515625, 5.23260498046875, 5.4354248046875, 5.63824462890625, 5.841064453125, 6.04388427734375, 6.2467041015625, 6.44952392578125, 6.65234375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 9.0, 7.0, 16.0, 8.0, 21.0, 27.0, 25.0, 44.0, 56.0, 81.0, 103.0, 105.0, 114.0, 88.0, 83.0, 50.0, 35.0, 44.0, 24.0, 14.0, 11.0, 8.0, 6.0, 6.0, 7.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008168220520019531, -0.0007840916514396667, -0.0007513612508773804, -0.000718630850315094, -0.0006859004497528076, -0.0006531700491905212, -0.0006204396486282349, -0.0005877092480659485, -0.0005549788475036621, -0.0005222484469413757, -0.0004895180463790894, -0.000456787645816803, -0.0004240572452545166, -0.0003913268446922302, -0.00035859644412994385, -0.00032586604356765747, -0.0002931356430053711, -0.0002604052424430847, -0.00022767484188079834, -0.00019494444131851196, -0.00016221404075622559, -0.0001294836401939392, -9.675323963165283e-05, -6.402283906936646e-05, -3.129243850708008e-05, 1.4379620552062988e-06, 3.4168362617492676e-05, 6.689876317977905e-05, 9.962916374206543e-05, 0.0001323595643043518, 0.00016508996486663818, 0.00019782036542892456, 0.00023055076599121094, 0.0002632811665534973, 0.0002960115671157837, 0.00032874196767807007, 0.00036147236824035645, 0.0003942027688026428, 0.0004269331693649292, 0.0004596635699272156, 0.000492393970489502, 0.0005251243710517883, 0.0005578547716140747, 0.0005905851721763611, 0.0006233155727386475, 0.0006560459733009338, 0.0006887763738632202, 0.0007215067744255066, 0.000754237174987793, 0.0007869675755500793, 0.0008196979761123657, 0.0008524283766746521, 0.0008851587772369385, 0.0009178891777992249, 0.0009506195783615112, 0.0009833499789237976, 0.001016080379486084, 0.0010488107800483704, 0.0010815411806106567, 0.0011142715811729431, 0.0011470019817352295, 0.0011797323822975159, 0.0012124627828598022, 0.0012451931834220886, 0.001277923583984375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 1.0, 2.0, 5.0, 3.0, 2.0, 10.0, 18.0, 18.0, 15.0, 28.0, 45.0, 63.0, 85.0, 133.0, 227.0, 384.0, 725.0, 1567.0, 4054.0, 15410.0, 118794.0, 679554.0, 195867.0, 22470.0, 5111.0, 1970.0, 840.0, 469.0, 244.0, 149.0, 91.0, 53.0, 44.0, 26.0, 19.0, 15.0, 10.0, 7.0, 6.0, 6.0, 4.0, 5.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.296875, -7.0504150390625, -6.803955078125, -6.5574951171875, -6.31103515625, -6.0645751953125, -5.818115234375, -5.5716552734375, -5.3251953125, -5.0787353515625, -4.832275390625, -4.5858154296875, -4.33935546875, -4.0928955078125, -3.846435546875, -3.5999755859375, -3.353515625, -3.1070556640625, -2.860595703125, -2.6141357421875, -2.36767578125, -2.1212158203125, -1.874755859375, -1.6282958984375, -1.3818359375, -1.1353759765625, -0.888916015625, -0.6424560546875, -0.39599609375, -0.1495361328125, 0.096923828125, 0.3433837890625, 0.58984375, 0.8363037109375, 1.082763671875, 1.3292236328125, 1.57568359375, 1.8221435546875, 2.068603515625, 2.3150634765625, 2.5615234375, 2.8079833984375, 3.054443359375, 3.3009033203125, 3.54736328125, 3.7938232421875, 4.040283203125, 4.2867431640625, 4.533203125, 4.7796630859375, 5.026123046875, 5.2725830078125, 5.51904296875, 5.7655029296875, 6.011962890625, 6.2584228515625, 6.5048828125, 6.7513427734375, 6.997802734375, 7.2442626953125, 7.49072265625, 7.7371826171875, 7.983642578125, 8.2301025390625, 8.4765625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 6.0, 2.0, 6.0, 7.0, 5.0, 11.0, 13.0, 14.0, 21.0, 18.0, 21.0, 40.0, 39.0, 46.0, 49.0, 60.0, 86.0, 87.0, 70.0, 73.0, 61.0, 47.0, 47.0, 32.0, 21.0, 27.0, 18.0, 13.0, 9.0, 10.0, 4.0, 7.0, 8.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5078125, -4.3603515625, -4.212890625, -4.0654296875, -3.91796875, -3.7705078125, -3.623046875, -3.4755859375, -3.328125, -3.1806640625, -3.033203125, -2.8857421875, -2.73828125, -2.5908203125, -2.443359375, -2.2958984375, -2.1484375, -2.0009765625, -1.853515625, -1.7060546875, -1.55859375, -1.4111328125, -1.263671875, -1.1162109375, -0.96875, -0.8212890625, -0.673828125, -0.5263671875, -0.37890625, -0.2314453125, -0.083984375, 0.0634765625, 0.2109375, 0.3583984375, 0.505859375, 0.6533203125, 0.80078125, 0.9482421875, 1.095703125, 1.2431640625, 1.390625, 1.5380859375, 1.685546875, 1.8330078125, 1.98046875, 2.1279296875, 2.275390625, 2.4228515625, 2.5703125, 2.7177734375, 2.865234375, 3.0126953125, 3.16015625, 3.3076171875, 3.455078125, 3.6025390625, 3.75, 3.8974609375, 4.044921875, 4.1923828125, 4.33984375, 4.4873046875, 4.634765625, 4.7822265625, 4.9296875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 7.0, 34.0, 106.0, 266.0, 348.0, 183.0, 42.0, 14.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-266.1736145019531, -260.1497802734375, -254.1259307861328, -248.10208129882812, -242.0782470703125, -236.0543975830078, -230.03054809570312, -224.0067138671875, -217.98287963867188, -211.9590301513672, -205.93519592285156, -199.91134643554688, -193.88751220703125, -187.86366271972656, -181.83981323242188, -175.81597900390625, -169.79212951660156, -163.76828002929688, -157.74444580078125, -151.72059631347656, -145.69676208496094, -139.67291259765625, -133.64907836914062, -127.62522888183594, -121.60138702392578, -115.57754516601562, -109.55370330810547, -103.52986145019531, -97.50601196289062, -91.482177734375, -85.45832824707031, -79.43448638916016, -73.41062927246094, -67.38678741455078, -61.362945556640625, -55.3390998840332, -49.31525802612305, -43.29141616821289, -37.26757049560547, -31.243728637695312, -25.219886779785156, -19.196044921875, -13.172201156616211, -7.148357391357422, -1.1245155334472656, 4.899326324462891, 10.923171997070312, 16.94701385498047, 22.970855712890625, 28.99469757080078, 35.01853942871094, 41.04238510131836, 47.066226959228516, 53.09006881713867, 59.113914489746094, 65.13775634765625, 71.1615982055664, 77.18544006347656, 83.20928192138672, 89.23312377929688, 95.25697326660156, 101.28080749511719, 107.30465698242188, 113.32849884033203, 119.35234069824219]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 6.0, 6.0, 6.0, 9.0, 14.0, 20.0, 25.0, 20.0, 28.0, 37.0, 52.0, 54.0, 37.0, 52.0, 58.0, 54.0, 53.0, 52.0, 65.0, 47.0, 43.0, 44.0, 29.0, 29.0, 22.0, 27.0, 18.0, 18.0, 17.0, 12.0, 10.0, 7.0, 11.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.80964279174805, -48.81037902832031, -46.81111526489258, -44.811851501464844, -42.812591552734375, -40.81332778930664, -38.814064025878906, -36.81480026245117, -34.81553649902344, -32.8162727355957, -30.8170108795166, -28.817747116088867, -26.818485260009766, -24.81922149658203, -22.819957733154297, -20.820693969726562, -18.821434020996094, -16.82217025756836, -14.822908401489258, -12.823644638061523, -10.824381828308105, -8.825119018554688, -6.825855255126953, -4.826592445373535, -2.827329635620117, -0.8280665874481201, 1.171196460723877, 3.170459747314453, 5.169722557067871, 7.168985366821289, 9.168249130249023, 11.167511940002441, 13.166778564453125, 15.166041374206543, 17.16530418395996, 19.164567947387695, 21.163829803466797, 23.16309356689453, 25.162357330322266, 27.16162109375, 29.1608829498291, 31.160146713256836, 33.15940856933594, 35.15867233276367, 37.157936096191406, 39.157196044921875, 41.156463623046875, 43.155723571777344, 45.15498733520508, 47.15425109863281, 49.15351486206055, 51.15277862548828, 53.15203857421875, 55.151302337646484, 57.15056610107422, 59.14982986450195, 61.14909362792969, 63.14835739135742, 65.14762115478516, 67.14688110351562, 69.14614868164062, 71.1454086303711, 73.14466857910156, 75.14393615722656, 77.14319610595703]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 8.0, 5.0, 15.0, 12.0, 12.0, 23.0, 37.0, 38.0, 40.0, 66.0, 89.0, 134.0, 210.0, 295.0, 441.0, 703.0, 1155.0, 2104.0, 3778.0, 8412.0, 21273.0, 78316.0, 3743943.0, 265958.0, 40537.0, 13377.0, 5930.0, 2925.0, 1644.0, 1025.0, 556.0, 385.0, 244.0, 178.0, 100.0, 84.0, 61.0, 49.0, 29.0, 22.0, 19.0, 8.0, 12.0, 9.0, 5.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-8.1640625, -7.92236328125, -7.6806640625, -7.43896484375, -7.197265625, -6.95556640625, -6.7138671875, -6.47216796875, -6.23046875, -5.98876953125, -5.7470703125, -5.50537109375, -5.263671875, -5.02197265625, -4.7802734375, -4.53857421875, -4.296875, -4.05517578125, -3.8134765625, -3.57177734375, -3.330078125, -3.08837890625, -2.8466796875, -2.60498046875, -2.36328125, -2.12158203125, -1.8798828125, -1.63818359375, -1.396484375, -1.15478515625, -0.9130859375, -0.67138671875, -0.4296875, -0.18798828125, 0.0537109375, 0.29541015625, 0.537109375, 0.77880859375, 1.0205078125, 1.26220703125, 1.50390625, 1.74560546875, 1.9873046875, 2.22900390625, 2.470703125, 2.71240234375, 2.9541015625, 3.19580078125, 3.4375, 3.67919921875, 3.9208984375, 4.16259765625, 4.404296875, 4.64599609375, 4.8876953125, 5.12939453125, 5.37109375, 5.61279296875, 5.8544921875, 6.09619140625, 6.337890625, 6.57958984375, 6.8212890625, 7.06298828125, 7.3046875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 2.0, 5.0, 14.0, 10.0, 26.0, 23.0, 27.0, 35.0, 46.0, 63.0, 67.0, 77.0, 77.0, 66.0, 87.0, 59.0, 53.0, 61.0, 42.0, 32.0, 39.0, 17.0, 17.0, 13.0, 9.0, 9.0, 6.0, 8.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.498046875, -2.395965576171875, -2.29388427734375, -2.191802978515625, -2.0897216796875, -1.987640380859375, -1.88555908203125, -1.783477783203125, -1.681396484375, -1.579315185546875, -1.47723388671875, -1.375152587890625, -1.2730712890625, -1.170989990234375, -1.06890869140625, -0.966827392578125, -0.86474609375, -0.762664794921875, -0.66058349609375, -0.558502197265625, -0.4564208984375, -0.354339599609375, -0.25225830078125, -0.150177001953125, -0.048095703125, 0.053985595703125, 0.15606689453125, 0.258148193359375, 0.3602294921875, 0.462310791015625, 0.56439208984375, 0.666473388671875, 0.7685546875, 0.870635986328125, 0.97271728515625, 1.074798583984375, 1.1768798828125, 1.278961181640625, 1.38104248046875, 1.483123779296875, 1.585205078125, 1.687286376953125, 1.78936767578125, 1.891448974609375, 1.9935302734375, 2.095611572265625, 2.19769287109375, 2.299774169921875, 2.40185546875, 2.503936767578125, 2.60601806640625, 2.708099365234375, 2.8101806640625, 2.912261962890625, 3.01434326171875, 3.116424560546875, 3.218505859375, 3.320587158203125, 3.42266845703125, 3.524749755859375, 3.6268310546875, 3.728912353515625, 3.83099365234375, 3.933074951171875, 4.03515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 9.0, 9.0, 16.0, 23.0, 25.0, 39.0, 62.0, 73.0, 112.0, 144.0, 226.0, 299.0, 420.0, 661.0, 995.0, 1949.0, 3689.0, 8599.0, 24893.0, 106912.0, 3641728.0, 329212.0, 47837.0, 13948.0, 5440.0, 2599.0, 1523.0, 961.0, 572.0, 369.0, 255.0, 192.0, 147.0, 92.0, 73.0, 58.0, 43.0, 22.0, 15.0, 12.0, 13.0, 5.0, 6.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.859375, -6.6287841796875, -6.398193359375, -6.1676025390625, -5.93701171875, -5.7064208984375, -5.475830078125, -5.2452392578125, -5.0146484375, -4.7840576171875, -4.553466796875, -4.3228759765625, -4.09228515625, -3.8616943359375, -3.631103515625, -3.4005126953125, -3.169921875, -2.9393310546875, -2.708740234375, -2.4781494140625, -2.24755859375, -2.0169677734375, -1.786376953125, -1.5557861328125, -1.3251953125, -1.0946044921875, -0.864013671875, -0.6334228515625, -0.40283203125, -0.1722412109375, 0.058349609375, 0.2889404296875, 0.51953125, 0.7501220703125, 0.980712890625, 1.2113037109375, 1.44189453125, 1.6724853515625, 1.903076171875, 2.1336669921875, 2.3642578125, 2.5948486328125, 2.825439453125, 3.0560302734375, 3.28662109375, 3.5172119140625, 3.747802734375, 3.9783935546875, 4.208984375, 4.4395751953125, 4.670166015625, 4.9007568359375, 5.13134765625, 5.3619384765625, 5.592529296875, 5.8231201171875, 6.0537109375, 6.2843017578125, 6.514892578125, 6.7454833984375, 6.97607421875, 7.2066650390625, 7.437255859375, 7.6678466796875, 7.8984375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 12.0, 14.0, 15.0, 19.0, 37.0, 61.0, 114.0, 240.0, 2737.0, 449.0, 152.0, 75.0, 46.0, 29.0, 18.0, 17.0, 7.0, 3.0, 8.0, 5.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.265625, -1.212249755859375, -1.15887451171875, -1.105499267578125, -1.0521240234375, -0.998748779296875, -0.94537353515625, -0.891998291015625, -0.838623046875, -0.785247802734375, -0.73187255859375, -0.678497314453125, -0.6251220703125, -0.571746826171875, -0.51837158203125, -0.464996337890625, -0.41162109375, -0.358245849609375, -0.30487060546875, -0.251495361328125, -0.1981201171875, -0.144744873046875, -0.09136962890625, -0.037994384765625, 0.015380859375, 0.068756103515625, 0.12213134765625, 0.175506591796875, 0.2288818359375, 0.282257080078125, 0.33563232421875, 0.389007568359375, 0.4423828125, 0.495758056640625, 0.54913330078125, 0.602508544921875, 0.6558837890625, 0.709259033203125, 0.76263427734375, 0.816009521484375, 0.869384765625, 0.922760009765625, 0.97613525390625, 1.029510498046875, 1.0828857421875, 1.136260986328125, 1.18963623046875, 1.243011474609375, 1.29638671875, 1.349761962890625, 1.40313720703125, 1.456512451171875, 1.5098876953125, 1.563262939453125, 1.61663818359375, 1.670013427734375, 1.723388671875, 1.776763916015625, 1.83013916015625, 1.883514404296875, 1.9368896484375, 1.990264892578125, 2.04364013671875, 2.097015380859375, 2.150390625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 16.0, 54.0, 79.0, 139.0, 198.0, 184.0, 150.0, 86.0, 45.0, 23.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.221804141998291, -3.8127622604370117, -3.4037203788757324, -2.994678497314453, -2.585636615753174, -2.1765944957733154, -1.7675526142120361, -1.3585107326507568, -0.9494688510894775, -0.5404269695281982, -0.13138502836227417, 0.2776569128036499, 0.6866987943649292, 1.095740795135498, 1.5047826766967773, 1.9138245582580566, 2.322866439819336, 2.7319083213806152, 3.1409502029418945, 3.549992084503174, 3.959033966064453, 4.368076324462891, 4.777117729187012, 5.186160087585449, 5.59520149230957, 6.00424337387085, 6.413285255432129, 6.822327136993408, 7.2313690185546875, 7.640411376953125, 8.049452781677246, 8.458495140075684, 8.867537498474121, 9.276579856872559, 9.68562126159668, 10.094663619995117, 10.503705024719238, 10.912747383117676, 11.321788787841797, 11.730831146240234, 12.139872550964355, 12.548914909362793, 12.957956314086914, 13.366998672485352, 13.776040077209473, 14.18508243560791, 14.594123840332031, 15.003166198730469, 15.412208557128906, 15.821250915527344, 16.23029327392578, 16.639333724975586, 17.048376083374023, 17.45741844177246, 17.8664608001709, 18.275501251220703, 18.68454360961914, 19.093585968017578, 19.502628326416016, 19.91166877746582, 20.320711135864258, 20.729753494262695, 21.138795852661133, 21.547836303710938, 21.956878662109375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 7.0, 10.0, 12.0, 25.0, 16.0, 31.0, 26.0, 21.0, 23.0, 22.0, 29.0, 40.0, 42.0, 39.0, 38.0, 41.0, 34.0, 35.0, 43.0, 38.0, 31.0, 39.0, 38.0, 37.0, 31.0, 29.0, 28.0, 36.0, 34.0, 26.0, 25.0, 10.0, 11.0, 11.0, 7.0, 9.0, 5.0, 5.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.856049537658691, -4.719592094421387, -4.583134174346924, -4.446676731109619, -4.3102192878723145, -4.173761367797852, -4.037303924560547, -3.900846242904663, -3.7643885612487793, -3.6279308795928955, -3.491473436355591, -3.355015754699707, -3.2185580730438232, -3.0821003913879395, -2.9456429481506348, -2.809185266494751, -2.6727278232574463, -2.5362701416015625, -2.399812698364258, -2.263355016708374, -2.1268973350524902, -1.990439772605896, -1.8539822101593018, -1.717524528503418, -1.5810669660568237, -1.4446094036102295, -1.3081517219543457, -1.1716941595077515, -1.0352365970611572, -0.8987789154052734, -0.7623213529586792, -0.6258637309074402, -0.48940587043762207, -0.35294824838638306, -0.21649065613746643, -0.0800330638885498, 0.05642455816268921, 0.19288218021392822, 0.32933974266052246, 0.4657973647117615, 0.6022549867630005, 0.7387126088142395, 0.8751702308654785, 1.0116277933120728, 1.148085355758667, 1.2845430374145508, 1.421000599861145, 1.5574581623077393, 1.693915843963623, 1.8303734064102173, 1.966831088066101, 2.1032886505126953, 2.239746332168579, 2.376204013824463, 2.5126614570617676, 2.6491191387176514, 2.785576820373535, 2.922034502029419, 3.0584919452667236, 3.1949496269226074, 3.331407308578491, 3.467864990234375, 3.6043224334716797, 3.7407801151275635, 3.877237558364868]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 11.0, 16.0, 13.0, 38.0, 51.0, 86.0, 188.0, 389.0, 890.0, 2761.0, 11776.0, 61483.0, 292730.0, 478515.0, 160448.0, 30004.0, 6201.0, 1765.0, 583.0, 272.0, 136.0, 67.0, 44.0, 34.0, 23.0, 12.0, 10.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.98046875, -6.66729736328125, -6.3541259765625, -6.04095458984375, -5.727783203125, -5.41461181640625, -5.1014404296875, -4.78826904296875, -4.47509765625, -4.16192626953125, -3.8487548828125, -3.53558349609375, -3.222412109375, -2.90924072265625, -2.5960693359375, -2.28289794921875, -1.9697265625, -1.65655517578125, -1.3433837890625, -1.03021240234375, -0.717041015625, -0.40386962890625, -0.0906982421875, 0.22247314453125, 0.53564453125, 0.84881591796875, 1.1619873046875, 1.47515869140625, 1.788330078125, 2.10150146484375, 2.4146728515625, 2.72784423828125, 3.041015625, 3.35418701171875, 3.6673583984375, 3.98052978515625, 4.293701171875, 4.60687255859375, 4.9200439453125, 5.23321533203125, 5.54638671875, 5.85955810546875, 6.1727294921875, 6.48590087890625, 6.799072265625, 7.11224365234375, 7.4254150390625, 7.73858642578125, 8.0517578125, 8.36492919921875, 8.6781005859375, 8.99127197265625, 9.304443359375, 9.61761474609375, 9.9307861328125, 10.24395751953125, 10.55712890625, 10.87030029296875, 11.1834716796875, 11.49664306640625, 11.809814453125, 12.12298583984375, 12.4361572265625, 12.74932861328125, 13.0625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 5.0, 9.0, 6.0, 15.0, 18.0, 16.0, 30.0, 30.0, 42.0, 57.0, 69.0, 67.0, 76.0, 90.0, 74.0, 64.0, 55.0, 64.0, 50.0, 32.0, 32.0, 20.0, 20.0, 17.0, 16.0, 10.0, 6.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46875, -2.36083984375, -2.2529296875, -2.14501953125, -2.037109375, -1.92919921875, -1.8212890625, -1.71337890625, -1.60546875, -1.49755859375, -1.3896484375, -1.28173828125, -1.173828125, -1.06591796875, -0.9580078125, -0.85009765625, -0.7421875, -0.63427734375, -0.5263671875, -0.41845703125, -0.310546875, -0.20263671875, -0.0947265625, 0.01318359375, 0.12109375, 0.22900390625, 0.3369140625, 0.44482421875, 0.552734375, 0.66064453125, 0.7685546875, 0.87646484375, 0.984375, 1.09228515625, 1.2001953125, 1.30810546875, 1.416015625, 1.52392578125, 1.6318359375, 1.73974609375, 1.84765625, 1.95556640625, 2.0634765625, 2.17138671875, 2.279296875, 2.38720703125, 2.4951171875, 2.60302734375, 2.7109375, 2.81884765625, 2.9267578125, 3.03466796875, 3.142578125, 3.25048828125, 3.3583984375, 3.46630859375, 3.57421875, 3.68212890625, 3.7900390625, 3.89794921875, 4.005859375, 4.11376953125, 4.2216796875, 4.32958984375, 4.4375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 8.0, 6.0, 5.0, 15.0, 8.0, 13.0, 29.0, 24.0, 49.0, 68.0, 101.0, 156.0, 221.0, 418.0, 660.0, 1042.0, 2335.0, 10462.0, 167696.0, 782874.0, 71814.0, 6399.0, 1793.0, 839.0, 541.0, 320.0, 199.0, 134.0, 88.0, 52.0, 52.0, 39.0, 22.0, 16.0, 17.0, 10.0, 11.0, 5.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.4375, -17.830322265625, -17.22314453125, -16.615966796875, -16.0087890625, -15.401611328125, -14.79443359375, -14.187255859375, -13.580078125, -12.972900390625, -12.36572265625, -11.758544921875, -11.1513671875, -10.544189453125, -9.93701171875, -9.329833984375, -8.72265625, -8.115478515625, -7.50830078125, -6.901123046875, -6.2939453125, -5.686767578125, -5.07958984375, -4.472412109375, -3.865234375, -3.258056640625, -2.65087890625, -2.043701171875, -1.4365234375, -0.829345703125, -0.22216796875, 0.385009765625, 0.9921875, 1.599365234375, 2.20654296875, 2.813720703125, 3.4208984375, 4.028076171875, 4.63525390625, 5.242431640625, 5.849609375, 6.456787109375, 7.06396484375, 7.671142578125, 8.2783203125, 8.885498046875, 9.49267578125, 10.099853515625, 10.70703125, 11.314208984375, 11.92138671875, 12.528564453125, 13.1357421875, 13.742919921875, 14.35009765625, 14.957275390625, 15.564453125, 16.171630859375, 16.77880859375, 17.385986328125, 17.9931640625, 18.600341796875, 19.20751953125, 19.814697265625, 20.421875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 5.0, 2.0, 9.0, 10.0, 9.0, 18.0, 28.0, 22.0, 42.0, 54.0, 73.0, 74.0, 56.0, 72.0, 85.0, 64.0, 70.0, 63.0, 55.0, 37.0, 39.0, 29.0, 19.0, 10.0, 13.0, 10.0, 6.0, 3.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.75, -21.029052734375, -20.30810546875, -19.587158203125, -18.8662109375, -18.145263671875, -17.42431640625, -16.703369140625, -15.982421875, -15.261474609375, -14.54052734375, -13.819580078125, -13.0986328125, -12.377685546875, -11.65673828125, -10.935791015625, -10.21484375, -9.493896484375, -8.77294921875, -8.052001953125, -7.3310546875, -6.610107421875, -5.88916015625, -5.168212890625, -4.447265625, -3.726318359375, -3.00537109375, -2.284423828125, -1.5634765625, -0.842529296875, -0.12158203125, 0.599365234375, 1.3203125, 2.041259765625, 2.76220703125, 3.483154296875, 4.2041015625, 4.925048828125, 5.64599609375, 6.366943359375, 7.087890625, 7.808837890625, 8.52978515625, 9.250732421875, 9.9716796875, 10.692626953125, 11.41357421875, 12.134521484375, 12.85546875, 13.576416015625, 14.29736328125, 15.018310546875, 15.7392578125, 16.460205078125, 17.18115234375, 17.902099609375, 18.623046875, 19.343994140625, 20.06494140625, 20.785888671875, 21.5068359375, 22.227783203125, 22.94873046875, 23.669677734375, 24.390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 2.0, 7.0, 11.0, 11.0, 17.0, 15.0, 32.0, 40.0, 96.0, 152.0, 375.0, 1451.0, 9562.0, 211964.0, 785380.0, 35087.0, 3126.0, 664.0, 239.0, 124.0, 66.0, 36.0, 24.0, 16.0, 17.0, 14.0, 6.0, 4.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-13.0859375, -12.714599609375, -12.34326171875, -11.971923828125, -11.6005859375, -11.229248046875, -10.85791015625, -10.486572265625, -10.115234375, -9.743896484375, -9.37255859375, -9.001220703125, -8.6298828125, -8.258544921875, -7.88720703125, -7.515869140625, -7.14453125, -6.773193359375, -6.40185546875, -6.030517578125, -5.6591796875, -5.287841796875, -4.91650390625, -4.545166015625, -4.173828125, -3.802490234375, -3.43115234375, -3.059814453125, -2.6884765625, -2.317138671875, -1.94580078125, -1.574462890625, -1.203125, -0.831787109375, -0.46044921875, -0.089111328125, 0.2822265625, 0.653564453125, 1.02490234375, 1.396240234375, 1.767578125, 2.138916015625, 2.51025390625, 2.881591796875, 3.2529296875, 3.624267578125, 3.99560546875, 4.366943359375, 4.73828125, 5.109619140625, 5.48095703125, 5.852294921875, 6.2236328125, 6.594970703125, 6.96630859375, 7.337646484375, 7.708984375, 8.080322265625, 8.45166015625, 8.822998046875, 9.1943359375, 9.565673828125, 9.93701171875, 10.308349609375, 10.6796875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 4.0, 7.0, 15.0, 10.0, 22.0, 25.0, 44.0, 36.0, 58.0, 60.0, 86.0, 76.0, 82.0, 88.0, 80.0, 62.0, 62.0, 28.0, 35.0, 25.0, 25.0, 15.0, 10.0, 11.0, 7.0, 12.0, 5.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009517669677734375, -0.0009243413805961609, -0.0008969157934188843, -0.0008694902062416077, -0.0008420646190643311, -0.0008146390318870544, -0.0007872134447097778, -0.0007597878575325012, -0.0007323622703552246, -0.000704936683177948, -0.0006775110960006714, -0.0006500855088233948, -0.0006226599216461182, -0.0005952343344688416, -0.0005678087472915649, -0.0005403831601142883, -0.0005129575729370117, -0.0004855319857597351, -0.0004581063985824585, -0.0004306808114051819, -0.0004032552242279053, -0.00037582963705062866, -0.00034840404987335205, -0.00032097846269607544, -0.00029355287551879883, -0.0002661272883415222, -0.0002387017011642456, -0.000211276113986969, -0.00018385052680969238, -0.00015642493963241577, -0.00012899935245513916, -0.00010157376527786255, -7.414817810058594e-05, -4.6722590923309326e-05, -1.9297003746032715e-05, 8.128583431243896e-06, 3.555417060852051e-05, 6.297975778579712e-05, 9.040534496307373e-05, 0.00011783093214035034, 0.00014525651931762695, 0.00017268210649490356, 0.00020010769367218018, 0.0002275332808494568, 0.0002549588680267334, 0.00028238445520401, 0.0003098100423812866, 0.00033723562955856323, 0.00036466121673583984, 0.00039208680391311646, 0.00041951239109039307, 0.0004469379782676697, 0.0004743635654449463, 0.0005017891526222229, 0.0005292147397994995, 0.0005566403269767761, 0.0005840659141540527, 0.0006114915013313293, 0.000638917088508606, 0.0006663426756858826, 0.0006937682628631592, 0.0007211938500404358, 0.0007486194372177124, 0.000776045024394989, 0.0008034706115722656]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 6.0, 10.0, 7.0, 7.0, 12.0, 14.0, 27.0, 34.0, 48.0, 75.0, 124.0, 260.0, 547.0, 1445.0, 4638.0, 37622.0, 828760.0, 162177.0, 8911.0, 2157.0, 796.0, 377.0, 172.0, 112.0, 45.0, 39.0, 25.0, 22.0, 13.0, 18.0, 6.0, 4.0, 8.0, 10.0, 2.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0], "bins": [-10.7421875, -10.4033203125, -10.064453125, -9.7255859375, -9.38671875, -9.0478515625, -8.708984375, -8.3701171875, -8.03125, -7.6923828125, -7.353515625, -7.0146484375, -6.67578125, -6.3369140625, -5.998046875, -5.6591796875, -5.3203125, -4.9814453125, -4.642578125, -4.3037109375, -3.96484375, -3.6259765625, -3.287109375, -2.9482421875, -2.609375, -2.2705078125, -1.931640625, -1.5927734375, -1.25390625, -0.9150390625, -0.576171875, -0.2373046875, 0.1015625, 0.4404296875, 0.779296875, 1.1181640625, 1.45703125, 1.7958984375, 2.134765625, 2.4736328125, 2.8125, 3.1513671875, 3.490234375, 3.8291015625, 4.16796875, 4.5068359375, 4.845703125, 5.1845703125, 5.5234375, 5.8623046875, 6.201171875, 6.5400390625, 6.87890625, 7.2177734375, 7.556640625, 7.8955078125, 8.234375, 8.5732421875, 8.912109375, 9.2509765625, 9.58984375, 9.9287109375, 10.267578125, 10.6064453125, 10.9453125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 6.0, 7.0, 11.0, 19.0, 18.0, 45.0, 65.0, 100.0, 121.0, 140.0, 134.0, 117.0, 68.0, 49.0, 24.0, 19.0, 22.0, 10.0, 5.0, 1.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4453125, -10.15380859375, -9.8623046875, -9.57080078125, -9.279296875, -8.98779296875, -8.6962890625, -8.40478515625, -8.11328125, -7.82177734375, -7.5302734375, -7.23876953125, -6.947265625, -6.65576171875, -6.3642578125, -6.07275390625, -5.78125, -5.48974609375, -5.1982421875, -4.90673828125, -4.615234375, -4.32373046875, -4.0322265625, -3.74072265625, -3.44921875, -3.15771484375, -2.8662109375, -2.57470703125, -2.283203125, -1.99169921875, -1.7001953125, -1.40869140625, -1.1171875, -0.82568359375, -0.5341796875, -0.24267578125, 0.048828125, 0.34033203125, 0.6318359375, 0.92333984375, 1.21484375, 1.50634765625, 1.7978515625, 2.08935546875, 2.380859375, 2.67236328125, 2.9638671875, 3.25537109375, 3.546875, 3.83837890625, 4.1298828125, 4.42138671875, 4.712890625, 5.00439453125, 5.2958984375, 5.58740234375, 5.87890625, 6.17041015625, 6.4619140625, 6.75341796875, 7.044921875, 7.33642578125, 7.6279296875, 7.91943359375, 8.2109375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 7.0, 20.0, 35.0, 88.0, 132.0, 196.0, 216.0, 160.0, 87.0, 41.0, 17.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.63985443115234, -110.54811096191406, -106.45635986328125, -102.36460876464844, -98.27286529541016, -94.18112182617188, -90.08937072753906, -85.99761962890625, -81.90587615966797, -77.81413269042969, -73.72238159179688, -69.63063049316406, -65.53888702392578, -61.447139739990234, -57.35539245605469, -53.26364517211914, -49.171897888183594, -45.08015060424805, -40.9884033203125, -36.89665603637695, -32.804908752441406, -28.71316146850586, -24.621414184570312, -20.529666900634766, -16.43791961669922, -12.346172332763672, -8.254425048828125, -4.162677764892578, -0.07093048095703125, 4.020816802978516, 8.112564086914062, 12.20431137084961, 16.296051025390625, 20.387798309326172, 24.47954559326172, 28.571292877197266, 32.66304016113281, 36.75478744506836, 40.846534729003906, 44.93828201293945, 49.030029296875, 53.12177658081055, 57.213523864746094, 61.30527114868164, 65.39701843261719, 69.48876953125, 73.58051300048828, 77.67225646972656, 81.76400756835938, 85.85575866699219, 89.94750213623047, 94.03924560546875, 98.13099670410156, 102.22274780273438, 106.31449127197266, 110.40623474121094, 114.49798583984375, 118.58973693847656, 122.68148040771484, 126.77322387695312, 130.86497497558594, 134.95672607421875, 139.0484619140625, 143.1402130126953, 147.23196411132812]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 13.0, 15.0, 32.0, 23.0, 34.0, 40.0, 57.0, 51.0, 52.0, 71.0, 79.0, 69.0, 65.0, 62.0, 50.0, 58.0, 49.0, 38.0, 26.0, 29.0, 22.0, 16.0, 13.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-120.97257232666016, -117.98080444335938, -114.9890365600586, -111.99726867675781, -109.00550842285156, -106.01374053955078, -103.02197265625, -100.03020477294922, -97.03843688964844, -94.04666900634766, -91.05490112304688, -88.06314086914062, -85.07137298583984, -82.07960510253906, -79.08783721923828, -76.0960693359375, -73.10430908203125, -70.11254119873047, -67.12077331542969, -64.12901306152344, -61.137245178222656, -58.145477294921875, -55.153709411621094, -52.16194152832031, -49.1701774597168, -46.178409576416016, -43.1866455078125, -40.19487762451172, -37.20310974121094, -34.21134567260742, -31.21957778930664, -28.227811813354492, -25.236053466796875, -22.244287490844727, -19.252521514892578, -16.260753631591797, -13.268987655639648, -10.2772216796875, -7.285453796386719, -4.29368782043457, -1.3019218444824219, 1.6898446083068848, 4.681611061096191, 7.673377990722656, 10.665143966674805, 13.656909942626953, 16.648677825927734, 19.640443801879883, 22.63220977783203, 25.62397575378418, 28.615741729736328, 31.60750961303711, 34.599273681640625, 37.591041564941406, 40.58280944824219, 43.57457733154297, 46.566341400146484, 49.558109283447266, 52.54987335205078, 55.54164123535156, 58.533409118652344, 61.52517318725586, 64.51693725585938, 67.50870513916016, 70.50047302246094]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0, 6.0, 5.0, 5.0, 9.0, 13.0, 23.0, 31.0, 29.0, 51.0, 69.0, 126.0, 163.0, 281.0, 431.0, 724.0, 1269.0, 2525.0, 5700.0, 15308.0, 53751.0, 744934.0, 3282825.0, 58117.0, 15981.0, 6018.0, 2616.0, 1361.0, 729.0, 395.0, 256.0, 171.0, 122.0, 79.0, 44.0, 31.0, 19.0, 8.0, 19.0, 11.0, 4.0, 5.0, 7.0, 1.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.1171875, -8.85687255859375, -8.5965576171875, -8.33624267578125, -8.075927734375, -7.81561279296875, -7.5552978515625, -7.29498291015625, -7.03466796875, -6.77435302734375, -6.5140380859375, -6.25372314453125, -5.993408203125, -5.73309326171875, -5.4727783203125, -5.21246337890625, -4.9521484375, -4.69183349609375, -4.4315185546875, -4.17120361328125, -3.910888671875, -3.65057373046875, -3.3902587890625, -3.12994384765625, -2.86962890625, -2.60931396484375, -2.3489990234375, -2.08868408203125, -1.828369140625, -1.56805419921875, -1.3077392578125, -1.04742431640625, -0.787109375, -0.52679443359375, -0.2664794921875, -0.00616455078125, 0.254150390625, 0.51446533203125, 0.7747802734375, 1.03509521484375, 1.29541015625, 1.55572509765625, 1.8160400390625, 2.07635498046875, 2.336669921875, 2.59698486328125, 2.8572998046875, 3.11761474609375, 3.3779296875, 3.63824462890625, 3.8985595703125, 4.15887451171875, 4.419189453125, 4.67950439453125, 4.9398193359375, 5.20013427734375, 5.46044921875, 5.72076416015625, 5.9810791015625, 6.24139404296875, 6.501708984375, 6.76202392578125, 7.0223388671875, 7.28265380859375, 7.54296875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 13.0, 4.0, 8.0, 9.0, 17.0, 26.0, 26.0, 36.0, 39.0, 57.0, 58.0, 77.0, 80.0, 66.0, 81.0, 67.0, 53.0, 56.0, 49.0, 37.0, 27.0, 30.0, 19.0, 25.0, 12.0, 5.0, 5.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.45703125, -3.3367919921875, -3.216552734375, -3.0963134765625, -2.97607421875, -2.8558349609375, -2.735595703125, -2.6153564453125, -2.4951171875, -2.3748779296875, -2.254638671875, -2.1343994140625, -2.01416015625, -1.8939208984375, -1.773681640625, -1.6534423828125, -1.533203125, -1.4129638671875, -1.292724609375, -1.1724853515625, -1.05224609375, -0.9320068359375, -0.811767578125, -0.6915283203125, -0.5712890625, -0.4510498046875, -0.330810546875, -0.2105712890625, -0.09033203125, 0.0299072265625, 0.150146484375, 0.2703857421875, 0.390625, 0.5108642578125, 0.631103515625, 0.7513427734375, 0.87158203125, 0.9918212890625, 1.112060546875, 1.2322998046875, 1.3525390625, 1.4727783203125, 1.593017578125, 1.7132568359375, 1.83349609375, 1.9537353515625, 2.073974609375, 2.1942138671875, 2.314453125, 2.4346923828125, 2.554931640625, 2.6751708984375, 2.79541015625, 2.9156494140625, 3.035888671875, 3.1561279296875, 3.2763671875, 3.3966064453125, 3.516845703125, 3.6370849609375, 3.75732421875, 3.8775634765625, 3.997802734375, 4.1180419921875, 4.23828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 3.0, 8.0, 2.0, 10.0, 8.0, 17.0, 14.0, 21.0, 31.0, 34.0, 61.0, 59.0, 80.0, 133.0, 174.0, 298.0, 413.0, 619.0, 1071.0, 1978.0, 3636.0, 7757.0, 19509.0, 65682.0, 576528.0, 3380439.0, 91802.0, 24590.0, 9458.0, 4314.0, 2143.0, 1172.0, 727.0, 458.0, 287.0, 206.0, 158.0, 99.0, 70.0, 56.0, 42.0, 32.0, 15.0, 12.0, 20.0, 9.0, 6.0, 9.0, 5.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.5078125, -7.2664794921875, -7.025146484375, -6.7838134765625, -6.54248046875, -6.3011474609375, -6.059814453125, -5.8184814453125, -5.5771484375, -5.3358154296875, -5.094482421875, -4.8531494140625, -4.61181640625, -4.3704833984375, -4.129150390625, -3.8878173828125, -3.646484375, -3.4051513671875, -3.163818359375, -2.9224853515625, -2.68115234375, -2.4398193359375, -2.198486328125, -1.9571533203125, -1.7158203125, -1.4744873046875, -1.233154296875, -0.9918212890625, -0.75048828125, -0.5091552734375, -0.267822265625, -0.0264892578125, 0.21484375, 0.4561767578125, 0.697509765625, 0.9388427734375, 1.18017578125, 1.4215087890625, 1.662841796875, 1.9041748046875, 2.1455078125, 2.3868408203125, 2.628173828125, 2.8695068359375, 3.11083984375, 3.3521728515625, 3.593505859375, 3.8348388671875, 4.076171875, 4.3175048828125, 4.558837890625, 4.8001708984375, 5.04150390625, 5.2828369140625, 5.524169921875, 5.7655029296875, 6.0068359375, 6.2481689453125, 6.489501953125, 6.7308349609375, 6.97216796875, 7.2135009765625, 7.454833984375, 7.6961669921875, 7.9375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 7.0, 8.0, 10.0, 19.0, 20.0, 20.0, 46.0, 101.0, 158.0, 709.0, 2492.0, 204.0, 94.0, 55.0, 38.0, 23.0, 20.0, 12.0, 9.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.279296875, -2.20355224609375, -2.1278076171875, -2.05206298828125, -1.976318359375, -1.90057373046875, -1.8248291015625, -1.74908447265625, -1.67333984375, -1.59759521484375, -1.5218505859375, -1.44610595703125, -1.370361328125, -1.29461669921875, -1.2188720703125, -1.14312744140625, -1.0673828125, -0.99163818359375, -0.9158935546875, -0.84014892578125, -0.764404296875, -0.68865966796875, -0.6129150390625, -0.53717041015625, -0.46142578125, -0.38568115234375, -0.3099365234375, -0.23419189453125, -0.158447265625, -0.08270263671875, -0.0069580078125, 0.06878662109375, 0.14453125, 0.22027587890625, 0.2960205078125, 0.37176513671875, 0.447509765625, 0.52325439453125, 0.5989990234375, 0.67474365234375, 0.75048828125, 0.82623291015625, 0.9019775390625, 0.97772216796875, 1.053466796875, 1.12921142578125, 1.2049560546875, 1.28070068359375, 1.3564453125, 1.43218994140625, 1.5079345703125, 1.58367919921875, 1.659423828125, 1.73516845703125, 1.8109130859375, 1.88665771484375, 1.96240234375, 2.03814697265625, 2.1138916015625, 2.18963623046875, 2.265380859375, 2.34112548828125, 2.4168701171875, 2.49261474609375, 2.568359375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 6.0, 21.0, 14.0, 29.0, 74.0, 92.0, 130.0, 149.0, 156.0, 119.0, 96.0, 47.0, 31.0, 20.0, 14.0, 8.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.972408294677734, -10.510202407836914, -10.047996520996094, -9.585790634155273, -9.12358570098877, -8.66137981414795, -8.199173927307129, -7.736968040466309, -7.2747626304626465, -6.812556743621826, -6.350351333618164, -5.888145446777344, -5.425939559936523, -4.963734149932861, -4.501528263092041, -4.039322853088379, -3.5771169662475586, -3.1149113178253174, -2.652705669403076, -2.190499782562256, -1.7282941341400146, -1.2660884857177734, -0.8038825988769531, -0.3416769504547119, 0.1205286979675293, 0.5827344059944153, 1.0449401140213013, 1.507145881652832, 1.9693515300750732, 2.4315571784973145, 2.8937630653381348, 3.355968713760376, 3.818174362182617, 4.2803802490234375, 4.7425856590271, 5.20479154586792, 5.666996955871582, 6.129202842712402, 6.591408729553223, 7.053614616394043, 7.515820026397705, 7.978025913238525, 8.440231323242188, 8.902437210083008, 9.364643096923828, 9.826848983764648, 10.289054870605469, 10.751259803771973, 11.213465690612793, 11.675671577453613, 12.137877464294434, 12.600082397460938, 13.062288284301758, 13.524494171142578, 13.986700057983398, 14.448905944824219, 14.911111831665039, 15.37331771850586, 15.83552360534668, 16.2977294921875, 16.75993537902832, 17.22214126586914, 17.684345245361328, 18.14655113220215, 18.60875701904297]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 6.0, 10.0, 10.0, 10.0, 12.0, 12.0, 14.0, 14.0, 23.0, 28.0, 26.0, 32.0, 37.0, 42.0, 41.0, 51.0, 45.0, 42.0, 45.0, 57.0, 44.0, 46.0, 45.0, 47.0, 39.0, 36.0, 23.0, 27.0, 21.0, 20.0, 24.0, 13.0, 10.0, 10.0, 6.0, 6.0, 15.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-7.272090911865234, -7.08128547668457, -6.8904805183410645, -6.6996750831604, -6.5088701248168945, -6.3180646896362305, -6.127259254455566, -5.9364542961120605, -5.745649337768555, -5.554843902587891, -5.364038944244385, -5.173233509063721, -4.982428550720215, -4.791623115539551, -4.600817680358887, -4.410012722015381, -4.219207286834717, -4.028401851654053, -3.837596893310547, -3.646791458129883, -3.455986499786377, -3.265181064605713, -3.074375867843628, -2.883570671081543, -2.692765474319458, -2.501960277557373, -2.311155080795288, -2.120349884033203, -1.9295445680618286, -1.7387393712997437, -1.5479340553283691, -1.3571288585662842, -1.1663236618041992, -0.9755184650421143, -0.7847132086753845, -0.5939079523086548, -0.4031027555465698, -0.21229755878448486, -0.02149224281311035, 0.1693129539489746, 0.36011815071105957, 0.5509233474731445, 0.7417286038398743, 0.932533860206604, 1.123339056968689, 1.314144253730774, 1.5049495697021484, 1.6957547664642334, 1.8865599632263184, 2.0773651599884033, 2.2681703567504883, 2.4589757919311523, 2.649780750274658, 2.8405861854553223, 3.0313913822174072, 3.222196578979492, 3.413001775741577, 3.603806972503662, 3.794612169265747, 3.985417366027832, 4.176222801208496, 4.367027759552002, 4.557833194732666, 4.748638153076172, 4.939443588256836]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 7.0, 9.0, 8.0, 10.0, 23.0, 40.0, 56.0, 68.0, 121.0, 186.0, 279.0, 496.0, 863.0, 1829.0, 3712.0, 8775.0, 23043.0, 65653.0, 174836.0, 322286.0, 264229.0, 114694.0, 40836.0, 15119.0, 5805.0, 2503.0, 1264.0, 701.0, 418.0, 247.0, 158.0, 98.0, 61.0, 41.0, 34.0, 14.0, 12.0, 8.0, 9.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.60546875, -5.44427490234375, -5.2830810546875, -5.12188720703125, -4.960693359375, -4.79949951171875, -4.6383056640625, -4.47711181640625, -4.31591796875, -4.15472412109375, -3.9935302734375, -3.83233642578125, -3.671142578125, -3.50994873046875, -3.3487548828125, -3.18756103515625, -3.0263671875, -2.86517333984375, -2.7039794921875, -2.54278564453125, -2.381591796875, -2.22039794921875, -2.0592041015625, -1.89801025390625, -1.73681640625, -1.57562255859375, -1.4144287109375, -1.25323486328125, -1.092041015625, -0.93084716796875, -0.7696533203125, -0.60845947265625, -0.447265625, -0.28607177734375, -0.1248779296875, 0.03631591796875, 0.197509765625, 0.35870361328125, 0.5198974609375, 0.68109130859375, 0.84228515625, 1.00347900390625, 1.1646728515625, 1.32586669921875, 1.487060546875, 1.64825439453125, 1.8094482421875, 1.97064208984375, 2.1318359375, 2.29302978515625, 2.4542236328125, 2.61541748046875, 2.776611328125, 2.93780517578125, 3.0989990234375, 3.26019287109375, 3.42138671875, 3.58258056640625, 3.7437744140625, 3.90496826171875, 4.066162109375, 4.22735595703125, 4.3885498046875, 4.54974365234375, 4.7109375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 7.0, 4.0, 7.0, 8.0, 10.0, 10.0, 14.0, 26.0, 23.0, 30.0, 44.0, 55.0, 68.0, 72.0, 93.0, 79.0, 72.0, 73.0, 56.0, 55.0, 48.0, 38.0, 31.0, 17.0, 27.0, 11.0, 14.0, 2.0, 6.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.06640625, -3.93341064453125, -3.8004150390625, -3.66741943359375, -3.534423828125, -3.40142822265625, -3.2684326171875, -3.13543701171875, -3.00244140625, -2.86944580078125, -2.7364501953125, -2.60345458984375, -2.470458984375, -2.33746337890625, -2.2044677734375, -2.07147216796875, -1.9384765625, -1.80548095703125, -1.6724853515625, -1.53948974609375, -1.406494140625, -1.27349853515625, -1.1405029296875, -1.00750732421875, -0.87451171875, -0.74151611328125, -0.6085205078125, -0.47552490234375, -0.342529296875, -0.20953369140625, -0.0765380859375, 0.05645751953125, 0.189453125, 0.32244873046875, 0.4554443359375, 0.58843994140625, 0.721435546875, 0.85443115234375, 0.9874267578125, 1.12042236328125, 1.25341796875, 1.38641357421875, 1.5194091796875, 1.65240478515625, 1.785400390625, 1.91839599609375, 2.0513916015625, 2.18438720703125, 2.3173828125, 2.45037841796875, 2.5833740234375, 2.71636962890625, 2.849365234375, 2.98236083984375, 3.1153564453125, 3.24835205078125, 3.38134765625, 3.51434326171875, 3.6473388671875, 3.78033447265625, 3.913330078125, 4.04632568359375, 4.1793212890625, 4.31231689453125, 4.4453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 4.0, 4.0, 3.0, 11.0, 12.0, 12.0, 12.0, 19.0, 27.0, 33.0, 60.0, 67.0, 120.0, 159.0, 327.0, 527.0, 1162.0, 2968.0, 27347.0, 899751.0, 107840.0, 4872.0, 1554.0, 701.0, 354.0, 193.0, 123.0, 76.0, 58.0, 39.0, 29.0, 17.0, 18.0, 17.0, 11.0, 6.0, 4.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-23.875, -23.14404296875, -22.4130859375, -21.68212890625, -20.951171875, -20.22021484375, -19.4892578125, -18.75830078125, -18.02734375, -17.29638671875, -16.5654296875, -15.83447265625, -15.103515625, -14.37255859375, -13.6416015625, -12.91064453125, -12.1796875, -11.44873046875, -10.7177734375, -9.98681640625, -9.255859375, -8.52490234375, -7.7939453125, -7.06298828125, -6.33203125, -5.60107421875, -4.8701171875, -4.13916015625, -3.408203125, -2.67724609375, -1.9462890625, -1.21533203125, -0.484375, 0.24658203125, 0.9775390625, 1.70849609375, 2.439453125, 3.17041015625, 3.9013671875, 4.63232421875, 5.36328125, 6.09423828125, 6.8251953125, 7.55615234375, 8.287109375, 9.01806640625, 9.7490234375, 10.47998046875, 11.2109375, 11.94189453125, 12.6728515625, 13.40380859375, 14.134765625, 14.86572265625, 15.5966796875, 16.32763671875, 17.05859375, 17.78955078125, 18.5205078125, 19.25146484375, 19.982421875, 20.71337890625, 21.4443359375, 22.17529296875, 22.90625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 4.0, 6.0, 10.0, 16.0, 22.0, 19.0, 45.0, 44.0, 74.0, 89.0, 99.0, 89.0, 97.0, 84.0, 90.0, 64.0, 38.0, 29.0, 28.0, 16.0, 9.0, 9.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.71875, -31.746337890625, -30.77392578125, -29.801513671875, -28.8291015625, -27.856689453125, -26.88427734375, -25.911865234375, -24.939453125, -23.967041015625, -22.99462890625, -22.022216796875, -21.0498046875, -20.077392578125, -19.10498046875, -18.132568359375, -17.16015625, -16.187744140625, -15.21533203125, -14.242919921875, -13.2705078125, -12.298095703125, -11.32568359375, -10.353271484375, -9.380859375, -8.408447265625, -7.43603515625, -6.463623046875, -5.4912109375, -4.518798828125, -3.54638671875, -2.573974609375, -1.6015625, -0.629150390625, 0.34326171875, 1.315673828125, 2.2880859375, 3.260498046875, 4.23291015625, 5.205322265625, 6.177734375, 7.150146484375, 8.12255859375, 9.094970703125, 10.0673828125, 11.039794921875, 12.01220703125, 12.984619140625, 13.95703125, 14.929443359375, 15.90185546875, 16.874267578125, 17.8466796875, 18.819091796875, 19.79150390625, 20.763916015625, 21.736328125, 22.708740234375, 23.68115234375, 24.653564453125, 25.6259765625, 26.598388671875, 27.57080078125, 28.543212890625, 29.515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 12.0, 9.0, 12.0, 19.0, 46.0, 72.0, 119.0, 247.0, 568.0, 1972.0, 26961.0, 973688.0, 41204.0, 2362.0, 666.0, 260.0, 125.0, 69.0, 47.0, 34.0, 14.0, 11.0, 11.0, 9.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.25, -14.7158203125, -14.181640625, -13.6474609375, -13.11328125, -12.5791015625, -12.044921875, -11.5107421875, -10.9765625, -10.4423828125, -9.908203125, -9.3740234375, -8.83984375, -8.3056640625, -7.771484375, -7.2373046875, -6.703125, -6.1689453125, -5.634765625, -5.1005859375, -4.56640625, -4.0322265625, -3.498046875, -2.9638671875, -2.4296875, -1.8955078125, -1.361328125, -0.8271484375, -0.29296875, 0.2412109375, 0.775390625, 1.3095703125, 1.84375, 2.3779296875, 2.912109375, 3.4462890625, 3.98046875, 4.5146484375, 5.048828125, 5.5830078125, 6.1171875, 6.6513671875, 7.185546875, 7.7197265625, 8.25390625, 8.7880859375, 9.322265625, 9.8564453125, 10.390625, 10.9248046875, 11.458984375, 11.9931640625, 12.52734375, 13.0615234375, 13.595703125, 14.1298828125, 14.6640625, 15.1982421875, 15.732421875, 16.2666015625, 16.80078125, 17.3349609375, 17.869140625, 18.4033203125, 18.9375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 11.0, 10.0, 7.0, 13.0, 27.0, 30.0, 44.0, 48.0, 61.0, 84.0, 96.0, 107.0, 122.0, 82.0, 64.0, 39.0, 43.0, 38.0, 23.0, 18.0, 9.0, 9.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008063316345214844, -0.0007758662104606628, -0.0007454007863998413, -0.0007149353623390198, -0.0006844699382781982, -0.0006540045142173767, -0.0006235390901565552, -0.0005930736660957336, -0.0005626082420349121, -0.0005321428179740906, -0.000501677393913269, -0.0004712119698524475, -0.000440746545791626, -0.00041028112173080444, -0.0003798156976699829, -0.0003493502736091614, -0.00031888484954833984, -0.0002884194254875183, -0.0002579540014266968, -0.00022748857736587524, -0.0001970231533050537, -0.00016655772924423218, -0.00013609230518341064, -0.00010562688112258911, -7.516145706176758e-05, -4.4696033000946045e-05, -1.4230608940124512e-05, 1.623481512069702e-05, 4.6700239181518555e-05, 7.716566324234009e-05, 0.00010763108730316162, 0.00013809651136398315, 0.0001685619354248047, 0.00019902735948562622, 0.00022949278354644775, 0.0002599582076072693, 0.0002904236316680908, 0.00032088905572891235, 0.0003513544797897339, 0.0003818199038505554, 0.00041228532791137695, 0.0004427507519721985, 0.00047321617603302, 0.0005036816000938416, 0.0005341470241546631, 0.0005646124482154846, 0.0005950778722763062, 0.0006255432963371277, 0.0006560087203979492, 0.0006864741444587708, 0.0007169395685195923, 0.0007474049925804138, 0.0007778704166412354, 0.0008083358407020569, 0.0008388012647628784, 0.0008692666888237, 0.0008997321128845215, 0.000930197536945343, 0.0009606629610061646, 0.000991128385066986, 0.0010215938091278076, 0.0010520592331886292, 0.0010825246572494507, 0.0011129900813102722, 0.0011434555053710938]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 6.0, 15.0, 7.0, 21.0, 48.0, 75.0, 148.0, 317.0, 850.0, 2837.0, 29571.0, 975596.0, 34381.0, 3040.0, 931.0, 357.0, 152.0, 69.0, 43.0, 28.0, 15.0, 9.0, 11.0, 8.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7734375, -15.2203369140625, -14.667236328125, -14.1141357421875, -13.56103515625, -13.0079345703125, -12.454833984375, -11.9017333984375, -11.3486328125, -10.7955322265625, -10.242431640625, -9.6893310546875, -9.13623046875, -8.5831298828125, -8.030029296875, -7.4769287109375, -6.923828125, -6.3707275390625, -5.817626953125, -5.2645263671875, -4.71142578125, -4.1583251953125, -3.605224609375, -3.0521240234375, -2.4990234375, -1.9459228515625, -1.392822265625, -0.8397216796875, -0.28662109375, 0.2664794921875, 0.819580078125, 1.3726806640625, 1.92578125, 2.4788818359375, 3.031982421875, 3.5850830078125, 4.13818359375, 4.6912841796875, 5.244384765625, 5.7974853515625, 6.3505859375, 6.9036865234375, 7.456787109375, 8.0098876953125, 8.56298828125, 9.1160888671875, 9.669189453125, 10.2222900390625, 10.775390625, 11.3284912109375, 11.881591796875, 12.4346923828125, 12.98779296875, 13.5408935546875, 14.093994140625, 14.6470947265625, 15.2001953125, 15.7532958984375, 16.306396484375, 16.8594970703125, 17.41259765625, 17.9656982421875, 18.518798828125, 19.0718994140625, 19.625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 2.0, 4.0, 8.0, 5.0, 13.0, 10.0, 17.0, 15.0, 25.0, 36.0, 64.0, 83.0, 139.0, 126.0, 133.0, 98.0, 74.0, 41.0, 28.0, 14.0, 12.0, 20.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6875, -7.3876953125, -7.087890625, -6.7880859375, -6.48828125, -6.1884765625, -5.888671875, -5.5888671875, -5.2890625, -4.9892578125, -4.689453125, -4.3896484375, -4.08984375, -3.7900390625, -3.490234375, -3.1904296875, -2.890625, -2.5908203125, -2.291015625, -1.9912109375, -1.69140625, -1.3916015625, -1.091796875, -0.7919921875, -0.4921875, -0.1923828125, 0.107421875, 0.4072265625, 0.70703125, 1.0068359375, 1.306640625, 1.6064453125, 1.90625, 2.2060546875, 2.505859375, 2.8056640625, 3.10546875, 3.4052734375, 3.705078125, 4.0048828125, 4.3046875, 4.6044921875, 4.904296875, 5.2041015625, 5.50390625, 5.8037109375, 6.103515625, 6.4033203125, 6.703125, 7.0029296875, 7.302734375, 7.6025390625, 7.90234375, 8.2021484375, 8.501953125, 8.8017578125, 9.1015625, 9.4013671875, 9.701171875, 10.0009765625, 10.30078125, 10.6005859375, 10.900390625, 11.2001953125, 11.5]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 13.0, 87.0, 294.0, 424.0, 125.0, 38.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.1228790283203, -163.34454345703125, -155.5662078857422, -147.78787231445312, -140.00955200195312, -132.231201171875, -124.452880859375, -116.67454528808594, -108.89620971679688, -101.11787414550781, -93.33953857421875, -85.56121063232422, -77.78287506103516, -70.0045394897461, -62.2262077331543, -54.4478759765625, -46.66954040527344, -38.891204833984375, -31.112873077392578, -23.33453941345215, -15.556205749511719, -7.777870178222656, 0.000461578369140625, 7.7787933349609375, 15.55712890625, 23.33546257019043, 31.11379623413086, 38.892127990722656, 46.67046356201172, 54.44879913330078, 62.22713088989258, 70.00546264648438, 77.7838134765625, 85.56214904785156, 93.34048461914062, 101.11881256103516, 108.89714813232422, 116.67548370361328, 124.45381164550781, 132.23214721679688, 140.01048278808594, 147.788818359375, 155.56715393066406, 163.34548950195312, 171.12380981445312, 178.90216064453125, 186.68048095703125, 194.4588165283203, 202.23715209960938, 210.01548767089844, 217.7938232421875, 225.57215881347656, 233.35049438476562, 241.12881469726562, 248.9071502685547, 256.68548583984375, 264.46380615234375, 272.24212646484375, 280.0204772949219, 287.7987976074219, 295.5771484375, 303.35546875, 311.1338195800781, 318.9121398925781, 326.69049072265625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 0.0, 6.0, 10.0, 9.0, 13.0, 14.0, 12.0, 15.0, 10.0, 26.0, 30.0, 34.0, 43.0, 45.0, 45.0, 51.0, 60.0, 68.0, 67.0, 51.0, 55.0, 58.0, 50.0, 49.0, 35.0, 48.0, 18.0, 20.0, 17.0, 11.0, 10.0, 5.0, 7.0, 4.0, 0.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-101.92867279052734, -99.08841705322266, -96.2481689453125, -93.40791320800781, -90.56765747070312, -87.72740173339844, -84.88715362548828, -82.0468978881836, -79.20664978027344, -76.36639404296875, -73.5261459350586, -70.6858901977539, -67.84563446044922, -65.00538635253906, -62.165130615234375, -59.32487487792969, -56.484619140625, -53.64436721801758, -50.80411148071289, -47.96385955810547, -45.12360382080078, -42.28335189819336, -39.44309997558594, -36.60284423828125, -33.76259231567383, -30.922338485717773, -28.08208465576172, -25.241832733154297, -22.401578903198242, -19.561325073242188, -16.721073150634766, -13.880819320678711, -11.040573120117188, -8.200319290161133, -5.3600664138793945, -2.5198135375976562, 0.32044029235839844, 3.160694122314453, 6.000946044921875, 8.84119987487793, 11.681453704833984, 14.521707534790039, 17.361961364746094, 20.202213287353516, 23.04246711730957, 25.882720947265625, 28.722972869873047, 31.5632266998291, 34.403480529785156, 37.24373245239258, 40.083988189697266, 42.92424011230469, 45.764495849609375, 48.6047477722168, 51.44499969482422, 54.285255432128906, 57.12550735473633, 59.96575927734375, 62.80601501464844, 65.64627075195312, 68.48651885986328, 71.32677459716797, 74.16702270507812, 77.00727844238281, 79.8475341796875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 2.0, 11.0, 14.0, 22.0, 28.0, 65.0, 89.0, 119.0, 217.0, 336.0, 569.0, 1060.0, 2073.0, 4581.0, 11903.0, 54359.0, 3997425.0, 94557.0, 15908.0, 5483.0, 2494.0, 1251.0, 693.0, 416.0, 251.0, 135.0, 81.0, 55.0, 23.0, 18.0, 15.0, 5.0, 8.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.7734375, -11.4232177734375, -11.072998046875, -10.7227783203125, -10.37255859375, -10.0223388671875, -9.672119140625, -9.3218994140625, -8.9716796875, -8.6214599609375, -8.271240234375, -7.9210205078125, -7.57080078125, -7.2205810546875, -6.870361328125, -6.5201416015625, -6.169921875, -5.8197021484375, -5.469482421875, -5.1192626953125, -4.76904296875, -4.4188232421875, -4.068603515625, -3.7183837890625, -3.3681640625, -3.0179443359375, -2.667724609375, -2.3175048828125, -1.96728515625, -1.6170654296875, -1.266845703125, -0.9166259765625, -0.56640625, -0.2161865234375, 0.134033203125, 0.4842529296875, 0.83447265625, 1.1846923828125, 1.534912109375, 1.8851318359375, 2.2353515625, 2.5855712890625, 2.935791015625, 3.2860107421875, 3.63623046875, 3.9864501953125, 4.336669921875, 4.6868896484375, 5.037109375, 5.3873291015625, 5.737548828125, 6.0877685546875, 6.43798828125, 6.7882080078125, 7.138427734375, 7.4886474609375, 7.8388671875, 8.1890869140625, 8.539306640625, 8.8895263671875, 9.23974609375, 9.5899658203125, 9.940185546875, 10.2904052734375, 10.640625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 7.0, 16.0, 23.0, 23.0, 44.0, 56.0, 76.0, 136.0, 135.0, 112.0, 107.0, 85.0, 57.0, 47.0, 30.0, 16.0, 15.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.71832275390625, -8.4757080078125, -8.23309326171875, -7.990478515625, -7.74786376953125, -7.5052490234375, -7.26263427734375, -7.02001953125, -6.77740478515625, -6.5347900390625, -6.29217529296875, -6.049560546875, -5.80694580078125, -5.5643310546875, -5.32171630859375, -5.0791015625, -4.83648681640625, -4.5938720703125, -4.35125732421875, -4.108642578125, -3.86602783203125, -3.6234130859375, -3.38079833984375, -3.13818359375, -2.89556884765625, -2.6529541015625, -2.41033935546875, -2.167724609375, -1.92510986328125, -1.6824951171875, -1.43988037109375, -1.197265625, -0.95465087890625, -0.7120361328125, -0.46942138671875, -0.226806640625, 0.01580810546875, 0.2584228515625, 0.50103759765625, 0.74365234375, 0.98626708984375, 1.2288818359375, 1.47149658203125, 1.714111328125, 1.95672607421875, 2.1993408203125, 2.44195556640625, 2.6845703125, 2.92718505859375, 3.1697998046875, 3.41241455078125, 3.655029296875, 3.89764404296875, 4.1402587890625, 4.38287353515625, 4.62548828125, 4.86810302734375, 5.1107177734375, 5.35333251953125, 5.595947265625, 5.83856201171875, 6.0811767578125, 6.32379150390625, 6.56640625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 14.0, 10.0, 13.0, 20.0, 20.0, 34.0, 31.0, 57.0, 65.0, 92.0, 100.0, 179.0, 325.0, 875.0, 3764.0, 30675.0, 4087869.0, 62466.0, 5462.0, 1155.0, 363.0, 197.0, 104.0, 107.0, 70.0, 49.0, 38.0, 32.0, 27.0, 17.0, 18.0, 10.0, 6.0, 7.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.96875, -24.247314453125, -23.52587890625, -22.804443359375, -22.0830078125, -21.361572265625, -20.64013671875, -19.918701171875, -19.197265625, -18.475830078125, -17.75439453125, -17.032958984375, -16.3115234375, -15.590087890625, -14.86865234375, -14.147216796875, -13.42578125, -12.704345703125, -11.98291015625, -11.261474609375, -10.5400390625, -9.818603515625, -9.09716796875, -8.375732421875, -7.654296875, -6.932861328125, -6.21142578125, -5.489990234375, -4.7685546875, -4.047119140625, -3.32568359375, -2.604248046875, -1.8828125, -1.161376953125, -0.43994140625, 0.281494140625, 1.0029296875, 1.724365234375, 2.44580078125, 3.167236328125, 3.888671875, 4.610107421875, 5.33154296875, 6.052978515625, 6.7744140625, 7.495849609375, 8.21728515625, 8.938720703125, 9.66015625, 10.381591796875, 11.10302734375, 11.824462890625, 12.5458984375, 13.267333984375, 13.98876953125, 14.710205078125, 15.431640625, 16.153076171875, 16.87451171875, 17.595947265625, 18.3173828125, 19.038818359375, 19.76025390625, 20.481689453125, 21.203125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 11.0, 5.0, 9.0, 32.0, 80.0, 551.0, 3182.0, 121.0, 41.0, 20.0, 11.0, 6.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.21484375, -4.05914306640625, -3.9034423828125, -3.74774169921875, -3.592041015625, -3.43634033203125, -3.2806396484375, -3.12493896484375, -2.96923828125, -2.81353759765625, -2.6578369140625, -2.50213623046875, -2.346435546875, -2.19073486328125, -2.0350341796875, -1.87933349609375, -1.7236328125, -1.56793212890625, -1.4122314453125, -1.25653076171875, -1.100830078125, -0.94512939453125, -0.7894287109375, -0.63372802734375, -0.47802734375, -0.32232666015625, -0.1666259765625, -0.01092529296875, 0.144775390625, 0.30047607421875, 0.4561767578125, 0.61187744140625, 0.767578125, 0.92327880859375, 1.0789794921875, 1.23468017578125, 1.390380859375, 1.54608154296875, 1.7017822265625, 1.85748291015625, 2.01318359375, 2.16888427734375, 2.3245849609375, 2.48028564453125, 2.635986328125, 2.79168701171875, 2.9473876953125, 3.10308837890625, 3.2587890625, 3.41448974609375, 3.5701904296875, 3.72589111328125, 3.881591796875, 4.03729248046875, 4.1929931640625, 4.34869384765625, 4.50439453125, 4.66009521484375, 4.8157958984375, 4.97149658203125, 5.127197265625, 5.28289794921875, 5.4385986328125, 5.59429931640625, 5.75]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 11.0, 16.0, 50.0, 94.0, 148.0, 170.0, 194.0, 127.0, 72.0, 48.0, 26.0, 16.0, 9.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.63588809967041, -13.150086402893066, -12.664285659790039, -12.178483963012695, -11.692682266235352, -11.206880569458008, -10.721078872680664, -10.235278129577637, -9.749476432800293, -9.26367473602295, -8.777873992919922, -8.292072296142578, -7.806270599365234, -7.320468902587891, -6.834667682647705, -6.3488664627075195, -5.863064765930176, -5.377263069152832, -4.8914618492126465, -4.405660629272461, -3.919858932495117, -3.4340574741363525, -2.948256015777588, -2.4624545574188232, -1.9766530990600586, -1.490851640701294, -1.0050501823425293, -0.5192487239837646, -0.033447265625, 0.45235419273376465, 0.9381556510925293, 1.423957109451294, 1.909759521484375, 2.3955609798431396, 2.8813624382019043, 3.367163896560669, 3.8529653549194336, 4.338767051696777, 4.824568271636963, 5.310369491577148, 5.796171188354492, 6.281972885131836, 6.7677741050720215, 7.253575325012207, 7.739377021789551, 8.225178718566895, 8.710979461669922, 9.196781158447266, 9.68258285522461, 10.168384552001953, 10.654186248779297, 11.139986991882324, 11.625788688659668, 12.111590385437012, 12.597391128540039, 13.083192825317383, 13.568994522094727, 14.05479621887207, 14.540597915649414, 15.026398658752441, 15.512200355529785, 15.998002052307129, 16.483802795410156, 16.9696044921875, 17.455406188964844]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 8.0, 7.0, 9.0, 8.0, 16.0, 15.0, 18.0, 14.0, 24.0, 30.0, 31.0, 27.0, 42.0, 33.0, 35.0, 33.0, 48.0, 32.0, 31.0, 40.0, 38.0, 52.0, 33.0, 35.0, 46.0, 35.0, 28.0, 27.0, 31.0, 22.0, 20.0, 26.0, 16.0, 12.0, 17.0, 12.0, 11.0, 7.0, 3.0, 7.0, 3.0, 2.0, 2.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.867315292358398, -6.6599507331848145, -6.4525861740112305, -6.2452216148376465, -6.0378570556640625, -5.83049201965332, -5.6231279373168945, -5.415762901306152, -5.208398342132568, -5.001033782958984, -4.7936692237854, -4.586304664611816, -4.378940105438232, -4.171575546264648, -3.9642107486724854, -3.7568459510803223, -3.5494816303253174, -3.3421170711517334, -3.1347525119781494, -2.9273877143859863, -2.7200231552124023, -2.5126585960388184, -2.3052940368652344, -2.0979294776916504, -1.8905647993087769, -1.6832002401351929, -1.4758355617523193, -1.2684710025787354, -1.0611064434051514, -0.8537417650222778, -0.6463772058486938, -0.4390125274658203, -0.23164796829223633, -0.024283364415168762, 0.1830812394618988, 0.3904458284378052, 0.5978104472160339, 0.8051750659942627, 1.0125396251678467, 1.2199043035507202, 1.4272688627243042, 1.6346334218978882, 1.8419981002807617, 2.0493626594543457, 2.2567272186279297, 2.4640917778015137, 2.6714563369750977, 2.8788211345672607, 3.0861856937408447, 3.2935502529144287, 3.5009148120880127, 3.708279609680176, 3.9156441688537598, 4.123008728027344, 4.330373287200928, 4.537737846374512, 4.745102405548096, 4.95246696472168, 5.159831523895264, 5.367196083068848, 5.574560642242432, 5.781925201416016, 5.989290237426758, 6.196654796600342, 6.404019355773926]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 8.0, 12.0, 15.0, 24.0, 29.0, 49.0, 92.0, 161.0, 254.0, 499.0, 1122.0, 2884.0, 9614.0, 41652.0, 217356.0, 547420.0, 179963.0, 34480.0, 8245.0, 2578.0, 1001.0, 450.0, 238.0, 149.0, 80.0, 59.0, 31.0, 25.0, 19.0, 10.0, 5.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0078125, -6.75244140625, -6.4970703125, -6.24169921875, -5.986328125, -5.73095703125, -5.4755859375, -5.22021484375, -4.96484375, -4.70947265625, -4.4541015625, -4.19873046875, -3.943359375, -3.68798828125, -3.4326171875, -3.17724609375, -2.921875, -2.66650390625, -2.4111328125, -2.15576171875, -1.900390625, -1.64501953125, -1.3896484375, -1.13427734375, -0.87890625, -0.62353515625, -0.3681640625, -0.11279296875, 0.142578125, 0.39794921875, 0.6533203125, 0.90869140625, 1.1640625, 1.41943359375, 1.6748046875, 1.93017578125, 2.185546875, 2.44091796875, 2.6962890625, 2.95166015625, 3.20703125, 3.46240234375, 3.7177734375, 3.97314453125, 4.228515625, 4.48388671875, 4.7392578125, 4.99462890625, 5.25, 5.50537109375, 5.7607421875, 6.01611328125, 6.271484375, 6.52685546875, 6.7822265625, 7.03759765625, 7.29296875, 7.54833984375, 7.8037109375, 8.05908203125, 8.314453125, 8.56982421875, 8.8251953125, 9.08056640625, 9.3359375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 11.0, 18.0, 19.0, 22.0, 32.0, 63.0, 83.0, 97.0, 99.0, 122.0, 94.0, 87.0, 72.0, 52.0, 34.0, 33.0, 17.0, 15.0, 12.0, 3.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.5234375, -8.29541015625, -8.0673828125, -7.83935546875, -7.611328125, -7.38330078125, -7.1552734375, -6.92724609375, -6.69921875, -6.47119140625, -6.2431640625, -6.01513671875, -5.787109375, -5.55908203125, -5.3310546875, -5.10302734375, -4.875, -4.64697265625, -4.4189453125, -4.19091796875, -3.962890625, -3.73486328125, -3.5068359375, -3.27880859375, -3.05078125, -2.82275390625, -2.5947265625, -2.36669921875, -2.138671875, -1.91064453125, -1.6826171875, -1.45458984375, -1.2265625, -0.99853515625, -0.7705078125, -0.54248046875, -0.314453125, -0.08642578125, 0.1416015625, 0.36962890625, 0.59765625, 0.82568359375, 1.0537109375, 1.28173828125, 1.509765625, 1.73779296875, 1.9658203125, 2.19384765625, 2.421875, 2.64990234375, 2.8779296875, 3.10595703125, 3.333984375, 3.56201171875, 3.7900390625, 4.01806640625, 4.24609375, 4.47412109375, 4.7021484375, 4.93017578125, 5.158203125, 5.38623046875, 5.6142578125, 5.84228515625, 6.0703125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 2.0, 6.0, 4.0, 11.0, 20.0, 19.0, 43.0, 105.0, 159.0, 409.0, 1200.0, 6249.0, 966291.0, 70329.0, 2426.0, 694.0, 297.0, 131.0, 62.0, 46.0, 19.0, 13.0, 9.0, 4.0, 8.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.1875, -31.8994140625, -30.611328125, -29.3232421875, -28.03515625, -26.7470703125, -25.458984375, -24.1708984375, -22.8828125, -21.5947265625, -20.306640625, -19.0185546875, -17.73046875, -16.4423828125, -15.154296875, -13.8662109375, -12.578125, -11.2900390625, -10.001953125, -8.7138671875, -7.42578125, -6.1376953125, -4.849609375, -3.5615234375, -2.2734375, -0.9853515625, 0.302734375, 1.5908203125, 2.87890625, 4.1669921875, 5.455078125, 6.7431640625, 8.03125, 9.3193359375, 10.607421875, 11.8955078125, 13.18359375, 14.4716796875, 15.759765625, 17.0478515625, 18.3359375, 19.6240234375, 20.912109375, 22.2001953125, 23.48828125, 24.7763671875, 26.064453125, 27.3525390625, 28.640625, 29.9287109375, 31.216796875, 32.5048828125, 33.79296875, 35.0810546875, 36.369140625, 37.6572265625, 38.9453125, 40.2333984375, 41.521484375, 42.8095703125, 44.09765625, 45.3857421875, 46.673828125, 47.9619140625, 49.25]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 15.0, 12.0, 26.0, 40.0, 53.0, 81.0, 129.0, 147.0, 142.0, 119.0, 92.0, 58.0, 23.0, 20.0, 9.0, 9.0, 7.0, 5.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.0625, -40.1416015625, -38.220703125, -36.2998046875, -34.37890625, -32.4580078125, -30.537109375, -28.6162109375, -26.6953125, -24.7744140625, -22.853515625, -20.9326171875, -19.01171875, -17.0908203125, -15.169921875, -13.2490234375, -11.328125, -9.4072265625, -7.486328125, -5.5654296875, -3.64453125, -1.7236328125, 0.197265625, 2.1181640625, 4.0390625, 5.9599609375, 7.880859375, 9.8017578125, 11.72265625, 13.6435546875, 15.564453125, 17.4853515625, 19.40625, 21.3271484375, 23.248046875, 25.1689453125, 27.08984375, 29.0107421875, 30.931640625, 32.8525390625, 34.7734375, 36.6943359375, 38.615234375, 40.5361328125, 42.45703125, 44.3779296875, 46.298828125, 48.2197265625, 50.140625, 52.0615234375, 53.982421875, 55.9033203125, 57.82421875, 59.7451171875, 61.666015625, 63.5869140625, 65.5078125, 67.4287109375, 69.349609375, 71.2705078125, 73.19140625, 75.1123046875, 77.033203125, 78.9541015625, 80.875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 12.0, 9.0, 6.0, 13.0, 23.0, 27.0, 38.0, 43.0, 58.0, 90.0, 161.0, 292.0, 590.0, 1724.0, 13834.0, 911083.0, 114520.0, 4094.0, 923.0, 378.0, 218.0, 121.0, 90.0, 62.0, 41.0, 20.0, 17.0, 19.0, 11.0, 3.0, 4.0, 8.0, 6.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.375, -15.929443359375, -15.48388671875, -15.038330078125, -14.5927734375, -14.147216796875, -13.70166015625, -13.256103515625, -12.810546875, -12.364990234375, -11.91943359375, -11.473876953125, -11.0283203125, -10.582763671875, -10.13720703125, -9.691650390625, -9.24609375, -8.800537109375, -8.35498046875, -7.909423828125, -7.4638671875, -7.018310546875, -6.57275390625, -6.127197265625, -5.681640625, -5.236083984375, -4.79052734375, -4.344970703125, -3.8994140625, -3.453857421875, -3.00830078125, -2.562744140625, -2.1171875, -1.671630859375, -1.22607421875, -0.780517578125, -0.3349609375, 0.110595703125, 0.55615234375, 1.001708984375, 1.447265625, 1.892822265625, 2.33837890625, 2.783935546875, 3.2294921875, 3.675048828125, 4.12060546875, 4.566162109375, 5.01171875, 5.457275390625, 5.90283203125, 6.348388671875, 6.7939453125, 7.239501953125, 7.68505859375, 8.130615234375, 8.576171875, 9.021728515625, 9.46728515625, 9.912841796875, 10.3583984375, 10.803955078125, 11.24951171875, 11.695068359375, 12.140625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 2.0, 9.0, 12.0, 14.0, 25.0, 36.0, 33.0, 53.0, 61.0, 87.0, 120.0, 114.0, 102.0, 98.0, 60.0, 42.0, 39.0, 15.0, 17.0, 16.0, 5.0, 8.0, 7.0, 3.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009050369262695312, -0.0008792728185653687, -0.0008535087108612061, -0.0008277446031570435, -0.0008019804954528809, -0.0007762163877487183, -0.0007504522800445557, -0.0007246881723403931, -0.0006989240646362305, -0.0006731599569320679, -0.0006473958492279053, -0.0006216317415237427, -0.0005958676338195801, -0.0005701035261154175, -0.0005443394184112549, -0.0005185753107070923, -0.0004928112030029297, -0.0004670470952987671, -0.0004412829875946045, -0.0004155188798904419, -0.0003897547721862793, -0.0003639906644821167, -0.0003382265567779541, -0.0003124624490737915, -0.0002866983413696289, -0.0002609342336654663, -0.0002351701259613037, -0.0002094060182571411, -0.00018364191055297852, -0.00015787780284881592, -0.00013211369514465332, -0.00010634958744049072, -8.058547973632812e-05, -5.482137203216553e-05, -2.905726432800293e-05, -3.293156623840332e-06, 2.2470951080322266e-05, 4.823505878448486e-05, 7.399916648864746e-05, 9.976327419281006e-05, 0.00012552738189697266, 0.00015129148960113525, 0.00017705559730529785, 0.00020281970500946045, 0.00022858381271362305, 0.00025434792041778564, 0.00028011202812194824, 0.00030587613582611084, 0.00033164024353027344, 0.00035740435123443604, 0.00038316845893859863, 0.00040893256664276123, 0.00043469667434692383, 0.0004604607820510864, 0.000486224889755249, 0.0005119889974594116, 0.0005377531051635742, 0.0005635172128677368, 0.0005892813205718994, 0.000615045428276062, 0.0006408095359802246, 0.0006665736436843872, 0.0006923377513885498, 0.0007181018590927124, 0.000743865966796875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 16.0, 19.0, 23.0, 32.0, 48.0, 65.0, 116.0, 194.0, 344.0, 817.0, 2772.0, 22792.0, 902201.0, 111054.0, 5565.0, 1341.0, 511.0, 231.0, 150.0, 85.0, 48.0, 27.0, 27.0, 21.0, 14.0, 12.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.3125, -11.9241943359375, -11.535888671875, -11.1475830078125, -10.75927734375, -10.3709716796875, -9.982666015625, -9.5943603515625, -9.2060546875, -8.8177490234375, -8.429443359375, -8.0411376953125, -7.65283203125, -7.2645263671875, -6.876220703125, -6.4879150390625, -6.099609375, -5.7113037109375, -5.322998046875, -4.9346923828125, -4.54638671875, -4.1580810546875, -3.769775390625, -3.3814697265625, -2.9931640625, -2.6048583984375, -2.216552734375, -1.8282470703125, -1.43994140625, -1.0516357421875, -0.663330078125, -0.2750244140625, 0.11328125, 0.5015869140625, 0.889892578125, 1.2781982421875, 1.66650390625, 2.0548095703125, 2.443115234375, 2.8314208984375, 3.2197265625, 3.6080322265625, 3.996337890625, 4.3846435546875, 4.77294921875, 5.1612548828125, 5.549560546875, 5.9378662109375, 6.326171875, 6.7144775390625, 7.102783203125, 7.4910888671875, 7.87939453125, 8.2677001953125, 8.656005859375, 9.0443115234375, 9.4326171875, 9.8209228515625, 10.209228515625, 10.5975341796875, 10.98583984375, 11.3741455078125, 11.762451171875, 12.1507568359375, 12.5390625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 1.0, 13.0, 8.0, 21.0, 21.0, 37.0, 104.0, 212.0, 252.0, 139.0, 66.0, 39.0, 25.0, 17.0, 9.0, 5.0, 0.0, 7.0, 5.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.6796875, -15.1617431640625, -14.643798828125, -14.1258544921875, -13.60791015625, -13.0899658203125, -12.572021484375, -12.0540771484375, -11.5361328125, -11.0181884765625, -10.500244140625, -9.9822998046875, -9.46435546875, -8.9464111328125, -8.428466796875, -7.9105224609375, -7.392578125, -6.8746337890625, -6.356689453125, -5.8387451171875, -5.32080078125, -4.8028564453125, -4.284912109375, -3.7669677734375, -3.2490234375, -2.7310791015625, -2.213134765625, -1.6951904296875, -1.17724609375, -0.6593017578125, -0.141357421875, 0.3765869140625, 0.89453125, 1.4124755859375, 1.930419921875, 2.4483642578125, 2.96630859375, 3.4842529296875, 4.002197265625, 4.5201416015625, 5.0380859375, 5.5560302734375, 6.073974609375, 6.5919189453125, 7.10986328125, 7.6278076171875, 8.145751953125, 8.6636962890625, 9.181640625, 9.6995849609375, 10.217529296875, 10.7354736328125, 11.25341796875, 11.7713623046875, 12.289306640625, 12.8072509765625, 13.3251953125, 13.8431396484375, 14.361083984375, 14.8790283203125, 15.39697265625, 15.9149169921875, 16.432861328125, 16.9508056640625, 17.46875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 6.0, 65.0, 442.0, 409.0, 59.0, 13.0, 3.0, 4.0, 0.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.79693603515625, -62.22686004638672, -51.65678405761719, -41.08671188354492, -30.51663589477539, -19.94655990600586, -9.376487731933594, 1.1935882568359375, 11.763664245605469, 22.333740234375, 32.90381622314453, 43.4738883972168, 54.04396438598633, 64.61404418945312, 75.18411254882812, 85.75418853759766, 96.32426452636719, 106.89434051513672, 117.46441650390625, 128.03448486328125, 138.6045684814453, 149.1746368408203, 159.74472045898438, 170.31478881835938, 180.88485717773438, 191.45492553710938, 202.02500915527344, 212.59507751464844, 223.1651611328125, 233.7352294921875, 244.3052978515625, 254.87538146972656, 265.4454650878906, 276.0155334472656, 286.5856018066406, 297.15570068359375, 307.72576904296875, 318.29583740234375, 328.86590576171875, 339.43597412109375, 350.0060729980469, 360.5761413574219, 371.1462097167969, 381.71630859375, 392.286376953125, 402.8564453125, 413.426513671875, 423.99658203125, 434.566650390625, 445.13671875, 455.706787109375, 466.2768859863281, 476.8469543457031, 487.4170227050781, 497.9870910644531, 508.55718994140625, 519.1272583007812, 529.6973266601562, 540.2673950195312, 550.8374633789062, 561.4075317382812, 571.9776611328125, 582.5477294921875, 593.1177978515625, 603.6878662109375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 5.0, 4.0, 4.0, 7.0, 3.0, 6.0, 11.0, 5.0, 11.0, 16.0, 24.0, 23.0, 26.0, 35.0, 56.0, 43.0, 56.0, 53.0, 59.0, 66.0, 66.0, 71.0, 59.0, 45.0, 42.0, 40.0, 36.0, 31.0, 25.0, 19.0, 15.0, 9.0, 10.0, 5.0, 8.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.92903900146484, -119.58025360107422, -116.23147583007812, -112.8826904296875, -109.53390502929688, -106.18512725830078, -102.83634185791016, -99.48756408691406, -96.13877868652344, -92.78999328613281, -89.44121551513672, -86.0924301147461, -82.74365234375, -79.39486694335938, -76.04608154296875, -72.69729614257812, -69.34851837158203, -65.9997329711914, -62.65095520019531, -59.30216979980469, -55.95338821411133, -52.60460662841797, -49.255821228027344, -45.907039642333984, -42.558258056640625, -39.209476470947266, -35.860694885253906, -32.51190948486328, -29.163127899169922, -25.814346313476562, -22.46556282043457, -19.116779327392578, -15.76800537109375, -12.419222831726074, -9.070440292358398, -5.721657752990723, -2.372875213623047, 0.9759063720703125, 4.324689865112305, 7.673473358154297, 11.022254943847656, 14.371037483215332, 17.719820022583008, 21.068603515625, 24.41738510131836, 27.76616668701172, 31.11495018005371, 34.4637336730957, 37.81251525878906, 41.16129684448242, 44.51007843017578, 47.858863830566406, 51.207645416259766, 54.556427001953125, 57.90521240234375, 61.25399398803711, 64.60277557373047, 67.9515609741211, 71.30033874511719, 74.64912414550781, 77.99790954589844, 81.34668731689453, 84.69547271728516, 88.04425048828125, 91.39303588867188]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 4.0, 7.0, 4.0, 12.0, 22.0, 21.0, 38.0, 61.0, 95.0, 113.0, 211.0, 307.0, 558.0, 1122.0, 2496.0, 6440.0, 22385.0, 162705.0, 3877667.0, 94543.0, 16423.0, 5022.0, 1964.0, 872.0, 497.0, 272.0, 145.0, 100.0, 60.0, 38.0, 27.0, 10.0, 14.0, 10.0, 4.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.296875, -10.9947509765625, -10.692626953125, -10.3905029296875, -10.08837890625, -9.7862548828125, -9.484130859375, -9.1820068359375, -8.8798828125, -8.5777587890625, -8.275634765625, -7.9735107421875, -7.67138671875, -7.3692626953125, -7.067138671875, -6.7650146484375, -6.462890625, -6.1607666015625, -5.858642578125, -5.5565185546875, -5.25439453125, -4.9522705078125, -4.650146484375, -4.3480224609375, -4.0458984375, -3.7437744140625, -3.441650390625, -3.1395263671875, -2.83740234375, -2.5352783203125, -2.233154296875, -1.9310302734375, -1.62890625, -1.3267822265625, -1.024658203125, -0.7225341796875, -0.42041015625, -0.1182861328125, 0.183837890625, 0.4859619140625, 0.7880859375, 1.0902099609375, 1.392333984375, 1.6944580078125, 1.99658203125, 2.2987060546875, 2.600830078125, 2.9029541015625, 3.205078125, 3.5072021484375, 3.809326171875, 4.1114501953125, 4.41357421875, 4.7156982421875, 5.017822265625, 5.3199462890625, 5.6220703125, 5.9241943359375, 6.226318359375, 6.5284423828125, 6.83056640625, 7.1326904296875, 7.434814453125, 7.7369384765625, 8.0390625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 5.0, 12.0, 19.0, 22.0, 34.0, 45.0, 66.0, 98.0, 109.0, 119.0, 103.0, 99.0, 84.0, 62.0, 44.0, 32.0, 12.0, 10.0, 11.0, 7.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.578125, -10.3460693359375, -10.114013671875, -9.8819580078125, -9.64990234375, -9.4178466796875, -9.185791015625, -8.9537353515625, -8.7216796875, -8.4896240234375, -8.257568359375, -8.0255126953125, -7.79345703125, -7.5614013671875, -7.329345703125, -7.0972900390625, -6.865234375, -6.6331787109375, -6.401123046875, -6.1690673828125, -5.93701171875, -5.7049560546875, -5.472900390625, -5.2408447265625, -5.0087890625, -4.7767333984375, -4.544677734375, -4.3126220703125, -4.08056640625, -3.8485107421875, -3.616455078125, -3.3843994140625, -3.15234375, -2.9202880859375, -2.688232421875, -2.4561767578125, -2.22412109375, -1.9920654296875, -1.760009765625, -1.5279541015625, -1.2958984375, -1.0638427734375, -0.831787109375, -0.5997314453125, -0.36767578125, -0.1356201171875, 0.096435546875, 0.3284912109375, 0.560546875, 0.7926025390625, 1.024658203125, 1.2567138671875, 1.48876953125, 1.7208251953125, 1.952880859375, 2.1849365234375, 2.4169921875, 2.6490478515625, 2.881103515625, 3.1131591796875, 3.34521484375, 3.5772705078125, 3.809326171875, 4.0413818359375, 4.2734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 5.0, 6.0, 6.0, 9.0, 16.0, 20.0, 28.0, 46.0, 73.0, 107.0, 157.0, 247.0, 350.0, 606.0, 1088.0, 1736.0, 3767.0, 9416.0, 29234.0, 139422.0, 3583231.0, 350615.0, 49330.0, 13918.0, 5168.0, 2440.0, 1282.0, 666.0, 501.0, 284.0, 156.0, 117.0, 72.0, 52.0, 42.0, 25.0, 15.0, 12.0, 7.0, 6.0, 2.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.890625, -6.67987060546875, -6.4691162109375, -6.25836181640625, -6.047607421875, -5.83685302734375, -5.6260986328125, -5.41534423828125, -5.20458984375, -4.99383544921875, -4.7830810546875, -4.57232666015625, -4.361572265625, -4.15081787109375, -3.9400634765625, -3.72930908203125, -3.5185546875, -3.30780029296875, -3.0970458984375, -2.88629150390625, -2.675537109375, -2.46478271484375, -2.2540283203125, -2.04327392578125, -1.83251953125, -1.62176513671875, -1.4110107421875, -1.20025634765625, -0.989501953125, -0.77874755859375, -0.5679931640625, -0.35723876953125, -0.146484375, 0.06427001953125, 0.2750244140625, 0.48577880859375, 0.696533203125, 0.90728759765625, 1.1180419921875, 1.32879638671875, 1.53955078125, 1.75030517578125, 1.9610595703125, 2.17181396484375, 2.382568359375, 2.59332275390625, 2.8040771484375, 3.01483154296875, 3.2255859375, 3.43634033203125, 3.6470947265625, 3.85784912109375, 4.068603515625, 4.27935791015625, 4.4901123046875, 4.70086669921875, 4.91162109375, 5.12237548828125, 5.3331298828125, 5.54388427734375, 5.754638671875, 5.96539306640625, 6.1761474609375, 6.38690185546875, 6.59765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 6.0, 22.0, 17.0, 36.0, 52.0, 70.0, 120.0, 276.0, 1149.0, 1764.0, 246.0, 102.0, 70.0, 37.0, 25.0, 9.0, 15.0, 12.0, 4.0, 9.0, 5.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-3.84375, -3.737091064453125, -3.63043212890625, -3.523773193359375, -3.4171142578125, -3.310455322265625, -3.20379638671875, -3.097137451171875, -2.990478515625, -2.883819580078125, -2.77716064453125, -2.670501708984375, -2.5638427734375, -2.457183837890625, -2.35052490234375, -2.243865966796875, -2.13720703125, -2.030548095703125, -1.92388916015625, -1.817230224609375, -1.7105712890625, -1.603912353515625, -1.49725341796875, -1.390594482421875, -1.283935546875, -1.177276611328125, -1.07061767578125, -0.963958740234375, -0.8572998046875, -0.750640869140625, -0.64398193359375, -0.537322998046875, -0.4306640625, -0.324005126953125, -0.21734619140625, -0.110687255859375, -0.0040283203125, 0.102630615234375, 0.20928955078125, 0.315948486328125, 0.422607421875, 0.529266357421875, 0.63592529296875, 0.742584228515625, 0.8492431640625, 0.955902099609375, 1.06256103515625, 1.169219970703125, 1.27587890625, 1.382537841796875, 1.48919677734375, 1.595855712890625, 1.7025146484375, 1.809173583984375, 1.91583251953125, 2.022491455078125, 2.129150390625, 2.235809326171875, 2.34246826171875, 2.449127197265625, 2.5557861328125, 2.662445068359375, 2.76910400390625, 2.875762939453125, 2.982421875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 9.0, 8.0, 18.0, 29.0, 90.0, 135.0, 199.0, 233.0, 153.0, 67.0, 36.0, 16.0, 3.0, 4.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.841712951660156, -15.891804695129395, -14.94189739227295, -13.991989135742188, -13.042081832885742, -12.09217357635498, -11.142265319824219, -10.192358016967773, -9.242450714111328, -8.292542457580566, -7.342635154724121, -6.392726898193359, -5.442819595336914, -4.492911338806152, -3.543003559112549, -2.5930957794189453, -1.6431875228881836, -0.6932796835899353, 0.256628155708313, 1.206536054611206, 2.1564438343048096, 3.106351852416992, 4.056259632110596, 5.006167411804199, 5.956075191497803, 6.905982971191406, 7.85589075088501, 8.805798530578613, 9.755706787109375, 10.70561408996582, 11.655522346496582, 12.605430603027344, 13.555337905883789, 14.50524616241455, 15.455153465270996, 16.405061721801758, 17.354969024658203, 18.30487823486328, 19.254785537719727, 20.204692840576172, 21.154600143432617, 22.104507446289062, 23.05441665649414, 24.004323959350586, 24.95423126220703, 25.90414047241211, 26.854047775268555, 27.803955078125, 28.753864288330078, 29.703771591186523, 30.6536808013916, 31.603588104248047, 32.553497314453125, 33.50340270996094, 34.453311920166016, 35.403221130371094, 36.353126525878906, 37.303035736083984, 38.2529411315918, 39.202850341796875, 40.15275955200195, 41.102664947509766, 42.052574157714844, 43.002479553222656, 43.952388763427734]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 3.0, 7.0, 4.0, 6.0, 12.0, 9.0, 13.0, 16.0, 17.0, 25.0, 27.0, 34.0, 26.0, 25.0, 27.0, 45.0, 33.0, 42.0, 42.0, 30.0, 45.0, 43.0, 37.0, 36.0, 36.0, 40.0, 53.0, 37.0, 35.0, 24.0, 27.0, 27.0, 13.0, 27.0, 10.0, 16.0, 15.0, 3.0, 9.0, 5.0, 5.0, 10.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.937845230102539, -11.607224464416504, -11.276602745056152, -10.945981979370117, -10.615360260009766, -10.28473949432373, -9.954118728637695, -9.623497009277344, -9.292876243591309, -8.962255477905273, -8.631633758544922, -8.301012992858887, -7.970391750335693, -7.6397705078125, -7.309149742126465, -6.9785284996032715, -6.647907257080078, -6.317286014556885, -5.986664772033691, -5.656044006347656, -5.325422763824463, -4.9948015213012695, -4.664180755615234, -4.333559513092041, -4.002938270568848, -3.6723170280456543, -3.34169602394104, -3.011075019836426, -2.6804537773132324, -2.349832534790039, -2.019211530685425, -1.6885905265808105, -1.3579702377319336, -1.0273491144180298, -0.696727991104126, -0.36610686779022217, -0.03548574447631836, 0.29513537883758545, 0.6257565021514893, 0.9563775062561035, 1.2869987487792969, 1.6176198720932007, 1.9482409954071045, 2.2788619995117188, 2.609483242034912, 2.9401044845581055, 3.2707254886627197, 3.601346492767334, 3.9319677352905273, 4.262588977813721, 4.593210220336914, 4.923830986022949, 5.254452228546143, 5.585073471069336, 5.915694236755371, 6.2463154792785645, 6.576936721801758, 6.907557964324951, 7.2381792068481445, 7.56879997253418, 7.899421215057373, 8.230042457580566, 8.560663223266602, 8.891284942626953, 9.221905708312988]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 5.0, 8.0, 10.0, 10.0, 28.0, 35.0, 80.0, 131.0, 350.0, 1062.0, 5656.0, 57497.0, 753103.0, 213383.0, 13970.0, 2270.0, 574.0, 183.0, 82.0, 47.0, 23.0, 15.0, 12.0, 12.0, 4.0, 0.0, 3.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.84375, -18.249755859375, -17.65576171875, -17.061767578125, -16.4677734375, -15.873779296875, -15.27978515625, -14.685791015625, -14.091796875, -13.497802734375, -12.90380859375, -12.309814453125, -11.7158203125, -11.121826171875, -10.52783203125, -9.933837890625, -9.33984375, -8.745849609375, -8.15185546875, -7.557861328125, -6.9638671875, -6.369873046875, -5.77587890625, -5.181884765625, -4.587890625, -3.993896484375, -3.39990234375, -2.805908203125, -2.2119140625, -1.617919921875, -1.02392578125, -0.429931640625, 0.1640625, 0.758056640625, 1.35205078125, 1.946044921875, 2.5400390625, 3.134033203125, 3.72802734375, 4.322021484375, 4.916015625, 5.510009765625, 6.10400390625, 6.697998046875, 7.2919921875, 7.885986328125, 8.47998046875, 9.073974609375, 9.66796875, 10.261962890625, 10.85595703125, 11.449951171875, 12.0439453125, 12.637939453125, 13.23193359375, 13.825927734375, 14.419921875, 15.013916015625, 15.60791015625, 16.201904296875, 16.7958984375, 17.389892578125, 17.98388671875, 18.577880859375, 19.171875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 8.0, 12.0, 17.0, 23.0, 29.0, 49.0, 56.0, 76.0, 93.0, 114.0, 99.0, 105.0, 87.0, 75.0, 51.0, 41.0, 19.0, 11.0, 17.0, 10.0, 8.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5, -9.2796630859375, -9.059326171875, -8.8389892578125, -8.61865234375, -8.3983154296875, -8.177978515625, -7.9576416015625, -7.7373046875, -7.5169677734375, -7.296630859375, -7.0762939453125, -6.85595703125, -6.6356201171875, -6.415283203125, -6.1949462890625, -5.974609375, -5.7542724609375, -5.533935546875, -5.3135986328125, -5.09326171875, -4.8729248046875, -4.652587890625, -4.4322509765625, -4.2119140625, -3.9915771484375, -3.771240234375, -3.5509033203125, -3.33056640625, -3.1102294921875, -2.889892578125, -2.6695556640625, -2.44921875, -2.2288818359375, -2.008544921875, -1.7882080078125, -1.56787109375, -1.3475341796875, -1.127197265625, -0.9068603515625, -0.6865234375, -0.4661865234375, -0.245849609375, -0.0255126953125, 0.19482421875, 0.4151611328125, 0.635498046875, 0.8558349609375, 1.076171875, 1.2965087890625, 1.516845703125, 1.7371826171875, 1.95751953125, 2.1778564453125, 2.398193359375, 2.6185302734375, 2.8388671875, 3.0592041015625, 3.279541015625, 3.4998779296875, 3.72021484375, 3.9405517578125, 4.160888671875, 4.3812255859375, 4.6015625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 7.0, 7.0, 17.0, 12.0, 15.0, 33.0, 35.0, 39.0, 76.0, 103.0, 158.0, 291.0, 581.0, 1592.0, 8202.0, 629897.0, 397729.0, 7004.0, 1447.0, 565.0, 257.0, 150.0, 90.0, 62.0, 43.0, 21.0, 26.0, 16.0, 11.0, 15.0, 6.0, 9.0, 10.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-39.4375, -38.37060546875, -37.3037109375, -36.23681640625, -35.169921875, -34.10302734375, -33.0361328125, -31.96923828125, -30.90234375, -29.83544921875, -28.7685546875, -27.70166015625, -26.634765625, -25.56787109375, -24.5009765625, -23.43408203125, -22.3671875, -21.30029296875, -20.2333984375, -19.16650390625, -18.099609375, -17.03271484375, -15.9658203125, -14.89892578125, -13.83203125, -12.76513671875, -11.6982421875, -10.63134765625, -9.564453125, -8.49755859375, -7.4306640625, -6.36376953125, -5.296875, -4.22998046875, -3.1630859375, -2.09619140625, -1.029296875, 0.03759765625, 1.1044921875, 2.17138671875, 3.23828125, 4.30517578125, 5.3720703125, 6.43896484375, 7.505859375, 8.57275390625, 9.6396484375, 10.70654296875, 11.7734375, 12.84033203125, 13.9072265625, 14.97412109375, 16.041015625, 17.10791015625, 18.1748046875, 19.24169921875, 20.30859375, 21.37548828125, 22.4423828125, 23.50927734375, 24.576171875, 25.64306640625, 26.7099609375, 27.77685546875, 28.84375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 12.0, 15.0, 17.0, 33.0, 36.0, 50.0, 87.0, 113.0, 109.0, 112.0, 100.0, 84.0, 69.0, 40.0, 32.0, 23.0, 13.0, 10.0, 4.0, 5.0, 4.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-49.53125, -48.351806640625, -47.17236328125, -45.992919921875, -44.8134765625, -43.634033203125, -42.45458984375, -41.275146484375, -40.095703125, -38.916259765625, -37.73681640625, -36.557373046875, -35.3779296875, -34.198486328125, -33.01904296875, -31.839599609375, -30.66015625, -29.480712890625, -28.30126953125, -27.121826171875, -25.9423828125, -24.762939453125, -23.58349609375, -22.404052734375, -21.224609375, -20.045166015625, -18.86572265625, -17.686279296875, -16.5068359375, -15.327392578125, -14.14794921875, -12.968505859375, -11.7890625, -10.609619140625, -9.43017578125, -8.250732421875, -7.0712890625, -5.891845703125, -4.71240234375, -3.532958984375, -2.353515625, -1.174072265625, 0.00537109375, 1.184814453125, 2.3642578125, 3.543701171875, 4.72314453125, 5.902587890625, 7.08203125, 8.261474609375, 9.44091796875, 10.620361328125, 11.7998046875, 12.979248046875, 14.15869140625, 15.338134765625, 16.517578125, 17.697021484375, 18.87646484375, 20.055908203125, 21.2353515625, 22.414794921875, 23.59423828125, 24.773681640625, 25.953125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 10.0, 5.0, 7.0, 17.0, 15.0, 22.0, 27.0, 41.0, 78.0, 142.0, 282.0, 788.0, 3655.0, 77201.0, 943747.0, 19538.0, 1900.0, 554.0, 211.0, 116.0, 77.0, 36.0, 22.0, 17.0, 11.0, 6.0, 5.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3515625, -14.9169921875, -14.482421875, -14.0478515625, -13.61328125, -13.1787109375, -12.744140625, -12.3095703125, -11.875, -11.4404296875, -11.005859375, -10.5712890625, -10.13671875, -9.7021484375, -9.267578125, -8.8330078125, -8.3984375, -7.9638671875, -7.529296875, -7.0947265625, -6.66015625, -6.2255859375, -5.791015625, -5.3564453125, -4.921875, -4.4873046875, -4.052734375, -3.6181640625, -3.18359375, -2.7490234375, -2.314453125, -1.8798828125, -1.4453125, -1.0107421875, -0.576171875, -0.1416015625, 0.29296875, 0.7275390625, 1.162109375, 1.5966796875, 2.03125, 2.4658203125, 2.900390625, 3.3349609375, 3.76953125, 4.2041015625, 4.638671875, 5.0732421875, 5.5078125, 5.9423828125, 6.376953125, 6.8115234375, 7.24609375, 7.6806640625, 8.115234375, 8.5498046875, 8.984375, 9.4189453125, 9.853515625, 10.2880859375, 10.72265625, 11.1572265625, 11.591796875, 12.0263671875, 12.4609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 6.0, 2.0, 5.0, 6.0, 5.0, 17.0, 18.0, 20.0, 38.0, 52.0, 56.0, 124.0, 256.0, 140.0, 78.0, 45.0, 57.0, 31.0, 15.0, 12.0, 6.0, 3.0, 4.0, 9.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00157928466796875, -0.0015307962894439697, -0.0014823079109191895, -0.0014338195323944092, -0.001385331153869629, -0.0013368427753448486, -0.0012883543968200684, -0.001239866018295288, -0.0011913776397705078, -0.0011428892612457275, -0.0010944008827209473, -0.001045912504196167, -0.0009974241256713867, -0.0009489357471466064, -0.0009004473686218262, -0.0008519589900970459, -0.0008034706115722656, -0.0007549822330474854, -0.0007064938545227051, -0.0006580054759979248, -0.0006095170974731445, -0.0005610287189483643, -0.000512540340423584, -0.0004640519618988037, -0.00041556358337402344, -0.00036707520484924316, -0.0003185868263244629, -0.0002700984477996826, -0.00022161006927490234, -0.00017312169075012207, -0.0001246333122253418, -7.614493370056152e-05, -2.765655517578125e-05, 2.0831823348999023e-05, 6.93202018737793e-05, 0.00011780858039855957, 0.00016629695892333984, 0.00021478533744812012, 0.0002632737159729004, 0.00031176209449768066, 0.00036025047302246094, 0.0004087388515472412, 0.0004572272300720215, 0.0005057156085968018, 0.000554203987121582, 0.0006026923656463623, 0.0006511807441711426, 0.0006996691226959229, 0.0007481575012207031, 0.0007966458797454834, 0.0008451342582702637, 0.0008936226367950439, 0.0009421110153198242, 0.0009905993938446045, 0.0010390877723693848, 0.001087576150894165, 0.0011360645294189453, 0.0011845529079437256, 0.0012330412864685059, 0.0012815296649932861, 0.0013300180435180664, 0.0013785064220428467, 0.001426994800567627, 0.0014754831790924072, 0.0015239715576171875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 4.0, 2.0, 4.0, 4.0, 5.0, 8.0, 4.0, 11.0, 10.0, 13.0, 16.0, 17.0, 40.0, 38.0, 71.0, 124.0, 178.0, 368.0, 692.0, 2000.0, 7472.0, 116319.0, 885324.0, 29414.0, 4016.0, 1219.0, 506.0, 234.0, 147.0, 91.0, 55.0, 38.0, 30.0, 17.0, 18.0, 10.0, 3.0, 8.0, 6.0, 2.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.328125, -10.0084228515625, -9.688720703125, -9.3690185546875, -9.04931640625, -8.7296142578125, -8.409912109375, -8.0902099609375, -7.7705078125, -7.4508056640625, -7.131103515625, -6.8114013671875, -6.49169921875, -6.1719970703125, -5.852294921875, -5.5325927734375, -5.212890625, -4.8931884765625, -4.573486328125, -4.2537841796875, -3.93408203125, -3.6143798828125, -3.294677734375, -2.9749755859375, -2.6552734375, -2.3355712890625, -2.015869140625, -1.6961669921875, -1.37646484375, -1.0567626953125, -0.737060546875, -0.4173583984375, -0.09765625, 0.2220458984375, 0.541748046875, 0.8614501953125, 1.18115234375, 1.5008544921875, 1.820556640625, 2.1402587890625, 2.4599609375, 2.7796630859375, 3.099365234375, 3.4190673828125, 3.73876953125, 4.0584716796875, 4.378173828125, 4.6978759765625, 5.017578125, 5.3372802734375, 5.656982421875, 5.9766845703125, 6.29638671875, 6.6160888671875, 6.935791015625, 7.2554931640625, 7.5751953125, 7.8948974609375, 8.214599609375, 8.5343017578125, 8.85400390625, 9.1737060546875, 9.493408203125, 9.8131103515625, 10.1328125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 2.0, 5.0, 8.0, 14.0, 25.0, 51.0, 70.0, 113.0, 191.0, 169.0, 119.0, 96.0, 37.0, 22.0, 18.0, 12.0, 5.0, 5.0, 9.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.3828125, -9.0814208984375, -8.780029296875, -8.4786376953125, -8.17724609375, -7.8758544921875, -7.574462890625, -7.2730712890625, -6.9716796875, -6.6702880859375, -6.368896484375, -6.0675048828125, -5.76611328125, -5.4647216796875, -5.163330078125, -4.8619384765625, -4.560546875, -4.2591552734375, -3.957763671875, -3.6563720703125, -3.35498046875, -3.0535888671875, -2.752197265625, -2.4508056640625, -2.1494140625, -1.8480224609375, -1.546630859375, -1.2452392578125, -0.94384765625, -0.6424560546875, -0.341064453125, -0.0396728515625, 0.26171875, 0.5631103515625, 0.864501953125, 1.1658935546875, 1.46728515625, 1.7686767578125, 2.070068359375, 2.3714599609375, 2.6728515625, 2.9742431640625, 3.275634765625, 3.5770263671875, 3.87841796875, 4.1798095703125, 4.481201171875, 4.7825927734375, 5.083984375, 5.3853759765625, 5.686767578125, 5.9881591796875, 6.28955078125, 6.5909423828125, 6.892333984375, 7.1937255859375, 7.4951171875, 7.7965087890625, 8.097900390625, 8.3992919921875, 8.70068359375, 9.0020751953125, 9.303466796875, 9.6048583984375, 9.90625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 26.0, 231.0, 587.0, 134.0, 11.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-346.9697570800781, -334.776611328125, -322.58343505859375, -310.3902893066406, -298.1971435546875, -286.00396728515625, -273.8108215332031, -261.61767578125, -249.42449951171875, -237.23133850097656, -225.03817749023438, -212.84503173828125, -200.65187072753906, -188.45870971679688, -176.26556396484375, -164.07240295410156, -151.87924194335938, -139.6860809326172, -127.49292755126953, -115.29977416992188, -103.10661315917969, -90.9134521484375, -78.72029876708984, -66.52714538574219, -54.333984375, -42.14082717895508, -29.947669982910156, -17.754512786865234, -5.5613555908203125, 6.631801605224609, 18.82495880126953, 31.018112182617188, 43.21124267578125, 55.40439987182617, 67.5975570678711, 79.79071044921875, 91.98387145996094, 104.17703247070312, 116.37018585205078, 128.56333923339844, 140.75650024414062, 152.9496612548828, 165.142822265625, 177.33596801757812, 189.5291290283203, 201.7222900390625, 213.91543579101562, 226.1085968017578, 238.3017578125, 250.4949188232422, 262.6880798339844, 274.8812255859375, 287.07440185546875, 299.2675476074219, 311.460693359375, 323.65386962890625, 335.8470153808594, 348.0401611328125, 360.23333740234375, 372.4264831542969, 384.61962890625, 396.81280517578125, 409.0059509277344, 421.1990966796875, 433.39227294921875]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 6.0, 8.0, 12.0, 17.0, 17.0, 24.0, 30.0, 28.0, 32.0, 43.0, 41.0, 54.0, 60.0, 61.0, 74.0, 51.0, 56.0, 55.0, 53.0, 36.0, 45.0, 37.0, 34.0, 29.0, 26.0, 8.0, 11.0, 14.0, 13.0, 3.0, 9.0, 5.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.23089599609375, -66.13198852539062, -63.0330810546875, -59.93417739868164, -56.835269927978516, -53.73636245727539, -50.63745880126953, -47.538551330566406, -44.43964385986328, -41.340736389160156, -38.24182891845703, -35.14292526245117, -32.04401779174805, -28.945110321044922, -25.84620475769043, -22.747299194335938, -19.648391723632812, -16.549484252929688, -13.450578689575195, -10.351672172546387, -7.252765655517578, -4.1538591384887695, -1.054952621459961, 2.0439529418945312, 5.142860412597656, 8.241766929626465, 11.340673446655273, 14.439579963684082, 17.53848648071289, 20.637393951416016, 23.736299514770508, 26.835205078125, 29.934112548828125, 33.03302001953125, 36.131927490234375, 39.230831146240234, 42.32973861694336, 45.428646087646484, 48.527549743652344, 51.62645721435547, 54.725364685058594, 57.82427215576172, 60.923179626464844, 64.02208709716797, 67.12098693847656, 70.21989440917969, 73.31880187988281, 76.41770935058594, 79.51661682128906, 82.61552429199219, 85.71443176269531, 88.81333923339844, 91.91224670410156, 95.01114654541016, 98.11005401611328, 101.2089614868164, 104.30786895751953, 107.40677642822266, 110.50568389892578, 113.6045913696289, 116.7034912109375, 119.80239868164062, 122.90130615234375, 126.00021362304688, 129.09912109375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 3.0, 6.0, 4.0, 5.0, 7.0, 10.0, 15.0, 22.0, 30.0, 46.0, 59.0, 125.0, 160.0, 274.0, 512.0, 996.0, 2134.0, 5546.0, 17105.0, 74692.0, 751229.0, 3031883.0, 252938.0, 39339.0, 10443.0, 3581.0, 1487.0, 748.0, 343.0, 191.0, 131.0, 69.0, 45.0, 31.0, 25.0, 11.0, 15.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.91015625, -4.70806884765625, -4.5059814453125, -4.30389404296875, -4.101806640625, -3.89971923828125, -3.6976318359375, -3.49554443359375, -3.29345703125, -3.09136962890625, -2.8892822265625, -2.68719482421875, -2.485107421875, -2.28302001953125, -2.0809326171875, -1.87884521484375, -1.6767578125, -1.47467041015625, -1.2725830078125, -1.07049560546875, -0.868408203125, -0.66632080078125, -0.4642333984375, -0.26214599609375, -0.06005859375, 0.14202880859375, 0.3441162109375, 0.54620361328125, 0.748291015625, 0.95037841796875, 1.1524658203125, 1.35455322265625, 1.556640625, 1.75872802734375, 1.9608154296875, 2.16290283203125, 2.364990234375, 2.56707763671875, 2.7691650390625, 2.97125244140625, 3.17333984375, 3.37542724609375, 3.5775146484375, 3.77960205078125, 3.981689453125, 4.18377685546875, 4.3858642578125, 4.58795166015625, 4.7900390625, 4.99212646484375, 5.1942138671875, 5.39630126953125, 5.598388671875, 5.80047607421875, 6.0025634765625, 6.20465087890625, 6.40673828125, 6.60882568359375, 6.8109130859375, 7.01300048828125, 7.215087890625, 7.41717529296875, 7.6192626953125, 7.82135009765625, 8.0234375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 11.0, 12.0, 11.0, 17.0, 23.0, 25.0, 51.0, 51.0, 66.0, 79.0, 98.0, 83.0, 85.0, 73.0, 66.0, 68.0, 45.0, 42.0, 24.0, 7.0, 17.0, 13.0, 10.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.73828125, -5.572021484375, -5.40576171875, -5.239501953125, -5.0732421875, -4.906982421875, -4.74072265625, -4.574462890625, -4.408203125, -4.241943359375, -4.07568359375, -3.909423828125, -3.7431640625, -3.576904296875, -3.41064453125, -3.244384765625, -3.078125, -2.911865234375, -2.74560546875, -2.579345703125, -2.4130859375, -2.246826171875, -2.08056640625, -1.914306640625, -1.748046875, -1.581787109375, -1.41552734375, -1.249267578125, -1.0830078125, -0.916748046875, -0.75048828125, -0.584228515625, -0.41796875, -0.251708984375, -0.08544921875, 0.080810546875, 0.2470703125, 0.413330078125, 0.57958984375, 0.745849609375, 0.912109375, 1.078369140625, 1.24462890625, 1.410888671875, 1.5771484375, 1.743408203125, 1.90966796875, 2.075927734375, 2.2421875, 2.408447265625, 2.57470703125, 2.740966796875, 2.9072265625, 3.073486328125, 3.23974609375, 3.406005859375, 3.572265625, 3.738525390625, 3.90478515625, 4.071044921875, 4.2373046875, 4.403564453125, 4.56982421875, 4.736083984375, 4.90234375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 5.0, 6.0, 7.0, 8.0, 17.0, 20.0, 24.0, 33.0, 84.0, 122.0, 261.0, 612.0, 1352.0, 4038.0, 15966.0, 100293.0, 2609312.0, 1374109.0, 70050.0, 12447.0, 3331.0, 1149.0, 492.0, 223.0, 99.0, 63.0, 41.0, 26.0, 16.0, 17.0, 17.0, 10.0, 7.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-8.7109375, -8.4462890625, -8.181640625, -7.9169921875, -7.65234375, -7.3876953125, -7.123046875, -6.8583984375, -6.59375, -6.3291015625, -6.064453125, -5.7998046875, -5.53515625, -5.2705078125, -5.005859375, -4.7412109375, -4.4765625, -4.2119140625, -3.947265625, -3.6826171875, -3.41796875, -3.1533203125, -2.888671875, -2.6240234375, -2.359375, -2.0947265625, -1.830078125, -1.5654296875, -1.30078125, -1.0361328125, -0.771484375, -0.5068359375, -0.2421875, 0.0224609375, 0.287109375, 0.5517578125, 0.81640625, 1.0810546875, 1.345703125, 1.6103515625, 1.875, 2.1396484375, 2.404296875, 2.6689453125, 2.93359375, 3.1982421875, 3.462890625, 3.7275390625, 3.9921875, 4.2568359375, 4.521484375, 4.7861328125, 5.05078125, 5.3154296875, 5.580078125, 5.8447265625, 6.109375, 6.3740234375, 6.638671875, 6.9033203125, 7.16796875, 7.4326171875, 7.697265625, 7.9619140625, 8.2265625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 7.0, 12.0, 16.0, 19.0, 34.0, 37.0, 72.0, 127.0, 272.0, 578.0, 1085.0, 951.0, 421.0, 172.0, 87.0, 48.0, 46.0, 17.0, 25.0, 12.0, 7.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.34375, -10.028564453125, -9.71337890625, -9.398193359375, -9.0830078125, -8.767822265625, -8.45263671875, -8.137451171875, -7.822265625, -7.507080078125, -7.19189453125, -6.876708984375, -6.5615234375, -6.246337890625, -5.93115234375, -5.615966796875, -5.30078125, -4.985595703125, -4.67041015625, -4.355224609375, -4.0400390625, -3.724853515625, -3.40966796875, -3.094482421875, -2.779296875, -2.464111328125, -2.14892578125, -1.833740234375, -1.5185546875, -1.203369140625, -0.88818359375, -0.572998046875, -0.2578125, 0.057373046875, 0.37255859375, 0.687744140625, 1.0029296875, 1.318115234375, 1.63330078125, 1.948486328125, 2.263671875, 2.578857421875, 2.89404296875, 3.209228515625, 3.5244140625, 3.839599609375, 4.15478515625, 4.469970703125, 4.78515625, 5.100341796875, 5.41552734375, 5.730712890625, 6.0458984375, 6.361083984375, 6.67626953125, 6.991455078125, 7.306640625, 7.621826171875, 7.93701171875, 8.252197265625, 8.5673828125, 8.882568359375, 9.19775390625, 9.512939453125, 9.828125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 12.0, 7.0, 22.0, 47.0, 139.0, 229.0, 277.0, 155.0, 67.0, 20.0, 8.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.82951354980469, -100.50437927246094, -97.17925262451172, -93.85411834716797, -90.52899169921875, -87.203857421875, -83.87872314453125, -80.55359649658203, -77.22846984863281, -73.90333557128906, -70.57820892333984, -67.2530746459961, -63.927947998046875, -60.602813720703125, -57.27768325805664, -53.952552795410156, -50.627418518066406, -47.30228805541992, -43.97715759277344, -40.65202331542969, -37.32689666748047, -34.00176239013672, -30.676631927490234, -27.35150146484375, -24.026371002197266, -20.70124053955078, -17.376110076904297, -14.05097770690918, -10.725847244262695, -7.400716781616211, -4.075584411621094, -0.7504539489746094, 2.574676513671875, 5.899807453155518, 9.22493839263916, 12.550069808959961, 15.875200271606445, 19.20033073425293, 22.525463104248047, 25.85059356689453, 29.175724029541016, 32.5008544921875, 35.825984954833984, 39.15111541748047, 42.47624969482422, 45.80137634277344, 49.12651062011719, 52.45164108276367, 55.776771545410156, 59.10190200805664, 62.427032470703125, 65.75216674804688, 69.0772933959961, 72.40242767333984, 75.72755432128906, 79.05268859863281, 82.37782287597656, 85.70295715332031, 89.02808380126953, 92.35321807861328, 95.6783447265625, 99.00347900390625, 102.32861328125, 105.65373992919922, 108.97886657714844]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 10.0, 11.0, 8.0, 6.0, 17.0, 27.0, 22.0, 33.0, 23.0, 38.0, 48.0, 30.0, 47.0, 43.0, 64.0, 55.0, 61.0, 59.0, 59.0, 48.0, 36.0, 40.0, 41.0, 29.0, 21.0, 34.0, 20.0, 21.0, 14.0, 6.0, 14.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.083892822265625, -34.80084991455078, -33.51780700683594, -32.234764099121094, -30.95172119140625, -29.668678283691406, -28.385637283325195, -27.10259437561035, -25.819551467895508, -24.536508560180664, -23.25346565246582, -21.970422744750977, -20.687381744384766, -19.404338836669922, -18.121295928955078, -16.838253021240234, -15.55521011352539, -14.272167205810547, -12.989124298095703, -11.706082344055176, -10.423039436340332, -9.139996528625488, -7.856954097747803, -6.573911666870117, -5.290868759155273, -4.00782585144043, -2.724783420562744, -1.4417407512664795, -0.15869808197021484, 1.124344825744629, 2.4073872566223145, 3.6904296875, 4.973472595214844, 6.2565155029296875, 7.539557933807373, 8.822600364685059, 10.105643272399902, 11.388686180114746, 12.671728134155273, 13.954771041870117, 15.237813949584961, 16.520856857299805, 17.80389976501465, 19.086942672729492, 20.369983673095703, 21.653026580810547, 22.93606948852539, 24.219112396240234, 25.502155303955078, 26.785198211669922, 28.068241119384766, 29.35128402709961, 30.634326934814453, 31.917369842529297, 33.20041275024414, 34.48345184326172, 35.76649475097656, 37.049537658691406, 38.33258056640625, 39.615623474121094, 40.89866638183594, 42.18170928955078, 43.464752197265625, 44.74779510498047, 46.03083801269531]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 3.0, 6.0, 9.0, 9.0, 10.0, 16.0, 13.0, 23.0, 32.0, 83.0, 135.0, 262.0, 634.0, 1575.0, 5689.0, 28511.0, 297513.0, 647924.0, 53558.0, 8692.0, 2284.0, 816.0, 340.0, 148.0, 117.0, 50.0, 27.0, 17.0, 21.0, 8.0, 8.0, 6.0, 4.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6640625, -14.193359375, -13.72265625, -13.251953125, -12.78125, -12.310546875, -11.83984375, -11.369140625, -10.8984375, -10.427734375, -9.95703125, -9.486328125, -9.015625, -8.544921875, -8.07421875, -7.603515625, -7.1328125, -6.662109375, -6.19140625, -5.720703125, -5.25, -4.779296875, -4.30859375, -3.837890625, -3.3671875, -2.896484375, -2.42578125, -1.955078125, -1.484375, -1.013671875, -0.54296875, -0.072265625, 0.3984375, 0.869140625, 1.33984375, 1.810546875, 2.28125, 2.751953125, 3.22265625, 3.693359375, 4.1640625, 4.634765625, 5.10546875, 5.576171875, 6.046875, 6.517578125, 6.98828125, 7.458984375, 7.9296875, 8.400390625, 8.87109375, 9.341796875, 9.8125, 10.283203125, 10.75390625, 11.224609375, 11.6953125, 12.166015625, 12.63671875, 13.107421875, 13.578125, 14.048828125, 14.51953125, 14.990234375, 15.4609375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 10.0, 11.0, 13.0, 16.0, 18.0, 37.0, 43.0, 47.0, 46.0, 61.0, 97.0, 75.0, 83.0, 71.0, 79.0, 72.0, 59.0, 34.0, 28.0, 28.0, 18.0, 15.0, 6.0, 14.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.6690673828125, -4.513916015625, -4.3587646484375, -4.20361328125, -4.0484619140625, -3.893310546875, -3.7381591796875, -3.5830078125, -3.4278564453125, -3.272705078125, -3.1175537109375, -2.96240234375, -2.8072509765625, -2.652099609375, -2.4969482421875, -2.341796875, -2.1866455078125, -2.031494140625, -1.8763427734375, -1.72119140625, -1.5660400390625, -1.410888671875, -1.2557373046875, -1.1005859375, -0.9454345703125, -0.790283203125, -0.6351318359375, -0.47998046875, -0.3248291015625, -0.169677734375, -0.0145263671875, 0.140625, 0.2957763671875, 0.450927734375, 0.6060791015625, 0.76123046875, 0.9163818359375, 1.071533203125, 1.2266845703125, 1.3818359375, 1.5369873046875, 1.692138671875, 1.8472900390625, 2.00244140625, 2.1575927734375, 2.312744140625, 2.4678955078125, 2.623046875, 2.7781982421875, 2.933349609375, 3.0885009765625, 3.24365234375, 3.3988037109375, 3.553955078125, 3.7091064453125, 3.8642578125, 4.0194091796875, 4.174560546875, 4.3297119140625, 4.48486328125, 4.6400146484375, 4.795166015625, 4.9503173828125, 5.10546875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 0.0, 2.0, 3.0, 6.0, 6.0, 7.0, 6.0, 17.0, 19.0, 21.0, 29.0, 64.0, 56.0, 107.0, 163.0, 259.0, 517.0, 1320.0, 5300.0, 85175.0, 933790.0, 17228.0, 2554.0, 886.0, 416.0, 203.0, 120.0, 83.0, 55.0, 33.0, 29.0, 17.0, 20.0, 11.0, 8.0, 2.0, 4.0, 2.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.84375, -35.768798828125, -34.69384765625, -33.618896484375, -32.5439453125, -31.468994140625, -30.39404296875, -29.319091796875, -28.244140625, -27.169189453125, -26.09423828125, -25.019287109375, -23.9443359375, -22.869384765625, -21.79443359375, -20.719482421875, -19.64453125, -18.569580078125, -17.49462890625, -16.419677734375, -15.3447265625, -14.269775390625, -13.19482421875, -12.119873046875, -11.044921875, -9.969970703125, -8.89501953125, -7.820068359375, -6.7451171875, -5.670166015625, -4.59521484375, -3.520263671875, -2.4453125, -1.370361328125, -0.29541015625, 0.779541015625, 1.8544921875, 2.929443359375, 4.00439453125, 5.079345703125, 6.154296875, 7.229248046875, 8.30419921875, 9.379150390625, 10.4541015625, 11.529052734375, 12.60400390625, 13.678955078125, 14.75390625, 15.828857421875, 16.90380859375, 17.978759765625, 19.0537109375, 20.128662109375, 21.20361328125, 22.278564453125, 23.353515625, 24.428466796875, 25.50341796875, 26.578369140625, 27.6533203125, 28.728271484375, 29.80322265625, 30.878173828125, 31.953125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 10.0, 7.0, 13.0, 18.0, 21.0, 40.0, 63.0, 62.0, 89.0, 93.0, 102.0, 104.0, 78.0, 73.0, 60.0, 45.0, 32.0, 17.0, 15.0, 13.0, 5.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-37.53125, -36.48193359375, -35.4326171875, -34.38330078125, -33.333984375, -32.28466796875, -31.2353515625, -30.18603515625, -29.13671875, -28.08740234375, -27.0380859375, -25.98876953125, -24.939453125, -23.89013671875, -22.8408203125, -21.79150390625, -20.7421875, -19.69287109375, -18.6435546875, -17.59423828125, -16.544921875, -15.49560546875, -14.4462890625, -13.39697265625, -12.34765625, -11.29833984375, -10.2490234375, -9.19970703125, -8.150390625, -7.10107421875, -6.0517578125, -5.00244140625, -3.953125, -2.90380859375, -1.8544921875, -0.80517578125, 0.244140625, 1.29345703125, 2.3427734375, 3.39208984375, 4.44140625, 5.49072265625, 6.5400390625, 7.58935546875, 8.638671875, 9.68798828125, 10.7373046875, 11.78662109375, 12.8359375, 13.88525390625, 14.9345703125, 15.98388671875, 17.033203125, 18.08251953125, 19.1318359375, 20.18115234375, 21.23046875, 22.27978515625, 23.3291015625, 24.37841796875, 25.427734375, 26.47705078125, 27.5263671875, 28.57568359375, 29.625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 7.0, 6.0, 5.0, 18.0, 15.0, 17.0, 30.0, 35.0, 38.0, 57.0, 74.0, 104.0, 155.0, 347.0, 747.0, 1766.0, 8367.0, 106396.0, 892493.0, 31299.0, 4091.0, 1195.0, 486.0, 252.0, 166.0, 91.0, 59.0, 53.0, 44.0, 32.0, 17.0, 16.0, 12.0, 6.0, 13.0, 7.0, 6.0, 3.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-13.34375, -12.9656982421875, -12.587646484375, -12.2095947265625, -11.83154296875, -11.4534912109375, -11.075439453125, -10.6973876953125, -10.3193359375, -9.9412841796875, -9.563232421875, -9.1851806640625, -8.80712890625, -8.4290771484375, -8.051025390625, -7.6729736328125, -7.294921875, -6.9168701171875, -6.538818359375, -6.1607666015625, -5.78271484375, -5.4046630859375, -5.026611328125, -4.6485595703125, -4.2705078125, -3.8924560546875, -3.514404296875, -3.1363525390625, -2.75830078125, -2.3802490234375, -2.002197265625, -1.6241455078125, -1.24609375, -0.8680419921875, -0.489990234375, -0.1119384765625, 0.26611328125, 0.6441650390625, 1.022216796875, 1.4002685546875, 1.7783203125, 2.1563720703125, 2.534423828125, 2.9124755859375, 3.29052734375, 3.6685791015625, 4.046630859375, 4.4246826171875, 4.802734375, 5.1807861328125, 5.558837890625, 5.9368896484375, 6.31494140625, 6.6929931640625, 7.071044921875, 7.4490966796875, 7.8271484375, 8.2052001953125, 8.583251953125, 8.9613037109375, 9.33935546875, 9.7174072265625, 10.095458984375, 10.4735107421875, 10.8515625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 9.0, 6.0, 6.0, 12.0, 13.0, 15.0, 22.0, 29.0, 32.0, 53.0, 76.0, 166.0, 235.0, 125.0, 50.0, 31.0, 19.0, 22.0, 17.0, 15.0, 9.0, 9.0, 5.0, 9.0, 7.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00121307373046875, -0.0011630654335021973, -0.0011130571365356445, -0.0010630488395690918, -0.001013040542602539, -0.0009630322456359863, -0.0009130239486694336, -0.0008630156517028809, -0.0008130073547363281, -0.0007629990577697754, -0.0007129907608032227, -0.0006629824638366699, -0.0006129741668701172, -0.0005629658699035645, -0.0005129575729370117, -0.000462949275970459, -0.00041294097900390625, -0.0003629326820373535, -0.0003129243850708008, -0.00026291608810424805, -0.0002129077911376953, -0.00016289949417114258, -0.00011289119720458984, -6.288290023803711e-05, -1.2874603271484375e-05, 3.713369369506836e-05, 8.71419906616211e-05, 0.00013715028762817383, 0.00018715858459472656, 0.0002371668815612793, 0.00028717517852783203, 0.00033718347549438477, 0.0003871917724609375, 0.00043720006942749023, 0.00048720836639404297, 0.0005372166633605957, 0.0005872249603271484, 0.0006372332572937012, 0.0006872415542602539, 0.0007372498512268066, 0.0007872581481933594, 0.0008372664451599121, 0.0008872747421264648, 0.0009372830390930176, 0.0009872913360595703, 0.001037299633026123, 0.0010873079299926758, 0.0011373162269592285, 0.0011873245239257812, 0.001237332820892334, 0.0012873411178588867, 0.0013373494148254395, 0.0013873577117919922, 0.001437366008758545, 0.0014873743057250977, 0.0015373826026916504, 0.0015873908996582031, 0.0016373991966247559, 0.0016874074935913086, 0.0017374157905578613, 0.001787424087524414, 0.0018374323844909668, 0.0018874406814575195, 0.0019374489784240723, 0.001987457275390625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 9.0, 4.0, 3.0, 10.0, 10.0, 12.0, 14.0, 18.0, 26.0, 50.0, 62.0, 74.0, 110.0, 162.0, 280.0, 536.0, 1197.0, 3634.0, 17560.0, 589108.0, 413587.0, 16112.0, 3428.0, 1190.0, 533.0, 289.0, 164.0, 101.0, 76.0, 64.0, 23.0, 27.0, 22.0, 16.0, 11.0, 3.0, 5.0, 5.0, 9.0, 2.0, 5.0, 2.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.1640625, -10.77880859375, -10.3935546875, -10.00830078125, -9.623046875, -9.23779296875, -8.8525390625, -8.46728515625, -8.08203125, -7.69677734375, -7.3115234375, -6.92626953125, -6.541015625, -6.15576171875, -5.7705078125, -5.38525390625, -5.0, -4.61474609375, -4.2294921875, -3.84423828125, -3.458984375, -3.07373046875, -2.6884765625, -2.30322265625, -1.91796875, -1.53271484375, -1.1474609375, -0.76220703125, -0.376953125, 0.00830078125, 0.3935546875, 0.77880859375, 1.1640625, 1.54931640625, 1.9345703125, 2.31982421875, 2.705078125, 3.09033203125, 3.4755859375, 3.86083984375, 4.24609375, 4.63134765625, 5.0166015625, 5.40185546875, 5.787109375, 6.17236328125, 6.5576171875, 6.94287109375, 7.328125, 7.71337890625, 8.0986328125, 8.48388671875, 8.869140625, 9.25439453125, 9.6396484375, 10.02490234375, 10.41015625, 10.79541015625, 11.1806640625, 11.56591796875, 11.951171875, 12.33642578125, 12.7216796875, 13.10693359375, 13.4921875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 9.0, 6.0, 8.0, 12.0, 8.0, 20.0, 33.0, 81.0, 158.0, 258.0, 181.0, 90.0, 44.0, 21.0, 16.0, 11.0, 7.0, 4.0, 5.0, 3.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.5390625, -13.135009765625, -12.73095703125, -12.326904296875, -11.9228515625, -11.518798828125, -11.11474609375, -10.710693359375, -10.306640625, -9.902587890625, -9.49853515625, -9.094482421875, -8.6904296875, -8.286376953125, -7.88232421875, -7.478271484375, -7.07421875, -6.670166015625, -6.26611328125, -5.862060546875, -5.4580078125, -5.053955078125, -4.64990234375, -4.245849609375, -3.841796875, -3.437744140625, -3.03369140625, -2.629638671875, -2.2255859375, -1.821533203125, -1.41748046875, -1.013427734375, -0.609375, -0.205322265625, 0.19873046875, 0.602783203125, 1.0068359375, 1.410888671875, 1.81494140625, 2.218994140625, 2.623046875, 3.027099609375, 3.43115234375, 3.835205078125, 4.2392578125, 4.643310546875, 5.04736328125, 5.451416015625, 5.85546875, 6.259521484375, 6.66357421875, 7.067626953125, 7.4716796875, 7.875732421875, 8.27978515625, 8.683837890625, 9.087890625, 9.491943359375, 9.89599609375, 10.300048828125, 10.7041015625, 11.108154296875, 11.51220703125, 11.916259765625, 12.3203125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 18.0, 59.0, 218.0, 341.0, 245.0, 70.0, 17.0, 10.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.910888671875, -108.09619903564453, -102.28150939941406, -96.4668197631836, -90.65213012695312, -84.83744049072266, -79.02275085449219, -73.20806884765625, -67.39337158203125, -61.57868194580078, -55.76399230957031, -49.949302673339844, -44.134613037109375, -38.319923400878906, -32.5052375793457, -26.690547943115234, -20.87586212158203, -15.061172485351562, -9.24648380279541, -3.431795120239258, 2.382894515991211, 8.19758415222168, 14.012271881103516, 19.826961517333984, 25.641651153564453, 31.456340789794922, 37.27103042602539, 43.085716247558594, 48.90040588378906, 54.71509552001953, 60.52978515625, 66.34447479248047, 72.15916442871094, 77.9738540649414, 83.78854370117188, 89.60323333740234, 95.41792297363281, 101.23261260986328, 107.04730224609375, 112.86198425292969, 118.67668151855469, 124.49137115478516, 130.30606079101562, 136.12074279785156, 141.93544006347656, 147.7501220703125, 153.5648193359375, 159.37950134277344, 165.19418334960938, 171.0088653564453, 176.8235626220703, 182.63824462890625, 188.45294189453125, 194.2676239013672, 200.0823211669922, 205.89700317382812, 211.71170043945312, 217.52638244628906, 223.34107971191406, 229.15576171875, 234.970458984375, 240.78514099121094, 246.59983825683594, 252.41452026367188, 258.2292175292969]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 10.0, 10.0, 18.0, 20.0, 20.0, 25.0, 27.0, 37.0, 43.0, 54.0, 43.0, 58.0, 55.0, 74.0, 78.0, 63.0, 64.0, 49.0, 45.0, 31.0, 34.0, 30.0, 33.0, 21.0, 17.0, 10.0, 7.0, 10.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-104.42759704589844, -101.55113983154297, -98.6746826171875, -95.7982177734375, -92.92176055908203, -90.04530334472656, -87.16883850097656, -84.2923812866211, -81.41592407226562, -78.53946685791016, -75.66300964355469, -72.78654479980469, -69.91008758544922, -67.03363037109375, -64.15716552734375, -61.28070831298828, -58.40425109863281, -55.527793884277344, -52.65133285522461, -49.774871826171875, -46.898414611816406, -44.02195739746094, -41.1454963684082, -38.26903533935547, -35.392578125, -32.51612091064453, -29.639659881591797, -26.763200759887695, -23.886741638183594, -21.010282516479492, -18.13382339477539, -15.257364273071289, -12.380905151367188, -9.504446029663086, -6.627986907958984, -3.751527786254883, -0.8750686645507812, 2.0013904571533203, 4.877849578857422, 7.754308700561523, 10.630767822265625, 13.507226943969727, 16.383686065673828, 19.26014518737793, 22.13660430908203, 25.013063430786133, 27.889522552490234, 30.765981674194336, 33.64244079589844, 36.518898010253906, 39.39535903930664, 42.271820068359375, 45.148277282714844, 48.02473449707031, 50.90119552612305, 53.77765655517578, 56.65411376953125, 59.53057098388672, 62.40703201293945, 65.28349304199219, 68.15995025634766, 71.03640747070312, 73.91287231445312, 76.7893295288086, 79.66578674316406]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 9.0, 11.0, 25.0, 41.0, 100.0, 231.0, 890.0, 18928.0, 4160184.0, 12761.0, 748.0, 189.0, 84.0, 34.0, 15.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.90625, -21.88623046875, -20.8662109375, -19.84619140625, -18.826171875, -17.80615234375, -16.7861328125, -15.76611328125, -14.74609375, -13.72607421875, -12.7060546875, -11.68603515625, -10.666015625, -9.64599609375, -8.6259765625, -7.60595703125, -6.5859375, -5.56591796875, -4.5458984375, -3.52587890625, -2.505859375, -1.48583984375, -0.4658203125, 0.55419921875, 1.57421875, 2.59423828125, 3.6142578125, 4.63427734375, 5.654296875, 6.67431640625, 7.6943359375, 8.71435546875, 9.734375, 10.75439453125, 11.7744140625, 12.79443359375, 13.814453125, 14.83447265625, 15.8544921875, 16.87451171875, 17.89453125, 18.91455078125, 19.9345703125, 20.95458984375, 21.974609375, 22.99462890625, 24.0146484375, 25.03466796875, 26.0546875, 27.07470703125, 28.0947265625, 29.11474609375, 30.134765625, 31.15478515625, 32.1748046875, 33.19482421875, 34.21484375, 35.23486328125, 36.2548828125, 37.27490234375, 38.294921875, 39.31494140625, 40.3349609375, 41.35498046875, 42.375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 10.0, 12.0, 12.0, 25.0, 34.0, 36.0, 52.0, 67.0, 87.0, 97.0, 99.0, 97.0, 89.0, 59.0, 68.0, 52.0, 38.0, 23.0, 18.0, 7.0, 5.0, 2.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.12890625, -5.94635009765625, -5.7637939453125, -5.58123779296875, -5.398681640625, -5.21612548828125, -5.0335693359375, -4.85101318359375, -4.66845703125, -4.48590087890625, -4.3033447265625, -4.12078857421875, -3.938232421875, -3.75567626953125, -3.5731201171875, -3.39056396484375, -3.2080078125, -3.02545166015625, -2.8428955078125, -2.66033935546875, -2.477783203125, -2.29522705078125, -2.1126708984375, -1.93011474609375, -1.74755859375, -1.56500244140625, -1.3824462890625, -1.19989013671875, -1.017333984375, -0.83477783203125, -0.6522216796875, -0.46966552734375, -0.287109375, -0.10455322265625, 0.0780029296875, 0.26055908203125, 0.443115234375, 0.62567138671875, 0.8082275390625, 0.99078369140625, 1.17333984375, 1.35589599609375, 1.5384521484375, 1.72100830078125, 1.903564453125, 2.08612060546875, 2.2686767578125, 2.45123291015625, 2.6337890625, 2.81634521484375, 2.9989013671875, 3.18145751953125, 3.364013671875, 3.54656982421875, 3.7291259765625, 3.91168212890625, 4.09423828125, 4.27679443359375, 4.4593505859375, 4.64190673828125, 4.824462890625, 5.00701904296875, 5.1895751953125, 5.37213134765625, 5.5546875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 12.0, 16.0, 31.0, 74.0, 143.0, 354.0, 1033.0, 5460.0, 49331.0, 2531661.0, 1563082.0, 37028.0, 4554.0, 975.0, 314.0, 113.0, 58.0, 25.0, 10.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-15.078125, -14.71868896484375, -14.3592529296875, -13.99981689453125, -13.640380859375, -13.28094482421875, -12.9215087890625, -12.56207275390625, -12.20263671875, -11.84320068359375, -11.4837646484375, -11.12432861328125, -10.764892578125, -10.40545654296875, -10.0460205078125, -9.68658447265625, -9.3271484375, -8.96771240234375, -8.6082763671875, -8.24884033203125, -7.889404296875, -7.52996826171875, -7.1705322265625, -6.81109619140625, -6.45166015625, -6.09222412109375, -5.7327880859375, -5.37335205078125, -5.013916015625, -4.65447998046875, -4.2950439453125, -3.93560791015625, -3.576171875, -3.21673583984375, -2.8572998046875, -2.49786376953125, -2.138427734375, -1.77899169921875, -1.4195556640625, -1.06011962890625, -0.70068359375, -0.34124755859375, 0.0181884765625, 0.37762451171875, 0.737060546875, 1.09649658203125, 1.4559326171875, 1.81536865234375, 2.1748046875, 2.53424072265625, 2.8936767578125, 3.25311279296875, 3.612548828125, 3.97198486328125, 4.3314208984375, 4.69085693359375, 5.05029296875, 5.40972900390625, 5.7691650390625, 6.12860107421875, 6.488037109375, 6.84747314453125, 7.2069091796875, 7.56634521484375, 7.92578125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 6.0, 8.0, 18.0, 20.0, 30.0, 35.0, 103.0, 163.0, 363.0, 692.0, 1187.0, 751.0, 333.0, 160.0, 78.0, 50.0, 26.0, 14.0, 12.0, 7.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.0, -11.70391845703125, -11.4078369140625, -11.11175537109375, -10.815673828125, -10.51959228515625, -10.2235107421875, -9.92742919921875, -9.63134765625, -9.33526611328125, -9.0391845703125, -8.74310302734375, -8.447021484375, -8.15093994140625, -7.8548583984375, -7.55877685546875, -7.2626953125, -6.96661376953125, -6.6705322265625, -6.37445068359375, -6.078369140625, -5.78228759765625, -5.4862060546875, -5.19012451171875, -4.89404296875, -4.59796142578125, -4.3018798828125, -4.00579833984375, -3.709716796875, -3.41363525390625, -3.1175537109375, -2.82147216796875, -2.525390625, -2.22930908203125, -1.9332275390625, -1.63714599609375, -1.341064453125, -1.04498291015625, -0.7489013671875, -0.45281982421875, -0.15673828125, 0.13934326171875, 0.4354248046875, 0.73150634765625, 1.027587890625, 1.32366943359375, 1.6197509765625, 1.91583251953125, 2.2119140625, 2.50799560546875, 2.8040771484375, 3.10015869140625, 3.396240234375, 3.69232177734375, 3.9884033203125, 4.28448486328125, 4.58056640625, 4.87664794921875, 5.1727294921875, 5.46881103515625, 5.764892578125, 6.06097412109375, 6.3570556640625, 6.65313720703125, 6.94921875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 8.0, 7.0, 7.0, 12.0, 27.0, 99.0, 216.0, 309.0, 190.0, 78.0, 25.0, 12.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-139.43890380859375, -136.51602172851562, -133.5931396484375, -130.67025756835938, -127.74736785888672, -124.82447814941406, -121.90159606933594, -118.97871398925781, -116.05583190917969, -113.13294982910156, -110.2100601196289, -107.28717803955078, -104.36429595947266, -101.44140625, -98.51852416992188, -95.59564208984375, -92.6727523803711, -89.74987030029297, -86.82698059082031, -83.90409851074219, -80.98121643066406, -78.05833435058594, -75.13544464111328, -72.21256256103516, -69.2896728515625, -66.36679077148438, -63.443904876708984, -60.521018981933594, -57.59813690185547, -54.67525100708008, -51.75236511230469, -48.82948303222656, -45.906593322753906, -42.983707427978516, -40.06082534790039, -37.137939453125, -34.215057373046875, -31.292171478271484, -28.369285583496094, -25.446401596069336, -22.523517608642578, -19.60063362121582, -16.677749633789062, -13.754863739013672, -10.831979751586914, -7.909095764160156, -4.986209869384766, -2.063325881958008, 0.85955810546875, 3.782442569732666, 6.705327033996582, 9.628211975097656, 12.551095962524414, 15.473979949951172, 18.396865844726562, 21.31974983215332, 24.242633819580078, 27.165517807006836, 30.088401794433594, 33.011287689208984, 35.934173583984375, 38.8570556640625, 41.77994155883789, 44.70282745361328, 47.625709533691406]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 9.0, 7.0, 5.0, 14.0, 18.0, 33.0, 40.0, 51.0, 45.0, 48.0, 59.0, 72.0, 86.0, 83.0, 71.0, 64.0, 47.0, 51.0, 52.0, 31.0, 26.0, 22.0, 26.0, 13.0, 10.0, 6.0, 6.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.01493835449219, -32.71302032470703, -31.411102294921875, -30.10918426513672, -28.807266235351562, -27.505348205566406, -26.20343017578125, -24.901512145996094, -23.599594116210938, -22.29767608642578, -20.995758056640625, -19.69384002685547, -18.391921997070312, -17.090003967285156, -15.7880859375, -14.486167907714844, -13.184249877929688, -11.882331848144531, -10.580413818359375, -9.278495788574219, -7.9765777587890625, -6.674659729003906, -5.37274169921875, -4.070823669433594, -2.7689056396484375, -1.4669876098632812, -0.165069580078125, 1.1368484497070312, 2.4387664794921875, 3.7406845092773438, 5.0426025390625, 6.344520568847656, 7.6464385986328125, 8.948356628417969, 10.250274658203125, 11.552192687988281, 12.854110717773438, 14.156028747558594, 15.45794677734375, 16.759864807128906, 18.061782836914062, 19.36370086669922, 20.665618896484375, 21.96753692626953, 23.269454956054688, 24.571372985839844, 25.873291015625, 27.175209045410156, 28.477127075195312, 29.77904510498047, 31.080963134765625, 32.38288116455078, 33.68479919433594, 34.986717224121094, 36.28863525390625, 37.590553283691406, 38.89247131347656, 40.19438934326172, 41.496307373046875, 42.79822540283203, 44.10014343261719, 45.402061462402344, 46.7039794921875, 48.005897521972656, 49.30781555175781]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 4.0, 5.0, 7.0, 9.0, 12.0, 16.0, 34.0, 57.0, 118.0, 210.0, 523.0, 1331.0, 4889.0, 30876.0, 584154.0, 396304.0, 23688.0, 4202.0, 1233.0, 455.0, 194.0, 100.0, 56.0, 29.0, 14.0, 8.0, 12.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.28125, -15.7869873046875, -15.292724609375, -14.7984619140625, -14.30419921875, -13.8099365234375, -13.315673828125, -12.8214111328125, -12.3271484375, -11.8328857421875, -11.338623046875, -10.8443603515625, -10.35009765625, -9.8558349609375, -9.361572265625, -8.8673095703125, -8.373046875, -7.8787841796875, -7.384521484375, -6.8902587890625, -6.39599609375, -5.9017333984375, -5.407470703125, -4.9132080078125, -4.4189453125, -3.9246826171875, -3.430419921875, -2.9361572265625, -2.44189453125, -1.9476318359375, -1.453369140625, -0.9591064453125, -0.46484375, 0.0294189453125, 0.523681640625, 1.0179443359375, 1.51220703125, 2.0064697265625, 2.500732421875, 2.9949951171875, 3.4892578125, 3.9835205078125, 4.477783203125, 4.9720458984375, 5.46630859375, 5.9605712890625, 6.454833984375, 6.9490966796875, 7.443359375, 7.9376220703125, 8.431884765625, 8.9261474609375, 9.42041015625, 9.9146728515625, 10.408935546875, 10.9031982421875, 11.3974609375, 11.8917236328125, 12.385986328125, 12.8802490234375, 13.37451171875, 13.8687744140625, 14.363037109375, 14.8572998046875, 15.3515625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 10.0, 11.0, 13.0, 29.0, 21.0, 39.0, 49.0, 71.0, 77.0, 73.0, 91.0, 94.0, 73.0, 72.0, 50.0, 62.0, 38.0, 34.0, 29.0, 12.0, 16.0, 9.0, 4.0, 4.0, 7.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7578125, -4.59906005859375, -4.4403076171875, -4.28155517578125, -4.122802734375, -3.96405029296875, -3.8052978515625, -3.64654541015625, -3.48779296875, -3.32904052734375, -3.1702880859375, -3.01153564453125, -2.852783203125, -2.69403076171875, -2.5352783203125, -2.37652587890625, -2.2177734375, -2.05902099609375, -1.9002685546875, -1.74151611328125, -1.582763671875, -1.42401123046875, -1.2652587890625, -1.10650634765625, -0.94775390625, -0.78900146484375, -0.6302490234375, -0.47149658203125, -0.312744140625, -0.15399169921875, 0.0047607421875, 0.16351318359375, 0.322265625, 0.48101806640625, 0.6397705078125, 0.79852294921875, 0.957275390625, 1.11602783203125, 1.2747802734375, 1.43353271484375, 1.59228515625, 1.75103759765625, 1.9097900390625, 2.06854248046875, 2.227294921875, 2.38604736328125, 2.5447998046875, 2.70355224609375, 2.8623046875, 3.02105712890625, 3.1798095703125, 3.33856201171875, 3.497314453125, 3.65606689453125, 3.8148193359375, 3.97357177734375, 4.13232421875, 4.29107666015625, 4.4498291015625, 4.60858154296875, 4.767333984375, 4.92608642578125, 5.0848388671875, 5.24359130859375, 5.40234375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 10.0, 7.0, 21.0, 13.0, 18.0, 28.0, 26.0, 47.0, 82.0, 138.0, 233.0, 511.0, 1110.0, 3174.0, 16201.0, 294646.0, 700312.0, 25239.0, 4191.0, 1319.0, 509.0, 284.0, 157.0, 81.0, 62.0, 30.0, 28.0, 21.0, 16.0, 9.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.03125, -18.456298828125, -17.88134765625, -17.306396484375, -16.7314453125, -16.156494140625, -15.58154296875, -15.006591796875, -14.431640625, -13.856689453125, -13.28173828125, -12.706787109375, -12.1318359375, -11.556884765625, -10.98193359375, -10.406982421875, -9.83203125, -9.257080078125, -8.68212890625, -8.107177734375, -7.5322265625, -6.957275390625, -6.38232421875, -5.807373046875, -5.232421875, -4.657470703125, -4.08251953125, -3.507568359375, -2.9326171875, -2.357666015625, -1.78271484375, -1.207763671875, -0.6328125, -0.057861328125, 0.51708984375, 1.092041015625, 1.6669921875, 2.241943359375, 2.81689453125, 3.391845703125, 3.966796875, 4.541748046875, 5.11669921875, 5.691650390625, 6.2666015625, 6.841552734375, 7.41650390625, 7.991455078125, 8.56640625, 9.141357421875, 9.71630859375, 10.291259765625, 10.8662109375, 11.441162109375, 12.01611328125, 12.591064453125, 13.166015625, 13.740966796875, 14.31591796875, 14.890869140625, 15.4658203125, 16.040771484375, 16.61572265625, 17.190673828125, 17.765625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 4.0, 14.0, 10.0, 14.0, 22.0, 35.0, 32.0, 43.0, 47.0, 43.0, 81.0, 60.0, 59.0, 71.0, 57.0, 70.0, 65.0, 57.0, 40.0, 40.0, 34.0, 21.0, 23.0, 13.0, 10.0, 10.0, 7.0, 4.0, 4.0, 1.0, 5.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.359375, -20.790283203125, -20.22119140625, -19.652099609375, -19.0830078125, -18.513916015625, -17.94482421875, -17.375732421875, -16.806640625, -16.237548828125, -15.66845703125, -15.099365234375, -14.5302734375, -13.961181640625, -13.39208984375, -12.822998046875, -12.25390625, -11.684814453125, -11.11572265625, -10.546630859375, -9.9775390625, -9.408447265625, -8.83935546875, -8.270263671875, -7.701171875, -7.132080078125, -6.56298828125, -5.993896484375, -5.4248046875, -4.855712890625, -4.28662109375, -3.717529296875, -3.1484375, -2.579345703125, -2.01025390625, -1.441162109375, -0.8720703125, -0.302978515625, 0.26611328125, 0.835205078125, 1.404296875, 1.973388671875, 2.54248046875, 3.111572265625, 3.6806640625, 4.249755859375, 4.81884765625, 5.387939453125, 5.95703125, 6.526123046875, 7.09521484375, 7.664306640625, 8.2333984375, 8.802490234375, 9.37158203125, 9.940673828125, 10.509765625, 11.078857421875, 11.64794921875, 12.217041015625, 12.7861328125, 13.355224609375, 13.92431640625, 14.493408203125, 15.0625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 17.0, 18.0, 12.0, 40.0, 42.0, 74.0, 141.0, 248.0, 610.0, 1862.0, 10033.0, 460349.0, 561522.0, 10410.0, 1899.0, 642.0, 232.0, 127.0, 79.0, 48.0, 35.0, 20.0, 14.0, 18.0, 10.0, 4.0, 6.0, 3.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.78125, -13.3367919921875, -12.892333984375, -12.4478759765625, -12.00341796875, -11.5589599609375, -11.114501953125, -10.6700439453125, -10.2255859375, -9.7811279296875, -9.336669921875, -8.8922119140625, -8.44775390625, -8.0032958984375, -7.558837890625, -7.1143798828125, -6.669921875, -6.2254638671875, -5.781005859375, -5.3365478515625, -4.89208984375, -4.4476318359375, -4.003173828125, -3.5587158203125, -3.1142578125, -2.6697998046875, -2.225341796875, -1.7808837890625, -1.33642578125, -0.8919677734375, -0.447509765625, -0.0030517578125, 0.44140625, 0.8858642578125, 1.330322265625, 1.7747802734375, 2.21923828125, 2.6636962890625, 3.108154296875, 3.5526123046875, 3.9970703125, 4.4415283203125, 4.885986328125, 5.3304443359375, 5.77490234375, 6.2193603515625, 6.663818359375, 7.1082763671875, 7.552734375, 7.9971923828125, 8.441650390625, 8.8861083984375, 9.33056640625, 9.7750244140625, 10.219482421875, 10.6639404296875, 11.1083984375, 11.5528564453125, 11.997314453125, 12.4417724609375, 12.88623046875, 13.3306884765625, 13.775146484375, 14.2196044921875, 14.6640625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 6.0, 13.0, 14.0, 11.0, 22.0, 23.0, 39.0, 54.0, 114.0, 194.0, 171.0, 113.0, 62.0, 40.0, 28.0, 23.0, 13.0, 7.0, 11.0, 5.0, 4.0, 2.0, 5.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011310577392578125, -0.0010905861854553223, -0.001050114631652832, -0.0010096430778503418, -0.0009691715240478516, -0.0009286999702453613, -0.0008882284164428711, -0.0008477568626403809, -0.0008072853088378906, -0.0007668137550354004, -0.0007263422012329102, -0.0006858706474304199, -0.0006453990936279297, -0.0006049275398254395, -0.0005644559860229492, -0.000523984432220459, -0.00048351287841796875, -0.0004430413246154785, -0.0004025697708129883, -0.00036209821701049805, -0.0003216266632080078, -0.0002811551094055176, -0.00024068355560302734, -0.0002002120018005371, -0.00015974044799804688, -0.00011926889419555664, -7.87973403930664e-05, -3.832578659057617e-05, 2.1457672119140625e-06, 4.26173210144043e-05, 8.308887481689453e-05, 0.00012356042861938477, 0.000164031982421875, 0.00020450353622436523, 0.00024497509002685547, 0.0002854466438293457, 0.00032591819763183594, 0.00036638975143432617, 0.0004068613052368164, 0.00044733285903930664, 0.0004878044128417969, 0.0005282759666442871, 0.0005687475204467773, 0.0006092190742492676, 0.0006496906280517578, 0.000690162181854248, 0.0007306337356567383, 0.0007711052894592285, 0.0008115768432617188, 0.000852048397064209, 0.0008925199508666992, 0.0009329915046691895, 0.0009734630584716797, 0.00101393461227417, 0.0010544061660766602, 0.0010948777198791504, 0.0011353492736816406, 0.0011758208274841309, 0.001216292381286621, 0.0012567639350891113, 0.0012972354888916016, 0.0013377070426940918, 0.001378178596496582, 0.0014186501502990723, 0.0014591217041015625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 7.0, 4.0, 6.0, 5.0, 7.0, 15.0, 17.0, 42.0, 46.0, 84.0, 134.0, 216.0, 441.0, 899.0, 2211.0, 7017.0, 35204.0, 805774.0, 174838.0, 14821.0, 3890.0, 1404.0, 655.0, 310.0, 171.0, 101.0, 65.0, 38.0, 34.0, 28.0, 22.0, 16.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.734375, -8.4757080078125, -8.217041015625, -7.9583740234375, -7.69970703125, -7.4410400390625, -7.182373046875, -6.9237060546875, -6.6650390625, -6.4063720703125, -6.147705078125, -5.8890380859375, -5.63037109375, -5.3717041015625, -5.113037109375, -4.8543701171875, -4.595703125, -4.3370361328125, -4.078369140625, -3.8197021484375, -3.56103515625, -3.3023681640625, -3.043701171875, -2.7850341796875, -2.5263671875, -2.2677001953125, -2.009033203125, -1.7503662109375, -1.49169921875, -1.2330322265625, -0.974365234375, -0.7156982421875, -0.45703125, -0.1983642578125, 0.060302734375, 0.3189697265625, 0.57763671875, 0.8363037109375, 1.094970703125, 1.3536376953125, 1.6123046875, 1.8709716796875, 2.129638671875, 2.3883056640625, 2.64697265625, 2.9056396484375, 3.164306640625, 3.4229736328125, 3.681640625, 3.9403076171875, 4.198974609375, 4.4576416015625, 4.71630859375, 4.9749755859375, 5.233642578125, 5.4923095703125, 5.7509765625, 6.0096435546875, 6.268310546875, 6.5269775390625, 6.78564453125, 7.0443115234375, 7.302978515625, 7.5616455078125, 7.8203125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 8.0, 14.0, 22.0, 38.0, 65.0, 116.0, 169.0, 145.0, 160.0, 104.0, 53.0, 31.0, 17.0, 11.0, 6.0, 8.0, 7.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.1015625, -8.8709716796875, -8.640380859375, -8.4097900390625, -8.17919921875, -7.9486083984375, -7.718017578125, -7.4874267578125, -7.2568359375, -7.0262451171875, -6.795654296875, -6.5650634765625, -6.33447265625, -6.1038818359375, -5.873291015625, -5.6427001953125, -5.412109375, -5.1815185546875, -4.950927734375, -4.7203369140625, -4.48974609375, -4.2591552734375, -4.028564453125, -3.7979736328125, -3.5673828125, -3.3367919921875, -3.106201171875, -2.8756103515625, -2.64501953125, -2.4144287109375, -2.183837890625, -1.9532470703125, -1.72265625, -1.4920654296875, -1.261474609375, -1.0308837890625, -0.80029296875, -0.5697021484375, -0.339111328125, -0.1085205078125, 0.1220703125, 0.3526611328125, 0.583251953125, 0.8138427734375, 1.04443359375, 1.2750244140625, 1.505615234375, 1.7362060546875, 1.966796875, 2.1973876953125, 2.427978515625, 2.6585693359375, 2.88916015625, 3.1197509765625, 3.350341796875, 3.5809326171875, 3.8115234375, 4.0421142578125, 4.272705078125, 4.5032958984375, 4.73388671875, 4.9644775390625, 5.195068359375, 5.4256591796875, 5.65625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 12.0, 39.0, 185.0, 428.0, 245.0, 56.0, 19.0, 10.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-282.855712890625, -276.782470703125, -270.709228515625, -264.635986328125, -258.562744140625, -252.48948669433594, -246.41624450683594, -240.34300231933594, -234.26974487304688, -228.19650268554688, -222.12326049804688, -216.05001831054688, -209.9767608642578, -203.9035186767578, -197.8302764892578, -191.7570343017578, -185.6837921142578, -179.6105499267578, -173.5373077392578, -167.46405029296875, -161.39080810546875, -155.31756591796875, -149.24432373046875, -143.17108154296875, -137.09783935546875, -131.02459716796875, -124.95134735107422, -118.87810516357422, -112.80485534667969, -106.73161315917969, -100.65837097167969, -94.58512878417969, -88.51187133789062, -82.43862915039062, -76.3653793334961, -70.2921371459961, -64.21888732910156, -58.14564514160156, -52.07240295410156, -45.9991569519043, -39.92591094970703, -33.852664947509766, -27.779420852661133, -21.7061767578125, -15.632930755615234, -9.559684753417969, -3.4864425659179688, 2.586803436279297, 8.660049438476562, 14.733294486999512, 20.80653953552246, 26.879783630371094, 32.95302963256836, 39.026275634765625, 45.099517822265625, 51.17276382446289, 57.246009826660156, 63.31925582885742, 69.39250183105469, 75.46574401855469, 81.53898620605469, 87.61223602294922, 93.68547821044922, 99.75872802734375, 105.83197021484375]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 8.0, 8.0, 8.0, 19.0, 14.0, 18.0, 24.0, 25.0, 40.0, 35.0, 40.0, 46.0, 48.0, 58.0, 74.0, 65.0, 79.0, 59.0, 67.0, 29.0, 43.0, 33.0, 34.0, 32.0, 33.0, 16.0, 11.0, 13.0, 8.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.023216247558594, -43.96769332885742, -41.91217041015625, -39.85664749145508, -37.801124572753906, -35.745601654052734, -33.69007873535156, -31.63455581665039, -29.57903289794922, -27.523509979248047, -25.467987060546875, -23.412464141845703, -21.35694122314453, -19.30141830444336, -17.245895385742188, -15.190372467041016, -13.134849548339844, -11.079326629638672, -9.0238037109375, -6.968280792236328, -4.912757873535156, -2.8572349548339844, -0.8017120361328125, 1.2538108825683594, 3.3093338012695312, 5.364856719970703, 7.420379638671875, 9.475902557373047, 11.531425476074219, 13.58694839477539, 15.642471313476562, 17.697994232177734, 19.753517150878906, 21.809040069580078, 23.86456298828125, 25.920085906982422, 27.975608825683594, 30.031131744384766, 32.08665466308594, 34.14217758178711, 36.19770050048828, 38.25322341918945, 40.308746337890625, 42.3642692565918, 44.41979217529297, 46.47531509399414, 48.53083801269531, 50.586360931396484, 52.641883850097656, 54.69740676879883, 56.7529296875, 58.80845260620117, 60.863975524902344, 62.919498443603516, 64.97502136230469, 67.03054809570312, 69.08606719970703, 71.14158630371094, 73.19711303710938, 75.25263977050781, 77.30815887451172, 79.36367797851562, 81.41920471191406, 83.4747314453125, 85.5302505493164]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 3.0, 2.0, 2.0, 5.0, 9.0, 15.0, 13.0, 27.0, 34.0, 71.0, 85.0, 156.0, 286.0, 602.0, 1581.0, 5375.0, 30988.0, 632238.0, 3366146.0, 138799.0, 12747.0, 2919.0, 1091.0, 476.0, 245.0, 134.0, 70.0, 48.0, 38.0, 21.0, 18.0, 12.0, 10.0, 6.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.24609375, -6.95953369140625, -6.6729736328125, -6.38641357421875, -6.099853515625, -5.81329345703125, -5.5267333984375, -5.24017333984375, -4.95361328125, -4.66705322265625, -4.3804931640625, -4.09393310546875, -3.807373046875, -3.52081298828125, -3.2342529296875, -2.94769287109375, -2.6611328125, -2.37457275390625, -2.0880126953125, -1.80145263671875, -1.514892578125, -1.22833251953125, -0.9417724609375, -0.65521240234375, -0.36865234375, -0.08209228515625, 0.2044677734375, 0.49102783203125, 0.777587890625, 1.06414794921875, 1.3507080078125, 1.63726806640625, 1.923828125, 2.21038818359375, 2.4969482421875, 2.78350830078125, 3.070068359375, 3.35662841796875, 3.6431884765625, 3.92974853515625, 4.21630859375, 4.50286865234375, 4.7894287109375, 5.07598876953125, 5.362548828125, 5.64910888671875, 5.9356689453125, 6.22222900390625, 6.5087890625, 6.79534912109375, 7.0819091796875, 7.36846923828125, 7.655029296875, 7.94158935546875, 8.2281494140625, 8.51470947265625, 8.80126953125, 9.08782958984375, 9.3743896484375, 9.66094970703125, 9.947509765625, 10.23406982421875, 10.5206298828125, 10.80718994140625, 11.09375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 16.0, 23.0, 36.0, 55.0, 85.0, 119.0, 122.0, 138.0, 138.0, 95.0, 85.0, 44.0, 23.0, 12.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.04296875, -3.80731201171875, -3.5716552734375, -3.33599853515625, -3.100341796875, -2.86468505859375, -2.6290283203125, -2.39337158203125, -2.15771484375, -1.92205810546875, -1.6864013671875, -1.45074462890625, -1.215087890625, -0.97943115234375, -0.7437744140625, -0.50811767578125, -0.2724609375, -0.03680419921875, 0.1988525390625, 0.43450927734375, 0.670166015625, 0.90582275390625, 1.1414794921875, 1.37713623046875, 1.61279296875, 1.84844970703125, 2.0841064453125, 2.31976318359375, 2.555419921875, 2.79107666015625, 3.0267333984375, 3.26239013671875, 3.498046875, 3.73370361328125, 3.9693603515625, 4.20501708984375, 4.440673828125, 4.67633056640625, 4.9119873046875, 5.14764404296875, 5.38330078125, 5.61895751953125, 5.8546142578125, 6.09027099609375, 6.325927734375, 6.56158447265625, 6.7972412109375, 7.03289794921875, 7.2685546875, 7.50421142578125, 7.7398681640625, 7.97552490234375, 8.211181640625, 8.44683837890625, 8.6824951171875, 8.91815185546875, 9.15380859375, 9.38946533203125, 9.6251220703125, 9.86077880859375, 10.096435546875, 10.33209228515625, 10.5677490234375, 10.80340576171875, 11.0390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 9.0, 14.0, 25.0, 49.0, 80.0, 132.0, 295.0, 744.0, 2592.0, 12195.0, 89397.0, 1897391.0, 2083313.0, 91639.0, 12513.0, 2621.0, 750.0, 251.0, 116.0, 61.0, 41.0, 17.0, 8.0, 6.0, 8.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5703125, -8.2847900390625, -7.999267578125, -7.7137451171875, -7.42822265625, -7.1427001953125, -6.857177734375, -6.5716552734375, -6.2861328125, -6.0006103515625, -5.715087890625, -5.4295654296875, -5.14404296875, -4.8585205078125, -4.572998046875, -4.2874755859375, -4.001953125, -3.7164306640625, -3.430908203125, -3.1453857421875, -2.85986328125, -2.5743408203125, -2.288818359375, -2.0032958984375, -1.7177734375, -1.4322509765625, -1.146728515625, -0.8612060546875, -0.57568359375, -0.2901611328125, -0.004638671875, 0.2808837890625, 0.56640625, 0.8519287109375, 1.137451171875, 1.4229736328125, 1.70849609375, 1.9940185546875, 2.279541015625, 2.5650634765625, 2.8505859375, 3.1361083984375, 3.421630859375, 3.7071533203125, 3.99267578125, 4.2781982421875, 4.563720703125, 4.8492431640625, 5.134765625, 5.4202880859375, 5.705810546875, 5.9913330078125, 6.27685546875, 6.5623779296875, 6.847900390625, 7.1334228515625, 7.4189453125, 7.7044677734375, 7.989990234375, 8.2755126953125, 8.56103515625, 8.8465576171875, 9.132080078125, 9.4176025390625, 9.703125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 8.0, 3.0, 7.0, 3.0, 6.0, 15.0, 12.0, 25.0, 34.0, 45.0, 40.0, 52.0, 85.0, 127.0, 136.0, 235.0, 323.0, 483.0, 566.0, 551.0, 351.0, 274.0, 189.0, 120.0, 105.0, 64.0, 52.0, 42.0, 27.0, 20.0, 15.0, 12.0, 10.0, 8.0, 5.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62890625, -5.4337158203125, -5.238525390625, -5.0433349609375, -4.84814453125, -4.6529541015625, -4.457763671875, -4.2625732421875, -4.0673828125, -3.8721923828125, -3.677001953125, -3.4818115234375, -3.28662109375, -3.0914306640625, -2.896240234375, -2.7010498046875, -2.505859375, -2.3106689453125, -2.115478515625, -1.9202880859375, -1.72509765625, -1.5299072265625, -1.334716796875, -1.1395263671875, -0.9443359375, -0.7491455078125, -0.553955078125, -0.3587646484375, -0.16357421875, 0.0316162109375, 0.226806640625, 0.4219970703125, 0.6171875, 0.8123779296875, 1.007568359375, 1.2027587890625, 1.39794921875, 1.5931396484375, 1.788330078125, 1.9835205078125, 2.1787109375, 2.3739013671875, 2.569091796875, 2.7642822265625, 2.95947265625, 3.1546630859375, 3.349853515625, 3.5450439453125, 3.740234375, 3.9354248046875, 4.130615234375, 4.3258056640625, 4.52099609375, 4.7161865234375, 4.911376953125, 5.1065673828125, 5.3017578125, 5.4969482421875, 5.692138671875, 5.8873291015625, 6.08251953125, 6.2777099609375, 6.472900390625, 6.6680908203125, 6.86328125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 14.0, 31.0, 107.0, 307.0, 360.0, 141.0, 26.0, 8.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-223.38836669921875, -218.10484313964844, -212.82131958007812, -207.5377960205078, -202.2542724609375, -196.9707489013672, -191.68722534179688, -186.4036865234375, -181.12017822265625, -175.83665466308594, -170.55313110351562, -165.2696075439453, -159.986083984375, -154.7025604248047, -149.41903686523438, -144.135498046875, -138.8519744873047, -133.56845092773438, -128.28492736816406, -123.00140380859375, -117.71788024902344, -112.43435668945312, -107.15082550048828, -101.86730194091797, -96.58377838134766, -91.30025482177734, -86.01673126220703, -80.73320770263672, -75.44967651367188, -70.16615295410156, -64.88262939453125, -59.59910583496094, -54.315582275390625, -49.03205871582031, -43.74853515625, -38.46500778198242, -33.18148422241211, -27.897960662841797, -22.61443519592285, -17.330909729003906, -12.047386169433594, -6.763861656188965, -1.480337142944336, 3.803187370300293, 9.086711883544922, 14.370235443115234, 19.65376091003418, 24.937286376953125, 30.220809936523438, 35.50433349609375, 40.78785705566406, 46.07138442993164, 51.35490798950195, 56.638431549072266, 61.921958923339844, 67.20548248291016, 72.48900604248047, 77.77252960205078, 83.0560531616211, 88.3395767211914, 93.62310791015625, 98.90663146972656, 104.19015502929688, 109.47367858886719, 114.7572021484375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 9.0, 2.0, 11.0, 25.0, 25.0, 33.0, 52.0, 64.0, 67.0, 72.0, 98.0, 83.0, 99.0, 75.0, 72.0, 61.0, 43.0, 35.0, 25.0, 15.0, 15.0, 7.0, 6.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.11746215820312, -76.9078598022461, -74.69825744628906, -72.48866271972656, -70.27906036376953, -68.0694580078125, -65.85985565185547, -63.65025329589844, -61.44065475463867, -59.23105239868164, -57.021453857421875, -54.811851501464844, -52.60224914550781, -50.39265060424805, -48.183048248291016, -45.97344970703125, -43.76384735107422, -41.55424499511719, -39.34464645385742, -37.13504409790039, -34.925445556640625, -32.715843200683594, -30.506240844726562, -28.296640396118164, -26.087039947509766, -23.877439498901367, -21.66783905029297, -19.458236694335938, -17.24863624572754, -15.03903579711914, -12.829434394836426, -10.619832992553711, -8.410224914550781, -6.200623989105225, -3.991023063659668, -1.7814221382141113, 0.4281787872314453, 2.6377792358398438, 4.847380638122559, 7.056982040405273, 9.266582489013672, 11.47618293762207, 13.685784339904785, 15.8953857421875, 18.1049861907959, 20.314586639404297, 22.524188995361328, 24.733789443969727, 26.943389892578125, 29.152990341186523, 31.362590789794922, 33.57219314575195, 35.78179168701172, 37.99139404296875, 40.20099639892578, 42.41059875488281, 44.62019729614258, 46.82979965209961, 49.039398193359375, 51.249000549316406, 53.45860290527344, 55.6682014465332, 57.877803802490234, 60.08740234375, 62.29700469970703]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 10.0, 8.0, 13.0, 21.0, 14.0, 43.0, 62.0, 85.0, 117.0, 195.0, 349.0, 643.0, 1294.0, 3418.0, 11906.0, 59373.0, 401788.0, 477939.0, 70544.0, 13712.0, 3842.0, 1478.0, 653.0, 356.0, 225.0, 141.0, 98.0, 57.0, 42.0, 28.0, 15.0, 15.0, 17.0, 7.0, 8.0, 3.0, 3.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.09375, -10.7364501953125, -10.379150390625, -10.0218505859375, -9.66455078125, -9.3072509765625, -8.949951171875, -8.5926513671875, -8.2353515625, -7.8780517578125, -7.520751953125, -7.1634521484375, -6.80615234375, -6.4488525390625, -6.091552734375, -5.7342529296875, -5.376953125, -5.0196533203125, -4.662353515625, -4.3050537109375, -3.94775390625, -3.5904541015625, -3.233154296875, -2.8758544921875, -2.5185546875, -2.1612548828125, -1.803955078125, -1.4466552734375, -1.08935546875, -0.7320556640625, -0.374755859375, -0.0174560546875, 0.33984375, 0.6971435546875, 1.054443359375, 1.4117431640625, 1.76904296875, 2.1263427734375, 2.483642578125, 2.8409423828125, 3.1982421875, 3.5555419921875, 3.912841796875, 4.2701416015625, 4.62744140625, 4.9847412109375, 5.342041015625, 5.6993408203125, 6.056640625, 6.4139404296875, 6.771240234375, 7.1285400390625, 7.48583984375, 7.8431396484375, 8.200439453125, 8.5577392578125, 8.9150390625, 9.2723388671875, 9.629638671875, 9.9869384765625, 10.34423828125, 10.7015380859375, 11.058837890625, 11.4161376953125, 11.7734375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 10.0, 11.0, 12.0, 24.0, 26.0, 43.0, 52.0, 68.0, 87.0, 82.0, 78.0, 76.0, 76.0, 72.0, 77.0, 67.0, 49.0, 29.0, 24.0, 16.0, 6.0, 8.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9765625, -4.8260498046875, -4.675537109375, -4.5250244140625, -4.37451171875, -4.2239990234375, -4.073486328125, -3.9229736328125, -3.7724609375, -3.6219482421875, -3.471435546875, -3.3209228515625, -3.17041015625, -3.0198974609375, -2.869384765625, -2.7188720703125, -2.568359375, -2.4178466796875, -2.267333984375, -2.1168212890625, -1.96630859375, -1.8157958984375, -1.665283203125, -1.5147705078125, -1.3642578125, -1.2137451171875, -1.063232421875, -0.9127197265625, -0.76220703125, -0.6116943359375, -0.461181640625, -0.3106689453125, -0.16015625, -0.0096435546875, 0.140869140625, 0.2913818359375, 0.44189453125, 0.5924072265625, 0.742919921875, 0.8934326171875, 1.0439453125, 1.1944580078125, 1.344970703125, 1.4954833984375, 1.64599609375, 1.7965087890625, 1.947021484375, 2.0975341796875, 2.248046875, 2.3985595703125, 2.549072265625, 2.6995849609375, 2.85009765625, 3.0006103515625, 3.151123046875, 3.3016357421875, 3.4521484375, 3.6026611328125, 3.753173828125, 3.9036865234375, 4.05419921875, 4.2047119140625, 4.355224609375, 4.5057373046875, 4.65625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 9.0, 7.0, 16.0, 25.0, 28.0, 37.0, 57.0, 88.0, 130.0, 255.0, 471.0, 1068.0, 3112.0, 14182.0, 554025.0, 455791.0, 13902.0, 3036.0, 1121.0, 513.0, 249.0, 146.0, 91.0, 75.0, 39.0, 26.0, 9.0, 10.0, 5.0, 8.0, 5.0, 3.0, 2.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.296875, -28.43505859375, -27.5732421875, -26.71142578125, -25.849609375, -24.98779296875, -24.1259765625, -23.26416015625, -22.40234375, -21.54052734375, -20.6787109375, -19.81689453125, -18.955078125, -18.09326171875, -17.2314453125, -16.36962890625, -15.5078125, -14.64599609375, -13.7841796875, -12.92236328125, -12.060546875, -11.19873046875, -10.3369140625, -9.47509765625, -8.61328125, -7.75146484375, -6.8896484375, -6.02783203125, -5.166015625, -4.30419921875, -3.4423828125, -2.58056640625, -1.71875, -0.85693359375, 0.0048828125, 0.86669921875, 1.728515625, 2.59033203125, 3.4521484375, 4.31396484375, 5.17578125, 6.03759765625, 6.8994140625, 7.76123046875, 8.623046875, 9.48486328125, 10.3466796875, 11.20849609375, 12.0703125, 12.93212890625, 13.7939453125, 14.65576171875, 15.517578125, 16.37939453125, 17.2412109375, 18.10302734375, 18.96484375, 19.82666015625, 20.6884765625, 21.55029296875, 22.412109375, 23.27392578125, 24.1357421875, 24.99755859375, 25.859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 10.0, 12.0, 13.0, 16.0, 29.0, 34.0, 45.0, 41.0, 62.0, 62.0, 56.0, 71.0, 54.0, 78.0, 63.0, 59.0, 44.0, 42.0, 36.0, 35.0, 15.0, 26.0, 13.0, 14.0, 11.0, 12.0, 8.0, 11.0, 3.0, 6.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.734375, -18.191162109375, -17.64794921875, -17.104736328125, -16.5615234375, -16.018310546875, -15.47509765625, -14.931884765625, -14.388671875, -13.845458984375, -13.30224609375, -12.759033203125, -12.2158203125, -11.672607421875, -11.12939453125, -10.586181640625, -10.04296875, -9.499755859375, -8.95654296875, -8.413330078125, -7.8701171875, -7.326904296875, -6.78369140625, -6.240478515625, -5.697265625, -5.154052734375, -4.61083984375, -4.067626953125, -3.5244140625, -2.981201171875, -2.43798828125, -1.894775390625, -1.3515625, -0.808349609375, -0.26513671875, 0.278076171875, 0.8212890625, 1.364501953125, 1.90771484375, 2.450927734375, 2.994140625, 3.537353515625, 4.08056640625, 4.623779296875, 5.1669921875, 5.710205078125, 6.25341796875, 6.796630859375, 7.33984375, 7.883056640625, 8.42626953125, 8.969482421875, 9.5126953125, 10.055908203125, 10.59912109375, 11.142333984375, 11.685546875, 12.228759765625, 12.77197265625, 13.315185546875, 13.8583984375, 14.401611328125, 14.94482421875, 15.488037109375, 16.03125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 6.0, 8.0, 13.0, 18.0, 22.0, 24.0, 32.0, 51.0, 69.0, 101.0, 191.0, 320.0, 739.0, 2023.0, 7790.0, 49359.0, 798633.0, 166540.0, 16701.0, 3532.0, 1163.0, 487.0, 245.0, 146.0, 96.0, 55.0, 38.0, 19.0, 22.0, 15.0, 16.0, 7.0, 16.0, 10.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.8671875, -8.5963134765625, -8.325439453125, -8.0545654296875, -7.78369140625, -7.5128173828125, -7.241943359375, -6.9710693359375, -6.7001953125, -6.4293212890625, -6.158447265625, -5.8875732421875, -5.61669921875, -5.3458251953125, -5.074951171875, -4.8040771484375, -4.533203125, -4.2623291015625, -3.991455078125, -3.7205810546875, -3.44970703125, -3.1788330078125, -2.907958984375, -2.6370849609375, -2.3662109375, -2.0953369140625, -1.824462890625, -1.5535888671875, -1.28271484375, -1.0118408203125, -0.740966796875, -0.4700927734375, -0.19921875, 0.0716552734375, 0.342529296875, 0.6134033203125, 0.88427734375, 1.1551513671875, 1.426025390625, 1.6968994140625, 1.9677734375, 2.2386474609375, 2.509521484375, 2.7803955078125, 3.05126953125, 3.3221435546875, 3.593017578125, 3.8638916015625, 4.134765625, 4.4056396484375, 4.676513671875, 4.9473876953125, 5.21826171875, 5.4891357421875, 5.760009765625, 6.0308837890625, 6.3017578125, 6.5726318359375, 6.843505859375, 7.1143798828125, 7.38525390625, 7.6561279296875, 7.927001953125, 8.1978759765625, 8.46875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 7.0, 3.0, 6.0, 10.0, 7.0, 16.0, 9.0, 20.0, 14.0, 30.0, 29.0, 30.0, 57.0, 66.0, 106.0, 157.0, 114.0, 80.0, 38.0, 44.0, 34.0, 19.0, 19.0, 12.0, 13.0, 17.0, 9.0, 4.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0011348724365234375, -0.0010951459407806396, -0.0010554194450378418, -0.001015692949295044, -0.0009759664535522461, -0.0009362399578094482, -0.0008965134620666504, -0.0008567869663238525, -0.0008170604705810547, -0.0007773339748382568, -0.000737607479095459, -0.0006978809833526611, -0.0006581544876098633, -0.0006184279918670654, -0.0005787014961242676, -0.0005389750003814697, -0.0004992485046386719, -0.000459522008895874, -0.00041979551315307617, -0.0003800690174102783, -0.00034034252166748047, -0.0003006160259246826, -0.00026088953018188477, -0.00022116303443908691, -0.00018143653869628906, -0.0001417100429534912, -0.00010198354721069336, -6.225705146789551e-05, -2.2530555725097656e-05, 1.7195940017700195e-05, 5.692243576049805e-05, 9.66489315032959e-05, 0.00013637542724609375, 0.0001761019229888916, 0.00021582841873168945, 0.0002555549144744873, 0.00029528141021728516, 0.000335007905960083, 0.00037473440170288086, 0.0004144608974456787, 0.00045418739318847656, 0.0004939138889312744, 0.0005336403846740723, 0.0005733668804168701, 0.000613093376159668, 0.0006528198719024658, 0.0006925463676452637, 0.0007322728633880615, 0.0007719993591308594, 0.0008117258548736572, 0.0008514523506164551, 0.0008911788463592529, 0.0009309053421020508, 0.0009706318378448486, 0.0010103583335876465, 0.0010500848293304443, 0.0010898113250732422, 0.00112953782081604, 0.0011692643165588379, 0.0012089908123016357, 0.0012487173080444336, 0.0012884438037872314, 0.0013281702995300293, 0.0013678967952728271, 0.001407623291015625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 6.0, 7.0, 5.0, 15.0, 16.0, 22.0, 12.0, 34.0, 29.0, 68.0, 95.0, 166.0, 242.0, 431.0, 801.0, 1921.0, 5750.0, 23008.0, 274707.0, 696328.0, 33052.0, 7274.0, 2264.0, 984.0, 483.0, 284.0, 164.0, 102.0, 73.0, 49.0, 48.0, 23.0, 25.0, 14.0, 13.0, 10.0, 4.0, 3.0, 3.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9296875, -7.6572265625, -7.384765625, -7.1123046875, -6.83984375, -6.5673828125, -6.294921875, -6.0224609375, -5.75, -5.4775390625, -5.205078125, -4.9326171875, -4.66015625, -4.3876953125, -4.115234375, -3.8427734375, -3.5703125, -3.2978515625, -3.025390625, -2.7529296875, -2.48046875, -2.2080078125, -1.935546875, -1.6630859375, -1.390625, -1.1181640625, -0.845703125, -0.5732421875, -0.30078125, -0.0283203125, 0.244140625, 0.5166015625, 0.7890625, 1.0615234375, 1.333984375, 1.6064453125, 1.87890625, 2.1513671875, 2.423828125, 2.6962890625, 2.96875, 3.2412109375, 3.513671875, 3.7861328125, 4.05859375, 4.3310546875, 4.603515625, 4.8759765625, 5.1484375, 5.4208984375, 5.693359375, 5.9658203125, 6.23828125, 6.5107421875, 6.783203125, 7.0556640625, 7.328125, 7.6005859375, 7.873046875, 8.1455078125, 8.41796875, 8.6904296875, 8.962890625, 9.2353515625, 9.5078125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 1.0, 2.0, 11.0, 13.0, 19.0, 9.0, 31.0, 29.0, 59.0, 93.0, 137.0, 198.0, 129.0, 79.0, 52.0, 49.0, 21.0, 21.0, 7.0, 15.0, 7.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -7.9449462890625, -7.655517578125, -7.3660888671875, -7.07666015625, -6.7872314453125, -6.497802734375, -6.2083740234375, -5.9189453125, -5.6295166015625, -5.340087890625, -5.0506591796875, -4.76123046875, -4.4718017578125, -4.182373046875, -3.8929443359375, -3.603515625, -3.3140869140625, -3.024658203125, -2.7352294921875, -2.44580078125, -2.1563720703125, -1.866943359375, -1.5775146484375, -1.2880859375, -0.9986572265625, -0.709228515625, -0.4197998046875, -0.13037109375, 0.1590576171875, 0.448486328125, 0.7379150390625, 1.02734375, 1.3167724609375, 1.606201171875, 1.8956298828125, 2.18505859375, 2.4744873046875, 2.763916015625, 3.0533447265625, 3.3427734375, 3.6322021484375, 3.921630859375, 4.2110595703125, 4.50048828125, 4.7899169921875, 5.079345703125, 5.3687744140625, 5.658203125, 5.9476318359375, 6.237060546875, 6.5264892578125, 6.81591796875, 7.1053466796875, 7.394775390625, 7.6842041015625, 7.9736328125, 8.2630615234375, 8.552490234375, 8.8419189453125, 9.13134765625, 9.4207763671875, 9.710205078125, 9.9996337890625, 10.2890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 0.0, 11.0, 12.0, 46.0, 100.0, 263.0, 319.0, 152.0, 55.0, 17.0, 10.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-243.766357421875, -238.58145141601562, -233.3965606689453, -228.21165466308594, -223.02674865722656, -217.84185791015625, -212.65695190429688, -207.4720458984375, -202.28713989257812, -197.10223388671875, -191.91734313964844, -186.73243713378906, -181.5475311279297, -176.36264038085938, -171.177734375, -165.99282836914062, -160.8079376220703, -155.62303161621094, -150.43814086914062, -145.25323486328125, -140.06832885742188, -134.8834228515625, -129.6985321044922, -124.51362609863281, -119.32872772216797, -114.14382934570312, -108.95892333984375, -103.7740249633789, -98.58912658691406, -93.40422058105469, -88.21932220458984, -83.034423828125, -77.84951782226562, -72.66461944580078, -67.4797134399414, -62.29481506347656, -57.10991287231445, -51.925010681152344, -46.7401123046875, -41.55521011352539, -36.37030792236328, -31.185405731201172, -26.000505447387695, -20.81560516357422, -15.63070297241211, -10.44580078125, -5.260900497436523, -0.07600021362304688, 5.1089019775390625, 10.293803215026855, 15.478704452514648, 20.663604736328125, 25.848506927490234, 31.033409118652344, 36.21830749511719, 41.4032096862793, 46.588111877441406, 51.773014068603516, 56.957916259765625, 62.14281463623047, 67.32771301269531, 72.51261901855469, 77.69751739501953, 82.88241577148438, 88.06732177734375]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 2.0, 10.0, 10.0, 10.0, 12.0, 11.0, 12.0, 13.0, 12.0, 16.0, 20.0, 27.0, 19.0, 30.0, 35.0, 38.0, 43.0, 47.0, 46.0, 55.0, 47.0, 60.0, 47.0, 38.0, 45.0, 36.0, 42.0, 20.0, 13.0, 18.0, 17.0, 27.0, 13.0, 14.0, 20.0, 11.0, 7.0, 11.0, 7.0, 5.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-46.04188537597656, -44.638519287109375, -43.23515319824219, -41.831787109375, -40.42842483520508, -39.02505874633789, -37.6216926574707, -36.218326568603516, -34.814964294433594, -33.411598205566406, -32.00823211669922, -30.604867935180664, -29.20150375366211, -27.798137664794922, -26.394771575927734, -24.991405487060547, -23.58803939819336, -22.184673309326172, -20.781309127807617, -19.37794303894043, -17.974578857421875, -16.571212768554688, -15.1678466796875, -13.764481544494629, -12.361116409301758, -10.957751274108887, -9.554386138916016, -8.151020050048828, -6.747654914855957, -5.344289779663086, -3.9409236907958984, -2.5375585556030273, -1.1341896057128906, 0.26917576789855957, 1.6725411415100098, 3.075906753540039, 4.47927188873291, 5.882637023925781, 7.286003112792969, 8.68936824798584, 10.092733383178711, 11.496098518371582, 12.899463653564453, 14.30282974243164, 15.706194877624512, 17.109560012817383, 18.51292610168457, 19.916290283203125, 21.319656372070312, 22.7230224609375, 24.126386642456055, 25.529752731323242, 26.933116912841797, 28.336483001708984, 29.739849090576172, 31.14321517944336, 32.54657745361328, 33.94994354248047, 35.353309631347656, 36.756675720214844, 38.160037994384766, 39.56340408325195, 40.96677017211914, 42.37013626098633, 43.773502349853516]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 5.0, 2.0, 2.0, 4.0, 9.0, 4.0, 12.0, 23.0, 24.0, 35.0, 57.0, 66.0, 119.0, 210.0, 516.0, 1134.0, 4114.0, 32371.0, 2457984.0, 1665918.0, 25396.0, 3830.0, 1306.0, 539.0, 234.0, 137.0, 80.0, 54.0, 36.0, 17.0, 17.0, 4.0, 7.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-13.625, -13.24609375, -12.8671875, -12.48828125, -12.109375, -11.73046875, -11.3515625, -10.97265625, -10.59375, -10.21484375, -9.8359375, -9.45703125, -9.078125, -8.69921875, -8.3203125, -7.94140625, -7.5625, -7.18359375, -6.8046875, -6.42578125, -6.046875, -5.66796875, -5.2890625, -4.91015625, -4.53125, -4.15234375, -3.7734375, -3.39453125, -3.015625, -2.63671875, -2.2578125, -1.87890625, -1.5, -1.12109375, -0.7421875, -0.36328125, 0.015625, 0.39453125, 0.7734375, 1.15234375, 1.53125, 1.91015625, 2.2890625, 2.66796875, 3.046875, 3.42578125, 3.8046875, 4.18359375, 4.5625, 4.94140625, 5.3203125, 5.69921875, 6.078125, 6.45703125, 6.8359375, 7.21484375, 7.59375, 7.97265625, 8.3515625, 8.73046875, 9.109375, 9.48828125, 9.8671875, 10.24609375, 10.625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 4.0, 7.0, 11.0, 20.0, 25.0, 31.0, 46.0, 64.0, 73.0, 98.0, 80.0, 94.0, 93.0, 82.0, 71.0, 59.0, 44.0, 24.0, 31.0, 17.0, 11.0, 7.0, 4.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.078125, -3.917724609375, -3.75732421875, -3.596923828125, -3.4365234375, -3.276123046875, -3.11572265625, -2.955322265625, -2.794921875, -2.634521484375, -2.47412109375, -2.313720703125, -2.1533203125, -1.992919921875, -1.83251953125, -1.672119140625, -1.51171875, -1.351318359375, -1.19091796875, -1.030517578125, -0.8701171875, -0.709716796875, -0.54931640625, -0.388916015625, -0.228515625, -0.068115234375, 0.09228515625, 0.252685546875, 0.4130859375, 0.573486328125, 0.73388671875, 0.894287109375, 1.0546875, 1.215087890625, 1.37548828125, 1.535888671875, 1.6962890625, 1.856689453125, 2.01708984375, 2.177490234375, 2.337890625, 2.498291015625, 2.65869140625, 2.819091796875, 2.9794921875, 3.139892578125, 3.30029296875, 3.460693359375, 3.62109375, 3.781494140625, 3.94189453125, 4.102294921875, 4.2626953125, 4.423095703125, 4.58349609375, 4.743896484375, 4.904296875, 5.064697265625, 5.22509765625, 5.385498046875, 5.5458984375, 5.706298828125, 5.86669921875, 6.027099609375, 6.1875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 21.0, 35.0, 70.0, 176.0, 421.0, 1446.0, 9374.0, 804881.0, 3357510.0, 17307.0, 1858.0, 618.0, 287.0, 127.0, 64.0, 32.0, 12.0, 15.0, 7.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7421875, -15.1395263671875, -14.536865234375, -13.9342041015625, -13.33154296875, -12.7288818359375, -12.126220703125, -11.5235595703125, -10.9208984375, -10.3182373046875, -9.715576171875, -9.1129150390625, -8.51025390625, -7.9075927734375, -7.304931640625, -6.7022705078125, -6.099609375, -5.4969482421875, -4.894287109375, -4.2916259765625, -3.68896484375, -3.0863037109375, -2.483642578125, -1.8809814453125, -1.2783203125, -0.6756591796875, -0.072998046875, 0.5296630859375, 1.13232421875, 1.7349853515625, 2.337646484375, 2.9403076171875, 3.54296875, 4.1456298828125, 4.748291015625, 5.3509521484375, 5.95361328125, 6.5562744140625, 7.158935546875, 7.7615966796875, 8.3642578125, 8.9669189453125, 9.569580078125, 10.1722412109375, 10.77490234375, 11.3775634765625, 11.980224609375, 12.5828857421875, 13.185546875, 13.7882080078125, 14.390869140625, 14.9935302734375, 15.59619140625, 16.1988525390625, 16.801513671875, 17.4041748046875, 18.0068359375, 18.6094970703125, 19.212158203125, 19.8148193359375, 20.41748046875, 21.0201416015625, 21.622802734375, 22.2254638671875, 22.828125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 6.0, 11.0, 12.0, 7.0, 23.0, 37.0, 51.0, 115.0, 284.0, 564.0, 1011.0, 915.0, 506.0, 251.0, 127.0, 61.0, 38.0, 19.0, 14.0, 8.0, 8.0, 1.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3984375, -7.0279541015625, -6.657470703125, -6.2869873046875, -5.91650390625, -5.5460205078125, -5.175537109375, -4.8050537109375, -4.4345703125, -4.0640869140625, -3.693603515625, -3.3231201171875, -2.95263671875, -2.5821533203125, -2.211669921875, -1.8411865234375, -1.470703125, -1.1002197265625, -0.729736328125, -0.3592529296875, 0.01123046875, 0.3817138671875, 0.752197265625, 1.1226806640625, 1.4931640625, 1.8636474609375, 2.234130859375, 2.6046142578125, 2.97509765625, 3.3455810546875, 3.716064453125, 4.0865478515625, 4.45703125, 4.8275146484375, 5.197998046875, 5.5684814453125, 5.93896484375, 6.3094482421875, 6.679931640625, 7.0504150390625, 7.4208984375, 7.7913818359375, 8.161865234375, 8.5323486328125, 8.90283203125, 9.2733154296875, 9.643798828125, 10.0142822265625, 10.384765625, 10.7552490234375, 11.125732421875, 11.4962158203125, 11.86669921875, 12.2371826171875, 12.607666015625, 12.9781494140625, 13.3486328125, 13.7191162109375, 14.089599609375, 14.4600830078125, 14.83056640625, 15.2010498046875, 15.571533203125, 15.9420166015625, 16.3125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 7.0, 10.0, 42.0, 109.0, 316.0, 343.0, 131.0, 22.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.9283447265625, -125.30265045166016, -120.67695617675781, -116.05125427246094, -111.4255599975586, -106.79986572265625, -102.1741714477539, -97.54847717285156, -92.92277526855469, -88.29708099365234, -83.67138671875, -79.04568481445312, -74.41999053955078, -69.79429626464844, -65.1686019897461, -60.542903900146484, -55.917213439941406, -51.29151916503906, -46.66582107543945, -42.04012680053711, -37.4144287109375, -32.788734436035156, -28.163040161132812, -23.537342071533203, -18.91164779663086, -14.285951614379883, -9.660256385803223, -5.0345611572265625, -0.40886497497558594, 4.216831207275391, 8.842525482177734, 13.468223571777344, 18.093917846679688, 22.719614028930664, 27.34531021118164, 31.971004486083984, 36.596702575683594, 41.22239685058594, 45.84809112548828, 50.47378921508789, 55.099483489990234, 59.72517776489258, 64.35087585449219, 68.97657012939453, 73.60226440429688, 78.22796630859375, 82.85365295410156, 87.47935485839844, 92.10504913330078, 96.73074340820312, 101.35643768310547, 105.98213195800781, 110.60783386230469, 115.23352813720703, 119.85922241210938, 124.48492431640625, 129.11061096191406, 133.73631286621094, 138.36199951171875, 142.98770141601562, 147.61338806152344, 152.2390899658203, 156.86477661132812, 161.490478515625, 166.11618041992188]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 7.0, 13.0, 17.0, 14.0, 25.0, 27.0, 40.0, 30.0, 35.0, 38.0, 67.0, 64.0, 79.0, 80.0, 52.0, 67.0, 57.0, 51.0, 43.0, 40.0, 28.0, 26.0, 26.0, 26.0, 9.0, 12.0, 5.0, 5.0, 2.0, 2.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.85237121582031, -49.51495361328125, -48.17753219604492, -46.84011459350586, -45.50269317626953, -44.16527557373047, -42.827857971191406, -41.49043655395508, -40.15301513671875, -38.81559753417969, -37.47817611694336, -36.1407585144043, -34.80333709716797, -33.465919494628906, -32.128501892089844, -30.791080474853516, -29.453662872314453, -28.116243362426758, -26.778823852539062, -25.44140625, -24.103984832763672, -22.76656723022461, -21.429147720336914, -20.09172821044922, -18.754308700561523, -17.416889190673828, -16.079469680786133, -14.742051124572754, -13.404631614685059, -12.067212104797363, -10.729793548583984, -9.392374038696289, -8.054950714111328, -6.717531204223633, -5.380112171173096, -4.042693138122559, -2.7052736282348633, -1.367854118347168, -0.030435562133789062, 1.3069839477539062, 2.6444034576416016, 3.9818227291107178, 5.319242000579834, 6.656661033630371, 7.994080543518066, 9.331500053405762, 10.66891860961914, 12.006338119506836, 13.343757629394531, 14.681177139282227, 16.018596649169922, 17.356014251708984, 18.693435668945312, 20.030853271484375, 21.36827278137207, 22.705692291259766, 24.04311180114746, 25.380531311035156, 26.71795082092285, 28.055370330810547, 29.39278793334961, 30.730209350585938, 32.067626953125, 33.40504455566406, 34.74246597290039]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 6.0, 9.0, 11.0, 13.0, 19.0, 32.0, 63.0, 81.0, 114.0, 237.0, 517.0, 1822.0, 9016.0, 115481.0, 862322.0, 51032.0, 5600.0, 1221.0, 425.0, 201.0, 117.0, 77.0, 45.0, 26.0, 19.0, 11.0, 9.0, 10.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.890625, -17.281494140625, -16.67236328125, -16.063232421875, -15.4541015625, -14.844970703125, -14.23583984375, -13.626708984375, -13.017578125, -12.408447265625, -11.79931640625, -11.190185546875, -10.5810546875, -9.971923828125, -9.36279296875, -8.753662109375, -8.14453125, -7.535400390625, -6.92626953125, -6.317138671875, -5.7080078125, -5.098876953125, -4.48974609375, -3.880615234375, -3.271484375, -2.662353515625, -2.05322265625, -1.444091796875, -0.8349609375, -0.225830078125, 0.38330078125, 0.992431640625, 1.6015625, 2.210693359375, 2.81982421875, 3.428955078125, 4.0380859375, 4.647216796875, 5.25634765625, 5.865478515625, 6.474609375, 7.083740234375, 7.69287109375, 8.302001953125, 8.9111328125, 9.520263671875, 10.12939453125, 10.738525390625, 11.34765625, 11.956787109375, 12.56591796875, 13.175048828125, 13.7841796875, 14.393310546875, 15.00244140625, 15.611572265625, 16.220703125, 16.829833984375, 17.43896484375, 18.048095703125, 18.6572265625, 19.266357421875, 19.87548828125, 20.484619140625, 21.09375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 8.0, 15.0, 23.0, 19.0, 20.0, 29.0, 44.0, 51.0, 68.0, 79.0, 77.0, 87.0, 68.0, 87.0, 75.0, 57.0, 46.0, 39.0, 26.0, 20.0, 20.0, 17.0, 9.0, 5.0, 8.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.32421875, -5.183013916015625, -5.04180908203125, -4.900604248046875, -4.7593994140625, -4.618194580078125, -4.47698974609375, -4.335784912109375, -4.194580078125, -4.053375244140625, -3.91217041015625, -3.770965576171875, -3.6297607421875, -3.488555908203125, -3.34735107421875, -3.206146240234375, -3.06494140625, -2.923736572265625, -2.78253173828125, -2.641326904296875, -2.5001220703125, -2.358917236328125, -2.21771240234375, -2.076507568359375, -1.935302734375, -1.794097900390625, -1.65289306640625, -1.511688232421875, -1.3704833984375, -1.229278564453125, -1.08807373046875, -0.946868896484375, -0.8056640625, -0.664459228515625, -0.52325439453125, -0.382049560546875, -0.2408447265625, -0.099639892578125, 0.04156494140625, 0.182769775390625, 0.323974609375, 0.465179443359375, 0.60638427734375, 0.747589111328125, 0.8887939453125, 1.029998779296875, 1.17120361328125, 1.312408447265625, 1.45361328125, 1.594818115234375, 1.73602294921875, 1.877227783203125, 2.0184326171875, 2.159637451171875, 2.30084228515625, 2.442047119140625, 2.583251953125, 2.724456787109375, 2.86566162109375, 3.006866455078125, 3.1480712890625, 3.289276123046875, 3.43048095703125, 3.571685791015625, 3.712890625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 5.0, 2.0, 3.0, 5.0, 13.0, 9.0, 15.0, 18.0, 47.0, 47.0, 87.0, 120.0, 228.0, 477.0, 1098.0, 3229.0, 15568.0, 652315.0, 357008.0, 13326.0, 2848.0, 1039.0, 465.0, 236.0, 98.0, 73.0, 48.0, 37.0, 27.0, 12.0, 10.0, 9.0, 9.0, 10.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-25.109375, -24.32373046875, -23.5380859375, -22.75244140625, -21.966796875, -21.18115234375, -20.3955078125, -19.60986328125, -18.82421875, -18.03857421875, -17.2529296875, -16.46728515625, -15.681640625, -14.89599609375, -14.1103515625, -13.32470703125, -12.5390625, -11.75341796875, -10.9677734375, -10.18212890625, -9.396484375, -8.61083984375, -7.8251953125, -7.03955078125, -6.25390625, -5.46826171875, -4.6826171875, -3.89697265625, -3.111328125, -2.32568359375, -1.5400390625, -0.75439453125, 0.03125, 0.81689453125, 1.6025390625, 2.38818359375, 3.173828125, 3.95947265625, 4.7451171875, 5.53076171875, 6.31640625, 7.10205078125, 7.8876953125, 8.67333984375, 9.458984375, 10.24462890625, 11.0302734375, 11.81591796875, 12.6015625, 13.38720703125, 14.1728515625, 14.95849609375, 15.744140625, 16.52978515625, 17.3154296875, 18.10107421875, 18.88671875, 19.67236328125, 20.4580078125, 21.24365234375, 22.029296875, 22.81494140625, 23.6005859375, 24.38623046875, 25.171875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 2.0, 9.0, 7.0, 16.0, 16.0, 19.0, 38.0, 36.0, 48.0, 41.0, 54.0, 65.0, 59.0, 71.0, 77.0, 73.0, 61.0, 71.0, 58.0, 33.0, 30.0, 29.0, 20.0, 13.0, 19.0, 9.0, 4.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.234375, -20.65966796875, -20.0849609375, -19.51025390625, -18.935546875, -18.36083984375, -17.7861328125, -17.21142578125, -16.63671875, -16.06201171875, -15.4873046875, -14.91259765625, -14.337890625, -13.76318359375, -13.1884765625, -12.61376953125, -12.0390625, -11.46435546875, -10.8896484375, -10.31494140625, -9.740234375, -9.16552734375, -8.5908203125, -8.01611328125, -7.44140625, -6.86669921875, -6.2919921875, -5.71728515625, -5.142578125, -4.56787109375, -3.9931640625, -3.41845703125, -2.84375, -2.26904296875, -1.6943359375, -1.11962890625, -0.544921875, 0.02978515625, 0.6044921875, 1.17919921875, 1.75390625, 2.32861328125, 2.9033203125, 3.47802734375, 4.052734375, 4.62744140625, 5.2021484375, 5.77685546875, 6.3515625, 6.92626953125, 7.5009765625, 8.07568359375, 8.650390625, 9.22509765625, 9.7998046875, 10.37451171875, 10.94921875, 11.52392578125, 12.0986328125, 12.67333984375, 13.248046875, 13.82275390625, 14.3974609375, 14.97216796875, 15.546875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 5.0, 6.0, 10.0, 19.0, 14.0, 17.0, 20.0, 42.0, 60.0, 76.0, 147.0, 229.0, 472.0, 1140.0, 2937.0, 11835.0, 144489.0, 847494.0, 31173.0, 5094.0, 1634.0, 705.0, 347.0, 162.0, 126.0, 67.0, 53.0, 40.0, 24.0, 15.0, 17.0, 11.0, 3.0, 10.0, 8.0, 5.0, 7.0, 8.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.9921875, -8.6737060546875, -8.355224609375, -8.0367431640625, -7.71826171875, -7.3997802734375, -7.081298828125, -6.7628173828125, -6.4443359375, -6.1258544921875, -5.807373046875, -5.4888916015625, -5.17041015625, -4.8519287109375, -4.533447265625, -4.2149658203125, -3.896484375, -3.5780029296875, -3.259521484375, -2.9410400390625, -2.62255859375, -2.3040771484375, -1.985595703125, -1.6671142578125, -1.3486328125, -1.0301513671875, -0.711669921875, -0.3931884765625, -0.07470703125, 0.2437744140625, 0.562255859375, 0.8807373046875, 1.19921875, 1.5177001953125, 1.836181640625, 2.1546630859375, 2.47314453125, 2.7916259765625, 3.110107421875, 3.4285888671875, 3.7470703125, 4.0655517578125, 4.384033203125, 4.7025146484375, 5.02099609375, 5.3394775390625, 5.657958984375, 5.9764404296875, 6.294921875, 6.6134033203125, 6.931884765625, 7.2503662109375, 7.56884765625, 7.8873291015625, 8.205810546875, 8.5242919921875, 8.8427734375, 9.1612548828125, 9.479736328125, 9.7982177734375, 10.11669921875, 10.4351806640625, 10.753662109375, 11.0721435546875, 11.390625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 6.0, 3.0, 15.0, 16.0, 17.0, 26.0, 29.0, 52.0, 88.0, 143.0, 183.0, 146.0, 92.0, 28.0, 32.0, 22.0, 20.0, 15.0, 9.0, 9.0, 4.0, 9.0, 3.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.001377105712890625, -0.0013285279273986816, -0.0012799501419067383, -0.001231372356414795, -0.0011827945709228516, -0.0011342167854309082, -0.0010856389999389648, -0.0010370612144470215, -0.0009884834289550781, -0.0009399056434631348, -0.0008913278579711914, -0.000842750072479248, -0.0007941722869873047, -0.0007455945014953613, -0.000697016716003418, -0.0006484389305114746, -0.0005998611450195312, -0.0005512833595275879, -0.0005027055740356445, -0.00045412778854370117, -0.0004055500030517578, -0.00035697221755981445, -0.0003083944320678711, -0.00025981664657592773, -0.00021123886108398438, -0.00016266107559204102, -0.00011408329010009766, -6.55055046081543e-05, -1.6927719116210938e-05, 3.165006637573242e-05, 8.022785186767578e-05, 0.00012880563735961914, 0.0001773834228515625, 0.00022596120834350586, 0.0002745389938354492, 0.0003231167793273926, 0.00037169456481933594, 0.0004202723503112793, 0.00046885013580322266, 0.000517427921295166, 0.0005660057067871094, 0.0006145834922790527, 0.0006631612777709961, 0.0007117390632629395, 0.0007603168487548828, 0.0008088946342468262, 0.0008574724197387695, 0.0009060502052307129, 0.0009546279907226562, 0.0010032057762145996, 0.001051783561706543, 0.0011003613471984863, 0.0011489391326904297, 0.001197516918182373, 0.0012460947036743164, 0.0012946724891662598, 0.0013432502746582031, 0.0013918280601501465, 0.0014404058456420898, 0.0014889836311340332, 0.0015375614166259766, 0.00158613920211792, 0.0016347169876098633, 0.0016832947731018066, 0.00173187255859375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 2.0, 13.0, 14.0, 13.0, 29.0, 25.0, 51.0, 66.0, 130.0, 199.0, 378.0, 896.0, 2556.0, 9558.0, 72175.0, 895635.0, 54616.0, 8248.0, 2150.0, 853.0, 404.0, 192.0, 115.0, 86.0, 39.0, 26.0, 26.0, 19.0, 10.0, 9.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.125, -8.8253173828125, -8.525634765625, -8.2259521484375, -7.92626953125, -7.6265869140625, -7.326904296875, -7.0272216796875, -6.7275390625, -6.4278564453125, -6.128173828125, -5.8284912109375, -5.52880859375, -5.2291259765625, -4.929443359375, -4.6297607421875, -4.330078125, -4.0303955078125, -3.730712890625, -3.4310302734375, -3.13134765625, -2.8316650390625, -2.531982421875, -2.2322998046875, -1.9326171875, -1.6329345703125, -1.333251953125, -1.0335693359375, -0.73388671875, -0.4342041015625, -0.134521484375, 0.1651611328125, 0.46484375, 0.7645263671875, 1.064208984375, 1.3638916015625, 1.66357421875, 1.9632568359375, 2.262939453125, 2.5626220703125, 2.8623046875, 3.1619873046875, 3.461669921875, 3.7613525390625, 4.06103515625, 4.3607177734375, 4.660400390625, 4.9600830078125, 5.259765625, 5.5594482421875, 5.859130859375, 6.1588134765625, 6.45849609375, 6.7581787109375, 7.057861328125, 7.3575439453125, 7.6572265625, 7.9569091796875, 8.256591796875, 8.5562744140625, 8.85595703125, 9.1556396484375, 9.455322265625, 9.7550048828125, 10.0546875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 14.0, 21.0, 39.0, 58.0, 118.0, 201.0, 255.0, 111.0, 65.0, 40.0, 16.0, 12.0, 8.0, 11.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.1640625, -6.8658447265625, -6.567626953125, -6.2694091796875, -5.97119140625, -5.6729736328125, -5.374755859375, -5.0765380859375, -4.7783203125, -4.4801025390625, -4.181884765625, -3.8836669921875, -3.58544921875, -3.2872314453125, -2.989013671875, -2.6907958984375, -2.392578125, -2.0943603515625, -1.796142578125, -1.4979248046875, -1.19970703125, -0.9014892578125, -0.603271484375, -0.3050537109375, -0.0068359375, 0.2913818359375, 0.589599609375, 0.8878173828125, 1.18603515625, 1.4842529296875, 1.782470703125, 2.0806884765625, 2.37890625, 2.6771240234375, 2.975341796875, 3.2735595703125, 3.57177734375, 3.8699951171875, 4.168212890625, 4.4664306640625, 4.7646484375, 5.0628662109375, 5.361083984375, 5.6593017578125, 5.95751953125, 6.2557373046875, 6.553955078125, 6.8521728515625, 7.150390625, 7.4486083984375, 7.746826171875, 8.0450439453125, 8.34326171875, 8.6414794921875, 8.939697265625, 9.2379150390625, 9.5361328125, 9.8343505859375, 10.132568359375, 10.4307861328125, 10.72900390625, 11.0272216796875, 11.325439453125, 11.6236572265625, 11.921875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 8.0, 12.0, 14.0, 31.0, 131.0, 411.0, 280.0, 75.0, 25.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-177.28952026367188, -170.90870666503906, -164.5279083251953, -158.1470947265625, -151.76629638671875, -145.38548278808594, -139.00466918945312, -132.62387084960938, -126.24305725097656, -119.86225128173828, -113.4814453125, -107.10063171386719, -100.7198257446289, -94.33901977539062, -87.95821380615234, -81.57740783691406, -75.19660186767578, -68.8157958984375, -62.43498611450195, -56.05418014526367, -49.673370361328125, -43.292564392089844, -36.91175842285156, -30.530948638916016, -24.150142669677734, -17.76933479309082, -11.388527870178223, -5.007720947265625, 1.373086929321289, 7.753894805908203, 14.134700775146484, 20.51551055908203, 26.896316528320312, 33.277122497558594, 39.65793228149414, 46.03873825073242, 52.41954803466797, 58.80035400390625, 65.18115997314453, 71.56196594238281, 77.94277954101562, 84.3235855102539, 90.70439147949219, 97.085205078125, 103.46601104736328, 109.84681701660156, 116.22762298583984, 122.60842895507812, 128.98922729492188, 135.3700408935547, 141.75083923339844, 148.13165283203125, 154.512451171875, 160.8932647705078, 167.27407836914062, 173.65487670898438, 180.0356903076172, 186.41650390625, 192.79730224609375, 199.17811584472656, 205.5589141845703, 211.93972778320312, 218.32052612304688, 224.7013397216797, 231.0821533203125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 8.0, 13.0, 16.0, 11.0, 19.0, 19.0, 23.0, 23.0, 40.0, 41.0, 49.0, 59.0, 80.0, 84.0, 91.0, 60.0, 55.0, 59.0, 47.0, 31.0, 28.0, 30.0, 24.0, 21.0, 19.0, 16.0, 10.0, 6.0, 0.0, 8.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-88.98582458496094, -86.86808013916016, -84.75033569335938, -82.6325912475586, -80.51484680175781, -78.39710998535156, -76.27936553955078, -74.16162109375, -72.04387664794922, -69.92613220214844, -67.80838775634766, -65.69064331054688, -63.57290267944336, -61.45515823364258, -59.33741760253906, -57.21967315673828, -55.1019287109375, -52.98418426513672, -50.86643981933594, -48.74869918823242, -46.63095474243164, -44.51321029663086, -42.395469665527344, -40.27772521972656, -38.15998077392578, -36.042236328125, -33.92449188232422, -31.806751251220703, -29.689006805419922, -27.57126235961914, -25.453519821166992, -23.335777282714844, -21.218032836914062, -19.10028839111328, -16.982545852661133, -14.864802360534668, -12.747058868408203, -10.629315376281738, -8.511571884155273, -6.393828392028809, -4.276084899902344, -2.158341407775879, -0.04059791564941406, 2.077145576477051, 4.194889068603516, 6.3126325607299805, 8.430376052856445, 10.54811954498291, 12.665863037109375, 14.78360652923584, 16.901350021362305, 19.019092559814453, 21.136837005615234, 23.254581451416016, 25.372323989868164, 27.490066528320312, 29.607810974121094, 31.725555419921875, 33.843299865722656, 35.96104049682617, 38.07878494262695, 40.196529388427734, 42.31427001953125, 44.43201446533203, 46.54975891113281]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 7.0, 8.0, 11.0, 17.0, 32.0, 64.0, 152.0, 521.0, 3799.0, 3659453.0, 526581.0, 2842.0, 534.0, 145.0, 58.0, 35.0, 12.0, 10.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.125, -43.01953125, -41.9140625, -40.80859375, -39.703125, -38.59765625, -37.4921875, -36.38671875, -35.28125, -34.17578125, -33.0703125, -31.96484375, -30.859375, -29.75390625, -28.6484375, -27.54296875, -26.4375, -25.33203125, -24.2265625, -23.12109375, -22.015625, -20.91015625, -19.8046875, -18.69921875, -17.59375, -16.48828125, -15.3828125, -14.27734375, -13.171875, -12.06640625, -10.9609375, -9.85546875, -8.75, -7.64453125, -6.5390625, -5.43359375, -4.328125, -3.22265625, -2.1171875, -1.01171875, 0.09375, 1.19921875, 2.3046875, 3.41015625, 4.515625, 5.62109375, 6.7265625, 7.83203125, 8.9375, 10.04296875, 11.1484375, 12.25390625, 13.359375, 14.46484375, 15.5703125, 16.67578125, 17.78125, 18.88671875, 19.9921875, 21.09765625, 22.203125, 23.30859375, 24.4140625, 25.51953125, 26.625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 6.0, 9.0, 21.0, 34.0, 66.0, 96.0, 121.0, 124.0, 147.0, 118.0, 115.0, 62.0, 39.0, 20.0, 11.0, 8.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.234375, -11.97430419921875, -11.7142333984375, -11.45416259765625, -11.194091796875, -10.93402099609375, -10.6739501953125, -10.41387939453125, -10.15380859375, -9.89373779296875, -9.6336669921875, -9.37359619140625, -9.113525390625, -8.85345458984375, -8.5933837890625, -8.33331298828125, -8.0732421875, -7.81317138671875, -7.5531005859375, -7.29302978515625, -7.032958984375, -6.77288818359375, -6.5128173828125, -6.25274658203125, -5.99267578125, -5.73260498046875, -5.4725341796875, -5.21246337890625, -4.952392578125, -4.69232177734375, -4.4322509765625, -4.17218017578125, -3.912109375, -3.65203857421875, -3.3919677734375, -3.13189697265625, -2.871826171875, -2.61175537109375, -2.3516845703125, -2.09161376953125, -1.83154296875, -1.57147216796875, -1.3114013671875, -1.05133056640625, -0.791259765625, -0.53118896484375, -0.2711181640625, -0.01104736328125, 0.2490234375, 0.50909423828125, 0.7691650390625, 1.02923583984375, 1.289306640625, 1.54937744140625, 1.8094482421875, 2.06951904296875, 2.32958984375, 2.58966064453125, 2.8497314453125, 3.10980224609375, 3.369873046875, 3.62994384765625, 3.8900146484375, 4.15008544921875, 4.41015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 6.0, 6.0, 4.0, 20.0, 29.0, 60.0, 124.0, 257.0, 609.0, 1532.0, 4235.0, 38870.0, 4060375.0, 78758.0, 5724.0, 2035.0, 855.0, 401.0, 168.0, 106.0, 39.0, 24.0, 17.0, 10.0, 5.0, 3.0, 6.0, 6.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.703125, -27.959228515625, -27.21533203125, -26.471435546875, -25.7275390625, -24.983642578125, -24.23974609375, -23.495849609375, -22.751953125, -22.008056640625, -21.26416015625, -20.520263671875, -19.7763671875, -19.032470703125, -18.28857421875, -17.544677734375, -16.80078125, -16.056884765625, -15.31298828125, -14.569091796875, -13.8251953125, -13.081298828125, -12.33740234375, -11.593505859375, -10.849609375, -10.105712890625, -9.36181640625, -8.617919921875, -7.8740234375, -7.130126953125, -6.38623046875, -5.642333984375, -4.8984375, -4.154541015625, -3.41064453125, -2.666748046875, -1.9228515625, -1.178955078125, -0.43505859375, 0.308837890625, 1.052734375, 1.796630859375, 2.54052734375, 3.284423828125, 4.0283203125, 4.772216796875, 5.51611328125, 6.260009765625, 7.00390625, 7.747802734375, 8.49169921875, 9.235595703125, 9.9794921875, 10.723388671875, 11.46728515625, 12.211181640625, 12.955078125, 13.698974609375, 14.44287109375, 15.186767578125, 15.9306640625, 16.674560546875, 17.41845703125, 18.162353515625, 18.90625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 9.0, 21.0, 33.0, 64.0, 131.0, 328.0, 935.0, 1449.0, 642.0, 257.0, 102.0, 39.0, 23.0, 10.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.8046875, -14.3160400390625, -13.827392578125, -13.3387451171875, -12.85009765625, -12.3614501953125, -11.872802734375, -11.3841552734375, -10.8955078125, -10.4068603515625, -9.918212890625, -9.4295654296875, -8.94091796875, -8.4522705078125, -7.963623046875, -7.4749755859375, -6.986328125, -6.4976806640625, -6.009033203125, -5.5203857421875, -5.03173828125, -4.5430908203125, -4.054443359375, -3.5657958984375, -3.0771484375, -2.5885009765625, -2.099853515625, -1.6112060546875, -1.12255859375, -0.6339111328125, -0.145263671875, 0.3433837890625, 0.83203125, 1.3206787109375, 1.809326171875, 2.2979736328125, 2.78662109375, 3.2752685546875, 3.763916015625, 4.2525634765625, 4.7412109375, 5.2298583984375, 5.718505859375, 6.2071533203125, 6.69580078125, 7.1844482421875, 7.673095703125, 8.1617431640625, 8.650390625, 9.1390380859375, 9.627685546875, 10.1163330078125, 10.60498046875, 11.0936279296875, 11.582275390625, 12.0709228515625, 12.5595703125, 13.0482177734375, 13.536865234375, 14.0255126953125, 14.51416015625, 15.0028076171875, 15.491455078125, 15.9801025390625, 16.46875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 10.0, 10.0, 20.0, 144.0, 503.0, 260.0, 34.0, 11.0, 4.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.5379638671875, -141.9425506591797, -134.34713745117188, -126.75171661376953, -119.15630340576172, -111.56088256835938, -103.96546936035156, -96.37005615234375, -88.77464294433594, -81.17922973632812, -73.58380889892578, -65.98839569091797, -58.392982482910156, -50.79756546020508, -43.2021484375, -35.60673522949219, -28.011314392089844, -20.4158992767334, -12.820483207702637, -5.225067138671875, 2.3703479766845703, 9.965763092041016, 17.561180114746094, 25.156593322753906, 32.752010345458984, 40.34742736816406, 47.942840576171875, 55.53825759887695, 63.13367462158203, 70.72908782958984, 78.32450866699219, 85.919921875, 93.51533508300781, 101.11074829101562, 108.70616912841797, 116.30158233642578, 123.8969955444336, 131.49241638183594, 139.08782958984375, 146.68324279785156, 154.27865600585938, 161.8740692138672, 169.469482421875, 177.06491088867188, 184.6603240966797, 192.2557373046875, 199.8511505126953, 207.44656372070312, 215.0419921875, 222.6374053955078, 230.23281860351562, 237.8282470703125, 245.4236602783203, 253.01907348632812, 260.614501953125, 268.20989990234375, 275.8052978515625, 283.4007263183594, 290.9961242675781, 298.591552734375, 306.18695068359375, 313.7823791503906, 321.3778076171875, 328.97320556640625, 336.5686340332031]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 7.0, 13.0, 37.0, 63.0, 93.0, 137.0, 162.0, 184.0, 142.0, 79.0, 46.0, 24.0, 13.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.88197326660156, -128.1245574951172, -124.36713409423828, -120.60971069335938, -116.852294921875, -113.0948715209961, -109.33744812011719, -105.58003234863281, -101.82261657714844, -98.06519317626953, -94.30777740478516, -90.55035400390625, -86.79293823242188, -83.03551483154297, -79.27809143066406, -75.52067565917969, -71.76325225830078, -68.00582885742188, -64.2484130859375, -60.490989685058594, -56.73357391357422, -52.97615051269531, -49.21873092651367, -45.46131134033203, -41.70389175415039, -37.94647216796875, -34.18905258178711, -30.431631088256836, -26.674211502075195, -22.916791915893555, -19.15937042236328, -15.40195083618164, -11.64453125, -7.887111186981201, -4.129691123962402, -0.3722705841064453, 3.3851490020751953, 7.142568588256836, 10.89999008178711, 14.65740966796875, 18.41482925415039, 22.17224884033203, 25.929668426513672, 29.687089920043945, 33.44451141357422, 37.201927185058594, 40.9593505859375, 44.71677017211914, 48.47418975830078, 52.23160934448242, 55.98902893066406, 59.74645233154297, 63.503868103027344, 67.26129150390625, 71.01870727539062, 74.77613067626953, 78.53355407714844, 82.29097747802734, 86.04839324951172, 89.80581665039062, 93.563232421875, 97.3206558227539, 101.07807922363281, 104.83549499511719, 108.59291076660156]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 7.0, 13.0, 15.0, 15.0, 36.0, 50.0, 93.0, 129.0, 263.0, 613.0, 2740.0, 50035.0, 959256.0, 31831.0, 2252.0, 556.0, 234.0, 130.0, 80.0, 62.0, 33.0, 26.0, 24.0, 14.0, 6.0, 10.0, 9.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.671875, -24.986328125, -24.30078125, -23.615234375, -22.9296875, -22.244140625, -21.55859375, -20.873046875, -20.1875, -19.501953125, -18.81640625, -18.130859375, -17.4453125, -16.759765625, -16.07421875, -15.388671875, -14.703125, -14.017578125, -13.33203125, -12.646484375, -11.9609375, -11.275390625, -10.58984375, -9.904296875, -9.21875, -8.533203125, -7.84765625, -7.162109375, -6.4765625, -5.791015625, -5.10546875, -4.419921875, -3.734375, -3.048828125, -2.36328125, -1.677734375, -0.9921875, -0.306640625, 0.37890625, 1.064453125, 1.75, 2.435546875, 3.12109375, 3.806640625, 4.4921875, 5.177734375, 5.86328125, 6.548828125, 7.234375, 7.919921875, 8.60546875, 9.291015625, 9.9765625, 10.662109375, 11.34765625, 12.033203125, 12.71875, 13.404296875, 14.08984375, 14.775390625, 15.4609375, 16.146484375, 16.83203125, 17.517578125, 18.203125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 7.0, 18.0, 50.0, 67.0, 132.0, 149.0, 173.0, 128.0, 120.0, 81.0, 46.0, 15.0, 14.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.046875, -14.72955322265625, -14.4122314453125, -14.09490966796875, -13.777587890625, -13.46026611328125, -13.1429443359375, -12.82562255859375, -12.50830078125, -12.19097900390625, -11.8736572265625, -11.55633544921875, -11.239013671875, -10.92169189453125, -10.6043701171875, -10.28704833984375, -9.9697265625, -9.65240478515625, -9.3350830078125, -9.01776123046875, -8.700439453125, -8.38311767578125, -8.0657958984375, -7.74847412109375, -7.43115234375, -7.11383056640625, -6.7965087890625, -6.47918701171875, -6.161865234375, -5.84454345703125, -5.5272216796875, -5.20989990234375, -4.892578125, -4.57525634765625, -4.2579345703125, -3.94061279296875, -3.623291015625, -3.30596923828125, -2.9886474609375, -2.67132568359375, -2.35400390625, -2.03668212890625, -1.7193603515625, -1.40203857421875, -1.084716796875, -0.76739501953125, -0.4500732421875, -0.13275146484375, 0.1845703125, 0.50189208984375, 0.8192138671875, 1.13653564453125, 1.453857421875, 1.77117919921875, 2.0885009765625, 2.40582275390625, 2.72314453125, 3.04046630859375, 3.3577880859375, 3.67510986328125, 3.992431640625, 4.30975341796875, 4.6270751953125, 4.94439697265625, 5.26171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 4.0, 8.0, 8.0, 9.0, 11.0, 36.0, 40.0, 89.0, 157.0, 383.0, 1074.0, 3499.0, 25804.0, 713205.0, 286172.0, 14192.0, 2474.0, 732.0, 287.0, 157.0, 70.0, 53.0, 34.0, 13.0, 12.0, 11.0, 7.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.0390625, -12.6026611328125, -12.166259765625, -11.7298583984375, -11.29345703125, -10.8570556640625, -10.420654296875, -9.9842529296875, -9.5478515625, -9.1114501953125, -8.675048828125, -8.2386474609375, -7.80224609375, -7.3658447265625, -6.929443359375, -6.4930419921875, -6.056640625, -5.6202392578125, -5.183837890625, -4.7474365234375, -4.31103515625, -3.8746337890625, -3.438232421875, -3.0018310546875, -2.5654296875, -2.1290283203125, -1.692626953125, -1.2562255859375, -0.81982421875, -0.3834228515625, 0.052978515625, 0.4893798828125, 0.92578125, 1.3621826171875, 1.798583984375, 2.2349853515625, 2.67138671875, 3.1077880859375, 3.544189453125, 3.9805908203125, 4.4169921875, 4.8533935546875, 5.289794921875, 5.7261962890625, 6.16259765625, 6.5989990234375, 7.035400390625, 7.4718017578125, 7.908203125, 8.3446044921875, 8.781005859375, 9.2174072265625, 9.65380859375, 10.0902099609375, 10.526611328125, 10.9630126953125, 11.3994140625, 11.8358154296875, 12.272216796875, 12.7086181640625, 13.14501953125, 13.5814208984375, 14.017822265625, 14.4542236328125, 14.890625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 2.0, 8.0, 12.0, 8.0, 18.0, 16.0, 33.0, 25.0, 39.0, 48.0, 42.0, 39.0, 68.0, 50.0, 61.0, 79.0, 54.0, 54.0, 61.0, 48.0, 47.0, 28.0, 31.0, 17.0, 26.0, 21.0, 14.0, 11.0, 9.0, 5.0, 6.0, 8.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4453125, -10.0125732421875, -9.579833984375, -9.1470947265625, -8.71435546875, -8.2816162109375, -7.848876953125, -7.4161376953125, -6.9833984375, -6.5506591796875, -6.117919921875, -5.6851806640625, -5.25244140625, -4.8197021484375, -4.386962890625, -3.9542236328125, -3.521484375, -3.0887451171875, -2.656005859375, -2.2232666015625, -1.79052734375, -1.3577880859375, -0.925048828125, -0.4923095703125, -0.0595703125, 0.3731689453125, 0.805908203125, 1.2386474609375, 1.67138671875, 2.1041259765625, 2.536865234375, 2.9696044921875, 3.40234375, 3.8350830078125, 4.267822265625, 4.7005615234375, 5.13330078125, 5.5660400390625, 5.998779296875, 6.4315185546875, 6.8642578125, 7.2969970703125, 7.729736328125, 8.1624755859375, 8.59521484375, 9.0279541015625, 9.460693359375, 9.8934326171875, 10.326171875, 10.7589111328125, 11.191650390625, 11.6243896484375, 12.05712890625, 12.4898681640625, 12.922607421875, 13.3553466796875, 13.7880859375, 14.2208251953125, 14.653564453125, 15.0863037109375, 15.51904296875, 15.9517822265625, 16.384521484375, 16.8172607421875, 17.25]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 8.0, 9.0, 13.0, 25.0, 54.0, 161.0, 629.0, 3861.0, 38721.0, 842297.0, 151541.0, 9406.0, 1349.0, 281.0, 82.0, 40.0, 28.0, 11.0, 13.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.62890625, -5.45684814453125, -5.2847900390625, -5.11273193359375, -4.940673828125, -4.76861572265625, -4.5965576171875, -4.42449951171875, -4.25244140625, -4.08038330078125, -3.9083251953125, -3.73626708984375, -3.564208984375, -3.39215087890625, -3.2200927734375, -3.04803466796875, -2.8759765625, -2.70391845703125, -2.5318603515625, -2.35980224609375, -2.187744140625, -2.01568603515625, -1.8436279296875, -1.67156982421875, -1.49951171875, -1.32745361328125, -1.1553955078125, -0.98333740234375, -0.811279296875, -0.63922119140625, -0.4671630859375, -0.29510498046875, -0.123046875, 0.04901123046875, 0.2210693359375, 0.39312744140625, 0.565185546875, 0.73724365234375, 0.9093017578125, 1.08135986328125, 1.25341796875, 1.42547607421875, 1.5975341796875, 1.76959228515625, 1.941650390625, 2.11370849609375, 2.2857666015625, 2.45782470703125, 2.6298828125, 2.80194091796875, 2.9739990234375, 3.14605712890625, 3.318115234375, 3.49017333984375, 3.6622314453125, 3.83428955078125, 4.00634765625, 4.17840576171875, 4.3504638671875, 4.52252197265625, 4.694580078125, 4.86663818359375, 5.0386962890625, 5.21075439453125, 5.3828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 2.0, 3.0, 0.0, 6.0, 1.0, 4.0, 9.0, 8.0, 7.0, 17.0, 26.0, 34.0, 58.0, 81.0, 123.0, 146.0, 143.0, 108.0, 75.0, 52.0, 34.0, 24.0, 8.0, 7.0, 4.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007753372192382812, -0.0007494688034057617, -0.0007236003875732422, -0.0006977319717407227, -0.0006718635559082031, -0.0006459951400756836, -0.0006201267242431641, -0.0005942583084106445, -0.000568389892578125, -0.0005425214767456055, -0.0005166530609130859, -0.0004907846450805664, -0.0004649162292480469, -0.00043904781341552734, -0.0004131793975830078, -0.0003873109817504883, -0.00036144256591796875, -0.0003355741500854492, -0.0003097057342529297, -0.00028383731842041016, -0.0002579689025878906, -0.0002321004867553711, -0.00020623207092285156, -0.00018036365509033203, -0.0001544952392578125, -0.00012862682342529297, -0.00010275840759277344, -7.68899917602539e-05, -5.1021575927734375e-05, -2.5153160095214844e-05, 7.152557373046875e-07, 2.658367156982422e-05, 5.245208740234375e-05, 7.832050323486328e-05, 0.00010418891906738281, 0.00013005733489990234, 0.00015592575073242188, 0.0001817941665649414, 0.00020766258239746094, 0.00023353099822998047, 0.0002593994140625, 0.00028526782989501953, 0.00031113624572753906, 0.0003370046615600586, 0.0003628730773925781, 0.00038874149322509766, 0.0004146099090576172, 0.0004404783248901367, 0.00046634674072265625, 0.0004922151565551758, 0.0005180835723876953, 0.0005439519882202148, 0.0005698204040527344, 0.0005956888198852539, 0.0006215572357177734, 0.000647425651550293, 0.0006732940673828125, 0.000699162483215332, 0.0007250308990478516, 0.0007508993148803711, 0.0007767677307128906, 0.0008026361465454102, 0.0008285045623779297, 0.0008543729782104492, 0.0008802413940429688]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 8.0, 11.0, 14.0, 24.0, 28.0, 56.0, 96.0, 146.0, 224.0, 364.0, 741.0, 1473.0, 3098.0, 7275.0, 20803.0, 79146.0, 538292.0, 305511.0, 62377.0, 16994.0, 6136.0, 2794.0, 1350.0, 667.0, 334.0, 226.0, 128.0, 78.0, 49.0, 33.0, 22.0, 20.0, 10.0, 5.0, 5.0, 2.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.990234375, -2.911376953125, -2.83251953125, -2.753662109375, -2.6748046875, -2.595947265625, -2.51708984375, -2.438232421875, -2.359375, -2.280517578125, -2.20166015625, -2.122802734375, -2.0439453125, -1.965087890625, -1.88623046875, -1.807373046875, -1.728515625, -1.649658203125, -1.57080078125, -1.491943359375, -1.4130859375, -1.334228515625, -1.25537109375, -1.176513671875, -1.09765625, -1.018798828125, -0.93994140625, -0.861083984375, -0.7822265625, -0.703369140625, -0.62451171875, -0.545654296875, -0.466796875, -0.387939453125, -0.30908203125, -0.230224609375, -0.1513671875, -0.072509765625, 0.00634765625, 0.085205078125, 0.1640625, 0.242919921875, 0.32177734375, 0.400634765625, 0.4794921875, 0.558349609375, 0.63720703125, 0.716064453125, 0.794921875, 0.873779296875, 0.95263671875, 1.031494140625, 1.1103515625, 1.189208984375, 1.26806640625, 1.346923828125, 1.42578125, 1.504638671875, 1.58349609375, 1.662353515625, 1.7412109375, 1.820068359375, 1.89892578125, 1.977783203125, 2.056640625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 8.0, 7.0, 9.0, 14.0, 12.0, 16.0, 13.0, 23.0, 29.0, 27.0, 47.0, 54.0, 59.0, 69.0, 69.0, 70.0, 85.0, 69.0, 60.0, 39.0, 39.0, 38.0, 31.0, 21.0, 15.0, 16.0, 9.0, 8.0, 11.0, 5.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.08203125, -2.014068603515625, -1.94610595703125, -1.878143310546875, -1.8101806640625, -1.742218017578125, -1.67425537109375, -1.606292724609375, -1.538330078125, -1.470367431640625, -1.40240478515625, -1.334442138671875, -1.2664794921875, -1.198516845703125, -1.13055419921875, -1.062591552734375, -0.99462890625, -0.926666259765625, -0.85870361328125, -0.790740966796875, -0.7227783203125, -0.654815673828125, -0.58685302734375, -0.518890380859375, -0.450927734375, -0.382965087890625, -0.31500244140625, -0.247039794921875, -0.1790771484375, -0.111114501953125, -0.04315185546875, 0.024810791015625, 0.0927734375, 0.160736083984375, 0.22869873046875, 0.296661376953125, 0.3646240234375, 0.432586669921875, 0.50054931640625, 0.568511962890625, 0.636474609375, 0.704437255859375, 0.77239990234375, 0.840362548828125, 0.9083251953125, 0.976287841796875, 1.04425048828125, 1.112213134765625, 1.18017578125, 1.248138427734375, 1.31610107421875, 1.384063720703125, 1.4520263671875, 1.519989013671875, 1.58795166015625, 1.655914306640625, 1.723876953125, 1.791839599609375, 1.85980224609375, 1.927764892578125, 1.9957275390625, 2.063690185546875, 2.13165283203125, 2.199615478515625, 2.267578125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 6.0, 15.0, 19.0, 37.0, 100.0, 176.0, 284.0, 169.0, 91.0, 45.0, 14.0, 12.0, 9.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.124961853027344, -55.73387145996094, -53.3427848815918, -50.951698303222656, -48.56060791015625, -46.169517517089844, -43.7784309387207, -41.38734436035156, -38.996253967285156, -36.60516357421875, -34.21407699584961, -31.822988510131836, -29.431900024414062, -27.04081153869629, -24.649723052978516, -22.258634567260742, -19.86754608154297, -17.476457595825195, -15.085369110107422, -12.694280624389648, -10.303192138671875, -7.912103652954102, -5.521015167236328, -3.1299266815185547, -0.7388381958007812, 1.6522502899169922, 4.043338775634766, 6.434427261352539, 8.825515747070312, 11.216604232788086, 13.60769271850586, 15.998781204223633, 18.389869689941406, 20.78095817565918, 23.172046661376953, 25.563135147094727, 27.9542236328125, 30.345312118530273, 32.73640060424805, 35.12748718261719, 37.518577575683594, 39.90966796875, 42.30075454711914, 44.69184112548828, 47.08293151855469, 49.474021911621094, 51.865108489990234, 54.256195068359375, 56.64728546142578, 59.03837585449219, 61.42946243286133, 63.82054901123047, 66.21163940429688, 68.60272979736328, 70.99382019042969, 73.38490295410156, 75.77599334716797, 78.16708374023438, 80.55816650390625, 82.94925689697266, 85.34034729003906, 87.73143768310547, 90.12252807617188, 92.51361083984375, 94.90470123291016]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 11.0, 14.0, 7.0, 14.0, 14.0, 19.0, 32.0, 36.0, 33.0, 52.0, 49.0, 58.0, 66.0, 108.0, 84.0, 73.0, 66.0, 45.0, 40.0, 36.0, 30.0, 28.0, 22.0, 14.0, 13.0, 12.0, 9.0, 7.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.47370910644531, -52.51971435546875, -50.56571960449219, -48.611724853515625, -46.65773391723633, -44.703739166259766, -42.7497444152832, -40.79574966430664, -38.841758728027344, -36.88776397705078, -34.93376922607422, -32.979774475097656, -31.02578353881836, -29.071788787841797, -27.117794036865234, -25.163799285888672, -23.20980453491211, -21.255809783935547, -19.301816940307617, -17.347822189331055, -15.393828392028809, -13.439834594726562, -11.48583984375, -9.531846046447754, -7.577852249145508, -5.623858451843262, -3.6698641777038574, -1.7158699035644531, 0.23812389373779297, 2.192117691040039, 4.146112442016602, 6.100106239318848, 8.054100036621094, 10.00809383392334, 11.962087631225586, 13.916082382202148, 15.870076179504395, 17.82406997680664, 19.778064727783203, 21.732059478759766, 23.686052322387695, 25.640047073364258, 27.594039916992188, 29.54803466796875, 31.502029418945312, 33.456024169921875, 35.41001892089844, 37.364009857177734, 39.3180046081543, 41.27199935913086, 43.22599411010742, 45.17998504638672, 47.13397979736328, 49.087974548339844, 51.041969299316406, 52.99596405029297, 54.94995880126953, 56.903953552246094, 58.857948303222656, 60.81194305419922, 62.765933990478516, 64.71992492675781, 66.67391967773438, 68.62791442871094, 70.5819091796875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 3.0, 6.0, 8.0, 10.0, 11.0, 5.0, 25.0, 35.0, 33.0, 62.0, 122.0, 192.0, 454.0, 1291.0, 7026.0, 287342.0, 3862444.0, 30212.0, 3150.0, 1003.0, 427.0, 192.0, 98.0, 53.0, 24.0, 20.0, 11.0, 11.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.171875, -19.6580810546875, -19.144287109375, -18.6304931640625, -18.11669921875, -17.6029052734375, -17.089111328125, -16.5753173828125, -16.0615234375, -15.5477294921875, -15.033935546875, -14.5201416015625, -14.00634765625, -13.4925537109375, -12.978759765625, -12.4649658203125, -11.951171875, -11.4373779296875, -10.923583984375, -10.4097900390625, -9.89599609375, -9.3822021484375, -8.868408203125, -8.3546142578125, -7.8408203125, -7.3270263671875, -6.813232421875, -6.2994384765625, -5.78564453125, -5.2718505859375, -4.758056640625, -4.2442626953125, -3.73046875, -3.2166748046875, -2.702880859375, -2.1890869140625, -1.67529296875, -1.1614990234375, -0.647705078125, -0.1339111328125, 0.3798828125, 0.8936767578125, 1.407470703125, 1.9212646484375, 2.43505859375, 2.9488525390625, 3.462646484375, 3.9764404296875, 4.490234375, 5.0040283203125, 5.517822265625, 6.0316162109375, 6.54541015625, 7.0592041015625, 7.572998046875, 8.0867919921875, 8.6005859375, 9.1143798828125, 9.628173828125, 10.1419677734375, 10.65576171875, 11.1695556640625, 11.683349609375, 12.1971435546875, 12.7109375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 14.0, 23.0, 43.0, 102.0, 123.0, 182.0, 169.0, 145.0, 105.0, 57.0, 25.0, 10.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-15.5859375, -15.2547607421875, -14.923583984375, -14.5924072265625, -14.26123046875, -13.9300537109375, -13.598876953125, -13.2677001953125, -12.9365234375, -12.6053466796875, -12.274169921875, -11.9429931640625, -11.61181640625, -11.2806396484375, -10.949462890625, -10.6182861328125, -10.287109375, -9.9559326171875, -9.624755859375, -9.2935791015625, -8.96240234375, -8.6312255859375, -8.300048828125, -7.9688720703125, -7.6376953125, -7.3065185546875, -6.975341796875, -6.6441650390625, -6.31298828125, -5.9818115234375, -5.650634765625, -5.3194580078125, -4.98828125, -4.6571044921875, -4.325927734375, -3.9947509765625, -3.66357421875, -3.3323974609375, -3.001220703125, -2.6700439453125, -2.3388671875, -2.0076904296875, -1.676513671875, -1.3453369140625, -1.01416015625, -0.6829833984375, -0.351806640625, -0.0206298828125, 0.310546875, 0.6417236328125, 0.972900390625, 1.3040771484375, 1.63525390625, 1.9664306640625, 2.297607421875, 2.6287841796875, 2.9599609375, 3.2911376953125, 3.622314453125, 3.9534912109375, 4.28466796875, 4.6158447265625, 4.947021484375, 5.2781982421875, 5.609375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 3.0, 14.0, 8.0, 10.0, 13.0, 36.0, 49.0, 67.0, 143.0, 391.0, 1154.0, 5239.0, 57983.0, 3341165.0, 763151.0, 20812.0, 2847.0, 643.0, 256.0, 106.0, 66.0, 34.0, 22.0, 21.0, 13.0, 8.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.9296875, -9.5594482421875, -9.189208984375, -8.8189697265625, -8.44873046875, -8.0784912109375, -7.708251953125, -7.3380126953125, -6.9677734375, -6.5975341796875, -6.227294921875, -5.8570556640625, -5.48681640625, -5.1165771484375, -4.746337890625, -4.3760986328125, -4.005859375, -3.6356201171875, -3.265380859375, -2.8951416015625, -2.52490234375, -2.1546630859375, -1.784423828125, -1.4141845703125, -1.0439453125, -0.6737060546875, -0.303466796875, 0.0667724609375, 0.43701171875, 0.8072509765625, 1.177490234375, 1.5477294921875, 1.91796875, 2.2882080078125, 2.658447265625, 3.0286865234375, 3.39892578125, 3.7691650390625, 4.139404296875, 4.5096435546875, 4.8798828125, 5.2501220703125, 5.620361328125, 5.9906005859375, 6.36083984375, 6.7310791015625, 7.101318359375, 7.4715576171875, 7.841796875, 8.2120361328125, 8.582275390625, 8.9525146484375, 9.32275390625, 9.6929931640625, 10.063232421875, 10.4334716796875, 10.8037109375, 11.1739501953125, 11.544189453125, 11.9144287109375, 12.28466796875, 12.6549072265625, 13.025146484375, 13.3953857421875, 13.765625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 0.0, 7.0, 6.0, 14.0, 10.0, 27.0, 28.0, 36.0, 43.0, 73.0, 99.0, 158.0, 249.0, 377.0, 538.0, 637.0, 538.0, 398.0, 241.0, 181.0, 133.0, 69.0, 59.0, 40.0, 28.0, 22.0, 14.0, 14.0, 9.0, 4.0, 7.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-6.14453125, -5.96136474609375, -5.7781982421875, -5.59503173828125, -5.411865234375, -5.22869873046875, -5.0455322265625, -4.86236572265625, -4.67919921875, -4.49603271484375, -4.3128662109375, -4.12969970703125, -3.946533203125, -3.76336669921875, -3.5802001953125, -3.39703369140625, -3.2138671875, -3.03070068359375, -2.8475341796875, -2.66436767578125, -2.481201171875, -2.29803466796875, -2.1148681640625, -1.93170166015625, -1.74853515625, -1.56536865234375, -1.3822021484375, -1.19903564453125, -1.015869140625, -0.83270263671875, -0.6495361328125, -0.46636962890625, -0.283203125, -0.10003662109375, 0.0831298828125, 0.26629638671875, 0.449462890625, 0.63262939453125, 0.8157958984375, 0.99896240234375, 1.18212890625, 1.36529541015625, 1.5484619140625, 1.73162841796875, 1.914794921875, 2.09796142578125, 2.2811279296875, 2.46429443359375, 2.6474609375, 2.83062744140625, 3.0137939453125, 3.19696044921875, 3.380126953125, 3.56329345703125, 3.7464599609375, 3.92962646484375, 4.11279296875, 4.29595947265625, 4.4791259765625, 4.66229248046875, 4.845458984375, 5.02862548828125, 5.2117919921875, 5.39495849609375, 5.578125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 11.0, 18.0, 33.0, 93.0, 147.0, 255.0, 235.0, 130.0, 43.0, 19.0, 11.0, 7.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.17020416259766, -61.3540153503418, -58.53782653808594, -55.721641540527344, -52.90544891357422, -50.089263916015625, -47.273075103759766, -44.456886291503906, -41.64069747924805, -38.82450866699219, -36.00831985473633, -33.19213104248047, -30.375944137573242, -27.559755325317383, -24.743568420410156, -21.927379608154297, -19.111190795898438, -16.295001983642578, -13.478814125061035, -10.662626266479492, -7.846437454223633, -5.030248641967773, -2.214061737060547, 0.6021270751953125, 3.418315887451172, 6.234504222869873, 9.050692558288574, 11.866880416870117, 14.683069229125977, 17.499258041381836, 20.315444946289062, 23.131633758544922, 25.94781494140625, 28.76400375366211, 31.58019256591797, 34.39637756347656, 37.21257019042969, 40.02875518798828, 42.84494400024414, 45.6611328125, 48.47732162475586, 51.29351043701172, 54.10969924926758, 56.92588806152344, 59.74207305908203, 62.558265686035156, 65.37445068359375, 68.19064331054688, 71.00682830810547, 73.82301330566406, 76.63920593261719, 79.45539093017578, 82.2715835571289, 85.0877685546875, 87.90396118164062, 90.72014617919922, 93.53633117675781, 96.3525161743164, 99.16870880126953, 101.98489379882812, 104.80108642578125, 107.61727142333984, 110.43345642089844, 113.24964904785156, 116.06584167480469]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 4.0, 2.0, 10.0, 4.0, 3.0, 9.0, 13.0, 10.0, 14.0, 16.0, 28.0, 33.0, 32.0, 31.0, 31.0, 43.0, 58.0, 54.0, 54.0, 58.0, 52.0, 53.0, 51.0, 52.0, 33.0, 42.0, 36.0, 33.0, 34.0, 21.0, 22.0, 14.0, 14.0, 12.0, 8.0, 8.0, 11.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.1646785736084, -30.192157745361328, -29.21963882446289, -28.24711799621582, -27.27459716796875, -26.302078247070312, -25.329557418823242, -24.357036590576172, -23.384517669677734, -22.411996841430664, -21.439477920532227, -20.466957092285156, -19.494436264038086, -18.52191734313965, -17.549396514892578, -16.57687759399414, -15.604355812072754, -14.6318359375, -13.65931510925293, -12.686795234680176, -11.714275360107422, -10.741754531860352, -9.769234657287598, -8.796714782714844, -7.824194431304932, -6.8516740798950195, -5.879154205322266, -4.9066338539123535, -3.9341137409210205, -2.9615936279296875, -1.9890732765197754, -1.0165534019470215, -0.044033050537109375, 0.9284871220588684, 1.9010072946548462, 2.8735275268554688, 3.8460476398468018, 4.818567752838135, 5.791088104248047, 6.763607978820801, 7.736128330230713, 8.708648681640625, 9.681168556213379, 10.653688430786133, 11.626209259033203, 12.598729133605957, 13.571249008178711, 14.543769836425781, 15.516289710998535, 16.48880958557129, 17.46133041381836, 18.433849334716797, 19.406370162963867, 20.378890991210938, 21.351409912109375, 22.323930740356445, 23.296451568603516, 24.268972396850586, 25.241491317749023, 26.214012145996094, 27.186532974243164, 28.1590518951416, 29.131572723388672, 30.10409164428711, 31.07661247253418]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 12.0, 17.0, 18.0, 26.0, 25.0, 67.0, 92.0, 183.0, 467.0, 1385.0, 8227.0, 206772.0, 801358.0, 25886.0, 2758.0, 674.0, 276.0, 113.0, 66.0, 30.0, 25.0, 19.0, 18.0, 15.0, 8.0, 5.0, 8.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8046875, -14.2979736328125, -13.791259765625, -13.2845458984375, -12.77783203125, -12.2711181640625, -11.764404296875, -11.2576904296875, -10.7509765625, -10.2442626953125, -9.737548828125, -9.2308349609375, -8.72412109375, -8.2174072265625, -7.710693359375, -7.2039794921875, -6.697265625, -6.1905517578125, -5.683837890625, -5.1771240234375, -4.67041015625, -4.1636962890625, -3.656982421875, -3.1502685546875, -2.6435546875, -2.1368408203125, -1.630126953125, -1.1234130859375, -0.61669921875, -0.1099853515625, 0.396728515625, 0.9034423828125, 1.41015625, 1.9168701171875, 2.423583984375, 2.9302978515625, 3.43701171875, 3.9437255859375, 4.450439453125, 4.9571533203125, 5.4638671875, 5.9705810546875, 6.477294921875, 6.9840087890625, 7.49072265625, 7.9974365234375, 8.504150390625, 9.0108642578125, 9.517578125, 10.0242919921875, 10.531005859375, 11.0377197265625, 11.54443359375, 12.0511474609375, 12.557861328125, 13.0645751953125, 13.5712890625, 14.0780029296875, 14.584716796875, 15.0914306640625, 15.59814453125, 16.1048583984375, 16.611572265625, 17.1182861328125, 17.625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 11.0, 15.0, 26.0, 30.0, 47.0, 69.0, 66.0, 97.0, 107.0, 96.0, 85.0, 88.0, 81.0, 44.0, 58.0, 25.0, 24.0, 12.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.1484375, -7.95037841796875, -7.7523193359375, -7.55426025390625, -7.356201171875, -7.15814208984375, -6.9600830078125, -6.76202392578125, -6.56396484375, -6.36590576171875, -6.1678466796875, -5.96978759765625, -5.771728515625, -5.57366943359375, -5.3756103515625, -5.17755126953125, -4.9794921875, -4.78143310546875, -4.5833740234375, -4.38531494140625, -4.187255859375, -3.98919677734375, -3.7911376953125, -3.59307861328125, -3.39501953125, -3.19696044921875, -2.9989013671875, -2.80084228515625, -2.602783203125, -2.40472412109375, -2.2066650390625, -2.00860595703125, -1.810546875, -1.61248779296875, -1.4144287109375, -1.21636962890625, -1.018310546875, -0.82025146484375, -0.6221923828125, -0.42413330078125, -0.22607421875, -0.02801513671875, 0.1700439453125, 0.36810302734375, 0.566162109375, 0.76422119140625, 0.9622802734375, 1.16033935546875, 1.3583984375, 1.55645751953125, 1.7545166015625, 1.95257568359375, 2.150634765625, 2.34869384765625, 2.5467529296875, 2.74481201171875, 2.94287109375, 3.14093017578125, 3.3389892578125, 3.53704833984375, 3.735107421875, 3.93316650390625, 4.1312255859375, 4.32928466796875, 4.52734375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 7.0, 8.0, 13.0, 14.0, 8.0, 30.0, 44.0, 55.0, 67.0, 85.0, 181.0, 329.0, 577.0, 1553.0, 5052.0, 28098.0, 316007.0, 647113.0, 39383.0, 6480.0, 1850.0, 682.0, 345.0, 208.0, 104.0, 83.0, 52.0, 34.0, 22.0, 15.0, 11.0, 6.0, 13.0, 7.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-11.03125, -10.716796875, -10.40234375, -10.087890625, -9.7734375, -9.458984375, -9.14453125, -8.830078125, -8.515625, -8.201171875, -7.88671875, -7.572265625, -7.2578125, -6.943359375, -6.62890625, -6.314453125, -6.0, -5.685546875, -5.37109375, -5.056640625, -4.7421875, -4.427734375, -4.11328125, -3.798828125, -3.484375, -3.169921875, -2.85546875, -2.541015625, -2.2265625, -1.912109375, -1.59765625, -1.283203125, -0.96875, -0.654296875, -0.33984375, -0.025390625, 0.2890625, 0.603515625, 0.91796875, 1.232421875, 1.546875, 1.861328125, 2.17578125, 2.490234375, 2.8046875, 3.119140625, 3.43359375, 3.748046875, 4.0625, 4.376953125, 4.69140625, 5.005859375, 5.3203125, 5.634765625, 5.94921875, 6.263671875, 6.578125, 6.892578125, 7.20703125, 7.521484375, 7.8359375, 8.150390625, 8.46484375, 8.779296875, 9.09375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 8.0, 3.0, 6.0, 4.0, 7.0, 8.0, 7.0, 12.0, 11.0, 11.0, 23.0, 28.0, 20.0, 29.0, 29.0, 27.0, 39.0, 43.0, 45.0, 52.0, 54.0, 46.0, 45.0, 56.0, 55.0, 37.0, 44.0, 43.0, 38.0, 26.0, 30.0, 22.0, 15.0, 18.0, 12.0, 7.0, 7.0, 4.0, 4.0, 6.0, 10.0, 5.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.03125, -12.6419677734375, -12.252685546875, -11.8634033203125, -11.47412109375, -11.0848388671875, -10.695556640625, -10.3062744140625, -9.9169921875, -9.5277099609375, -9.138427734375, -8.7491455078125, -8.35986328125, -7.9705810546875, -7.581298828125, -7.1920166015625, -6.802734375, -6.4134521484375, -6.024169921875, -5.6348876953125, -5.24560546875, -4.8563232421875, -4.467041015625, -4.0777587890625, -3.6884765625, -3.2991943359375, -2.909912109375, -2.5206298828125, -2.13134765625, -1.7420654296875, -1.352783203125, -0.9635009765625, -0.57421875, -0.1849365234375, 0.204345703125, 0.5936279296875, 0.98291015625, 1.3721923828125, 1.761474609375, 2.1507568359375, 2.5400390625, 2.9293212890625, 3.318603515625, 3.7078857421875, 4.09716796875, 4.4864501953125, 4.875732421875, 5.2650146484375, 5.654296875, 6.0435791015625, 6.432861328125, 6.8221435546875, 7.21142578125, 7.6007080078125, 7.989990234375, 8.3792724609375, 8.7685546875, 9.1578369140625, 9.547119140625, 9.9364013671875, 10.32568359375, 10.7149658203125, 11.104248046875, 11.4935302734375, 11.8828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 4.0, 16.0, 25.0, 29.0, 44.0, 66.0, 96.0, 180.0, 310.0, 621.0, 1214.0, 2468.0, 5725.0, 16996.0, 74946.0, 751458.0, 153506.0, 26188.0, 8230.0, 3257.0, 1443.0, 777.0, 389.0, 185.0, 137.0, 80.0, 35.0, 30.0, 18.0, 6.0, 11.0, 8.0, 9.0, 8.0, 3.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.193359375, -3.092529296875, -2.99169921875, -2.890869140625, -2.7900390625, -2.689208984375, -2.58837890625, -2.487548828125, -2.38671875, -2.285888671875, -2.18505859375, -2.084228515625, -1.9833984375, -1.882568359375, -1.78173828125, -1.680908203125, -1.580078125, -1.479248046875, -1.37841796875, -1.277587890625, -1.1767578125, -1.075927734375, -0.97509765625, -0.874267578125, -0.7734375, -0.672607421875, -0.57177734375, -0.470947265625, -0.3701171875, -0.269287109375, -0.16845703125, -0.067626953125, 0.033203125, 0.134033203125, 0.23486328125, 0.335693359375, 0.4365234375, 0.537353515625, 0.63818359375, 0.739013671875, 0.83984375, 0.940673828125, 1.04150390625, 1.142333984375, 1.2431640625, 1.343994140625, 1.44482421875, 1.545654296875, 1.646484375, 1.747314453125, 1.84814453125, 1.948974609375, 2.0498046875, 2.150634765625, 2.25146484375, 2.352294921875, 2.453125, 2.553955078125, 2.65478515625, 2.755615234375, 2.8564453125, 2.957275390625, 3.05810546875, 3.158935546875, 3.259765625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 5.0, 16.0, 15.0, 28.0, 48.0, 71.0, 121.0, 179.0, 179.0, 109.0, 60.0, 34.0, 44.0, 14.0, 14.0, 15.0, 9.0, 6.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007562637329101562, -0.0007281452417373657, -0.0007000267505645752, -0.0006719082593917847, -0.0006437897682189941, -0.0006156712770462036, -0.0005875527858734131, -0.0005594342947006226, -0.000531315803527832, -0.0005031973123550415, -0.000475078821182251, -0.00044696033000946045, -0.0004188418388366699, -0.0003907233476638794, -0.00036260485649108887, -0.00033448636531829834, -0.0003063678741455078, -0.0002782493829727173, -0.00025013089179992676, -0.00022201240062713623, -0.0001938939094543457, -0.00016577541828155518, -0.00013765692710876465, -0.00010953843593597412, -8.14199447631836e-05, -5.3301453590393066e-05, -2.518296241760254e-05, 2.9355287551879883e-06, 3.1054019927978516e-05, 5.917251110076904e-05, 8.729100227355957e-05, 0.0001154094934463501, 0.00014352798461914062, 0.00017164647579193115, 0.00019976496696472168, 0.0002278834581375122, 0.00025600194931030273, 0.00028412044048309326, 0.0003122389316558838, 0.0003403574228286743, 0.00036847591400146484, 0.00039659440517425537, 0.0004247128963470459, 0.0004528313875198364, 0.00048094987869262695, 0.0005090683698654175, 0.000537186861038208, 0.0005653053522109985, 0.0005934238433837891, 0.0006215423345565796, 0.0006496608257293701, 0.0006777793169021606, 0.0007058978080749512, 0.0007340162992477417, 0.0007621347904205322, 0.0007902532815933228, 0.0008183717727661133, 0.0008464902639389038, 0.0008746087551116943, 0.0009027272462844849, 0.0009308457374572754, 0.0009589642286300659, 0.0009870827198028564, 0.001015201210975647, 0.0010433197021484375]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 8.0, 9.0, 6.0, 9.0, 8.0, 13.0, 21.0, 33.0, 54.0, 102.0, 159.0, 278.0, 480.0, 858.0, 1812.0, 4272.0, 11737.0, 41733.0, 259288.0, 639745.0, 61752.0, 15961.0, 5555.0, 2301.0, 1094.0, 530.0, 278.0, 156.0, 102.0, 59.0, 35.0, 32.0, 19.0, 19.0, 16.0, 8.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.33984375, -3.247406005859375, -3.15496826171875, -3.062530517578125, -2.9700927734375, -2.877655029296875, -2.78521728515625, -2.692779541015625, -2.600341796875, -2.507904052734375, -2.41546630859375, -2.323028564453125, -2.2305908203125, -2.138153076171875, -2.04571533203125, -1.953277587890625, -1.86083984375, -1.768402099609375, -1.67596435546875, -1.583526611328125, -1.4910888671875, -1.398651123046875, -1.30621337890625, -1.213775634765625, -1.121337890625, -1.028900146484375, -0.93646240234375, -0.844024658203125, -0.7515869140625, -0.659149169921875, -0.56671142578125, -0.474273681640625, -0.3818359375, -0.289398193359375, -0.19696044921875, -0.104522705078125, -0.0120849609375, 0.080352783203125, 0.17279052734375, 0.265228271484375, 0.357666015625, 0.450103759765625, 0.54254150390625, 0.634979248046875, 0.7274169921875, 0.819854736328125, 0.91229248046875, 1.004730224609375, 1.09716796875, 1.189605712890625, 1.28204345703125, 1.374481201171875, 1.4669189453125, 1.559356689453125, 1.65179443359375, 1.744232177734375, 1.836669921875, 1.929107666015625, 2.02154541015625, 2.113983154296875, 2.2064208984375, 2.298858642578125, 2.39129638671875, 2.483734130859375, 2.576171875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 5.0, 6.0, 8.0, 6.0, 5.0, 14.0, 17.0, 39.0, 64.0, 100.0, 176.0, 203.0, 154.0, 83.0, 40.0, 24.0, 16.0, 11.0, 7.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.49609375, -4.3480224609375, -4.199951171875, -4.0518798828125, -3.90380859375, -3.7557373046875, -3.607666015625, -3.4595947265625, -3.3115234375, -3.1634521484375, -3.015380859375, -2.8673095703125, -2.71923828125, -2.5711669921875, -2.423095703125, -2.2750244140625, -2.126953125, -1.9788818359375, -1.830810546875, -1.6827392578125, -1.53466796875, -1.3865966796875, -1.238525390625, -1.0904541015625, -0.9423828125, -0.7943115234375, -0.646240234375, -0.4981689453125, -0.35009765625, -0.2020263671875, -0.053955078125, 0.0941162109375, 0.2421875, 0.3902587890625, 0.538330078125, 0.6864013671875, 0.83447265625, 0.9825439453125, 1.130615234375, 1.2786865234375, 1.4267578125, 1.5748291015625, 1.722900390625, 1.8709716796875, 2.01904296875, 2.1671142578125, 2.315185546875, 2.4632568359375, 2.611328125, 2.7593994140625, 2.907470703125, 3.0555419921875, 3.20361328125, 3.3516845703125, 3.499755859375, 3.6478271484375, 3.7958984375, 3.9439697265625, 4.092041015625, 4.2401123046875, 4.38818359375, 4.5362548828125, 4.684326171875, 4.8323974609375, 4.98046875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 3.0, 3.0, 11.0, 63.0, 130.0, 397.0, 243.0, 87.0, 24.0, 18.0, 8.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.3323974609375, -87.90068054199219, -84.4689712524414, -81.0372543334961, -77.60554504394531, -74.173828125, -70.74211120605469, -67.3104019165039, -63.878684997558594, -60.44697189331055, -57.0152587890625, -53.58354187011719, -50.15182876586914, -46.720115661621094, -43.28840255737305, -39.856689453125, -36.42497634887695, -32.993263244628906, -29.561548233032227, -26.12983512878418, -22.6981201171875, -19.266407012939453, -15.834693908691406, -12.402978897094727, -8.97126579284668, -5.539551734924316, -2.1078381538391113, 1.3238754272460938, 4.755589485168457, 8.18730354309082, 11.619016647338867, 15.050731658935547, 18.482444763183594, 21.91415786743164, 25.34587287902832, 28.777585983276367, 32.20930099487305, 35.641014099121094, 39.07272720336914, 42.50444030761719, 45.9361572265625, 49.36787033081055, 52.799583435058594, 56.231300354003906, 59.66301345825195, 63.0947265625, 66.52644348144531, 69.9581527709961, 73.38986206054688, 76.82157897949219, 80.25328826904297, 83.68500518798828, 87.11671447753906, 90.54843139648438, 93.98014831542969, 97.41185760498047, 100.84357452392578, 104.2752914428711, 107.70700073242188, 111.13871765136719, 114.57042694091797, 118.00214385986328, 121.43385314941406, 124.86557006835938, 128.2972869873047]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 3.0, 6.0, 10.0, 12.0, 15.0, 24.0, 17.0, 25.0, 29.0, 43.0, 39.0, 57.0, 57.0, 83.0, 83.0, 98.0, 65.0, 58.0, 37.0, 36.0, 32.0, 33.0, 27.0, 21.0, 20.0, 16.0, 12.0, 5.0, 10.0, 9.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.67835235595703, -44.86335754394531, -43.048362731933594, -41.233367919921875, -39.418373107910156, -37.60337829589844, -35.78838348388672, -33.973388671875, -32.15839385986328, -30.343399047851562, -28.528404235839844, -26.713409423828125, -24.898414611816406, -23.083419799804688, -21.268423080444336, -19.453428268432617, -17.638431549072266, -15.823436737060547, -14.008441925048828, -12.193446159362793, -10.378451347351074, -8.563456535339355, -6.74846076965332, -4.933465957641602, -3.118471145629883, -1.303476095199585, 0.5115189552307129, 2.32651424407959, 4.141509056091309, 5.956503868103027, 7.7714996337890625, 9.586494445800781, 11.4014892578125, 13.216484069824219, 15.031478881835938, 16.846473693847656, 18.661468505859375, 20.476463317871094, 22.291460037231445, 24.106454849243164, 25.921449661254883, 27.7364444732666, 29.55143928527832, 31.366436004638672, 33.18143081665039, 34.99642562866211, 36.81142044067383, 38.62641525268555, 40.441410064697266, 42.256404876708984, 44.0713996887207, 45.88639450073242, 47.70138931274414, 49.51638412475586, 51.331382751464844, 53.14637756347656, 54.96137237548828, 56.7763671875, 58.59136199951172, 60.40635681152344, 62.221351623535156, 64.03634643554688, 65.8513412475586, 67.66633605957031, 69.48133087158203]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 7.0, 5.0, 12.0, 17.0, 21.0, 19.0, 47.0, 54.0, 106.0, 182.0, 437.0, 1374.0, 8114.0, 324867.0, 3811743.0, 41665.0, 3571.0, 1085.0, 430.0, 239.0, 121.0, 55.0, 31.0, 25.0, 13.0, 10.0, 6.0, 4.0, 7.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-20.84375, -20.3621826171875, -19.880615234375, -19.3990478515625, -18.91748046875, -18.4359130859375, -17.954345703125, -17.4727783203125, -16.9912109375, -16.5096435546875, -16.028076171875, -15.5465087890625, -15.06494140625, -14.5833740234375, -14.101806640625, -13.6202392578125, -13.138671875, -12.6571044921875, -12.175537109375, -11.6939697265625, -11.21240234375, -10.7308349609375, -10.249267578125, -9.7677001953125, -9.2861328125, -8.8045654296875, -8.322998046875, -7.8414306640625, -7.35986328125, -6.8782958984375, -6.396728515625, -5.9151611328125, -5.43359375, -4.9520263671875, -4.470458984375, -3.9888916015625, -3.50732421875, -3.0257568359375, -2.544189453125, -2.0626220703125, -1.5810546875, -1.0994873046875, -0.617919921875, -0.1363525390625, 0.34521484375, 0.8267822265625, 1.308349609375, 1.7899169921875, 2.271484375, 2.7530517578125, 3.234619140625, 3.7161865234375, 4.19775390625, 4.6793212890625, 5.160888671875, 5.6424560546875, 6.1240234375, 6.6055908203125, 7.087158203125, 7.5687255859375, 8.05029296875, 8.5318603515625, 9.013427734375, 9.4949951171875, 9.9765625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 12.0, 16.0, 22.0, 40.0, 59.0, 92.0, 124.0, 124.0, 117.0, 105.0, 104.0, 57.0, 45.0, 43.0, 16.0, 13.0, 9.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.8828125, -10.641357421875, -10.39990234375, -10.158447265625, -9.9169921875, -9.675537109375, -9.43408203125, -9.192626953125, -8.951171875, -8.709716796875, -8.46826171875, -8.226806640625, -7.9853515625, -7.743896484375, -7.50244140625, -7.260986328125, -7.01953125, -6.778076171875, -6.53662109375, -6.295166015625, -6.0537109375, -5.812255859375, -5.57080078125, -5.329345703125, -5.087890625, -4.846435546875, -4.60498046875, -4.363525390625, -4.1220703125, -3.880615234375, -3.63916015625, -3.397705078125, -3.15625, -2.914794921875, -2.67333984375, -2.431884765625, -2.1904296875, -1.948974609375, -1.70751953125, -1.466064453125, -1.224609375, -0.983154296875, -0.74169921875, -0.500244140625, -0.2587890625, -0.017333984375, 0.22412109375, 0.465576171875, 0.70703125, 0.948486328125, 1.18994140625, 1.431396484375, 1.6728515625, 1.914306640625, 2.15576171875, 2.397216796875, 2.638671875, 2.880126953125, 3.12158203125, 3.363037109375, 3.6044921875, 3.845947265625, 4.08740234375, 4.328857421875, 4.5703125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 10.0, 11.0, 18.0, 45.0, 50.0, 111.0, 170.0, 496.0, 1325.0, 7993.0, 153543.0, 3840920.0, 178103.0, 8954.0, 1533.0, 491.0, 248.0, 108.0, 58.0, 31.0, 22.0, 17.0, 11.0, 5.0, 8.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.5625, -12.1761474609375, -11.789794921875, -11.4034423828125, -11.01708984375, -10.6307373046875, -10.244384765625, -9.8580322265625, -9.4716796875, -9.0853271484375, -8.698974609375, -8.3126220703125, -7.92626953125, -7.5399169921875, -7.153564453125, -6.7672119140625, -6.380859375, -5.9945068359375, -5.608154296875, -5.2218017578125, -4.83544921875, -4.4490966796875, -4.062744140625, -3.6763916015625, -3.2900390625, -2.9036865234375, -2.517333984375, -2.1309814453125, -1.74462890625, -1.3582763671875, -0.971923828125, -0.5855712890625, -0.19921875, 0.1871337890625, 0.573486328125, 0.9598388671875, 1.34619140625, 1.7325439453125, 2.118896484375, 2.5052490234375, 2.8916015625, 3.2779541015625, 3.664306640625, 4.0506591796875, 4.43701171875, 4.8233642578125, 5.209716796875, 5.5960693359375, 5.982421875, 6.3687744140625, 6.755126953125, 7.1414794921875, 7.52783203125, 7.9141845703125, 8.300537109375, 8.6868896484375, 9.0732421875, 9.4595947265625, 9.845947265625, 10.2322998046875, 10.61865234375, 11.0050048828125, 11.391357421875, 11.7777099609375, 12.1640625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 10.0, 8.0, 11.0, 25.0, 22.0, 36.0, 51.0, 101.0, 108.0, 168.0, 296.0, 467.0, 719.0, 671.0, 467.0, 333.0, 180.0, 126.0, 67.0, 52.0, 45.0, 32.0, 23.0, 19.0, 13.0, 9.0, 8.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.5078125, -5.295166015625, -5.08251953125, -4.869873046875, -4.6572265625, -4.444580078125, -4.23193359375, -4.019287109375, -3.806640625, -3.593994140625, -3.38134765625, -3.168701171875, -2.9560546875, -2.743408203125, -2.53076171875, -2.318115234375, -2.10546875, -1.892822265625, -1.68017578125, -1.467529296875, -1.2548828125, -1.042236328125, -0.82958984375, -0.616943359375, -0.404296875, -0.191650390625, 0.02099609375, 0.233642578125, 0.4462890625, 0.658935546875, 0.87158203125, 1.084228515625, 1.296875, 1.509521484375, 1.72216796875, 1.934814453125, 2.1474609375, 2.360107421875, 2.57275390625, 2.785400390625, 2.998046875, 3.210693359375, 3.42333984375, 3.635986328125, 3.8486328125, 4.061279296875, 4.27392578125, 4.486572265625, 4.69921875, 4.911865234375, 5.12451171875, 5.337158203125, 5.5498046875, 5.762451171875, 5.97509765625, 6.187744140625, 6.400390625, 6.613037109375, 6.82568359375, 7.038330078125, 7.2509765625, 7.463623046875, 7.67626953125, 7.888916015625, 8.1015625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 8.0, 9.0, 41.0, 77.0, 143.0, 210.0, 223.0, 117.0, 88.0, 34.0, 28.0, 12.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.98476219177246, -26.558334350585938, -24.131906509399414, -21.70547866821289, -19.279048919677734, -16.852622985839844, -14.426193237304688, -11.999765396118164, -9.57333755493164, -7.146909713745117, -4.7204813957214355, -2.294053077697754, 0.13237476348876953, 2.558802604675293, 4.985231399536133, 7.411659240722656, 9.83808708190918, 12.264514923095703, 14.690942764282227, 17.11737060546875, 19.543800354003906, 21.970226287841797, 24.396656036376953, 26.823083877563477, 29.24951171875, 31.675939559936523, 34.10236740112305, 36.5287971496582, 38.955223083496094, 41.38165283203125, 43.808082580566406, 46.2345085144043, 48.66093444824219, 51.087364196777344, 53.513790130615234, 55.94021987915039, 58.36664581298828, 60.79307556152344, 63.219505310058594, 65.64593505859375, 68.07235717773438, 70.49878692626953, 72.92521667480469, 75.35163879394531, 77.77806854248047, 80.20449829101562, 82.63092803955078, 85.05735778808594, 87.48377990722656, 89.91020965576172, 92.33663940429688, 94.7630615234375, 97.18949127197266, 99.61592102050781, 102.04235076904297, 104.46878051757812, 106.89521026611328, 109.32164001464844, 111.7480697631836, 114.17449188232422, 116.60092163085938, 119.02735137939453, 121.45378112792969, 123.88020324707031, 126.30663299560547]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 8.0, 6.0, 7.0, 4.0, 10.0, 8.0, 7.0, 13.0, 16.0, 7.0, 28.0, 33.0, 29.0, 36.0, 37.0, 30.0, 33.0, 35.0, 46.0, 49.0, 37.0, 41.0, 55.0, 37.0, 39.0, 43.0, 32.0, 34.0, 21.0, 24.0, 21.0, 34.0, 27.0, 31.0, 17.0, 17.0, 11.0, 7.0, 6.0, 5.0, 5.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.266460418701172, -26.429790496826172, -25.593120574951172, -24.75644874572754, -23.91977882385254, -23.08310890197754, -22.246437072753906, -21.409767150878906, -20.573097229003906, -19.736427307128906, -18.899757385253906, -18.063085556030273, -17.226415634155273, -16.389745712280273, -15.553074836730957, -14.71640396118164, -13.87973403930664, -13.04306411743164, -12.206393241882324, -11.369722366333008, -10.533052444458008, -9.696382522583008, -8.859711647033691, -8.023040771484375, -7.186370849609375, -6.349700450897217, -5.513030052185059, -4.6763596534729, -3.839689254760742, -3.003018856048584, -2.166348457336426, -1.3296780586242676, -0.49300575256347656, 0.34366464614868164, 1.1803350448608398, 2.017005443572998, 2.8536758422851562, 3.6903462409973145, 4.527016639709473, 5.363687038421631, 6.200357437133789, 7.037027835845947, 7.8736982345581055, 8.710369110107422, 9.547039031982422, 10.383708953857422, 11.220379829406738, 12.057050704956055, 12.893720626831055, 13.730390548706055, 14.567061424255371, 15.403732299804688, 16.240402221679688, 17.077072143554688, 17.913742065429688, 18.75041389465332, 19.58708381652832, 20.42375373840332, 21.260425567626953, 22.097095489501953, 22.933765411376953, 23.770435333251953, 24.607105255126953, 25.443777084350586, 26.280447006225586]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 5.0, 5.0, 11.0, 13.0, 18.0, 19.0, 31.0, 38.0, 81.0, 139.0, 243.0, 575.0, 2006.0, 13020.0, 230078.0, 756325.0, 39990.0, 4198.0, 974.0, 351.0, 151.0, 98.0, 52.0, 40.0, 26.0, 13.0, 15.0, 8.0, 4.0, 7.0, 7.0, 4.0, 1.0, 4.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8984375, -14.4754638671875, -14.052490234375, -13.6295166015625, -13.20654296875, -12.7835693359375, -12.360595703125, -11.9376220703125, -11.5146484375, -11.0916748046875, -10.668701171875, -10.2457275390625, -9.82275390625, -9.3997802734375, -8.976806640625, -8.5538330078125, -8.130859375, -7.7078857421875, -7.284912109375, -6.8619384765625, -6.43896484375, -6.0159912109375, -5.593017578125, -5.1700439453125, -4.7470703125, -4.3240966796875, -3.901123046875, -3.4781494140625, -3.05517578125, -2.6322021484375, -2.209228515625, -1.7862548828125, -1.36328125, -0.9403076171875, -0.517333984375, -0.0943603515625, 0.32861328125, 0.7515869140625, 1.174560546875, 1.5975341796875, 2.0205078125, 2.4434814453125, 2.866455078125, 3.2894287109375, 3.71240234375, 4.1353759765625, 4.558349609375, 4.9813232421875, 5.404296875, 5.8272705078125, 6.250244140625, 6.6732177734375, 7.09619140625, 7.5191650390625, 7.942138671875, 8.3651123046875, 8.7880859375, 9.2110595703125, 9.634033203125, 10.0570068359375, 10.47998046875, 10.9029541015625, 11.325927734375, 11.7489013671875, 12.171875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 9.0, 19.0, 28.0, 37.0, 55.0, 59.0, 97.0, 114.0, 105.0, 99.0, 103.0, 83.0, 63.0, 56.0, 33.0, 13.0, 11.0, 10.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.203125, -8.97113037109375, -8.7391357421875, -8.50714111328125, -8.275146484375, -8.04315185546875, -7.8111572265625, -7.57916259765625, -7.34716796875, -7.11517333984375, -6.8831787109375, -6.65118408203125, -6.419189453125, -6.18719482421875, -5.9552001953125, -5.72320556640625, -5.4912109375, -5.25921630859375, -5.0272216796875, -4.79522705078125, -4.563232421875, -4.33123779296875, -4.0992431640625, -3.86724853515625, -3.63525390625, -3.40325927734375, -3.1712646484375, -2.93927001953125, -2.707275390625, -2.47528076171875, -2.2432861328125, -2.01129150390625, -1.779296875, -1.54730224609375, -1.3153076171875, -1.08331298828125, -0.851318359375, -0.61932373046875, -0.3873291015625, -0.15533447265625, 0.07666015625, 0.30865478515625, 0.5406494140625, 0.77264404296875, 1.004638671875, 1.23663330078125, 1.4686279296875, 1.70062255859375, 1.9326171875, 2.16461181640625, 2.3966064453125, 2.62860107421875, 2.860595703125, 3.09259033203125, 3.3245849609375, 3.55657958984375, 3.78857421875, 4.02056884765625, 4.2525634765625, 4.48455810546875, 4.716552734375, 4.94854736328125, 5.1805419921875, 5.41253662109375, 5.64453125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 8.0, 8.0, 4.0, 13.0, 15.0, 20.0, 36.0, 67.0, 60.0, 99.0, 161.0, 264.0, 473.0, 822.0, 1729.0, 4434.0, 16189.0, 112379.0, 800020.0, 90057.0, 14127.0, 3982.0, 1691.0, 758.0, 417.0, 242.0, 137.0, 101.0, 61.0, 56.0, 26.0, 31.0, 15.0, 9.0, 14.0, 5.0, 9.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.890625, -9.594970703125, -9.29931640625, -9.003662109375, -8.7080078125, -8.412353515625, -8.11669921875, -7.821044921875, -7.525390625, -7.229736328125, -6.93408203125, -6.638427734375, -6.3427734375, -6.047119140625, -5.75146484375, -5.455810546875, -5.16015625, -4.864501953125, -4.56884765625, -4.273193359375, -3.9775390625, -3.681884765625, -3.38623046875, -3.090576171875, -2.794921875, -2.499267578125, -2.20361328125, -1.907958984375, -1.6123046875, -1.316650390625, -1.02099609375, -0.725341796875, -0.4296875, -0.134033203125, 0.16162109375, 0.457275390625, 0.7529296875, 1.048583984375, 1.34423828125, 1.639892578125, 1.935546875, 2.231201171875, 2.52685546875, 2.822509765625, 3.1181640625, 3.413818359375, 3.70947265625, 4.005126953125, 4.30078125, 4.596435546875, 4.89208984375, 5.187744140625, 5.4833984375, 5.779052734375, 6.07470703125, 6.370361328125, 6.666015625, 6.961669921875, 7.25732421875, 7.552978515625, 7.8486328125, 8.144287109375, 8.43994140625, 8.735595703125, 9.03125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 9.0, 8.0, 13.0, 17.0, 34.0, 40.0, 55.0, 77.0, 104.0, 88.0, 128.0, 113.0, 93.0, 77.0, 50.0, 29.0, 27.0, 9.0, 9.0, 10.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.453125, -23.563232421875, -22.67333984375, -21.783447265625, -20.8935546875, -20.003662109375, -19.11376953125, -18.223876953125, -17.333984375, -16.444091796875, -15.55419921875, -14.664306640625, -13.7744140625, -12.884521484375, -11.99462890625, -11.104736328125, -10.21484375, -9.324951171875, -8.43505859375, -7.545166015625, -6.6552734375, -5.765380859375, -4.87548828125, -3.985595703125, -3.095703125, -2.205810546875, -1.31591796875, -0.426025390625, 0.4638671875, 1.353759765625, 2.24365234375, 3.133544921875, 4.0234375, 4.913330078125, 5.80322265625, 6.693115234375, 7.5830078125, 8.472900390625, 9.36279296875, 10.252685546875, 11.142578125, 12.032470703125, 12.92236328125, 13.812255859375, 14.7021484375, 15.592041015625, 16.48193359375, 17.371826171875, 18.26171875, 19.151611328125, 20.04150390625, 20.931396484375, 21.8212890625, 22.711181640625, 23.60107421875, 24.490966796875, 25.380859375, 26.270751953125, 27.16064453125, 28.050537109375, 28.9404296875, 29.830322265625, 30.72021484375, 31.610107421875, 32.5]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 9.0, 12.0, 4.0, 8.0, 10.0, 13.0, 19.0, 27.0, 41.0, 63.0, 83.0, 124.0, 182.0, 458.0, 1080.0, 3380.0, 13479.0, 103282.0, 862345.0, 50872.0, 8881.0, 2423.0, 821.0, 351.0, 210.0, 113.0, 59.0, 49.0, 46.0, 24.0, 15.0, 13.0, 10.0, 5.0, 5.0, 9.0, 5.0, 3.0, 2.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.552734375, -3.439453125, -3.326171875, -3.212890625, -3.099609375, -2.986328125, -2.873046875, -2.759765625, -2.646484375, -2.533203125, -2.419921875, -2.306640625, -2.193359375, -2.080078125, -1.966796875, -1.853515625, -1.740234375, -1.626953125, -1.513671875, -1.400390625, -1.287109375, -1.173828125, -1.060546875, -0.947265625, -0.833984375, -0.720703125, -0.607421875, -0.494140625, -0.380859375, -0.267578125, -0.154296875, -0.041015625, 0.072265625, 0.185546875, 0.298828125, 0.412109375, 0.525390625, 0.638671875, 0.751953125, 0.865234375, 0.978515625, 1.091796875, 1.205078125, 1.318359375, 1.431640625, 1.544921875, 1.658203125, 1.771484375, 1.884765625, 1.998046875, 2.111328125, 2.224609375, 2.337890625, 2.451171875, 2.564453125, 2.677734375, 2.791015625, 2.904296875, 3.017578125, 3.130859375, 3.244140625, 3.357421875, 3.470703125, 3.583984375, 3.697265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 10.0, 8.0, 7.0, 8.0, 18.0, 11.0, 25.0, 31.0, 64.0, 135.0, 155.0, 194.0, 109.0, 68.0, 23.0, 27.0, 21.0, 22.0, 5.0, 12.0, 8.0, 4.0, 5.0, 5.0, 5.0, 5.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007615089416503906, -0.0007369443774223328, -0.0007123798131942749, -0.000687815248966217, -0.0006632506847381592, -0.0006386861205101013, -0.0006141215562820435, -0.0005895569920539856, -0.0005649924278259277, -0.0005404278635978699, -0.000515863299369812, -0.0004912987351417542, -0.0004667341709136963, -0.00044216960668563843, -0.00041760504245758057, -0.0003930404782295227, -0.00036847591400146484, -0.000343911349773407, -0.0003193467855453491, -0.00029478222131729126, -0.0002702176570892334, -0.00024565309286117554, -0.00022108852863311768, -0.00019652396440505981, -0.00017195940017700195, -0.0001473948359489441, -0.00012283027172088623, -9.826570749282837e-05, -7.370114326477051e-05, -4.9136579036712646e-05, -2.4572014808654785e-05, -7.450580596923828e-09, 2.4557113647460938e-05, 4.91216778755188e-05, 7.368624210357666e-05, 9.825080633163452e-05, 0.00012281537055969238, 0.00014737993478775024, 0.0001719444990158081, 0.00019650906324386597, 0.00022107362747192383, 0.0002456381916999817, 0.00027020275592803955, 0.0002947673201560974, 0.0003193318843841553, 0.00034389644861221313, 0.000368461012840271, 0.00039302557706832886, 0.0004175901412963867, 0.0004421547055244446, 0.00046671926975250244, 0.0004912838339805603, 0.0005158483982086182, 0.000540412962436676, 0.0005649775266647339, 0.0005895420908927917, 0.0006141066551208496, 0.0006386712193489075, 0.0006632357835769653, 0.0006878003478050232, 0.0007123649120330811, 0.0007369294762611389, 0.0007614940404891968, 0.0007860586047172546, 0.0008106231689453125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 9.0, 6.0, 9.0, 8.0, 20.0, 30.0, 37.0, 49.0, 73.0, 121.0, 183.0, 322.0, 581.0, 1256.0, 2655.0, 6376.0, 19551.0, 88398.0, 746149.0, 141052.0, 26965.0, 8269.0, 3297.0, 1419.0, 692.0, 379.0, 220.0, 150.0, 102.0, 45.0, 42.0, 25.0, 19.0, 13.0, 8.0, 6.0, 5.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.259765625, -2.1834716796875, -2.107177734375, -2.0308837890625, -1.95458984375, -1.8782958984375, -1.802001953125, -1.7257080078125, -1.6494140625, -1.5731201171875, -1.496826171875, -1.4205322265625, -1.34423828125, -1.2679443359375, -1.191650390625, -1.1153564453125, -1.0390625, -0.9627685546875, -0.886474609375, -0.8101806640625, -0.73388671875, -0.6575927734375, -0.581298828125, -0.5050048828125, -0.4287109375, -0.3524169921875, -0.276123046875, -0.1998291015625, -0.12353515625, -0.0472412109375, 0.029052734375, 0.1053466796875, 0.181640625, 0.2579345703125, 0.334228515625, 0.4105224609375, 0.48681640625, 0.5631103515625, 0.639404296875, 0.7156982421875, 0.7919921875, 0.8682861328125, 0.944580078125, 1.0208740234375, 1.09716796875, 1.1734619140625, 1.249755859375, 1.3260498046875, 1.40234375, 1.4786376953125, 1.554931640625, 1.6312255859375, 1.70751953125, 1.7838134765625, 1.860107421875, 1.9364013671875, 2.0126953125, 2.0889892578125, 2.165283203125, 2.2415771484375, 2.31787109375, 2.3941650390625, 2.470458984375, 2.5467529296875, 2.623046875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 6.0, 6.0, 13.0, 15.0, 34.0, 30.0, 53.0, 68.0, 101.0, 124.0, 145.0, 109.0, 91.0, 59.0, 39.0, 34.0, 18.0, 7.0, 9.0, 7.0, 10.0, 8.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-4.00390625, -3.906494140625, -3.80908203125, -3.711669921875, -3.6142578125, -3.516845703125, -3.41943359375, -3.322021484375, -3.224609375, -3.127197265625, -3.02978515625, -2.932373046875, -2.8349609375, -2.737548828125, -2.64013671875, -2.542724609375, -2.4453125, -2.347900390625, -2.25048828125, -2.153076171875, -2.0556640625, -1.958251953125, -1.86083984375, -1.763427734375, -1.666015625, -1.568603515625, -1.47119140625, -1.373779296875, -1.2763671875, -1.178955078125, -1.08154296875, -0.984130859375, -0.88671875, -0.789306640625, -0.69189453125, -0.594482421875, -0.4970703125, -0.399658203125, -0.30224609375, -0.204833984375, -0.107421875, -0.010009765625, 0.08740234375, 0.184814453125, 0.2822265625, 0.379638671875, 0.47705078125, 0.574462890625, 0.671875, 0.769287109375, 0.86669921875, 0.964111328125, 1.0615234375, 1.158935546875, 1.25634765625, 1.353759765625, 1.451171875, 1.548583984375, 1.64599609375, 1.743408203125, 1.8408203125, 1.938232421875, 2.03564453125, 2.133056640625, 2.23046875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 6.0, 6.0, 17.0, 33.0, 88.0, 327.0, 350.0, 103.0, 39.0, 19.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.65951538085938, -114.95042419433594, -111.2413330078125, -107.53224182128906, -103.82315826416016, -100.11406707763672, -96.40497589111328, -92.69588470458984, -88.98680114746094, -85.2777099609375, -81.56861877441406, -77.85952758789062, -74.15044403076172, -70.44135284423828, -66.73226165771484, -63.023170471191406, -59.31407928466797, -55.60498809814453, -51.89590072631836, -48.18680953979492, -44.47772216796875, -40.76863098144531, -37.059539794921875, -33.35044860839844, -29.641361236572266, -25.93227195739746, -22.223182678222656, -18.51409149169922, -14.805002212524414, -11.09591293334961, -7.386821746826172, -3.677732467651367, 0.03134918212890625, 3.740438938140869, 7.449528694152832, 11.158618927001953, 14.867708206176758, 18.576797485351562, 22.285888671875, 25.994977951049805, 29.70406723022461, 33.41315841674805, 37.12224578857422, 40.831336975097656, 44.540428161621094, 48.249515533447266, 51.9586067199707, 55.667694091796875, 59.37678527832031, 63.08587646484375, 66.79496765136719, 70.50405883789062, 74.21314239501953, 77.92223358154297, 81.6313247680664, 85.34041595458984, 89.04949951171875, 92.75859069824219, 96.46768188476562, 100.17677307128906, 103.88585662841797, 107.5949478149414, 111.30403900146484, 115.01313018798828, 118.72222137451172]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 8.0, 14.0, 25.0, 26.0, 28.0, 26.0, 53.0, 77.0, 106.0, 167.0, 134.0, 84.0, 48.0, 55.0, 30.0, 44.0, 20.0, 19.0, 12.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.20704650878906, -67.14698791503906, -64.08692932128906, -61.0268669128418, -57.96680450439453, -54.90674591064453, -51.84668731689453, -48.786624908447266, -45.7265625, -42.66650390625, -39.606441497802734, -36.546382904052734, -33.48632049560547, -30.42626190185547, -27.366201400756836, -24.306140899658203, -21.246082305908203, -18.18602180480957, -15.125961303710938, -12.065901756286621, -9.005841255187988, -5.9457807540893555, -2.885721206665039, 0.17433929443359375, 3.2343997955322266, 6.294460296630859, 9.354520797729492, 12.414580345153809, 15.474640846252441, 18.53470230102539, 21.59476089477539, 24.654821395874023, 27.714881896972656, 30.77494239807129, 33.83500289916992, 36.89506149291992, 39.95512390136719, 43.01518249511719, 46.07524108886719, 49.13530349731445, 52.19536590576172, 55.25542449951172, 58.315486907958984, 61.375545501708984, 64.43560791015625, 67.49566650390625, 70.55572509765625, 73.61578369140625, 76.67584228515625, 79.73590087890625, 82.79595947265625, 85.85602569580078, 88.91608428955078, 91.97614288330078, 95.03620147705078, 98.09626770019531, 101.15632629394531, 104.21638488769531, 107.27644348144531, 110.33650970458984, 113.39656829833984, 116.45662689208984, 119.51668548583984, 122.57675170898438, 125.63681030273438]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 2.0, 2.0, 5.0, 9.0, 5.0, 11.0, 9.0, 16.0, 24.0, 28.0, 33.0, 57.0, 77.0, 104.0, 204.0, 380.0, 934.0, 2943.0, 18110.0, 672813.0, 3417276.0, 71555.0, 6380.0, 1817.0, 706.0, 326.0, 179.0, 104.0, 62.0, 38.0, 23.0, 25.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.046875, -18.5213623046875, -17.995849609375, -17.4703369140625, -16.94482421875, -16.4193115234375, -15.893798828125, -15.3682861328125, -14.8427734375, -14.3172607421875, -13.791748046875, -13.2662353515625, -12.74072265625, -12.2152099609375, -11.689697265625, -11.1641845703125, -10.638671875, -10.1131591796875, -9.587646484375, -9.0621337890625, -8.53662109375, -8.0111083984375, -7.485595703125, -6.9600830078125, -6.4345703125, -5.9090576171875, -5.383544921875, -4.8580322265625, -4.33251953125, -3.8070068359375, -3.281494140625, -2.7559814453125, -2.23046875, -1.7049560546875, -1.179443359375, -0.6539306640625, -0.12841796875, 0.3970947265625, 0.922607421875, 1.4481201171875, 1.9736328125, 2.4991455078125, 3.024658203125, 3.5501708984375, 4.07568359375, 4.6011962890625, 5.126708984375, 5.6522216796875, 6.177734375, 6.7032470703125, 7.228759765625, 7.7542724609375, 8.27978515625, 8.8052978515625, 9.330810546875, 9.8563232421875, 10.3818359375, 10.9073486328125, 11.432861328125, 11.9583740234375, 12.48388671875, 13.0093994140625, 13.534912109375, 14.0604248046875, 14.5859375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 5.0, 4.0, 1.0, 4.0, 5.0, 11.0, 8.0, 10.0, 7.0, 12.0, 10.0, 20.0, 10.0, 29.0, 25.0, 24.0, 28.0, 34.0, 35.0, 32.0, 40.0, 44.0, 41.0, 49.0, 38.0, 37.0, 36.0, 45.0, 40.0, 35.0, 27.0, 29.0, 28.0, 28.0, 22.0, 28.0, 17.0, 13.0, 19.0, 8.0, 10.0, 9.0, 7.0, 5.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.609375, -2.52581787109375, -2.4422607421875, -2.35870361328125, -2.275146484375, -2.19158935546875, -2.1080322265625, -2.02447509765625, -1.94091796875, -1.85736083984375, -1.7738037109375, -1.69024658203125, -1.606689453125, -1.52313232421875, -1.4395751953125, -1.35601806640625, -1.2724609375, -1.18890380859375, -1.1053466796875, -1.02178955078125, -0.938232421875, -0.85467529296875, -0.7711181640625, -0.68756103515625, -0.60400390625, -0.52044677734375, -0.4368896484375, -0.35333251953125, -0.269775390625, -0.18621826171875, -0.1026611328125, -0.01910400390625, 0.064453125, 0.14801025390625, 0.2315673828125, 0.31512451171875, 0.398681640625, 0.48223876953125, 0.5657958984375, 0.64935302734375, 0.73291015625, 0.81646728515625, 0.9000244140625, 0.98358154296875, 1.067138671875, 1.15069580078125, 1.2342529296875, 1.31781005859375, 1.4013671875, 1.48492431640625, 1.5684814453125, 1.65203857421875, 1.735595703125, 1.81915283203125, 1.9027099609375, 1.98626708984375, 2.06982421875, 2.15338134765625, 2.2369384765625, 2.32049560546875, 2.404052734375, 2.48760986328125, 2.5711669921875, 2.65472412109375, 2.73828125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 0.0, 3.0, 4.0, 2.0, 3.0, 10.0, 13.0, 16.0, 23.0, 33.0, 76.0, 103.0, 222.0, 564.0, 1471.0, 5339.0, 128157.0, 4032256.0, 21251.0, 2947.0, 1006.0, 385.0, 167.0, 107.0, 41.0, 29.0, 13.0, 9.0, 7.0, 10.0, 2.0, 2.0, 7.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.375, -25.37255859375, -24.3701171875, -23.36767578125, -22.365234375, -21.36279296875, -20.3603515625, -19.35791015625, -18.35546875, -17.35302734375, -16.3505859375, -15.34814453125, -14.345703125, -13.34326171875, -12.3408203125, -11.33837890625, -10.3359375, -9.33349609375, -8.3310546875, -7.32861328125, -6.326171875, -5.32373046875, -4.3212890625, -3.31884765625, -2.31640625, -1.31396484375, -0.3115234375, 0.69091796875, 1.693359375, 2.69580078125, 3.6982421875, 4.70068359375, 5.703125, 6.70556640625, 7.7080078125, 8.71044921875, 9.712890625, 10.71533203125, 11.7177734375, 12.72021484375, 13.72265625, 14.72509765625, 15.7275390625, 16.72998046875, 17.732421875, 18.73486328125, 19.7373046875, 20.73974609375, 21.7421875, 22.74462890625, 23.7470703125, 24.74951171875, 25.751953125, 26.75439453125, 27.7568359375, 28.75927734375, 29.76171875, 30.76416015625, 31.7666015625, 32.76904296875, 33.771484375, 34.77392578125, 35.7763671875, 36.77880859375, 37.78125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 11.0, 10.0, 13.0, 31.0, 23.0, 63.0, 69.0, 118.0, 173.0, 335.0, 482.0, 672.0, 722.0, 512.0, 305.0, 192.0, 129.0, 75.0, 53.0, 31.0, 17.0, 11.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.7578125, -15.3447265625, -14.931640625, -14.5185546875, -14.10546875, -13.6923828125, -13.279296875, -12.8662109375, -12.453125, -12.0400390625, -11.626953125, -11.2138671875, -10.80078125, -10.3876953125, -9.974609375, -9.5615234375, -9.1484375, -8.7353515625, -8.322265625, -7.9091796875, -7.49609375, -7.0830078125, -6.669921875, -6.2568359375, -5.84375, -5.4306640625, -5.017578125, -4.6044921875, -4.19140625, -3.7783203125, -3.365234375, -2.9521484375, -2.5390625, -2.1259765625, -1.712890625, -1.2998046875, -0.88671875, -0.4736328125, -0.060546875, 0.3525390625, 0.765625, 1.1787109375, 1.591796875, 2.0048828125, 2.41796875, 2.8310546875, 3.244140625, 3.6572265625, 4.0703125, 4.4833984375, 4.896484375, 5.3095703125, 5.72265625, 6.1357421875, 6.548828125, 6.9619140625, 7.375, 7.7880859375, 8.201171875, 8.6142578125, 9.02734375, 9.4404296875, 9.853515625, 10.2666015625, 10.6796875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 12.0, 11.0, 15.0, 23.0, 51.0, 92.0, 148.0, 198.0, 179.0, 95.0, 53.0, 40.0, 24.0, 8.0, 14.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-171.84359741210938, -167.71087646484375, -163.57815551757812, -159.44541931152344, -155.3126983642578, -151.1799774169922, -147.04725646972656, -142.91453552246094, -138.78179931640625, -134.64907836914062, -130.516357421875, -126.38362884521484, -122.25090026855469, -118.11817932128906, -113.98545837402344, -109.85273742675781, -105.72001647949219, -101.58729553222656, -97.4545669555664, -93.32184600830078, -89.18911743164062, -85.056396484375, -80.92367553710938, -76.79095458984375, -72.6582260131836, -68.52550506591797, -64.39277648925781, -60.26005554199219, -56.1273307800293, -51.994606018066406, -47.86188507080078, -43.72916030883789, -39.596435546875, -35.46371078491211, -31.33098793029785, -27.198265075683594, -23.065540313720703, -18.932815551757812, -14.800092697143555, -10.667369842529297, -6.534645080566406, -2.401921272277832, 1.7308025360107422, 5.863526344299316, 9.99625015258789, 14.128974914550781, 18.26169776916504, 22.394420623779297, 26.527145385742188, 30.659870147705078, 34.79259490966797, 38.925315856933594, 43.058040618896484, 47.190765380859375, 51.323486328125, 55.45621109008789, 59.58893585205078, 63.72166061401367, 67.85438537597656, 71.98710632324219, 76.11982727050781, 80.25255584716797, 84.3852767944336, 88.51800537109375, 92.65072631835938]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 7.0, 3.0, 9.0, 10.0, 12.0, 13.0, 18.0, 30.0, 32.0, 36.0, 46.0, 46.0, 68.0, 65.0, 54.0, 71.0, 62.0, 61.0, 55.0, 53.0, 42.0, 33.0, 29.0, 29.0, 17.0, 25.0, 17.0, 13.0, 11.0, 13.0, 11.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.99542236328125, -62.805091857910156, -60.61476135253906, -58.42443084716797, -56.234100341796875, -54.04376983642578, -51.85343933105469, -49.663108825683594, -47.4727783203125, -45.282447814941406, -43.09211730957031, -40.90178680419922, -38.711456298828125, -36.52112579345703, -34.33079528808594, -32.140464782714844, -29.95013427734375, -27.759803771972656, -25.569473266601562, -23.37914276123047, -21.188812255859375, -18.99848175048828, -16.808151245117188, -14.617820739746094, -12.427490234375, -10.237159729003906, -8.046829223632812, -5.856498718261719, -3.666168212890625, -1.4758377075195312, 0.7144927978515625, 2.9048233032226562, 5.09515380859375, 7.285484313964844, 9.475814819335938, 11.666145324707031, 13.856475830078125, 16.04680633544922, 18.237136840820312, 20.427467346191406, 22.6177978515625, 24.808128356933594, 26.998458862304688, 29.18878936767578, 31.379119873046875, 33.56945037841797, 35.75978088378906, 37.950111389160156, 40.14044189453125, 42.330772399902344, 44.52110290527344, 46.71143341064453, 48.901763916015625, 51.09209442138672, 53.28242492675781, 55.472755432128906, 57.6630859375, 59.853416442871094, 62.04374694824219, 64.23407745361328, 66.42440795898438, 68.61473846435547, 70.80506896972656, 72.99539947509766, 75.18572998046875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 7.0, 9.0, 6.0, 7.0, 17.0, 19.0, 21.0, 39.0, 89.0, 127.0, 340.0, 981.0, 3367.0, 16601.0, 173461.0, 787985.0, 54652.0, 7838.0, 1895.0, 587.0, 261.0, 93.0, 51.0, 28.0, 16.0, 13.0, 12.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.203125, -10.8070068359375, -10.410888671875, -10.0147705078125, -9.61865234375, -9.2225341796875, -8.826416015625, -8.4302978515625, -8.0341796875, -7.6380615234375, -7.241943359375, -6.8458251953125, -6.44970703125, -6.0535888671875, -5.657470703125, -5.2613525390625, -4.865234375, -4.4691162109375, -4.072998046875, -3.6768798828125, -3.28076171875, -2.8846435546875, -2.488525390625, -2.0924072265625, -1.6962890625, -1.3001708984375, -0.904052734375, -0.5079345703125, -0.11181640625, 0.2843017578125, 0.680419921875, 1.0765380859375, 1.47265625, 1.8687744140625, 2.264892578125, 2.6610107421875, 3.05712890625, 3.4532470703125, 3.849365234375, 4.2454833984375, 4.6416015625, 5.0377197265625, 5.433837890625, 5.8299560546875, 6.22607421875, 6.6221923828125, 7.018310546875, 7.4144287109375, 7.810546875, 8.2066650390625, 8.602783203125, 8.9989013671875, 9.39501953125, 9.7911376953125, 10.187255859375, 10.5833740234375, 10.9794921875, 11.3756103515625, 11.771728515625, 12.1678466796875, 12.56396484375, 12.9600830078125, 13.356201171875, 13.7523193359375, 14.1484375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 7.0, 12.0, 17.0, 18.0, 23.0, 26.0, 24.0, 48.0, 50.0, 62.0, 61.0, 56.0, 78.0, 80.0, 57.0, 62.0, 55.0, 53.0, 34.0, 41.0, 27.0, 22.0, 19.0, 21.0, 8.0, 10.0, 12.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.81640625, -5.64111328125, -5.4658203125, -5.29052734375, -5.115234375, -4.93994140625, -4.7646484375, -4.58935546875, -4.4140625, -4.23876953125, -4.0634765625, -3.88818359375, -3.712890625, -3.53759765625, -3.3623046875, -3.18701171875, -3.01171875, -2.83642578125, -2.6611328125, -2.48583984375, -2.310546875, -2.13525390625, -1.9599609375, -1.78466796875, -1.609375, -1.43408203125, -1.2587890625, -1.08349609375, -0.908203125, -0.73291015625, -0.5576171875, -0.38232421875, -0.20703125, -0.03173828125, 0.1435546875, 0.31884765625, 0.494140625, 0.66943359375, 0.8447265625, 1.02001953125, 1.1953125, 1.37060546875, 1.5458984375, 1.72119140625, 1.896484375, 2.07177734375, 2.2470703125, 2.42236328125, 2.59765625, 2.77294921875, 2.9482421875, 3.12353515625, 3.298828125, 3.47412109375, 3.6494140625, 3.82470703125, 4.0, 4.17529296875, 4.3505859375, 4.52587890625, 4.701171875, 4.87646484375, 5.0517578125, 5.22705078125, 5.40234375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 6.0, 11.0, 10.0, 18.0, 21.0, 32.0, 20.0, 48.0, 75.0, 101.0, 142.0, 304.0, 509.0, 1167.0, 3089.0, 10519.0, 55205.0, 845722.0, 106854.0, 16895.0, 4526.0, 1642.0, 703.0, 361.0, 188.0, 92.0, 86.0, 45.0, 41.0, 23.0, 26.0, 17.0, 10.0, 18.0, 6.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.71875, -6.475830078125, -6.23291015625, -5.989990234375, -5.7470703125, -5.504150390625, -5.26123046875, -5.018310546875, -4.775390625, -4.532470703125, -4.28955078125, -4.046630859375, -3.8037109375, -3.560791015625, -3.31787109375, -3.074951171875, -2.83203125, -2.589111328125, -2.34619140625, -2.103271484375, -1.8603515625, -1.617431640625, -1.37451171875, -1.131591796875, -0.888671875, -0.645751953125, -0.40283203125, -0.159912109375, 0.0830078125, 0.325927734375, 0.56884765625, 0.811767578125, 1.0546875, 1.297607421875, 1.54052734375, 1.783447265625, 2.0263671875, 2.269287109375, 2.51220703125, 2.755126953125, 2.998046875, 3.240966796875, 3.48388671875, 3.726806640625, 3.9697265625, 4.212646484375, 4.45556640625, 4.698486328125, 4.94140625, 5.184326171875, 5.42724609375, 5.670166015625, 5.9130859375, 6.156005859375, 6.39892578125, 6.641845703125, 6.884765625, 7.127685546875, 7.37060546875, 7.613525390625, 7.8564453125, 8.099365234375, 8.34228515625, 8.585205078125, 8.828125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 5.0, 7.0, 9.0, 12.0, 14.0, 12.0, 28.0, 21.0, 30.0, 27.0, 44.0, 50.0, 44.0, 70.0, 67.0, 74.0, 82.0, 63.0, 66.0, 42.0, 33.0, 36.0, 29.0, 24.0, 15.0, 20.0, 14.0, 11.0, 10.0, 4.0, 7.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.921875, -15.404052734375, -14.88623046875, -14.368408203125, -13.8505859375, -13.332763671875, -12.81494140625, -12.297119140625, -11.779296875, -11.261474609375, -10.74365234375, -10.225830078125, -9.7080078125, -9.190185546875, -8.67236328125, -8.154541015625, -7.63671875, -7.118896484375, -6.60107421875, -6.083251953125, -5.5654296875, -5.047607421875, -4.52978515625, -4.011962890625, -3.494140625, -2.976318359375, -2.45849609375, -1.940673828125, -1.4228515625, -0.905029296875, -0.38720703125, 0.130615234375, 0.6484375, 1.166259765625, 1.68408203125, 2.201904296875, 2.7197265625, 3.237548828125, 3.75537109375, 4.273193359375, 4.791015625, 5.308837890625, 5.82666015625, 6.344482421875, 6.8623046875, 7.380126953125, 7.89794921875, 8.415771484375, 8.93359375, 9.451416015625, 9.96923828125, 10.487060546875, 11.0048828125, 11.522705078125, 12.04052734375, 12.558349609375, 13.076171875, 13.593994140625, 14.11181640625, 14.629638671875, 15.1474609375, 15.665283203125, 16.18310546875, 16.700927734375, 17.21875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 7.0, 6.0, 3.0, 7.0, 12.0, 11.0, 26.0, 17.0, 26.0, 42.0, 58.0, 80.0, 111.0, 176.0, 244.0, 327.0, 561.0, 1019.0, 1737.0, 3452.0, 7342.0, 18039.0, 54035.0, 661274.0, 220954.0, 47982.0, 16595.0, 7034.0, 3158.0, 1651.0, 942.0, 574.0, 323.0, 246.0, 141.0, 87.0, 71.0, 60.0, 35.0, 19.0, 15.0, 13.0, 9.0, 13.0, 11.0, 3.0, 8.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.029296875, -0.9980621337890625, -0.966827392578125, -0.9355926513671875, -0.90435791015625, -0.8731231689453125, -0.841888427734375, -0.8106536865234375, -0.7794189453125, -0.7481842041015625, -0.716949462890625, -0.6857147216796875, -0.65447998046875, -0.6232452392578125, -0.592010498046875, -0.5607757568359375, -0.529541015625, -0.4983062744140625, -0.467071533203125, -0.4358367919921875, -0.40460205078125, -0.3733673095703125, -0.342132568359375, -0.3108978271484375, -0.2796630859375, -0.2484283447265625, -0.217193603515625, -0.1859588623046875, -0.15472412109375, -0.1234893798828125, -0.092254638671875, -0.0610198974609375, -0.02978515625, 0.0014495849609375, 0.032684326171875, 0.0639190673828125, 0.09515380859375, 0.1263885498046875, 0.157623291015625, 0.1888580322265625, 0.2200927734375, 0.2513275146484375, 0.282562255859375, 0.3137969970703125, 0.34503173828125, 0.3762664794921875, 0.407501220703125, 0.4387359619140625, 0.469970703125, 0.5012054443359375, 0.532440185546875, 0.5636749267578125, 0.59490966796875, 0.6261444091796875, 0.657379150390625, 0.6886138916015625, 0.7198486328125, 0.7510833740234375, 0.782318115234375, 0.8135528564453125, 0.84478759765625, 0.8760223388671875, 0.907257080078125, 0.9384918212890625, 0.9697265625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 7.0, 3.0, 5.0, 5.0, 2.0, 5.0, 4.0, 5.0, 7.0, 14.0, 9.0, 13.0, 23.0, 25.0, 25.0, 35.0, 36.0, 65.0, 72.0, 114.0, 100.0, 94.0, 92.0, 49.0, 38.0, 29.0, 23.0, 14.0, 19.0, 15.0, 7.0, 13.0, 9.0, 10.0, 6.0, 4.0, 6.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003681182861328125, -0.00035646557807922363, -0.00034481287002563477, -0.0003331601619720459, -0.00032150745391845703, -0.00030985474586486816, -0.0002982020378112793, -0.00028654932975769043, -0.00027489662170410156, -0.0002632439136505127, -0.00025159120559692383, -0.00023993849754333496, -0.0002282857894897461, -0.00021663308143615723, -0.00020498037338256836, -0.0001933276653289795, -0.00018167495727539062, -0.00017002224922180176, -0.0001583695411682129, -0.00014671683311462402, -0.00013506412506103516, -0.0001234114170074463, -0.00011175870895385742, -0.00010010600090026855, -8.845329284667969e-05, -7.680058479309082e-05, -6.514787673950195e-05, -5.3495168685913086e-05, -4.184246063232422e-05, -3.018975257873535e-05, -1.8537044525146484e-05, -6.884336471557617e-06, 4.76837158203125e-06, 1.6421079635620117e-05, 2.8073787689208984e-05, 3.972649574279785e-05, 5.137920379638672e-05, 6.303191184997559e-05, 7.468461990356445e-05, 8.633732795715332e-05, 9.799003601074219e-05, 0.00010964274406433105, 0.00012129545211791992, 0.0001329481601715088, 0.00014460086822509766, 0.00015625357627868652, 0.0001679062843322754, 0.00017955899238586426, 0.00019121170043945312, 0.000202864408493042, 0.00021451711654663086, 0.00022616982460021973, 0.0002378225326538086, 0.00024947524070739746, 0.00026112794876098633, 0.0002727806568145752, 0.00028443336486816406, 0.00029608607292175293, 0.0003077387809753418, 0.00031939148902893066, 0.00033104419708251953, 0.0003426969051361084, 0.00035434961318969727, 0.00036600232124328613, 0.000377655029296875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 7.0, 6.0, 7.0, 13.0, 14.0, 15.0, 25.0, 27.0, 73.0, 88.0, 142.0, 244.0, 401.0, 679.0, 1254.0, 2288.0, 4880.0, 11315.0, 29777.0, 100354.0, 737457.0, 106252.0, 31298.0, 11525.0, 4970.0, 2340.0, 1265.0, 670.0, 440.0, 244.0, 158.0, 93.0, 77.0, 53.0, 24.0, 24.0, 18.0, 12.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.291015625, -1.2536163330078125, -1.216217041015625, -1.1788177490234375, -1.14141845703125, -1.1040191650390625, -1.066619873046875, -1.0292205810546875, -0.9918212890625, -0.9544219970703125, -0.917022705078125, -0.8796234130859375, -0.84222412109375, -0.8048248291015625, -0.767425537109375, -0.7300262451171875, -0.692626953125, -0.6552276611328125, -0.617828369140625, -0.5804290771484375, -0.54302978515625, -0.5056304931640625, -0.468231201171875, -0.4308319091796875, -0.3934326171875, -0.3560333251953125, -0.318634033203125, -0.2812347412109375, -0.24383544921875, -0.2064361572265625, -0.169036865234375, -0.1316375732421875, -0.09423828125, -0.0568389892578125, -0.019439697265625, 0.0179595947265625, 0.05535888671875, 0.0927581787109375, 0.130157470703125, 0.1675567626953125, 0.2049560546875, 0.2423553466796875, 0.279754638671875, 0.3171539306640625, 0.35455322265625, 0.3919525146484375, 0.429351806640625, 0.4667510986328125, 0.504150390625, 0.5415496826171875, 0.578948974609375, 0.6163482666015625, 0.65374755859375, 0.6911468505859375, 0.728546142578125, 0.7659454345703125, 0.8033447265625, 0.8407440185546875, 0.878143310546875, 0.9155426025390625, 0.95294189453125, 0.9903411865234375, 1.027740478515625, 1.0651397705078125, 1.1025390625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 1.0, 4.0, 4.0, 4.0, 2.0, 13.0, 10.0, 10.0, 9.0, 16.0, 29.0, 31.0, 35.0, 33.0, 57.0, 38.0, 76.0, 87.0, 80.0, 75.0, 62.0, 57.0, 40.0, 45.0, 32.0, 35.0, 16.0, 18.0, 17.0, 17.0, 9.0, 6.0, 5.0, 5.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.357421875, -1.31170654296875, -1.2659912109375, -1.22027587890625, -1.174560546875, -1.12884521484375, -1.0831298828125, -1.03741455078125, -0.99169921875, -0.94598388671875, -0.9002685546875, -0.85455322265625, -0.808837890625, -0.76312255859375, -0.7174072265625, -0.67169189453125, -0.6259765625, -0.58026123046875, -0.5345458984375, -0.48883056640625, -0.443115234375, -0.39739990234375, -0.3516845703125, -0.30596923828125, -0.26025390625, -0.21453857421875, -0.1688232421875, -0.12310791015625, -0.077392578125, -0.03167724609375, 0.0140380859375, 0.05975341796875, 0.10546875, 0.15118408203125, 0.1968994140625, 0.24261474609375, 0.288330078125, 0.33404541015625, 0.3797607421875, 0.42547607421875, 0.47119140625, 0.51690673828125, 0.5626220703125, 0.60833740234375, 0.654052734375, 0.69976806640625, 0.7454833984375, 0.79119873046875, 0.8369140625, 0.88262939453125, 0.9283447265625, 0.97406005859375, 1.019775390625, 1.06549072265625, 1.1112060546875, 1.15692138671875, 1.20263671875, 1.24835205078125, 1.2940673828125, 1.33978271484375, 1.385498046875, 1.43121337890625, 1.4769287109375, 1.52264404296875, 1.568359375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 7.0, 14.0, 57.0, 159.0, 558.0, 118.0, 51.0, 16.0, 10.0, 9.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.07524871826172, -48.159488677978516, -44.24373245239258, -40.327972412109375, -36.41221618652344, -32.496456146240234, -28.58069610595703, -24.66493797302246, -20.74917984008789, -16.83342170715332, -12.917662620544434, -9.001903533935547, -5.086145401000977, -1.1703872680664062, 2.745372772216797, 6.661130905151367, 10.576889038085938, 14.492647171020508, 18.408405303955078, 22.32416534423828, 26.23992347717285, 30.155681610107422, 34.071441650390625, 37.98719787597656, 41.902957916259766, 45.81871795654297, 49.734474182128906, 53.65023422241211, 57.56599426269531, 61.48175048828125, 65.39750671386719, 69.31327056884766, 73.22903442382812, 77.14479064941406, 81.06055450439453, 84.97631072998047, 88.8920669555664, 92.80783081054688, 96.72358703613281, 100.63934326171875, 104.55509948730469, 108.47085571289062, 112.3866195678711, 116.30237579345703, 120.21813201904297, 124.13389587402344, 128.04965209960938, 131.9654083251953, 135.88116455078125, 139.7969207763672, 143.71267700195312, 147.62844848632812, 151.54420471191406, 155.4599609375, 159.37571716308594, 163.29147338867188, 167.20724487304688, 171.1230010986328, 175.03875732421875, 178.95452880859375, 182.8702850341797, 186.78604125976562, 190.70179748535156, 194.6175537109375, 198.53330993652344]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 3.0, 7.0, 5.0, 7.0, 12.0, 5.0, 10.0, 14.0, 17.0, 22.0, 12.0, 18.0, 25.0, 28.0, 36.0, 58.0, 144.0, 166.0, 138.0, 60.0, 32.0, 25.0, 23.0, 23.0, 21.0, 24.0, 8.0, 13.0, 11.0, 8.0, 12.0, 5.0, 2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.07536315917969, -30.583065032958984, -29.09076690673828, -27.598468780517578, -26.106170654296875, -24.613872528076172, -23.121572494506836, -21.629274368286133, -20.13697624206543, -18.644678115844727, -17.152379989624023, -15.660080909729004, -14.1677827835083, -12.675484657287598, -11.183185577392578, -9.690887451171875, -8.198589324951172, -6.706291198730469, -5.213992595672607, -3.721693992614746, -2.229395866394043, -0.7370977401733398, 0.7552013397216797, 2.247499465942383, 3.739797592163086, 5.232095718383789, 6.72439432144165, 8.216692924499512, 9.708991050720215, 11.201289176940918, 12.693588256835938, 14.18588638305664, 15.678184509277344, 17.170482635498047, 18.66278076171875, 20.155078887939453, 21.647377014160156, 23.13967514038086, 24.631975173950195, 26.1242733001709, 27.6165714263916, 29.108869552612305, 30.601167678833008, 32.093467712402344, 33.58576583862305, 35.07806396484375, 36.57036209106445, 38.062660217285156, 39.55495834350586, 41.04725646972656, 42.539554595947266, 44.03185272216797, 45.52415084838867, 47.016448974609375, 48.508750915527344, 50.00104522705078, 51.49334716796875, 52.98564529418945, 54.477943420410156, 55.97024154663086, 57.46253967285156, 58.954837799072266, 60.44713592529297, 61.93943786621094, 63.431732177734375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 5.0, 15.0, 18.0, 20.0, 24.0, 30.0, 33.0, 40.0, 60.0, 96.0, 227.0, 127.0, 70.0, 40.0, 39.0, 39.0, 28.0, 13.0, 21.0, 16.0, 8.0, 9.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.9375, -6.748291015625, -6.55908203125, -6.369873046875, -6.1806640625, -5.991455078125, -5.80224609375, -5.613037109375, -5.423828125, -5.234619140625, -5.04541015625, -4.856201171875, -4.6669921875, -4.477783203125, -4.28857421875, -4.099365234375, -3.91015625, -3.720947265625, -3.53173828125, -3.342529296875, -3.1533203125, -2.964111328125, -2.77490234375, -2.585693359375, -2.396484375, -2.207275390625, -2.01806640625, -1.828857421875, -1.6396484375, -1.450439453125, -1.26123046875, -1.072021484375, -0.8828125, -0.693603515625, -0.50439453125, -0.315185546875, -0.1259765625, 0.063232421875, 0.25244140625, 0.441650390625, 0.630859375, 0.820068359375, 1.00927734375, 1.198486328125, 1.3876953125, 1.576904296875, 1.76611328125, 1.955322265625, 2.14453125, 2.333740234375, 2.52294921875, 2.712158203125, 2.9013671875, 3.090576171875, 3.27978515625, 3.468994140625, 3.658203125, 3.847412109375, 4.03662109375, 4.225830078125, 4.4150390625, 4.604248046875, 4.79345703125, 4.982666015625, 5.171875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 6.0, 4.0, 8.0, 4.0, 14.0, 17.0, 19.0, 38.0, 37.0, 61.0, 105.0, 284.0, 973.0, 10257.0, 8367730.0, 7616.0, 835.0, 240.0, 124.0, 69.0, 44.0, 22.0, 18.0, 7.0, 8.0, 15.0, 8.0, 4.0, 9.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.80431365966797, -71.38098907470703, -68.95765686035156, -66.53433227539062, -64.11100769042969, -61.68767547607422, -59.26435089111328, -56.84102249145508, -54.417694091796875, -51.99436569213867, -49.57103729248047, -47.14771270751953, -44.72438430786133, -42.301055908203125, -39.87773132324219, -37.454402923583984, -35.03107452392578, -32.60774612426758, -30.184419631958008, -27.761093139648438, -25.337764739990234, -22.91443634033203, -20.49110984802246, -18.06778335571289, -15.644454956054688, -13.2211275100708, -10.797800064086914, -8.374472618103027, -5.951145172119141, -3.527817726135254, -1.1044902801513672, 1.3188362121582031, 3.742156982421875, 6.165484428405762, 8.588811874389648, 11.012139320373535, 13.435466766357422, 15.858794212341309, 18.282121658325195, 20.705448150634766, 23.12877655029297, 25.552104949951172, 27.975431442260742, 30.398757934570312, 32.822086334228516, 35.24541473388672, 37.668739318847656, 40.09206771850586, 42.51539611816406, 44.938724517822266, 47.36205291748047, 49.785377502441406, 52.20870590209961, 54.63203430175781, 57.05535888671875, 59.47868728637695, 61.902015686035156, 64.3253402709961, 66.74867248535156, 69.1719970703125, 71.59532165527344, 74.0186538696289, 76.44197845458984, 78.86531066894531, 81.28863525390625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 7.0, 5.0, 1.0, 6.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 4.0, 6.0, 4.0, 3.0, 8.0, 3.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-80.01773834228516, -77.34288024902344, -74.66802215576172, -71.9931640625, -69.31830596923828, -66.64344787597656, -63.96859359741211, -61.293739318847656, -58.61888122558594, -55.94402313232422, -53.2691650390625, -50.59430694580078, -47.91945266723633, -45.24459457397461, -42.56973648071289, -39.89488220214844, -37.22002029418945, -34.545162200927734, -31.87030601501465, -29.19544792175293, -26.520591735839844, -23.845733642578125, -21.170875549316406, -18.49601936340332, -15.821161270141602, -13.1463041305542, -10.471446990966797, -7.796588897705078, -5.121731758117676, -2.4468746185302734, 0.2279834747314453, 2.9028396606445312, 5.57769775390625, 8.252554893493652, 10.927412033081055, 13.602270126342773, 16.27712631225586, 18.951984405517578, 21.626842498779297, 24.301698684692383, 26.9765567779541, 29.65141487121582, 32.326271057128906, 35.001129150390625, 37.675987243652344, 40.35084533691406, 43.02570343017578, 45.700557708740234, 48.37541580200195, 51.05027389526367, 53.72513198852539, 56.399986267089844, 59.07484436035156, 61.74970245361328, 64.424560546875, 67.09941864013672, 69.77427673339844, 72.44913482666016, 75.12399291992188, 77.7988510131836, 80.47370910644531, 83.1485595703125, 85.82342529296875, 88.49827575683594, 91.17313385009766]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 0.0, 11.0, 9.0, 13.0, 14.0, 29.0, 43.0, 34.0, 58.0, 74.0, 78.0, 88.0, 104.0, 91.0, 76.0, 51.0, 44.0, 44.0, 36.0, 33.0, 21.0, 13.0, 17.0, 9.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8515625, -2.751800537109375, -2.65203857421875, -2.552276611328125, -2.4525146484375, -2.352752685546875, -2.25299072265625, -2.153228759765625, -2.053466796875, -1.953704833984375, -1.85394287109375, -1.754180908203125, -1.6544189453125, -1.554656982421875, -1.45489501953125, -1.355133056640625, -1.25537109375, -1.155609130859375, -1.05584716796875, -0.956085205078125, -0.8563232421875, -0.756561279296875, -0.65679931640625, -0.557037353515625, -0.457275390625, -0.357513427734375, -0.25775146484375, -0.157989501953125, -0.0582275390625, 0.041534423828125, 0.14129638671875, 0.241058349609375, 0.3408203125, 0.440582275390625, 0.54034423828125, 0.640106201171875, 0.7398681640625, 0.839630126953125, 0.93939208984375, 1.039154052734375, 1.138916015625, 1.238677978515625, 1.33843994140625, 1.438201904296875, 1.5379638671875, 1.637725830078125, 1.73748779296875, 1.837249755859375, 1.93701171875, 2.036773681640625, 2.13653564453125, 2.236297607421875, 2.3360595703125, 2.435821533203125, 2.53558349609375, 2.635345458984375, 2.735107421875, 2.834869384765625, 2.93463134765625, 3.034393310546875, 3.1341552734375, 3.233917236328125, 3.33367919921875, 3.433441162109375, 3.533203125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 17.0, 18.0, 45.0, 75.0, 146.0, 333.0, 876.0, 3360.0, 21487.0, 212410.0, 253738.0, 26277.0, 3740.0, 1017.0, 343.0, 146.0, 94.0, 48.0, 32.0, 14.0, 11.0, 8.0, 8.0, 5.0, 7.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.125, -51.9638671875, -49.802734375, -47.6416015625, -45.48046875, -43.3193359375, -41.158203125, -38.9970703125, -36.8359375, -34.6748046875, -32.513671875, -30.3525390625, -28.19140625, -26.0302734375, -23.869140625, -21.7080078125, -19.546875, -17.3857421875, -15.224609375, -13.0634765625, -10.90234375, -8.7412109375, -6.580078125, -4.4189453125, -2.2578125, -0.0966796875, 2.064453125, 4.2255859375, 6.38671875, 8.5478515625, 10.708984375, 12.8701171875, 15.03125, 17.1923828125, 19.353515625, 21.5146484375, 23.67578125, 25.8369140625, 27.998046875, 30.1591796875, 32.3203125, 34.4814453125, 36.642578125, 38.8037109375, 40.96484375, 43.1259765625, 45.287109375, 47.4482421875, 49.609375, 51.7705078125, 53.931640625, 56.0927734375, 58.25390625, 60.4150390625, 62.576171875, 64.7373046875, 66.8984375, 69.0595703125, 71.220703125, 73.3818359375, 75.54296875, 77.7041015625, 79.865234375, 82.0263671875, 84.1875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 7.0, 5.0, 11.0, 11.0, 18.0, 34.0, 42.0, 59.0, 75.0, 121.0, 111.0, 145.0, 113.0, 60.0, 65.0, 39.0, 27.0, 22.0, 17.0, 9.0, 7.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.21875, -3.9322509765625, -3.645751953125, -3.3592529296875, -3.07275390625, -2.7862548828125, -2.499755859375, -2.2132568359375, -1.9267578125, -1.6402587890625, -1.353759765625, -1.0672607421875, -0.78076171875, -0.4942626953125, -0.207763671875, 0.0787353515625, 0.365234375, 0.6517333984375, 0.938232421875, 1.2247314453125, 1.51123046875, 1.7977294921875, 2.084228515625, 2.3707275390625, 2.6572265625, 2.9437255859375, 3.230224609375, 3.5167236328125, 3.80322265625, 4.0897216796875, 4.376220703125, 4.6627197265625, 4.94921875, 5.2357177734375, 5.522216796875, 5.8087158203125, 6.09521484375, 6.3817138671875, 6.668212890625, 6.9547119140625, 7.2412109375, 7.5277099609375, 7.814208984375, 8.1007080078125, 8.38720703125, 8.6737060546875, 8.960205078125, 9.2467041015625, 9.533203125, 9.8197021484375, 10.106201171875, 10.3927001953125, 10.67919921875, 10.9656982421875, 11.252197265625, 11.5386962890625, 11.8251953125, 12.1116943359375, 12.398193359375, 12.6846923828125, 12.97119140625, 13.2576904296875, 13.544189453125, 13.8306884765625, 14.1171875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 4.0, 11.0, 14.0, 21.0, 27.0, 71.0, 98.0, 90.0, 73.0, 46.0, 18.0, 9.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-64.8379898071289, -62.86307144165039, -60.888153076171875, -58.913238525390625, -56.93832015991211, -54.963401794433594, -52.988487243652344, -51.01356887817383, -49.03865051269531, -47.0637321472168, -45.08881378173828, -43.11389923095703, -41.138980865478516, -39.1640625, -37.18914794921875, -35.214229583740234, -33.23931121826172, -31.264392852783203, -29.28947639465332, -27.314559936523438, -25.339641571044922, -23.364723205566406, -21.389806747436523, -19.41489028930664, -17.439971923828125, -15.465054512023926, -13.490137100219727, -11.515219688415527, -9.540302276611328, -7.565384864807129, -5.59046745300293, -3.6155500411987305, -1.6406364440917969, 0.33428096771240234, 2.3091983795166016, 4.284115791320801, 6.259033203125, 8.2339506149292, 10.208868026733398, 12.183785438537598, 14.158702850341797, 16.133621215820312, 18.108537673950195, 20.083454132080078, 22.058372497558594, 24.03329086303711, 26.008207321166992, 27.983123779296875, 29.95804214477539, 31.932960510253906, 33.907875061035156, 35.88279342651367, 37.85771179199219, 39.8326301574707, 41.80754852294922, 43.78246307373047, 45.757381439208984, 47.7322998046875, 49.70721435546875, 51.682132720947266, 53.65705108642578, 55.6319694519043, 57.60688781738281, 59.58180236816406, 61.55672073364258]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 4.0, 3.0, 6.0, 2.0, 5.0, 6.0, 8.0, 11.0, 29.0, 38.0, 42.0, 68.0, 45.0, 55.0, 44.0, 31.0, 24.0, 7.0, 9.0, 4.0, 8.0, 4.0, 4.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-33.48976135253906, -32.6822509765625, -31.874738693237305, -31.067228317260742, -30.259716033935547, -29.452205657958984, -28.644695281982422, -27.83718490600586, -27.029672622680664, -26.2221622467041, -25.414649963378906, -24.607139587402344, -23.79962921142578, -22.992116928100586, -22.184606552124023, -21.377094268798828, -20.569583892822266, -19.762073516845703, -18.954561233520508, -18.147050857543945, -17.33953857421875, -16.532028198242188, -15.724517822265625, -14.917006492614746, -14.109495162963867, -13.301983833312988, -12.49447250366211, -11.686962127685547, -10.879450798034668, -10.071939468383789, -9.264429092407227, -8.456917762756348, -7.649408340454102, -6.841897010803223, -6.034386157989502, -5.226875305175781, -4.419363975524902, -3.6118526458740234, -2.8043417930603027, -1.996830940246582, -1.1893196105957031, -0.3818085193634033, 0.4257025718688965, 1.2332136631011963, 2.040724754333496, 2.848236083984375, 3.6557469367980957, 4.463257789611816, 5.270769119262695, 6.078280448913574, 6.885791301727295, 7.693302154541016, 8.500813484191895, 9.308324813842773, 10.115835189819336, 10.923346519470215, 11.730857849121094, 12.538369178771973, 13.345880508422852, 14.153390884399414, 14.960902214050293, 15.768413543701172, 16.575923919677734, 17.383434295654297, 18.190946578979492]}, "eval/loss": 1.7519110441207886, "eval/wer": 1.1129115430384768, "eval/runtime": 1263.131, "eval/samples_per_second": 2.092, "eval/steps_per_second": 0.262} \ No newline at end of file